FileContentSearch/Source/packages/Lucene.Net.Sandbox.4.8.0-beta00017/lib/net8.0/Lucene.Net.Sandbox.xml
zilinsoft 004cf875cf ## 📅2025-07-14 星期一更新
### FileContentSearch    V1.0.2507.1401
- *.[新增]初始版本。
2025-07-14 17:24:51 +08:00

366 lines
21 KiB
XML

<?xml version="1.0"?>
<doc>
<assembly>
<name>Lucene.Net.Sandbox</name>
</assembly>
<members>
<member name="T:Lucene.Net.Sandbox.Queries.DuplicateFilter">
<summary>
Filter to remove duplicate values from search results.
<para/>
WARNING: for this to work correctly, you may have to wrap
your reader as it cannot current deduplicate across different
index segments.
</summary>
<seealso cref="T:Lucene.Net.Index.SlowCompositeReaderWrapper"/>
</member>
<member name="T:Lucene.Net.Sandbox.Queries.KeepMode">
<summary>
KeepMode determines which document id to consider as the master, all others being
identified as duplicates. Selecting the "first occurrence" can potentially save on IO.
</summary>
</member>
<member name="T:Lucene.Net.Sandbox.Queries.ProcessingMode">
<summary>
"Full" processing mode starts by setting all bits to false and only setting bits
for documents that contain the given field and are identified as none-duplicates.
<para/>
"Fast" processing sets all bits to true then unsets all duplicate docs found for the
given field. This approach avoids the need to read DocsEnum for terms that are seen
to have a document frequency of exactly "1" (i.e. no duplicates). While a potentially
faster approach , the downside is that bitsets produced will include bits set for
documents that do not actually contain the field given.
</summary>
</member>
<member name="F:Lucene.Net.Sandbox.Queries.ProcessingMode.PM_FULL_VALIDATION">
<summary>
"Full" processing mode starts by setting all bits to false and only setting bits
for documents that contain the given field and are identified as none-duplicates.
</summary>
</member>
<member name="F:Lucene.Net.Sandbox.Queries.ProcessingMode.PM_FAST_INVALIDATION">
<summary>
"Fast" processing sets all bits to true then unsets all duplicate docs found for the
given field. This approach avoids the need to read DocsEnum for terms that are seen
to have a document frequency of exactly "1" (i.e. no duplicates). While a potentially
faster approach , the downside is that bitsets produced will include bits set for
documents that do not actually contain the field given.
</summary>
</member>
<member name="T:Lucene.Net.Sandbox.Queries.FuzzyLikeThisQuery">
<summary>
Fuzzifies ALL terms provided as strings and then picks the best n differentiating terms.
In effect this mixes the behaviour of <see cref="T:Lucene.Net.Search.FuzzyQuery"/> and MoreLikeThis but with special consideration
of fuzzy scoring factors.
This generally produces good results for queries where users may provide details in a number of
fields and have no knowledge of boolean query syntax and also want a degree of fuzzy matching and
a fast query.
<para/>
For each source term the fuzzy variants are held in a <see cref="T:Lucene.Net.Search.BooleanQuery"/> with no coord factor (because
we are not looking for matches on multiple variants in any one doc). Additionally, a specialized
<see cref="T:Lucene.Net.Search.TermQuery"/> is used for variants and does not use that variant term's IDF because this would favour rarer
terms eg misspellings. Instead, all variants use the same IDF ranking (the one for the source query
term) and this is factored into the variant's boost. If the source query term does not exist in the
index the average IDF of the variants is used.
</summary>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.FuzzyLikeThisQuery.#ctor(System.Int32,Lucene.Net.Analysis.Analyzer)">
<summary>
</summary>
<param name="maxNumTerms">The total number of terms clauses that will appear once rewritten as a <see cref="T:Lucene.Net.Search.BooleanQuery"/></param>
<param name="analyzer"></param>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.FuzzyLikeThisQuery.AddTerms(System.String,System.String,System.Single,System.Int32)">
<summary>
Adds user input for "fuzzification"
</summary>
<param name="queryString">The string which will be parsed by the analyzer and for which fuzzy variants will be parsed</param>
<param name="fieldName">The minimum similarity of the term variants (see <see cref="T:Lucene.Net.Search.FuzzyTermsEnum"/>)</param>
<param name="minSimilarity">Length of required common prefix on variant terms (see <see cref="T:Lucene.Net.Search.FuzzyTermsEnum"/>)</param>
<param name="prefixLength"></param>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.FuzzyLikeThisQuery.ScoreTermQueue.LessThan(Lucene.Net.Sandbox.Queries.FuzzyLikeThisQuery.ScoreTerm,Lucene.Net.Sandbox.Queries.FuzzyLikeThisQuery.ScoreTerm)">
<summary>
(non-Javadoc)
<see cref="M:Lucene.Net.Util.PriorityQueue`1.LessThan(`0,`0)"/>
</summary>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.FuzzyLikeThisQuery.ToString(System.String)">
<summary>
(non-Javadoc)
<see cref="M:Lucene.Net.Search.Query.ToString(System.String)"/>
</summary>
<param name="field"></param>
<returns></returns>
</member>
<member name="T:Lucene.Net.Sandbox.Queries.SlowFuzzyQuery">
<summary>
Implements the classic fuzzy search query. The similarity measurement
is based on the Levenshtein (edit distance) algorithm.
<para/>
Note that, unlike <see cref="T:Lucene.Net.Search.FuzzyQuery"/>, this query will silently allow
for a (possibly huge) number of edit distances in comparisons, and may
be extremely slow (comparing every term in the index).
</summary>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.SlowFuzzyQuery.#ctor(Lucene.Net.Index.Term,System.Single,System.Int32,System.Int32)">
<summary>
Create a new <see cref="T:Lucene.Net.Sandbox.Queries.SlowFuzzyQuery"/> that will match terms with a similarity
of at least <paramref name="minimumSimilarity"/> to <paramref name="term"/>.
If a <paramref name="prefixLength"/> &gt; 0 is specified, a common prefix
of that length is also required.
</summary>
<param name="term">the term to search for</param>
<param name="minimumSimilarity">
a value between 0 and 1 to set the required similarity
between the query term and the matching terms. For example, for a
<paramref name="minimumSimilarity"/> of <c>0.5</c> a term of the same length
as the query term is considered similar to the query term if the edit distance
between both terms is less than <c>length(term)*0.5</c>
<para/>
Alternatively, if <paramref name="minimumSimilarity"/> is >= 1f, it is interpreted
as a pure Levenshtein edit distance. For example, a value of <c>2f</c>
will match all terms within an edit distance of <c>2</c> from the
query term. Edit distances specified in this way may not be fractional.
</param>
<param name="prefixLength">length of common (non-fuzzy) prefix</param>
<param name="maxExpansions">
the maximum number of terms to match. If this number is
greater than <see cref="P:Lucene.Net.Search.BooleanQuery.MaxClauseCount"/> when the query is rewritten,
then the maxClauseCount will be used instead.
</param>
<exception cref="T:System.ArgumentException">
if <paramref name="minimumSimilarity"/> is &gt;= 1 or &lt; 0
or if <paramref name="prefixLength"/> &lt; 0
</exception>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.SlowFuzzyQuery.#ctor(Lucene.Net.Index.Term,System.Single,System.Int32)">
<summary>
Calls <see cref="M:Lucene.Net.Sandbox.Queries.SlowFuzzyQuery.#ctor(Lucene.Net.Index.Term,System.Single)">SlowFuzzyQuery(term, minimumSimilarity, prefixLength, defaultMaxExpansions)</see>.
</summary>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.SlowFuzzyQuery.#ctor(Lucene.Net.Index.Term,System.Single)">
<summary>
Calls <see cref="M:Lucene.Net.Sandbox.Queries.SlowFuzzyQuery.#ctor(Lucene.Net.Index.Term,System.Single)">SlowFuzzyQuery(term, minimumSimilarity, 0, defaultMaxExpansions)</see>.
</summary>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.SlowFuzzyQuery.#ctor(Lucene.Net.Index.Term)">
<summary>
Calls <see cref="M:Lucene.Net.Sandbox.Queries.SlowFuzzyQuery.#ctor(Lucene.Net.Index.Term,System.Single)">SlowFuzzyQuery(term, defaultMinSimilarity, 0, defaultMaxExpansions)</see>.
</summary>
</member>
<member name="P:Lucene.Net.Sandbox.Queries.SlowFuzzyQuery.MinSimilarity">
<summary>
Gets the minimum similarity that is required for this query to match.
Returns float value between 0.0 and 1.0.
</summary>
</member>
<member name="P:Lucene.Net.Sandbox.Queries.SlowFuzzyQuery.PrefixLength">
<summary>
Gets the non-fuzzy prefix length. This is the number of characters at the start
of a term that must be identical (not fuzzy) to the query term if the query
is to match that term.
</summary>
</member>
<member name="P:Lucene.Net.Sandbox.Queries.SlowFuzzyQuery.Term">
<summary>
Gets the pattern term.
</summary>
</member>
<member name="T:Lucene.Net.Sandbox.Queries.SlowFuzzyTermsEnum">
<summary>
Potentially slow fuzzy <see cref="T:Lucene.Net.Index.TermsEnum"/> for enumerating all terms that are similar
to the specified filter term.
<para/>
If the minSimilarity or maxEdits is greater than the Automaton's
allowable range, this backs off to the classic (brute force)
fuzzy terms enum method by calling <see cref="M:Lucene.Net.Search.FuzzyTermsEnum.GetAutomatonEnum(System.Int32,Lucene.Net.Util.BytesRef)"/>.
<para/>
Term enumerations are always ordered by
<see cref="P:Lucene.Net.Search.FuzzyTermsEnum.Comparer"/>. Each term in the enumeration is
greater than all that precede it.
</summary>
</member>
<member name="T:Lucene.Net.Sandbox.Queries.SlowFuzzyTermsEnum.LinearFuzzyTermsEnum">
<summary>
Implement fuzzy enumeration with linear brute force.
</summary>
</member>
<member name="F:Lucene.Net.Sandbox.Queries.SlowFuzzyTermsEnum.LinearFuzzyTermsEnum.d">
<summary>
Allows us save time required to create a new array
every time similarity is called.
</summary>
</member>
<member name="F:Lucene.Net.Sandbox.Queries.SlowFuzzyTermsEnum.LinearFuzzyTermsEnum.text">
<summary>this is the text, minus the prefix</summary>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.SlowFuzzyTermsEnum.LinearFuzzyTermsEnum.#ctor(Lucene.Net.Sandbox.Queries.SlowFuzzyTermsEnum)">
<summary>
Constructor for enumeration of all terms from specified <c>reader</c> which share a prefix of
length <c>prefixLength</c> with <c>term</c> and which have a fuzzy similarity &gt;
<c>minSimilarity</c>.
<para/>
After calling the constructor the enumeration is already pointing to the first
valid term if such a term exists.
</summary>
<exception cref="T:System.IO.IOException">If there is a low-level I/O error.</exception>
</member>
<member name="F:Lucene.Net.Sandbox.Queries.SlowFuzzyTermsEnum.LinearFuzzyTermsEnum.utf32">
<summary>used for unicode conversion from BytesRef byte[] to int[]</summary>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.SlowFuzzyTermsEnum.LinearFuzzyTermsEnum.Accept(Lucene.Net.Util.BytesRef)">
<summary>
<para>
The termCompare method in FuzzyTermEnum uses Levenshtein distance to
calculate the distance between the given term and the comparing term.
</para>
<para>
If the minSimilarity is >= 1.0, this uses the maxEdits as the comparison.
Otherwise, this method uses the following logic to calculate similarity.
<code>
similarity = 1 - ((float)distance / (float) (prefixLength + Math.min(textlen, targetlen)));
</code>
where distance is the Levenshtein distance for the two words.
</para>
</summary>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.SlowFuzzyTermsEnum.LinearFuzzyTermsEnum.CalcDistance(System.Int32[],System.Int32,System.Int32)">
<summary>
<para>
<see cref="M:Lucene.Net.Sandbox.Queries.SlowFuzzyTermsEnum.LinearFuzzyTermsEnum.CalcDistance(System.Int32[],System.Int32,System.Int32)"/> returns the Levenshtein distance between the query term
and the target term.
</para>
<para>
Embedded within this algorithm is a fail-fast Levenshtein distance
algorithm. The fail-fast algorithm differs from the standard Levenshtein
distance algorithm in that it is aborted if it is discovered that the
minimum distance between the words is greater than some threshold.
</para>
<para>
Levenshtein distance (also known as edit distance) is a measure of similarity
between two strings where the distance is measured as the number of character
deletions, insertions or substitutions required to transform one string to
the other string.
</para>
</summary>
<param name="target">the target word or phrase</param>
<param name="offset">the offset at which to start the comparison</param>
<param name="length">the length of what's left of the string to compare</param>
<returns>
the number of edits or <see cref="F:System.Int32.MaxValue"/> if the edit distance is
greater than maxDistance.
</returns>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.SlowFuzzyTermsEnum.LinearFuzzyTermsEnum.CalculateMaxDistance(System.Int32)">
<summary>
The max Distance is the maximum Levenshtein distance for the text
compared to some other value that results in score that is
better than the minimum similarity.
</summary>
<param name="m">the length of the "other value"</param>
<returns>the maximum levenshtein distance that we care about</returns>
</member>
<member name="T:Lucene.Net.Sandbox.Queries.SortedSetSortField">
<summary>
SortField for <see cref="T:Lucene.Net.Index.SortedSetDocValues"/>.
<para/>
A <see cref="T:Lucene.Net.Index.SortedSetDocValues"/> contains multiple values for a field, so sorting with
this technique "selects" a value as the representative sort value for the document.
<para/>
By default, the minimum value in the set is selected as the sort value, but
this can be customized. Selectors other than the default do have some limitations
(see below) to ensure that all selections happen in constant-time for performance.
<para/>
Like sorting by string, this also supports sorting missing values as first or last,
via <see cref="M:Lucene.Net.Search.SortField.SetMissingValue(System.Object)"/>.
<para/>
Limitations:
<list type="bullet">
<item><description>
Fields containing <see cref="F:System.Int32.MaxValue"/> or more unique values
are unsupported.
</description></item>
<item><description>
Selectors other than the default <see cref="F:Lucene.Net.Sandbox.Queries.Selector.MIN"/> require
optional codec support. However several codecs provided by Lucene,
including the current default codec, support this.
</description></item>
</list>
</summary>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.SortedSetSortField.#ctor(System.String,System.Boolean)">
<summary>
Creates a sort, possibly in reverse, by the minimum value in the set
for the document.
</summary>
<param name="field">Name of field to sort by. Must not be null.</param>
<param name="reverse">True if natural order should be reversed.</param>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.SortedSetSortField.#ctor(System.String,System.Boolean,Lucene.Net.Sandbox.Queries.Selector)">
<summary>
Creates a sort, possibly in reverse, specifying how the sort value from
the document's set is selected.
</summary>
<param name="field">Name of field to sort by. Must not be null.</param>
<param name="reverse">True if natural order should be reversed.</param>
<param name="selector">
custom selector for choosing the sort value from the set.
<para/>
NOTE: selectors other than <see cref="F:Lucene.Net.Sandbox.Queries.Selector.MIN"/> require optional codec support.
</param>
</member>
<member name="P:Lucene.Net.Sandbox.Queries.SortedSetSortField.Selector">
<summary>Returns the selector in use for this sort</summary>
</member>
<member name="M:Lucene.Net.Sandbox.Queries.SortedSetSortField.SetMissingValue(System.Object)">
<summary>
Set how missing values (the empty set) are sorted.
<para/>
Note that this must be <see cref="F:Lucene.Net.Search.SortField.STRING_FIRST"/> or
<see cref="F:Lucene.Net.Search.SortField.STRING_LAST"/>.
</summary>
</member>
<member name="T:Lucene.Net.Sandbox.Queries.SortedSetSortField.MinValue">
<summary>Wraps a <see cref="T:Lucene.Net.Index.SortedSetDocValues"/> and returns the first ordinal (min)</summary>
</member>
<member name="T:Lucene.Net.Sandbox.Queries.SortedSetSortField.MaxValue">
<summary>Wraps a <see cref="T:Lucene.Net.Index.SortedSetDocValues"/> and returns the last ordinal (max)</summary>
</member>
<member name="T:Lucene.Net.Sandbox.Queries.SortedSetSortField.MiddleMinValue">
<summary>Wraps a <see cref="T:Lucene.Net.Index.SortedSetDocValues"/> and returns the middle ordinal (or min of the two)</summary>
</member>
<member name="T:Lucene.Net.Sandbox.Queries.SortedSetSortField.MiddleMaxValue">
<summary>Wraps a <see cref="T:Lucene.Net.Index.SortedSetDocValues"/> and returns the middle ordinal (or max of the two)</summary>
</member>
<member name="T:Lucene.Net.Sandbox.Queries.Selector">
<summary>Selects a value from the document's set to use as the sort value</summary>
</member>
<member name="F:Lucene.Net.Sandbox.Queries.Selector.MIN">
<summary>
Selects the minimum value in the set
</summary>
</member>
<member name="F:Lucene.Net.Sandbox.Queries.Selector.MAX">
<summary>
Selects the maximum value in the set
</summary>
</member>
<member name="F:Lucene.Net.Sandbox.Queries.Selector.MIDDLE_MIN">
<summary>
Selects the middle value in the set.
<para/>
If the set has an even number of values, the lower of the middle two is chosen.
</summary>
</member>
<member name="F:Lucene.Net.Sandbox.Queries.Selector.MIDDLE_MAX">
<summary>
Selects the middle value in the set.
<para/>
If the set has an even number of values, the higher of the middle two is chosen
</summary>
</member>
</members>
</doc>