Class CompoundWordTokenFilterBase
Base class for decomposition token filters.
You must specify the required LuceneVersion compatibility when creating a
CompoundWordTokenFilterBase:
- As of 3.1, CompoundWordTokenFilterBase correctly handles Unicode 4.0
supplementary characters in strings and char arrays provided as compound word
dictionaries.
- As of 4.4, CompoundWordTokenFilterBase doesn't update offsets.
Inheritance
System.Object
AttributeSource
TokenStream
TokenFilter
CompoundWordTokenFilterBase
Assembly: Lucene.Net.Analysis.Common.dll
Syntax
public abstract class CompoundWordTokenFilterBase : TokenFilter, IDisposable
Constructors
|
Improve this Doc
View Source
CompoundWordTokenFilterBase(LuceneVersion, TokenStream, CharArraySet)
Declaration
protected CompoundWordTokenFilterBase(LuceneVersion matchVersion, TokenStream input, CharArraySet dictionary)
Parameters
|
Improve this Doc
View Source
CompoundWordTokenFilterBase(LuceneVersion, TokenStream, CharArraySet, Boolean)
Declaration
protected CompoundWordTokenFilterBase(LuceneVersion matchVersion, TokenStream input, CharArraySet dictionary, bool onlyLongestMatch)
Parameters
|
Improve this Doc
View Source
CompoundWordTokenFilterBase(LuceneVersion, TokenStream, CharArraySet, Int32, Int32, Int32, Boolean)
Declaration
protected CompoundWordTokenFilterBase(LuceneVersion matchVersion, TokenStream input, CharArraySet dictionary, int minWordSize, int minSubwordSize, int maxSubwordSize, bool onlyLongestMatch)
Parameters
Type |
Name |
Description |
LuceneVersion |
matchVersion |
|
TokenStream |
input |
|
CharArraySet |
dictionary |
|
System.Int32 |
minWordSize |
|
System.Int32 |
minSubwordSize |
|
System.Int32 |
maxSubwordSize |
|
System.Boolean |
onlyLongestMatch |
|
Fields
|
Improve this Doc
View Source
DEFAULT_MAX_SUBWORD_SIZE
The default for maximal length of subwords that get propagated to the output of this filter
Declaration
public const int DEFAULT_MAX_SUBWORD_SIZE = 15
Field Value
Type |
Description |
System.Int32 |
|
|
Improve this Doc
View Source
DEFAULT_MIN_SUBWORD_SIZE
The default for minimal length of subwords that get propagated to the output of this filter
Declaration
public const int DEFAULT_MIN_SUBWORD_SIZE = 2
Field Value
Type |
Description |
System.Int32 |
|
|
Improve this Doc
View Source
DEFAULT_MIN_WORD_SIZE
The default for minimal word length that gets decomposed
Declaration
public const int DEFAULT_MIN_WORD_SIZE = 5
Field Value
Type |
Description |
System.Int32 |
|
|
Improve this Doc
View Source
m_dictionary
Declaration
protected readonly CharArraySet m_dictionary
Field Value
|
Improve this Doc
View Source
m_matchVersion
Declaration
protected readonly LuceneVersion m_matchVersion
Field Value
|
Improve this Doc
View Source
m_maxSubwordSize
Declaration
protected readonly int m_maxSubwordSize
Field Value
Type |
Description |
System.Int32 |
|
|
Improve this Doc
View Source
m_minSubwordSize
Declaration
protected readonly int m_minSubwordSize
Field Value
Type |
Description |
System.Int32 |
|
|
Improve this Doc
View Source
m_minWordSize
Declaration
protected readonly int m_minWordSize
Field Value
Type |
Description |
System.Int32 |
|
|
Improve this Doc
View Source
m_offsetAtt
Declaration
protected readonly IOffsetAttribute m_offsetAtt
Field Value
|
Improve this Doc
View Source
m_onlyLongestMatch
Declaration
protected readonly bool m_onlyLongestMatch
Field Value
Type |
Description |
System.Boolean |
|
|
Improve this Doc
View Source
m_termAtt
Declaration
protected readonly ICharTermAttribute m_termAtt
Field Value
|
Improve this Doc
View Source
m_tokens
Declaration
protected readonly LinkedList<CompoundWordTokenFilterBase.CompoundToken> m_tokens
Field Value
Methods
|
Improve this Doc
View Source
Decompose()
Declaration
protected abstract void Decompose()
|
Improve this Doc
View Source
IncrementToken()
Declaration
public override sealed bool IncrementToken()
Returns
Type |
Description |
System.Boolean |
|
Overrides
|
Improve this Doc
View Source
Reset()
Declaration
public override void Reset()
Overrides
Implements
IDisposable