Fork me on GitHub
  • API

    Show / Hide Table of Contents

    Class ThaiTokenizer

    Tokenizer that uses ICU4N.Text.BreakIterator to tokenize Thai text.

    Inheritance
    System.Object
    Lucene.Net.Util.AttributeSource
    Lucene.Net.Analysis.TokenStream
    Lucene.Net.Analysis.Tokenizer
    SegmentingTokenizerBase
    ThaiTokenizer
    Implements
    System.IDisposable
    Inherited Members
    SegmentingTokenizerBase.BUFFERMAX
    SegmentingTokenizerBase.m_buffer
    SegmentingTokenizerBase.m_offset
    SegmentingTokenizerBase.IncrementToken()
    SegmentingTokenizerBase.End()
    SegmentingTokenizerBase.IsSafeEnd(Char)
    Lucene.Net.Analysis.Tokenizer.m_input
    Tokenizer.Dispose(Boolean)
    Tokenizer.CorrectOffset(Int32)
    Tokenizer.SetReader(TextReader)
    Lucene.Net.Analysis.TokenStream.Dispose()
    Lucene.Net.Util.AttributeSource.GetAttributeFactory()
    Lucene.Net.Util.AttributeSource.GetAttributeClassesEnumerator()
    Lucene.Net.Util.AttributeSource.GetAttributeImplsEnumerator()
    Lucene.Net.Util.AttributeSource.AddAttributeImpl(Lucene.Net.Util.Attribute)
    Lucene.Net.Util.AttributeSource.AddAttribute<T>()
    Lucene.Net.Util.AttributeSource.HasAttributes
    Lucene.Net.Util.AttributeSource.HasAttribute<T>()
    Lucene.Net.Util.AttributeSource.GetAttribute<T>()
    Lucene.Net.Util.AttributeSource.ClearAttributes()
    Lucene.Net.Util.AttributeSource.RestoreState(Lucene.Net.Util.AttributeSource.State)
    Lucene.Net.Util.AttributeSource.GetHashCode()
    AttributeSource.Equals(Object)
    AttributeSource.ReflectAsString(Boolean)
    Lucene.Net.Util.AttributeSource.ReflectWith(Lucene.Net.Util.IAttributeReflector)
    Lucene.Net.Util.AttributeSource.CloneAttributes()
    Lucene.Net.Util.AttributeSource.CopyTo(Lucene.Net.Util.AttributeSource)
    Lucene.Net.Util.AttributeSource.ToString()
    System.Object.Equals(System.Object, System.Object)
    System.Object.GetType()
    System.Object.MemberwiseClone()
    System.Object.ReferenceEquals(System.Object, System.Object)
    Namespace: Lucene.Net.Analysis.Th
    Assembly: Lucene.Net.ICU.dll
    Syntax
    public class ThaiTokenizer : SegmentingTokenizerBase, IDisposable

    Constructors

    | Improve this Doc View Source

    ThaiTokenizer(AttributeSource.AttributeFactory, TextReader)

    Creates a new ThaiTokenizer that uses the supplied Lucene.Net.Util.AttributeSource.AttributeFactory.

    Declaration
    public ThaiTokenizer(AttributeSource.AttributeFactory factory, TextReader reader)
    Parameters
    Type Name Description
    Lucene.Net.Util.AttributeSource.AttributeFactory factory
    System.IO.TextReader reader
    | Improve this Doc View Source

    ThaiTokenizer(TextReader)

    Creates a new ThaiTokenizer

    Declaration
    public ThaiTokenizer(TextReader reader)
    Parameters
    Type Name Description
    System.IO.TextReader reader

    Methods

    | Improve this Doc View Source

    CaptureState()

    Declaration
    public override AttributeSource.State CaptureState()
    Returns
    Type Description
    Lucene.Net.Util.AttributeSource.State
    Overrides
    Lucene.Net.Util.AttributeSource.CaptureState()
    | Improve this Doc View Source

    IncrementWord()

    Declaration
    protected override bool IncrementWord()
    Returns
    Type Description
    System.Boolean
    Overrides
    SegmentingTokenizerBase.IncrementWord()
    | Improve this Doc View Source

    Reset()

    Declaration
    public override void Reset()
    Overrides
    SegmentingTokenizerBase.Reset()
    | Improve this Doc View Source

    SetNextSentence(Int32, Int32)

    Declaration
    protected override void SetNextSentence(int sentenceStart, int sentenceEnd)
    Parameters
    Type Name Description
    System.Int32 sentenceStart
    System.Int32 sentenceEnd
    Overrides
    SegmentingTokenizerBase.SetNextSentence(Int32, Int32)

    Implements

    System.IDisposable
    • Improve this Doc
    • View Source
    Back to top Copyright © 2022 The Apache Software Foundation, Licensed under the Apache License, Version 2.0
    Apache Lucene.Net, Lucene.Net, Apache, the Apache feather logo, and the Apache Lucene.Net project logo are trademarks of The Apache Software Foundation.
    All other marks mentioned may be trademarks or registered trademarks of their respective owners.