Lucene.Net  3.0.3
Lucene.Net is a port of the Lucene search engine library, written in C# and targeted at .NET runtime users.
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Properties Pages
RussianLetterTokenizer.cs
Go to the documentation of this file.
1 /*
2  *
3  * Licensed to the Apache Software Foundation (ASF) under one
4  * or more contributor license agreements. See the NOTICE file
5  * distributed with this work for additional information
6  * regarding copyright ownership. The ASF licenses this file
7  * to you under the Apache License, Version 2.0 (the
8  * "License"); you may not use this file except in compliance
9  * with the License. You may obtain a copy of the License at
10  *
11  * http://www.apache.org/licenses/LICENSE-2.0
12  *
13  * Unless required by applicable law or agreed to in writing,
14  * software distributed under the License is distributed on an
15  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
16  * KIND, either express or implied. See the License for the
17  * specific language governing permissions and limitations
18  * under the License.
19  *
20 */
21 
22 using System;
23 using System.IO;
24 using Lucene.Net.Analysis;
25 using Lucene.Net.Util;
26 
27 namespace Lucene.Net.Analysis.Ru
28 {
29  ///<summary>
30  /// A RussianLetterTokenizer is a {@link Tokenizer} that extends {@link LetterTokenizer}
31  /// by also allowing the basic latin digits 0-9.
32  ///</summary>
34  {
35  public RussianLetterTokenizer(TextReader _in)
36  : base(_in)
37  {
38  }
39 
40  public RussianLetterTokenizer(AttributeSource source, TextReader _in)
41  : base(source, _in)
42  {
43  }
44 
45  public RussianLetterTokenizer(AttributeSource.AttributeFactory factory, TextReader __in)
46  : base(factory, __in)
47  {
48  }
49 
50  /*
51  * Collects only characters which satisfy
52  * {@link Character#isLetter(char)}.
53  */
54  protected override bool IsTokenChar(char c)
55  {
56  if (char.IsLetter(c) || (c >= '0' && c <= '9'))
57  return true;
58  else
59  return false;
60  }
61  }
62 }