Lucene.Net  3.0.3
Lucene.Net is a port of the Lucene search engine library, written in C# and targeted at .NET runtime users.
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Properties Pages
ArabicNormalizationFilter.cs
Go to the documentation of this file.
1 /*
2  * Licensed to the Apache Software Foundation (ASF) under one or more
3  * contributor license agreements. See the NOTICE file distributed with
4  * this work for additional information regarding copyright ownership.
5  * The ASF licenses this file to You under the Apache License, Version 2.0
6  * (the "License"); you may not use this file except in compliance with
7  * the License. You may obtain a copy of the License at
8  *
9  * http://www.apache.org/licenses/LICENSE-2.0
10  *
11  * Unless required by applicable law or agreed to in writing, software
12  * distributed under the License is distributed on an "AS IS" BASIS,
13  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14  * See the License for the specific language governing permissions and
15  * limitations under the License.
16  */
17 
18 using System.IO;
19 using System.Collections;
20 
21 using Lucene.Net.Analysis;
22 using Lucene.Net.Analysis.Tokenattributes;
23 using Lucene.Net.Util;
24 
25 
26 namespace Lucene.Net.Analysis.AR
27 {
28 
29  /*
30  * A <see cref="TokenFilter"/> that applies <see cref="ArabicNormalizer"/> to normalize the orthography.
31  *
32  */
33 
35  {
36 
37  protected ArabicNormalizer normalizer = null;
38  private ITermAttribute termAtt;
39 
40  public ArabicNormalizationFilter(TokenStream input) : base(input)
41  {
42 
43  normalizer = new ArabicNormalizer();
44  termAtt = AddAttribute<ITermAttribute>();
45  }
46 
47  public override bool IncrementToken()
48  {
49  if (input.IncrementToken())
50  {
51  int newlen = normalizer.Normalize(termAtt.TermBuffer(), termAtt.TermLength());
52  termAtt.SetTermLength(newlen);
53  return true;
54  }
55  return false;
56  }
57  }
58 }