Lucene.Net  3.0.3
Lucene.Net is a port of the Lucene search engine library, written in C# and targeted at .NET runtime users.
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Properties Pages
PorterStemFilter.cs
Go to the documentation of this file.
1 /*
2  * Licensed to the Apache Software Foundation (ASF) under one or more
3  * contributor license agreements. See the NOTICE file distributed with
4  * this work for additional information regarding copyright ownership.
5  * The ASF licenses this file to You under the Apache License, Version 2.0
6  * (the "License"); you may not use this file except in compliance with
7  * the License. You may obtain a copy of the License at
8  *
9  * http://www.apache.org/licenses/LICENSE-2.0
10  *
11  * Unless required by applicable law or agreed to in writing, software
12  * distributed under the License is distributed on an "AS IS" BASIS,
13  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14  * See the License for the specific language governing permissions and
15  * limitations under the License.
16  */
17 
18 using Lucene.Net.Analysis.Tokenattributes;
19 
20 namespace Lucene.Net.Analysis
21 {
22 
23  /// <summary>Transforms the token stream as per the Porter stemming algorithm.
24  /// Note: the input to the stemming filter must already be in lower case,
25  /// so you will need to use LowerCaseFilter or LowerCaseTokenizer farther
26  /// down the Tokenizer chain in order for this to work properly!
27  /// <p/>
28  /// To use this filter with other analyzers, you'll want to write an
29  /// Analyzer class that sets up the TokenStream chain as you want it.
30  /// To use this with LowerCaseTokenizer, for example, you'd write an
31  /// analyzer like this:
32  /// <p/>
33  /// <code>
34  /// class MyAnalyzer extends Analyzer {
35  /// public final TokenStream tokenStream(String fieldName, Reader reader) {
36  /// return new PorterStemFilter(new LowerCaseTokenizer(reader));
37  /// }
38  /// }
39  /// </code>
40  /// </summary>
41  public sealed class PorterStemFilter:TokenFilter
42  {
43  private readonly PorterStemmer stemmer;
44  private readonly ITermAttribute termAtt;
45 
46  public PorterStemFilter(TokenStream in_Renamed):base(in_Renamed)
47  {
48  stemmer = new PorterStemmer();
49  termAtt = AddAttribute<ITermAttribute>();
50  }
51 
52  public override bool IncrementToken()
53  {
54  if (!input.IncrementToken())
55  return false;
56 
57  if (stemmer.Stem(termAtt.TermBuffer(), 0, termAtt.TermLength()))
58  termAtt.SetTermBuffer(stemmer.ResultBuffer, 0, stemmer.ResultLength);
59  return true;
60  }
61  }
62 }