Lucene.Net  3.0.3
Lucene.Net is a port of the Lucene search engine library, written in C# and targeted at .NET runtime users.
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Properties Pages
Tags.cs
Go to the documentation of this file.
1 /*
2  * Licensed to the Apache Software Foundation (ASF) under one or more
3  * contributor license agreements. See the NOTICE file distributed with
4  * this work for additional information regarding copyright ownership.
5  * The ASF licenses this file to You under the Apache License, Version 2.0
6  * (the "License"); you may not use this file except in compliance with
7  * the License. You may obtain a copy of the License at
8  *
9  * http://www.apache.org/licenses/LICENSE-2.0
10  *
11  * Unless required by applicable law or agreed to in writing, software
12  * distributed under the License is distributed on an "AS IS" BASIS,
13  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14  * See the License for the specific language governing permissions and
15  * limitations under the License.
16  */
17 
18 using System;
19 
20 namespace Lucene.Net.Demo.Html
21 {
22 
23 
/// <summary>
/// Holds the table of HTML tag openers around which whitespace has to be
/// inserted so that the surrounding text is tokenized properly.
/// </summary>
public sealed class Tags
{
    /// <summary>
    /// All tags for which whitespace has to be inserted for proper tokenization.
    /// Each entry is stored with the tag opener (the tag text without its
    /// closing bracket) as both key and value.
    /// </summary>
    public static readonly System.Collections.Hashtable WS_ELEMS = new System.Collections.Hashtable();

    /// <summary>
    /// Fills <see cref="WS_ELEMS"/> once, when the type is initialized.
    /// </summary>
    static Tags()
    {
        // Kept in the same order in which the entries are registered.
        string[] tagOpeners =
        {
            "<hr", "<hr/", // note that "<hr />" does not need to be listed explicitly
            "<br", "<br/",
            "<p", "</p",
            "<div", "</div",
            "<td", "</td",
            "<li", "</li",
            "<q", "</q",
            "<blockquote", "</blockquote",
            "<dt", "</dt",
            "<h1", "</h1",
            "<h2", "</h2",
            "<h3", "</h3",
            "<h4", "</h4",
            "<h5", "</h5",
            "<h6", "</h6"
        };

        foreach (string opener in tagOpeners)
        {
            // Key and value are the same string.
            WS_ELEMS.Add(opener, opener);
        }
    }
}
65 }