| ChineseLuceneAnalyzer.java |
1 /**
2 * Distribution License:
3 * JSword is free software; you can redistribute it and/or modify it under
4 * the terms of the GNU Lesser General Public License, version 2.1 or later
5 * as published by the Free Software Foundation. This program is distributed
6 * in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even
7 * the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
8 * See the GNU Lesser General Public License for more details.
9 *
10 * The License is available on the internet at:
11 * http://www.gnu.org/copyleft/lgpl.html
12 * or by writing to:
13 * Free Software Foundation, Inc.
14 * 59 Temple Place - Suite 330
15 * Boston, MA 02111-1307, USA
16 *
17 * © CrossWire Bible Society, 2007 - 2016
18 *
19 */
20 package org.crosswire.jsword.index.lucene.analysis;
21
22 import java.io.IOException;
23 import java.io.Reader;
24
25 import org.apache.lucene.analysis.TokenStream;
26 import org.apache.lucene.analysis.cn.ChineseAnalyzer;
27
28 /**
29 * Uses org.apache.lucene.analysis.cn.ChineseAnalyzer Analysis:
30 * ChineseTokenizer, ChineseFilter StopFilter, Stemming not implemented yet
31 *
32 * Note: org.apache.lucene.analysis.cn.CJKAnalyzer takes overlapping two
33 * character tokenization approach which leads to larger index size.
34 *
35 * @see gnu.lgpl.License The GNU Lesser General Public License for details.
36 * @author Sijo Cherian
37 */
38 public class ChineseLuceneAnalyzer extends AbstractBookAnalyzer {
39 public ChineseLuceneAnalyzer() {
40 myAnalyzer = new ChineseAnalyzer();
41 }
42
43 /* (non-Javadoc)
44 * @see org.apache.lucene.analysis.Analyzer#tokenStream(java.lang.String, java.io.Reader)
45 */
46 @Override
47 public final TokenStream tokenStream(String fieldName, Reader reader) {
48 return myAnalyzer.tokenStream(fieldName, reader);
49 }
50
51 /* (non-Javadoc)
52 * @see org.apache.lucene.analysis.Analyzer#reusableTokenStream(java.lang.String, java.io.Reader)
53 */
54 @Override
55 public final TokenStream reusableTokenStream(String fieldName, Reader reader) throws IOException {
56 return myAnalyzer.reusableTokenStream(fieldName, reader);
57 }
58
59 private ChineseAnalyzer myAnalyzer;
60 }
61