1   /**
2    * Distribution License:
3    * JSword is free software; you can redistribute it and/or modify it under
4    * the terms of the GNU Lesser General Public License, version 2.1 or later
5    * as published by the Free Software Foundation. This program is distributed
6    * in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even
7    * the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
8    * See the GNU Lesser General Public License for more details.
9    *
10   * The License is available on the internet at:
11   *      http://www.gnu.org/copyleft/lgpl.html
12   * or by writing to:
13   *      Free Software Foundation, Inc.
14   *      59 Temple Place - Suite 330
15   *      Boston, MA 02111-1307, USA
16   *
17   * © CrossWire Bible Society, 2007 - 2016
18   *
19   */
20  package org.crosswire.jsword.index.lucene.analysis;
21  
22  import java.io.IOException;
23  import java.io.Reader;
24  
25  import org.apache.lucene.analysis.TokenStream;
26  import org.apache.lucene.analysis.cn.ChineseAnalyzer;
27  
28  /**
29   * Uses org.apache.lucene.analysis.cn.ChineseAnalyzer Analysis:
30   * ChineseTokenizer, ChineseFilter StopFilter, Stemming not implemented yet
31   * 
32   * Note: org.apache.lucene.analysis.cn.CJKAnalyzer takes overlapping two
33   * character tokenization approach which leads to larger index size.
34   * 
35   * @see gnu.lgpl.License The GNU Lesser General Public License for details.
36   * @author Sijo Cherian
37   */
38  public class ChineseLuceneAnalyzer extends AbstractBookAnalyzer {
39      public ChineseLuceneAnalyzer() {
40          myAnalyzer = new ChineseAnalyzer();
41      }
42  
43      /* (non-Javadoc)
44       * @see org.apache.lucene.analysis.Analyzer#tokenStream(java.lang.String, java.io.Reader)
45       */
46      @Override
47      public final TokenStream tokenStream(String fieldName, Reader reader) {
48          return myAnalyzer.tokenStream(fieldName, reader);
49      }
50  
51      /* (non-Javadoc)
52       * @see org.apache.lucene.analysis.Analyzer#reusableTokenStream(java.lang.String, java.io.Reader)
53       */
54      @Override
55      public final TokenStream reusableTokenStream(String fieldName, Reader reader) throws IOException {
56          return myAnalyzer.reusableTokenStream(fieldName, reader);
57      }
58  
59      private ChineseAnalyzer myAnalyzer;
60  }
61