List of usage examples for the org.apache.lucene.analysis.cn.smart.HMMChineseTokenizer constructor
public HMMChineseTokenizer(AttributeFactory factory)
From source file: cn.tung.javacn.pinyin.SimpleChineseAnalyzer.java
License:Apache License
@Override public TokenStreamComponents createComponents(String fieldName, Reader reader) { final Tokenizer tokenizer = new HMMChineseTokenizer(reader); TokenStream result = new PorterStemFilter(tokenizer); if (!stopWords.isEmpty()) { result = new StopFilter(result, stopWords); }//from w w w.j a v a 2s . c om return new TokenStreamComponents(tokenizer, result); }