List of usage examples for the org.apache.lucene.analysis.fi.FinnishAnalyzer constructor FinnishAnalyzer
public FinnishAnalyzer(CharArraySet stopwords, CharArraySet stemExclusionSet)
From source file: org.elasticsearch.analysis.common.FinnishAnalyzerProvider.java
License:Apache License
FinnishAnalyzerProvider(IndexSettings indexSettings, Environment env, String name, Settings settings) {
super(indexSettings, name, settings);
analyzer = new FinnishAnalyzer(Analysis.parseStopWords(env, settings, FinnishAnalyzer.getDefaultStopSet()),
Analysis.parseStemExclusion(settings, CharArraySet.EMPTY_SET));
analyzer.setVersion(version);//from w w w . ja v a2s . c o m
}
From source file: org.omegat.tokenizer.LuceneFinnishTokenizer.java
License:Open Source License
/**
 * Builds the token stream used to tokenize {@code strOrig}.
 *
 * <p>When {@code stemsAllowed} is {@code false}, a plain {@code StandardTokenizer} over
 * the text is returned. Otherwise the text is run through a {@code FinnishAnalyzer}
 * constructed with either its default stop set ({@code stopWordsAllowed == true}) or an
 * empty set ({@code stopWordsAllowed == false}).
 *
 * @param strOrig          text to tokenize
 * @param stemsAllowed     selects the {@code FinnishAnalyzer} path when {@code true}
 * @param stopWordsAllowed selects the default stop set over an empty one; only consulted
 *                         when {@code stemsAllowed} is {@code true}
 * @return a token stream reading from {@code strOrig}
 */
@Override
protected TokenStream getTokenStream(final String strOrig, final boolean stemsAllowed,
        final boolean stopWordsAllowed) {
    // Non-stemming path: tokenize only, no analyzer involved.
    if (!stemsAllowed) {
        return new StandardTokenizer(getBehavior(), new StringReader(strOrig));
    }

    final Set<?> stopWords;
    if (stopWordsAllowed) {
        stopWords = FinnishAnalyzer.getDefaultStopSet();
    } else {
        stopWords = Collections.EMPTY_SET;
    }

    final FinnishAnalyzer finnishAnalyzer = new FinnishAnalyzer(getBehavior(), stopWords);
    // The field name is passed as an empty string, exactly as before.
    return finnishAnalyzer.tokenStream("", new StringReader(strOrig));
}