Usage examples for the constructor of org.apache.lucene.analysis.de.GermanAnalyzer
public GermanAnalyzer(CharArraySet stopwords, CharArraySet stemExclusionSet)
From source file:de.ingrid.interfaces.csw.tools.LuceneTools.java
License:EUPL
/** METHOD WILL BE INJECTED BY SPRING TO RETURN NEW INSTANCE OF ANALYZER ! * In non spring environment we return new default analyzer (German). *///from www . j a va 2 s .c o m public Analyzer createAnalyzer() { return new GermanAnalyzer(Version.LUCENE_36, new HashSet()); }
From source file:org.elasticsearch.analysis.common.GermanAnalyzerProvider.java
License:Apache License
GermanAnalyzerProvider(IndexSettings indexSettings, Environment env, String name, Settings settings) { super(indexSettings, name, settings); analyzer = new GermanAnalyzer(Analysis.parseStopWords(env, settings, GermanAnalyzer.getDefaultStopSet()), Analysis.parseStemExclusion(settings, CharArraySet.EMPTY_SET)); analyzer.setVersion(version);//from w ww . ja v a 2s .co m }
From source file:org.omegat.tokenizer.LuceneGermanTokenizer.java
License:Open Source License
/**
 * Creates the token stream used to tokenize {@code strOrig}.
 *
 * <p>Without stemming, the text is fed to a plain {@code StandardTokenizer}. With
 * stemming, it is run through a {@code GermanAnalyzer} whose stop-word array is
 * {@code GermanAnalyzer.GERMAN_STOP_WORDS} when {@code stopWordsAllowed} is true and
 * {@code EMPTY_STRING_LIST} otherwise.
 *
 * @param strOrig          text to tokenize
 * @param stemsAllowed     selects the {@code GermanAnalyzer} path when true
 * @param stopWordsAllowed selects which stop-word array is handed to the analyzer
 * @return a token stream over {@code strOrig}
 */
@Override
protected TokenStream getTokenStream(final String strOrig, final boolean stemsAllowed,
        final boolean stopWordsAllowed) {
    if (!stemsAllowed) {
        return new StandardTokenizer(getBehavior(), new StringReader(strOrig));
    }

    final String[] analyzerStopWords;
    if (stopWordsAllowed) {
        analyzerStopWords = GermanAnalyzer.GERMAN_STOP_WORDS;
    } else {
        analyzerStopWords = EMPTY_STRING_LIST;
    }

    final GermanAnalyzer germanAnalyzer = new GermanAnalyzer(getBehavior(), analyzerStopWords);
    return germanAnalyzer.tokenStream("", new StringReader(strOrig));
}
From source file:org.thiesen.jiffs.jobs.preprocessor.Preprocessor.java
License:Open Source License
/**
 * Preprocesses a story with an analyzer chosen by the story's language.
 *
 * <p>German stories use a {@code GermanAnalyzer} with {@code GERMAN_STOP_WORDS}; every
 * other language falls back to a {@code StandardAnalyzer} with
 * {@code ENGLISH_STOP_WORDS}. Both analyzers are created with
 * {@code Version.LUCENE_30}.
 *
 * @param story the story to preprocess; its language selects the analyzer
 */
private void preproecessText(StoryDBO story) {
    switch (story.getLanguage()) {
    case GERMAN: {
        final GermanAnalyzer germanAnalyzer = new GermanAnalyzer(Version.LUCENE_30, GERMAN_STOP_WORDS);
        preprocess(story, germanAnalyzer);
        break;
    }
    default: {
        // Any non-German language is handled with the standard analyzer.
        final StandardAnalyzer fallbackAnalyzer = new StandardAnalyzer(Version.LUCENE_30, ENGLISH_STOP_WORDS);
        preprocess(story, fallbackAnalyzer);
        break;
    }
    }
}