Example usage for org.apache.lucene.analysis.de GermanAnalyzer GermanAnalyzer

List of usage examples for org.apache.lucene.analysis.de GermanAnalyzer GermanAnalyzer

Introduction

On this page you can find example usages of the org.apache.lucene.analysis.de.GermanAnalyzer constructor.

Prototype

public GermanAnalyzer(CharArraySet stopwords, CharArraySet stemExclusionSet) 

Source Link

Document

Builds an analyzer with the given stop words and stem exclusion set.

Usage

From source file:de.ingrid.interfaces.csw.tools.LuceneTools.java

License:EUPL

/**
 * Creates a new analyzer instance.
 *
 * <p>In a Spring environment this method is meant to be overridden via method
 * injection so that it returns a new analyzer instance. In a non-Spring
 * environment it returns a new default (German) analyzer.
 *
 * @return a new {@link GermanAnalyzer} created for {@code Version.LUCENE_36}
 *         with an empty stop word set
 */
public Analyzer createAnalyzer() {
    // Parameterized empty set instead of a raw HashSet to avoid unchecked/raw-type warnings.
    return new GermanAnalyzer(Version.LUCENE_36, new HashSet<String>());
}

From source file:org.elasticsearch.analysis.common.GermanAnalyzerProvider.java

License:Apache License

GermanAnalyzerProvider(IndexSettings indexSettings, Environment env, String name, Settings settings) {
    super(indexSettings, name, settings);
    analyzer = new GermanAnalyzer(Analysis.parseStopWords(env, settings, GermanAnalyzer.getDefaultStopSet()),
            Analysis.parseStemExclusion(settings, CharArraySet.EMPTY_SET));
    analyzer.setVersion(version);//from w ww  . ja  v  a  2s .co  m
}

From source file:org.omegat.tokenizer.LuceneGermanTokenizer.java

License:Open Source License

/**
 * Creates the token stream for the given text.
 *
 * <p>Without stemming, the text is tokenized by a plain {@link StandardTokenizer}.
 * With stemming, a {@link GermanAnalyzer} is used; it receives the German stop
 * word list when stop words are allowed and an empty list otherwise.
 *
 * @param strOrig          text to tokenize
 * @param stemsAllowed     whether the German analyzer should be used
 * @param stopWordsAllowed whether the German stop word list is passed to the analyzer
 * @return the token stream over {@code strOrig}
 */
@Override
protected TokenStream getTokenStream(final String strOrig, final boolean stemsAllowed,
        final boolean stopWordsAllowed) {
    // No stemming requested: fall back to the standard tokenizer.
    if (!stemsAllowed) {
        return new StandardTokenizer(getBehavior(), new StringReader(strOrig));
    }

    final String[] stopWords;
    if (stopWordsAllowed) {
        stopWords = GermanAnalyzer.GERMAN_STOP_WORDS;
    } else {
        stopWords = EMPTY_STRING_LIST;
    }

    final GermanAnalyzer analyzer = new GermanAnalyzer(getBehavior(), stopWords);
    return analyzer.tokenStream("", new StringReader(strOrig));
}

From source file:org.thiesen.jiffs.jobs.preprocessor.Preprocessor.java

License:Open Source License

/**
 * Preprocesses the story with an analyzer chosen by the story's language.
 *
 * <p>German stories use a {@link GermanAnalyzer} with the German stop words;
 * every other language uses a {@link StandardAnalyzer} with the English stop words.
 *
 * @param story the story to preprocess
 */
private void preproecessText(StoryDBO story) {
    switch (story.getLanguage()) {
    case GERMAN:
        preprocess(story, new GermanAnalyzer(Version.LUCENE_30, GERMAN_STOP_WORDS));
        break;
    default:
        // Any non-German language is handled by the standard analyzer.
        preprocess(story, new StandardAnalyzer(Version.LUCENE_30, ENGLISH_STOP_WORDS));
        break;
    }
}