List of usage examples for the org.apache.lucene.analysis.miscellaneous.WordDelimiterFilter constructor
public WordDelimiterFilter(TokenStream in, byte[] charTypeTable, int configurationFlags, CharArraySet protWords)
From source file:org.elasticsearch.analysis.common.WordDelimiterTokenFilterFactory.java
License:Apache License
/**
 * Wraps the supplied stream in a {@link WordDelimiterFilter}.
 *
 * <p>The filter is built from the enclosing class's {@code charTypeTable}, {@code flags} and
 * {@code protoWords} values, passed as the character-type table, configuration flags and
 * protected-word set respectively.
 *
 * @param tokenStream the upstream token stream to wrap
 * @return a new {@link WordDelimiterFilter} reading from {@code tokenStream}
 */
@Override
public TokenStream create(TokenStream tokenStream) {
    final WordDelimiterFilter delimited =
            new WordDelimiterFilter(tokenStream, charTypeTable, flags, protoWords);
    return delimited;
}
From source file:org.ohdsi.usagi.UsagiAnalyzer.java
License:Apache License
/**
 * Builds the analysis chain for a field.
 *
 * <p>The text is tokenized by a {@link StandardTokenizer} and then passed, in order, through
 * {@link StandardFilter}, {@link EnglishPossessiveFilter}, {@link LowerCaseFilter},
 * {@link PorterStemFilter} and {@link WordDelimiterFilter}.
 *
 * @param fieldName name of the field being analyzed; not used by this implementation
 * @param reader source of the text to tokenize
 * @return the tokenizer paired with the last filter of the chain
 */
@Override
protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
    final Tokenizer source = new StandardTokenizer(matchVersion, reader);

    TokenStream result = new StandardFilter(matchVersion, source);
    result = new EnglishPossessiveFilter(matchVersion, result);
    result = new LowerCaseFilter(matchVersion, result);
    result = new PorterStemFilter(result);

    // The third constructor argument is a bit set of *configuration* flags. It is spelled here
    // with the configuration constants instead of the character-type constants ALPHANUM (0x07)
    // and SUBWORD_DELIM (0x08): those are meant for classifying characters, and their bits
    // coincide exactly with the four GENERATE_*/CATENATE_* flags below, so the resulting value
    // (and therefore the filter's behaviour) is unchanged.
    final int delimiterFlags = WordDelimiterFilter.GENERATE_WORD_PARTS
            | WordDelimiterFilter.GENERATE_NUMBER_PARTS
            | WordDelimiterFilter.CATENATE_WORDS
            | WordDelimiterFilter.CATENATE_NUMBERS
            | WordDelimiterFilter.SPLIT_ON_NUMERICS;

    // A null protected-word set is passed, as before.
    result = new WordDelimiterFilter(matchVersion, result, delimiterFlags, null);

    return new TokenStreamComponents(source, result);
}