Usage examples for the org.apache.lucene.analysis.charfilter.MappingCharFilter constructor
public MappingCharFilter(NormalizeCharMap normMap, Reader in)
From source file:com.google.gerrit.lucene.CustomMappingAnalyzer.java
License:Apache License
/**
 * Wraps the given reader in a {@link MappingCharFilter} whose rules are taken
 * from the entries of {@code customMappings}.
 *
 * @param fieldName name of the field being analyzed; not consulted here
 * @param reader character source to wrap
 * @return a {@code MappingCharFilter} reading from {@code reader}
 */
@Override
protected Reader wrapReader(String fieldName, Reader reader) {
    final NormalizeCharMap.Builder mapBuilder = new NormalizeCharMap.Builder();
    // Register each configured key/value pair as one mapping rule.
    for (Map.Entry<String, String> mapping : customMappings.entrySet()) {
        final String match = mapping.getKey();
        final String replacement = mapping.getValue();
        mapBuilder.add(match, replacement);
    }
    final NormalizeCharMap charMap = mapBuilder.build();
    return new MappingCharFilter(charMap, reader);
}
From source file:com.netcrest.pado.index.provider.lucene.analyzer.ExtendedEnglishAnalyzer.java
License:Open Source License
@Override protected Reader initReader(String fieldName, Reader reader) { // TODO Auto-generated method stub NormalizeCharMap.Builder builder = new NormalizeCharMap.Builder(); builder.add(".", " "); //builder.add("_", " "); NormalizeCharMap normMap = builder.build(); return new MappingCharFilter(normMap, reader); }
From source file:jp.co.atware.solr.analizers.cjk.MultistageMappingCharFilterFactory.java
License:Apache License
/**
 * Chains one {@link MappingCharFilter} per entry of {@code normMapList} around
 * the given reader, in list order. {@code null} entries are skipped.
 *
 * @param input character source to wrap
 * @return the outermost filter, or {@code input} itself when no non-null map
 *         was encountered
 */
@Override
public Reader create(Reader input) {
    Reader chained = input;
    for (NormalizeCharMap stage : normMapList) {
        if (stage == null) {
            // Nothing to apply for this stage; keep the current reader.
            continue;
        }
        chained = new MappingCharFilter(stage, chained);
    }
    return chained;
}
From source file:org.elasticsearch.analysis.common.MappingCharFilterFactory.java
License:Apache License
/**
 * Wraps the given reader in a {@link MappingCharFilter} that uses this
 * factory's {@code normMap}.
 *
 * @param tokenStream character source to wrap (a {@link Reader}, despite the
 *        parameter's name)
 * @return a new {@code MappingCharFilter} reading from {@code tokenStream}
 */
@Override
public Reader create(Reader tokenStream) {
    final Reader mapped = new MappingCharFilter(normMap, tokenStream);
    return mapped;
}
From source file:org.elasticsearch.index.analysis.PatternTokenizerTests.java
License:Apache License
@Test public void testOffsetCorrection() throws Exception { final String INPUT = "Günther Günther is here"; // create MappingCharFilter List<String> mappingRules = new ArrayList<>(); mappingRules.add("\"ü\" => \"\""); NormalizeCharMap.Builder builder = new NormalizeCharMap.Builder(); builder.add("ü", ""); NormalizeCharMap normMap = builder.build(); CharFilter charStream = new MappingCharFilter(normMap, new StringReader(INPUT)); // create PatternTokenizer Tokenizer stream = new PatternTokenizer(newAttributeFactory(), Pattern.compile("[,;/\\s]+"), -1); stream.setReader(charStream);/* w w w . ja v a2 s. c o m*/ assertTokenStreamContents(stream, new String[] { "Gnther", "Gnther", "is", "here" }, new int[] { 0, 13, 26, 29 }, new int[] { 12, 25, 28, 33 }, INPUT.length()); charStream = new MappingCharFilter(normMap, new StringReader(INPUT)); stream = new PatternTokenizer(newAttributeFactory(), Pattern.compile("Gnther"), 0); stream.setReader(charStream); assertTokenStreamContents(stream, new String[] { "Gnther", "Gnther" }, new int[] { 0, 13 }, new int[] { 12, 25 }, INPUT.length()); }