List of usage examples for org.apache.lucene.analysis.TokenStream (subclass usage)
From source file lux.search.highlight.StreamingElementTokens.java
/** * Wraps a TokenStream, modifying its CharTermAttribute so as to return * the original term, and the term prefixed by each of its enclosing element's QNames, * in turn. */ public final class StreamingElementTokens extends TokenStream {
From source file net.dataninja.ee.textIndexer.tokenizer.Tokenizer.java
/** A Tokenizer is a TokenStream whose input is a Reader. <p> This is an abstract class. */ public abstract class Tokenizer extends TokenStream {
From source file nl.inl.blacklab.filter.StubTokenStream.java
public class StubTokenStream extends TokenStream { private CharTermAttribute ta; private int i = -1; private String[] terms;
From source file nl.inl.blacklab.index.complex.TokenStreamFromList.java
/** * Takes an Iterable<String> and iterates through it as a TokenStream. * * The Strings are taken as terms, and the position increment is always 1. */ class TokenStreamFromList extends TokenStream {
From source file nl.inl.blacklab.index.complex.TokenStreamWithOffsets.java
/**
* Takes a List<String> plus two List<Integer> instances and iterates through them as a
* TokenStream.
*
* The Strings are taken as terms. The two integer-lists are taken as start chars and end chars.
* Token position increment is always 1.
From source file no.trank.openpipe.solr.analysis.AnnotationTokenStream.java
/** * @version $Revision$ */ public class AnnotationTokenStream extends TokenStream { private ResolvedAnnotation[] anns; private ListIterator<ResolvedAnnotation>[] iterators;
From source file org.alfresco.repo.search.impl.lucene.analysis.MLTokenDuplicator.java
/**
* Create duplicate tokens for multilingual variants. The token forms are: Token - all languages; {fr}Token - if a
* language is specified; {fr_CA}Token - if a language and country are specified; {fr_CA_Variant}Token - for all three;
* {fr__Variant}Token - for a language variant with no country.
*
* @author andyh
From source file org.allenai.blacklab.filter.StubTokenStream.java
public class StubTokenStream extends TokenStream { private CharTermAttribute ta; private int i = -1; private String[] terms;
From source file org.allenai.blacklab.index.complex.TokenStreamFromList.java
/** * Takes an Iterable<String> and iterates through it as a TokenStream. * * The Strings are taken as terms, and the position increment is always 1. */ class TokenStreamFromList extends TokenStream {
From source file org.allenai.blacklab.index.complex.TokenStreamWithOffsets.java
/**
* Takes a List<String> plus two List<Integer> instances and iterates through them as a
* TokenStream.
*
* The Strings are taken as terms. The two integer-lists are taken as start chars and end chars.
* Token position increment is always 1.