List of usage examples for the org.apache.mahout.vectorizer.encoders.LuceneTextValueEncoder constructor
public LuceneTextValueEncoder(String name)
From source file: de.isabeldrostfromm.sof.naive.Vectoriser.java
License: Open Source License
/**
 * Encodes a piece of text into a sparse vector by means of a
 * {@code LuceneTextValueEncoder}.
 *
 * <p>The encoder is created with the name {@code "sof"}, is given a
 * {@code StandardAnalyzer} built for {@code Version.LUCENE_36}, and has its
 * probe count set to {@code probes} before the text is added.
 *
 * @param probes value handed to the encoder's {@code setProbes} and also used
 *               as the constructor argument of the resulting vector
 * @param text   the text to be encoded
 * @return the {@code SequentialAccessSparseVector} the encoder was flushed into
 */
private static Vector luceneEncode(int probes, String text) {
    LuceneTextValueEncoder textEncoder = new LuceneTextValueEncoder("sof");
    textEncoder.setProbes(probes);
    textEncoder.setAnalyzer(new StandardAnalyzer(Version.LUCENE_36));

    textEncoder.addText(text);

    // NOTE(review): probes is reused here as the vector's constructor argument
    // (presumably its cardinality) — confirm this coupling is intended.
    Vector encoded = new SequentialAccessSparseVector(probes);

    // Flush the previously added text into the vector, passing 1 as the first
    // argument (presumably the weight — verify against the encoder API).
    textEncoder.flush(1, encoded);
    return encoded;
}