Usage examples for the opennlp.tools.postag.POSDictionary constructor POSDictionary()
public POSDictionary()
From source file: es.ehu.si.ixa.pipe.convert.Convert.java
/** * Generates {@code POSDictionary} from a list of monosemic words and its postag. * form\tab\lemma\tabpostag/* w w w. jav a 2 s . c o m*/ * * @param inputLines * the list of words and postag per line * @return the POSDictionary */ private POSDictionary getPOSTaggerDict(List<String> inputLines) { POSDictionary posTaggerDict = new POSDictionary(); ListMultimap<String, String> dictMultiMap = ArrayListMultimap.create(); for (String line : inputLines) { String[] lineArray = line.split("\t"); if (lineArray.length == 3) { if (!lineArray[0].contains("<")) { dictMultiMap.put(lineArray[0], lineArray[2]); } } } for (String token : dictMultiMap.keySet()) { List<String> tags = dictMultiMap.get(token); //add only monosemic words if (tags.size() == 1) { posTaggerDict.put(token, tags.toArray(new String[tags.size()])); } } return posTaggerDict; }