Example usage for opennlp.tools.postag POSDictionary POSDictionary

List of usage examples for opennlp.tools.postag POSDictionary POSDictionary

Introduction

In this page you can find the example usage for opennlp.tools.postag POSDictionary POSDictionary.

Prototype

public POSDictionary() 

Source Link

Document

Initializes an empty case sensitive POSDictionary .

Usage

From source file:es.ehu.si.ixa.pipe.convert.Convert.java

/**
 * Generates {@code POSDictionary} from a list of monosemic words and its postag.
 * form\tab\lemma\tabpostag/* w  w  w.  jav  a  2 s .  c  o m*/
 * 
 * @param inputLines
 *          the list of words and postag per line
 * @return the POSDictionary
 */
private POSDictionary getPOSTaggerDict(List<String> inputLines) {
    POSDictionary posTaggerDict = new POSDictionary();
    ListMultimap<String, String> dictMultiMap = ArrayListMultimap.create();
    for (String line : inputLines) {
        String[] lineArray = line.split("\t");
        if (lineArray.length == 3) {
            if (!lineArray[0].contains("<")) {
                dictMultiMap.put(lineArray[0], lineArray[2]);
            }
        }
    }
    for (String token : dictMultiMap.keySet()) {
        List<String> tags = dictMultiMap.get(token);
        //add only monosemic words
        if (tags.size() == 1) {
            posTaggerDict.put(token, tags.toArray(new String[tags.size()]));
        }
    }
    return posTaggerDict;
}