Example usage for the edu.stanford.nlp.ling.TaggedWord constructor

List of usage examples for the edu.stanford.nlp.ling.TaggedWord constructor

Introduction

On this page you can find example usages of the edu.stanford.nlp.ling.TaggedWord constructor.

Prototype

public TaggedWord(Label oldLabel) 

Source Link

Document

Create a new TaggedWord.

Usage

From source file: at.illecker.storm.commons.preprocessor.Preprocessor.java

License:Apache License

/**
 * Wraps {@code token} in a {@link TaggedWord} and assigns a tag when one of the
 * checks below matches. The checks run in a fixed order and the first match wins;
 * if none matches, the word is returned without {@code setTag} ever being called.
 *
 * <p>Check order and the tag each one assigns:
 * <ol>
 *   <li>{@code tokenIsHashTag} - {@code "HT"}</li>
 *   <li>{@code tokenIsUser} - {@code "USR"}</li>
 *   <li>{@code tokenIsURL} - {@code "URL"}</li>
 *   <li>{@code StringUtils.isRetweet(token)} - {@code "RT"}</li>
 *   <li>{@code m_nameEntities.isNameEntity(token)} - {@code "NNP"}</li>
 *   <li>{@code m_interjections.isInterjection(token)} or
 *       {@code StringUtils.isEmoticon(token)} - {@code "UH"}</li>
 * </ol>
 *
 * @param token          the raw token text to wrap
 * @param tokenIsHashTag whether the caller classified the token as a hashtag
 * @param tokenIsUser    whether the caller classified the token as a user mention
 * @param tokenIsURL     whether the caller classified the token as a URL
 * @return the newly created word, tagged if any check matched
 */
private TaggedWord pretagToken(String token, boolean tokenIsHashTag, boolean tokenIsUser, boolean tokenIsURL) {
    final TaggedWord tagged = new TaggedWord(token);

    // Caller-supplied classifications take precedence over the lookups below.
    if (tokenIsHashTag) {
        tagged.setTag("HT");
        return tagged;
    }
    if (tokenIsUser) {
        tagged.setTag("USR");
        return tagged;
    }
    if (tokenIsURL) {
        tagged.setTag("URL");
        return tagged;
    }

    if (StringUtils.isRetweet(token)) {
        tagged.setTag("RT");
        return tagged;
    }

    if (m_nameEntities.isNameEntity(token)) {
        if (LOGGING) {
            LOG.info("NameEntity labelled for " + token);
        }
        tagged.setTag("NNP");
        return tagged;
    }

    // The emoticon check is only evaluated when the interjection lookup fails.
    if (m_interjections.isInterjection(token) || StringUtils.isEmoticon(token)) {
        if (LOGGING) {
            LOG.info("Interjection or Emoticon labelled for " + token);
        }
        tagged.setTag("UH");
        return tagged;
    }

    // No rule matched: hand back the word without a pre-assigned tag.
    return tagged;
}

From source file: de.tudarmstadt.ukp.dkpro.core.stanfordnlp.StanfordPosTagger.java

License:Open Source License

/**
 * Tags every {@code Sentence} in the given JCas and attaches one POS annotation
 * to each {@code Token} the sentence covers.
 *
 * <p>Per sentence: the covered text of each token is wrapped in a
 * {@link TaggedWord}, the word list is optionally passed through
 * {@code CoreNlpUtils.applyPtbEscaping} (when {@code ptb3Escaping} is set), and
 * the result is handed to the tagger obtained from {@code modelProvider}. The
 * i-th tagged word is then paired with the i-th token to create the annotation.
 *
 * @param aJCas the JCas whose sentences and tokens are processed
 * @throws AnalysisEngineProcessException declared by the overridden method
 */
@Override
public void process(JCas aJCas) throws AnalysisEngineProcessException {
    CAS cas = aJCas.getCas();

    // Both providers are configured against the CAS before any sentence is tagged.
    modelProvider.configure(cas);
    posMappingProvider.configure(cas);

    for (Sentence sentence : select(aJCas, Sentence.class)) {
        List<Token> sentenceTokens = selectCovered(aJCas, Token.class, sentence);

        // Build the tagger input: one word per token, in token order.
        List<HasWord> taggerInput = new ArrayList<HasWord>(sentenceTokens.size());
        for (Token token : sentenceTokens) {
            taggerInput.add(new TaggedWord(token.getCoveredText()));
        }

        if (ptb3Escaping) {
            taggerInput = CoreNlpUtils.applyPtbEscaping(taggerInput, quoteBegin, quoteEnd);
        }

        List<TaggedWord> tagged = modelProvider.getResource().tagSentence(taggerInput);

        // Tokens and tagged words are matched purely by position.
        for (int idx = 0; idx < sentenceTokens.size(); idx++) {
            Token token = sentenceTokens.get(idx);
            TaggedWord taggedWord = tagged.get(idx);

            Type posType = posMappingProvider.getTagType(taggedWord.tag());
            POS pos = (POS) cas.createAnnotation(posType, token.getBegin(), token.getEnd());

            String tagValue;
            if (internStrings) {
                tagValue = taggedWord.tag().intern();
            } else {
                tagValue = taggedWord.tag();
            }
            pos.setStringValue(posType.getFeatureByBaseName("PosValue"), tagValue);

            pos.addToIndexes();
            token.setPos(pos);
        }
    }
}