List of usage examples for the TaggedWord constructor of class edu.stanford.nlp.ling.TaggedWord
public TaggedWord(Label oldLabel)
TaggedWord. From source file:at.illecker.storm.commons.preprocessor.Preprocessor.java
License:Apache License
/**
 * Wraps a token in a {@link TaggedWord} and, when one of the known categories
 * applies, assigns a tag before the token is handed on.
 *
 * <p>Categories are checked in a fixed priority order and the first match wins:
 * hashtag ("HT"), user ("USR"), URL ("URL"), retweet ("RT"), name entity
 * ("NNP"), then interjection or emoticon ("UH"). If nothing matches, no tag is
 * set on the returned word.
 *
 * @param token the token text to wrap
 * @param tokenIsHashTag whether the caller classified the token as a hashtag
 * @param tokenIsUser whether the caller classified the token as a user
 * @param tokenIsURL whether the caller classified the token as a URL
 * @return a new {@link TaggedWord} for {@code token}, tagged if a category matched
 */
private TaggedWord pretagToken(String token, boolean tokenIsHashTag, boolean tokenIsUser, boolean tokenIsURL) {
    final String tag;

    if (tokenIsHashTag) {
        tag = "HT";
    } else if (tokenIsUser) {
        tag = "USR";
    } else if (tokenIsURL) {
        tag = "URL";
    } else if (StringUtils.isRetweet(token)) {
        tag = "RT";
    } else if (m_nameEntities.isNameEntity(token)) {
        if (LOGGING) {
            LOG.info("NameEntity labelled for " + token);
        }
        tag = "NNP";
    } else if (m_interjections.isInterjection(token) || StringUtils.isEmoticon(token)) {
        if (LOGGING) {
            LOG.info("Interjection or Emoticon labelled for " + token);
        }
        tag = "UH";
    } else {
        // No category matched: leave the word untagged.
        tag = null;
    }

    final TaggedWord result = new TaggedWord(token);
    if (tag != null) {
        result.setTag(tag);
    }
    return result;
}
From source file:de.tudarmstadt.ukp.dkpro.core.stanfordnlp.StanfordPosTagger.java
License:Open Source License
@Override public void process(JCas aJCas) throws AnalysisEngineProcessException { CAS cas = aJCas.getCas();// ww w . j av a2 s . c o m modelProvider.configure(cas); posMappingProvider.configure(cas); for (Sentence sentence : select(aJCas, Sentence.class)) { List<Token> tokens = selectCovered(aJCas, Token.class, sentence); List<HasWord> words = new ArrayList<HasWord>(tokens.size()); for (Token t : tokens) { words.add(new TaggedWord(t.getCoveredText())); } if (ptb3Escaping) { words = CoreNlpUtils.applyPtbEscaping(words, quoteBegin, quoteEnd); } List<TaggedWord> taggedWords = modelProvider.getResource().tagSentence(words); int i = 0; for (Token t : tokens) { TaggedWord tt = taggedWords.get(i); Type posTag = posMappingProvider.getTagType(tt.tag()); POS posAnno = (POS) cas.createAnnotation(posTag, t.getBegin(), t.getEnd()); posAnno.setStringValue(posTag.getFeatureByBaseName("PosValue"), internStrings ? tt.tag().intern() : tt.tag()); posAnno.addToIndexes(); t.setPos(posAnno); i++; } } }