Example usage for edu.stanford.nlp.util StringUtils join

Introduction

On this page you can find example usages of edu.stanford.nlp.util.StringUtils.join.

Prototype

public static String join(Object[] elements)

Source Link

Document

Joins elements with a space.

Usage

From source file:knu.univ.lingvo.coref.Mention.java

License:Open Source License

/**
 * Builds a space-joined pattern string from the given tokens.
 *
 * <p>For each token, in order:
 * <ul>
 *   <li>the token whose index equals the head word's index contributes its lemma;</li>
 *   <li>an "and" or punctuation token sitting between two neighbours that carry the
 *       same NER tag contributes nothing;</li>
 *   <li>the token directly before the head word whose NER tag equals {@code nerString}
 *       contributes its lemma;</li>
 *   <li>any other token with a NER tag different from {@code "O"} contributes a
 *       {@code <TAG>} placeholder, emitted once per run of identical tags;</li>
 *   <li>every remaining token contributes its lemma.</li>
 * </ul>
 *
 * <p>Neighbours are looked up by the token's position in {@code pTokens} rather than
 * via {@code indexOf}, so tokens that compare equal to an earlier token are still
 * evaluated against their own neighbours.
 *
 * <p>NOTE(review): {@code headWord} and {@code nerString} are fields declared outside
 * this snippet; presumably the mention's head token and its NER tag - confirm.
 *
 * @param pTokens the tokens to turn into a pattern
 * @return the collected pattern elements joined by {@code StringUtils.join}
 */
public String getPattern(List<CoreLabel> pTokens) {

    List<String> phraseParts = new ArrayList<String>();
    // NER tag of the placeholder run currently being emitted; "" when no run is open.
    String ne = "";
    final int tokenCount = pTokens.size();
    for (int i = 0; i < tokenCount; i++) {
        CoreLabel token = pTokens.get(i);
        if (token.index() == headWord.index()) {
            phraseParts.add(token.lemma());
            ne = "";

        } else if ((token.lemma().equals("and") || StringUtils.isPunct(token.lemma()))
                && tokenCount > i + 1 && i > 0
                && pTokens.get(i + 1).ner().equals(pTokens.get(i - 1).ner())) {
            // Intentionally empty: a conjunction/punctuation between two tokens with the
            // same NER tag is dropped, and `ne` is left untouched so the following token
            // can continue the current placeholder run.

        } else if (token.index() == headWord.index() - 1 && token.ner().equals(nerString)) {
            phraseParts.add(token.lemma());
            ne = "";

        } else if (!token.ner().equals("O")) {
            // Emit one placeholder per run of identical NER tags.
            if (!token.ner().equals(ne)) {
                ne = token.ner();
                phraseParts.add("<" + ne + ">");
            }

        } else {
            phraseParts.add(token.lemma());
            ne = "";
        }
    }
    return StringUtils.join(phraseParts);
}

From source file:org.seasr.meandre.components.analytics.psychometrics.LIWC.java

License:Open Source License

/**
 * Reads the incoming tokens, counts word classes over their joined text using
 * {@code dict}, and pushes the per-class counts, the total word count and the
 * original token input to the component outputs.
 *
 * <p>If counting fails with an {@link IllegalArgumentException}, a warning is logged
 * and an empty result is used. If the result has no entry for the total-words class,
 * the pushed word count is {@code -1}.
 *
 * @param cc the component context providing the input and receiving the outputs
 * @throws Exception propagated from the context or the data-type helpers
 */
@Override
public void executeCallBack(ComponentContext cc) throws Exception {
    final Object tokenInput = cc.getDataComponentFromInput(IN_TOKENS);
    final String[] words = DataTypeParser.parseAsString(tokenInput);

    WordClassCount[] classCounts;
    try {
        classCounts = dict.countClasses(StringUtils.join(words));
    } catch (IllegalArgumentException e) {
        console.warning(String.format("Failed to calculate LIWC values! : %s", e.getMessage()));
        classCounts = new WordClassCount[0];
    }

    // Class name -> number of occurrences.
    final Map<String, Integer> scoresByClass = new Hashtable<String, Integer>();
    for (int i = 0; i < classCounts.length; i++) {
        final WordClassCount entry = classCounts[i];
        scoresByClass.put(dict.getClassName(entry.classId), entry.count);
    }

    final String totalWordsKey = dict.getClassName(WordClassDictionary.CLASS_TOTAL_WORDS);
    final Integer lookedUp = scoresByClass.get(totalWordsKey);
    // -1 marks "no total-words entry present".
    final Integer totalWords = (lookedUp != null) ? lookedUp : Integer.valueOf(-1);
    console.fine(String.format("LIWC counter found %d classes from %d tokens", scoresByClass.size(), totalWords));

    cc.pushDataComponentToOutput(OUT_LIWC_SCORES, BasicDataTypesTools.mapToIntegerMap(scoresByClass, false));
    cc.pushDataComponentToOutput(OUT_WORD_COUNT, BasicDataTypesTools.integerToIntegers(totalWords));
    cc.pushDataComponentToOutput(OUT_TOKENS, tokenInput);
}

From source file:process.PTBTokenizer.java

License:Open Source License

/**
 * Returns a presentable version of the given PTB-tokenized words. Pass in a
 * List of Strings and this method will join the words with spaces and call
 * {@link #ptb2Text(String)} on the output.
 * /*w ww . ja va 2 s  .c o m*/
 * @param ptbWords
 *            A list of String
 * @return A presentable version of the given PTB-tokenized words
 */
public static String ptb2Text(List<String> ptbWords) {
    return ptb2Text(StringUtils.join(ptbWords));
}