Java String Tokenize unpackConllSentenceToTokens(String input)

Here you can find the source of unpackConllSentenceToTokens(String input)

Description

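Unpacks a CoNLL-formatted sentence into tokens: the input is split into lines (one word per line), and each line is split on tab characters into its fields.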

License

Open Source License

Declaration

public static List<List<String>> unpackConllSentenceToTokens(String input) 

Method Source Code

//package com.java2s;
/*
 * Copyright (C) 2015 ikonstas
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 */

import java.util.ArrayList;
import java.util.Arrays;

import java.util.List;

/**
 * Static helpers for splitting CoNLL-style text (one word per line, tab-separated
 * fields per word) into lists, plus a few small array utilities.
 */
public class Main {
    /**
     * Splits a sentence into words (on newlines) and each word into its fields (on tabs).
     *
     * @param input the sentence text; must not be {@code null}
     * @return a new mutable list holding one mutable list of fields per line of {@code input}
     */
    public static List<List<String>> unpackConllSentenceToTokens(String input) {
        List<String> words = unpackConllSentence(input);
        // Explicit type arguments instead of a raw ArrayList: avoids the unchecked conversion.
        List<List<String>> tokens = new ArrayList<List<String>>(words.size());
        for (String word : words) {
            tokens.add(unpackConllWord(word));
        }
        return tokens;
    }

    /**
     * Splits a sentence into its lines, i.e. one entry per word.
     *
     * @param input the sentence text; must not be {@code null}
     * @return a new mutable list of the newline-separated pieces of {@code input}
     */
    public static List<String> unpackConllSentence(String input) {
        return unpack(input, "\n");
    }

    /**
     * Adds a scalar to every element of an array, in place.
     *
     * @param a the array to modify
     * @param b the value added to each element
     * @return the same array instance {@code a}, after modification
     */
    public static double[] add(double[] a, double b) {
        for (int i = 0; i < a.length; i++) {
            a[i] += b;
        }
        return a;
    }

    /**
     * Adds {@code scale * b[i]} to each {@code a[i]}, in place.
     *
     * @param a     the array to modify
     * @param scale the factor applied to each element of {@code b}
     * @param b     the array to add; needs at least {@code a.length} elements, since the
     *              loop indexes it over the full length of {@code a}
     * @return the same array instance {@code a}, after modification
     */
    public static double[] add(double[] a, double scale, double[] b) {
        for (int i = 0; i < a.length; i++) {
            a[i] += scale * b[i];
        }
        return a;
    }

    /**
     * Splits a single word line into its tab-separated fields.
     *
     * @param input the word line; must not be {@code null}
     * @return a new mutable list of the tab-separated pieces of {@code input}
     */
    public static List<String> unpackConllWord(String input) {
        return unpack(input, "\t");
    }

    /**
     * Splits a string around matches of a delimiter and copies the pieces into a new list.
     *
     * <p>The delimiter is passed to {@link String#split(String)}, so it is interpreted as a
     * regular expression and trailing empty pieces are not included in the result.
     *
     * @param input     the text to split; must not be {@code null}
     * @param delimiter the regular expression to split around
     * @return a new mutable list of the pieces, in order
     */
    public static List<String> unpack(String input, String delimiter) {
        // Copy out of the fixed-size Arrays.asList view so callers get a resizable list.
        return new ArrayList<String>(Arrays.asList(input.split(delimiter)));
    }

    /**
     * Boxes an {@code int} array into a list, preserving order.
     *
     * @param ar the values to copy
     * @return a new mutable list containing the elements of {@code ar}
     */
    public static List<Integer> asList(int[] ar) {
        List<Integer> boxed = new ArrayList<Integer>(ar.length);
        for (int value : ar) {
            boxed.add(value);
        }
        return boxed;
    }
}

Related

  1. tokenizeToStringArray(String str, String seperators)
  2. tokenizeWhitespace(String input)
  3. tokens(String exp)
  4. toStringToArray(String str, String token)
  5. toTokens(String s)