Usage examples for org.apache.mahout.math.NamedVector.getDelegate()
public Vector getDelegate()
From source file:csvToSequence.ConvertToSeqLargeTxtVec.java
public static void main(String[] args) throws IOException { String filename = "/home/ivan/WorkDir/ccFraud.csv"; String outputfilename = "/home/ivan/WorkDir/part-0000"; SequenceFile.Writer writer;/* w w w .j a v a2 s. com*/ Configuration conf = new Configuration(); FileSystem fs = FileSystem.get(conf); Path path = new Path(outputfilename); writer = new SequenceFile.Writer(fs, conf, path, Text.class, VectorWritable.class); VectorWritable vec = new VectorWritable(); BufferedReader br = new BufferedReader(new FileReader(filename)); String s; br.readLine(); //skip line while ((s = br.readLine()) != null) { String[] value = s.split(","); double[] numValue = new double[8]; for (int i = 0; i < 8; i++) numValue[i] = Double.parseDouble(value[i]); if (Integer.parseInt(value[8]) == 1) value[8] = "Fraud/" + value[8]; else value[8] = "Normal/" + value[8]; NamedVector oneV = new NamedVector(new DenseVector(numValue), value[8]); vec.set(oneV.getDelegate()); writer.append(new Text(oneV.getName()), vec); } writer.close(); }
From source file:csvToSequence.ConvertToSeqTextVecWritable.java
public static void main(String[] args) throws FileNotFoundException, IOException { String filename = "/home/ivan/WorkDir/ccFraud.csv"; String outputfilename = "/home/ivan/WorkDir/part-0000"; SequenceFile.Writer writer;/*from w ww . j av a 2s .c o m*/ Configuration conf = new Configuration(); List<NamedVector> namedVectors = new ArrayList<>(); /*Integer i = 1; CSVVectorIterator vectorCSVVectorIterator = new CSVVectorIterator(new FileReader(filename)); //System.out.println("Densvector"+vec.next()): while(vectorCSVVectorIterator.hasNext()){ NamedVector vecIt = new NamedVector(vectorCSVVectorIterator.next(),i.toString()); namedVectors.add(vecIt); i++; }*/ BufferedReader br = new BufferedReader(new FileReader(filename)); String s; br.readLine(); //skip line while ((s = br.readLine()) != null) { String[] value = s.split(","); double[] numValue = new double[8]; for (int i = 0; i < 8; i++) numValue[i] = Double.parseDouble(value[i]); if (Integer.parseInt(value[8]) == 1) value[8] = "Fraud/" + value[8]; else value[8] = "Normal/" + value[8]; NamedVector oneV = new NamedVector(new DenseVector(numValue), value[8]); namedVectors.add(oneV); } FileSystem fs = FileSystem.get(conf); Path path = new Path(outputfilename); writer = new SequenceFile.Writer(fs, conf, path, Text.class, VectorWritable.class); VectorWritable vec = new VectorWritable(); for (NamedVector iter : namedVectors) { vec.set(iter.getDelegate()); writer.append(new Text(iter.getName()), vec); } writer.close(); /*try (SequenceFile.Reader reader = new SequenceFile.Reader(fs,path, conf)) { Text key = new Text(); VectorWritable value = new VectorWritable(); while (reader.next(key, value)) { System.out.println(key + " "+ value); } }*/ }