List of usage examples for the org.apache.hadoop.io.Text write method
@Override public void write(DataOutput out) throws IOException
From source file:org.zuinnote.hadoop.office.format.common.dao.SpreadSheetCellDAO.java
License:Apache License
/** Writable **/ @Override/* w w w. j av a 2s. c o m*/ public void write(DataOutput dataOutput) throws IOException { Text formattedValueText = new Text(""); if (formattedValue != null) { formattedValueText = new Text(formattedValue); } Text commentText = new Text(""); if (comment != null) { commentText = new Text(comment); } Text formulaText = new Text(""); if (formula != null) { formulaText = new Text(formula); } Text addressText = new Text(""); if (address != null) { addressText = new Text(address); } Text sheetNameText = new Text(""); if (sheetName != null) { sheetNameText = new Text(sheetName); } formattedValueText.write(dataOutput); commentText.write(dataOutput); formulaText.write(dataOutput); addressText.write(dataOutput); sheetNameText.write(dataOutput); }
From source file:uk.ac.cam.eng.rule.retrieval.HFileRuleQuery.java
License:Apache License
@SuppressWarnings("unchecked") @Override// w ww.j a v a 2 s.c om public void run() { List<Text> sortedQuery = new ArrayList<>(query); query.clear(); StopWatch stopWatch = new StopWatch(); System.out.println("Sorting query"); stopWatch.start(); Collections.sort(sortedQuery, new MergeComparator()); System.out.printf("Query sort took %d seconds\n", stopWatch.getTime() / 1000); stopWatch.reset(); stopWatch.start(); try { for (Text source : sortedQuery) { SidePattern sourcePattern = SidePattern.getPattern(source.toString()); tempOut.reset(); source.write(tempOut); if (!bf.contains(tempOut.getData(), 0, tempOut.getLength(), null)) { continue; } if (reader.seek(source)) { if (retriever.testVocab.contains(source)) { synchronized (retriever.foundTestVocab) { retriever.foundTestVocab.add(source); } } Set<RuleWritable> existingRules = new HashSet<>(); List<Pair<RuleWritable, AlignmentAndFeatureMap>> allFiltered = new ArrayList<>(); List<String> provenances = new ArrayList<>(); provenances.add(""); provenances.addAll(conf.getStringCollection(ProvenanceCountMap.PROV)); for (String provenance : provenances) { if (!retriever.filter.isProvenanceUnion() && !provenance.equals("")) { continue; } SortedSet<Pair<RuleWritable, AlignmentAndFeatureMap>> rules = new TreeSet<Pair<RuleWritable, AlignmentAndFeatureMap>>( retriever.filter.getComparator(provenance)); for (Pair<RuleWritable, AlignmentAndFeatureMap> entry : reader.getRulesForSource()) { RuleWritable rule = entry.getFirst(); AlignmentAndFeatureMap rawFeatures = entry.getSecond(); if (retriever.filter.filterRule(sourcePattern, rule, rawFeatures.getSecond(), provenance)) { continue; } rules.add(Pair.createPair(new RuleWritable(rule), rawFeatures)); } List<Pair<RuleWritable, AlignmentAndFeatureMap>> filtered = retriever.filter .filterRulesBySource(sourcePattern, rules, provenance); for (Pair<RuleWritable, AlignmentAndFeatureMap> ruleFiltered : filtered) { if (!existingRules.contains(ruleFiltered.getFirst())) { 
allFiltered.add(ruleFiltered); existingRules.add(ruleFiltered.getFirst()); } } } queue.addAll(allFiltered); if (queue.size() > BATCH_SIZE) { drainQueue(); } } } drainQueue(); } catch (IOException e) { e.printStackTrace(); System.exit(1); } System.out.printf("Query took %d seconds\n", stopWatch.getTime() / 1000); }
From source file:uk.ac.cam.eng.rule.retrieval.HFileRuleReader.java
License:Apache License
boolean seek(Text source) throws IOException { out.reset();//from w w w.j a v a2s. c om source.write(out); int pos = scanner.seekTo(out.getData(), 0, out.getLength()); if (pos == 0) { key.set(source); return true; } else { return false; } }