terasort.processors.PartitionProcessor.java Source code

Introduction

Here is the source code for terasort.processors.PartitionProcessor.java
Source

/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 * <p/>
 * http://www.apache.org/licenses/LICENSE-2.0
 * <p/>
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package terasort.processors;

import com.google.common.collect.Lists;
import org.apache.hadoop.conf.Configurable;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.MRJobConfig;
import org.apache.tez.mapreduce.processor.SimpleMRProcessor;
import org.apache.tez.runtime.api.ProcessorContext;
import org.apache.tez.runtime.library.api.KeyValuesWriter;
import org.apache.tez.runtime.library.api.Partitioner;
import org.apache.tez.runtime.library.common.readers.UnorderedKVReader;
import terasort.TeraSort;

import java.io.DataInputStream;
import java.io.IOException;
import java.io.PrintStream;
import java.util.List;

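/**
 * Reads the split points emitted by the sampler vertex and builds a
 * partitioning trie from them, then forwards every record read from the
 * scan vertex to the sink vertex.
 */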
public class PartitionProcessor extends SimpleMRProcessor {

    // Partition lookup trie. Assigned in run() and read by
    // TotalOrderPartitioner.getPartition(); it is static because the
    // partitioner is a static nested class that holds no reference to a
    // processor instance.
    // NOTE(review): being static, the trie is shared by every processor
    // instance loaded in the same JVM - confirm that is intended.
    private static TrieNode trie;

    /**
     * Creates the processor; the context is handed straight to the superclass.
     *
     * @param context the processor context passed through to SimpleMRProcessor
     */
    public PartitionProcessor(ProcessorContext context) {
        super(context);
    }

    /**
     * Builds the partitioning trie from the sampler output, then copies every
     * record from the scan input to the sink output.
     *
     * <p>Steps:
     * <ol>
     *   <li>Read every key from the {@code SAMPLER_VERTEX} input; each key is a
     *       split point.</li>
     *   <li>Build the trie over those split points and publish it through the
     *       static {@code trie} field so that {@link TotalOrderPartitioner}
     *       can use it.</li>
     *   <li>Stream all key/value pairs from the {@code SCAN_VERTEX} input to
     *       the {@code SINK_VERTEX} writer unchanged.</li>
     * </ol>
     *
     * <p>The split points are used in the order they are read; {@code buildTrie}
     * documents that it expects them sorted, so the sampler is presumably
     * emitting them in sorted order (not verifiable from this class).
     *
     * @throws Exception if reading an input or writing the output fails
     */
    @Override
    public void run() throws Exception {
        UnorderedKVReader reader = (UnorderedKVReader) (getInputs().get(TeraSort.SAMPLER_VERTEX).getReader());
        List<Text> splitPoints = Lists.newArrayList();
        while (reader.next()) {
            // Defensive copy: the reader may hand back the same Text instance
            // on every call and overwrite its contents on next(). Storing the
            // reference would then leave every list entry aliasing the last
            // key that was read.
            splitPoints.add(new Text((Text) reader.getCurrentKey()));
        }
        Text[] splits = splitPoints.toArray(new Text[splitPoints.size()]);
        // Depth of the byte-indexed part of the trie; below this depth the
        // leaves fall back to comparing against the split points directly.
        final int maxTrieDepth = 2;
        trie = buildTrie(splits, 0, splits.length, new Text(), maxTrieDepth);

        UnorderedKVReader dataReader = (UnorderedKVReader) (getInputs().get(TeraSort.SCAN_VERTEX).getReader());
        KeyValuesWriter writer = (KeyValuesWriter) getOutputs().get(TeraSort.SINK_VERTEX).getWriter();
        while (dataReader.next()) {
            // Records are written immediately, so no copy is needed here.
            Object key = dataReader.getCurrentKey();
            Object val = dataReader.getCurrentValue();
            writer.write(key, val);
        }
    }

    /**
     * Base type for all nodes of the partitioning trie. Every node remembers
     * the depth (level) at which it sits in the trie.
     */
    abstract static class TrieNode {
        // Depth of this node; fixed at construction time.
        private final int level;

        /**
         * @param level the depth of this node in the trie
         */
        TrieNode(int level) {
            this.level = level;
        }

        /**
         * @return the depth that was passed to the constructor
         */
        int getLevel() {
            return this.level;
        }

        /**
         * Looks up the partition for the given key.
         *
         * @param key the key to look up
         * @return the partition index for the key
         */
        abstract int findPartition(Text key);

        /**
         * Writes a textual dump of this node to the given stream.
         *
         * @param strm the stream to print to
         * @throws IOException declared for implementations that may fail while printing
         */
        abstract void print(PrintStream strm) throws IOException;
    }

    /**
     * An inner trie node that contains 256 children based on the next
     * character.
     */
    static class InnerTrieNode extends TrieNode {
        private TrieNode[] child = new TrieNode[256];

        InnerTrieNode(int level) {
            super(level);
        }

        int findPartition(Text key) {
            int level = getLevel();
            if (key.getLength() <= level) {
                return child[0].findPartition(key);
            }
            return child[key.getBytes()[level] & 0xff].findPartition(key);
        }

        void setChild(int idx, TrieNode child) {
            this.child[idx] = child;
        }

        void print(PrintStream strm) throws IOException {
            for (int ch = 0; ch < 256; ++ch) {
                for (int i = 0; i < 2 * getLevel(); ++i) {
                    strm.print(' ');
                }
                strm.print(ch);
                strm.println(" ->");
                if (child[ch] != null) {
                    child[ch].print(strm);
                }
            }
        }
    }

    /**
     * A leaf trie node that does string compares to figure out where the given
     * key belongs between lower..upper.
     */
    static class LeafTrieNode extends TrieNode {
        int lower;
        int upper;
        Text[] splitPoints;

        LeafTrieNode(int level, Text[] splitPoints, int lower, int upper) {
            super(level);
            this.splitPoints = splitPoints;
            this.lower = lower;
            this.upper = upper;
        }

        int findPartition(Text key) {
            for (int i = lower; i < upper; ++i) {
                if (splitPoints[i].compareTo(key) > 0) {
                    return i;
                }
            }
            return upper;
        }

        void print(PrintStream strm) throws IOException {
            for (int i = 0; i < 2 * getLevel(); ++i) {
                strm.print(' ');
            }
            strm.print(lower);
            strm.print(", ");
            strm.println(upper);
        }
    }

    /**
     * Recursively builds a lookup trie over a sorted array of cut points.
     *
     * <p>A leaf is produced when the prefix is already {@code maxDepth} bytes
     * long or when the range {@code lower..upper} is empty. Otherwise an inner
     * node is created and the range is carved into 256 consecutive sub-ranges,
     * one per possible next byte. The sub-range for byte {@code ch} (0..254)
     * ends at the first cut point that is not smaller than the prefix followed
     * by {@code ch + 1}; byte 255 receives whatever remains.
     *
     * @param splits   the list of cut points, expected in sorted order
     * @param lower    first cut point index covered by this subtree
     * @param upper    end (exclusive) of the cut point indexes covered by this subtree
     * @param prefix   the key bytes already fixed on the path to this node
     * @param maxDepth the maximum prefix length for which inner nodes are built
     * @return the root of the subtree covering {@code lower..upper}
     */
    private static TrieNode buildTrie(Text[] splits, int lower, int upper, Text prefix, int maxDepth) {
        final int depth = prefix.getLength();
        if (lower == upper || depth >= maxDepth) {
            return new LeafTrieNode(depth, splits, lower, upper);
        }

        final InnerTrieNode node = new InnerTrieNode(depth);
        // Working key: the prefix plus one extra byte that is rewritten below.
        final Text probe = new Text(prefix);
        probe.append(new byte[1], 0, 1);

        int boundary = lower;
        for (int ch = 0; ch < 255; ++ch) {
            final int start = boundary;
            // Temporarily use the next byte value as the exclusive upper limit
            // for this child's range.
            probe.getBytes()[depth] = (byte) (ch + 1);
            while (boundary < upper && splits[boundary].compareTo(probe) < 0) {
                boundary += 1;
            }
            // Restore the byte so the recursive call sees this child's own prefix.
            probe.getBytes()[depth] = (byte) ch;
            node.setChild(ch, buildTrie(splits, start, boundary, probe, maxDepth));
        }

        // The last child takes every cut point that has not been assigned yet.
        probe.getBytes()[depth] = (byte) 255;
        node.setChild(255, buildTrie(splits, boundary, upper, probe, maxDepth));
        return node;
    }

    /**
     * Partitioner that assigns text keys to partitions by looking them up in
     * the trie held in the enclosing class's static {@code trie} field, so that
     * partitions follow a global sort order.
     */
    public static class TotalOrderPartitioner implements Partitioner {

        /**
         * Returns the partition the trie reports for the key.
         *
         * @param key           the record key; must be a {@link Text}
         * @param value         the record value; not consulted
         * @param numPartitions the number of partitions; not consulted
         * @return the partition index found by the trie lookup
         */
        @Override
        public int getPartition(Object key, Object value, int numPartitions) {
            final Text textKey = (Text) key;
            return trie.findPartition(textKey);
        }
    }
}