org.apache.hadoop.hbase.util.TestRegionSplitter.java Source code

Introduction

Here is the source code for org.apache.hadoop.hbase.util.TestRegionSplitter.java
Source

/**
 *
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.hadoop.hbase.util;

import static org.junit.Assert.assertArrayEquals;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertNotSame;
import static org.junit.Assert.assertTrue;

import java.util.ArrayList;
import java.util.List;
import java.util.Map;

import org.apache.commons.lang.ArrayUtils;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.hbase.HBaseTestingUtility;
import org.apache.hadoop.hbase.HRegionInfo;
import org.apache.hadoop.hbase.MediumTests;
import org.apache.hadoop.hbase.ServerName;
import org.apache.hadoop.hbase.client.HTable;
import org.apache.hadoop.hbase.util.RegionSplitter.HexStringSplit;
import org.apache.hadoop.hbase.util.RegionSplitter.SplitAlgorithm;
import org.apache.hadoop.hbase.util.RegionSplitter.UniformSplit;
import org.junit.AfterClass;
import org.junit.BeforeClass;
import org.junit.Test;
import org.junit.experimental.categories.Category;

/**
 * Tests for {@link RegionSplitter}, which can create a pre-split table or do a
 * rolling split of an existing table.
 */
@Category(MediumTests.class)
public class TestRegionSplitter {
    private final static Log LOG = LogFactory.getLog(TestRegionSplitter.class);
    private final static HBaseTestingUtility UTIL = new HBaseTestingUtility();
    private final static String CF_NAME = "SPLIT_TEST_CF";
    private final static byte xFF = (byte) 0xff;

    @BeforeClass
    public static void setup() throws Exception {
        UTIL.startMiniCluster();
    }

    @AfterClass
    public static void teardown() throws Exception {
        UTIL.shutdownMiniCluster();
    }

    /**
     * Test creating a pre-split table using the HexStringSplit algorithm.
     */
    @Test
    public void testCreatePresplitTableHex() throws Exception {
        final List<byte[]> expectedBounds = new ArrayList<byte[]>();
        expectedBounds.add(ArrayUtils.EMPTY_BYTE_ARRAY);
        expectedBounds.add("10000000".getBytes());
        expectedBounds.add("20000000".getBytes());
        expectedBounds.add("30000000".getBytes());
        expectedBounds.add("40000000".getBytes());
        expectedBounds.add("50000000".getBytes());
        expectedBounds.add("60000000".getBytes());
        expectedBounds.add("70000000".getBytes());
        expectedBounds.add("80000000".getBytes());
        expectedBounds.add("90000000".getBytes());
        expectedBounds.add("a0000000".getBytes());
        expectedBounds.add("b0000000".getBytes());
        expectedBounds.add("c0000000".getBytes());
        expectedBounds.add("d0000000".getBytes());
        expectedBounds.add("e0000000".getBytes());
        expectedBounds.add("f0000000".getBytes());
        expectedBounds.add(ArrayUtils.EMPTY_BYTE_ARRAY);

        // Do table creation/pre-splitting and verification of region boundaries
        preSplitTableAndVerify(expectedBounds, HexStringSplit.class.getSimpleName(), "NewHexPresplitTable");
    }

    /**
     * Test creating a pre-split table using the UniformSplit algorithm.
     */
    @Test
    public void testCreatePresplitTableUniform() throws Exception {
        List<byte[]> expectedBounds = new ArrayList<byte[]>();
        expectedBounds.add(ArrayUtils.EMPTY_BYTE_ARRAY);
        expectedBounds.add(new byte[] { 0x10, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { 0x20, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { 0x30, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { 0x40, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { 0x50, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { 0x60, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { 0x70, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { (byte) 0x80, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { (byte) 0x90, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { (byte) 0xa0, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { (byte) 0xb0, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { (byte) 0xc0, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { (byte) 0xd0, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { (byte) 0xe0, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(new byte[] { (byte) 0xf0, 0, 0, 0, 0, 0, 0, 0 });
        expectedBounds.add(ArrayUtils.EMPTY_BYTE_ARRAY);

        // Do table creation/pre-splitting and verification of region boundaries
        preSplitTableAndVerify(expectedBounds, UniformSplit.class.getSimpleName(), "NewUniformPresplitTable");
    }

    /**
     * Unit tests for the HexStringSplit algorithm. Makes sure it divides up the
     * space of keys in the way that we expect.
     */
    @Test
    public void unitTestHexStringSplit() {
        HexStringSplit splitter = new HexStringSplit();
        // Check splitting while starting from scratch

        byte[][] twoRegionsSplits = splitter.split(2);
        assertEquals(1, twoRegionsSplits.length);
        assertArrayEquals(twoRegionsSplits[0], "80000000".getBytes());

        byte[][] threeRegionsSplits = splitter.split(3);
        assertEquals(2, threeRegionsSplits.length);
        byte[] expectedSplit0 = "55555555".getBytes();
        assertArrayEquals(expectedSplit0, threeRegionsSplits[0]);
        byte[] expectedSplit1 = "aaaaaaaa".getBytes();
        assertArrayEquals(expectedSplit1, threeRegionsSplits[1]);

        // Check splitting existing regions that have start and end points
        byte[] splitPoint = splitter.split("10000000".getBytes(), "30000000".getBytes());
        assertArrayEquals("20000000".getBytes(), splitPoint);

        byte[] lastRow = "ffffffff".getBytes();
        assertArrayEquals(lastRow, splitter.lastRow());
        byte[] firstRow = "00000000".getBytes();
        assertArrayEquals(firstRow, splitter.firstRow());

        // Halfway between 00... and 20... should be 10...
        splitPoint = splitter.split(firstRow, "20000000".getBytes());
        assertArrayEquals(splitPoint, "10000000".getBytes());

        // Halfway between df... and ff... should be ef....
        splitPoint = splitter.split("dfffffff".getBytes(), lastRow);
        assertArrayEquals(splitPoint, "efffffff".getBytes());
    }

    /**
     * Unit tests for the UniformSplit algorithm. Makes sure it divides up the space of
     * keys in the way that we expect.
     */
    @Test
    public void unitTestUniformSplit() {
        UniformSplit splitter = new UniformSplit();

        // Check splitting while starting from scratch
        try {
            splitter.split(1);
            throw new AssertionError("Splitting into <2 regions should have thrown exception");
        } catch (IllegalArgumentException e) {
        }

        byte[][] twoRegionsSplits = splitter.split(2);
        assertEquals(1, twoRegionsSplits.length);
        assertArrayEquals(twoRegionsSplits[0], new byte[] { (byte) 0x80, 0, 0, 0, 0, 0, 0, 0 });

        byte[][] threeRegionsSplits = splitter.split(3);
        assertEquals(2, threeRegionsSplits.length);
        byte[] expectedSplit0 = new byte[] { 0x55, 0x55, 0x55, 0x55, 0x55, 0x55, 0x55, 0x55 };
        assertArrayEquals(expectedSplit0, threeRegionsSplits[0]);
        byte[] expectedSplit1 = new byte[] { (byte) 0xAA, (byte) 0xAA, (byte) 0xAA, (byte) 0xAA, (byte) 0xAA,
                (byte) 0xAA, (byte) 0xAA, (byte) 0xAA };
        assertArrayEquals(expectedSplit1, threeRegionsSplits[1]);

        // Check splitting existing regions that have start and end points
        byte[] splitPoint = splitter.split(new byte[] { 0x10 }, new byte[] { 0x30 });
        assertArrayEquals(new byte[] { 0x20 }, splitPoint);

        byte[] lastRow = new byte[] { xFF, xFF, xFF, xFF, xFF, xFF, xFF, xFF };
        assertArrayEquals(lastRow, splitter.lastRow());
        byte[] firstRow = ArrayUtils.EMPTY_BYTE_ARRAY;
        assertArrayEquals(firstRow, splitter.firstRow());

        splitPoint = splitter.split(firstRow, new byte[] { 0x20 });
        assertArrayEquals(splitPoint, new byte[] { 0x10 });

        splitPoint = splitter.split(new byte[] { (byte) 0xdf, xFF, xFF, xFF, xFF, xFF, xFF, xFF }, lastRow);
        assertArrayEquals(splitPoint, new byte[] { (byte) 0xef, xFF, xFF, xFF, xFF, xFF, xFF, xFF });
    }

    @Test
    public void testUserInput() {
        SplitAlgorithm algo = new HexStringSplit();
        assertFalse(splitFailsPrecondition(algo)); // default settings are fine
        assertFalse(splitFailsPrecondition(algo, "00", "AA")); // custom is fine
        assertTrue(splitFailsPrecondition(algo, "AA", "00")); // range error
        assertTrue(splitFailsPrecondition(algo, "AA", "AA")); // range error
        assertFalse(splitFailsPrecondition(algo, "0", "2", 3)); // should be fine
        assertFalse(splitFailsPrecondition(algo, "0", "A", 11)); // should be fine
        assertTrue(splitFailsPrecondition(algo, "0", "A", 12)); // too granular

        algo = new UniformSplit();
        assertFalse(splitFailsPrecondition(algo)); // default settings are fine
        assertFalse(splitFailsPrecondition(algo, "\\x00", "\\xAA")); // custom is fine
        assertTrue(splitFailsPrecondition(algo, "\\xAA", "\\x00")); // range error
        assertTrue(splitFailsPrecondition(algo, "\\xAA", "\\xAA")); // range error
        assertFalse(splitFailsPrecondition(algo, "\\x00", "\\x02", 3)); // should be fine
        assertFalse(splitFailsPrecondition(algo, "\\x00", "\\x0A", 11)); // should be fine
        assertTrue(splitFailsPrecondition(algo, "\\x00", "\\x0A", 12)); // too granular
    }

    private boolean splitFailsPrecondition(SplitAlgorithm algo) {
        return splitFailsPrecondition(algo, 100);
    }

    private boolean splitFailsPrecondition(SplitAlgorithm algo, String firstRow, String lastRow) {
        return splitFailsPrecondition(algo, firstRow, lastRow, 100);
    }

    private boolean splitFailsPrecondition(SplitAlgorithm algo, String firstRow, String lastRow, int numRegions) {
        algo.setFirstRow(firstRow);
        algo.setLastRow(lastRow);
        return splitFailsPrecondition(algo, numRegions);
    }

    private boolean splitFailsPrecondition(SplitAlgorithm algo, int numRegions) {
        try {
            byte[][] s = algo.split(numRegions);
            LOG.debug("split algo = " + algo);
            if (s != null) {
                StringBuilder sb = new StringBuilder();
                for (byte[] b : s) {
                    sb.append(Bytes.toStringBinary(b) + "  ");
                }
                LOG.debug(sb.toString());
            }
            return false;
        } catch (IllegalArgumentException e) {
            return true;
        } catch (IllegalStateException e) {
            return true;
        } catch (IndexOutOfBoundsException e) {
            return true;
        }
    }

    /**
     * Creates a pre-split table with expectedBounds.size()+1 regions, then
     * verifies that the region boundaries are the same as the expected
     * region boundaries in expectedBounds.
     * @throws Various junit assertions
     */
    private void preSplitTableAndVerify(List<byte[]> expectedBounds, String splitClass, String tableName)
            throws Exception {
        final int numRegions = expectedBounds.size() - 1;
        final Configuration conf = UTIL.getConfiguration();
        conf.setInt("split.count", numRegions);
        SplitAlgorithm splitAlgo = RegionSplitter.newSplitAlgoInstance(conf, splitClass);
        RegionSplitter.createPresplitTable(tableName, splitAlgo, new String[] { CF_NAME }, conf);
        verifyBounds(expectedBounds, tableName);
    }

    private void rollingSplitAndVerify(String tableName, String splitClass, List<byte[]> expectedBounds)
            throws Exception {
        final Configuration conf = UTIL.getConfiguration();

        // Set this larger than the number of splits so RegionSplitter won't block
        conf.setInt("split.outstanding", 5);
        SplitAlgorithm splitAlgo = RegionSplitter.newSplitAlgoInstance(conf, splitClass);
        RegionSplitter.rollingSplit(tableName, splitAlgo, conf);
        verifyBounds(expectedBounds, tableName);
    }

    private void verifyBounds(List<byte[]> expectedBounds, String tableName) throws Exception {
        // Get region boundaries from the cluster and verify their endpoints
        final Configuration conf = UTIL.getConfiguration();
        final int numRegions = expectedBounds.size() - 1;
        final HTable hTable = new HTable(conf, tableName.getBytes());
        final Map<HRegionInfo, ServerName> regionInfoMap = hTable.getRegionLocations();
        assertEquals(numRegions, regionInfoMap.size());
        for (Map.Entry<HRegionInfo, ServerName> entry : regionInfoMap.entrySet()) {
            final HRegionInfo regionInfo = entry.getKey();
            byte[] regionStart = regionInfo.getStartKey();
            byte[] regionEnd = regionInfo.getEndKey();

            // This region's start key should be one of the region boundaries
            int startBoundaryIndex = indexOfBytes(expectedBounds, regionStart);
            assertNotSame(-1, startBoundaryIndex);

            // This region's end key should be the region boundary that comes
            // after the starting boundary.
            byte[] expectedRegionEnd = expectedBounds.get(startBoundaryIndex + 1);
            assertEquals(0, Bytes.compareTo(regionEnd, expectedRegionEnd));
        }
    }

    /**
     * List.indexOf() doesn't really work for a List<byte[]>, because byte[]
     * doesn't override equals(). This method checks whether a list contains
     * a given element by checking each element using the byte array
     * comparator.
     * @return the index of the first element that equals compareTo, or -1
     * if no elements are equal.
     */
    static private int indexOfBytes(List<byte[]> list, byte[] compareTo) {
        int listIndex = 0;
        for (byte[] elem : list) {
            if (Bytes.BYTES_COMPARATOR.compare(elem, compareTo) == 0) {
                return listIndex;
            }
            listIndex++;
        }
        return -1;
    }

}