java source code of RegionSplitter

phoenix-omid-master
- timestamp-storage
  - src
    - main
      - java
        org
        apache
        omid
        timestamp
        storage
        ZKModule.java
        HBaseTimestampStorageModule.java
        HBaseTimestampStorage.java
        HBaseTimestampStorageConfig.java
        DefaultHBaseTimestampStorageModule.java
        DefaultZKTimestampStorageModule.java
        ZKTimestampPaths.java
        TimestampStorage.java
        ZKTimestampStorage.java
        ZKTimestampStorageModule.java
    - test
      - resources
        log4j.properties
      - java
        org
        apache
        omid
        timestamp
        storage
        TestZKTimestampStorage.java
        TestHBaseTimestampStorage.java
  - pom.xml
- hbase-common
  - src
    - main
      - java
        org
        apache
        omid
        transaction
        CellUtils.java
        CellInfo.java
        committable
        hbase
        KeyGeneratorImplementations.java
        RegionSplitter.java
        KeyGenerator.java
        tools
        hbase
        HBaseLogin.java
        SecureHBaseConfig.java
        HBaseConfigModule.java
    - test
      - java
        org
        apache
        omid
        committable
        hbase
        TestHBaseCommitTableKey.java
  - pom.xml
- examples
  - src
    - main
      - resources
        hbase-omid-client-config.yml
        log4j.properties
      - java
        org
        apache
        omid
        examples
        RowIdGenerator.java
        ConfigurationExample.java
        ParallelExecution.java
        BasicExample.java
        SnapshotIsolationExample.java
  - maven
    - assembly
      - assembly.xml
  - pom.xml
  - run.sh
- pom.xml
- hbase-coprocessor
  - src
    - main
      - java
        org
        apache
        hadoop
        hbase
        regionserver
        RegionAccessWrapper.java
        RegionConnectionFactory.java
        omid
        transaction
        CompactorScanner.java
        HRegionCellGetterAdapter.java
        OmidSnapshotFilter.java
        OmidCompactor.java
        TransactionVisibilityFilterBase.java
        TransactionFilters.java
        CompactorUtil.java
        CellSkipFilterBase.java
    - test
      - resources
        log4j.xml
      - java
        org
        apache
        omid
        transaction
        TestCompactorScanner.java
        TestSnapshotFilter.java
        TSOForSnapshotFilterTestModule.java
        TestCompaction.java
        TSOForHBaseCompactorTestModule.java
        TestCompactionLL.java
        TestSnapshotFilterLL.java
  - pom.xml
  - .gitignore
- common
  - src
    - main
      - proto
        TSOProto.proto
      - java
        org
        apache
        omid
        zk
        ZKUtils.java
        NetworkUtils.java
        YAMLUtils.java
        ReflectionHelper.java
    - test
      - resources
        test.yml
        default-test.yml
      - java
        org
        apache
        omid
        TestReflectionHelper.java
        YAMLUtilsTest.java
  - pom.xml
- hbase-tools
  - src
    - main
      - java
        org
        apache
        omid
        tools
        hbase
        OmidTableManager.java
    - test
      - java
        org
        apache
        omid
        tools
        hbase
        TestOmidTableManager.java
  - pom.xml
- statemachine
  - src
    - main
      - java
        org
        apache
        statemachine
        StateMachineLogParser.java
        StateMachine.java
    - test
      - java
        org
        apache
        statemachine
        TestStateMachine.java
  - pom.xml
- codahale-metrics
  - src
    - main
      - java
        org
        apache
        omid
        metrics
        CodahaleMetricsConfig.java
        CodahaleMetricsProvider.java
  - pom.xml
- hbase-client
  - src
    - main
      - resources
        default-hbase-omid-client-config.yml
      - java
        org
        apache
        omid
        transaction
        HTableAccessWrapper.java
        HBaseTransaction.java
        TableAccessWrapper.java
        SnapshotFilter.java
        TTableCellGetterAdapter.java
        HBaseTransactionManager.java
        HBaseTransactionClient.java
        SnapshotFilterImpl.java
        AttributeSetSnapshotFilter.java
        HBaseAsyncPostCommitter.java
        HBaseOmidClientConfiguration.java
        ColumnWrapper.java
        HBaseSyncPostCommitter.java
        TTable.java
        HBaseCellId.java
    - test
      - resources
        log4j.properties
        test-hbase-omid-client-config.yml
      - java
        org
        apache
        omid
        transaction
        TestSingleColumnFamily.java
        TestTransactionCleanup.java
        TestBaillisAnomaliesWithTXs.java
        TestUpdateScan.java
        TestHALeaseManagementModule.java
        TestCellUtils.java
        TestTransactionConflict.java
        TestColumnIterator.java
        TestTxMgrFailover.java
        TestCheckpoint.java
        TestHBaseTransactionClient.java
        TestMultiplePut.java
        OmidTestBase.java
        TestAsynchronousPostCommitter.java
        TestMarkPutAsCommitted.java
        TestDeletion.java
        TestAutoFlush.java
        TestOmidLLRaces.java
        TestBasicTransaction.java
        TestTSOModule.java
        TestHBaseTransactionManager.java
        TestTTableBehaviour.java
        TestFilters.java
        TestEndToEndScenariosWithHA.java
        TestReadPath.java
        TestHBaseOmidClientConfiguration.java
        TestShadowCells.java
  - pom.xml
- misc
  - header.txt
  - omid_checks.xml
  - findbugs-exclude.xml
- benchmarks
  - src
    - main
      - resources
        default-tso-server-benchmark-config.yml
      - java
        org
        apache
        omid
        benchmarks
        utils
        ScrambledZipfianGenerator.java
        ZipfianGenerator.java
        Generator.java
        IntegerGenerator.java
        UniformGenerator.java
        hbase
        HBaseCommitTableTester.java
        tso
        RawTxRunner.java
        TSOServerBenchmarkConfig.java
        TSOServerBenchmark.java
  - maven
    - assembly
      - bin.xml
  - pom.xml
  - bin
    - omid-env.sh
    - benchmarks.sh
  - conf
    - hbase-site.xml
    - log4j.xml
- DISCLAIMER
- transaction-client
  - src
    - main
      - resources
        omid-client-config.yml
      - java
        org
        apache
        omid
        transaction
        TransactionManager.java
        AbstractTransactionManager.java
        RollbackException.java
        CommitTimestampLocator.java
        Transaction.java
        PostCommitActions.java
        AbstractTransaction.java
        TransactionManagerException.java
        TransactionException.java
        tso
        client
        OmidClientConfiguration.java
        TSOFuture.java
        TSOClient.java
        ClosingException.java
        ForwardingTSOFuture.java
        CellId.java
        TSOProtocol.java
        ServiceUnavailableException.java
        HandshakeFailedException.java
        AbortException.java
        MockTSOClient.java
        ConnectionException.java
        util
        DummyCellIdImpl.java
    - test
      - java
        org
        apache
        omid
        tso
        client
        TestOmidClientConfiguration.java
        TestMockTSOClient.java
  - pom.xml
- bintray-settings.xml
- .travis.yml
- README.md
- KEYS
- hbase-shims
  - pom.xml
  - hbase-2
    - src
      - main
        java
        org
        apache
        hadoop
        hbase
        coprocessor
        BaseRegionObserver.java
        ipc
        controller
        InterRegionServerRpcController.java
        InterRegionServerRpcControllerFactory.java
        omid
        HBaseShims.java
        OmidFilterBase.java
    - pom.xml
  - hbase-1
    - src
      - main
        java
        org
        apache
        hadoop
        hbase
        ipc
        controller
        InterRegionServerRpcController.java
        InterRegionServerRpcControllerFactory.java
        omid
        HBaseShims.java
        RegionWrapper.java
        OmidFilterBase.java
    - pom.xml
- metrics
  - src
    - main
      - java
        org
        apache
        omid
        metrics
        MetricsProvider.java
        Gauge.java
        MetricsRegistry.java
        MetricsRegistryMap.java
        NullMetricsProvider.java
        Metric.java
        Histogram.java
        Timer.java
        Meter.java
        Counter.java
        AbstractMetricsConfig.java
        MetricsUtils.java
  - pom.xml
- packaging
  - maven
    - assembly
      - src.xml
  - pom.xml
- NOTICE
- commit-table
  - src
    - main
      - java
        org
        apache
        omid
        committable
        NullCommitTable.java
        InMemoryCommitTable.java
        CommitTable.java
    - test
      - java
        org
        apache
        omid
        committable
        NullCommitTableTest.java
  - pom.xml
- .gitignore
- LICENSE.txt
- doc
  - images
    - ModuleDependencies.graffle
  - site
    - resources
      - images
      - css
        site.css
    - markdown
      - quickstart.md
      - basic-examples.md
      - mailing-lists.md
      - basic-algorithm.md
      - omid-components.md
      - index.md
      - basic-concepts.md
      - coding-guide-and-style.md
      - client-failure-management.md
    - site.xml
- hbase-commit-table
  - src
    - main
      - java
        org
        apache
        omid
        committable
        hbase
        HBaseCommitTableStorageModule.java
        HBaseCommitTable.java
        HBaseCommitTableConfig.java
        DefaultHBaseCommitTableStorageModule.java
    - test
      - java
        org
        apache
        omid
        committable
        hbase
        TestHBaseCommitTable.java
  - pom.xml
- tso-server
  - src
    - main
      - resources
        log4j.properties
        default-omid-server-configuration.yml
      - java
        org
        apache
        omid
        tso
        WorldClockOracleImpl.java
        PersistEvent.java
        RequestProcessorPersistCT.java
        LowWatermarkWriterImpl.java
        InMemoryCommitTableStorageModule.java
        VoidLeaseManagementModule.java
        ReplyProcessorImpl.java
        SystemExitPanicker.java
        MonitoringContextImpl.java
        MockPanicker.java
        CommitHashMap.java
        BatchPoolModule.java
        TsoServerDaemon.java
        InMemoryTimestampStorageModule.java
        TimestampOracle.java
        HALeaseManagementModule.java
        LongCache.java
        VoidLeaseManager.java
        PersistenceProcessorImpl.java
        RetryProcessorImpl.java
        Batch.java
        MonitoringContextFactory.java
        DisruptorModule.java
        TSOModule.java
        FatalExceptionHandler.java
        AbstractRequestProcessor.java
        PersitenceProcessorNullImpl.java
        TSOStateManagerImpl.java
        MonitoringContext.java
        NetworkInterfaceUtils.java
        MonitoringContextNullImpl.java
        TSOStateManager.java
        LeaseManagement.java
        RequestProcessor.java
        CacheEvaluation.java
        TimestampOracleImpl.java
        LeaseManager.java
        ReplyProcessor.java
        TSOServerConfig.java
        Panicker.java
        LowWatermarkWriter.java
        TSOServer.java
        PersistenceProcessor.java
        TSOChannelHandler.java
        RetryProcessor.java
        RequestProcessorSkipCT.java
        RuntimeExceptionPanicker.java
        PersistenceProcessorHandler.java
    - test
      - resources
        test-omid.yml
        log4j.properties
      - java
        org
        apache
        omid
        tso
        PausableTimestampOracle.java
        TestPanicker.java
        TestLongCache.java
        PausableLeaseManager.java
        TestRetryProcessor.java
        client
        TestTSOClientRequestAndResponseBehaviours.java
        TestTSOClientConnectionToTSO.java
        TestIntegrationOfTSOClientServerBasicFunctionality.java
        TSOClientRaw.java
        TestTSOClientResponseHandling.java
        TSOClientAccessor.java
        TSOClientOneShot.java
        TestUnconnectedTSOClient.java
        TestTSOClientRowAndCellLevelConflict.java
        TestRequestProcessor.java
        TestBatchPool.java
        TestLeaseManager.java
        TestPersistenceProcessor.java
        TestTSOLL.java
        ProgrammableTSOServer.java
        TestPersistenceProcessorHandler.java
        TestReplyProcessor.java
        TestWorldTimeOracle.java
        TSOMockModule.java
        TSOServerConfigTest.java
        TestTSOStateManager.java
        TestBatch.java
        TestTimestampOracle.java
        TestTSOChannelHandlerNetty.java
        TestUtils.java
  - maven
    - assembly
      - bin.xml
  - pom.xml
  - bin
    - omid-env.sh
    - omid.sh
  - conf
    - omid-server-configuration.yml
    - hbase-site.xml
    - log4j.xml

/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.omid.committable.hbase;

import com.google.common.base.Preconditions;

import org.apache.commons.lang.ArrayUtils;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.hbase.util.Bytes;

import java.io.IOException;
import java.util.Arrays;

/**
 * This class contains only the required behavior of the original
 * org.apache.hadoop.hbase.util.RegionSplitter class to avoid
 * having a reference to hbase-testing-util, which transitively
 * imports hbase-server causing dependency conflicts for this module.
 */
public class RegionSplitter {

    /**
     * A generic interface for the RegionSplitter code to use for all its functionality. Note that the original
     * authors of this code use {@code org.apache.hadoop.hbase.util.HexStringSplit} to partition their table and set
     * it as default, but provided this interface for your custom algorithm. To use, create a new class implementing
     * this interface. In the original HBase class its name is given as the {@code splitClassName} argument of
     * {@code RegionSplitter#createPresplitTable} or
     * {@code RegionSplitter#rollingSplit(String, SplitAlgorithm, Configuration)}; those entry points are not part of
     * this trimmed copy, where the name is passed to
     * {@link RegionSplitter#newSplitAlgoInstance(Configuration, String)} instead.
     */
    public interface SplitAlgorithm {

        /**
         * Split a pre-existing region into 2 regions.
         *
         * @param start
         *            first row (inclusive)
         * @param end
         *            last row (exclusive)
         * @return the split row to use
         */
        byte[] split(byte[] start, byte[] end);

        /**
         * Split an entire table.
         *
         * @param numRegions
         *            number of regions to split the table into
         *
         * @throws RuntimeException
         *             user input is validated at this time. May throw a runtime exception in response to a parse
         *             failure
         * @return array of split keys for the initial regions of the table. The length of the returned array should be
         *         numRegions-1.
         */
        byte[][] split(int numRegions);

        /**
         * In HBase, the first row is represented by an empty byte array. This might cause problems with your split
         * algorithm or row printing. All your APIs will be passed firstRow() instead of the empty array.
         *
         * @return your representation of your first row
         */
        byte[] firstRow();

        /**
         * In HBase, the last row is represented by an empty byte array. This might cause problems with your split
         * algorithm or row printing. All your APIs will be passed lastRow() instead of the empty array.
         *
         * @return your representation of your last row
         */
        byte[] lastRow();

        /**
         * In HBase, the first row is represented by an empty byte array. Set this value to help the split code
         * understand how to evenly divide the first region.
         *
         * @param userInput
         *            raw user input (may throw RuntimeException on parse failure)
         */
        void setFirstRow(String userInput);

        /**
         * In HBase, the last row is represented by an empty byte array. Set this value to help the split code
         * understand how to evenly divide the last region. Note that this last row is inclusive for all rows sharing
         * the same prefix.
         *
         * @param userInput raw user input (may throw RuntimeException on parse failure)
         */
        void setLastRow(String userInput);

        /**
         * Converts the textual form of a row into its HBase row key.
         *
         * @param input
         *            user or file input for row
         * @return byte array representation of this row for HBase
         */
        byte[] strToRow(String input);

        /**
         * Converts an HBase row key into its textual form.
         *
         * @param row byte array representing a row in HBase
         * @return String to use for debug and file printing
         */
        String rowToStr(byte[] row);

        /**
         * @return the separator string to use when storing / printing the row
         */
        String separator();

        /**
         * Set the first row.
         *
         * @param userInput
         *            byte array of the row key.
         */
        void setFirstRow(byte[] userInput);

        /**
         * Set the last row.
         *
         * @param userInput
         *            byte array of the row key.
         */
        void setLastRow(byte[] userInput);
    }

    /**
     * Creates an instance of the split algorithm identified by {@code splitClassName}.
     *
     * <p>The simple class name of the built-in {@link UniformSplit} is accepted as a shortcut. Any other value is
     * resolved through {@code conf.getClassByName(splitClassName)}; the resulting class must implement
     * {@link SplitAlgorithm} and is instantiated through its no-argument constructor.
     *
     * @param conf Hbase conf, used to load the class when it is not a built-in algorithm
     * @param splitClassName split class name to be used
     * @return an instance of SplitAlgorithm
     * @throws IOException if the specified SplitAlgorithm class couldn't be loaded, doesn't implement
     *                     SplitAlgorithm, or couldn't be instantiated (the underlying failure is kept as the cause)
     */
    public static SplitAlgorithm newSplitAlgoInstance(Configuration conf,
                                                      String splitClassName) throws IOException {
        Class<?> splitClass;

        // For split algorithms builtin to RegionSplitter, the user can specify
        // their simple class name instead of a fully qualified class name.
        if (splitClassName.equals(UniformSplit.class.getSimpleName())) {
            splitClass = UniformSplit.class;
        } else {
            try {
                splitClass = conf.getClassByName(splitClassName);
            } catch (ClassNotFoundException e) {
                throw new IOException("Couldn't load split class " + splitClassName, e);
            }
            if (splitClass == null) {
                throw new IOException("Failed loading split class " + splitClassName);
            }
            if (!SplitAlgorithm.class.isAssignableFrom(splitClass)) {
                throw new IOException(
                    "Specified split class doesn't implement SplitAlgorithm");
            }
        }
        try {
            // Class#newInstance() is deprecated because it rethrows checked constructor exceptions unchecked.
            // Going through the no-arg Constructor reports them wrapped in an InvocationTargetException instead,
            // which still ends up as the cause of the IOException below.
            return splitClass.asSubclass(SplitAlgorithm.class).getDeclaredConstructor().newInstance();
        } catch (Exception e) {
            // Name the offending class so the failure can be diagnosed from the message alone.
            throw new IOException("Problem loading split algorithm: " + splitClassName, e);
        }
    }

    /**
     * A SplitAlgorithm that divides the space of possible keys evenly. Useful when the keys are approximately uniform
     * random bytes (e.g. hashes). Rows are raw byte values in the range [00..FF] and are right-padded with zeros
     * to keep the same memcmp() order. This is the natural algorithm to use for a byte[] environment and saves space,
     * but is not necessarily the easiest for readability.
     *
     * <p>The first row defaults to the empty byte array and the last row to eight {@code 0xFF} bytes. The setters
     * store the given arrays as-is and the getters return them without copying.
     */
    public static class UniformSplit implements SplitAlgorithm {

        static final byte xFF = (byte) 0xFF;
        byte[] firstRowBytes = ArrayUtils.EMPTY_BYTE_ARRAY;
        byte[] lastRowBytes =
            new byte[]{xFF, xFF, xFF, xFF, xFF, xFF, xFF, xFF};

        /**
         * Splits the range between two rows once.
         *
         * @param start first row of the range
         * @param end last row of the range
         * @return the element at index 1 of {@code Bytes.split(start, end, 1)}, i.e. the single split point
         */
        @Override
        public byte[] split(byte[] start, byte[] end) {
            return Bytes.split(start, end, 1)[1];
        }

        /**
         * Computes the split keys that divide [firstRow, lastRow] into {@code numRegions} regions.
         *
         * @param numRegions number of regions to split the table into; must be positive
         * @return the {@code numRegions - 1} split keys (an empty array when {@code numRegions} is 1)
         * @throws IllegalArgumentException if the last row is not greater than the first row, or if
         *                                  {@code numRegions} is not positive
         * @throws IllegalStateException if the configured range could not be split
         */
        @Override
        public byte[][] split(int numRegions) {
            Preconditions.checkArgument(
                Bytes.compareTo(lastRowBytes, firstRowBytes) > 0,
                "last row (%s) is configured less than first row (%s)",
                Bytes.toStringBinary(lastRowBytes),
                Bytes.toStringBinary(firstRowBytes));
            Preconditions.checkArgument(numRegions > 0,
                                        "number of regions must be positive but was %s", numRegions);

            // A single region needs no split keys. Asking Bytes.split for zero splits is not a valid request,
            // so answer directly with the documented numRegions-1 (= 0) keys.
            if (numRegions == 1) {
                return new byte[0][];
            }

            byte[][] splits = Bytes.split(firstRowBytes, lastRowBytes, true,
                                          numRegions - 1);
            Preconditions.checkState(splits != null,
                                     "Could not split region with given user input: " + this);

            // remove endpoints, which are included in the splits list
            return Arrays.copyOfRange(splits, 1, splits.length - 1);
        }

        /** @return the currently configured first row */
        @Override
        public byte[] firstRow() {
            return firstRowBytes;
        }

        /** @return the currently configured last row */
        @Override
        public byte[] lastRow() {
            return lastRowBytes;
        }

        /**
         * Sets the first row from its {@code Bytes.toBytesBinary} textual form.
         *
         * @param userInput textual representation of the row key
         */
        @Override
        public void setFirstRow(String userInput) {
            firstRowBytes = Bytes.toBytesBinary(userInput);
        }

        /**
         * Sets the last row from its {@code Bytes.toBytesBinary} textual form.
         *
         * @param userInput textual representation of the row key
         */
        @Override
        public void setLastRow(String userInput) {
            lastRowBytes = Bytes.toBytesBinary(userInput);
        }

        /**
         * Sets the first row; the array is stored without copying.
         *
         * @param userInput byte array of the row key
         */
        @Override
        public void setFirstRow(byte[] userInput) {
            firstRowBytes = userInput;
        }

        /**
         * Sets the last row; the array is stored without copying.
         *
         * @param userInput byte array of the row key
         */
        @Override
        public void setLastRow(byte[] userInput) {
            lastRowBytes = userInput;
        }

        /**
         * @param input textual representation of a row
         * @return the row key obtained through {@code Bytes.toBytesBinary}
         */
        @Override
        public byte[] strToRow(String input) {
            return Bytes.toBytesBinary(input);
        }

        /**
         * @param row byte array representing a row in HBase
         * @return the textual form produced by {@code Bytes.toStringBinary}
         */
        @Override
        public String rowToStr(byte[] row) {
            return Bytes.toStringBinary(row);
        }

        /** @return a comma, the separator used when storing / printing rows */
        @Override
        public String separator() {
            return ",";
        }

        /** @return the simple class name followed by the first and last rows in textual form */
        @Override
        public String toString() {
            return this.getClass().getSimpleName() + " [" + rowToStr(firstRow())
                   + "," + rowToStr(lastRow()) + "]";
        }
    }
}