java source code of TrieDictionary

Kylin-master
- script
  - compress.sh
  - download-tomcat.sh
  - package.sh
  - prepare.sh
  - build.sh
- jdbc
  - src
    - main
      - resources
        log4j.properties
        org-apache-kylin-jdbc.properties
      - java
        org
        apache
        kylin
        jdbc
        Driver.java
        KylinPrepare.java
        stub
        RemoteClient.java
        KylinColumnMetaData.java
        TableMetaStub.java
        DataSet.java
        SQLResponseStub.java
        KylinClient.java
        ConnectionException.java
        KylinJdbc41Factory.java
        KylinStatementImpl.java
        KylinMetaImpl.java
        KylinPrepareImpl.java
        util
        SQLTypeMap.java
        DefaultX509TrustManager.java
        DefaultSslProtocolSocketFactory.java
        KylinEnumerator.java
        KylinJdbc40Factory.java
        KylinResultSet.java
        KylinPrepareStatementImpl.java
        KylinConnectionImpl.java
    - test
      - java
        org
        apache
        kylin
        jdbc
        DriverTest.java
        DummyDriver.java
        DummyJdbc41Factory.java
        DummyClient.java
  - pom.xml
  - .settings
    - org.eclipse.jdt.ui.prefs
    - org.eclipse.jdt.core.prefs
    - org.eclipse.core.resources.prefs
- storage
  - src
    - main
      - java
        org
        apache
        kylin
        storage
        IStorageEngine.java
        hbase
        HBaseClientKVIterator.java
        HBaseKeyRange.java
        ResultScannerAdapter.java
        coprocessor
        endpoint
        EndpointEnabler.java
        EndpointAggregators.java
        protobuf
        II.proto
        IIEndpoint.java
        EndpointAggregationCache.java
        HbaseServerKVIterator.java
        EndpointTupleIterator.java
        IIResponseAdapter.java
        SliceBitMapProvider.java
        generated
        IIProtos.java
        CoprocessorFilter.java
        CoprocessorRowType.java
        CoprocessorConstants.java
        CoprocessorProjector.java
        AggregationCache.java
        observer
        AggregateRegionObserver.java
        ObserverAggregationCache.java
        ObserverAggregators.java
        ObserverTuple.java
        AggregationScanner.java
        ObserverEnabler.java
        CubeSegmentTupleIterator.java
        PingHBaseCLI.java
        ScanOutOfLimitException.java
        FuzzyValueCombination.java
        RegionScannerAdapter.java
        SerializedHBaseTupleIterator.java
        ColumnValueRange.java
        CubeStorageEngine.java
        InvertedIndexStorageEngine.java
        DerivedFilterTranslator.java
        StorageContext.java
        tuple
        Tuple.java
        TupleInfo.java
        filter
        BitMapFilterEvaluator.java
        StorageEngineFactory.java
    - test
      - java
        org
        apache
        kylin
        storage
        minicluster
        HiveMiniClusterTest.java
        HiveJDBCClientTest.java
        hbase
        FuzzyValueCombinationTest.java
        coprocessor
        endpoint
        EndpointAggregationTest.java
        TableRecordInfoTest.java
        RowProjectorTest.java
        observer
        RowAggregatorsTest.java
        AggregateRegionObserverTest.java
        RowTypeTest.java
        InvertedIndexHBaseTest.java
        test
        StorageTest.java
        filter
        FilterSerializeTest.java
        FilterBaseTest.java
        BitMapFilterEvaluatorTest.java
        FilterEvaluateTest.java
        MiniClusterTest.java
  - pom.xml
  - .settings
    - org.eclipse.jdt.ui.prefs
    - org.eclipse.jdt.core.prefs
    - org.eclipse.core.resources.prefs
- dictionary
  - src
    - main
      - java
        org
        apache
        kylin
        dict
        NumberDictionaryBuilder.java
        lookup
        LookupTable.java
        ReadableTable.java
        FileTable.java
        FileTableReader.java
        LookupBytesTable.java
        SnapshotTable.java
        HiveTableReader.java
        TableSignature.java
        LookupStringTable.java
        HiveTable.java
        TableReader.java
        SnapshotTableSerializer.java
        SnapshotManager.java
        DateStrDictionary.java
        DictionaryInfo.java
        Dictionary.java
        TrieDictionary.java
        TrieDictionaryBuilder.java
        StringBytesConverter.java
        BytesConverter.java
        DictionaryInfoSerializer.java
        DictionaryManager.java
        DictionaryGenerator.java
        ISegment.java
        NumberDictionary.java
    - test
      - resources
        dict
        DW_SITES
      - java
        org
        apache
        kylin
        dict
        SnapshotManagerTest.java
        TrieDictionaryTest.java
        TableReaderTest.java
        lookup
        LookupTableTest.java
        LookupTableTest.java
        NumberDictionaryTest.java
        DateStrDictionaryTest.java
        HiveTableReaderTest.java
  - pom.xml
  - .settings
    - org.eclipse.jdt.ui.prefs
    - org.eclipse.jdt.core.prefs
    - org.eclipse.core.resources.prefs
- examples
  - test_case_data
    - localmeta
      - table_snapshot
        TEST_CATEGORY_GROUPINGS.csv
        df8a90f1-bbbe-49ff-937a-2a2a6e5f8615.snapshot
        89715f33-15c9-4745-83f9-f2b9817d9100.snapshot
        59a675fc-64d2-40d1-bbd7-492db2510cd1.snapshot
        e172b442-ae10-447e-9071-c7dbb2bb38cc.snapshot
        TEST_CAL_DT.csv
        TEST_SITES.csv
        1271e1f2-dd65-4249-a1f2-aca02a651158.snapshot
        1888015f-f059-4ccc-8324-0cdd70b46673.snapshot
        d95e0b5b-a399-4f08-8f40-b0fa53b565e0.snapshot
        28130338-fcf4-429e-91b0-cd8dfd397280.snapshot
        7d70b82e-43f6-4999-b012-0e91a9bb8408.snapshot
        TEST_SELLER_TYPE_DIM.csv
        b43dd3f1-9a34-4721-8abc-df90962e94d8.snapshot
        f818054b-1a76-4cbd-bdd8-7871a240360c.snapshot
        4fe75ccd-9b24-4cdf-ac9d-b4038e947f89.snapshot
        97238b77-a45d-420f-a249-5f1572ea4d62.snapshot
        d1b6a60a-14d4-4653-92f7-c96d01191c75.snapshot
      - project
        onlyinner.json
        onlyleft.json
        default.json
      - invertedindex
        test_kylin_ii.json
      - model_desc
        test_kylin_with_slr_left_join_model_desc.json
        test_kylin_ii_model_desc.json
        test_kylin_with_slr_model_desc.json
        test_kylin_without_slr_model_desc.json
        test_kylin_without_slr_left_join_model_desc.json
      - table
        EDW.TEST_SITES.json
        EDW.TEST_SELLER_TYPE_DIM.json
        EDW.TEST_CAL_DT.json
        DEFAULT.TEST_CATEGORY_GROUPINGS.json
        DEFAULT.TEST_KYLIN_FACT.json
      - kylin_job_conf.xml
      - cube_desc
        test_kylin_cube_with_slr_desc.json
        test_kylin_cube_without_slr_desc.json
        test_kylin_cube_without_slr_left_join_desc.json
        test_kylin_cube_with_slr_left_join_desc.json
      - data
        EDW.TEST_SITES.csv
        flatten_data_for_ii.csv
        DEFAULT.TEST_CATEGORY_GROUPINGS.csv
        data_gen_config.json
        EDW.TEST_SELLER_TYPE_DIM.csv
        .gitignore
        DEFAULT.TEST_KYLIN_FACT.csv
      - dict
        TEST_SITES
        SITE_ID
        652bd393-678a-4f16-a504-fd8ce1229355.dict
        ff7e8943-ac0f-4e66-b9ed-510f6a0b875d.dict
        0bec6bb3-1b0d-469c-8289-b8c4ca5d5001.dict
        31edf35b-ffca-4f24-8229-f87dc34e3087.dict
        792eb972-d046-48e6-9428-f6a3aed92fad.dict
        d25e554e-deac-4e4a-9289-96f0d121d8fc.dict
        914536f8-1e14-43e9-b8ef-525bb5bdb3b2.dict
        TEST_SELLER_TYPE_DIM
        SELLER_TYPE_CD
        1d383a36-81b9-4177-a822-04eab3683e5b.dict
        0c5d77ec-316b-47e0-ba9a-0616be890ad6.dict
        2a44ff38-f64b-42e7-9fcf-66afccac8047.dict
        14fe66b3-5956-498c-bd93-40182cac5510.dict
        c6bf9b51-6e90-4337-8082-4e2fdf78307f.dict
        TEST_CAL_DT
        CAL_DT
        aa634e3e-22d3-4cc2-9de5-085e9ac35c1f.dict
        ed0c3451-593c-494c-9019-64f63fcb0b8e.dict
        DEFAULT.TEST_KYLIN_FACT
        LEAF_CATEG_ID
        f7fe5157-f9a0-4f64-ad36-d9c92b9c9e2a.dict
        LSTG_SITE_ID
        e11524a1-0fcf-4da1-b12f-c9410610ab8d.dict
        TRANS_ID
        7fb8fed8-7f3b-4089-a85d-3ac07f575c82.dict
        SELLER_ID
        fea3a18d-3f20-4b8b-a880-7af93e69241b.dict
        SLR_SEGMENT_CD
        fe91daba-e89b-4911-ad75-41e1335a35cb.dict
        CAL_DT
        d1094cfe-3a15-4270-b066-241c543b3fd9.dict
        LSTG_FORMAT_NAME
        d5c40465-75e1-40bc-a960-06308f0134a6.dict
        TEST_CATEGORY_GROUPINGS
        META_CATEG_NAME
        51ff5e6c-22b3-444e-9915-d376a10f20cb.dict
        aceae914-4246-4251-a0c2-692fe7a300df.dict
        b298089f-9656-4693-b9b2-8fea46f06dd5.dict
        ac797050-e152-4923-a20a-02282fcf6086.dict
        a4e57e55-48fc-4f25-a9c8-485deed25925.dict
        70c8d6ef-f55b-4cdd-8be4-9c2b236cc8e9.dict
        0410d2c4-4686-40bc-ba14-170042a2de94.dict
        c2af25cf-6c79-45e6-a6f6-6d2a8ecc6592.dict
        CATEG_LVL2_NAME
        9bb0b83a-97b2-434f-905f-4d9e04b62018.dict
        c12ae49d-9dbe-4a58-b169-19afac317696.dict
        ec83ebce-7534-4e62-ac6d-7445ee141ab4.dict
        16d8185c-ee6b-4f8c-a919-756d9809f937.dict
        eaed91b0-4182-4ee5-a733-1047a622ee29.dict
        LEAF_CATEG_ID
        ac520edd-f9d2-419f-a7de-587bfb97dc81.dict
        8b4b1c06-fb74-486b-a2ad-74420afebcda.dict
        2602386c-debb-4968-8d2f-b52b8215e385.dict
        4243889f-bc81-4807-a975-7041bbbf35e7.dict
        494683c1-52d1-4d9a-a3f7-8c53b30fd898.dict
        CATEG_LVL3_NAME
        270fbfb0-281c-4602-8413-2970a7439c47.dict
        8f92faa4-7d2d-455c-8623-6e1d1b272afe.dict
        7228fad8-a764-4bd4-8934-50e0d7cbcb19.dict
        eacccee7-d120-4f4d-97d0-c99a5b83ec32.dict
        ad09f2d5-054a-4e1b-a776-7cc07399a6c1.dict
        DEFAULT.TEST_CATEGORY_GROUPINGS
        META_CATEG_NAME
        895739d6-27e1-4ecc-b798-5851c319ea40.dict
        CATEG_LVL2_NAME
        9355165b-06ad-4c04-977c-a251e66e7e98.dict
        LEAF_CATEG_ID
        38361fbc-b875-4273-b8b4-1b8a26ef8570.dict
        USER_DEFINED_FIELD3
        278d7283-518a-4cd0-b6e1-2573b523bf1f.dict
        CATEG_LVL3_NAME
        b2d6fae1-eaac-4ac2-8a01-42e5c8b5c198.dict
        USER_DEFINED_FIELD1
        8ae44fb8-b01a-4db1-a901-dc5f463038cb.dict
        UPD_DATE
        1fc93a94-1feb-4af4-8078-81a6f1b65e2b.dict
        UPD_USER
        bb1bb7a5-b02d-45eb-b3c8-f1a4515264ca.dict
        SITE_ID
        30c9d5f0-abe4-4d1c-a147-610234d90ff1.dict
        TEST_KYLIN_FACT
        LEAF_CATEG_ID
        9fc2360e-172a-43f3-acef-be16748a9bb7.dict
        96b7c577-b209-45b3-a848-4d2d7af5c0cc.dict
        4059cab1-9b99-47ed-a494-751da52a7d58.dict
        LSTG_SITE_ID
        7df5789b-0280-453c-b406-b75cad6770d1.dict
        TRANS_ID
        c8d19f95-b6cd-4219-a114-54aaddcb2909.dict
        SELLER_ID
        6e285e1e-ed16-4012-9f1e-f950dd6927ce.dict
        SLR_SEGMENT_CD
        8300bf83-053e-48bb-8c87-88c8d483afd1.dict
        CAL_DT
        48433f91-0d68-495f-b7f2-295414591275.dict
        ITEM_COUNT
        73c9bfe1-6496-4ff8-9467-6cbee2924c16.dict
        LSTG_FORMAT_NAME
        bd9f6b22-36ba-4e6b-92aa-0d585faf0b39.dict
        PRICE
        927dde3f-6999-4434-b57c-adfa73160334.dict
        EDW.TEST_SITES
        SITE_NAME
        f363531d-e969-4264-bffd-ac18f8f47220.dict
        CRE_USER
        244af7a2-7352-4b30-811f-46e637d7a133.dict
        SITE_ID
        4ef43390-b07e-4d4c-872a-77c0bd783acb.dict
        PREDEFINED
        date(yyyy-mm-dd)
        64ac4f82-f2af-476e-85b9-f0805001014e.dict
        f5e85644-db92-42b5-9ad5-240ab227d7b0.dict
        EDW.TEST_CAL_DT
        WEEK_BEG_DT
        962b5f64-bee1-49ee-a072-af882193b719.dict
        CAL_DT
        5e4b4f35-0fc8-4940-b123-b18c9f77da19.dict
        EDW.TEST_SELLER_TYPE_DIM
        SELLER_TYPE_CD
        bec11fda-9ae0-4668-98ea-f0f4e9dd6993.dict
        SELLER_TYPE_DESC
        bfb86010-bf4c-4534-a2b0-59d020aed197.dict
      - kylin.properties
      - cube
        test_kylin_cube_with_slr_1_new_segment.json
        test_kylin_cube_with_slr_ready.json
        test_kylin_cube_with_slr_ready_2_segments.json
        test_kylin_cube_with_slr_left_join_empty.json
        test_kylin_cube_without_slr_left_join_empty.json
        test_kylin_cube_without_slr_empty.json
        test_kylin_cube_without_slr_left_join_ready_2_segments.json
        test_kylin_cube_without_slr_ready.json
        test_kylin_cube_with_slr_empty.json
        test_kylin_cube_with_slr_left_join_ready.json
        test_kylin_cube_without_slr_left_join_ready.json
      - invertedindex_desc
        test_kylin_ii_desc.json
    - minicluster
      - b-kylin
        kylin.properties
        meta
        kylin.properties
      - kylin_job_conf.lzo_disabled.xml
      - kylin_job_conf.lzo_enabled.xml
      - kylin_job_conf.xml
      - kylin.properties
    - localmeta_v1
      - project
        onlyinner.json
        onlyleft.json
        default.json
      - table
        TEST_SELLER_TYPE_DIM.json
        TEST_CAL_DT.json
        TEST_CATEGORY_GROUPINGS.json
        TEST_SITES.json
        TEST_KYLIN_FACT.json
      - cube_desc
        test_kylin_cube_with_slr_desc.json
        test_kylin_cube_without_slr_desc.json
        test_kylin_cube_without_slr_left_join_desc.json
        test_kylin_cube_with_slr_left_join_desc.json
      - table_exd
        TEST_KYLIN_FACT.json
      - kylin.properties
      - cube
        test_kylin_cube_with_slr_1_new_segment.json
        test_kylin_cube_with_slr_ready.json
        test_kylin_cube_with_slr_ready_2_segments.json
        test_kylin_cube_with_slr_left_join_empty.json
        test_kylin_cube_without_slr_left_join_empty.json
        test_kylin_cube_without_slr_empty.json
        test_kylin_cube_without_slr_left_join_ready_2_segments.json
        test_kylin_cube_without_slr_ready.json
        test_kylin_cube_with_slr_empty.json
        test_kylin_cube_with_slr_left_join_ready.json
        test_kylin_cube_without_slr_left_join_ready.json
    - sandbox-hdp21
      - hdfs-site.xml
      - capacity-scheduler.xml
      - kylin_job_conf.lzo_disabled.xml
      - kylin_job_conf.lzo_enabled.xml
      - kylin_job_conf.xml
      - hbase-site.xml
      - hive-site.xml
      - httpfs-site.xml
      - hadoop-policy.xml
      - mapred-site.xml
      - yarn-site.xml
      - kylin.properties
      - core-site.xml
    - sandbox
      - hdfs-site.xml
      - hbase-policy.xml
      - capacity-scheduler.xml
      - kylin_job_conf.xml
      - hbase-site.xml
      - hive-site.xml
      - hadoop-policy.xml
      - mapred-site.xml
      - yarn-site.xml
      - kylin.properties
      - core-site.xml
  - sample_cube
    - metadata
      - project
        learn_kylin.json
      - model_desc
        kylin_sales_model.json
      - table
        DEFAULT.KYLIN_CATEGORY_GROUPINGS.json
        DEFAULT.KYLIN_CAL_DT.json
        DEFAULT.KYLIN_SALES.json
      - cube_desc
        kylin_sales_cube_desc.json
      - cube
        kylin_sales_cube.json
    - data
      - DEFAULT.KYLIN_CATEGORY_GROUPINGS.csv
    - create_sample_tables.sql
  - ReleaseNotes.md
  - .gitignore
- pom.xml
- metadata
  - src
    - main
      - java
        org
        apache
        kylin
        metadata
        measure
        DoubleMinAggregator.java
        BigDecimalMaxAggregator.java
        BigDecimalMinAggregator.java
        fixedlen
        FixedLenMeasureCodec.java
        FixedPointLongCodec.java
        FixedHLLCodec.java
        LongMinAggregator.java
        DoubleSerializer.java
        HLLCSerializer.java
        BigDecimalSumAggregator.java
        HLLCAggregator.java
        DoubleSumAggregator.java
        LongSumAggregator.java
        MeasureAggregator.java
        MeasureAggregators.java
        MeasureCodec.java
        LongSerializer.java
        BigDecimalSerializer.java
        LDCAggregator.java
        DoubleMaxAggregator.java
        LongMaxAggregator.java
        MeasureSerializer.java
        realization
        IRealizationConstants.java
        IRealization.java
        SQLDigest.java
        RealizationType.java
        RealizationRegistry.java
        RealizationStatusEnum.java
        IRealizationProvider.java
        tool
        HiveSourceTableLoader.java
        MetadataConstants.java
        project
        RealizationEntry.java
        ProjectInstance.java
        ProjectStatusEnum.java
        ProjectL2Cache.java
        ProjectTable.java
        ProjectManager.java
        MetadataManager.java
        tuple
        ITupleIterator.java
        ITuple.java
        model
        DataModelDesc.java
        DataType.java
        MeasureDesc.java
        DatabaseDesc.java
        PartitionDesc.java
        TableDesc.java
        TblColRef.java
        LookupDesc.java
        ColumnDesc.java
        JoinDesc.java
        ParameterDesc.java
        SegmentStatusEnum.java
        FunctionDesc.java
        filter
        CaseTupleFilter.java
        TupleFilterSerializer.java
        DynamicTupleFilter.java
        ColumnTupleFilter.java
        ConstantTupleFilter.java
        CompareTupleFilter.java
        TupleFilter.java
        LogicalTupleFilter.java
        ExtractTupleFilter.java
      - assembly
        assemble.xml
    - test
      - resources
        org
        apache
        kylin
        metadata
        kylin_env.properties
      - test.json
      - java
        org
        apache
        kylin
        metadata
        tool
        HiveSourceTableLoaderTest.java
        MetadataManagerTest.java
        tuple
        EmptyTupleIteratorTest.java
        model
        TableDescTest.java
  - pom.xml
  - .settings
    - org.eclipse.jdt.ui.prefs
    - org.eclipse.jdt.core.prefs
    - org.eclipse.core.resources.prefs
- LICENSE
- common
  - src
    - main
      - resources
        log4j.properties
        kylinlog4j.properties
      - java
        org
        apache
        kylin
        common
        mr
        KylinMapper.java
        KylinReducer.java
        util
        TarGZUtil.java
        MyLogFormatter.java
        BytesSerializer.java
        Array.java
        StringUtil.java
        SSHClientOutput.java
        ThreadUtil.java
        MailService.java
        CliCommandExecutor.java
        ClassUtil.java
        SoutLogger.java
        HiveClient.java
        ByteArray.java
        SSHClient.java
        LogTitlePrinter.java
        JsonUtil.java
        HBaseRegionSizeCalculator.java
        BytesUtil.java
        BytesSplitter.java
        PartialSorter.java
        CaseInsensitiveStringMap.java
        Logger.java
        SplittedBytes.java
        HadoopUtil.java
        RandomSampler.java
        StringSplitter.java
        KylinConfig.java
        restclient
        CaseInsensitiveStringCache.java
        Broadcaster.java
        AbstractRestCache.java
        RestClient.java
        MultiValueCache.java
        SingleValueCache.java
        persistence
        StorageException.java
        HBaseConnection.java
        Serializer.java
        FileResourceStore.java
        HBaseResourceStore.java
        ResourceTool.java
        JsonSerializer.java
        AclEntity.java
        RootPersistentEntity.java
        ResourceStore.java
        hll
        HyperLogLogPlusTable.java
        HyperLogLogPlusCounter.java
    - test
      - java
        org
        apache
        kylin
        common
        util
        AbstractKylinTestCase.java
        PartialSorterTest.java
        MailServiceTest.java
        BasicTest.java
        HBaseMiniclusterHelper.java
        RandomSamplerTest.java
        BytesUtilTest.java
        SSHClientTest.java
        HBaseMetadataTestCase.java
        HyperLogLogCounterTest.java
        HbaseImporter.java
        InstallJarIntoMavenTest.java
        LocalFileMetadataTestCase.java
        BasicHadoopTest.java
        restclient
        RestClientTest.java
        persistence
        LocalFileResourceStoreTest.java
        HBaseResourceStoreTest.java
        ResourceToolTest.java
  - pom.xml
  - .settings
    - org.eclipse.jdt.ui.prefs
    - org.eclipse.jdt.core.prefs
    - org.eclipse.core.resources.prefs
- invertedindex
  - src
    - main
      - java
        org
        apache
        kylin
        invertedindex
        IIDescManager.java
        index
        TableRecordInfo.java
        ColumnValueContainer.java
        Slice.java
        BitMapContainer.java
        CompressedValueContainer.java
        TableRecordInfoDigest.java
        TableRecord.java
        SliceBuilder.java
        RawTableRecord.java
        ShardingSliceBuilder.java
        ShardingHash.java
        IIManager.java
        tools
        IICLI.java
        model
        IIDesc.java
        IIKeyValueCodec.java
        IIDimension.java
        IIInstance.java
        IISegment.java
    - test
      - java
        org
        apache
        kylin
        invertedindex
        invertedindex
        IIDescTest.java
        LZFTest.java
        IIInstanceTest.java
        InvertedIndexLocalTest.java
        IIDescManagerTest.java
  - pom.xml
  - .settings
    - org.eclipse.jdt.ui.prefs
    - org.eclipse.jdt.core.prefs
    - org.eclipse.core.resources.prefs
- deploy
  - server.xml
- job
  - src
    - main
      - java
        org
        apache
        kylin
        job
        impl
        threadpool
        DefaultScheduler.java
        DefaultContext.java
        dao
        ExecutableDao.java
        ExecutableOutputPO.java
        ExecutablePO.java
        hadoop
        hbase
        BulkLoadJob.java
        CreateHTableJob.java
        cardinality
        ColumnCardinalityMapper.java
        HiveColumnCardinalityUpdateJob.java
        HiveColumnCardinalityJob.java
        ColumnCardinalityReducer.java
        invertedindex
        IICreateHFileJob.java
        RandomKeyDistributionMapper.java
        IIBulkLoadJob.java
        RandomKeyDistributionReducer.java
        IIFlattenHiveJob.java
        IICreateHFileMapper.java
        IIDistinctColumnsJob.java
        InvertedIndexPartitioner.java
        IIDistinctColumnsMapper.java
        RandomKeyDistributionJob.java
        IIDistinctColumnsCombiner.java
        IICreateHTableJob.java
        InvertedIndexReducer.java
        InvertedIndexJob.java
        InvertedIndexMapper.java
        IIDistinctColumnsReducer.java
        hive
        CubeJoinedFlatTableDesc.java
        IJoinedFlatTableDesc.java
        IIJoinedFlatTableDesc.java
        SqlHiveDataTypeMapping.java
        IntermediateColumnDesc.java
        dict
        CreateDictionaryJob.java
        CreateInvertedIndexDictionaryJob.java
        cube
        FactDistinctColumnsCombiner.java
        FactDistinctColumnsReducer.java
        CuboidReducer.java
        CubeHFileJob.java
        BaseCuboidJob.java
        KeyDistributionJob.java
        RowKeyDistributionCheckerJob.java
        CubeHFileMapper.java
        RangeKeyDistributionMapper.java
        NewBaseCuboidMapper.java
        RowKeyDistributionCheckerMapper.java
        NDCuboidMapper.java
        BaseCuboidMapper.java
        FactDistinctColumnsJob.java
        KeyDistributionMapper.java
        CuboidJob.java
        FactDistinctColumnsMapper.java
        NDCuboidJob.java
        RangeKeyDistributionJob.java
        RangeKeyDistributionReducer.java
        MergeCuboidMapper.java
        KeyDistributionReducer.java
        StorageCleanupJob.java
        RowKeyDistributionCheckerReducer.java
        MergeCuboidJob.java
        AbstractHadoopJob.java
        JoinedFlatTable.java
        JobInstance.java
        constant
        ExecutableConstants.java
        JobStepCmdTypeEnum.java
        JobStepStatusEnum.java
        BatchConstants.java
        JobStatusEnum.java
        common
        MapReduceExecutable.java
        HadoopShellExecutable.java
        HadoopCmdOutput.java
        ShellExecutable.java
        HqlExecutable.java
        CubeMetadataUpgrade.java
        invertedindex
        IIJob.java
        IIJobBuilder.java
        exception
        LockException.java
        SchedulerException.java
        JobException.java
        ExecuteException.java
        PersistentException.java
        IllegalStateTranferException.java
        engine
        JobEngineConfig.java
        deployment
        HbaseConfigPrinterCLI.java
        AbstractJobBuilder.java
        execution
        DefaultChainedExecutable.java
        ExecuteResult.java
        Executable.java
        AbstractExecutable.java
        ExecutableState.java
        Output.java
        Idempotent.java
        ExecutableContext.java
        ChainedExecutable.java
        DefaultOutput.java
        tools
        OptionsHelper.java
        LZOSupportnessChecker.java
        CubeMigrationCLI.java
        HadoopStatusGetter.java
        HtableAlterMetadataCLI.java
        DefaultX509TrustManager.java
        HadoopStatusChecker.java
        DeployCoprocessorCLI.java
        DefaultSslProtocolSocketFactory.java
        GridTableHBaseBenchmark.java
        CleanHtableCLI.java
        manager
        ExecutableManager.java
        cmd
        BaseCommandOutput.java
        IJobCommand.java
        ICommandOutput.java
        ShellCmdOutput.java
        ShellCmd.java
        Scheduler.java
        cube
        MergeDictionaryStep.java
        CubingJobBuilder.java
        CubingJob.java
        UpdateCubeInfoAfterMergeStep.java
        UpdateCubeInfoAfterBuildStep.java
    - test
      - resources
        expected_result
        flat_item
        part-r-00000
        jarfile
        SampleBadJavaProgram.jarfile
        SampleJavaProgram.jarfile
        data
        flat_table
        base_cuboid
        test_cal_dt
        6d_cuboid
        json
        dummy_jobinstance.json
        partition_list
        _partition.lst
        part-r-00000
      - java
        org
        apache
        kylin
        job
        impl
        threadpool
        DefaultSchedulerTest.java
        BaseSchedulerTest.java
        BuildCubeWithEngineTest.java
        dataGen
        FactTableGenerator.java
        GenConfig.java
        ColumnConfig.java
        ImportHBaseData.java
        SucceedTestExecutable.java
        hadoop
        hbase
        TestHbaseClient.java
        CreateHTableTest.java
        hdfs
        HdfsOpsTest.java
        hive
        JoinedFlatTableTest.java
        cube
        BaseCuboidJobTest.java
        RandomKeyDistributionMapperTest.java
        RangeKeyDistributionJobTest.java
        BaseCuboidMapperTest.java
        RandomKeyDistributionReducerTest.java
        NDCuboidMapperTest.java
        MergeCuboidJobTest.java
        BaseCuboidMapperPerformanceTest.java
        RangeKeyDistributionMapperTest.java
        CubeReducerTest.java
        MockupMapContext.java
        KeyDistributionMapperTest.java
        MergeCuboidMapperTest.java
        CubeHFileMapper2Test.java
        NDCuboidJobTest.java
        CopySeq.java
        CubeHFileMapperTest.java
        KeyDistributionJobTest.java
        RangeKeyDistributionReducerTest.java
        ErrorTestExecutable.java
        SelfStopExecutable.java
        BuildIIWithEngineTest.java
        ExportHBaseData.java
        DeployUtil.java
        BaseTestExecutable.java
        DataGenTest.java
        tools
        ColumnCardinalityReducerTest.java
        ColumnCardinalityJobTest.java
        ColumnCardinalityMapperTest.java
        CubeMigrationTests.java
        HBaseRowDigestTest.java
        manager
        ExecutableManagerTest.java
        FailedTestExecutable.java
        SampleCubeSetupTest.java
  - pom.xml
  - .settings
    - org.eclipse.jdt.ui.prefs
    - org.eclipse.jdt.core.prefs
    - org.eclipse.core.resources.prefs
  - dependency-reduced-pom.xml
  - .gitignore
- query
  - src
    - main
      - java
        org
        apache
        kylin
        query
        optrule
        OLAPToEnumerableConverterRule.java
        OLAPProjectRule.java
        OLAPAggregateRule.java
        OLAPFilterRule.java
        OLAPLimitRule.java
        OLAPJoinRule.java
        OLAPSortRule.java
        QueryCli.java
        relnode
        OLAPAggregateRel.java
        OLAPFilterRel.java
        OLAPContext.java
        OLAPToEnumerableConverter.java
        OLAPLimitRel.java
        OLAPSortRel.java
        OLAPProjectRel.java
        OLAPTableScan.java
        OLAPJoinRel.java
        ColumnRowType.java
        OLAPRel.java
        sqlfunc
        QuarterBase.java
        HLLDistinctCountAggFunc.java
        QuarterFunc.java
        enumerator
        HiveEnumerator.java
        LookupTableEnumerator.java
        OLAPQuery.java
        CubeEnumerator.java
        routing
        RoutingRules
        RealizationPriorityRule.java
        SimpleQueryMoreColumnsCubeFirstRule.java
        CubesSortRule.java
        AdjustForWeeklyMatchedRealization.java
        RemoveUncapableRealizationsRule.java
        RoutingRule.java
        QueryRouter.java
        NoRealizationFoundException.java
        schema
        OLAPSchema.java
        OLAPTable.java
        OLAPSchemaFactory.java
    - test
      - resources
        logging.properties
        query
        sql
        query04.sql
        query59.sql
        query32.sql
        query75.sql
        query49.sql
        query22.sql
        query43.sql
        query66.sql
        query23.sql
        query31.sql
        query02.sql
        query41.sql
        query18.sql
        query26.sql
        query50.sql
        query45.sql
        query61.sql
        query79.sql
        query42.sql
        query20.sql
        query19.sql
        query57.sql
        query62.sql
        query73.sql
        query24.sql
        query69.sql
        query00.sql
        query53.sql
        query14.sql
        query48.sql
        query28.sql
        query67.sql
        query72.sql
        query71.sql
        query52.sql
        query08.sql
        query17.sql
        query76.sql
        query25.sql
        query12.sql
        query70.sql
        query77.sql
        query74.sql
        query05.sql
        query44.sql
        query46.sql
        query27.sql
        query33.sql
        query38.sql
        query60.sql
        query21.sql
        query64.sql
        query16.sql
        query34.sql
        query51.sql
        query47.sql
        query01.sql
        query65.sql
        query29.sql
        query58.sql
        query40.sql
        query07.sql
        query54.sql
        query06.sql
        query68.sql
        query03.sql
        query63.sql
        query55.sql
        query78.sql
        query37.sql
        query39.sql
        query35.sql
        query13.sql
        query36.sql
        query15.sql
        query11.sql
        query10.sql
        query30.sql
        query56.sql
        query09.sql
        sql_subquery
        query04.sql
        query02.sql.disable
        query00.sql
        query05.sql
        query01.sql
        query07.sql
        query06.sql
        query03.sql
        sql_verifyCount
        query04.sql
        query07.sql.expected
        query06.sql.expected
        query04.sql.expected
        query05.sql
        query05.sql.expected
        query07.sql
        query06.sql
        sql_fast_common
        query00.sql
        h2
        query07.sql
        query10.sql
        query09.sql
        sql_tableau
        query04.sql
        query23.sql
        query08.sql.disabled
        query02.sql
        query18.sql
        query09.sql.disabled
        query20.sql
        query19.sql
        query22.sql.disabled
        query24.sql
        query00.sql
        query14.sql
        query67.sql
        query17.sql
        query25.sql
        query12.sql
        query05.sql
        query27.sql
        query21.sql
        query16.sql
        query01.sql
        query07.sql
        query06.sql
        query03.sql
        query13.sql
        query15.sql
        query11.sql
        query10.sql
        sql_ii
        query04.sql
        query07.sql.disabled
        query02.sql
        query06.sql.disabled
        query08.sql
        query05.sql
        query01.sql
        query03.sql
        query09.sql
        sql_distinct
        query04.sql
        query02.sql
        query00.sql
        query05.sql
        query01.sql
        query07.sql
        query06.sql
        query03.sql
        sql_derived
        query04.sql
        query08.sql.disabled
        query02.sql
        query05.sql
        query01.sql
        query07.sql
        query06.sql
        query03.sql
        query10.sql
        query09.sql
        sql_invalid
        query31_invalid_SQL.sql
        query29_invalid_SQL.sql
        query34_invalid_SQL.sql
        query_count_distinct_on_dimension.sql.disabled
        query33_invalid_SQL.sql
        query32_invalid_SQL.sql
        query30_invalid_SQL.sql
        sql_casewhen
        query02.sql
        query01.sql
        query55.sql.disable
        query03.sql
        query56.sql
        sql_lookup
        query04.sql
        query02.sql
        query01.sql
        query03.sql
        sql_dynamic
        query01.dat
        query02.sql
        query02.dat
        query01.sql
        sql_hive
        query01.sql
        query10.sql
        sql_optimize
        enable-limit01.sql
        sql_all_types
        query04.sql
        query02.sql
        query00.sql
        query08.sql
        query05.sql
        query01.sql
        query07.sql
        query06.sql
        query03.sql
        query09.sql
        tableau_probing
        query04.sql
        query02.sql
        query05.sql
        query01.sql
        query07.sql
        query06.sql
        query03.sql
        sql_orderby
        query02.sql
        query01.sql
        query03.sql
      - java
        org
        apache
        kylin
        query
        test
        KylinTestBase.java
        RealizationRegistryTest.java
        KylinQueryTest.java
        CombinationTest.java
        H2Database.java
        IIQueryTest.java
  - pom.xml
  - .settings
    - org.eclipse.jdt.ui.prefs
    - org.eclipse.jdt.core.prefs
    - org.eclipse.core.resources.prefs
- .settings
  - org.eclipse.core.resources.prefs
- DISCLAIMER
- atopcalcite
  - src
    - main
      - java
        net
        hydromatic
        optiq
        runtime
        SqlFunctions.java
        org
        eigenbase
        sql2rel
        SqlToRelConverter.java
  - pom.xml
  - .settings
    - org.eclipse.jdt.ui.prefs
    - org.eclipse.jdt.core.prefs
    - org.eclipse.core.resources.prefs
- README.md
- server
  - src
    - main
      - resources
        ehcache.xml
        log4j.properties
        applicationContext.xml
        kylinSecurity.xml
        ehcache-test.xml
        dbSqls
        schema.sql
        .gitignore
      - java
        org
        apache
        kylin
        rest
        security
        AclPermission.java
        AuthoritiesPopulator.java
        UnauthorisedEntryPoint.java
        AclPermissionFactory.java
        AclEntityFactory.java
        LdapProvider.java
        PasswordPlaceholderConfigurer.java
        CrossDomainFilter.java
        UserManager.java
        response
        MetricsResponse.java
        ErrorResponse.java
        TableDescResponse.java
        GeneralResponse.java
        HBaseResponse.java
        AccessEntryResponse.java
        SQLResponse.java
        constant
        Constant.java
        util
        Serializer.java
        QueryUtil.java
        ClasspathUtil.java
        request
        SQLRequest.java
        CardinalityRequest.java
        SaveSqlRequest.java
        PrepareSqlRequest.java
        JobListRequest.java
        MetricsRequest.java
        AccessRequest.java
        CreateProjectRequest.java
        JobBuildRequest.java
        MetaRequest.java
        CubeRequest.java
        UpdateConfigRequest.java
        UpdateProjectRequest.java
        service
        UserService.java
        AclService.java
        CubeService.java
        ProjectService.java
        JobService.java
        QueryService.java
        MetricsService.java
        AccessService.java
        BasicService.java
        AdminService.java
        CacheService.java
        exception
        InternalErrorException.java
        ForbiddenException.java
        BadRequestException.java
        NotFoundException.java
        DebugTomcat.java
        model
        ColumnMeta.java
        SelectedColumnMeta.java
        Query.java
        TableMeta.java
        metrics
        JobMetrics.java
        QueryMetrics.java
        KylinInstrumentedFilterContextListener.java
        controller
        UserController.java
        CubeDescController.java
        AccessController.java
        JobController.java
        TableController.java
        CacheController.java
        ModelController.java
        BasicController.java
        QueryController.java
        CubeController.java
        AdminController.java
        ProjectController.java
      - webapp
        WEB-INF
        kylin-servlet.xml
        web.xml
        index.html
    - test
      - java
        org
        apache
        kylin
        jdbc
        JDBCDriverTest.java
        rest
        broadcaster
        BroadcasterReceiveServlet.java
        service
        ServiceTestBase.java
        JobServiceTest.java
        QueryServiceTest.java
        UserServiceTest.java
        AccessServiceTest.java
        CubeServiceTest.java
        CacheServiceTest.java
        bean
        BeanValidator.java
        BeanTest.java
        controller
        CubeControllerTest.java
        JobControllerTest.java
        TableControllerTest.java
        UserControllerTest.java
        CacheControllerTest.java
        BaseControllerTest.java
        QueryControllerTest.java
        ProjectControllerTest.java
        AccessControllerTest.java
        AdminControllerTest.java
  - ServiceConfig.md
  - pom.xml
  - .settings
    - org.eclipse.jdt.ui.prefs
    - org.eclipse.jdt.core.prefs
    - org.eclipse.core.resources.prefs
- bin
  - check-env.sh
  - setenv.sh
  - find-hive-dependency.sh
  - health-check.sh
  - kylin.sh
  - sample.sh
- webapp
  - Gruntfile.js
  - bower.json
  - .editorconfig
  - .jshintrc
  - grunt.json
  - .bowerrc
  - README.md
  - package.json
  - app
    - routes.json
    - fonts
      - toadOcfmlt9b38dHJxOBGKUt5Ot5NIMarvNW-hkYWvT3rGVtsTkPsbDajuO5ueQw.woff2
      - ODelI1aHBYDBqgeIAH2zlPytCVloACqnDHJwh-em2k8.woff2
    - less
      - navbar.less
      - app.less
      - component.less
      - animation.less
      - layout.less
      - build.less
      - home.less
    - htaccess.dist
    - js
      - utils
        utils.js
      - services
        ngLoading.js
        tables.js
        auth.js
        query.js
        access.js
        cache.js
        cubeDesc.js
        projects.js
        admin.js
        jobs.js
        message.js
        tree.js
        cubes.js
        users.js
        kylinProperties.js
        model.js
        graph.js
      - app.js
      - directives
        directives.js
      - controllers
        cubeSchema.js
        auth.js
        query.js
        page.js
        cube.js
        access.js
        cubeEdit.js
        cubeModel.js
        cubeAdvanceSetting.js
        projects.js
        admin.js
        cubeFilter.js
        job.js
        cubeRefresh.js
        cubes.js
        cubeDimensions.js
        sourceMeta.js
        projectMeta.js
        index.js
      - filters
        filter.js
      - listeners.js
      - config.js
      - model
        tableModel.js
        jobConfig.js
        tableConfig.js
        cubesManager.js
        jobListModel.js
        metaModel.js
        projectModel.js
        cubeConfig.js
        cubeDescModel.js
        cubeListModel.js
        projectConfig.js
      - factories
        graph.js
    - index.html
    - partials
      - home.html
      - admin
        admin.html
      - cubeDesigner
        data_model.html
        filter.html
        measures.html
        advanced_settings.html
        overview.html
        incremental.html
        info.html
        dimensions.html
      - tables
        source_table_tree.html
        source_metadata.html
      - cubes
        cube_edit.html
        cube_schema.html
        cube_detail.html
        cubes.html
        cube_json_edit.html
      - common
        access.html
      - directives
        typeahead.html
        noResult.html
        pagination.html
        loading.html
      - query
        query.html
        query_detail.html
      - projects
        projects.html
        project_detail.html
        project_table_tree.html
        project_create.html
      - footer.html
      - header.html
      - jobs
        job_refresh.html
        job_steps.html
        jobs.html
        job_merge.html
        job_submit.html
      - login.html
    - image
      - ajax-loader.gif
      - waiting.gif
      - favicon.ico
    - .gitignore
    - css
      - AdminLTE.css
      - AdminLTE-fonts.css
  - .gitignore
- .gitignore
- docs
  - JobEngine
    - Design.md
  - MISC
    - FAQ on Kylin Installation and Usage.md
    - How to Contribute.md
    - Kylin Document Conventions.md
  - TechInside
    - Kylin 0.7 Lambda Architecture.md
    - New meta data model structure.md
  - website
    - BingSiteAuth.xml
    - blog
      - index.md
      - index.html
    - about
      - index.md
    - _sass
      - _syntax-highlighting.scss
      - _layout.scss
      - _base.scss
    - _config.yml
    - feed.xml
    - _config-prod.yml
    - _includes
      - head.html
      - footer.html
      - header.html
      - header.cn.html
      - head.cn.html
    - CNAME
    - LICENSE
    - index.md
    - _layouts
      - page.html
      - post.html
      - default-cn.html
      - default.html
    - download
      - index.md
    - favicon.ico
    - google0f781a4ad9402c21.html
    - index.cn.md
    - community
      - index.html
    - README.md
    - .gitignore
    - docs
      - installation-content.html
      - intro-content.html
      - index.html
    - css
      - main.scss
    - assets
      - images
        kylin_logo.jpg
      - fonts
        helveticaneue_lt.ttf
        helveticaneue-webfont.css
        fontawesome-webfont.woff
        fontawesome-webfont.eot
        opensans-light-webfont.svg
        helveticaneue-webfont.eot
        opensans-light-webfont.woff
        helveticaneue-webfont.svg
        opensans-regular-webfont.eot
        helveticaneue-webfont.woff
        helveticaneue_lt.eot
        FontAwesome.otf
        helveticaneue-webfont.ttf
        helveticaneue_lt.woff
        opensans-regular-webfont.woff
        opensans-regular-webfont.svg
        opensans-regular-webfont.ttf
        helveticaneue_lt.css
        opensans-light-webfont.eot
        opensans-light-webfont.ttf
        fontawesome-webfont.ttf
        helveticaneue_lt.svg
      - js
        bootstrap.min.js
        main.js
        jquery-1.9.1.min.js
      - css
        animate.css
        styles.css
        bootstrap.min.css
        font-awesome.min.css
    - _posts
      - 2015-01-25-introduce-data-model.md
  - REST
    - How to consume Kylin REST API in javascript.md
    - Build Cube with Restful API.md
    - Kylin Restful API List.md
  - Test
    - Run Kylin test case with HBase Mini Cluster.md
  - Tutorial
    - Kylin and Excel Tutorial.md
    - Kylin ODBC Driver Tutorial.md
    - Kylin Web Tutorial.md
    - Kylin Cube Permission Grant Tutorial.md
    - Kylin Cube Creation Tutorial.md
    - How to use kylin remote jdbc driver.md
    - Kylin Cube Build and Job Monitoring Tutorial.md
    - Kylin and Tableau Tutorial.md
    - Quick play with a sample cube.md
  - Operations
    - Export Kylin HBase data.md
    - Kylin Metadata Store.md
    - Advanced settings of Kylin environment.md
  - Installation
    - Multiple Kylin REST servers.md
    - Hadoop Environment.md
    - On Hadoop CLI installation.md
    - Installation.md
    - On Hadoop Kylin installation using Docker.md
    - Off Hadoop CLI Installation.md
    - How to generate install binaries.md
- cube
  - src
    - main
      - java
        org
        apache
        kylin
        cube
        kv
        RowKeyDecoder.java
        RowKeyEncoder.java
        RowValueDecoder.java
        AbstractRowKeyEncoder.java
        RowKeyColumnIO.java
        FuzzyKeyEncoder.java
        RowKeyColumnOrder.java
        FuzzyMaskEncoder.java
        RowConstants.java
        cli
        DumpDictionaryCLI.java
        DictionaryGeneratorCLI.java
        CubeManager.java
        common
        RowKeySplitter.java
        CubeDescManager.java
        CubeDescUpgrader.java
        cuboid
        CuboidScheduler.java
        CuboidCLI.java
        Cuboid.java
        CubeSegment.java
        model
        RowKeyColDesc.java
        v1
        ProjectInstance.java
        CubeStatusEnum.java
        CubeSegmentTypeEnum.java
        CubeSegmentStatusEnum.java
        CubeDesc.java
        DimensionDesc.java
        CubeBuildTypeEnum.java
        CubeSegment.java
        CubePartitionDesc.java
        CubeInstance.java
        HBaseColumnFamilyDesc.java
        HBaseMappingDesc.java
        HBaseColumnDesc.java
        CubeDesc.java
        DimensionDesc.java
        CubeBuildTypeEnum.java
        validation
        IValidatorRule.java
        ValidateContext.java
        ResultLevel.java
        CubeMetadataValidator.java
        SourceTableMetadataValidator.java
        rule
        FunctionRule.java
        MandatoryColumnRule.java
        RowKeyAttrRule.java
        IKylinValidationConstants.java
        AggregationGroupSizeRule.java
        HierarchyDesc.java
        RowKeyDesc.java
        CubeCapabilityChecker.java
        CubeDimensionDeriver.java
        estimation
        CubeSizeEstimationCLI.java
        CubeInstance.java
      - assembly
        assemble.xml
    - test
      - resources
        data
        TEST2_desc.json
        TEST3_desc.json
        TEST1_desc.json
      - java
        org
        apache
        kylin
        metadata
        measure
        MeasureCodecTest.java
        MetadataUpgradeTest.java
        cube
        MandatoryColumnRuleTest.java
        RowKeyAttrRuleTest.java
        kv
        RowKeyDecoderTest.java
        RowKeyEncoderTest.java
        RowValueDecoderTest.java
        CubeManagerCacheTest.java
        common
        RowKeySplitterTest.java
        BytesSplitterTest.java
        project
        ProjectManagerTest.java
        AggregationGroupSizeRuleTest.java
        cuboid
        CuboidSchedulerTest.java
        CuboidTest.java
        CombinationTest.java
        CubeManagerTest.java
        CubeDescTest.java
        CubeSizeEstimationCLITest.java
        CubeSegmentsTest.java
        DictionaryManagerTest.java
  - pom.xml
  - .settings
    - org.eclipse.jdt.ui.prefs
    - org.eclipse.jdt.core.prefs
    - org.eclipse.core.resources.prefs
- conf
  - kylin_job_conf.xml
  - kylin.properties

/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 * 
 *     http://www.apache.org/licenses/LICENSE-2.0
 * 
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
*/

package org.apache.kylin.dict;

import java.io.ByteArrayInputStream;
import java.io.DataInput;
import java.io.DataInputStream;
import java.io.DataOutput;
import java.io.IOException;
import java.io.PrintStream;
import java.lang.ref.SoftReference;
import java.util.Arrays;
import java.util.HashMap;
import java.util.Map;
import java.util.concurrent.ConcurrentHashMap;

import org.apache.kylin.common.util.BytesUtil;
import org.apache.kylin.common.util.ClassUtil;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

/**
 * A dictionary based on Trie data structure that maps enumerations of byte[] to
 * int IDs.
 * 
 * With Trie the memory footprint of the mapping is minimized at the cost of
 * CPU, if compared to a HashMap of ID Arrays. Performance test shows Trie is
 * roughly 10 times slower, so a cache layer is overlaid on top of the Trie. The
 * caches are held through soft references, so lookups gracefully fall back to
 * the Trie once the caches have been reclaimed under memory pressure.
 * 
 * Serialized layout, as read by this class: the magic bytes, then headSize
 * (short), bodyLen (int), sizeChildOffset (1 byte), sizeNoValuesBeneath (1
 * byte), baseId (short), maxValueLength (short) and the converter class name
 * (UTF); the trie nodes start at offset headSize. Each node consists of the
 * child offset (sizeChildOffset bytes, whose first byte also carries the
 * BIT_IS_LAST_CHILD and BIT_IS_END_OF_VALUE flags), the number of values
 * beneath (sizeNoValuesBeneath bytes), one byte of value length and the value
 * bytes.
 * 
 * Lookups are intended to be safe for concurrent use once the dictionary has
 * been initialized: the trie bytes are only read and the value-to-ID cache is
 * a concurrent map. The ID-to-value cache is a plain array written without
 * synchronization; racing writers store results decoded from the same trie
 * entry.
 * 
 * @author yangli9
 */
@SuppressWarnings({ "rawtypes", "unchecked" })
public class TrieDictionary<T> extends Dictionary<T> {

    public static final byte[] HEAD_MAGIC = new byte[] { 0x54, 0x72, 0x69, 0x65, 0x44, 0x69, 0x63, 0x74 }; // "TrieDict"
    public static final int HEAD_SIZE_I = HEAD_MAGIC.length;

    // flag bits stored in the first byte of every node
    public static final int BIT_IS_LAST_CHILD = 0x80;
    public static final int BIT_IS_END_OF_VALUE = 0x40;

    private static final Logger logger = LoggerFactory.getLogger(TrieDictionary.class);

    private byte[] trieBytes;

    // non-persistent part, derived from trieBytes by init()
    transient private int headSize;
    @SuppressWarnings("unused")
    transient private int bodyLen;
    transient private int sizeChildOffset;
    transient private int sizeNoValuesBeneath;
    transient private int baseId;
    transient private int maxValueLength;
    transient private BytesConverter<T> bytesConvert;

    transient private int nValues;
    transient private int sizeOfId;
    transient private int childOffsetMask;
    transient private int firstByteOffset;

    transient private boolean enableCache = true;
    transient private SoftReference<Map> valueToIdCache;
    transient private SoftReference<Object[]> idToValueCache;

    public TrieDictionary() { // default constructor for Writable interface
    }

    /**
     * Creates a dictionary on top of an already serialized trie.
     * 
     * @param trieBytes
     *            -- the complete serialized dictionary, starting with
     *            {@link #HEAD_MAGIC}
     * @throws IllegalArgumentException
     *             if the bytes do not start with the magic
     */
    public TrieDictionary(byte[] trieBytes) {
        init(trieBytes);
    }

    /**
     * Parses the head section of the given bytes, derives the transient
     * fields and (re)creates the caches.
     */
    private void init(byte[] trieBytes) {
        this.trieBytes = trieBytes;
        if (BytesUtil.compareBytes(HEAD_MAGIC, 0, trieBytes, 0, HEAD_MAGIC.length) != 0)
            throw new IllegalArgumentException("Wrong file type (magic does not match)");

        try {
            DataInputStream headIn = new DataInputStream( //
                    new ByteArrayInputStream(trieBytes, HEAD_SIZE_I, trieBytes.length - HEAD_SIZE_I));
            this.headSize = headIn.readShort();
            this.bodyLen = headIn.readInt();
            this.sizeChildOffset = headIn.read();
            this.sizeNoValuesBeneath = headIn.read();
            this.baseId = headIn.readShort();
            this.maxValueLength = headIn.readShort();

            String converterName = headIn.readUTF();
            if (!converterName.isEmpty())
                this.bytesConvert = (BytesConverter<T>) ClassUtil.forName(converterName, BytesConverter.class).newInstance();

            // the root node's "values beneath" counter is the total number of values
            this.nValues = BytesUtil.readUnsigned(trieBytes, headSize + sizeChildOffset, sizeNoValuesBeneath);
            this.sizeOfId = BytesUtil.sizeForValue(baseId + nValues + 1); // note baseId could raise 1 byte in ID space, +1 to reserve all 0xFF for NULL case
            // clears the two flag bits, which live in the highest byte of the child offset
            this.childOffsetMask = ~((BIT_IS_LAST_CHILD | BIT_IS_END_OF_VALUE) << ((sizeChildOffset - 1) * 8));
            this.firstByteOffset = sizeChildOffset + sizeNoValuesBeneath + 1; // the offset from begin of node to its first value byte
        } catch (Exception e) {
            if (e instanceof RuntimeException)
                throw (RuntimeException) e;
            else
                throw new RuntimeException(e);
        }

        if (enableCache) {
            // concurrent map, because lookups from several threads populate this cache
            valueToIdCache = new SoftReference<Map>(new ConcurrentHashMap());
            idToValueCache = new SoftReference<Object[]>(new Object[nValues]);
        }
    }

    @Override
    public int getMinId() {
        return baseId;
    }

    @Override
    public int getMaxId() {
        return baseId + nValues - 1;
    }

    @Override
    public int getSizeOfId() {
        return sizeOfId;
    }

    @Override
    public int getSizeOfValue() {
        return maxValueLength;
    }

    /**
     * Looks up the ID of a value, consulting the value-to-ID cache first when
     * an exact match is requested (roundingFlag == 0).
     */
    @Override
    final protected int getIdFromValueImpl(T value, int roundingFlag) {
        // null cannot be a key of the concurrent cache, so it always takes the uncached path
        if (enableCache && roundingFlag == 0 && value != null) {
            Map cache = valueToIdCache.get(); // SoftReference to skip cache gracefully when short of memory
            if (cache != null) {
                Integer cachedId = (Integer) cache.get(value);
                if (cachedId != null)
                    return cachedId.intValue();

                byte[] valueBytes = bytesConvert.convertToBytes(value);
                int id = getIdFromValueBytes(valueBytes, 0, valueBytes.length, roundingFlag);

                cache.put(value, Integer.valueOf(id));
                return id;
            }
        }
        byte[] valueBytes = bytesConvert.convertToBytes(value);
        return getIdFromValueBytes(valueBytes, 0, valueBytes.length, roundingFlag);
    }

    /**
     * Looks up the ID of the value stored in value[offset, offset + len).
     * 
     * @throws IllegalArgumentException
     *             if no ID can be determined for the value under the given
     *             rounding flag
     */
    @Override
    protected int getIdFromValueBytesImpl(byte[] value, int offset, int len, int roundingFlag) {
        int seq = lookupSeqNoFromValue(headSize, value, offset, offset + len, roundingFlag);
        int id = calcIdFromSeqNo(seq);
        if (id < 0)
            throw new IllegalArgumentException("Not a valid value: " + bytesConvert.convertFromBytes(value, offset, len));
        return id;
    }

    /**
     * returns a code point from [0, nValues), preserving order of value
     * 
     * @param n
     *            -- the offset of current node
     * @param inp
     *            -- input value bytes to lookup
     * @param o
     *            -- offset in the input value bytes matched so far
     * @param inpEnd
     *            -- end of input
     * @param roundingFlag
     *            -- =0: return -1 if not found -- <0: return closest smaller if
     *            not found, might be -1 -- >0: return closest bigger if not
     *            found, might be nValues
     */
    private int lookupSeqNoFromValue(int n, byte[] inp, int o, int inpEnd, int roundingFlag) {
        // special 'empty' value; decided on the [o, inpEnd) slice, not on the
        // length of the backing array, so empty slices of larger buffers work
        if (o == inpEnd)
            return checkFlag(headSize, BIT_IS_END_OF_VALUE) ? 0 : roundSeqNo(roundingFlag, -1, -1, 0);

        int seq = 0; // the sequence no under track

        while (true) {
            // match the current node, note [0] of node's value has been matched
            // when this node is selected by its parent
            int p = n + firstByteOffset; // start of node's value
            int end = p + BytesUtil.readUnsigned(trieBytes, p - 1, 1); // end of node's value
            for (p++; p < end && o < inpEnd; p++, o++) { // note matching start from [1]
                if (trieBytes[p] != inp[o]) {
                    int comp = BytesUtil.compareByteUnsigned(trieBytes[p], inp[o]);
                    if (comp < 0) {
                        // every value beneath this node sorts before the input
                        seq += BytesUtil.readUnsigned(trieBytes, n + sizeChildOffset, sizeNoValuesBeneath);
                    }
                    return roundSeqNo(roundingFlag, seq - 1, -1, seq); // mismatch
                }
            }

            // node completely matched, is input all consumed?
            boolean isEndOfValue = checkFlag(n, BIT_IS_END_OF_VALUE);
            if (o == inpEnd) {
                // input all matched
                return p == end && isEndOfValue ? seq : roundSeqNo(roundingFlag, seq - 1, -1, seq);
            }
            if (isEndOfValue)
                seq++;

            // find a child to continue
            int c = headSize + (BytesUtil.readUnsigned(trieBytes, n, sizeChildOffset) & childOffsetMask);
            if (c == headSize) // has no children
                return roundSeqNo(roundingFlag, seq - 1, -1, seq); // input only partially matched
            byte inpByte = inp[o];
            int comp;
            while (true) {
                p = c + firstByteOffset;
                comp = BytesUtil.compareByteUnsigned(trieBytes[p], inpByte);
                if (comp == 0) { // continue in the matching child, reset n and loop again
                    n = c;
                    o++;
                    break;
                } else if (comp < 0) { // try next child
                    seq += BytesUtil.readUnsigned(trieBytes, c + sizeChildOffset, sizeNoValuesBeneath);
                    if (checkFlag(c, BIT_IS_LAST_CHILD))
                        return roundSeqNo(roundingFlag, seq - 1, -1, seq); // no child can match the next byte of input
                    c = p + BytesUtil.readUnsigned(trieBytes, p - 1, 1); // the next sibling follows this child's value
                } else { // children are ordered by their first value byte
                    return roundSeqNo(roundingFlag, seq - 1, -1, seq); // no child can match the next byte of input
                }
            }
        }
    }

    /**
     * Picks the result of an unsuccessful lookup according to the rounding
     * flag: i when rounding down (flag < 0), j when no rounding is requested
     * (flag == 0), k when rounding up (flag > 0).
     */
    private int roundSeqNo(int roundingFlag, int i, int j, int k) {
        if (roundingFlag == 0)
            return j;
        else if (roundingFlag < 0)
            return i;
        else
            return k;
    }

    /**
     * Resolves an ID to its value, consulting the ID-to-value cache first.
     * 
     * @throws IllegalArgumentException
     *             from the cached path if the ID is outside the range of this
     *             dictionary
     */
    @Override
    final protected T getValueFromIdImpl(int id) {
        if (enableCache) {
            Object[] cache = idToValueCache.get(); // SoftReference to skip cache gracefully when short of memory
            if (cache != null) {
                int seq = calcSeqNoFromId(id);
                if (seq < 0 || seq >= nValues)
                    throw new IllegalArgumentException("Not a valid ID: " + id);
                if (cache[seq] != null)
                    return (T) cache[seq];

                byte[] value = new byte[getSizeOfValue()];
                int length = getValueBytesFromId(id, value, 0);
                T result = bytesConvert.convertFromBytes(value, 0, length);

                cache[seq] = result;
                return result;
            }
        }
        byte[] value = new byte[getSizeOfValue()];
        int length = getValueBytesFromId(id, value, 0);
        return bytesConvert.convertFromBytes(value, 0, length);
    }

    /**
     * Writes the value bytes of the given ID into returnValue starting at
     * offset.
     * 
     * @return the result of the trie walk: the number of bytes written, or -1
     *         if the walk ran out of children
     * @throws IllegalArgumentException
     *             if the ID is outside [baseId, baseId + nValues)
     */
    @Override
    protected int getValueBytesFromIdImpl(int id, byte[] returnValue, int offset) {
        if (id < baseId || id >= baseId + nValues)
            throw new IllegalArgumentException("Not a valid ID: " + id);

        int seq = calcSeqNoFromId(id);

        return lookupValueFromSeqNo(headSize, seq, returnValue, offset);
    }

    /**
     * Walks the trie down to the value with the given sequence number and
     * copies the value bytes of every node on the path into returnValue.
     * 
     * @param n
     *            -- the offset of current node
     * @param seq
     *            -- the code point under track
     * @param returnValue
     *            -- where return value is written to
     * @param offset
     *            -- position in returnValue where writing starts
     * @return the number of bytes written, or -1 if the walk ran out of
     *         children before reaching the value (corrupted dictionary)
     */
    private int lookupValueFromSeqNo(int n, int seq, byte[] returnValue, int offset) {
        int o = offset;
        while (true) {
            // write current node value
            int p = n + firstByteOffset;
            int len = BytesUtil.readUnsigned(trieBytes, p - 1, 1);
            System.arraycopy(trieBytes, p, returnValue, o, len);
            o += len;

            // if the value is ended
            boolean isEndOfValue = checkFlag(n, BIT_IS_END_OF_VALUE);
            if (isEndOfValue) {
                seq--;
                if (seq < 0)
                    return o - offset;
            }

            // find a child to continue
            int c = headSize + (BytesUtil.readUnsigned(trieBytes, n, sizeChildOffset) & childOffsetMask);
            if (c == headSize) // has no children
                return -1; // no child? corrupted dictionary!
            int nValuesBeneath;
            while (true) {
                nValuesBeneath = BytesUtil.readUnsigned(trieBytes, c + sizeChildOffset, sizeNoValuesBeneath);
                if (seq - nValuesBeneath < 0) { // value is under this child, reset n and loop again
                    n = c;
                    break;
                } else { // go to next child
                    seq -= nValuesBeneath;
                    if (checkFlag(c, BIT_IS_LAST_CHILD))
                        return -1; // no more child? corrupted dictionary!
                    p = c + firstByteOffset;
                    c = p + BytesUtil.readUnsigned(trieBytes, p - 1, 1);
                }
            }
        }
    }

    /** Tests a flag bit in the first byte of the node at the given offset. */
    private boolean checkFlag(int offset, int bit) {
        return (trieBytes[offset] & bit) > 0;
    }

    /** Maps a sequence number to an ID, or -1 if it is outside [0, nValues). */
    private int calcIdFromSeqNo(int seq) {
        if (seq < 0 || seq >= nValues)
            return -1;
        else
            return baseId + seq;
    }

    /** Maps an ID to its sequence number; the result is not range checked. */
    private int calcSeqNoFromId(int id) {
        return id - baseId;
    }

    /** Writes the serialized dictionary as is. */
    @Override
    public void write(DataOutput out) throws IOException {
        out.write(trieBytes);
    }

    /**
     * Reads a serialized dictionary: first the magic, headSize and bodyLen to
     * learn the total length, then the remaining headSize + bodyLen bytes.
     * 
     * @throws IllegalArgumentException
     *             if the input does not start with the magic
     */
    @Override
    public void readFields(DataInput in) throws IOException {
        // magic + headSize (short) + bodyLen (int). Short.SIZE and Integer.SIZE
        // are bit counts, hence the division by Byte.SIZE to get bytes.
        byte[] headPartial = new byte[HEAD_MAGIC.length + Short.SIZE / Byte.SIZE + Integer.SIZE / Byte.SIZE];
        in.readFully(headPartial);

        if (BytesUtil.compareBytes(HEAD_MAGIC, 0, headPartial, 0, HEAD_MAGIC.length) != 0)
            throw new IllegalArgumentException("Wrong file type (magic does not match)");

        DataInputStream headIn = new DataInputStream( //
                new ByteArrayInputStream(headPartial, HEAD_SIZE_I, headPartial.length - HEAD_SIZE_I));
        int serializedHeadSize = headIn.readShort();
        int serializedBodyLen = headIn.readInt();
        headIn.close();

        byte[] all = new byte[serializedHeadSize + serializedBodyLen];
        System.arraycopy(headPartial, 0, all, 0, headPartial.length);
        in.readFully(all, headPartial.length, all.length - headPartial.length);

        init(all);
    }

    /** Prints every ID (decimal and hex) together with its value. */
    @Override
    public void dump(PrintStream out) {
        out.println("Total " + nValues + " values");
        for (int i = 0; i < nValues; i++) {
            int id = calcIdFromSeqNo(i);
            T value = getValueFromId(id);
            out.println(id + " (" + Integer.toHexString(id) + "): " + value);
        }
    }

    @Override
    public int hashCode() {
        return Arrays.hashCode(trieBytes);
    }

    /** Two trie dictionaries are equal when their serialized bytes are equal. */
    @Override
    public boolean equals(Object o) {
        if (!(o instanceof TrieDictionary)) {
            logger.info("Equals return false because o is not TrieDictionary");
            return false;
        }
        TrieDictionary that = (TrieDictionary) o;
        return Arrays.equals(this.trieBytes, that.trieBytes);
    }

    /** Ad-hoc manual check: builds a small dictionary and prints rounded lookups. */
    public static void main(String[] args) throws Exception {
        TrieDictionaryBuilder<String> b = new TrieDictionaryBuilder<String>(new StringBytesConverter());
        // b.addValue("part");
        // b.print();
        // b.addValue("part");
        // b.print();
        // b.addValue("par");
        // b.print();
        // b.addValue("partition");
        // b.print();
        // b.addValue("party");
        // b.print();
        // b.addValue("parties");
        // b.print();
        // b.addValue("paint");
        // b.print();
        b.addValue("-000000.41");
        b.addValue("0000101.81");
        b.addValue("6779331");
        String t = "0000001.6131";
        TrieDictionary<String> dict = b.build(0);

        System.out.println(dict.getIdFromValue(t, -1));
        System.out.println(dict.getIdFromValue(t, 1));
    }
}