java source code of TezMerger

tez-master
- NOTICE.txt
- tez-build-tools
  - src
    - main
      - resources
        checkstyle
        checkstyle.xml
        suppressions.xml
  - pom.xml
- tez-mapreduce
  - src
    - main
      - proto
        MRRuntimeProtos.proto
      - resources
        META-INF
        NOTICE.txt
        services
        org.apache.hadoop.mapreduce.protocol.ClientProtocolProvider
        LICENSE.txt
      - javadoc
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        hadoop
        mapred
        split
        TezGroupedSplit.java
        TezMapredSplitsGrouper.java
        SplitLocationProvider.java
        SplitSizeEstimator.java
        TezGroupedSplitsInputFormat.java
        mapreduce
        split
        TezMapReduceSplitsGrouper.java
        SplitMetaInfoReaderTez.java
        TezGroupedSplit.java
        SplitLocationProvider.java
        SplitLocationProviderMapReduce.java
        SplitSizeEstimator.java
        TezGroupedSplitsInputFormat.java
        tez
        dag
        api
        client
        MRDAGClient.java
        client
        MRTezClient.java
        common
        MRFrameworkConfigs.java
        mapreduce
        committer
        MROutputCommitter.java
        processor
        MRTaskReporter.java
        MRTask.java
        reduce
        ReduceProcessor.java
        map
        MapProcessor.java
        SimpleMRProcessor.java
        hadoop
        MRHelpers.java
        MRJobConfig.java
        MRInputHelpers.java
        TezTypeConverters.java
        MRConfig.java
        IDConverter.java
        mapred
        MRCounters.java
        JobContextImpl.java
        MRReporter.java
        package-info.java
        TaskAttemptContextImpl.java
        InputSplitInfoDisk.java
        MultiStageMRConfToTezTranslator.java
        package-info.java
        MultiStageMRConfigUtil.java
        InputSplitInfo.java
        DeprecatedKeys.java
        mapreduce
        JobContextImpl.java
        MapContextImpl.java
        TezNullOutputCommitter.java
        package-info.java
        TaskInputOutputContextImpl.java
        TaskAttemptContextImpl.java
        InputSplitInfoMem.java
        client
        ClientServiceDelegate.java
        YARNRunner.java
        ResourceMgrDelegate.java
        package-info.java
        YarnTezClientProtocolProvider.java
        ClientCache.java
        NotRunningJob.java
        DAGJobStatus.java
        partition
        MRPartitioner.java
        combine
        MRCombiner.java
        output
        MultiMROutput.java
        MROutputLegacy.java
        MROutput.java
        common
        Utils.java
        MRInputAMSplitGenerator.java
        MRInputSplitDistributor.java
        lib
        MRInputUtils.java
        MRReaderMapred.java
        package-info.java
        MRReader.java
        MRReaderMapReduce.java
        input
        base
        MRInputBase.java
        MRInputLegacy.java
        MRInput.java
        MultiMRInput.java
        grouper
        SplitLocationProviderWrapper.java
        SplitLocationProviderWrapperMapred.java
        SplitSizeEstimatorWrapperMapReduce.java
        GroupedSplitContainer.java
        MapReduceSplitContainer.java
        SplitSizeEstimatorWrapperMapred.java
        MapredSplitContainer.java
        TezSplitGrouper.java
        SplitSizeEstimatorWrapper.java
        SplitContainer.java
    - test
      - resources
        log4j.properties
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        hadoop
        mapred
        split
        TestGroupedSplits.java
        tez
        mapreduce
        processor
        reduce
        TestReduceProcessor.java
        map
        TestMapProcessor.java
        MapUtils.java
        hadoop
        TestMRHelpers.java
        TestDeprecatedKeys.java
        TestMRInputHelpers.java
        TestConfigTranslationMRToTez.java
        combine
        TestMRCombiner.java
        TezTestUtils.java
        output
        TestMROutput.java
        TestMROutputLegacy.java
        TestMROutputConfigBuilder.java
        TestMultiMROutput.java
        common
        TestMRInputAMSplitGenerator.java
        TestMRInputSplitDistributor.java
        lib
        TestKVReadersWithMR.java
        TestUmbilical.java
        input
        TestMultiMRInput.java
        MultiMRInputForTest.java
        MRInputForTest.java
        TestMRInput.java
  - pom.xml
  - findbugs-exclude.xml
- hadoop-shim
  - src
    - main
      - java
        org
        apache
        tez
        hadoop
        shim
        HadoopShimsLoader.java
        DefaultHadoopShim.java
        HadoopShim.java
        HadoopShimProvider.java
    - test
      - resources
        log4j.properties
      - java
        org
        apache
        tez
        hadoop
        shim
        TestHadoopShimsLoader.java
        DummyShimProvider.java
  - pom.xml
  - findbugs-exclude.xml
- tez-tests
  - src
    - main
      - resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - javadoc
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        tez
        mapreduce
        examples
        MRRSleepJob.java
        processor
        FilterByWordOutputProcessor.java
        FilterByWordInputProcessor.java
        BroadcastAndOneToOneExample.java
        TestOrderedWordCount.java
        helpers
        SplitsInClientOptionParser.java
        FilterLinesByWordOneToOne.java
        SecondarySort.java
        Sort.java
        UnionExample.java
        RandomTextWriter.java
        Join.java
        CartesianProduct.java
        RPCLoadGen.java
        MultipleCommitsExample.java
        RandomWriter.java
        MapredWordCount.java
        BroadcastLoadGen.java
        FilterLinesByWord.java
        ExampleDriver.java
    - test
      - resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        tez
        test
        FaultToleranceTestRunner.java
        TestLocalMode.java
        TestDAGRecovery2.java
        AMShutdownController.java
        TestSecureShuffle.java
        TestTaskErrorsUsingLocalMode.java
        RecoveryServiceWithEventHandlingHook.java
        dag
        ThreeLevelsFailingDAG.java
        SixLevelsFailingDAG.java
        TwoLevelsFailingDAG.java
        SimpleReverseVTestDAG.java
        SimpleVTestDAG.java
        MultiAttemptDAG.java
        TestPipelinedShuffle.java
        TestDAGRecovery.java
        TestMiniTezCluster.java
        SimpleTestDAG.java
        TestDriver.java
        TestTezJobs.java
        TestFaultTolerance.java
        TestInput.java
        TestProcessor.java
        TestOutput.java
        TestExceptionPropagation.java
        TestRecovery.java
        TestAMRecovery.java
        SimpleTestDAG3Vertices.java
        MiniTezCluster.java
        mapreduce
        TestMRRJobsDAGApi.java
        TestMRRJobs.java
  - pom.xml
  - findbugs-exclude.xml
- tez-examples
  - src
    - main
      - resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - javadoc
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        tez
        examples
        SimpleSessionExample.java
        WordCount.java
        JoinValidate.java
        SortMergeJoinExample.java
        TezExampleBase.java
        JoinDataGen.java
        HashJoinExample.java
        OrderedWordCount.java
        CartesianProduct.java
        ExampleDriver.java
    - test
      - resources
        META-INF
        NOTICE.txt
        LICENSE.txt
  - pom.xml
  - findbugs-exclude.xml
- tez-runtime-internals
  - src
    - main
      - proto
        RuntimeEvents.proto
      - resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - javadoc
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        tez
        common
        ProtoConverters.java
        TezLocalResource.java
        TezConverterUtils.java
        TezTaskUmbilicalProtocol.java
        ContainerTask.java
        ContainerContext.java
        runtime
        internals
        api
        TaskReporterInterface.java
        task
        EndReason.java
        ContainerReporter.java
        TezTaskRunner2.java
        ErrorReporter.java
        TezChild.java
        TaskRunner2Callable.java
        TaskReporter.java
        TaskRunner2Result.java
        RuntimeTask.java
        InputReadyTracker.java
        api
        impl
        TezHeartbeatResponse.java
        TezMergedInputContextImpl.java
        TezHeartbeatRequest.java
        EventType.java
        TezCountersDelegate.java
        TezProcessorContextImpl.java
        TezEvent.java
        EventMetaData.java
        TaskStatistics.java
        GroupInputSpec.java
        TaskSpec.java
        TezOutputContextImpl.java
        IOStatistics.java
        TezUmbilical.java
        TezInputContextImpl.java
        InputSpec.java
        OutputSpec.java
        ExecutionContextImpl.java
        TezTaskContextImpl.java
        events
        TaskAttemptCompletedEvent.java
        TaskAttemptFailedEvent.java
        TaskAttemptKilledEvent.java
        TaskStatusUpdateEvent.java
        common
        security
        JobTokenSelector.java
        resources
        MemoryDistributor.java
        ScalingAllocator.java
        objectregistry
        ObjectRegistryImpl.java
        LogicalIOProcessorRuntimeTask.java
        metrics
        FileSystemStatisticUpdater.java
        TaskCounterUpdater.java
    - test
      - resources
        log4j.properties
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        tez
        runtime
        task
        TaskExecutionTestHelpers.java
        TestContainerExecution.java
        TestTaskReporter.java
        TestTezTaskRunner2.java
        TestTaskExecution2.java
        api
        impl
        TestTezEvent.java
        TestTaskSpec.java
        TestProcessorContext.java
        common
        resources
        TestMemoryDistributor.java
        objectregistry
        TestObjectRegistry.java
        TestLogicalIOProcessorRuntimeTask.java
        TestInputReadyTracker.java
  - pom.xml
  - findbugs-exclude.xml
- tez-dag
  - src
    - main
      - proto
        HistoryEvents.proto
      - resources
        tez-container-log4j.properties
        tez-dag-version-info.properties
        META-INF
        NOTICE.txt
        LICENSE.txt
      - javadoc
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        tez
        dag
        utils
        ProtoUtils.java
        TaskSpecificLaunchCmdOption.java
        TezBuilderUtils.java
        Graph.java
        Simple2LevelVersionComparator.java
        TezRuntimeChildJVM.java
        api
        client
        VertexStatusBuilder.java
        ProgressBuilder.java
        DAGClientHandler.java
        rpc
        DAGClientAMProtocolBlockingPBServerImpl.java
        DAGClientServer.java
        DAGStatusBuilder.java
        oldrecords
        TaskAttemptState.java
        AMInfo.java
        TaskReport.java
        TaskState.java
        TaskAttemptReport.java
        history
        utils
        DAGUtils.java
        TezEventUtils.java
        HistoryEvent.java
        DAGHistoryEvent.java
        HistoryEventType.java
        SummaryEvent.java
        RecoveryConverters.java
        recovery
        RecoveryService.java
        HistoryEventHandler.java
        logging
        impl
        HistoryEventJsonConversion.java
        SimpleHistoryLoggingService.java
        DevNullHistoryLoggingService.java
        HistoryLoggingService.java
        events
        DAGCommitStartedEvent.java
        VertexStartedEvent.java
        AMLaunchedEvent.java
        ContainerStoppedEvent.java
        TaskStartedEvent.java
        VertexGroupCommitFinishedEvent.java
        VertexGroupCommitStartedEvent.java
        ContainerLaunchedEvent.java
        VertexConfigurationDoneEvent.java
        VertexCommitStartedEvent.java
        DAGRecoveredEvent.java
        VertexInitializedEvent.java
        VertexFinishedEvent.java
        TaskFinishedEvent.java
        AppLaunchedEvent.java
        DAGFinishedEvent.java
        TaskAttemptStartedEvent.java
        DAGSubmittedEvent.java
        DAGStartedEvent.java
        DAGKillRequestEvent.java
        TaskAttemptFinishedEvent.java
        DAGInitializedEvent.java
        AMStartedEvent.java
        app
        security
        authorize
        TezAMPolicyProvider.java
        package-info.java
        RecoveryParser.java
        TaskAttemptEventInfo.java
        DAGAppMaster.java
        dag
        impl
        TaskImpl.java
        AMUserCodeException.java
        TezRootInputInitializerContextImpl.java
        OneToOneEdgeManager.java
        DAGSchedulerNaturalOrder.java
        OneToOneEdgeManagerOnDemand.java
        DAGImpl.java
        BroadcastEdgeManager.java
        Edge.java
        TaskReportImpl.java
        RootInputVertexManager.java
        ImmediateStartVertexManager.java
        OutputCommitterContextImpl.java
        ScatterGatherEdgeManager.java
        package-info.java
        VertexManager.java
        ServicePluginInfo.java
        TaskAttemptImplHelpers.java
        TaskAttemptImpl.java
        VertexStats.java
        VertexImpl.java
        DAGSchedulerNaturalOrderControlled.java
        StateChangeNotifier.java
        Task.java
        DAGState.java
        VertexTerminationCause.java
        VertexStateUpdateListener.java
        speculation
        legacy
        TaskRuntimeEstimator.java
        DataStatistics.java
        LegacyTaskRuntimeEstimator.java
        LegacySpeculator.java
        forecast
        SimpleExponentialSmoothing.java
        package-info.java
        StartEndTimesBase.java
        SimpleExponentialTaskRuntimeEstimator.java
        DAGTerminationCause.java
        Vertex.java
        RootInputInitializerManager.java
        TaskStateInternal.java
        package-info.java
        DAGReport.java
        event
        VertexEventTaskAttemptCompleted.java
        VertexEventSourceVertexStarted.java
        CallableEvent.java
        TaskAttemptEventContainerTerminating.java
        DAGAppMasterEvent.java
        VertexEventRootInputFailed.java
        TaskAttemptEvent.java
        TaskEvent.java
        DAGEvent.java
        DAGAppMasterEventDagCleanup.java
        DAGAppMasterEventDAGFinished.java
        DAGAppMasterEventType.java
        DAGEventCommitCompleted.java
        TaskAttemptEventSubmitted.java
        SpeculatorEventType.java
        TaskAttemptEventStartedRemotely.java
        DAGEventSchedulerUpdate.java
        TaskAttemptEventNodeFailed.java
        DAGEventRecoverEvent.java
        DiagnosableEvent.java
        DAGAppMasterEventUserServiceFatalError.java
        TaskAttemptEventSchedule.java
        DAGEventInternalError.java
        VertexEventRecoverVertex.java
        VertexEventSourceTaskAttemptCompleted.java
        TaskAttemptEventContainerTerminated.java
        TaskEventScheduleTask.java
        TaskAttemptEventContainerTerminatedBySystem.java
        VertexEventInputDataInformation.java
        TaskEventType.java
        DAGEventVertexReRunning.java
        TaskEventTAKilled.java
        DAGEventStartDag.java
        TaskEventTASucceeded.java
        DAGEventCounterUpdate.java
        TaskAttemptEventType.java
        VertexEventRouteEvent.java
        DAGEventType.java
        DAGEventTerminateDag.java
        DAGEventVertexCompleted.java
        package-info.java
        CallableEventType.java
        VertexEventRootInputInitialized.java
        RecoveryEvent.java
        VertexEventTermination.java
        TaskAttemptEventAttemptKilled.java
        SpeculatorEvent.java
        VertexEvent.java
        DAGEventDiagnosticsUpdate.java
        TaskAttemptEventOutputFailed.java
        DAGAppMasterEventSchedulingServiceError.java
        TaskAttemptEventKillRequest.java
        TaskAttemptEventTezEventUpdate.java
        TaskEventTAFailed.java
        TaskAttemptEventTerminationCauseEvent.java
        VertexEventTaskReschedule.java
        TaskAttemptEventStatusUpdate.java
        VertexEventManagerUserCodeError.java
        TaskEventTALaunched.java
        VertexEventType.java
        TaskEventTermination.java
        VertexEventCommitCompleted.java
        VertexEventNullEdgeInitialized.java
        VertexEventTaskCompleted.java
        SpeculatorEventTaskAttemptStatusUpdate.java
        TaskAttemptEventAttemptFailed.java
        TaskEventTAUpdate.java
        DAG.java
        TaskTerminationCause.java
        DAGScheduler.java
        TaskStateUpdateListener.java
        TaskAttemptStateInternal.java
        VertexState.java
        TaskAttempt.java
        TaskCommunicatorContextImpl.java
        ServicePluginLifecycleAbstractService.java
        TezTaskCommunicatorImpl.java
        web
        WebUIService.java
        AMWebController.java
        TezLocalTaskCommunicatorImpl.java
        TaskCommunicatorWrapper.java
        AppContext.java
        ClusterInfo.java
        HeartbeatHandlerBase.java
        TaskCommunicatorManagerInterface.java
        TezDagVersionInfo.java
        package-info.java
        rm
        ContainerAllocator.java
        AMSchedulerEventTAStateUpdated.java
        ContainerLauncherEventType.java
        AMSchedulerEventTALaunchRequest.java
        AMSchedulerEventTAEnded.java
        TezAMRMClientAsync.java
        TaskSchedulerContextImplWrapper.java
        TaskSchedulerManager.java
        node
        AMNodeImpl.java
        AMNodeEventNodeCountUpdated.java
        AMNodeEventContainerCompleted.java
        AMNodeEventTaskAttemptEnded.java
        AMNodeEventTaskAttemptSucceeded.java
        AMNodeTracker.java
        AMNodeEventType.java
        AMNode.java
        AMNodeEventContainerAllocated.java
        PerSourceNodeTracker.java
        AMNodeState.java
        AMNodeEventStateChanged.java
        AMNodeEvent.java
        ExtendedNodeId.java
        AMSchedulerEventType.java
        DagAwareYarnTaskScheduler.java
        ContainerLauncherEvent.java
        ContainerLauncherLaunchRequestEvent.java
        package-info.java
        AMSchedulerEventDeallocateContainer.java
        ContainerLauncherStopRequestEvent.java
        LocalTaskSchedulerService.java
        AMSchedulerEvent.java
        container
        AMContainerMap.java
        AMContainerEventAssignTA.java
        AMContainerImpl.java
        AMContainerEventCompleted.java
        AMContainerEventLaunched.java
        AMContainerEventLaunchRequest.java
        ContainerContextMatcher.java
        AMContainer.java
        AMContainerEvent.java
        AMContainerEventNodeFailed.java
        AMContainerEventStopFailed.java
        AMContainerTask.java
        AMContainerHelpers.java
        AMContainerState.java
        AMContainerEventType.java
        AMContainerEventTASucceeded.java
        AMContainerEventStopRequest.java
        AMContainerEventLaunchFailed.java
        AMSchedulerEventNodeBlacklistUpdate.java
        TaskSchedulerWrapper.java
        YarnTaskSchedulerService.java
        TaskSchedulerContextImpl.java
        YarnTaskSchedulerServiceError.java
        ContainerLauncherContextImpl.java
        TaskCommunicatorManager.java
        DAGAppMasterState.java
        TaskHeartbeatHandler.java
        ContainerContext.java
        ContainerHeartbeatHandler.java
        launcher
        DagDeleteRunnable.java
        TezLocalCacheManager.java
        TezContainerLauncherImpl.java
        ContainerOp.java
        package-info.java
        ContainerLauncherManager.java
        DeletionTracker.java
        DeletionTrackerImpl.java
        ContainerLauncherWrapper.java
        LocalContainerLauncher.java
        serviceplugins
        api
        TaskCommunicator.java
        TaskHeartbeatRequest.java
        TaskHeartbeatResponse.java
        TaskCommunicatorContext.java
        state
        StateMachineTez.java
        OnStateChangedCallback.java
        Utils.java
        client
        LocalClient.java
    - test
      - resources
        log4j.properties
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        tez
        dag
        utils
        TestSimple2LevelVersionComparator.java
        TestTaskSpecificLaunchCmdOption.java
        helpers
        DagInfoImplForTest.java
        api
        client
        TestDAGClientHandler.java
        rpc
        TestDAGClientAMProtocolBlockingPBServerImpl.java
        TestVertexStatusBuilder.java
        TestDAGClientServer.java
        history
        utils
        TestDAGUtils.java
        TestHistoryEventType.java
        recovery
        TestRecoveryService.java
        TestHistoryEventHandler.java
        logging
        impl
        TestHistoryEventJsonConversion.java
        events
        TestHistoryEventsProtoConversion.java
        app
        MockTezClient.java
        dag
        impl
        TestDAGScheduler.java
        TestImmediateStartVertexManager.java
        TestEdge.java
        TestCommit.java
        TestDAGRecovery.java
        TestRootInputVertexManager.java
        TestVertexStats.java
        TestVertexImpl2.java
        TestTaskImpl.java
        TestDAGImpl.java
        TestTaskAttempt.java
        CallableEventDispatcher.java
        TestVertexManager.java
        TestDAGSchedulerNaturalOrderControlled.java
        speculation
        legacy
        TestDataStatistics.java
        app
        TestTezTaskCommunicatorManager.java
        TestStateChangeNotifier.java
        TestRootInputInitializerManager.java
        PluginWrapperTestHelpers.java
        TestMockDAGAppMaster.java
        web
        TestAMWebController.java
        TestTaskCommunicatorManager.java
        TestTaskCommunicatorWrapper.java
        TestRecoveryParser.java
        MockLocalClient.java
        TestSpeculation.java
        TestMemoryWithEvents.java
        TestTaskCommunicatorManager2.java
        TestTaskCommunicatorContextImpl.java
        TestTaskCommunicatorManager1.java
        MockClock.java
        rm
        TestTaskSchedulerWrapper.java
        TestDagAwareYarnTaskScheduler.java
        node
        TestAMNodeTracker.java
        TestTaskSchedulerHelpers.java
        TestTezAMRMClient.java
        container
        TestAMContainerMap.java
        TestAMContainer.java
        TestContainerReuse.java
        TestLocalTaskScheduler.java
        TestTaskScheduler.java
        TestLocalTaskSchedulerService.java
        TestTaskSchedulerManager.java
        TestDAGAppMaster.java
        TestPreemption.java
        MockDAGAppMaster.java
        launcher
        TestContainerLauncherManager.java
        TestContainerLauncherWrapper.java
        TestDeletionTracker.java
        TestTezLocalCacheManager.java
        test
        ControlledScheduledExecutorService.java
        GraceShuffleVertexManagerForTest.java
        EdgeManagerForTest.java
        VertexManagerPluginForTest.java
  - pom.xml
  - findbugs-exclude.xml
- tez-plugins
  - tez-history-parser
    - src
      - main
        java
        org
        apache
        tez
        history
        ATSImportTool.java
        parser
        utils
        Utils.java
        ATSData.java
        SimpleHistoryParser.java
        datamodel
        TaskInfo.java
        Event.java
        BaseInfo.java
        EdgeInfo.java
        Constants.java
        VertexInfo.java
        BaseParser.java
        AdditionalInputOutputDetails.java
        VersionInfo.java
        TaskAttemptInfo.java
        DagInfo.java
        Container.java
        ProtoHistoryParser.java
        ATSFileParser.java
      - test
        java
        org
        apache
        tez
        history
        TestHistoryParser.java
    - pom.xml
    - findbugs-exclude.xml
  - pom.xml
  - tez-yarn-timeline-history-with-acls
    - src
      - main
        java
        org
        apache
        tez
        dag
        history
        ats
        acls
        ATSHistoryACLPolicyManager.java
      - test
        java
        org
        apache
        tez
        dag
        history
        ats
        acls
        TestATSHistoryWithACLs.java
    - pom.xml
    - findbugs-exclude.xml
  - tez-aux-services
    - src
      - main
        java
        org
        apache
        tez
        auxservices
        FadvisedChunkedFile.java
        IndexCache.java
        FadvisedFileRegion.java
        ShuffleHandler.java
      - test
        java
        org
        apache
        tez
        auxservices
        TestShuffleHandler.java
        TestIndexCache.java
        TestShuffleHandlerJobs.java
    - pom.xml
    - findbugs-exclude.xml
  - tez-yarn-timeline-cache-plugin
    - src
      - main
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
        javadoc
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
        java
        org
        apache
        tez
        dag
        history
        logging
        ats
        TimelineCachePluginImpl.java
      - test
        java
        org
        apache
        tez
        dag
        history
        logging
        ats
        TestTimelineCachePluginImpl.java
    - pom.xml
    - findbugs-exclude.xml
  - tez-yarn-timeline-history
    - src
      - main
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
        javadoc
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
        java
        org
        apache
        tez
        dag
        history
        logging
        ats
        HistoryEventTimelineConversion.java
        ATSHistoryLoggingService.java
      - test
        resources
        log4j.properties
        META-INF
        NOTICE.txt
        LICENSE.txt
        java
        org
        apache
        tez
        dag
        history
        logging
        ats
        TestATSHistoryLoggingService.java
        TestATSHistoryWithMiniCluster.java
        TestHistoryEventTimelineConversion.java
        tests
        MiniTezClusterWithTimeline.java
    - pom.xml
    - findbugs-exclude.xml
  - tez-yarn-timeline-history-with-fs
    - src
      - main
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
        javadoc
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
        java
        org
        apache
        tez
        dag
        history
        ats
        acls
        ATSV15HistoryACLPolicyManager.java
        logging
        ats
        ATSV15HistoryLoggingService.java
      - test
        java
        org
        apache
        tez
        dag
        history
        ats
        acls
        TestATSHistoryV15.java
        logging
        ats
        TestATSV15HistoryLoggingService.java
    - pom.xml
    - findbugs-exclude.xml
  - tez-protobuf-history-plugin
    - src
      - main
        proto
        HistoryLogger.proto
        java
        org
        apache
        tez
        dag
        history
        logging
        proto
        ProtoMessageReader.java
        ProtoMessageWriter.java
        HistoryEventProtoJsonConversion.java
        ProtoMessageWritable.java
        DagManifesFileScanner.java
        TezProtoLoggers.java
        HistoryEventProtoConverter.java
        ProtoHistoryLoggingService.java
        DatePartitionedLogger.java
      - test
        java
        org
        apache
        tez
        dag
        history
        logging
        proto
        TestProtoHistoryLoggingService.java
        TestDagManifestFileScanner.java
        TestHistoryEventProtoConverter.java
    - pom.xml
    - findbugs-exclude.xml
- tez-tools
  - tez-tfile-parser
    - src
      - main
        java
        org
        apache
        tez
        tools
        TFileLoader.java
        TFileRecordReader.java
    - pom.xml
    - README.txt
  - analyzers
    - job-analyzer
      - src
        main
        java
        org
        apache
        tez
        analyzer
        utils
        SVGUtils.java
        Utils.java
        Analyzer.java
        Result.java
        plugins
        SkewAnalyzer.java
        ShuffleTimeAnalyzer.java
        SlowestVertexAnalyzer.java
        SlowTaskIdentifier.java
        CriticalPathAnalyzer.java
        SlowNodeAnalyzer.java
        LocalityAnalyzer.java
        SpillAnalyzerImpl.java
        TaskAssignmentAnalyzer.java
        VertexLevelCriticalPathAnalyzer.java
        TaskAttemptResultStatisticsAnalyzer.java
        TezAnalyzerBase.java
        ContainerReuseAnalyzer.java
        AnalyzerDriver.java
        TaskConcurrencyAnalyzer.java
        OneOnOneEdgeAnalyzer.java
        CSVResult.java
        test
        java
        org
        apache
        tez
        analyzer
        TestAnalyzer.java
      - pom.xml
      - findbugs-exclude.xml
    - pom.xml
  - pom.xml
  - tez-javadoc-tools
    - src
      - main
        java
        org
        apache
        tez
        tools
        javadoc
        util
        XmlWriter.java
        Writer.java
        HtmlWriter.java
        doclet
        ConfigStandardDoclet.java
        model
        Config.java
        ConfigProperty.java
    - pom.xml
    - findbugs-exclude.xml
  - tez-log-split
    - logsplit.py
    - README.md
    - tez-log-splitter.sh
  - counter-diff
    - counter-diff.py
    - README.md
  - swimlanes
    - amlogparser.py
    - swimlane.py
    - README.md
    - yarn-swimlanes.sh
- hadoop-shim-impls
  - hadoop-shim-2.7
    - src
      - main
        resources
        META-INF
        services
        org.apache.tez.hadoop.shim.HadoopShimProvider
        java
        org
        apache
        tez
        hadoop
        shim
        HadoopShim27.java
        HadoopShim25_26_27Provider.java
      - test
        java
        org
        apache
        tez
        hadoop
        shim
        TestHadoop25_26_27ShimProvider.java
    - pom.xml
    - findbugs-exclude.xml
  - pom.xml
  - hadoop-shim-2.8
    - src
      - main
        resources
        META-INF
        services
        org.apache.tez.hadoop.shim.HadoopShimProvider
        java
        org
        apache
        tez
        hadoop
        shim
        HadoopShim28Provider.java
        HadoopShim28.java
      - test
        java
        org
        apache
        tez
        hadoop
        shim
        TestHadoopShim28Provider.java
        TestHadoopShim28.java
    - pom.xml
    - findbugs-exclude.xml
  - findbugs-exclude.xml
- pom.xml
- tez-api
  - src
    - main
      - proto
        Events.proto
        DAGClientAMProtocol.proto
        DAGApiRecords.proto
      - resources
        tez-api-version-info.properties
        META-INF
        NOTICE.txt
        services
        org.apache.hadoop.security.SecurityInfo
        LICENSE.txt
      - javadoc
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        tez
        dag
        api
        TezReflectionException.java
        TezConfiguration.java
        VertexManagerPlugin.java
        HistoryLogLevel.java
        VertexManagerPluginContext.java
        InputDescriptor.java
        SessionNotReady.java
        client
        TimelineReaderFactory.java
        DAGClient.java
        DAGStatus.java
        VertexStatus.java
        DAGClientInternal.java
        StatusGetOpts.java
        DAGClientTimelineImpl.java
        rpc
        DAGClientAMProtocolBlockingPB.java
        package-info.java
        DAGClientRPCImpl.java
        DagStatusSource.java
        DAGClientImpl.java
        Progress.java
        TezConfigurationConstants.java
        DagTypeConverters.java
        Edge.java
        DataSinkDescriptor.java
        VertexGroup.java
        Vertex.java
        TezException.java
        InputInitializerDescriptor.java
        EdgeManagerPluginDescriptor.java
        NamedEntityDescriptor.java
        GroupInputEdge.java
        EdgeProperty.java
        Scope.java
        ConfigurationScope.java
        EdgeManagerPlugin.java
        VertexLocationHint.java
        OutputCommitterDescriptor.java
        DAGSubmissionTimedOut.java
        event
        VertexStateUpdateParallelismUpdated.java
        VertexStateUpdate.java
        VertexState.java
        EntityDescriptor.java
        TezConstants.java
        EdgeManagerPluginOnDemand.java
        DAG.java
        UserPayload.java
        DataSourceDescriptor.java
        ProcessorDescriptor.java
        TaskLocationHint.java
        OutputDescriptor.java
        PreWarmVertex.java
        EdgeManagerPluginContext.java
        TezUncheckedException.java
        DAGNotRunningException.java
        VertexManagerPluginDescriptor.java
        SessionNotRunning.java
        RootInputLeafOutput.java
        serviceplugins
        api
        ContainerEndReason.java
        TaskSchedulerContext.java
        TaskAttemptEndReason.java
        ContainerLauncherDescriptor.java
        TaskScheduler.java
        ContainerLauncherOperationBase.java
        ServicePluginContextBase.java
        TaskSchedulerDescriptor.java
        ContainerLauncherContext.java
        ContainerStopRequest.java
        ServicePluginErrorDefaults.java
        ContainerLauncher.java
        ServicePluginError.java
        TaskCommunicatorDescriptor.java
        ContainerLaunchRequest.java
        ServicePluginException.java
        DagInfo.java
        ServicePluginsDescriptor.java
        client
        AMConfiguration.java
        TezApiVersionInfo.java
        FrameworkClient.java
        TezYarnClient.java
        CallerContext.java
        TezAppMasterStatus.java
        TezClient.java
        TezClientUtils.java
        common
        security
        Master.java
        DAGAccessControls.java
        JobTokenIdentifier.java
        TokenCache.java
        HistoryACLPolicyException.java
        ACLConfigurationParser.java
        DAGClientSecurityInfo.java
        ACLManager.java
        JobTokenSecretManager.java
        ACLType.java
        HistoryACLPolicyManager.java
        TezYARNUtils.java
        Preconditions.java
        ATSConstants.java
        TezClassLoader.java
        JavaOptsChecker.java
        counters
        AggregateFrameworkCounter.java
        TezCounter.java
        AggregateTezCounter.java
        GenericCounter.java
        CounterGroupFactory.java
        AbstractCounters.java
        AggregateTezCounters.java
        CounterGroupBase.java
        CounterGroup.java
        FileSystemCounter.java
        JobCounter.java
        AbstractCounterGroup.java
        AbstractCounter.java
        AggregateTezCounterDelegate.java
        Limits.java
        FileSystemCounterGroup.java
        DAGCounter.java
        LimitExceededException.java
        FrameworkCounterGroup.java
        TezCounters.java
        TaskCounter.java
        ServicePluginLifecycle.java
        TezCommonUtils.java
        ReflectionUtils.java
        TezUtils.java
        VersionInfo.java
        annotation
        ConfigurationClass.java
        ConfigurationProperty.java
        GuavaShim.java
        ProgressHelper.java
        ContainerSignatureMatcher.java
        RPCUtil.java
        runtime
        api
        Reader.java
        LogicalIOProcessor.java
        MergedInputContext.java
        TaskFailureType.java
        LogicalInput.java
        VertexIdentifier.java
        Event.java
        Input.java
        ObjectRegistry.java
        OutputContext.java
        ProcessorContext.java
        Writer.java
        TaskIdentifier.java
        InputInitializer.java
        InputContext.java
        OutputStatistics.java
        LogicalIOProcessorFrameworkInterface.java
        OutputCommitter.java
        OutputStatisticsReporter.java
        ProcessorFrameworkInterface.java
        LogicalOutputFrameworkInterface.java
        AbstractLogicalIOProcessor.java
        InputSpecUpdate.java
        LogicalInputFrameworkInterface.java
        Processor.java
        Output.java
        AbstractLogicalInput.java
        InputInitializerContext.java
        DagIdentifier.java
        InputStatisticsReporter.java
        ExecutionContext.java
        OutputFrameworkInterface.java
        TaskAttemptIdentifier.java
        InputFrameworkInterface.java
        VertexStatistics.java
        InputStatistics.java
        AbstractLogicalOutput.java
        MemoryUpdateCallback.java
        MergedLogicalInput.java
        LogicalOutput.java
        ProgressFailedException.java
        OutputCommitterContext.java
        TaskContext.java
        events
        InputUpdatePayloadEvent.java
        InputConfigureVertexTasksEvent.java
        VertexManagerEvent.java
        CompositeDataMovementEvent.java
        InputFailedEvent.java
        InputInitializerEvent.java
        DataMovementEvent.java
        CustomProcessorEvent.java
        InputDataInformationEvent.java
        CompositeRoutedDataMovementEvent.java
        InputReadErrorEvent.java
    - test
      - resources
        tez-site.xml
        log4j.properties
        test3-version-info.properties
        META-INF
        NOTICE.txt
        LICENSE.txt
        test1-version-info.properties
        test2-version-info.properties
      - java
        org
        apache
        tez
        dag
        api
        TestDagTypeConverters.java
        TestEntityDescriptor.java
        client
        TestATSHttpClient.java
        rpc
        TestDAGClient.java
        TestTimelineReaderFactory.java
        TestDAG.java
        TestHistoryLogLevel.java
        TestTaskLocationHint.java
        TestDAGVerify.java
        TestDAGPlan.java
        TestTezConfiguration.java
        client
        TestTezClientUtils.java
        TestTezClient.java
        common
        security
        TestACLManager.java
        TestACLConfigurationParser.java
        TestTokenCache.java
        TestDAGAccessControls.java
        TestTezCommonUtils.java
        TestTezYARNUtils.java
        TestJavaOptsChecker.java
        TestVersionInfo.java
        TestRPCUtil.java
        TestReflectionUtils.java
        runtime
        api
        event
        TestCompositeDataMovementEvent.java
  - pom.xml
  - findbugs-exclude.xml
- BUILDING.txt
- build-tools
  - test-patch.sh
  - docker
    - Dockerfile
    - tez_env_checks.sh
  - install-protobuf.sh
  - smart-apply-patch.sh
- tez-common
  - src
    - main
      - resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - javadoc
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        tez
        dag
        utils
        package-info.java
        RelocalizationUtils.java
        history
        logging
        EntityTypes.java
        records
        TezTaskID.java
        TaskIdentifierImpl.java
        TaskAttemptIdentifierImpl.java
        DagIdentifierImpl.java
        TezDAGID.java
        TezTaskAttemptID.java
        TezVertexID.java
        package-info.java
        TaskAttemptTerminationCause.java
        VertexIdentifierImpl.java
        TezID.java
        common
        TezAbstractEvent.java
        TezExecutors.java
        Preconditions.java
        AsyncDispatcher.java
        DagContainerLauncher.java
        AsyncDispatcherConcurrent.java
        TezUtilsInternal.java
        TezContainerLogAppender.java
        package-info.java
        CallableWithNdc.java
        io
        NonSyncDataOutputStream.java
        NonSyncByteArrayOutputStream.java
        NonSyncByteArrayInputStream.java
        EnvironmentUpdateUtils.java
        GcTimeUpdater.java
        RunnableWithNdc.java
        TezLog4jConfigurator.java
        TezSharedExecutor.java
        util
        TezMxBeanResourceCalculator.java
        StopWatch.java
        FastNumberFormat.java
        runtime
        common
        resources
        InitialMemoryRequestContext.java
        package-info.java
        InitialMemoryAllocator.java
    - test
      - resources
        log4j.properties
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        tez
        dag
        records
        TestTezIds.java
        common
        DrainDispatcher.java
        MockDNSToSwitchMapping.java
        TestTezSharedExecutor.java
        TestAsyncDispatcherConcurrent.java
        TestAsyncDispatcher.java
        TestTezUtils.java
        TestEnvironmentUpdateUtils.java
        util
        TestStopWatch.java
        TestNumberFormat.java
        TestTezMxBeanResourceCalculator.java
  - pom.xml
  - findbugs-exclude.xml
- tez-ui
  - src
    - main
      - resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - webapp
        .ember-cli
        bower.json
        bower-shrinkwrap.json
        public
        assets
        images
        yarn.lock
        ember-cli-build.js
        testem.json
        .editorconfig
        .jshintrc
        config
        environment.js
        default-app-conf.js
        build-info.js
        configs.env
        blueprints
        entity
        files
        app
        entities
        __name__.js
        index.js
        entity-test
        files
        tests
        unit
        entities
        __name__-test.js
        index.js
        .jshintrc
        .bowerrc
        WEB-INF
        wro.xml
        web.xml
        README.md
        package.json
        tests
        integration
        components
        home-table-controls-test.js
        em-table-tasks-log-link-cell-test.js
        em-swimlane-process-name-test.js
        pagination-ui-test.js
        em-swimlane-consolidated-process-test.js
        em-swimlane-test.js
        error-bar-test.js
        em-tooltip-test.js
        date-formatter-test.js
        em-swimlane-process-line-test.js
        em-swimlane-ruler-test.js
        query-timeline-test.js
        tab-n-refresh-test.js
        dags-page-search-test.js
        em-table-status-cell-test.js
        queries-page-search-test.js
        zip-download-modal-test.js
        em-swimlane-event-bar-test.js
        stats-link-test.js
        table-controls-test.js
        em-swimlane-event-test.js
        em-swimlane-blocking-event-test.js
        em-swimlane-vertex-name-test.js
        column-selector-test.js
        em-swimlane-process-visual-test.js
        caller-info-test.js
        helpers
        resolver.js
        start-app.js
        destroy-app.js
        module-for-acceptance.js
        test-helper.js
        .jshintrc
        index.html
        unit
        utils
        process-test.js
        virtual-anchor-test.js
        processor-test.js
        process-definition-test.js
        counter-column-definition-test.js
        download-dag-zip-test.js
        misc-test.js
        vertex-process-test.js
        services
        loader-test.js
        env-test.js
        pollster-test.js
        local-storage-test.js
        hosts-test.js
        initializers
        loader-test.js
        env-test.js
        local-storage-test.js
        jquery-test.js
        entities-test.js
        hosts-test.js
        models
        abstract-test.js
        ahs-app-test.js
        vertex-test.js
        dag-test.js
        attempt-test.js
        dag-am-test.js
        dag-info-test.js
        vertex-am-test.js
        am-test.js
        task-am-test.js
        app-rm-test.js
        hive-query-test.js
        timed-test.js
        app-test.js
        task-test.js
        timeline-test.js
        attempt-am-test.js
        am-timeline-test.js
        rm-test.js
        controllers
        abstract-test.js
        home
        queries-test.js
        index-test.js
        vertex-test.js
        dag-test.js
        dag
        index
        index-test.js
        vertices-test.js
        tasks-test.js
        counters-test.js
        attempts-test.js
        index-test.js
        swimlane-test.js
        graphical-test.js
        attempt-test.js
        task
        counters-test.js
        attempts-test.js
        index-test.js
        counters-table-test.js
        home-test.js
        attempt
        counters-test.js
        index-test.js
        query-test.js
        multi-table-test.js
        query
        index-test.js
        configs-test.js
        timeline-test.js
        app-test.js
        task-test.js
        parent-test.js
        page-test.js
        app
        dags-test.js
        index-test.js
        configs-test.js
        table-test.js
        vertex
        tasks-test.js
        counters-test.js
        attempts-test.js
        index-test.js
        configs-test.js
        application-test.js
        entities
        dag-test.js
        vertex-am-test.js
        am-test.js
        task-am-test.js
        entity-test.js
        attempt-am-test.js
        serializers
        loader-test.js
        ahs-app-test.js
        vertex-test.js
        dag-test.js
        attempt-test.js
        dag-am-test.js
        dag-info-test.js
        vertex-am-test.js
        am-test.js
        task-am-test.js
        app-rm-test.js
        hive-query-test.js
        app-test.js
        task-test.js
        timeline-test.js
        attempt-am-test.js
        rm-test.js
        routes
        abstract-test.js
        multi-am-pollster-test.js
        home
        queries-test.js
        index-test.js
        vertex-test.js
        dag-test.js
        dag
        index
        index-test.js
        vertices-test.js
        tasks-test.js
        counters-test.js
        attempts-test.js
        index-test.js
        swimlane-test.js
        graphical-test.js
        attempt-test.js
        task
        counters-test.js
        attempts-test.js
        index-test.js
        home-test.js
        attempt
        counters-test.js
        index-test.js
        am-pollster-test.js
        query-test.js
        query
        index-test.js
        configs-test.js
        timeline-test.js
        pollster-test.js
        app-test.js
        task-test.js
        app
        dags-test.js
        index-test.js
        configs-test.js
        single-am-pollster-test.js
        vertex
        tasks-test.js
        counters-test.js
        attempts-test.js
        index-test.js
        configs-test.js
        application-test.js
        server-side-ops-test.js
        mixins
        name-test.js
        auto-counter-column-test.js
        adapters
        abstract-test.js
        loader-test.js
        ahs-app-test.js
        vertex-test.js
        dag-test.js
        attempt-test.js
        dag-am-test.js
        dag-info-test.js
        vertex-am-test.js
        am-test.js
        task-am-test.js
        app-rm-test.js
        hive-query-test.js
        app-test.js
        task-test.js
        timeline-test.js
        attempt-am-test.js
        rm-test.js
        transforms
        object-test.js
        app
        utils
        vertex-process.js
        counter-column-definition.js
        misc.js
        virtual-anchor.js
        process.js
        processor.js
        download-dag-zip.js
        process-definition.js
        services
        env.js
        local-storage.js
        loader.js
        pollster.js
        hosts.js
        initializers
        jquery.js
        env.js
        local-storage.js
        loader.js
        hosts.js
        entities.js
        models
        task-am.js
        am-timeline.js
        abstract.js
        dag-info.js
        app-rm.js
        app.js
        hive-query.js
        vertex.js
        dag-am.js
        dag.js
        attempt.js
        rm.js
        am.js
        vertex-am.js
        timed.js
        task.js
        ahs-app.js
        timeline.js
        attempt-am.js
        templates
        home
        index.hbs
        queries.hbs
        dag
        index.hbs
        vertices.hbs
        tasks.hbs
        index
        index.hbs
        counters.hbs
        graphical.hbs
        attempts.hbs
        swimlane.hbs
        query.hbs
        application.hbs
        task
        index.hbs
        counters.hbs
        attempts.hbs
        attempt
        index.hbs
        counters.hbs
        components
        em-table-status-cell.hbs
        table-controls.hbs
        em-swimlane-event.hbs
        em-swimlane-process-visual.hbs
        query-timeline.hbs
        column-selector.hbs
        em-swimlane-ruler.hbs
        queries-page-search.hbs
        em-swimlane-vertex-name.hbs
        em-tooltip.hbs
        error-bar.hbs
        em-table-tasks-log-link-cell.hbs
        em-swimlane-event-bar.hbs
        zip-download-modal.hbs
        em-swimlane-consolidated-process.hbs
        em-swimlane.hbs
        dags-page-search.hbs
        em-swimlane-process-name.hbs
        tab-n-refresh.hbs
        date-formatter.hbs
        caller-info.hbs
        em-swimlane-blocking-event.hbs
        pagination-ui.hbs
        home-table-controls.hbs
        stats-link.hbs
        em-swimlane-process-line.hbs
        query
        index.hbs
        configs.hbs
        timeline.hbs
        home.hbs
        vertex.hbs
        attempt.hbs
        task.hbs
        app
        index.hbs
        configs.hbs
        dags.hbs
        app.hbs
        vertex
        index.hbs
        tasks.hbs
        counters.hbs
        configs.hbs
        attempts.hbs
        dag.hbs
        loading.hbs
        simple-modal.hbs
        components
        table-controls.js
        zip-download-modal.js
        em-swimlane-ruler.js
        stats-link.js
        em-swimlane.js
        em-swimlane-consolidated-process.js
        caller-info.js
        em-tooltip.js
        em-table-status-cell.js
        pagination-ui.js
        dags-page-search.js
        column-selector.js
        em-swimlane-event-bar.js
        em-swimlane-process-name.js
        home-table-controls.js
        em-table-tasks-log-link-cell.js
        tab-n-refresh.js
        em-swimlane-vertex-name.js
        em-swimlane-process-line.js
        em-swimlane-event.js
        em-swimlane-blocking-event.js
        date-formatter.js
        em-swimlane-process-visual.js
        query-timeline.js
        queries-page-search.js
        error-bar.js
        app.js
        controllers
        home
        queries.js
        index.js
        query.js
        dag
        index
        index.js
        attempts.js
        vertices.js
        graphical.js
        tasks.js
        counters.js
        index.js
        swimlane.js
        page.js
        task
        attempts.js
        counters.js
        index.js
        counters-table.js
        home.js
        attempt
        counters.js
        index.js
        abstract.js
        app.js
        table.js
        query
        configs.js
        timeline.js
        index.js
        multi-table.js
        vertex.js
        parent.js
        application.js
        dag.js
        attempt.js
        task.js
        app
        dags.js
        configs.js
        index.js
        vertex
        attempts.js
        configs.js
        tasks.js
        counters.js
        index.js
        router.js
        styles
        caller-info.less
        details-page.less
        dags-page-search.less
        app.less
        shared.less
        em-swimlane.less
        page-layout.less
        query-timeline.less
        table-controls.less
        vertex-configs-page.less
        queries-page-search.less
        em-table-status-cell.less
        swimlane-page.less
        zip-download-modal.less
        column-selector.less
        em-tooltip.less
        colors.less
        date-formatter.less
        em-swimlane-vertex-name.less
        tab-n-refresh.less
        tooltip.less
        home-table-controls.less
        error-bar.less
        index.html
        entities
        task-am.js
        dag.js
        am.js
        vertex-am.js
        entity.js
        attempt-am.js
        errors
        unlinked-promise.js
        serializers
        task-am.js
        dag-info.js
        app-rm.js
        app.js
        hive-query.js
        vertex.js
        dag-am.js
        loader.js
        dag.js
        attempt.js
        rm.js
        am.js
        vertex-am.js
        task.js
        ahs-app.js
        timeline.js
        attempt-am.js
        routes
        home
        queries.js
        index.js
        query.js
        dag
        index
        index.js
        attempts.js
        vertices.js
        graphical.js
        tasks.js
        counters.js
        index.js
        swimlane.js
        task
        attempts.js
        counters.js
        index.js
        home.js
        attempt
        counters.js
        index.js
        abstract.js
        multi-am-pollster.js
        app.js
        query
        configs.js
        timeline.js
        index.js
        vertex.js
        application.js
        dag.js
        attempt.js
        single-am-pollster.js
        am-pollster.js
        server-side-ops.js
        pollster.js
        task.js
        app
        dags.js
        configs.js
        index.js
        vertex
        attempts.js
        configs.js
        tasks.js
        counters.js
        index.js
        mixins
        name.js
        auto-counter-column.js
        adapters
        task-am.js
        abstract.js
        dag-info.js
        app-rm.js
        app.js
        hive-query.js
        vertex.js
        dag-am.js
        loader.js
        dag.js
        attempt.js
        rm.js
        am.js
        vertex-am.js
        task.js
        ahs-app.js
        timeline.js
        attempt-am.js
        transforms
        object.js
        .watchmanconfig
        .gitignore
  - pom.xml
  - README.md
  - findbugs-exclude.xml
- Tez_DOAP.rdf
- tez-ext-service-tests
  - src
    - test
      - proto
        TezDaemonProtocol.proto
      - resources
        log4j.properties
      - java
        org
        apache
        tez
        dag
        app
        TezTestServiceCommunicator.java
        taskcomm
        TezTestServiceTaskCommunicatorImpl.java
        TezTestServiceTaskCommunicatorWithErrors.java
        rm
        TezTestServiceTaskSchedulerServiceWithErrors.java
        TezTestServiceTaskSchedulerService.java
        ErrorPluginConfiguration.java
        launcher
        TezTestServiceContainerLauncherWithErrors.java
        TezTestServiceContainerLauncher.java
        TezTestServiceNoOpContainerLauncher.java
        shufflehandler
        IndexCache.java
        ShuffleHandler.java
        examples
        JoinValidateConfigured.java
        util
        ProtoConverters.java
        service
        impl
        TezTestServiceProtocolServerImpl.java
        TezTestServiceProtocolClientImpl.java
        TezTestService.java
        ContainerRunnerImpl.java
        TezTestServiceConfConstants.java
        MiniTezTestServiceCluster.java
        ContainerRunner.java
        TezTestServiceProtocolBlockingPB.java
        tests
        TestExtServicesWithLocalMode.java
        TestExternalTezServices.java
        ExternalTezServiceTestHelper.java
        TestExternalTezServicesErrors.java
  - pom.xml
  - findbugs-exclude.xml
- .travis.yml
- README.md
- KEYS
- tez-runtime-library
  - src
    - main
      - proto
        FairShufflePayloads.proto
        ShufflePayloads.proto
        CartesianProductPayload.proto
      - resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - javadoc
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        hadoop
        io
        FileChunk.java
        tez
        dag
        library
        vertexmanager
        VertexManagerWithConcurrentInput.java
        FairShuffleEdgeManager.java
        DestinationTaskInputsProperty.java
        FairShuffleVertexManager.java
        ShuffleVertexManager.java
        FairEdgeConfiguration.java
        ShuffleVertexManagerBase.java
        InputReadyVertexManager.java
        edgemanager
        SilentEdgeManager.java
        common
        TezRuntimeFrameworkConfigs.java
        runtime
        library
        utils
        LocalProgress.java
        BufferUtils.java
        DATA_RANGE_IN_MB.java
        FastByteComparisons.java
        Grouper.java
        resources
        WeightedScalingMemoryDistributor.java
        processor
        SleepProcessor.java
        PreWarmProcessor.java
        SimpleProcessor.java
        hadoop
        compat
        NullProgressable.java
        output
        package-info.java
        UnorderedKVOutput.java
        OrderedPartitionedKVOutput.java
        UnorderedPartitionedKVOutput.java
        api
        KeyValueWriter.java
        TezRuntimeConfiguration.java
        KeyValuesReader.java
        KeyValueWriterWithBasePath.java
        IOInterruptedException.java
        KeyValuesWriter.java
        KeyValueReader.java
        Partitioner.java
        common
        security
        SecureShuffleUtils.java
        task
        local
        output
        TezTaskOutput.java
        package-info.java
        TezTaskOutputFiles.java
        ConfigUtils.java
        ValuesIterator.java
        TezRuntimeUtils.java
        combine
        Combiner.java
        InputAttemptIdentifier.java
        sort
        impl
        TezSpillRecord.java
        TezRawKeyValueIterator.java
        dflt
        package-info.java
        DefaultSorter.java
        PipelinedSorter.java
        IFileOutputStream.java
        ExternalSorter.java
        package-info.java
        TezIndexRecord.java
        IFile.java
        TezMerger.java
        IFileInputStream.java
        InputIdentifier.java
        Constants.java
        comparator
        ProxyComparator.java
        TezBytesComparator.java
        writers
        BaseUnorderedPartitionedKVWriter.java
        package-info.java
        UnorderedPartitionedKVWriter.java
        CompositeInputAttemptIdentifier.java
        readers
        UnorderedKVReader.java
        MemoryUpdateCallbackHandler.java
        shuffle
        impl
        SimpleFetchedInputAllocator.java
        ShuffleManager.java
        package-info.java
        ShuffleInputEventHandlerImpl.java
        InputHost.java
        FetchedInputAllocator.java
        DiskFetchedInput.java
        FetcherCallback.java
        FetchResult.java
        ShuffleEventHandler.java
        orderedgrouped
        Shuffle.java
        InMemoryReader.java
        MapHost.java
        ShuffleScheduler.java
        ShuffleHeader.java
        InMemoryWriter.java
        package-info.java
        ShuffleInputEventHandlerOrderedGrouped.java
        FetchedInputAllocatorOrderedGrouped.java
        FetcherOrderedGrouped.java
        ExceptionReporter.java
        MergeManager.java
        MergeThread.java
        MapOutput.java
        ShuffleUtils.java
        HostPort.java
        Fetcher.java
        MemoryFetchedInput.java
        FetchedInput.java
        package-info.java
        LocalDiskFetchedInput.java
        FetchedInputCallback.java
        serializer
        TezBytesWritableSerialization.java
        cartesianproduct
        CartesianProductEdgeManagerReal.java
        CartesianProductFilter.java
        CartesianProductVertexManagerReal.java
        CartesianProductEdgeManagerPartitioned.java
        CartesianProductEdgeManager.java
        CartesianProductCombination.java
        FairCartesianProductEdgeManager.java
        FairCartesianProductVertexManager.java
        CartesianProductVertexManager.java
        CartesianProductConfig.java
        CartesianProductVertexManagerPartitioned.java
        CartesianProductFilterDescriptor.java
        partitioner
        RoundRobinPartitioner.java
        HashPartitioner.java
        exceptions
        FetcherReadTimeoutException.java
        InputAlreadyClosedException.java
        input
        ConcatenatedMergedKeyValuesInput.java
        OrderedGroupedKVInput.java
        package-info.java
        OrderedGroupedInputLegacy.java
        OrderedGroupedMergedKVInput.java
        ConcatenatedMergedKeyValueInput.java
        UnorderedKVInput.java
        conf
        UnorderedKVEdgeConfig.java
        UnorderedPartitionedKVEdgeConfig.java
        UnorderedPartitionedKVOutputConfig.java
        Utils.java
        UnorderedKVOutputConfig.java
        OrderedGroupedKVInputConfig.java
        package-info.java
        OrderedPartitionedKVOutputConfig.java
        BaseConfigBuilder.java
        OrderedPartitionedKVEdgeConfig.java
        HadoopKeyValuesBasedBaseEdgeConfig.java
        UnorderedKVInputConfig.java
        http
        BaseHttpConnection.java
        HttpConnectionParams.java
        SSLFactory.java
        HttpConnection.java
        async
        netty
        TezBodyDeferringAsyncHandler.java
        AsyncHttpConnection.java
    - test
      - resources
        tez-site.xml
        log4j.properties
        TestIFile_concatenated_compressed.bin
        META-INF
        NOTICE.txt
        LICENSE.txt
      - java
        org
        apache
        tez
        dag
        library
        vertexmanager
        TestShuffleVertexManagerUtils.java
        TestVertexManagerWithConcurrentInput.java
        TestInputReadyVertexManager.java
        TestShuffleVertexManagerBase.java
        TestFairShuffleVertexManager.java
        TestShuffleVertexManager.java
        runtime
        library
        testutils
        RandomTextGenerator.java
        KVDataGen.java
        output
        OutputTestHelpers.java
        TestOnFileUnorderedKVOutput.java
        TestUnorderedPartitionedKVOutput2.java
        TestOnFileSortedOutput.java
        TestOrderedPartitionedKVOutput2.java
        TestUnorderedKVOutput2.java
        api
        TestTezRuntimeConfiguration.java
        common
        TestValuesIterator.java
        sort
        impl
        dflt
        TestDefaultSorter.java
        TestTezMerger.java
        TestIFile.java
        TestPipelinedSorter.java
        comparator
        TestProxyComparator.java
        writers
        TestUnorderedPartitionedKVWriter.java
        readers
        TestUnorderedKVReader.java
        shuffle
        impl
        TestSimpleFetchedInputAllocator.java
        TestShuffleManager.java
        TestShuffleInputEventHandlerImpl.java
        TestShuffleUtils.java
        orderedgrouped
        TestShuffleScheduler.java
        TestMergeManager.java
        TestShuffleInputEventHandlerOrderedGrouped.java
        TestFetcher.java
        TestShuffle.java
        TestFetcher.java
        TestInputIdentifiers.java
        cartesianproduct
        TestGrouper.java
        TestFairCartesianProductEdgeManager.java
        TestFairCartesianProductVertexManager.java
        TestCartesianProductCombination.java
        TestCartesianProductVertexManager.java
        TestCartesianProductConfig.java
        TestCartesianProductEdgeManagerPartitioned.java
        TestCartesianProductVertexManagerPartitioned.java
        TestCartesianProductEdgeManager.java
        input
        TestOrderedGroupedKVInput.java
        TestSortedGroupedMergedInput.java
        conf
        TestOrderedPartitionedKVOutputConfig.java
        TestUnorderedPartitionedKVEdgeConfig.java
        TestUnorderedPartitionedKVOutputConfig.java
        TestUnorderedKVEdgeConfig.java
        TestOrderedGroupedMergedKVInputConfig.java
        TestOrderedPartitionedKVEdgeConfig.java
        TestUnorderedKVOutputConfig.java
        TestUnorderedKVInputConfig.java
        common
        resources
        TestWeightedScalingMemoryDistributor.java
        http
        TestHttpConnection.java
  - pom.xml
  - findbugs-exclude.xml
- .gitignore
- docs
  - src
    - site
      - resources
        images
        pmc
        tez.rdf
      - markdown
        shuffle-handler.md
        tez-ui.md
        tez_yarn_timeline.md
        install.md
        index.md
        user_guides.md
        by-laws.md
        localmode.md
        releases
        apache-tez-0-6-2.md
        apache-tez-0-8-0-alpha.md
        apache-tez-0-6-0.md
        apache-tez-0-8-1-alpha.md
        index.md
        apache-tez-0-8-4.md
        apache-tez-0-5-4.md
        apache-tez-0-8-2.md
        apache-tez-0-7-1.md
        apache-tez-0-5-2.md
        apache-tez-0-7-0.md
        apache-tez-0-8-5.md
        apache-tez-0-6-1.md
        apache-tez-0-5-0.md
        apache-tez-0-9-2.md
        apache-tez-0-9-0.md
        apache-tez-0-8-3.md
        apache-tez-0-5-1.md
        apache-tez-0-9-1.md
        apache-tez-0-5-3.md
        tez_acls.md
        tez_ui_user_data.md
        install_pre_0_5_0.md
        talks.md
        privacy-policy.md
      - site.xml
      - custom
        project-info-report.properties
  - pom.xml
- INSTALL.md
- LICENSE.txt
- tez-dist
  - src
    - main
      - javadoc
        resources
        META-INF
        NOTICE.txt
        LICENSE.txt
      - assembly
        tez-dist-minimal.xml
        tez-dist.xml
  - pom.xml
  - dist-files
    - minimal
      - LICENSE-CDDLv1.1-GPLv2_withCPE
      - LICENSE
      - LICENSE-SIL_OpenFontLicense-v1.1
      - LICENSE-BSD-3clause
      - NOTICE
      - LICENSE-MIT
    - full
      - LICENSE-CDDLv1.1-GPLv2_withCPE
      - LICENSE
      - LICENSE-SIL_OpenFontLicense-v1.1
      - LICENSE-BSD-3clause
      - NOTICE
      - LICENSE-MIT
      - LICENSE-CDDLv1.0

/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.tez.runtime.library.common.sort.impl;

import java.io.IOException;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collections;
import java.util.Comparator;
import java.util.List;

import com.google.common.annotations.VisibleForTesting;

import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.apache.hadoop.classification.InterfaceAudience;
import org.apache.hadoop.classification.InterfaceStability;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.ChecksumFileSystem;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.LocalDirAllocator;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.DataInputBuffer;
import org.apache.hadoop.io.DataOutputBuffer;
import org.apache.hadoop.io.RawComparator;
import org.apache.hadoop.io.compress.CompressionCodec;
import org.apache.hadoop.util.PriorityQueue;
import org.apache.hadoop.util.Progress;
import org.apache.hadoop.util.Progressable;
import org.apache.tez.common.TezRuntimeFrameworkConfigs;
import org.apache.tez.common.counters.TezCounter;
import org.apache.tez.runtime.library.api.TezRuntimeConfiguration;
import org.apache.tez.runtime.library.common.Constants;
import org.apache.tez.runtime.library.common.sort.impl.IFile.Reader;
import org.apache.tez.runtime.library.common.sort.impl.IFile.Reader.KeyState;
import org.apache.tez.runtime.library.common.sort.impl.IFile.Writer;
import org.apache.tez.runtime.library.utils.BufferUtils;
import org.apache.tez.runtime.library.utils.LocalProgress;

/**
 * Merger is an utility class used by the Map and Reduce tasks for merging
 * both their memory and disk segments
 */
@InterfaceAudience.Private
@InterfaceStability.Unstable
@SuppressWarnings({"unchecked", "rawtypes"})
public class TezMerger {
  private static final Logger LOG = LoggerFactory.getLogger(TezMerger.class);

  
  // Local directories
  private static LocalDirAllocator lDirAlloc = 
    new LocalDirAllocator(TezRuntimeFrameworkConfigs.LOCAL_DIRS);

  public static
  TezRawKeyValueIterator merge(Configuration conf, FileSystem fs,
                            Class keyClass, Class valueClass, 
                            CompressionCodec codec, boolean ifileReadAhead,
                            int ifileReadAheadLength, int ifileBufferSize,
                            Path[] inputs, boolean deleteInputs, 
                            int mergeFactor, Path tmpDir,
                            RawComparator comparator, Progressable reporter,
                            TezCounter readsCounter,
                            TezCounter writesCounter,
                            TezCounter bytesReadCounter,
                            Progress mergePhase)
      throws IOException, InterruptedException {
    return 
      new MergeQueue(conf, fs, inputs, deleteInputs, codec, ifileReadAhead,
                           ifileReadAheadLength, ifileBufferSize, false, comparator, 
                           reporter, null).merge(keyClass, valueClass,
                                           mergeFactor, tmpDir,
                                           readsCounter, writesCounter,
                                           bytesReadCounter,
                                           mergePhase);
  }

  // Used by the in-memory merger.
  public static
  TezRawKeyValueIterator merge(Configuration conf, FileSystem fs, 
                            Class keyClass, Class valueClass, 
                            List<Segment> segments, 
                            int mergeFactor, Path tmpDir,
                            RawComparator comparator, Progressable reporter,
                            TezCounter readsCounter,
                            TezCounter writesCounter,
                            TezCounter bytesReadCounter,
                            Progress mergePhase)
      throws IOException, InterruptedException {
    // Get rid of this ?
    return merge(conf, fs, keyClass, valueClass, segments, mergeFactor, tmpDir,
                 comparator, reporter, false, readsCounter, writesCounter, bytesReadCounter,
                 mergePhase);
  }

  public static <K extends Object, V extends Object>
  TezRawKeyValueIterator merge(Configuration conf, FileSystem fs,
                            Class keyClass, Class valueClass,
                            List<Segment> segments,
                            int mergeFactor, Path tmpDir,
                            RawComparator comparator, Progressable reporter,
                            boolean sortSegments,
                            TezCounter readsCounter,
                            TezCounter writesCounter,
                            TezCounter bytesReadCounter,
                            Progress mergePhase)
      throws IOException, InterruptedException {
    return new MergeQueue(conf, fs, segments, comparator, reporter,
                           sortSegments, false).merge(keyClass, valueClass,
                                               mergeFactor, tmpDir,
                                               readsCounter, writesCounter,
                                               bytesReadCounter, mergePhase);
  }

  public static <K extends Object, V extends Object>
  TezRawKeyValueIterator merge(Configuration conf, FileSystem fs,
      Class keyClass, Class valueClass,
      CompressionCodec codec,
      List<Segment> segments,
      int mergeFactor, Path tmpDir,
      RawComparator comparator, Progressable reporter,
      boolean sortSegments,
      boolean considerFinalMergeForProgress,
      TezCounter readsCounter,
      TezCounter writesCounter,
      TezCounter bytesReadCounter,
      Progress mergePhase, boolean checkForSameKeys)
      throws IOException, InterruptedException {
    return new MergeQueue(conf, fs, segments, comparator, reporter,
        sortSegments, codec, considerFinalMergeForProgress, checkForSameKeys).
        merge(keyClass, valueClass,
            mergeFactor, tmpDir,
            readsCounter, writesCounter,
            bytesReadCounter,
            mergePhase);
  }

  public static <K extends Object, V extends Object>
  TezRawKeyValueIterator merge(Configuration conf, FileSystem fs,
                            Class keyClass, Class valueClass,
                            CompressionCodec codec,
                            List<Segment> segments,
                            int mergeFactor, Path tmpDir,
                            RawComparator comparator, Progressable reporter,
                            boolean sortSegments,
                            boolean considerFinalMergeForProgress,
                            TezCounter readsCounter,
                            TezCounter writesCounter,
                            TezCounter bytesReadCounter,
                            Progress mergePhase)
      throws IOException, InterruptedException {
    return new MergeQueue(conf, fs, segments, comparator, reporter,
                           sortSegments, codec, considerFinalMergeForProgress).
                                         merge(keyClass, valueClass,
                                             mergeFactor, tmpDir,
                                             readsCounter, writesCounter,
                                             bytesReadCounter,
                                             mergePhase);
  }

  public static <K extends Object, V extends Object>
  TezRawKeyValueIterator merge(Configuration conf, FileSystem fs,
                          Class keyClass, Class valueClass,
                          CompressionCodec codec,
                          List<Segment> segments,
                          int mergeFactor, int inMemSegments, Path tmpDir,
                          RawComparator comparator, Progressable reporter,
                          boolean sortSegments,
                          TezCounter readsCounter,
                          TezCounter writesCounter,
                          TezCounter bytesReadCounter,
                          Progress mergePhase)
      throws IOException, InterruptedException {
  return new MergeQueue(conf, fs, segments, comparator, reporter,
                         sortSegments, codec, false).merge(keyClass, valueClass,
                                             mergeFactor, inMemSegments,
                                             tmpDir,
                                             readsCounter, writesCounter,
                                             bytesReadCounter,
                                             mergePhase);
}

  public static <K extends Object, V extends Object>
  void writeFile(TezRawKeyValueIterator records, Writer writer,
      Progressable progressable, long recordsBeforeProgress)
      throws IOException, InterruptedException {
    long recordCtr = 0;
    long count = 0;
    while(records.next()) {
      if (records.isSameKey()) {
        writer.append(IFile.REPEAT_KEY, records.getValue());
        count++;
      } else {
        writer.append(records.getKey(), records.getValue());
      }
      
      if (((recordCtr++) % recordsBeforeProgress) == 0) {
        progressable.progress();
        if (Thread.currentThread().isInterrupted()) {
          /**
           * Takes care DefaultSorter.mergeParts, MergeManager's merger threads,
           * PipelinedSorter's flush(). This is not expensive check as it is carried out every
           * 10000 records or so.
           */
          throw new InterruptedException("Current thread=" + Thread.currentThread().getName() + " got "
              + "interrupted");
        }
      }
    }
    if ((count > 0) && LOG.isTraceEnabled()) {
      LOG.trace("writeFile SAME_KEY count=" + count);
    }
  }

  @InterfaceAudience.Private
  @InterfaceStability.Unstable
  static class KeyValueBuffer {
    private byte[] buf;
    private int position;
    private int length;

    public KeyValueBuffer(byte buf[], int position, int length) {
      reset(buf, position, length);
    }

    public void reset(byte[] input, int position, int length) {
      this.buf = input;
      this.position = position;
      this.length = length;
    }

    public byte[] getData() {
      return buf;
    }

    public int getPosition() {
      return position;
    }

    public int getLength() {
      return length;
    }
  }

  @InterfaceAudience.Private
  @InterfaceStability.Unstable
  public static class Segment {
    static final byte[] EMPTY_BYTES = new byte[0];
    Reader reader = null;
    final KeyValueBuffer key = new KeyValueBuffer(EMPTY_BYTES, 0, 0);
    TezCounter mapOutputsCounter = null;

    public Segment(Reader reader, TezCounter mapOutputsCounter) {
      this.reader = reader;
      this.mapOutputsCounter = mapOutputsCounter;
    }

    void init(TezCounter readsCounter, TezCounter bytesReadCounter) throws IOException {
      if (mapOutputsCounter != null) {
        mapOutputsCounter.increment(1);
      }
    }

    boolean inMemory() {
      return true;
    }

    KeyValueBuffer getKey() { return key; }

    DataInputBuffer getValue(DataInputBuffer value) throws IOException {
      nextRawValue(value);
      return value;
    }

    public long getLength() {
      return reader.getLength();
    }

    KeyState readRawKey(DataInputBuffer nextKey) throws IOException {
      KeyState keyState = reader.readRawKey(nextKey);
      key.reset(nextKey.getData(), nextKey.getPosition(), nextKey.getLength() - nextKey.getPosition());
      return keyState;
    }

    boolean nextRawKey(DataInputBuffer nextKey) throws IOException {
      boolean hasNext = reader.nextRawKey(nextKey);
      key.reset(nextKey.getData(), nextKey.getPosition(), nextKey.getLength() - nextKey.getPosition());
      return hasNext;
    }

    void nextRawValue(DataInputBuffer value) throws IOException {
      reader.nextRawValue(value);
    }

    void closeReader() throws IOException {
      if (reader != null) {
        reader.close();
        reader = null;
      }
    }

    void close() throws IOException {
      closeReader();
    }

    public long getPosition() throws IOException {
      return reader.getPosition();
    }

    // This method is used by BackupStore to extract the
    // absolute position after a reset
    long getActualPosition() throws IOException {
      return reader.getPosition();
    }

    Reader getReader() {
      return reader;
    }

    // This method is used by BackupStore to reinitialize the
    // reader to start reading from a different segment offset
    void reinitReader(int offset) throws IOException {
    }
  }

  @InterfaceAudience.Private
  @InterfaceStability.Unstable
  public static class DiskSegment extends Segment {

    FileSystem fs = null;
    Path file = null;
    boolean preserve = false; // Signifies whether the segment should be kept after a merge is complete. Checked in the close method.
    CompressionCodec codec = null;
    long segmentOffset = 0;
    long segmentLength = -1;
    boolean ifileReadAhead;
    int ifileReadAheadLength;
    int bufferSize = -1;

    public DiskSegment(FileSystem fs, Path file,
        CompressionCodec codec, boolean ifileReadAhead,
        int ifileReadAheadLength, int bufferSize, boolean preserve)
    throws IOException {
      this(fs, file, codec, ifileReadAhead, ifileReadAheadLength,
          bufferSize, preserve, null);
    }

    public DiskSegment(FileSystem fs, Path file,
                   CompressionCodec codec, boolean ifileReadAhead, int ifileReadAheadLenth,
                   int bufferSize, boolean preserve, TezCounter mergedMapOutputsCounter)
  throws IOException {
      this(fs, file, 0, fs.getFileStatus(file).getLen(), codec,
          ifileReadAhead, ifileReadAheadLenth, bufferSize, preserve,
          mergedMapOutputsCounter);
    }

    public DiskSegment(FileSystem fs, Path file,
                   long segmentOffset, long segmentLength,
                   CompressionCodec codec, boolean ifileReadAhead,
                   int ifileReadAheadLength,  int bufferSize, 
                   boolean preserve) throws IOException {
      this(fs, file, segmentOffset, segmentLength, codec, ifileReadAhead,
          ifileReadAheadLength, bufferSize, preserve, null);
    }

    public DiskSegment(FileSystem fs, Path file,
        long segmentOffset, long segmentLength, CompressionCodec codec,
        boolean ifileReadAhead, int ifileReadAheadLength, int bufferSize,
        boolean preserve, TezCounter mergedMapOutputsCounter)
    throws IOException {
      super(null, mergedMapOutputsCounter);
      this.fs = fs;
      this.file = file;
      this.codec = codec;
      this.preserve = preserve;
      this.ifileReadAhead = ifileReadAhead;
      this.ifileReadAheadLength =ifileReadAheadLength;
      this.bufferSize = bufferSize;

      this.segmentOffset = segmentOffset;
      this.segmentLength = segmentLength;
    }

    @Override
    void init(TezCounter readsCounter, TezCounter bytesReadCounter) throws IOException {
      super.init(readsCounter, bytesReadCounter);
      FSDataInputStream in = fs.open(file);
      in.seek(segmentOffset);
      reader = new Reader(in, segmentLength, codec, readsCounter, bytesReadCounter, ifileReadAhead,
          ifileReadAheadLength, bufferSize);
    }

    @Override
    boolean inMemory() {
      return false;
    }

    @Override
    public long getLength() {
      return (reader == null) ?
        segmentLength : reader.getLength();
    }

    @Override
    void close() throws IOException {
      super.close();
      if (!preserve && fs != null) {
        fs.delete(file, false);
      }
    }
    // This method is used by BackupStore to extract the
    // absolute position after a reset
    @Override
    long getActualPosition() throws IOException {
      return segmentOffset + reader.getPosition();
    }

    // This method is used by BackupStore to reinitialize the
    // reader to start reading from a different segment offset
    @Override
    void reinitReader(int offset) throws IOException {
      if (!inMemory()) {
        closeReader();
        segmentOffset = offset;
        segmentLength = fs.getFileStatus(file).getLen() - segmentOffset;
        init(null, null);
      }
    }
  }

  @VisibleForTesting
  static class MergeQueue<K extends Object, V extends Object>
  extends PriorityQueue<Segment> implements TezRawKeyValueIterator {
    final Configuration conf;
    final FileSystem fs;
    final CompressionCodec codec;
    final boolean checkForSameKeys;
    static final boolean ifileReadAhead = TezRuntimeConfiguration.TEZ_RUNTIME_IFILE_READAHEAD_DEFAULT;
    static final int ifileReadAheadLength = TezRuntimeConfiguration.TEZ_RUNTIME_IFILE_READAHEAD_BYTES_DEFAULT;
    static final int ifileBufferSize = TezRuntimeConfiguration.TEZ_RUNTIME_IFILE_BUFFER_SIZE_DEFAULT;
    static final long recordsBeforeProgress = TezRuntimeConfiguration.TEZ_RUNTIME_RECORDS_BEFORE_PROGRESS_DEFAULT;
    
    List<Segment> segments = new ArrayList<Segment>();
    
    final RawComparator comparator;

    private long totalBytesProcessed;
    private float progPerByte;
    private Progress mergeProgress = new LocalProgress();
    // Boolean variable for including/considering final merge as part of sort
    // phase or not. This is true in map task, false in reduce task. It is
    // used in calculating mergeProgress.
    private final boolean considerFinalMergeForProgress;

    final Progressable reporter;
    
    final DataInputBuffer key = new DataInputBuffer();
    final DataInputBuffer value = new DataInputBuffer();
    final DataInputBuffer nextKey = new DataInputBuffer();
    final DataInputBuffer diskIFileValue = new DataInputBuffer();
    
    Segment minSegment;
    Comparator<Segment> segmentComparator =   
      new Comparator<Segment>() {
      public int compare(Segment o1, Segment o2) {
        if (o1.getLength() == o2.getLength()) {
          return 0;
        }

        return o1.getLength() < o2.getLength() ? -1 : 1;
      }
    };

    KeyState hasNext;
    DataOutputBuffer prevKey = new DataOutputBuffer();

    public MergeQueue(Configuration conf, FileSystem fs, 
                      Path[] inputs, boolean deleteInputs,
                      CompressionCodec codec, boolean ifileReadAhead,
                      int ifileReadAheadLength, int ifileBufferSize,
                      boolean considerFinalMergeForProgress,
                      RawComparator comparator, Progressable reporter, 
                      TezCounter mergedMapOutputsCounter) 
    throws IOException {
      this.conf = conf;
      this.checkForSameKeys = true;
      // this.recordsBeforeProgress =
      // conf.getLong(TezJobConfig.TEZ_RUNTIME_RECORDS_BEFORE_PROGRESS,
      // TezJobConfig.TEZ_RUNTIME_RECORDS_BEFORE_PROGRESS_DEFAULT);
      this.fs = fs;
      this.codec = codec;
      this.comparator = comparator;
      this.reporter = reporter;
      this.considerFinalMergeForProgress = considerFinalMergeForProgress;
      
      for (Path file : inputs) {
        if (LOG.isTraceEnabled()) {
          LOG.trace("MergeQ: adding: " + file);
        }
        segments.add(new DiskSegment(fs, file, codec, ifileReadAhead,
                                      ifileReadAheadLength, ifileBufferSize,
                                      !deleteInputs, 
                                       (file.toString().endsWith(
                                           Constants.MERGED_OUTPUT_PREFIX) ? 
                                        null : mergedMapOutputsCounter)));
      }
      
      // Sort segments on file-lengths
      Collections.sort(segments, segmentComparator); 
    }
    
    public MergeQueue(Configuration conf, FileSystem fs,
        List<Segment> segments, RawComparator comparator,
        Progressable reporter, boolean sortSegments, boolean considerFinalMergeForProgress) {
      this(conf, fs, segments, comparator, reporter, sortSegments, null,
          considerFinalMergeForProgress);
    }

    public MergeQueue(Configuration conf, FileSystem fs,
        List<Segment> segments, RawComparator comparator,
        Progressable reporter, boolean sortSegments, CompressionCodec codec,
        boolean considerFinalMergeForProgress) {
      this(conf, fs, segments, comparator, reporter, sortSegments, null,
          considerFinalMergeForProgress, true);
    }

    public MergeQueue(Configuration conf, FileSystem fs,
        List<Segment> segments, RawComparator comparator,
        Progressable reporter, boolean sortSegments, CompressionCodec codec,
        boolean considerFinalMergeForProgress, boolean checkForSameKeys) {
      this.conf = conf;
      this.fs = fs;
      this.comparator = comparator;
      this.segments = segments;
      this.reporter = reporter;
      this.considerFinalMergeForProgress = considerFinalMergeForProgress;
      if (sortSegments) {
        Collections.sort(segments, segmentComparator);
      }
      this.checkForSameKeys = checkForSameKeys;
      this.codec = codec;
    }

    public void close() throws IOException {
      Segment segment;
      while((segment = pop()) != null) {
        segment.close();
      }
    }

    public DataInputBuffer getKey() throws IOException {
      return key;
    }

    public DataInputBuffer getValue() throws IOException {
      return value;
    }

    private void populatePreviousKey() throws IOException {
      key.reset();
      BufferUtils.copy(key, prevKey);
    }

    private void adjustPriorityQueue(Segment reader) throws IOException{
      long startPos = reader.getPosition();
      if (checkForSameKeys) {
        if (hasNext == null) {
          /**
           * hasNext can be null during first iteration & prevKey is initialized here.
           * In cases of NO_KEY/NEW_KEY, we readjust the queue later. If new segment/file is found
           * during this process, we need to compare keys for RLE across segment boundaries.
           * prevKey can't be empty at that time (e.g custom comparators)
           */
          populatePreviousKey();
        } else {
          //indicates a key has been read already
          if (hasNext != KeyState.SAME_KEY) {
            /**
             * Store previous key before reading next for later key comparisons.
             * If all keys in a segment are unique, it would always hit this code path and key copies
             * are wasteful in such condition, as these comparisons are mainly done for RLE.
             * TODO: When better stats are available, this condition can be avoided.
             */
            populatePreviousKey();
          }
        }
      }
      hasNext = reader.readRawKey(nextKey);
      long endPos = reader.getPosition();
      totalBytesProcessed += endPos - startPos;
      mergeProgress.set(totalBytesProcessed * progPerByte);
      if (hasNext == KeyState.NEW_KEY) {
        adjustTop();
        compareKeyWithNextTopKey(reader);
      } else if(hasNext == KeyState.NO_KEY) {
        pop();
        reader.close();
        compareKeyWithNextTopKey(null);
      } else if(hasNext == KeyState.SAME_KEY) {
        // do not rebalance the priority queue
      }
    }

    /**
     * Check if the previous key is same as the next top segment's key.
     * This would be useful to compute whether same key is spread across multiple segments.
     *
     * @param current
     * @throws IOException
     */
    void compareKeyWithNextTopKey(Segment current) throws IOException {
      Segment nextTop = top();
      if (checkForSameKeys && nextTop != current) {
        //we have a different file. Compare it with previous key
        KeyValueBuffer nextKey = nextTop.getKey();
        int compare = compare(nextKey, prevKey);
        if (compare == 0) {
          //Same key is available in the next segment.
          hasNext = KeyState.SAME_KEY;
        }
      }
    }

    public boolean next() throws IOException {
      if (!hasNext()) {
        return false;
      }

      minSegment = top();
      long startPos = minSegment.getPosition();
      KeyValueBuffer nextKey = minSegment.getKey();
      key.reset(nextKey.getData(), nextKey.getPosition(), nextKey.getLength());
      if (!minSegment.inMemory()) {
        //When we load the value from an inmemory segment, we reset
        //the "value" DIB in this class to the inmem segment's byte[].
        //When we load the value bytes from disk, we shouldn't use
        //the same byte[] since it would corrupt the data in the inmem
        //segment. So we maintain an explicit DIB for value bytes
        //obtained from disk, and if the current segment is a disk
        //segment, we reset the "value" DIB to the byte[] in that (so 
        //we reuse the disk segment DIB whenever we consider
        //a disk segment).
        minSegment.getValue(diskIFileValue);
        value.reset(diskIFileValue.getData(), diskIFileValue.getLength());
      } else {
        minSegment.getValue(value);
      }
      long endPos = minSegment.getPosition();
      totalBytesProcessed += endPos - startPos;
      mergeProgress.set(totalBytesProcessed * progPerByte);

      return true;
    }

    int compare(KeyValueBuffer nextKey, DataOutputBuffer buf2) {
      byte[] b1 = nextKey.getData();
      byte[] b2 = buf2.getData();
      int s1 = nextKey.getPosition();
      int s2 = 0;
      int l1 = nextKey.getLength();
      int l2 = buf2.getLength();
      return comparator.compare(b1, s1, l1, b2, s2, l2);
    }

    protected boolean lessThan(Object a, Object b) {
      KeyValueBuffer key1 = ((Segment)a).getKey();
      KeyValueBuffer key2 = ((Segment)b).getKey();
      int s1 = key1.getPosition();
      int l1 = key1.getLength();
      int s2 = key2.getPosition();
      int l2 = key2.getLength();;

      return comparator.compare(key1.getData(), s1, l1, key2.getData(), s2, l2) < 0;
    }
    
    public TezRawKeyValueIterator merge(Class keyClass, Class valueClass,
                                     int factor, Path tmpDir,
                                     TezCounter readsCounter,
                                     TezCounter writesCounter,
                                     TezCounter bytesReadCounter,
                                     Progress mergePhase)
        throws IOException, InterruptedException {
      return merge(keyClass, valueClass, factor, 0, tmpDir,
                   readsCounter, writesCounter, bytesReadCounter, mergePhase);
    }

    TezRawKeyValueIterator merge(Class keyClass, Class valueClass,
                                     int factor, int inMem, Path tmpDir,
                                     TezCounter readsCounter,
                                     TezCounter writesCounter,
                                     TezCounter bytesReadCounter,
                                     Progress mergePhase)
        throws IOException, InterruptedException {
      if (segments.size() == 0) {
        LOG.info("Nothing to merge. Returning an empty iterator");
        return new EmptyIterator();
      }
      if (LOG.isDebugEnabled()) {
        LOG.debug("Merging " + segments.size() + " sorted segments");
      }

      /*
       * If there are inMemory segments, then they come first in the segments
       * list and then the sorted disk segments. Otherwise(if there are only
       * disk segments), then they are sorted segments if there are more than
       * factor segments in the segments list.
       */
      int numSegments = segments.size();
      int origFactor = factor;
      int passNo = 1;
      if (mergePhase != null) {
        mergeProgress = mergePhase;
      }

      long totalBytes = computeBytesInMerges(segments, factor, inMem, considerFinalMergeForProgress);
      if (totalBytes != 0) {
        progPerByte = 1.0f / (float)totalBytes;
      }
      
      //create the MergeStreams from the sorted map created in the constructor
      //and dump the final output to a file
      do {
        //get the factor for this pass of merge. We assume in-memory segments
        //are the first entries in the segment list and that the pass factor
        //doesn't apply to them
        factor = getPassFactor(factor, passNo, numSegments - inMem);
        if (1 == passNo) {
          factor += inMem;
        }
        List<Segment> segmentsToMerge =
          new ArrayList<Segment>();
        int segmentsConsidered = 0;
        int numSegmentsToConsider = factor;
        long startBytes = 0; // starting bytes of segments of this merge
        while (true) {
          //extract the smallest 'factor' number of segments  
          //Call cleanup on the empty segments (no key/value data)
          List<Segment> mStream = 
            getSegmentDescriptors(numSegmentsToConsider);
          for (Segment segment : mStream) {
            // Initialize the segment at the last possible moment;
            // this helps in ensuring we don't use buffers until we need them

            segment.init(readsCounter, bytesReadCounter);
            long startPos = segment.getPosition();
            boolean hasNext = segment.nextRawKey(nextKey);
            long endPos = segment.getPosition();
            
            if (hasNext) {
              startBytes += endPos - startPos;
              segmentsToMerge.add(segment);
              segmentsConsidered++;
            }
            else { // Empty segments. Can this be avoided altogether ?
              segment.close();
              numSegments--; //we ignore this segment for the merge
            }
          }
          //if we have the desired number of segments
          //or looked at all available segments, we break
          if (segmentsConsidered == factor || 
              segments.size() == 0) {
            break;
          }

          // Get the correct # of segments in case some of them were empty.
          numSegmentsToConsider = factor - segmentsConsidered;
        }
        
        //feed the streams to the priority queue
        initialize(segmentsToMerge.size());
        clear();
        for (Segment segment : segmentsToMerge) {
          put(segment);
        }
        
        //if we have lesser number of segments remaining, then just return the
        //iterator, else do another single level merge
        if (numSegments <= factor) { // Will always kick in if only in-mem segments are provided.
          if (!considerFinalMergeForProgress) { // for reduce task

            // Reset totalBytesProcessed and recalculate totalBytes from the
            // remaining segments to track the progress of the final merge.
            // Final merge is considered as the progress of the reducePhase,
            // the 3rd phase of reduce task.
            totalBytesProcessed = 0;
            totalBytes = 0;
            for (int i = 0; i < segmentsToMerge.size(); i++) {
              totalBytes += segmentsToMerge.get(i).getLength();
            }
          }
          if (totalBytes != 0) //being paranoid
            progPerByte = 1.0f / (float)totalBytes;
          
          totalBytesProcessed += startBytes;
          if (totalBytes != 0)
            mergeProgress.set(totalBytesProcessed * progPerByte);
          else
            mergeProgress.set(1.0f); // Last pass and no segments left - we're done

          if (LOG.isDebugEnabled()) {
            LOG.debug("Down to the last merge-pass, with " + numSegments +
                " segments left of total size: " +
                (totalBytes - totalBytesProcessed) + " bytes");
          }
          // At this point, Factor Segments have not been physically
          // materialized. The merge will be done dynamically. Some of them may
          // be in-memory segments, other on-disk semgnets. Decision to be made
          // by a finalMerge is that is required.
          return this;
        } else {
          if (LOG.isDebugEnabled()) {
            LOG.debug("Merging " + segmentsToMerge.size() +
                " intermediate segments out of a total of " +
                (segments.size() + segmentsToMerge.size()));
          }
          
          long bytesProcessedInPrevMerges = totalBytesProcessed;
          totalBytesProcessed += startBytes;

          //we want to spread the creation of temp files on multiple disks if 
          //available under the space constraints
          long approxOutputSize = 0; 
          for (Segment s : segmentsToMerge) {
            approxOutputSize += s.getLength() + 
                                ChecksumFileSystem.getApproxChkSumLength(
                                s.getLength());
          }
          Path tmpFilename = 
            new Path(tmpDir, "intermediate").suffix("." + passNo);

          Path outputFile =  lDirAlloc.getLocalPathForWrite(
                                              tmpFilename.toString(),
                                              approxOutputSize, conf);

          // TODO Would it ever make sense to make this an in-memory writer ?
          // Merging because of too many disk segments - might fit in memory.
          Writer writer = 
            new Writer(conf, fs, outputFile, keyClass, valueClass, codec,
                             writesCounter, null);

          writeFile(this, writer, reporter, recordsBeforeProgress);
          writer.close();
          
          //we finished one single level merge; now clean up the priority 
          //queue
          this.close();

          // Add the newly create segment to the list of segments to be merged
          Segment tempSegment = 
            new DiskSegment(fs, outputFile, codec, ifileReadAhead,
                ifileReadAheadLength, ifileBufferSize, false);

          // Insert new merged segment into the sorted list
          int pos = Collections.binarySearch(segments, tempSegment,
                                             segmentComparator);
          if (pos < 0) {
            // binary search failed. So position to be inserted at is -pos-1
            pos = -pos-1;
          }
          segments.add(pos, tempSegment);
          numSegments = segments.size();
          
          // Subtract the difference between expected size of new segment and 
          // actual size of new segment(Expected size of new segment is
          // inputBytesOfThisMerge) from totalBytes. Expected size and actual
          // size will match(almost) if combiner is not called in merge.
          long inputBytesOfThisMerge = totalBytesProcessed -
                                       bytesProcessedInPrevMerges;
          totalBytes -= inputBytesOfThisMerge - tempSegment.getLength();
          if (totalBytes != 0) {
            progPerByte = 1.0f / (float)totalBytes;
          }
          
          passNo++;
        }
        //we are worried about only the first pass merge factor. So reset the 
        //factor to what it originally was
        factor = origFactor;
      } while(true);
    }
    
    /**
     * Determine the number of segments to merge in a given pass. Assuming more
     * than factor segments, the first pass should attempt to bring the total
     * number of segments - 1 to be divisible by the factor - 1 (each pass
     * takes X segments and produces 1) to minimize the number of merges.
     */
    private static int getPassFactor(int factor, int passNo, int numSegments) {
      // passNo > 1 in the OR list - is that correct ?
      if (passNo > 1 || numSegments <= factor || factor == 1) 
        return factor;
      int mod = (numSegments - 1) % (factor - 1);
      if (mod == 0)
        return factor;
      return mod + 1;
    }
    
    /** Return (& remove) the requested number of segment descriptors from the
     * sorted map.
     */
    private List<Segment> getSegmentDescriptors(int numDescriptors) {
      if (numDescriptors > segments.size()) {
        List<Segment> subList = new ArrayList<Segment>(segments);
        segments.clear();
        return subList;
      }

      // Efficiently bulk remove segments
      List<Segment> subList = segments.subList(0, numDescriptors);
      List<Segment> subListCopy = new ArrayList<>(subList);
      subList.clear();
      return subListCopy;
    }
    
    /**
     * Compute expected size of input bytes to merges, will be used in
     * calculating mergeProgress. This simulates the above merge() method and
     * tries to obtain the number of bytes that are going to be merged in all
     * merges(assuming that there is no combiner called while merging).
     * @param segments segments to compute merge bytes
     * @param factor mapreduce.task.io.sort.factor
     * @param inMem  number of segments in memory to be merged
     * @param considerFinalMergeForProgress whether to consider for final merge
     */
    static long computeBytesInMerges(List<Segment> segments, int factor, int inMem, boolean considerFinalMergeForProgress) {
      int numSegments = segments.size();
      long[] segmentSizes = new long[numSegments];
      long totalBytes = 0;
      int n = numSegments - inMem;
      // factor for 1st pass
      int f = getPassFactor(factor, 1, n) + inMem;
      n = numSegments;
 
      for (int i = 0; i < numSegments; i++) {
        // Not handling empty segments here assuming that it would not affect
        // much in calculation of mergeProgress.
        segmentSizes[i] = segments.get(i).getLength();
      }
      
      // If includeFinalMerge is true, allow the following while loop iterate
      // for 1 more iteration. This is to include final merge as part of the
      // computation of expected input bytes of merges
      boolean considerFinalMerge = considerFinalMergeForProgress;

      int offset = 0;
      while (n > f || considerFinalMerge) {
        if (n <= f) {
          considerFinalMerge = false;
        }
        long mergedSize = 0;
        f = Math.min(f, n);
        for (int j = 0; j < f; j++) {
          mergedSize += segmentSizes[offset + j];
        }
        totalBytes += mergedSize;
        
        // insert new size into the sorted list
        int pos = Arrays.binarySearch(segmentSizes, offset, offset + n, mergedSize);
        if (pos < 0) {
          pos = -pos-1;
        }
        if (pos < offset + f) {
          // Insert at the beginning
          offset += f - 1;
          segmentSizes[offset] = mergedSize;
        } else if (pos < offset + n) {
          // Insert in the middle
          if (offset + n < segmentSizes.length) {
            // Shift right after insertion point into unused capacity
            System.arraycopy(segmentSizes, pos, segmentSizes, pos + 1, offset + n - pos);
            // Insert into insertion point
            segmentSizes[pos] = mergedSize;
            offset += f;
          } else {
            // Full left shift before insertion point
            System.arraycopy(segmentSizes, offset + f, segmentSizes, 0, pos - (offset + f));
            // Insert in the middle
            segmentSizes[pos - (offset + f)] = mergedSize;
            // Full left shift after insertion point
            System.arraycopy(segmentSizes, pos, segmentSizes, pos - (offset + f) + 1, offset + n - pos);
            offset = 0;
          }
        } else {
          // Insert at the end
          if (pos < segmentSizes.length) {
            // Append into unused capacity
            segmentSizes[pos] = mergedSize;
            offset += f;
          } else {
            // Full left shift
            // Append at the end
            System.arraycopy(segmentSizes, offset + f, segmentSizes, 0, n - f);
            segmentSizes[n - f] = mergedSize;
            offset = 0;
          }
        }
        n -=  f - 1;
        f = factor;
      }

      return totalBytes;
    }

    public Progress getProgress() {
      return mergeProgress;
    }

    @Override
    public boolean isSameKey() throws IOException {
      return (hasNext != null) && (hasNext == KeyState.SAME_KEY);
    }

    public boolean hasNext() throws IOException {
      if (size() == 0)
        return false;

      if (minSegment != null) {
        //minSegment is non-null for all invocations of next except the first
        //one. For the first invocation, the priority queue is ready for use
        //but for the subsequent invocations, first adjust the queue
        adjustPriorityQueue(minSegment);
        if (size() == 0) {
          minSegment = null;
          return false;
        }
      }

      return true;
    }

  }

  private static class EmptyIterator implements TezRawKeyValueIterator {
    final Progress progress = new Progress();

    EmptyIterator() {
      progress.set(1.0f);
    }

    @Override
    public DataInputBuffer getKey() throws IOException {
      throw new RuntimeException("No keys on an empty iterator");
    }

    @Override
    public DataInputBuffer getValue() throws IOException {
      throw new RuntimeException("No values on an empty iterator");
    }

    @Override
    public boolean next() throws IOException {
      return false;
    }

    @Override
    public boolean hasNext() throws IOException {
      return false;
    }

    @Override
    public void close() throws IOException {
    }

    @Override
    public Progress getProgress() {
      return progress;
    }

    @Override
    public boolean isSameKey() throws IOException {
      throw new UnsupportedOperationException("isSameKey is not supported");
    }
  }
}