/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.tez.runtime.library.common.sort.impl;

import java.io.File;
import java.io.IOException;
import java.io.InputStream;
import java.util.Collections;
import java.util.Iterator;
import java.util.List;
import java.util.Map;

import com.google.common.annotations.VisibleForTesting;
import com.google.common.collect.Maps;
import org.apache.tez.runtime.api.Event;
import org.apache.tez.runtime.api.OutputStatisticsReporter;
import org.apache.tez.runtime.library.api.IOInterruptedException;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.apache.hadoop.classification.InterfaceAudience.Private;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.CommonConfigurationKeys;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.LocalFileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.fs.RawLocalFileSystem;
import org.apache.hadoop.io.RawComparator;
import org.apache.hadoop.io.compress.CompressionCodec;
import org.apache.hadoop.io.compress.Compressor;
import org.apache.hadoop.io.compress.DefaultCodec;
import org.apache.hadoop.io.serializer.SerializationFactory;
import org.apache.hadoop.io.serializer.Serializer;
import org.apache.hadoop.util.IndexedSorter;
import org.apache.hadoop.util.Progressable;
import org.apache.hadoop.util.QuickSort;
import org.apache.hadoop.util.ReflectionUtils;
import org.apache.tez.common.TezRuntimeFrameworkConfigs;
import org.apache.tez.common.counters.TaskCounter;
import org.apache.tez.common.counters.TezCounter;
import org.apache.tez.runtime.api.OutputContext;
import org.apache.tez.runtime.library.api.Partitioner;
import org.apache.tez.runtime.library.api.TezRuntimeConfiguration;
import org.apache.tez.runtime.library.api.TezRuntimeConfiguration.ReportPartitionStats;
import org.apache.tez.runtime.library.common.ConfigUtils;
import org.apache.tez.runtime.library.common.TezRuntimeUtils;
import org.apache.tez.runtime.library.common.combine.Combiner;
import org.apache.tez.runtime.library.common.shuffle.orderedgrouped.ShuffleHeader;
import org.apache.tez.runtime.library.common.sort.impl.IFile.Writer;
import org.apache.tez.runtime.library.common.task.local.output.TezTaskOutput;
import org.apache.tez.common.Preconditions;

@SuppressWarnings({"unchecked", "rawtypes"})
public abstract class ExternalSorter {

  private static final Logger LOG = LoggerFactory.getLogger(ExternalSorter.class);

  public List<Event> close() throws IOException {
    spillFileIndexPaths.clear();
    spillFilePaths.clear();
    reportStatistics();
    outputContext.notifyProgress();
    return Collections.emptyList();
  }

  public abstract void flush() throws IOException;

  public abstract void write(Object key, Object value) throws IOException;
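  /**
   * Writes all values associated with the given key by delegating to
   * {@link #write(Object, Object)} once per value.
   */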
  public void write(Object key, Iterable<Object> values) throws IOException {
    //TODO: Sorter classes should override this method later.
    Iterator<Object> it = values.iterator();
    while (it.hasNext()) {
      write(key, it.next());
    }
  }

  protected final Progressable progressable = new Progressable() {
    @Override
    public void progress() {
      outputContext.notifyProgress();
    }
  };

  protected final OutputContext outputContext;
  protected final Combiner combiner;
  protected final Partitioner partitioner;
  protected final Configuration conf;
  protected final RawLocalFileSystem localFs;
  protected final FileSystem rfs;
  protected final TezTaskOutput mapOutputFile;
  protected final int partitions;
  protected final Class keyClass;
  protected final Class valClass;
  protected final RawComparator comparator;
  protected final SerializationFactory serializationFactory;
  protected final Serializer keySerializer;
  protected final Serializer valSerializer;

  protected final boolean ifileReadAhead;
  protected final int ifileReadAheadLength;
  protected final int ifileBufferSize;

  protected final long availableMemoryMb;

  protected final IndexedSorter sorter;

  // Compression for map-outputs
  protected final CompressionCodec codec;

  protected final Map<Integer, Path> spillFilePaths = Maps.newHashMap();
  protected final Map<Integer, Path> spillFileIndexPaths = Maps.newHashMap();

  protected Path finalOutputFile;
  protected Path finalIndexFile;
  protected int numSpills;
  protected final boolean cleanup;

  protected OutputStatisticsReporter statsReporter;
  protected final long[] partitionStats;
  protected final boolean finalMergeEnabled;
  protected final boolean sendEmptyPartitionDetails;

  // Counters
  // MR compatibility layer needs to rename counters back to what MR requires.

  // Represents final deserialized size of output (spills are not counted)
  protected final TezCounter mapOutputByteCounter;
  // Represents final number of records written (spills are not counted)
  protected final TezCounter mapOutputRecordCounter;
  // Represents the size of the final output - with any overheads introduced by
  // the storage/serialization mechanism. This is an uncompressed data size.
  protected final TezCounter outputBytesWithOverheadCounter;
  // Represents the size of the final output - which will be transmitted over
  // the wire (spills are not counted). Factors in compression if it is enabled.
  protected final TezCounter fileOutputByteCounter;
  // Represents the total number of records written to disk (includes spills;
  // the minimum value is the number of output records)
  protected final TezCounter spilledRecordsCounter;
  // Bytes written as a result of additional spills. The single spill for the
  // final output data is not considered. (This will be 0 if there are no
  // additional spills. Compressed size - so it may not represent the size in
  // the sort buffer)
  protected final TezCounter additionalSpillBytesWritten;

  protected final TezCounter additionalSpillBytesRead;
  // Number of spills written & consumed by the same task to generate the final file
  protected final TezCounter numAdditionalSpills;
  // Number of files offered via the shuffle-handler to consumers.
  protected final TezCounter numShuffleChunks;

  // How partition stats should be reported.
  final ReportPartitionStats reportPartitionStats;
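  /**
   * Sets up the state shared by all sorter implementations: local filesystems,
   * partitioner, combiner, key/value serializers, comparator, compression
   * codec, counters, and the memory assigned to this sorter. Overflow checks
   * on the assigned memory are left to the concrete sorter implementations.
   */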
  public ExternalSorter(OutputContext outputContext, Configuration conf, int numOutputs,
      long initialMemoryAvailable) throws IOException {
    this.outputContext = outputContext;
    this.conf = conf;
    this.localFs = (RawLocalFileSystem) FileSystem.getLocal(conf).getRaw();
    this.partitions = numOutputs;
    reportPartitionStats = ReportPartitionStats.fromString(
        conf.get(TezRuntimeConfiguration.TEZ_RUNTIME_REPORT_PARTITION_STATS,
            TezRuntimeConfiguration.TEZ_RUNTIME_REPORT_PARTITION_STATS_DEFAULT));
    partitionStats = reportPartitionStats.isEnabled() ? (new long[partitions]) : null;

    cleanup = conf.getBoolean(TezRuntimeConfiguration.TEZ_RUNTIME_CLEANUP_FILES_ON_INTERRUPT,
        TezRuntimeConfiguration.TEZ_RUNTIME_CLEANUP_FILES_ON_INTERRUPT_DEFAULT);

    rfs = ((LocalFileSystem) FileSystem.getLocal(this.conf)).getRaw();

    if (LOG.isDebugEnabled()) {
      LOG.debug(outputContext.getDestinationVertexName() + ": Initial Mem bytes : "
          + initialMemoryAvailable + ", in MB=" + (initialMemoryAvailable >> 20));
    }
    int assignedMb = (int) (initialMemoryAvailable >> 20);
    //Let the overflow checks happen in appropriate sorter impls
    this.availableMemoryMb = assignedMb;

    // sorter
    sorter = ReflectionUtils.newInstance(this.conf.getClass(
        TezRuntimeConfiguration.TEZ_RUNTIME_INTERNAL_SORTER_CLASS, QuickSort.class,
        IndexedSorter.class), this.conf);

    comparator = ConfigUtils.getIntermediateOutputKeyComparator(this.conf);

    // k/v serialization
    keyClass = ConfigUtils.getIntermediateOutputKeyClass(this.conf);
    valClass = ConfigUtils.getIntermediateOutputValueClass(this.conf);
    serializationFactory = new SerializationFactory(this.conf);
    keySerializer = serializationFactory.getSerializer(keyClass);
    valSerializer = serializationFactory.getSerializer(valClass);

    LOG.info(outputContext.getDestinationVertexName() + " using: "
        + "memoryMb=" + assignedMb
        + ", keySerializerClass=" + keyClass
        + ", valueSerializerClass=" + valSerializer
        + ", comparator=" + comparator
        + ", partitioner=" + conf.get(TezRuntimeConfiguration.TEZ_RUNTIME_PARTITIONER_CLASS)
        + ", serialization=" + conf.get(CommonConfigurationKeys.IO_SERIALIZATIONS_KEY)
        + ", reportPartitionStats=" + reportPartitionStats);

    // counters
    mapOutputByteCounter = outputContext.getCounters().findCounter(TaskCounter.OUTPUT_BYTES);
    mapOutputRecordCounter = outputContext.getCounters().findCounter(TaskCounter.OUTPUT_RECORDS);
    outputBytesWithOverheadCounter =
        outputContext.getCounters().findCounter(TaskCounter.OUTPUT_BYTES_WITH_OVERHEAD);
    fileOutputByteCounter =
        outputContext.getCounters().findCounter(TaskCounter.OUTPUT_BYTES_PHYSICAL);
    spilledRecordsCounter = outputContext.getCounters().findCounter(TaskCounter.SPILLED_RECORDS);
    additionalSpillBytesWritten =
        outputContext.getCounters().findCounter(TaskCounter.ADDITIONAL_SPILLS_BYTES_WRITTEN);
    additionalSpillBytesRead =
        outputContext.getCounters().findCounter(TaskCounter.ADDITIONAL_SPILLS_BYTES_READ);
    numAdditionalSpills =
        outputContext.getCounters().findCounter(TaskCounter.ADDITIONAL_SPILL_COUNT);
    numShuffleChunks = outputContext.getCounters().findCounter(TaskCounter.SHUFFLE_CHUNK_COUNT);
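    // compression: instantiate the configured codec eagerly and fail fast if
    // its compressor type cannot be resolved (usually a sign that the codec's
    // native libraries are missing on this node).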
    if (ConfigUtils.shouldCompressIntermediateOutput(this.conf)) {
      Class<? extends CompressionCodec> codecClass =
          ConfigUtils.getIntermediateOutputCompressorClass(this.conf, DefaultCodec.class);
      codec = ReflectionUtils.newInstance(codecClass, this.conf);

      if (codec != null) {
        Class<? extends Compressor> compressorType = null;
        Throwable cause = null;
        try {
          compressorType = codec.getCompressorType();
        } catch (RuntimeException e) {
          cause = e;
        }
        if (compressorType == null) {
          String errMsg = String.format("Unable to get CompressorType for codec (%s). This is most"
                  + " likely due to missing native libraries for the codec.",
              conf.get(TezRuntimeConfiguration.TEZ_RUNTIME_COMPRESS_CODEC));
          throw new IOException(errMsg, cause);
        }
      }
    } else {
      codec = null;
    }

    this.ifileReadAhead = this.conf.getBoolean(
        TezRuntimeConfiguration.TEZ_RUNTIME_IFILE_READAHEAD,
        TezRuntimeConfiguration.TEZ_RUNTIME_IFILE_READAHEAD_DEFAULT);
    if (this.ifileReadAhead) {
      this.ifileReadAheadLength = conf.getInt(
          TezRuntimeConfiguration.TEZ_RUNTIME_IFILE_READAHEAD_BYTES,
          TezRuntimeConfiguration.TEZ_RUNTIME_IFILE_READAHEAD_BYTES_DEFAULT);
    } else {
      this.ifileReadAheadLength = 0;
    }
    this.ifileBufferSize = conf.getInt("io.file.buffer.size",
        TezRuntimeConfiguration.TEZ_RUNTIME_IFILE_BUFFER_SIZE_DEFAULT);

    // Task outputs
    mapOutputFile = TezRuntimeUtils.instantiateTaskOutputManager(conf, outputContext);

    this.conf.setInt(TezRuntimeFrameworkConfigs.TEZ_RUNTIME_NUM_EXPECTED_PARTITIONS,
        this.partitions);
    this.partitioner = TezRuntimeUtils.instantiatePartitioner(this.conf);
    this.combiner = TezRuntimeUtils.instantiateCombiner(this.conf, outputContext);
    this.statsReporter = outputContext.getStatisticsReporter();
    this.finalMergeEnabled = conf.getBoolean(
        TezRuntimeConfiguration.TEZ_RUNTIME_ENABLE_FINAL_MERGE_IN_OUTPUT,
        TezRuntimeConfiguration.TEZ_RUNTIME_ENABLE_FINAL_MERGE_IN_OUTPUT_DEFAULT);
    this.sendEmptyPartitionDetails = conf.getBoolean(
        TezRuntimeConfiguration.TEZ_RUNTIME_EMPTY_PARTITION_INFO_VIA_EVENTS_ENABLED,
        TezRuntimeConfiguration.TEZ_RUNTIME_EMPTY_PARTITION_INFO_VIA_EVENTS_ENABLED_DEFAULT);
  }

  @VisibleForTesting
  public boolean isFinalMergeEnabled() {
    return finalMergeEnabled;
  }

  /**
   * Exception indicating that the allocated sort buffer is insufficient to hold
   * the current record.
   */
  @SuppressWarnings("serial")
  public static class MapBufferTooSmallException extends IOException {
    public MapBufferTooSmallException(String s) {
      super(s);
    }
  }

  @Private
  public TezTaskOutput getMapOutput() {
    return mapOutputFile;
  }

  @Private
  public Path getFinalIndexFile() {
    return finalIndexFile;
  }

  public Path getFinalOutputFile() {
    return finalOutputFile;
  }
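  /**
   * Runs the configured combiner over the given key/value iterator, writing the
   * combined records to the supplied writer. If the combiner is interrupted,
   * the thread's interrupt flag is restored and an
   * {@link IOInterruptedException} is thrown.
   */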
  protected void runCombineProcessor(TezRawKeyValueIterator kvIter, Writer writer)
      throws IOException {
    try {
      outputContext.notifyProgress();
      combiner.combine(kvIter, writer);
    } catch (InterruptedException e) {
      Thread.currentThread().interrupt();
      throw new IOInterruptedException("Combiner interrupted", e);
    }
  }

  /**
   * Rename srcPath to dstPath on the same volume. This is the same as
   * RawLocalFileSystem's rename method, except that it will not fall back to a
   * copy, and it will create the target directory if it doesn't exist.
   */
  protected void sameVolRename(Path srcPath, Path dstPath) throws IOException {
    RawLocalFileSystem rfs = (RawLocalFileSystem) this.rfs;
    File src = rfs.pathToFile(srcPath);
    File dst = rfs.pathToFile(dstPath);
    if (!dst.getParentFile().exists()) {
      if (!dst.getParentFile().mkdirs()) {
        throw new IOException("Unable to rename " + src + " to " + dst
            + ": couldn't create parent directory");
      }
    }

    if (!src.renameTo(dst)) {
      throw new IOException("Unable to rename " + src + " to " + dst);
    }
  }

  public InputStream getSortedStream(int partition) {
    throw new UnsupportedOperationException("getSortedStream isn't supported!");
  }

  public ShuffleHeader getShuffleHeader(int reduce) {
    throw new UnsupportedOperationException("getShuffleHeader isn't supported!");
  }

  public static long getInitialMemoryRequirement(Configuration conf, long maxAvailableTaskMemory) {
    int initialMemRequestMb = conf.getInt(
        TezRuntimeConfiguration.TEZ_RUNTIME_IO_SORT_MB,
        TezRuntimeConfiguration.TEZ_RUNTIME_IO_SORT_MB_DEFAULT);
    long reqBytes = ((long) initialMemRequestMb) << 20;
    // Upper bound checks are done in individual sorter implementations
    Preconditions.checkArgument(initialMemRequestMb > 0 && reqBytes < maxAvailableTaskMemory,
        TezRuntimeConfiguration.TEZ_RUNTIME_IO_SORT_MB + " " + initialMemRequestMb
            + " should be larger than 0 and should be less than the available task memory (MB):"
            + (maxAvailableTaskMemory >> 20));
    if (LOG.isDebugEnabled()) {
      LOG.debug("Requested SortBufferSize ("
          + TezRuntimeConfiguration.TEZ_RUNTIME_IO_SORT_MB + "): " + initialMemRequestMb);
    }
    return reqBytes;
  }

  public int getNumSpills() {
    return numSpills;
  }

  protected synchronized void cleanup() throws IOException {
    if (!cleanup) {
      return;
    }
    cleanup(spillFilePaths);
    cleanup(spillFileIndexPaths);
    //TODO: What if a same-volume rename has already happened?
    // (Have to rely on job completion cleanup.)
    cleanup(finalOutputFile);
    cleanup(finalIndexFile);
  }

  protected synchronized void cleanup(Path path) {
    if (path == null || !cleanup) {
      return;
    }
    try {
      LOG.info("Deleting " + path);
      rfs.delete(path, true);
    } catch (IOException ioe) {
      LOG.warn("Error in deleting " + path, ioe);
    }
  }

  protected synchronized void cleanup(Map<Integer, Path> spillMap) {
    if (!cleanup) {
      return;
    }
    for (Map.Entry<Integer, Path> entry : spillMap.entrySet()) {
      cleanup(entry.getValue());
    }
  }

  public long[] getPartitionStats() {
    return partitionStats;
  }

  protected boolean reportPartitionStats() {
    return (partitionStats != null);
  }

  protected synchronized void reportStatistics() {
    // This works for non-started outputs since new counters will be created
    // with an initial value of 0
    long outputSize = outputContext.getCounters()
        .findCounter(TaskCounter.OUTPUT_BYTES).getValue();
    statsReporter.reportDataSize(outputSize);
    long outputRecords = outputContext.getCounters()
        .findCounter(TaskCounter.OUTPUT_RECORDS).getValue();
    statsReporter.reportItemsProcessed(outputRecords);
  }

  public boolean reportDetailedPartitionStats() {
    return reportPartitionStats.isPrecise();
  }
}