/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.hadoop.mapred;

import java.io.DataInput;
import java.io.DataOutput;
import java.io.File;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.lang.Math;
import java.net.HttpURLConnection;
import java.net.UnknownHostException;
import java.net.URI;
import java.net.URL;
import java.net.URLClassLoader;
import java.net.URLConnection;
import java.text.DecimalFormat;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Comparator;
import java.util.HashMap;
import java.util.HashSet;
import java.util.LinkedHashMap;
import java.util.Iterator;
import java.util.LinkedList;
import java.util.List;
import java.util.Map;
import java.util.Random;
import java.util.Set;
import java.util.SortedSet;
import java.util.TreeSet;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.atomic.AtomicInteger;

import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.ChecksumFileSystem;
import org.apache.hadoop.fs.FSError;
import org.apache.hadoop.fs.FileStatus;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.LocalFileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.DataInputBuffer;
import org.apache.hadoop.io.IOUtils;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.RawComparator;
import org.apache.hadoop.io.SequenceFile;
import org.apache.hadoop.io.Writable;
import org.apache.hadoop.io.WritableFactories;
import org.apache.hadoop.io.WritableFactory;
import org.apache.hadoop.io.WritableUtils;
import org.apache.hadoop.io.SequenceFile.CompressionType;
import org.apache.hadoop.io.compress.CodecPool;
import org.apache.hadoop.io.compress.CompressionCodec;
import org.apache.hadoop.io.compress.Decompressor;
import org.apache.hadoop.io.compress.DefaultCodec;
import org.apache.hadoop.mapred.IFile.*;
import org.apache.hadoop.mapred.Merger.Segment;
import org.apache.hadoop.mapred.SortedRanges.SkipRangeIterator;
import org.apache.hadoop.mapred.Task.Counter;
import org.apache.hadoop.mapred.TaskTracker.TaskInProgress;
import org.apache.hadoop.mapreduce.TaskAttemptContext;
import org.apache.hadoop.metrics.MetricsContext;
import org.apache.hadoop.metrics.MetricsRecord;
import org.apache.hadoop.metrics.MetricsUtil;
import org.apache.hadoop.metrics.Updater;
import org.apache.hadoop.util.Progress;
import org.apache.hadoop.util.Progressable;
import org.apache.hadoop.util.ReflectionUtils;
import org.apache.hadoop.util.StringUtils;
import org.apache.hadoop.util.ResourceCalculatorPlugin.ProcResourceValues;

/** A Reduce task. */
class ReduceTask extends Task {

  static {                                        // register a ctor
    WritableFactories.setFactory
      (ReduceTask.class,
       new WritableFactory() {
         public Writable newInstance() { return new ReduceTask(); }
       });
  }

  private static final Log LOG = LogFactory.getLog(ReduceTask.class.getName());
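  // Number of map tasks in the job whose output this reduce consumes.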
  private int numMaps;
  private int maxCopyBackoff;
  private ReduceCopier reduceCopier;

  private CompressionCodec codec;


  {
    getProgress().setStatus("reduce");
    setPhase(TaskStatus.Phase.SHUFFLE);        // phase to start with
  }

  private Progress copyPhase;
  private Progress sortPhase;
  private Progress reducePhase;
  private Counters.Counter reduceShuffleBytes =
    getCounters().findCounter(Counter.REDUCE_SHUFFLE_BYTES);
  private Counters.Counter reduceInputKeyCounter =
    getCounters().findCounter(Counter.REDUCE_INPUT_GROUPS);
  private Counters.Counter reduceInputValueCounter =
    getCounters().findCounter(Counter.REDUCE_INPUT_RECORDS);
  private Counters.Counter reduceInputBytesCounter =
    getCounters().findCounter(Counter.REDUCE_INPUT_BYTES);
  private Counters.Counter reduceOutputCounter =
    getCounters().findCounter(Counter.REDUCE_OUTPUT_RECORDS);
  private Counters.Counter reduceCombineOutputCounter =
    getCounters().findCounter(Counter.COMBINE_OUTPUT_RECORDS);

  // A custom comparator for map output files. The ordering is determined by
  // the file's size and path. For files with the same size but different
  // paths, the first argument is considered smaller than the second one.
  // Files with the same size and the same path are considered equal.
  private Comparator<FileStatus> mapOutputFileComparator =
    new Comparator<FileStatus>() {
      public int compare(FileStatus a, FileStatus b) {
        if (a.getLen() < b.getLen())
          return -1;
        else if (a.getLen() == b.getLen())
          if (a.getPath().toString().equals(b.getPath().toString()))
            return 0;
          else
            return -1;
        else
          return 1;
      }
  };

  // A sorted set for keeping a set of map output files on disk
  private final SortedSet<FileStatus> mapOutputFilesOnDisk =
    new TreeSet<FileStatus>(mapOutputFileComparator);

  public ReduceTask() {
    super();
  }

  public ReduceTask(String jobFile, TaskAttemptID taskId,
                    int partition, int numMaps, int numSlotsRequired,
                    String username) {
    super(jobFile, taskId, partition, numSlotsRequired, username);
    this.numMaps = numMaps;
  }

  @Override
  public void setConf(Configuration conf) {
    super.setConf(conf);
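    // Cap on the back-off applied when retrying failed map-output copies.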
    this.maxCopyBackoff = conf.getInt("mapred.reduce.copy.backoff.max", 10);
  }

  private CompressionCodec initCodec() {
    // check if map-outputs are to be compressed
    if (conf.getCompressMapOutput()) {
      Class<? extends CompressionCodec> codecClass =
        conf.getMapOutputCompressorClass(DefaultCodec.class);
      return ReflectionUtils.newInstance(codecClass, conf);
    }

    return null;
  }

  @Override
  public TaskRunner createRunner(TaskTracker tracker, TaskInProgress tip)
  throws IOException {
    return new ReduceTaskRunner(tip, tracker, this.conf);
  }

  @Override
  public boolean isMapTask() {
    return false;
  }

  public int getNumMaps() { return numMaps; }
  
  /**
   * Localize the given JobConf to be specific for this task.
   */
  @Override
  public void localizeConfiguration(JobConf conf) throws IOException {
    super.localizeConfiguration(conf);
    conf.setNumMapTasks(numMaps);
  }

  @Override
  public void write(DataOutput out) throws IOException {
    super.write(out);

    out.writeInt(numMaps);                        // write the number of maps
  }

  @Override
  public void readFields(DataInput in) throws IOException {
    super.readFields(in);

    numMaps = in.readInt();
  }

  // Get the input files for the reducer.
  private Path[] getMapFiles(FileSystem fs, boolean isLocal)
  throws IOException {
    List<Path> fileList = new ArrayList<Path>();
    if (isLocal) {
      // for local jobs
      for(int i = 0; i < numMaps; ++i) {
        fileList.add(mapOutputFile.getInputFile(i, getTaskID()));
      }
    } else {
      // for non local jobs
      for (FileStatus filestatus : mapOutputFilesOnDisk) {
        fileList.add(filestatus.getPath());
      }
    }
    return fileList.toArray(new Path[0]);
  }

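  /**
   * Iterates over the values of the current key while updating the
   * reduce-input record/byte counters and the reduce-phase progress.
   */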
  private class ReduceValuesIterator<KEY,VALUE>
          extends ValuesIterator<KEY,VALUE> {
    public ReduceValuesIterator (RawKeyValueIterator in,
                                 RawComparator<KEY> comparator,
                                 Class<KEY> keyClass,
                                 Class<VALUE> valClass,
                                 Configuration conf, Progressable reporter)
      throws IOException {
      super(in, comparator, keyClass, valClass, conf, reporter);
    }

    @Override
    public VALUE next() {
      reduceInputValueCounter.increment(1);
      long startBytesProcessed = in.getTotalBytesProcessed();
      VALUE v = moveToNext();
      long endBytesProcessed = in.getTotalBytesProcessed();
      reduceInputBytesCounter.increment(endBytesProcessed - startBytesProcessed);
      return v;
    }

    protected VALUE moveToNext() {
      return super.next();
    }

    public void informReduceProgress() {
      reducePhase.set(super.in.getProgress().get()); // update progress
      reporter.progress();
    }
  }

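  /**
   * A ReduceValuesIterator that honours the attempt's skip ranges: key groups
   * that fall inside a skip range are consumed (and optionally written to the
   * skip output) instead of being handed to the reducer.
   */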
  private class SkippingReduceValuesIterator<KEY,VALUE>
     extends ReduceValuesIterator<KEY,VALUE> {
     private SkipRangeIterator skipIt;
     private TaskUmbilicalProtocol umbilical;
     private Counters.Counter skipGroupCounter;
     private Counters.Counter skipRecCounter;
     private long grpIndex = -1;
     private Class<KEY> keyClass;
     private Class<VALUE> valClass;
     private SequenceFile.Writer skipWriter;
     private boolean toWriteSkipRecs;
     private boolean hasNext;
     private TaskReporter reporter;

     public SkippingReduceValuesIterator(RawKeyValueIterator in,
         RawComparator<KEY> comparator, Class<KEY> keyClass,
         Class<VALUE> valClass, Configuration conf, TaskReporter reporter,
         TaskUmbilicalProtocol umbilical) throws IOException {
       super(in, comparator, keyClass, valClass, conf, reporter);
       this.umbilical = umbilical;
       this.skipGroupCounter =
         reporter.getCounter(Counter.REDUCE_SKIPPED_GROUPS);
       this.skipRecCounter =
         reporter.getCounter(Counter.REDUCE_SKIPPED_RECORDS);
       this.toWriteSkipRecs = toWriteSkipRecs() &&
         SkipBadRecords.getSkipOutputPath(conf)!=null;
       this.keyClass = keyClass;
       this.valClass = valClass;
       this.reporter = reporter;
       skipIt = getSkipRanges().skipRangeIterator();
       mayBeSkip();
     }

     void nextKey() throws IOException {
       super.nextKey();
       mayBeSkip();
     }

     boolean more() {
       return super.more() && hasNext;
     }

     private void mayBeSkip() throws IOException {
       hasNext = skipIt.hasNext();
       if(!hasNext) {
         LOG.warn("Further groups got skipped.");
         return;
       }
       grpIndex++;
       long nextGrpIndex = skipIt.next();
       long skip = 0;
       long skipRec = 0;
       while(grpIndex<nextGrpIndex && super.more()) {
         while (hasNext()) {
           VALUE value = moveToNext();
           if(toWriteSkipRecs) {
             writeSkippedRec(getKey(), value);
           }
           skipRec++;
         }
         super.nextKey();
         grpIndex++;
         skip++;
       }

       //close the skip writer once all the ranges are skipped
       if(skip>0 && skipIt.skippedAllRanges() && skipWriter!=null) {
         skipWriter.close();
       }
       skipGroupCounter.increment(skip);
       skipRecCounter.increment(skipRec);
       reportNextRecordRange(umbilical, grpIndex);
     }

     @SuppressWarnings("unchecked")
     private void writeSkippedRec(KEY key, VALUE value) throws IOException{
       if(skipWriter==null) {
         Path skipDir = SkipBadRecords.getSkipOutputPath(conf);
         Path skipFile = new Path(skipDir, getTaskID().toString());
         skipWriter = SequenceFile.createWriter(
               skipFile.getFileSystem(conf), conf, skipFile,
               keyClass, valClass,
               CompressionType.BLOCK, reporter);
       }
       skipWriter.append(key, value);
     }
  }

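  /** Runs the reduce task: shuffle (copy), sort/merge, then reduce. */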
  @Override
  @SuppressWarnings("unchecked")
  public void run(JobConf job, final TaskUmbilicalProtocol umbilical)
    throws IOException, InterruptedException, ClassNotFoundException {
    this.umbilical = umbilical;
    job.setBoolean("mapred.skip.on", isSkipping());
    taskStartTime = System.currentTimeMillis();

    if (isMapOrReduce()) {
      copyPhase = getProgress().addPhase("copy");
      sortPhase  = getProgress().addPhase("sort");
      reducePhase = getProgress().addPhase("reduce");
    }
    // start thread that will handle communication with parent
    TaskReporter reporter = new TaskReporter(getProgress(), umbilical);
    reporter.startCommunicationThread();
    boolean useNewApi = job.getUseNewReducer();
    initialize(job, getJobID(), reporter, useNewApi);

    // check if it is a cleanupJobTask
    if (jobCleanup) {
      runJobCleanupTask(umbilical, reporter);
      return;
    }
    if (jobSetup) {
      runJobSetupTask(umbilical, reporter);
      return;
    }
    if (taskCleanup) {
      runTaskCleanupTask(umbilical, reporter);
      return;
    }

    // Initialize the codec
    codec = initCodec();

    boolean isLocal = "local".equals(job.get("mapred.job.tracker", "local"));
    long reduceCopyStartMilli = System.currentTimeMillis();
    ProcResourceValues copyStartProcVals = getCurrentProcResourceValues();
    if (!isLocal) {
      reduceCopier = new ReduceCopier(umbilical, job, reporter);
      if (!reduceCopier.fetchOutputs()) {
        if(reduceCopier.mergeThrowable instanceof FSError) {
          throw (FSError)reduceCopier.mergeThrowable;
        }
        throw new IOException("Task: " + getTaskID() +
            " - The reduce copier failed", reduceCopier.mergeThrowable);
      }
    }
    long reducerCopyEndMilli = System.currentTimeMillis();
    ProcResourceValues copyEndProcVals = getCurrentProcResourceValues();

    copyPhase.complete();                         // copy is already complete
    setPhase(TaskStatus.Phase.SORT);
    statusUpdate(umbilical);

    final FileSystem rfs = FileSystem.getLocal(job).getRaw();
    RawKeyValueIterator rIter = isLocal
      ? Merger.merge(job, rfs, job.getMapOutputKeyClass(),
          job.getMapOutputValueClass(), codec, getMapFiles(rfs, true),
          !conf.getKeepFailedTaskFiles(), job.getInt("io.sort.factor", 100),
          new Path(getTaskID().toString()), job.getOutputKeyComparator(),
          reporter, spilledRecordsCounter, null)
      : reduceCopier.createKVIterator(job, rfs, reporter);

    // free up the data structures
    mapOutputFilesOnDisk.clear();

    long sortEndMilli = System.currentTimeMillis();
    ProcResourceValues sortEndProcVals = getCurrentProcResourceValues();

    sortPhase.complete();                         // sort is complete
    setPhase(TaskStatus.Phase.REDUCE);
    statusUpdate(umbilical);
    Class keyClass = job.getMapOutputKeyClass();
    Class valueClass = job.getMapOutputValueClass();
    RawComparator comparator = job.getOutputValueGroupingComparator();

    if (useNewApi) {
      runNewReducer(job, umbilical, reporter, rIter, comparator,
                    keyClass, valueClass);
    } else {
      runOldReducer(job, umbilical, reporter, rIter, comparator,
                    keyClass, valueClass);
    }

    taskEndTime = System.currentTimeMillis();

    setWallClockCounter(reducerCopyEndMilli - reduceCopyStartMilli, reporter
        .getCounter(Counter.REDUCE_COPY_WALLCLOCK));
    setCPUCounter(copyStartProcVals, copyEndProcVals, reporter
        .getCounter(Counter.REDUCE_COPY_CPU));
    setWallClockCounter(sortEndMilli - reducerCopyEndMilli, reporter
        .getCounter(Counter.REDUCE_SORT_WALLCLOCK));
    setCPUCounter(copyEndProcVals, sortEndProcVals, reporter
        .getCounter(Counter.REDUCE_SORT_CPU));
    Counters.Counter taskWallClock = reporter.getCounter(Counter.REDUCE_TASK_WALLCLOCK);
    taskWallClock.setValue(taskEndTime - taskStartTime);
    done(umbilical, reporter);
  }

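  /**
   * Sets the given counter to the CPU time consumed between the two process
   * resource snapshots, or to zero if either snapshot is unavailable.
   */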
  private void setCPUCounter(ProcResourceValues startProcVals,
      ProcResourceValues endProcVals,
      org.apache.hadoop.mapred.Counters.Counter counter) {
    long cpuUsed = 0;
    if (startProcVals != null &&  endProcVals != null) {
      long cpuStartVal = startProcVals.getCumulativeCpuTime();
      long cpuEndVal = endProcVals.getCumulativeCpuTime();
      if (cpuEndVal > cpuStartVal) {
        cpuUsed = cpuEndVal - cpuStartVal;
      }
    }
    counter.setValue(cpuUsed);
  }

  private void setWallClockCounter(long wallClock,
      org.apache.hadoop.mapred.Counters.Counter counter) {
    counter.setValue(wallClock);
  }

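  /**
   * Runs the reducer using the old (mapred) API: builds an OutputCollector
   * over the job's OutputFormat and feeds the reducer one
   * ReduceValuesIterator per key group.
   */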
  @SuppressWarnings("unchecked")
  private <INKEY,INVALUE,OUTKEY,OUTVALUE>
  void runOldReducer(JobConf job,
                     TaskUmbilicalProtocol umbilical,
                     final TaskReporter reporter,
                     RawKeyValueIterator rIter,
                     RawComparator<INKEY> comparator,
                     Class<INKEY> keyClass,
                     Class<INVALUE> valueClass) throws IOException {
    Reducer<INKEY,INVALUE,OUTKEY,OUTVALUE> reducer =
      ReflectionUtils.newInstance(job.getReducerClass(), job);
    // make output collector
    String finalName = getOutputName(getPartition());

    FileSystem fs = FileSystem.get(job);

    final RecordWriter<OUTKEY,OUTVALUE> out =
      job.getOutputFormat().getRecordWriter(fs, job, finalName, reporter);

    OutputCollector<OUTKEY,OUTVALUE> collector =
      new OutputCollector<OUTKEY,OUTVALUE>() {
        public void collect(OUTKEY key, OUTVALUE value)
          throws IOException {
          out.write(key, value);
          reduceOutputCounter.increment(1);
          // indicate that progress update needs to be sent
          reporter.progress();
        }
      };

    // apply reduce function
    try {
      //increment processed counter only if skipping feature is enabled
      boolean incrProcCount = SkipBadRecords.getReducerMaxSkipGroups(job)>0 &&
        SkipBadRecords.getAutoIncrReducerProcCount(job);

      ReduceValuesIterator<INKEY,INVALUE> values = isSkipping() ?
          new SkippingReduceValuesIterator<INKEY,INVALUE>(rIter,
              comparator, keyClass, valueClass,
              job, reporter, umbilical) :
          new ReduceValuesIterator<INKEY,INVALUE>(rIter,
          job.getOutputValueGroupingComparator(), keyClass, valueClass,
          job, reporter);
      values.informReduceProgress();
      INKEY lastKey = null;
      boolean checkOrder =
        job.getBoolean("mapred.reduce.input.order.verify", false);
      while (values.more()) {
        if (checkOrder && lastKey != null &&
            comparator.compare(lastKey, values.getKey()) > 0) {
          throw new IOException("Reducer keys are not fully sorted");
        }
        lastKey = values.getKey();
        reduceInputKeyCounter.increment(1);
        reducer.reduce(values.getKey(), values, collector, reporter);
        if(incrProcCount) {
          reporter.incrCounter(SkipBadRecords.COUNTER_GROUP,
              SkipBadRecords.COUNTER_REDUCE_PROCESSED_GROUPS, 1);
        }
        values.nextKey();
        values.informReduceProgress();
      }

      //Clean up: repeated in catch block below
      reducer.close();
      out.close(reporter);
      //End of clean up.
    } catch (IOException ioe) {
      try {
        reducer.close();
      } catch (IOException ignored) {}

      try {
        out.close(reporter);
      } catch (IOException ignored) {}

      throw ioe;
    }
  }

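  /**
   * Wraps the application's new-API RecordWriter so that every write also
   * increments the reduce output-record counter.
   */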
  static class NewTrackingRecordWriter<K,V>
      extends org.apache.hadoop.mapreduce.RecordWriter<K,V> {
    private final org.apache.hadoop.mapreduce.RecordWriter<K,V> real;
    private final org.apache.hadoop.mapreduce.Counter outputRecordCounter;

    NewTrackingRecordWriter(org.apache.hadoop.mapreduce.RecordWriter<K,V> real,
                            org.apache.hadoop.mapreduce.Counter recordCounter) {
      this.real = real;
      this.outputRecordCounter = recordCounter;
    }

    @Override
    public void close(TaskAttemptContext context) throws IOException,
    InterruptedException {
      real.close(context);
    }

    @Override
    public void write(K key, V value) throws IOException, InterruptedException {
      real.write(key,value);
      outputRecordCounter.increment(1);
    }
  }

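  /**
   * Runs the reducer using the new (mapreduce) API: wraps the raw iterator to
   * report progress and byte counts, then drives the Reducer through its
   * Context.
   */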
  @SuppressWarnings("unchecked")
  private <INKEY,INVALUE,OUTKEY,OUTVALUE>
  void runNewReducer(JobConf job,
                     final TaskUmbilicalProtocol umbilical,
                     final TaskReporter reporter,
                     RawKeyValueIterator rIter,
                     RawComparator<INKEY> comparator,
                     Class<INKEY> keyClass,
                     Class<INVALUE> valueClass
                     ) throws IOException,InterruptedException,
                              ClassNotFoundException {
    // wrap value iterator to report progress.
    final RawKeyValueIterator rawIter = rIter;
    rIter = new RawKeyValueIterator() {
      public void close() throws IOException {
        rawIter.close();
      }
      public DataInputBuffer getKey() throws IOException {
        return rawIter.getKey();
      }
      public Progress getProgress() {
        return rawIter.getProgress();
      }
      public DataInputBuffer getValue() throws IOException {
        return rawIter.getValue();
      }
      public boolean next() throws IOException {
        long startBytesProcessed = rawIter.getTotalBytesProcessed();
        boolean ret = rawIter.next();
        long endBytesProcessed = rawIter.getTotalBytesProcessed();
        reduceInputBytesCounter.increment(
            endBytesProcessed - startBytesProcessed);
        reducePhase.set(rawIter.getProgress().get());
        reporter.progress();
        return ret;
      }
      public long getTotalBytesProcessed() {
        return rawIter.getTotalBytesProcessed();
      }
    };
    // make a task context so we can get the classes
    org.apache.hadoop.mapreduce.TaskAttemptContext taskContext =
      new org.apache.hadoop.mapreduce.TaskAttemptContext(job, getTaskID());
    // make a reducer
    org.apache.hadoop.mapreduce.Reducer<INKEY,INVALUE,OUTKEY,OUTVALUE> reducer =
      (org.apache.hadoop.mapreduce.Reducer<INKEY,INVALUE,OUTKEY,OUTVALUE>)
        ReflectionUtils.newInstance(taskContext.getReducerClass(), job);
    org.apache.hadoop.mapreduce.RecordWriter<OUTKEY,OUTVALUE> output =
      (org.apache.hadoop.mapreduce.RecordWriter<OUTKEY,OUTVALUE>)
        outputFormat.getRecordWriter(taskContext);
     org.apache.hadoop.mapreduce.RecordWriter<OUTKEY,OUTVALUE> trackedRW =
       new NewTrackingRecordWriter<OUTKEY, OUTVALUE>(output, reduceOutputCounter);
    job.setBoolean("mapred.skip.on", isSkipping());
    org.apache.hadoop.mapreduce.Reducer.Context
         reducerContext = createReduceContext(reducer, job, getTaskID(),
                                               rIter, reduceInputKeyCounter,
                                               reduceInputValueCounter,
                                               trackedRW, committer,
                                               reporter, comparator, keyClass,
                                               valueClass);
    reducer.run(reducerContext);
    output.close(reducerContext);
  }

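  /** Classifies the outcome of a map-output copy attempt. */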
  private static enum CopyOutputErrorType {
    NO_ERROR,
    READ_ERROR,
    OTHER_ERROR
  };

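  /**
   * Drives the shuffle for this reduce task: schedules map-output fetches,
   * copies outputs into memory or onto local disk, merges them as they
   * accumulate, and finally supplies a merged key/value iterator to the
   * reduce phase.
   */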
  class ReduceCopier<K, V> implements MRConstants {

    /** Reference to the umbilical object */
    private TaskUmbilicalProtocol umbilical;
    private final TaskReporter reporter;

    /** Number of ms before timing out a copy */
    private static final int STALLED_COPY_TIMEOUT = 3 * 60 * 1000;

    /** Max events to fetch in one go from the tasktracker */
    private static final int MAX_EVENTS_TO_FETCH = 10000;

    /**
     * our reduce task instance
     */
    private ReduceTask reduceTask;

    /**
     * the list of map outputs currently being copied
     */
    private List<MapOutputLocation> scheduledCopies;

    /**
     *  the results of dispatched copy attempts
     */
    private List<CopyResult> copyResults;

    /**
     *  the number of outputs to copy in parallel
     */
    private int numCopiers;

    /**
     *  the maximum number of fetches we schedule in flight before pausing
     *  scheduling
     */
    private int maxInFlight;


    /**
     * busy hosts from which copies are being backed off
     * Map of host -> next contact time
     */
    private Map<String, Long> penaltyBox;

    /**
     * the set of unique hosts from which we are copying
     */
    private Set<String> uniqueHosts;

    /**
     * A reference to the RamManager for writing the map outputs to.
     */
    private ShuffleRamManager ramManager;

    /**
     * A reference to the local file system for writing the map outputs to.
     */
    private FileSystem localFileSys;

    private FileSystem rfs;
    /**
     * Number of files to merge at a time
     */
    private int ioSortFactor;

    /**
     * A reference to the throwable object (if merge throws an exception)
     */
    private volatile Throwable mergeThrowable;

    /**
     * A flag to indicate when to exit localFS merge
     */
    private volatile boolean exitLocalFSMerge = false;

    /**
     * A flag to indicate when to exit getMapEvents thread
     */
    private volatile boolean exitGetMapEvents = false;

    /**
     * When we accumulate maxInMemOutputs number of files in ram, we merge/spill
     */
    private final int maxInMemOutputs;

    /**
     * Usage threshold for in-memory output accumulation.
     */
    private final float maxInMemCopyPer;

    /**
     * Maximum memory usage of map outputs to merge from memory into
     * the reduce, in bytes.
     */
    private final long maxInMemReduce;

    /**
     * The threads for fetching the files.
     */
    private List<MapOutputCopier> copiers = null;

    /**
     * The object for metrics reporting.
     */
    private ShuffleClientMetrics shuffleClientMetrics = null;

    /**
     * the minimum interval between tasktracker polls
     */
    private static final long MIN_POLL_INTERVAL = 1000;

    /**
     * a list of map output locations for fetch retries
     */
    private List<MapOutputLocation> retryFetches =
      new ArrayList<MapOutputLocation>();

    /**
     * The set of map outputs that have already been copied
     */
    private Set <TaskID> copiedMapOutputs =
      Collections.synchronizedSet(new TreeSet<TaskID>());
    
    private AtomicInteger emptyMaps = new AtomicInteger(0);

    /**
     * The set of obsolete map taskids.
     */
    private Set <TaskAttemptID> obsoleteMapIds =
      Collections.synchronizedSet(new TreeSet<TaskAttemptID>());

    private Random random = null;

    /**
     * the max of all the map completion times
     */
    private int maxMapRuntime;

    /**
     * Maximum number of fetch retries per map before reporting the failure.
     */
    private int maxFetchFailuresBeforeReporting;

    /**
     * Maximum number of fetch failures before reducer aborts.
     */
    private final int abortFailureLimit;

    /**
     * Initial penalty time in ms for a fetch failure.
     */
    private static final long INITIAL_PENALTY = 10000;

    /**
     * Penalty growth rate for each fetch failure.
     */
    private static final float PENALTY_GROWTH_RATE = 1.3f;

    /**
     * Default limit for maximum number of fetch failures before reporting.
     */
    private final static int REPORT_FAILURE_LIMIT = 10;

    /**
     * Combiner runner, if a combiner is needed
     */
    private CombinerRunner combinerRunner;

    /**
     * Resettable collector used for combine.
     */
    private CombineOutputCollector combineCollector = null;

    /**
     * Maximum percent of failed fetch attempts before killing the reduce task.
     */
    private static final float MAX_ALLOWED_FAILED_FETCH_ATTEMPT_PERCENT = 0.5f;

    /**
     * Minimum percent of progress required to keep the reduce alive.
     */
    private static final float MIN_REQUIRED_PROGRESS_PERCENT = 0.5f;

    /**
     * Maximum percent of shuffle execution time the reducer may spend
     * stalled before it is considered to have failed.
     */
    private static final float MAX_ALLOWED_STALL_TIME_PERCENT = 0.5f;

    /**
     * Minimum number of map fetch retries.
     */
    private static final int MIN_FETCH_RETRIES_PER_MAP = 2;

    /**
     * The minimum percentage of maps yet to be copied,
     * which indicates end of shuffle
     */
    private static final float MIN_PENDING_MAPS_PERCENT = 0.25f;
    /**
     * Maximum no. of unique maps from which we failed to fetch map-outputs
     * even after {@link #maxFetchRetriesPerMap} retries; after this the
     * reduce task is failed.
     */
    private int maxFailedUniqueFetches = 5;

    /**
     * The maps from which we fail to fetch map-outputs
     * even after {@link #maxFetchRetriesPerMap} retries.
     */
    Set<TaskID> fetchFailedMaps = new TreeSet<TaskID>();

    /**
     * A map of taskId -> no. of failed fetches
     */
    Map<TaskAttemptID, Integer> mapTaskToFailedFetchesMap =
      new HashMap<TaskAttemptID, Integer>();

    /**
     * Initial backoff interval (milliseconds)
     */
    private static final int BACKOFF_INIT = 4000;

    /**
     * The interval for logging in the shuffle
     */
    private static final int MIN_LOG_TIME = 60000;

    /**
     * List of in-memory map-outputs.
     */
    private final List<MapOutput> mapOutputsFilesInMemory =
      Collections.synchronizedList(new LinkedList<MapOutput>());

    /**
     * Map from host to the list of map-output locations available on that
     * host
     */
    private final Map<String, List<MapOutputLocation>> mapLocations =
      new ConcurrentHashMap<String, List<MapOutputLocation>>();
    
    /**
     * Get the number of maps whose outputs have either been copied or
     * ignored because they were empty
     */
    private int getNumMapsCopyCompleted() {
      return copiedMapOutputs.size() + emptyMaps.get();
    }

    /**
     * This class reports the shuffle-specific metrics on behalf of the
     * shuffle client (the ReduceTask), hence the name ShuffleClientMetrics.
     */
    class ShuffleClientMetrics implements Updater {
      private MetricsRecord shuffleMetrics = null;
      private int numFailedFetches = 0;
      private int numSuccessFetches = 0;
      private long numBytes = 0;
      private int numThreadsBusy = 0;
      ShuffleClientMetrics(JobConf conf) {
        MetricsContext metricsContext = MetricsUtil.getContext("mapred");
        this.shuffleMetrics =
          MetricsUtil.createRecord(metricsContext, "shuffleInput");
        this.shuffleMetrics.setTag("user", conf.getUser());
        this.shuffleMetrics.setTag("jobName", conf.getJobName());
        this.shuffleMetrics.setTag("jobId", ReduceTask.this.getJobID().toString());
        this.shuffleMetrics.setTag("taskId", getTaskID().toString());
        this.shuffleMetrics.setTag("sessionId", conf.getSessionId());
        metricsContext.registerUpdater(this);
      }
      public synchronized void inputBytes(long numBytes) {
        this.numBytes += numBytes;
      }
      public synchronized void failedFetch() {
        ++numFailedFetches;
      }
      public synchronized void successFetch() {
        ++numSuccessFetches;
      }
      public synchronized void threadBusy() {
        ++numThreadsBusy;
      }
      public synchronized void threadFree() {
        --numThreadsBusy;
      }
      public void doUpdates(MetricsContext unused) {
        synchronized (this) {
          shuffleMetrics.incrMetric("shuffle_input_bytes", numBytes);
          shuffleMetrics.incrMetric("shuffle_failed_fetches",
                                    numFailedFetches);
          shuffleMetrics.incrMetric("shuffle_success_fetches",
                                    numSuccessFetches);
          if (numCopiers != 0) {
            shuffleMetrics.setMetric("shuffle_fetchers_busy_percent",
                100*((float)numThreadsBusy/numCopiers));
          } else {
            shuffleMetrics.setMetric("shuffle_fetchers_busy_percent", 0);
          }
          numBytes = 0;
          numSuccessFetches = 0;
          numFailedFetches = 0;
        }
        shuffleMetrics.update();
      }
    }

    /** Represents the result of an attempt to copy a map output */
    private class CopyResult {

      // the map output location against which a copy attempt was made
      private final MapOutputLocation loc;

      // the size of the file copied, -1 if the transfer failed
      private final long size;

      //a flag signifying whether a copy result is obsolete
      private static final int OBSOLETE = -2;

      private CopyOutputErrorType error = CopyOutputErrorType.NO_ERROR;
      CopyResult(MapOutputLocation loc, long size) {
        this.loc = loc;
        this.size = size;
      }

      CopyResult(MapOutputLocation loc, long size, CopyOutputErrorType error) {
        this.loc = loc;
        this.size = size;
        this.error = error;
      }

      public boolean getSuccess() { return size >= 0; }
      public boolean isObsolete() {
        return size == OBSOLETE;
      }
      public long getSize() { return size; }
      public String getHost() { return loc.getHost(); }
      public MapOutputLocation getLocation() { return loc; }
      public CopyOutputErrorType getError() { return error; }
    }

    private int nextMapOutputCopierId = 0;
    private boolean reportReadErrorImmediately;

    /**
     * Abstraction to track a map-output.
     */
    private class MapOutputLocation {
      TaskAttemptID taskAttemptId;
      TaskID taskId;
      String ttHost;
      URL taskOutput;

      public MapOutputLocation(TaskAttemptID taskAttemptId,
                               String ttHost, URL taskOutput) {
        this.taskAttemptId = taskAttemptId;
        this.taskId = this.taskAttemptId.getTaskID();
        this.ttHost = ttHost;
        this.taskOutput = taskOutput;
      }

      public TaskAttemptID getTaskAttemptId() {
        return taskAttemptId;
      }

      public TaskID getTaskId() {
        return taskId;
      }

      public String getHost() {
        return ttHost;
      }

      public URL getOutputLocation() {
        return taskOutput;
      }
    }

    /** Describes the output of a map; could either be on disk or in-memory. */
    private class MapOutput {
      final TaskID mapId;
      final TaskAttemptID mapAttemptId;

      final Path file;
      final Configuration conf;

      byte[] data;
      final boolean inMemory;
      long compressedSize;

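      /** Constructs an on-disk map output backed by the given local file. */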
      public MapOutput(TaskID mapId, TaskAttemptID mapAttemptId,
                       Configuration conf, Path file, long size) {
        this.mapId = mapId;
        this.mapAttemptId = mapAttemptId;

        this.conf = conf;
        this.file = file;
        this.compressedSize = size;

        this.data = null;

        this.inMemory = false;
      }

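      /** Constructs an in-memory map output backed by the given byte array. */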
      public MapOutput(TaskID mapId, TaskAttemptID mapAttemptId, byte[] data, int compressedLength) {
        this.mapId = mapId;
        this.mapAttemptId = mapAttemptId;

        this.file = null;
        this.conf = null;

        this.data = data;
        this.compressedSize = compressedLength;

        this.inMemory = true;
      }

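      /** Releases this output: drops the in-memory buffer or deletes the on-disk file. */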
      public void discard() throws IOException {
        if (inMemory) {
          data = null;
        } else {
          FileSystem fs = file.getFileSystem(conf);
          fs.delete(file, true);
        }
      }
    }

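    /**
     * Tracks the memory budget available for holding map outputs in memory
     * and decides when enough data has accumulated to trigger an in-memory
     * merge.
     */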
    class ShuffleRamManager implements RamManager {
      /* Maximum percentage of the in-memory limit that a single shuffle can
       * consume */
      private static final float MAX_SINGLE_SHUFFLE_SEGMENT_FRACTION = 0.25f;

      /* Maximum percentage of shuffle-threads which can be stalled
       * simultaneously after which a merge is triggered. */
      private static final float MAX_STALLED_SHUFFLE_THREADS_FRACTION = 0.75f;

      private final long maxSize;
      private final long maxSingleShuffleLimit;

      private long size = 0;

      private Object dataAvailable = new Object();
      private long fullSize = 0;
      private int numPendingRequests = 0;
      private int numRequiredMapOutputs = 0;
      private int numClosed = 0;
      private boolean closed = false;

      public ShuffleRamManager(Configuration conf) throws IOException {
        final float maxInMemCopyUse =
          conf.getFloat("mapred.job.shuffle.input.buffer.percent", 0.70f);
        if (maxInMemCopyUse > 1.0 || maxInMemCopyUse < 0.0) {
          throw new IOException("Invalid mapred.job.shuffle.input.buffer.percent: " +
                                maxInMemCopyUse);
        }
        maxSize = (long)Math.min(
            Runtime.getRuntime().maxMemory() * maxInMemCopyUse,
            Integer.MAX_VALUE);
        maxSingleShuffleLimit = (long)(maxSize * MAX_SINGLE_SHUFFLE_SEGMENT_FRACTION);
        LOG.info("ShuffleRamManager: MemoryLimit=" + maxSize +
                 ", MaxSingleShuffleLimit=" + maxSingleShuffleLimit);
      }

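      /**
       * Reserves requestedSize bytes of shuffle memory, blocking until the
       * request fits under the limit. While waiting, the supplied input
       * stream is closed; the return value tells the caller whether the
       * original stream is still usable (true) or a reconnect is needed
       * (false).
       */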
      public synchronized boolean reserve(int requestedSize, InputStream in)
      throws InterruptedException {
        // Wait till the request can be fulfilled...
        while ((size + requestedSize) > maxSize) {

          // Close the input...
          if (in != null) {
            try {
              in.close();
            } catch (IOException ie) {
              LOG.info("Failed to close connection with: " + ie);
            } finally {
              in = null;
            }
          }

          // Track pending requests
          synchronized (dataAvailable) {
            ++numPendingRequests;
            dataAvailable.notify();
          }

          // Wait for memory to free up
          wait();

          // Track pending requests
          synchronized (dataAvailable) {
            --numPendingRequests;
          }
        }

        size += requestedSize;

        return (in != null);
      }

      public synchronized void unreserve(int requestedSize) {
        size -= requestedSize;

        synchronized (dataAvailable) {
          fullSize -= requestedSize;
          --numClosed;
        }

        // Notify the threads blocked on RamManager.reserve
        notifyAll();
      }

      public boolean waitForDataToMerge() throws InterruptedException {
        boolean done = false;
        synchronized (dataAvailable) {
                 // Start in-memory merge if manager has been closed or...
          while (!closed
                 &&
                 // In-memory threshold exceeded and at least two segments
                 // have been fetched
                 (getPercentUsed() < maxInMemCopyPer || numClosed < 2)
                 &&
                 // More than "mapred.inmem.merge.threshold" map outputs
                 // have been fetched into memory
                 (maxInMemOutputs <= 0 || numClosed < maxInMemOutputs)
                 &&
                 // More than MAX... threads are blocked on the RamManager
                 // or the blocked threads are the last map outputs to be
                 // fetched. If numRequiredMapOutputs is zero, either
                 // setNumCopiedMapOutputs has not been called (no map outputs
                 // have been fetched, so there is nothing to merge) or the
                 // last map outputs are being transferred without
                 // contention, so a merge would be premature.
                 (numPendingRequests <
                      numCopiers*MAX_STALLED_SHUFFLE_THREADS_FRACTION &&
                  (0 == numRequiredMapOutputs ||
                   numPendingRequests < numRequiredMapOutputs))) {
            dataAvailable.wait();
          }
          done = closed;
        }
        return done;
      }

      public void closeInMemoryFile(int requestedSize) {
        synchronized (dataAvailable) {
          fullSize += requestedSize;
          ++numClosed;
          dataAvailable.notify();
        }
      }

      public void setNumCopiedMapOutputs(int numRequiredMapOutputs) {
        synchronized (dataAvailable) {
          this.numRequiredMapOutputs = numRequiredMapOutputs;
          dataAvailable.notify();
        }
      }

      public void close() {
        synchronized (dataAvailable) {
          closed = true;
          LOG.info("Closed ram manager");
          dataAvailable.notify();
        }
      }

      private float getPercentUsed() {
        return (float)fullSize/maxSize;
      }

      boolean canFitInMemory(long requestedSize) {
        return (requestedSize < Integer.MAX_VALUE &&
                requestedSize < maxSingleShuffleLimit);
      }
    }

    /** Copies map outputs as they become available */
    private class MapOutputCopier extends Thread {
      // basic/unit connection timeout (in milliseconds)
      private final static int UNIT_CONNECT_TIMEOUT = 30 * 1000;
      private final static int UNIT_DNS_RETRY_WAIT = 1000;
      // default read timeout (in milliseconds)
      private final static int DEFAULT_READ_TIMEOUT = 3 * 60 * 1000;
      private final int shuffleConnectionTimeout;
      private final int shuffleReadTimeout;

      private MapOutputLocation currentLocation = null;
      private int id = nextMapOutputCopierId++;
      private Reporter reporter;
      private boolean readError = false;

      // Decompression of map-outputs
      private CompressionCodec codec = null;
      private Decompressor decompressor = null;
      private volatile boolean shutdown = false;

      public MapOutputCopier(JobConf job, Reporter reporter) {
        setName("MapOutputCopier " + reduceTask.getTaskID() + "." + id);
        LOG.debug(getName() + " created");
        this.reporter = reporter;

        shuffleConnectionTimeout =
          job.getInt("mapreduce.reduce.shuffle.connect.timeout", STALLED_COPY_TIMEOUT);
        shuffleReadTimeout =
          job.getInt("mapreduce.reduce.shuffle.read.timeout", DEFAULT_READ_TIMEOUT);

        if (job.getCompressMapOutput()) {
          Class<? extends CompressionCodec> codecClass =
            job.getMapOutputCompressorClass(DefaultCodec.class);
          codec = ReflectionUtils.newInstance(codecClass, job);
          decompressor = CodecPool.getDecompressor(codec);
        }
        setDaemon(true);
      }

      public void stopCopier() {
        shutdown = true;
        this.interrupt();
      }


      /**
       * Fail the current file that we are fetching
       * @return were we currently fetching?
       */
      public synchronized boolean fail() {
        if (currentLocation != null) {
          finish(-1, CopyOutputErrorType.OTHER_ERROR);
          return true;
        } else {
          return false;
        }
      }

      /**
       * Get the current map output location.
       */
      public synchronized MapOutputLocation getLocation() {
        return currentLocation;
      }

      private synchronized void start(MapOutputLocation loc) {
        currentLocation = loc;
      }

      private synchronized void finish(long size, CopyOutputErrorType error) {
        if (currentLocation != null) {
          LOG.debug(getName() + " finishing " + currentLocation + " =" + size);
          synchronized (copyResults) {
            copyResults.add(new CopyResult(currentLocation, size, error));
            copyResults.notify();
          }
          currentLocation = null;
        }
      }

      /** Loop forever and fetch map outputs as they become available.
       * The thread exits once it has been shut down via {@link #stopCopier()}.
       */
      @Override
      public void run() {
        while (!shutdown) {
          try {
            MapOutputLocation loc = null;
            long size = -1;

            synchronized (scheduledCopies) {
              while (scheduledCopies.isEmpty()) {
                scheduledCopies.wait();
              }
              loc = scheduledCopies.remove(0);
            }
            CopyOutputErrorType error = CopyOutputErrorType.OTHER_ERROR;
            readError = false;
            try {
              shuffleClientMetrics.threadBusy();
              start(loc);
              size = copyOutput(loc);
              shuffleClientMetrics.successFetch();
              error = CopyOutputErrorType.NO_ERROR;
            } catch (IOException e) {
              LOG.warn(reduceTask.getTaskID() + " copy failed: " +
                       loc.getTaskAttemptId() + " from " + loc.getHost(), e);
              shuffleClientMetrics.failedFetch();
              if (readError) {
                error = CopyOutputErrorType.READ_ERROR;
              }
              // Reset
              size = -1;
            } finally {
              shuffleClientMetrics.threadFree();
              finish(size, error);
            }
          } catch (InterruptedException e) {
            if (shutdown)
              break; // ALL DONE
          } catch (FSError e) {
            LOG.error("Task: " + reduceTask.getTaskID() + " - FSError: " +
                      StringUtils.stringifyException(e));
            try {
              umbilical.fsError(reduceTask.getTaskID(), e.getMessage());
            } catch (IOException io) {
              LOG.error("Could not notify TT of FSError: " +
                      StringUtils.stringifyException(io));
            }
          } catch (Throwable th) {
            String msg = getTaskID() + " : Map output copy failure : "
                         + StringUtils.stringifyException(th);
            reportFatalError(getTaskID(), th, msg);
          }
        }

        if (decompressor != null) {
          CodecPool.returnDecompressor(decompressor);
        }

      }

      /** Copies a map output from a remote host, via HTTP.
       * @param loc the map output location to be copied
       * @return the number of bytes copied, or CopyResult.OBSOLETE if the
       *         output is no longer needed
       * @throws IOException if there is an error copying the file
       * @throws InterruptedException if the copier should give up
       */
      private long copyOutput(MapOutputLocation loc
                              ) throws IOException, InterruptedException {
        // check if we still need to copy the output from this location
        if (copiedMapOutputs.contains(loc.getTaskId()) ||
            obsoleteMapIds.contains(loc.getTaskAttemptId())) {
          return CopyResult.OBSOLETE;
        }

        // a temp filename. If this file gets created in ramfs, we're fine;
        // otherwise, we will check the localFS to find a suitable final
        // location for this path
        TaskAttemptID reduceId = reduceTask.getTaskID();
        Path filename = new Path("/" + TaskTracker.getIntermediateOutputDir(
                                 reduceId.getJobID().toString(),
                                 reduceId.toString())
                                 + "/map_" +
                                 loc.getTaskId().getId() + ".out");

        // Copy the map output to a temp file whose name is unique to this attempt
        Path tmpMapOutput = new Path(filename+"-"+id);

        // Copy the map output
        MapOutput mapOutput = getMapOutput(loc, tmpMapOutput,
                                           reduceId.getTaskID().getId());
        if (mapOutput == null) {
          throw new IOException("Failed to fetch map-output for " +
                                loc.getTaskAttemptId() + " from " +
                                loc.getHost());
        }

        // The size of the map-output
        long bytes = mapOutput.compressedSize;

        // lock the ReduceTask while we do the rename
        synchronized (ReduceTask.this) {
          if (copiedMapOutputs.contains(loc.getTaskId())) {
            mapOutput.discard();
            return CopyResult.OBSOLETE;
          }

          // Special case: discard empty map-outputs
          if (bytes == 0) {
            try {
              mapOutput.discard();
            } catch (IOException ioe) {
              LOG.info("Couldn't discard output of " + loc.getTaskId());
            }

            // Note that we successfully copied the map-output
            noteCopiedMapOutput(loc.getTaskId());

            return bytes;
          }

          // Process map-output
          if (mapOutput.inMemory) {
            // Save it in the synchronized list of map-outputs
            mapOutputsFilesInMemory.add(mapOutput);
          } else {
            // Rename the temporary file to the final file;
            // ensure it is on the same partition
            tmpMapOutput = mapOutput.file;
            filename = new Path(tmpMapOutput.getParent(), filename.getName());
            if (!localFileSys.rename(tmpMapOutput, filename)) {
              localFileSys.delete(tmpMapOutput, true);
              bytes = -1;
              throw new IOException("Failed to rename map output " +
                  tmpMapOutput + " to " + filename);
            }

            synchronized (mapOutputFilesOnDisk) {
              addToMapOutputFilesOnDisk(localFileSys.getFileStatus(filename));
            }
          }

          // Note that we successfully copied the map-output
          noteCopiedMapOutput(loc.getTaskId());
        }

        return bytes;
      }

      /**
       * Save the map taskid whose output we just copied.
       * This method assumes that the caller is synchronized on ReduceTask.this.
       *
       * @param taskId map taskid
       */
      private void noteCopiedMapOutput(TaskID taskId) {
        copiedMapOutputs.add(taskId);
        ramManager.setNumCopiedMapOutputs(numMaps - getNumMapsCopyCompleted());
      }

      /**
       * Get the map output into a local file (either in memory or on the
       * local fs) from the remote server.
       * We use the file system so that we generate checksum files on the data.
       * @param mapOutputLoc map-output to be fetched
       * @param filename the filename to write the data into
       * @param reduce the id of this reduce task, used to validate the header
       * @return the fetched MapOutput (in memory or on disk), or null if the
       *         header from the remote server is invalid
       * @throws IOException when something goes wrong
       */
      private MapOutput getMapOutput(MapOutputLocation mapOutputLoc,
                                     Path filename, int reduce)
      throws IOException, InterruptedException {
        // Connect
        HttpURLConnection connection =
          (HttpURLConnection) mapOutputLoc.getOutputLocation().openConnection();

        InputStream input = getInputStream(connection, shuffleConnectionTimeout,
                                           shuffleReadTimeout);

        // Validate header from map output
        TaskAttemptID mapId = null;
        try {
          mapId =
            TaskAttemptID.forName(connection.getHeaderField(FROM_MAP_TASK));
        } catch (IllegalArgumentException ia) {
          LOG.warn("Invalid map id ", ia);
          return null;
        }
        TaskAttemptID expectedMapId = mapOutputLoc.getTaskAttemptId();
        if (!mapId.equals(expectedMapId)) {
          LOG.warn("data from wrong map:" + mapId +
              " arrived to reduce task " + reduce +
              ", where as expected map output should be from " + expectedMapId);
          return null;
        }

        long decompressedLength =
          Long.parseLong(connection.getHeaderField(RAW_MAP_OUTPUT_LENGTH));
        long compressedLength =
          Long.parseLong(connection.getHeaderField(MAP_OUTPUT_LENGTH));

        if (compressedLength < 0 || decompressedLength < 0) {
          LOG.warn(getName() + " invalid lengths in map output header: id: " +
              mapId + " compressed len: " + compressedLength +
              ", decompressed len: " + decompressedLength);
          return null;
        }
        int forReduce =
          Integer.parseInt(connection.getHeaderField(FOR_REDUCE_TASK));

        if (forReduce != reduce) {
          LOG.warn("data for the wrong reduce: " + forReduce +
              " with compressed len: " + compressedLength +
              ", decompressed len: " + decompressedLength +
              " arrived to reduce task " + reduce);
          return null;
        }
        LOG.info(connection.getURL() + " header: " + mapId +
                 ", compressed len: " + compressedLength +
                 ", decompressed len: " + decompressedLength);

        //We will put a file in memory if it meets certain criteria:
        //1. The size of the (decompressed) file should be less than 25% of
        //    the total inmem fs
        //2. There is space available in the inmem fs

        // Check if this map-output can be saved in-memory
        boolean shuffleInMemory = ramManager.canFitInMemory(decompressedLength);

        // Shuffle
        MapOutput mapOutput = null;
        if (shuffleInMemory) {
          LOG.info("Shuffling " + decompressedLength + " bytes (" +
              compressedLength + " raw bytes) " +
              "into RAM from " + mapOutputLoc.getTaskAttemptId());

          mapOutput = shuffleInMemory(mapOutputLoc, connection, input,
                                      (int)decompressedLength,
                                      (int)compressedLength);
        } else {
          LOG.info("Shuffling " + decompressedLength + " bytes (" +
              compressedLength + " raw bytes) " +
              "into Local-FS from " + mapOutputLoc.getTaskAttemptId());

          mapOutput = shuffleToDisk(mapOutputLoc, input, filename,
              compressedLength);
        }

        return mapOutput;
      }

      /**
       * The connection establishment is attempted multiple times and is given
       * up only on the last failure. Instead of connecting with a single
       * timeout of X, we connect multiple times with a smaller timeout x < X.
       */
      private InputStream getInputStream(URLConnection connection,
                                         int connectionTimeout,
                                         int readTimeout)
      throws IOException {
        int unit = 0;
        if (connectionTimeout < 0) {
          throw new IOException("Invalid timeout "
                                + "[timeout = " + connectionTimeout + " ms]");
        } else if (connectionTimeout > 0) {
          unit = (UNIT_CONNECT_TIMEOUT > connectionTimeout)
                 ? connectionTimeout
                 : UNIT_CONNECT_TIMEOUT;
        }
        // set the read timeout to the total timeout
        connection.setReadTimeout(readTimeout);
        // set the connect timeout to the unit-connect-timeout
        connection.setConnectTimeout(unit);
        while (true) {
          try {
            connection.connect();
            break;
          } catch (UnknownHostException uex) {
            // This means that the DNS lookup is failing. The hostname we are
            // using was received from the JT, so most probably the fault lies
            // with DNS. We should sleep and retry later.
            if (connectionTimeout == 0) {
              throw uex;
            }
            try {
              int sleepTime = UNIT_DNS_RETRY_WAIT > unit ?
                                unit : UNIT_DNS_RETRY_WAIT;
              connectionTimeout -= sleepTime;
              Thread.sleep(sleepTime);
            } catch (InterruptedException iex) {
              Thread.currentThread().interrupt();
            }
          } catch (IOException ioe) {
            // update the total remaining connect-timeout
            connectionTimeout -= unit;

            // throw an exception if we have waited for timeout amount of time
            // note that the updated value of the timeout is used here
            if (connectionTimeout == 0) {
              throw ioe;
            }

            // reset the connect timeout for the last try
            if (connectionTimeout < unit) {
              unit = connectionTimeout;
              // reset the connect time out for the final connect
              connection.setConnectTimeout(unit);
            }
          }
        }
        try {
          return connection.getInputStream();
        } catch (IOException ioe) {
          readError = true;
          throw ioe;
        }
      }

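      /**
       * Reads the map output into an in-memory buffer reserved from the
       * ShuffleRamManager, reconnecting first if the reservation had to wait
       * (and the original connection was closed).
       */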
      private MapOutput shuffleInMemory(MapOutputLocation mapOutputLoc,
                                        URLConnection connection,
                                        InputStream input,
                                        int mapOutputLength,
                                        int compressedLength)
      throws IOException, InterruptedException {
        // Reserve ram for the map-output
        boolean createdNow = ramManager.reserve(mapOutputLength, input);

        // Reconnect if we need to
        if (!createdNow) {
          // Reconnect
          try {
            connection = mapOutputLoc.getOutputLocation().openConnection();
            input = getInputStream(connection, shuffleConnectionTimeout,
                                   shuffleReadTimeout);
          } catch (IOException ioe) {
            LOG.info("Failed reopen connection to fetch map-output from " +
                     mapOutputLoc.getHost(), ioe);

            // Inform the ram-manager
            ramManager.closeInMemoryFile(mapOutputLength);
            ramManager.unreserve(mapOutputLength);

            throw ioe;
          }
        }

        IFileInputStream checksumIn =
          new IFileInputStream(input, compressedLength);

        input = checksumIn;

        // Are map-outputs compressed?
        if (codec != null) {
          decompressor.reset();
          input = codec.createInputStream(input, decompressor);
        }

        // Copy map-output into an in-memory buffer
        byte[] shuffleData = new byte[mapOutputLength];
        MapOutput mapOutput =
          new MapOutput(mapOutputLoc.getTaskId(),
                        mapOutputLoc.getTaskAttemptId(), shuffleData, compressedLength);

        int bytesRead = 0;
        try {
          int n = 0;
          try {
            n = input.read(shuffleData, 0, shuffleData.length);
          } catch (Throwable t) {
            // Catch and rethrow as IOE since the decompressor can throw
            // something other than IOException for corrupt map output
            throw new IOException(t);
          }
          while (n > 0) {
            bytesRead += n;
            shuffleClientMetrics.inputBytes(n);

            // indicate we're making progress
            reporter.progress();
            try {
              n = input.read(shuffleData, bytesRead,
                           (shuffleData.length-bytesRead));
            } catch (Throwable t) {
              throw new IOException(t);
            }
          }

          LOG.info("Read " + bytesRead + " bytes from map-output for " +
                   mapOutputLoc.getTaskAttemptId());

          input.close();
        } catch (IOException ioe) {
          LOG.info("Failed to shuffle from " + mapOutputLoc.getTaskAttemptId(),
                   ioe);

          // Inform the ram-manager
          ramManager.closeInMemoryFile(mapOutputLength);
          ramManager.unreserve(mapOutputLength);

          // Discard the map-output
          try {
            mapOutput.discard();
          } catch (IOException ignored) {
            LOG.info("Failed to discard map-output from " +
                     mapOutputLoc.getTaskAttemptId(), ignored);
          }
          mapOutput = null;

          // Close the streams
          IOUtils.cleanup(LOG, input);

          // Re-throw
          readError = true;
          throw ioe;
        }

        // Close the in-memory file
        ramManager.closeInMemoryFile(mapOutputLength);

        // Sanity check
        if (bytesRead != mapOutputLength) {
          // Inform the ram-manager
          ramManager.unreserve(mapOutputLength);

          // Discard the map-output
          try {
            mapOutput.discard();
          } catch (IOException ignored) {
            // IGNORED because we are cleaning up
            LOG.info("Failed to discard map-output from " +
                     mapOutputLoc.getTaskAttemptId(), ignored);
          }
          mapOutput = null;

          throw new IOException("Incomplete map output received for " +
                                mapOutputLoc.getTaskAttemptId() + " from " +
                                mapOutputLoc.getOutputLocation() + " (" +
                                bytesRead + " instead of " +
                                mapOutputLength + ")"
          );
        }

        // TODO: Remove this after a 'fix' for HADOOP-3647
        if (mapOutputLength > 0) {
          DataInputBuffer dib = new DataInputBuffer();
          dib.reset(shuffleData, 0, shuffleData.length);
          LOG.info("Rec #1 from " + mapOutputLoc.getTaskAttemptId() + " -> (" +
                   WritableUtils.readVInt(dib) + ", " +
                   WritableUtils.readVInt(dib) + ") from " +
                   mapOutputLoc.getHost());
        }

        return mapOutput;
      }

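      /**
       * Shuffle a map output straight to local disk: pick a local path via
       * the LocalDirAllocator, stream the data across in 64 KB chunks while
       * reporting progress, and verify that the number of bytes read matches
       * the expected map-output length before handing back the MapOutput.
       */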
      private MapOutput shuffleToDisk(MapOutputLocation mapOutputLoc,
                                      InputStream input,
                                      Path filename,
                                      long mapOutputLength)
      throws IOException {
        // Find out a suitable location for the output on local-filesystem
        Path localFilename =
          lDirAlloc.getLocalPathForWrite(filename.toUri().getPath(),
                                         mapOutputLength, conf);

        MapOutput mapOutput =
          new MapOutput(mapOutputLoc.getTaskId(), mapOutputLoc.getTaskAttemptId(),
                        conf, localFileSys.makeQualified(localFilename),
                        mapOutputLength);


        // Copy data to local-disk
        OutputStream output = null;
        long bytesRead = 0;
        try {
          output = rfs.create(localFilename);

          byte[] buf = new byte[64 * 1024];
          int n = -1;
          try {
            n = input.read(buf, 0, buf.length);
          } catch (IOException ioe) {
            readError = true;
            throw ioe;
          }
          while (n > 0) {
            bytesRead += n;
            shuffleClientMetrics.inputBytes(n);
            output.write(buf, 0, n);

            // indicate we're making progress
            reporter.progress();
            try {
              n = input.read(buf, 0, buf.length);
            } catch (IOException ioe) {
              readError = true;
              throw ioe;
            }
          }

          LOG.info("Read " + bytesRead + " bytes from map-output for " +
              mapOutputLoc.getTaskAttemptId());

          output.close();
          input.close();
        } catch (IOException ioe) {
          LOG.info("Failed to shuffle from " + mapOutputLoc.getTaskAttemptId(),
                   ioe);

          // Discard the map-output
          try {
            mapOutput.discard();
          } catch (IOException ignored) {
            LOG.info("Failed to discard map-output from " +
                mapOutputLoc.getTaskAttemptId(), ignored);
          }
          mapOutput = null;

          // Close the streams
          IOUtils.cleanup(LOG, input, output);

          // Re-throw
          throw ioe;
        }

        // Sanity check
        if (bytesRead != mapOutputLength) {
          try {
            mapOutput.discard();
          } catch (Exception ioe) {
            // IGNORED because we are cleaning up
            LOG.info("Failed to discard map-output from " +
                mapOutputLoc.getTaskAttemptId(), ioe);
          } catch (Throwable t) {
            String msg = getTaskID() + " : Failed in shuffle to disk :"
                         + StringUtils.stringifyException(t);
            reportFatalError(getTaskID(), t, msg);
          }
          mapOutput = null;

          throw new IOException("Incomplete map output received for " +
                                mapOutputLoc.getTaskAttemptId() + " from " +
                                mapOutputLoc.getOutputLocation() + " (" +
                                bytesRead + " instead of " +
                                mapOutputLength + ")"
          );
        }

        return mapOutput;

      }

    } // MapOutputCopier

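    /**
     * Build a classloader for the reduce that includes the job jar's lib/
     * and classes/ directories, the job cache directory itself, and the
     * task's work directory, with the current classloader as its parent.
     */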
    private void configureClasspath(JobConf conf)
      throws IOException {

      // get the task and the current classloader which will become the parent
      Task task = ReduceTask.this;
      ClassLoader parent = conf.getClassLoader();

      // get the work directory which holds the elements we are dynamically
      // adding to the classpath
      File workDir = new File(task.getJobFile()).getParentFile();
      ArrayList<URL> urllist = new ArrayList<URL>();

      // add the jars and directories to the classpath
      String jar = conf.getJar();
      if (jar != null) {
        File jobCacheDir = new File(new Path(jar).getParent().toString());

        File[] libs = new File(jobCacheDir, "lib").listFiles();
        if (libs != null) {
          for (int i = 0; i < libs.length; i++) {
            urllist.add(libs[i].toURL());
          }
        }
        urllist.add(new File(jobCacheDir, "classes").toURL());
        urllist.add(jobCacheDir.toURL());

      }
      urllist.add(workDir.toURL());

      // create a new classloader with the old classloader as its parent
      // then set that classloader as the one used by the current jobconf
      URL[] urls = urllist.toArray(new URL[urllist.size()]);
      URLClassLoader loader = new URLClassLoader(urls, parent);
      conf.setClassLoader(loader);
    }

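    /**
     * Set up the copier: wire up the classpath, shuffle metrics and
     * umbilical, read the shuffle/merge tuning knobs from the JobConf
     * (parallel copies, io.sort.factor, in-memory merge thresholds, fetch
     * failure limits), and create the ShuffleRamManager and bookkeeping
     * structures used while fetching map outputs.
     */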
    public ReduceCopier(TaskUmbilicalProtocol umbilical, JobConf conf,
                        TaskReporter reporter
                        )throws ClassNotFoundException, IOException {

      configureClasspath(conf);
      this.reporter = reporter;
      this.shuffleClientMetrics = new ShuffleClientMetrics(conf);
      this.umbilical = umbilical;
      this.reduceTask = ReduceTask.this;

      this.scheduledCopies = new ArrayList<MapOutputLocation>(100);
      this.copyResults = new ArrayList<CopyResult>(100);
      this.numCopiers = conf.getInt("mapred.reduce.parallel.copies", 5);
      this.maxInFlight = 4 * numCopiers;
      Counters.Counter combineInputCounter =
        reporter.getCounter(Task.Counter.COMBINE_INPUT_RECORDS);
      this.combinerRunner = CombinerRunner.create(conf, getTaskID(),
                                                  combineInputCounter,
                                                  reporter, null);
      if (combinerRunner != null) {
        combineCollector =
          new CombineOutputCollector(reduceCombineOutputCounter);
      }

      this.ioSortFactor = conf.getInt("io.sort.factor", 10);

      this.abortFailureLimit = Math.max(30, numMaps / 10);

      this.maxFetchFailuresBeforeReporting = conf.getInt(
          "mapreduce.reduce.shuffle.maxfetchfailures", REPORT_FAILURE_LIMIT);

      this.maxFailedUniqueFetches = Math.min(numMaps,
                                             this.maxFailedUniqueFetches);
      this.maxInMemOutputs = conf.getInt("mapred.inmem.merge.threshold", 1000);
      this.maxInMemCopyPer =
        conf.getFloat("mapred.job.shuffle.merge.percent", 0.66f);
      final float maxRedPer =
        conf.getFloat("mapred.job.reduce.input.buffer.percent", 0f);
      if (maxRedPer > 1.0 || maxRedPer < 0.0) {
        throw new IOException("mapred.job.reduce.input.buffer.percent" +
                              maxRedPer);
      }
      this.maxInMemReduce = (int)Math.min(
          Runtime.getRuntime().maxMemory() * maxRedPer, Integer.MAX_VALUE);

      // Setup the RamManager
      ramManager = new ShuffleRamManager(conf);

      localFileSys = FileSystem.getLocal(conf);

      rfs = ((LocalFileSystem)localFileSys).getRaw();

      // hosts -> next contact time
      this.penaltyBox = new LinkedHashMap<String, Long>();

      // hostnames
      this.uniqueHosts = new HashSet<String>();

      // Seed the random number generator with a reasonably globally unique seed
      long randomSeed = System.nanoTime() +
                        (long)Math.pow(this.reduceTask.getPartition(),
                                       (this.reduceTask.getPartition()%10)
                                      );
      this.random = new Random(randomSeed);
      this.maxMapRuntime = 0;
      this.reportReadErrorImmediately =
        conf.getBoolean("mapreduce.reduce.shuffle.notify.readerror", true);
    }

    private boolean busyEnough(int numInFlight) {
      return numInFlight > maxInFlight;
    }


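    /**
     * Drive the shuffle: start the copier, merger and map-event threads,
     * then loop scheduling fetches host by host (respecting the penalty box
     * and duplicate-host checks) and processing copy results until all map
     * outputs have been copied or a merge error occurs. Returns true only
     * if every map output was fetched and no merge failed.
     */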
    public boolean fetchOutputs() throws IOException {
      int totalFailures = 0;
      int numInFlight = 0, numCopied = 0;
      DecimalFormat  mbpsFormat = new DecimalFormat("0.00");
      final Progress copyPhase =
        reduceTask.getProgress().phase();
      LocalFSMerger localFSMergerThread = null;
      InMemFSMergeThread inMemFSMergeThread = null;
      GetMapEventsThread getMapEventsThread = null;

      for (int i = 0; i < numMaps; i++) {
        copyPhase.addPhase();       // add sub-phase per file
      }

      copiers = new ArrayList<MapOutputCopier>(numCopiers);

      // start all the copying threads
      for (int i=0; i < numCopiers; i++) {
        MapOutputCopier copier = new MapOutputCopier(conf, reporter);
        copiers.add(copier);
        copier.start();
      }

      //start the on-disk-merge thread
      localFSMergerThread = new LocalFSMerger((LocalFileSystem)localFileSys);
      //start the in memory merger thread
      inMemFSMergeThread = new InMemFSMergeThread();
      localFSMergerThread.start();
      inMemFSMergeThread.start();

      // start the map events thread
      getMapEventsThread = new GetMapEventsThread();
      getMapEventsThread.start();

      // start the clock for bandwidth measurement
      long startTime = System.currentTimeMillis();
      long currentTime = startTime;
      long lastProgressTime = startTime;
      long lastOutputTime = 0;

        // loop until we get all required outputs
        while (getNumMapsCopyCompleted() < numMaps && mergeThrowable == null) {

          currentTime = System.currentTimeMillis();
          boolean logNow = false;
          if (currentTime - lastOutputTime > MIN_LOG_TIME) {
            lastOutputTime = currentTime;
            logNow = true;
          }
          if (logNow) {
            LOG.info(reduceTask.getTaskID() + " Need another "
                   + (numMaps - getNumMapsCopyCompleted()) + " map output(s) "
                   + "where " + numInFlight + " is already in progress");
          }

          // Re-queue the map-output locations from the failed fetches.
          Iterator<MapOutputLocation> locItr = retryFetches.iterator();

          while (locItr.hasNext()) {
            MapOutputLocation loc = locItr.next();
            List<MapOutputLocation> locList =
              mapLocations.get(loc.getHost());

            // Check if the list exists. The map-output-location mapping is
            // cleared once the jobtracker restarts and is rebuilt from
            // scratch, so we continue in the hope of finding some locations
            // in the rebuilt map.
            if (locList != null) {
              // Add to the beginning of the list so that this map is
              // tried again before the others; this hastens the
              // re-execution of this map should there be a problem.
              locList.add(0, loc);
            }
          }

          if (retryFetches.size() > 0) {
            LOG.info(reduceTask.getTaskID() + ": " +
                  "Got " + retryFetches.size() +
                  " map-outputs from previous failures");
          }
          // clear the "failed" fetches hashmap
          retryFetches.clear();

          // now walk through the cache and schedule what we can
          int numScheduled = 0;
          int numDups = 0;

          synchronized (scheduledCopies) {

            // Randomize the map output locations to prevent
            // all reduce-tasks swamping the same tasktracker
            List<String> hostList = new ArrayList<String>();
            hostList.addAll(mapLocations.keySet());

            Collections.shuffle(hostList, this.random);

            Iterator<String> hostsItr = hostList.iterator();

            while (hostsItr.hasNext()) {

              String host = hostsItr.next();

              List<MapOutputLocation> knownOutputsByLoc =
                mapLocations.get(host);

              // Check if the list exists. The map-output-location mapping is
              // cleared once the jobtracker restarts and is rebuilt from
              // scratch, so we continue in the hope of finding some
              // locations in the rebuilt map and adding them for fetching.
              if (knownOutputsByLoc == null || knownOutputsByLoc.size() == 0) {
                continue;
              }

              // Identify duplicate hosts here
              if (uniqueHosts.contains(host)) {
                 numDups += knownOutputsByLoc.size();
                 continue;
              }

              Long penaltyEnd = penaltyBox.get(host);
              boolean penalized = false;

              if (penaltyEnd != null) {
                if (currentTime < penaltyEnd.longValue()) {
                  penalized = true;
                } else {
                  penaltyBox.remove(host);
                }
              }

              if (penalized)
                continue;

              synchronized (knownOutputsByLoc) {

                locItr = knownOutputsByLoc.iterator();

                while (locItr.hasNext()) {

                  MapOutputLocation loc = locItr.next();

                  // Do not schedule fetches from OBSOLETE maps
                  if (obsoleteMapIds.contains(loc.getTaskAttemptId())) {
                    locItr.remove();
                    continue;
                  }

                  uniqueHosts.add(host);
                  scheduledCopies.add(loc);
                  locItr.remove();  // remove from knownOutputs
                  numInFlight++; numScheduled++;

                  //
                  // Commenting out this break allows fetching all the shards
                  // at once from a host, instead of fetching one at a time.
                  // See MAPREDUCE-318.
                  //
                  // break; //we have a map from this host
                  //
                }
              }
            }
            scheduledCopies.notifyAll();
          }

          if (numScheduled > 0 || logNow) {
            LOG.info(reduceTask.getTaskID() + " Scheduled " + numScheduled +
                   " outputs (" + penaltyBox.size() +
                   " slow hosts and " + numDups + " dup hosts)");
          }

          if (penaltyBox.size() > 0 && logNow) {
            LOG.info("Penalized(slow) Hosts: ");
            for (String host : penaltyBox.keySet()) {
              LOG.info(host + " Will be considered after: " +
                  ((penaltyBox.get(host) - currentTime)/1000) + " seconds.");
            }
          }

          // if we have no copies in flight and we can't schedule anything
          // new, just wait for a bit
          try {
            if (numInFlight == 0 && numScheduled == 0) {
              // we should indicate progress as we don't want TT to think
              // we're stuck and kill us
              reporter.progress();
              synchronized (mapLocations) {
                mapLocations.wait(5000);
              }
            }
          } catch (InterruptedException e) { } // IGNORE

          while (numInFlight > 0 && mergeThrowable == null) {
            LOG.debug(reduceTask.getTaskID() + " numInFlight = " +
                      numInFlight);
            //the call to getCopyResult will either
            //1) return immediately with a null or a valid CopyResult object,
            //                 or
            //2) if the numInFlight is above maxInFlight, return with a
            //   CopyResult object after getting a notification from a
            //   fetcher thread,
            //So, when getCopyResult returns null, we can be sure that
            //we aren't busy enough and we should go and get more
            //map-completion events from the tasktracker
            CopyResult cr = getCopyResult(numInFlight);

            if (cr == null) {
              break;
            }

            if (cr.getSuccess()) {  // a successful copy
              numCopied++;
              lastProgressTime = System.currentTimeMillis();
              reduceShuffleBytes.increment(cr.getSize());

              long secsSinceStart =
                (System.currentTimeMillis()-startTime)/1000+1;
              float mbs = ((float)reduceShuffleBytes.getCounter())/(1024*1024);
              float transferRate = mbs/secsSinceStart;

              copyPhase.startNextPhase();
              copyPhase.setStatus("copy (" + numCopied + " of " + numMaps
                                  + " at " +
                                  mbpsFormat.format(transferRate) +  " MB/s)");

              // Note successful fetch for this mapId to invalidate
              // (possibly) old fetch-failures
              fetchFailedMaps.remove(cr.getLocation().getTaskId());
            } else if (cr.isObsolete()) {
              //ignore
              LOG.info(reduceTask.getTaskID() +
                       " Ignoring obsolete copy result for Map Task: " +
                       cr.getLocation().getTaskAttemptId() + " from host: " +
                       cr.getHost());
            } else {
              retryFetches.add(cr.getLocation());

              // note the failed-fetch
              TaskAttemptID mapTaskId = cr.getLocation().getTaskAttemptId();
              TaskID mapId = cr.getLocation().getTaskId();

              totalFailures++;
              Integer noFailedFetches =
                mapTaskToFailedFetchesMap.get(mapTaskId);
              noFailedFetches =
                (noFailedFetches == null) ? 1 : (noFailedFetches + 1);
              mapTaskToFailedFetchesMap.put(mapTaskId, noFailedFetches);
              LOG.info("Task " + getTaskID() + ": Failed fetch #" +
                       noFailedFetches + " from " + mapTaskId);

              if (noFailedFetches >= abortFailureLimit) {
                LOG.fatal(noFailedFetches + " failures downloading "
                          + getTaskID() + ".");
                umbilical.shuffleError(getTaskID(),
                                 "Exceeded the abort failure limit;"
                                 + " bailing-out.");
              }

              checkAndInformJobTracker(noFailedFetches, mapTaskId,
                  cr.getError().equals(CopyOutputErrorType.READ_ERROR));

              // note unique failed-fetch maps
              if (noFailedFetches == maxFetchFailuresBeforeReporting) {
                fetchFailedMaps.add(mapId);

                // did we have too many unique failed-fetch maps?
                // and did we fail on too many fetch attempts?
                // and did we progress enough
                //     or did we wait for too long without any progress?

                // check if the reducer is healthy
                boolean reducerHealthy =
                    (((float)totalFailures / (totalFailures + numCopied))
                     < MAX_ALLOWED_FAILED_FETCH_ATTEMPT_PERCENT);

                // check if the reducer has progressed enough
                boolean reducerProgressedEnough =
                    (((float)numCopied / numMaps)
                     >= MIN_REQUIRED_PROGRESS_PERCENT);

                // check if the reducer is stalled for a long time
                // duration for which the reducer is stalled
                int stallDuration =
                    (int)(System.currentTimeMillis() - lastProgressTime);
                // duration for which the reducer ran with progress
                int shuffleProgressDuration =
                    (int)(lastProgressTime - startTime);
                // min time the reducer should run without getting killed
                int minShuffleRunDuration =
                    (shuffleProgressDuration > maxMapRuntime)
                    ? shuffleProgressDuration
                    : maxMapRuntime;
                boolean reducerStalled =
                    (((float)stallDuration / minShuffleRunDuration)
                     >= MAX_ALLOWED_STALL_TIME_PERCENT);

                // kill if not healthy and has insufficient progress
                if ((fetchFailedMaps.size() >= maxFailedUniqueFetches ||
                     fetchFailedMaps.size() == (numMaps - getNumMapsCopyCompleted()))
                    && !reducerHealthy
                    && (!reducerProgressedEnough || reducerStalled)) {
                  LOG.fatal("Shuffle failed with too many fetch failures " +
                            "and insufficient progress!" +
                            "Killing task " + getTaskID() + ".");
                  umbilical.shuffleError(getTaskID(),
                                         "Exceeded MAX_FAILED_UNIQUE_FETCHES " + maxFailedUniqueFetches + ";" +
                                         " bailing-out.");
                }

              }

              currentTime = System.currentTimeMillis();
              long currentBackOff = (long)(INITIAL_PENALTY *
                  Math.pow(PENALTY_GROWTH_RATE,
                      Math.min(noFailedFetches, maxCopyBackoff)));

              penaltyBox.put(cr.getHost(), currentTime + currentBackOff);
              LOG.warn(reduceTask.getTaskID() + " adding host " +
                       cr.getHost() + " to penalty box, next contact in " +
                       (currentBackOff/1000) + " seconds");
            }
            uniqueHosts.remove(cr.getHost());
            numInFlight--;
          }
        }

        // all done, tell the event-fetcher thread and the copiers to exit
        exitGetMapEvents = true;
        try {
          getMapEventsThread.join();
          LOG.info("getMapsEventsThread joined.");
        } catch (InterruptedException ie) {
          LOG.info("getMapsEventsThread threw an exception: " +
              StringUtils.stringifyException(ie));
        }

        synchronized (copiers) {
          synchronized (scheduledCopies) {
            for (MapOutputCopier copier : copiers) {
              copier.stopCopier();
            }
            copiers.clear();
          }
        }

        // copiers are done, exit and notify the waiting merge threads
        synchronized (mapOutputFilesOnDisk) {
          exitLocalFSMerge = true;
          mapOutputFilesOnDisk.notify();
        }

        ramManager.close();

        //Do a merge of in-memory files (if there are any)
        if (mergeThrowable == null) {
          try {
            // Wait for the on-disk merge to complete
            localFSMergerThread.join();
            LOG.info("Interleaved on-disk merge complete: " +
                     mapOutputFilesOnDisk.size() + " files left.");

            //wait for an ongoing merge (if it is in flight) to complete
            inMemFSMergeThread.join();
            LOG.info("In-memory merge complete: " +
                     mapOutputsFilesInMemory.size() + " files left.");
          } catch (InterruptedException ie) {
            LOG.warn(reduceTask.getTaskID() +
                     " Final merge of the inmemory files threw an exception: " +
                     StringUtils.stringifyException(ie));
            // record the interrupt unless an earlier merge error has
            // already been recorded
            if (mergeThrowable == null) {
              mergeThrowable = ie;
            }
            return false;
          }
        }
        return mergeThrowable == null && getNumMapsCopyCompleted() == numMaps;
    }

    // Notify the JobTracker
    // after every read error, if 'reportReadErrorImmediately' is true or
    // after every 'maxFetchFailuresBeforeReporting' failures
    protected void checkAndInformJobTracker(
        int failures, TaskAttemptID mapId, boolean readError) {
      if ((reportReadErrorImmediately && readError)
          || ((failures % maxFetchFailuresBeforeReporting) == 0)) {
        synchronized (ReduceTask.this) {
          taskStatus.addFetchFailedMap(mapId);
          reporter.progress();
          LOG.info("Failed to fetch map-output from " + mapId +
                   " even after MAX_FETCH_RETRIES_PER_MAP retries... "
                   + " or it is a read error, "
                   + " reporting to the JobTracker");
        }
      }
    }



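    /**
     * Drain in-memory map outputs into Segments for merging, stopping once
     * no more than leaveBytes of map-output data would remain in memory.
     * Returns the total number of bytes moved into the created segments.
     */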
    private long createInMemorySegments(
        List<Segment<K, V>> inMemorySegments, long leaveBytes)
        throws IOException {
      long totalSize = 0L;
      synchronized (mapOutputsFilesInMemory) {
        // fullSize could come from the RamManager, but files may already be
        // closed while not yet present in mapOutputsFilesInMemory
        long fullSize = 0L;
        for (MapOutput mo : mapOutputsFilesInMemory) {
          fullSize += mo.data.length;
        }
        while(fullSize > leaveBytes) {
          MapOutput mo = mapOutputsFilesInMemory.remove(0);
          totalSize += mo.data.length;
          fullSize -= mo.data.length;
          Reader<K, V> reader =
            new InMemoryReader<K, V>(ramManager, mo.mapAttemptId,
                                     mo.data, 0, mo.data.length);
          Segment<K, V> segment =
            new Segment<K, V>(reader, true);
          inMemorySegments.add(segment);
        }
      }
      return totalSize;
    }

    /**
     * Create a RawKeyValueIterator from copied map outputs. All copying
     * threads have exited, so all of the map outputs are available either in
     * memory or on disk. We also know that no merges are in progress, so
     * synchronization is more lax here.
     *
     * The iterator returned must satisfy the following constraints:
     *   1. Fewer than io.sort.factor files may be sources
     *   2. No more than maxInMemReduce bytes of map outputs may be resident
     *      in memory when the reduce begins
     *
     * If we must perform an intermediate merge to satisfy (1), then we can
     * keep the excluded outputs from (2) in memory and include them in the
     * first merge pass. If not, then said outputs must be written to disk
     * first.
     */
    @SuppressWarnings("unchecked")
    private RawKeyValueIterator createKVIterator(
        JobConf job, FileSystem fs, Reporter reporter) throws IOException {

      // merge config params
      Class<K> keyClass = (Class<K>)job.getMapOutputKeyClass();
      Class<V> valueClass = (Class<V>)job.getMapOutputValueClass();
      boolean keepInputs = job.getKeepFailedTaskFiles();
      final Path tmpDir = new Path(getTaskID().toString());
      final RawComparator<K> comparator =
        (RawComparator<K>)job.getOutputKeyComparator();

      // segments required to vacate memory
      List<Segment<K,V>> memDiskSegments = new ArrayList<Segment<K,V>>();
      long inMemToDiskBytes = 0;
      if (mapOutputsFilesInMemory.size() > 0) {
        TaskID mapId = mapOutputsFilesInMemory.get(0).mapId;
        inMemToDiskBytes = createInMemorySegments(memDiskSegments,
            maxInMemReduce);
        final int numMemDiskSegments = memDiskSegments.size();
        if (numMemDiskSegments > 0 &&
              ioSortFactor > mapOutputFilesOnDisk.size()) {
          // must spill to disk, but can't retain in-mem for intermediate merge
          final Path outputPath = mapOutputFile.getInputFileForWrite(mapId,
                            reduceTask.getTaskID(), inMemToDiskBytes);
          final RawKeyValueIterator rIter = Merger.merge(job, fs,
              keyClass, valueClass, memDiskSegments, numMemDiskSegments,
              tmpDir, comparator, reporter, spilledRecordsCounter, null);
          final Writer writer = new Writer(job, fs, outputPath,
              keyClass, valueClass, codec, null);
          try {
            Merger.writeFile(rIter, writer, reporter, job);
            addToMapOutputFilesOnDisk(fs.getFileStatus(outputPath));
          } catch (Exception e) {
            if (null != outputPath) {
              fs.delete(outputPath, true);
            }
            throw new IOException("Final merge failed", e);
          } finally {
            if (null != writer) {
              writer.close();
            }
          }
          LOG.info("Merged " + numMemDiskSegments + " segments, " +
                   inMemToDiskBytes + " bytes to disk to satisfy " +
                   "reduce memory limit");
          inMemToDiskBytes = 0;
          memDiskSegments.clear();
        } else if (inMemToDiskBytes != 0) {
          LOG.info("Keeping " + numMemDiskSegments + " segments, " +
                   inMemToDiskBytes + " bytes in memory for " +
                   "intermediate, on-disk merge");
        }
      }

      // segments on disk
      List<Segment<K,V>> diskSegments = new ArrayList<Segment<K,V>>();
      long onDiskBytes = inMemToDiskBytes;
      Path[] onDisk = getMapFiles(fs, false);
      for (Path file : onDisk) {
        onDiskBytes += fs.getFileStatus(file).getLen();
        diskSegments.add(new Segment<K, V>(job, fs, file, codec, keepInputs));
      }
      LOG.info("Merging " + onDisk.length + " files, " +
               onDiskBytes + " bytes from disk");
      Collections.sort(diskSegments, new Comparator<Segment<K,V>>() {
        public int compare(Segment<K, V> o1, Segment<K, V> o2) {
          if (o1.getLength() == o2.getLength()) {
            return 0;
          }
          return o1.getLength() < o2.getLength() ? -1 : 1;
        }
      });

      // build the final list of segments: in-memory segments plus the
      // merge of the on-disk segments
      List<Segment<K,V>> finalSegments = new ArrayList<Segment<K,V>>();
      long inMemBytes = createInMemorySegments(finalSegments, 0);
      LOG.info("Merging " + finalSegments.size() + " segments, " +
               inMemBytes + " bytes from memory into reduce");
      if (0 != onDiskBytes) {
        final int numInMemSegments = memDiskSegments.size();
        diskSegments.addAll(0, memDiskSegments);
        memDiskSegments.clear();
        RawKeyValueIterator diskMerge = Merger.merge(
            job, fs, keyClass, valueClass, codec, diskSegments,
            ioSortFactor, numInMemSegments, tmpDir, comparator,
            reporter, false, spilledRecordsCounter, null);
        diskSegments.clear();
        if (0 == finalSegments.size()) {
          return diskMerge;
        }
        finalSegments.add(new Segment<K,V>(
              new RawKVIteratorReader(diskMerge, onDiskBytes), true));
      }
      return Merger.merge(job, fs, keyClass, valueClass,
                   finalSegments, finalSegments.size(), tmpDir,
                   comparator, reporter, spilledRecordsCounter, null);
    }

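    /**
     * Present a RawKeyValueIterator as an IFile.Reader so the merged stream
     * of on-disk segments can be wrapped in a Segment and fed into the
     * final merge with the in-memory segments.
     */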
    class RawKVIteratorReader extends IFile.Reader<K,V> {

      private final RawKeyValueIterator kvIter;

      public RawKVIteratorReader(RawKeyValueIterator kvIter, long size)
          throws IOException {
        super(null, null, size, null, spilledRecordsCounter);
        this.kvIter = kvIter;
      }

      public boolean next(DataInputBuffer key, DataInputBuffer value)
          throws IOException {
        if (kvIter.next()) {
          final DataInputBuffer kb = kvIter.getKey();
          final DataInputBuffer vb = kvIter.getValue();
          final int kp = kb.getPosition();
          final int klen = kb.getLength() - kp;
          key.reset(kb.getData(), kp, klen);
          final int vp = vb.getPosition();
          final int vlen = vb.getLength() - vp;
          value.reset(vb.getData(), vp, vlen);
          bytesRead += klen + vlen;
          return true;
        }
        return false;
      }

      public long getPosition() throws IOException {
        return kvIter.getTotalBytesProcessed();
      }

      public void close() throws IOException {
        kvIter.close();
      }
    }

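    /**
     * Fetch the next CopyResult. If none is available and we are not yet
     * "busy enough" (numInFlight <= maxInFlight), return null so the caller
     * can go get more map-completion events; otherwise wait for a copier
     * to report a result.
     */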
    private CopyResult getCopyResult(int numInFlight) {
      synchronized (copyResults) {
        while (copyResults.isEmpty()) {
          try {
            //The idea is that if we have scheduled enough, we can wait until
            //we hear from one of the copiers.
            if (busyEnough(numInFlight)) {
              copyResults.wait();
            } else {
              return null;
            }
          } catch (InterruptedException e) { }
        }
        return copyResults.remove(0);
      }
    }

    private void addToMapOutputFilesOnDisk(FileStatus status) {
      synchronized (mapOutputFilesOnDisk) {
        mapOutputFilesOnDisk.add(status);
        mapOutputFilesOnDisk.notify();
      }
    }



    /** Merges the local (on-disk) copies of the map outputs so that
     * most of the reducer's input is already sorted, i.e. the shuffle
     * and merge phases overlap.
     */
    private class LocalFSMerger extends Thread {
      private LocalFileSystem localFileSys;

      public LocalFSMerger(LocalFileSystem fs) {
        this.localFileSys = fs;
        setName("Thread for merging on-disk files");
        setDaemon(true);
      }

      @SuppressWarnings("unchecked")
      public void run() {
        try {
          LOG.info(reduceTask.getTaskID() + " Thread started: " + getName());
          while (!exitLocalFSMerge) {
            synchronized (mapOutputFilesOnDisk) {
              while (!exitLocalFSMerge &&
                  mapOutputFilesOnDisk.size() < (2 * ioSortFactor - 1)) {
                LOG.info(reduceTask.getTaskID() + " Thread waiting: " + getName());
                mapOutputFilesOnDisk.wait();
              }
            }
            if (exitLocalFSMerge) { // to avoid running one extra time at the end
              break;
            }
            List<Path> mapFiles = new ArrayList<Path>();
            long approxOutputSize = 0;
            int bytesPerSum =
              reduceTask.getConf().getInt("io.bytes.per.checksum", 512);
            LOG.info(reduceTask.getTaskID() + "We have  " +
                mapOutputFilesOnDisk.size() + " map outputs on disk. " +
                "Triggering merge of " + ioSortFactor + " files");
            // 1. Prepare the list of files to be merged. This list is prepared
            // using a list of map output files on disk. Currently we merge
            // io.sort.factor files into 1.
            synchronized (mapOutputFilesOnDisk) {
              for (int i = 0; i < ioSortFactor; ++i) {
                FileStatus filestatus = mapOutputFilesOnDisk.first();
                mapOutputFilesOnDisk.remove(filestatus);
                mapFiles.add(filestatus.getPath());
                approxOutputSize += filestatus.getLen();
              }
            }

            // sanity check
            if (mapFiles.size() == 0) {
              return;
            }

            // add the checksum length
            approxOutputSize += ChecksumFileSystem
                                .getChecksumLength(approxOutputSize,
                                                   bytesPerSum);

            // 2. Start the on-disk merge process
            Path outputPath =
              lDirAlloc.getLocalPathForWrite(mapFiles.get(0).toString(),
                                             approxOutputSize, conf)
              .suffix(".merged");
            Writer writer =
              new Writer(conf, rfs, outputPath,
                         conf.getMapOutputKeyClass(),
                         conf.getMapOutputValueClass(),
                         codec, null);
            RawKeyValueIterator iter  = null;
            Path tmpDir = new Path(reduceTask.getTaskID().toString());
            try {
              iter = Merger.merge(conf, rfs,
                                  conf.getMapOutputKeyClass(),
                                  conf.getMapOutputValueClass(),
                                  codec, mapFiles.toArray(new Path[mapFiles.size()]),
                                  true, ioSortFactor, tmpDir,
                                  conf.getOutputKeyComparator(), reporter,
                                  spilledRecordsCounter, null);

              Merger.writeFile(iter, writer, reporter, conf);
              writer.close();
            } catch (Exception e) {
              localFileSys.delete(outputPath, true);
              throw new IOException (StringUtils.stringifyException(e));
            }

            synchronized (mapOutputFilesOnDisk) {
              addToMapOutputFilesOnDisk(localFileSys.getFileStatus(outputPath));
            }

            LOG.info(reduceTask.getTaskID() +
                     " Finished merging " + mapFiles.size() +
                     " map output files on disk of total-size " +
                     approxOutputSize + "." +
                     " Local output file is " + outputPath + " of size " +
                     localFileSys.getFileStatus(outputPath).getLen());
          }
        } catch (Exception e) {
          LOG.warn(reduceTask.getTaskID()
                   + " Merging of the local FS files threw an exception: "
                   + StringUtils.stringifyException(e));
          if (mergeThrowable == null) {
            mergeThrowable = e;
          }
        } catch (Throwable t) {
          String msg = getTaskID() + " : Failed to merge on the local FS"
                       + StringUtils.stringifyException(t);
          reportFatalError(getTaskID(), t, msg);
        }
      }
    }

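    /**
     * Daemon thread that merges the in-memory map outputs to disk whenever
     * the ShuffleRamManager signals that enough data has accumulated.
     */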
    private class InMemFSMergeThread extends Thread {

      public InMemFSMergeThread() {
        setName("Thread for merging in memory files");
        setDaemon(true);
      }

      public void run() {
        LOG.info(reduceTask.getTaskID() + " Thread started: " + getName());
        try {
          boolean exit = false;
          do {
            exit = ramManager.waitForDataToMerge();
            if (!exit) {
              doInMemMerge();
            }
          } while (!exit);
        } catch (Exception e) {
          LOG.warn(reduceTask.getTaskID() +
                   " Merge of the inmemory files threw an exception: "
                   + StringUtils.stringifyException(e));
          ReduceCopier.this.mergeThrowable = e;
        } catch (Throwable t) {
          String msg = getTaskID() + " : Failed to merge in memory"
                       + StringUtils.stringifyException(t);
          reportFatalError(getTaskID(), t, msg);
        }
      }

      @SuppressWarnings("unchecked")
      private void doInMemMerge() throws IOException{
        if (mapOutputsFilesInMemory.size() == 0) {
          return;
        }

        // Name this output file after the first file in the current list of
        // in-memory files; that name is guaranteed to be absent on disk, so
        // we don't overwrite a previously created spill. Also, the output
        // file must be created now since it is not guaranteed to be present
        // after merge is called (we delete empty files as soon as we see
        // them in the merge method).

        //figure out the mapId
        TaskID mapId = mapOutputsFilesInMemory.get(0).mapId;

        List<Segment<K, V>> inMemorySegments = new ArrayList<Segment<K,V>>();
        long mergeOutputSize = createInMemorySegments(inMemorySegments, 0);
        int noInMemorySegments = inMemorySegments.size();

        Path outputPath = mapOutputFile.getInputFileForWrite(mapId,
                          reduceTask.getTaskID(), mergeOutputSize);

        Writer writer =
          new Writer(conf, rfs, outputPath,
                     conf.getMapOutputKeyClass(),
                     conf.getMapOutputValueClass(),
                     codec, null);

        RawKeyValueIterator rIter = null;
        try {
          LOG.info("Initiating in-memory merge with " + noInMemorySegments +
                   " segments...");

          rIter = Merger.merge(conf, rfs,
                               (Class<K>)conf.getMapOutputKeyClass(),
                               (Class<V>)conf.getMapOutputValueClass(),
                               inMemorySegments, inMemorySegments.size(),
                               new Path(reduceTask.getTaskID().toString()),
                               conf.getOutputKeyComparator(), reporter,
                               spilledRecordsCounter, null);

          if (combinerRunner == null) {
            Merger.writeFile(rIter, writer, reporter, conf);
          } else {
            combineCollector.setWriter(writer);
            combinerRunner.combine(rIter, combineCollector);
          }
          writer.close();

          LOG.info(reduceTask.getTaskID() +
              " Merge of the " + noInMemorySegments +
              " files in-memory complete." +
              " Local file is " + outputPath + " of size " +
              localFileSys.getFileStatus(outputPath).getLen());
        } catch (Exception e) {
          // make sure that we delete the on-disk file that we created
          // earlier for this merge's output
          localFileSys.delete(outputPath, true);
          throw (IOException)new IOException
                  ("Intermediate merge failed").initCause(e);
        }

        // Note the output of the merge
        FileStatus status = localFileSys.getFileStatus(outputPath);
        synchronized (mapOutputFilesOnDisk) {
          addToMapOutputFilesOnDisk(status);
        }
      }
    }

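    /**
     * Daemon thread that periodically polls the TaskTracker (via the
     * umbilical) for map-completion events and turns SUCCEEDED events into
     * fetchable map-output locations.
     */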
    private class GetMapEventsThread extends Thread {

      private IntWritable fromEventId = new IntWritable(0);
      private static final long SLEEP_TIME = 1000;

      public GetMapEventsThread() {
        setName("Thread for polling Map Completion Events");
        setDaemon(true);
      }

      @Override
      public void run() {

        LOG.info(reduceTask.getTaskID() + " Thread started: " + getName());

        do {
          try {
            int numNewMaps = getMapCompletionEvents();
            if (numNewMaps == 0) {
              if (getNumMapsCopyCompleted() == numMaps) {
                break;
              }
            } else if (numNewMaps > 0) {
              LOG.info(reduceTask.getTaskID() + ": " +
                  "Got " + numNewMaps + " new map-outputs");
              synchronized (mapLocations) {
                mapLocations.notify();
              }
            }
            Thread.sleep(SLEEP_TIME);
          } catch (InterruptedException e) {
            // Ignore. If we are shutting down, the while condition will
            // detect it and exit; otherwise this could be a spurious
            // interrupt due to log4j interaction.
          } catch (Throwable t) {
            String msg = reduceTask.getTaskID()
                         + " GetMapEventsThread Ignoring exception : "
                         + StringUtils.stringifyException(t);
            reportFatalError(getTaskID(), t, msg);
          }
        } while (!exitGetMapEvents);

        LOG.info("GetMapEventsThread exiting");

      }

      /**
       * Queries the {@link TaskTracker} for a set of map-completion events
       * starting from a given event ID.
       * @return the number of new map-output locations discovered
       * @throws IOException
       */
      private int getMapCompletionEvents() throws IOException {

        int numNewMaps = 0;

        MapTaskCompletionEventsUpdate update =
          umbilical.getMapCompletionEvents(reduceTask.getJobID(),
                                           fromEventId.get(),
                                           MAX_EVENTS_TO_FETCH,
                                           reduceTask.getTaskID());
        TaskCompletionEvent events[] = update.getMapTaskCompletionEvents();
        
        // Check if the reset is required.
        // Since there is no ordering of the task completion events at the
        // reducer, the only option to sync with the new jobtracker is to reset
        // the events index
        if (update.shouldReset()) {
          fromEventId.set(0);
          obsoleteMapIds.clear(); // clear the obsolete map
          mapLocations.clear(); // clear the map locations mapping
        }

        // Update the last seen event ID
        fromEventId.set(fromEventId.get() + events.length);

        // Process the TaskCompletionEvents:
        // 1. Save the SUCCEEDED maps in knownOutputs to fetch the outputs.
        // 2. Save the OBSOLETE/FAILED/KILLED maps in obsoleteOutputs to stop
        //    fetching from those maps.
        // 3. Mark TIPFAILED maps as copied since we don't need their
        //    outputs at all.
        for (TaskCompletionEvent event : events) {
          switch (event.getTaskStatus()) {
            case SUCCEEDED:
            {
              URI u = URI.create(event.getTaskTrackerHttp());
              String host = u.getHost();
              TaskAttemptID taskId = event.getTaskAttemptId();
              URL mapOutputLocation = new URL(event.getTaskTrackerHttp() +
                                      "/mapOutput?job=" + taskId.getJobID() +
                                      "&map=" + taskId +
                                      "&reduce=" + getPartition());
              List<MapOutputLocation> loc = mapLocations.get(host);
              if (loc == null) {
                loc = Collections.synchronizedList
                  (new LinkedList<MapOutputLocation>());
                mapLocations.put(host, loc);
              }
              loc.add(new MapOutputLocation(taskId, host, mapOutputLocation));
              numNewMaps ++;
            }
            break;
            case SUCCEEDED_NO_OUTPUT:
            {
               // Remove the task from list of tasks to be copied
               TaskID taskId = event.getTaskAttemptId().getTaskID(); 
               copiedMapOutputs.remove(taskId);
               emptyMaps.incrementAndGet();
               LOG.info("Map does not have any output, ignoring taskId: " + taskId);
               break;
            }    
            case FAILED:
            case KILLED:
            case OBSOLETE:
            {
              obsoleteMapIds.add(event.getTaskAttemptId());
              LOG.info("Ignoring obsolete output of " + event.getTaskStatus() +
                       " map-task: '" + event.getTaskAttemptId() + "'");
            }
            break;
            case TIPFAILED:
            {
              copiedMapOutputs.add(event.getTaskAttemptId().getTaskID());
              LOG.info("Ignoring output of failed map TIP: '" +
                   event.getTaskAttemptId() + "'");
            }
            break;
          }
        }
        return numNewMaps;
      }
    }
  }

  /**
   * Return the exponent of the power of two closest to the given
   * positive value; throws IllegalArgumentException if value <= 0.
   * This follows the observation that the msb of a given value is
   * also the closest power of two, unless the bit following it is
   * set.
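   * For example, getClosestPowerOf2(5) returns 2 (the closest power of two
   * is 4 = 2^2), while getClosestPowerOf2(6) returns 3 (the bit below the
   * msb is set, so it rounds up to 8 = 2^3).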
   */
  private static int getClosestPowerOf2(int value) {
    if (value <= 0)
      throw new IllegalArgumentException("Undefined for " + value);
    final int hob = Integer.highestOneBit(value);
    return Integer.numberOfTrailingZeros(hob) +
      (((hob >>> 1) & value) == 0 ? 0 : 1);
  }
}