/**
 * Copyright 2017 ZuInnoTe (Jörn Franke) <[email protected]>
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 **/
package org.zuinnote.hadoop.ethereum.format.mapred;

import java.io.IOException;

import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.fs.Seekable;
import org.apache.hadoop.io.compress.CodecPool;
import org.apache.hadoop.io.compress.CompressionCodec;
import org.apache.hadoop.io.compress.CompressionCodecFactory;
import org.apache.hadoop.io.compress.Decompressor;
import org.apache.hadoop.io.compress.SplitCompressionInputStream;
import org.apache.hadoop.io.compress.SplittableCompressionCodec;
import org.apache.hadoop.mapred.FileSplit;
import org.apache.hadoop.mapred.JobConf;
import org.apache.hadoop.mapred.RecordReader;
import org.apache.hadoop.mapred.Reporter;
import org.zuinnote.hadoop.ethereum.format.common.EthereumBlockReader;

/**
 * Abstract record reader for Ethereum blocks (mapred API). It takes care of
 * opening the file split, handling compressed input, and providing an
 * EthereumBlockReader to concrete subclasses.
 */
public abstract class AbstractEthereumRecordReader<K, V> implements RecordReader<K, V> {

	public static final String CONF_BUFFERSIZE = org.zuinnote.hadoop.ethereum.format.mapreduce.AbstractEthereumRecordReader.CONF_BUFFERSIZE;
	public static final String CONF_MAXBLOCKSIZE = org.zuinnote.hadoop.ethereum.format.mapreduce.AbstractEthereumRecordReader.CONF_MAXBLOCKSIZE;
	public static final String CONF_USEDIRECTBUFFER = org.zuinnote.hadoop.ethereum.format.mapreduce.AbstractEthereumRecordReader.CONF_USEDIRECTBUFFER;
	public static final int DEFAULT_BUFFERSIZE = org.zuinnote.hadoop.ethereum.format.mapreduce.AbstractEthereumRecordReader.DEFAULT_BUFFERSIZE;
	public static final int DEFAULT_MAXSIZE_ETHEREUMBLOCK = org.zuinnote.hadoop.ethereum.format.mapreduce.AbstractEthereumRecordReader.DEFAULT_MAXSIZE_ETHEREUMBLOCK;
	public static final boolean DEFAULT_USEDIRECTBUFFER = org.zuinnote.hadoop.ethereum.format.mapreduce.AbstractEthereumRecordReader.DEFAULT_USEDIRECTBUFFER;

	private static final Log LOG = LogFactory.getLog(AbstractEthereumRecordReader.class.getName());

	private int bufferSize = 0;
	private int maxSizeEthereumBlock = 0;
	private boolean useDirectBuffer = false;

	private CompressionCodec codec;
	private Decompressor decompressor;
	private Reporter reporter;
	private Configuration conf;
	private long start;
	private long end;
	private final Seekable filePosition;
	private FSDataInputStream fileIn;
	private EthereumBlockReader ebr;
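	/*
	 * Illustrative sketch (not part of the original source): how a job might set
	 * the configuration options documented on the constructor below, using the
	 * constant keys re-exported above. "MyDriver" is a hypothetical driver class;
	 * the values shown are simply the defaults.
	 *
	 *   JobConf job = new JobConf(MyDriver.class);
	 *   job.setInt(AbstractEthereumRecordReader.CONF_MAXBLOCKSIZE,
	 *       AbstractEthereumRecordReader.DEFAULT_MAXSIZE_ETHEREUMBLOCK);
	 *   job.setInt(AbstractEthereumRecordReader.CONF_BUFFERSIZE,
	 *       AbstractEthereumRecordReader.DEFAULT_BUFFERSIZE);
	 *   job.setBoolean(AbstractEthereumRecordReader.CONF_USEDIRECTBUFFER,
	 *       AbstractEthereumRecordReader.DEFAULT_USEDIRECTBUFFER);
	 */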
	/**
	 * Creates an abstract record reader for Ethereum blocks.
	 *
	 * @param split Split to use (assumed to be a file split)
	 * @param job Configuration:
	 * io.file.buffer.size: Size of the in-memory buffer specified in the given Configuration. If io.file.buffer.size is not specified, the default buffer size is used. Furthermore, one may specify hadoopcryptoledger.ethereumblockinputformat.maxblocksize, which defines the maximum size an Ethereum block may have (by default 1M). If you want to experiment with performance using DirectByteBuffer instead of HeapByteBuffer, you can set "hadoopcryptoledger.ethereumblockinputformat.usedirectbuffer" (default: false). Note that it might have some unwanted consequences, such as circumventing YARN memory management. The option is experimental and might be removed in future versions.
	 * @param reporter Reporter
	 *
	 * @throws java.io.IOException in case of errors reading from the file stream provided by Hadoop
	 */
	public AbstractEthereumRecordReader(FileSplit split, JobConf job, Reporter reporter) throws IOException {
		LOG.debug("Reading configuration");
		// parse configuration
		this.reporter = reporter;
		this.conf = job;
		this.maxSizeEthereumBlock = conf.getInt(AbstractEthereumRecordReader.CONF_MAXBLOCKSIZE, AbstractEthereumRecordReader.DEFAULT_MAXSIZE_ETHEREUMBLOCK);
		this.bufferSize = conf.getInt(AbstractEthereumRecordReader.CONF_BUFFERSIZE, AbstractEthereumRecordReader.DEFAULT_BUFFERSIZE);
		this.useDirectBuffer = conf.getBoolean(AbstractEthereumRecordReader.CONF_USEDIRECTBUFFER, AbstractEthereumRecordReader.DEFAULT_USEDIRECTBUFFER);
		// initialize start and end of split
		start = split.getStart();
		end = start + split.getLength();
		final Path file = split.getPath();
		codec = new CompressionCodecFactory(job).getCodec(file);
		final FileSystem fs = file.getFileSystem(job);
		fileIn = fs.open(file); // open stream
		if (isCompressedInput()) { // decompress
			LOG.debug("Decompressing file");
			decompressor = CodecPool.getDecompressor(codec);
			if (codec instanceof SplittableCompressionCodec) {
				LOG.debug("SplittableCompressionCodec");
				final SplitCompressionInputStream cIn = ((SplittableCompressionCodec) codec).createInputStream(fileIn, decompressor, start, end, SplittableCompressionCodec.READ_MODE.CONTINUOUS);
				ebr = new EthereumBlockReader(cIn, this.maxSizeEthereumBlock, this.bufferSize, this.useDirectBuffer);
				start = cIn.getAdjustedStart();
				end = cIn.getAdjustedEnd();
				filePosition = cIn; // take pos from compressed stream
			} else {
				LOG.debug("Non-splittable compression codec");
				ebr = new EthereumBlockReader(codec.createInputStream(fileIn, decompressor), this.maxSizeEthereumBlock, this.bufferSize, this.useDirectBuffer);
				filePosition = fileIn;
			}
		} else {
			LOG.debug("Processing file without compression");
			fileIn.seek(start);
			ebr = new EthereumBlockReader(fileIn, this.maxSizeEthereumBlock, this.bufferSize, this.useDirectBuffer);
			filePosition = fileIn;
		}
		// initialize reader
		this.reporter.setStatus("Ready to read");
	}
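	/*
	 * Sketch (illustrative, not part of the original source): a concrete subclass
	 * would typically implement next(K, V) on top of getEbr(). Assuming
	 * EthereumBlockReader exposes a readBlock() method as in the common package:
	 *
	 *   EthereumBlock block = getEbr().readBlock();
	 *   if (block == null) { return false; } // end of split reached
	 *   // ... populate key and value from the block, then return true
	 */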
	/**
	 * Get the current file position in a compressed or uncompressed file.
	 *
	 * @return file position
	 *
	 * @throws java.io.IOException in case of errors reading from the file stream provided by Hadoop
	 */
	public long getFilePosition() throws IOException {
		return filePosition.getPos();
	}

	/**
	 * Get the end of the file split.
	 *
	 * @return end of file position
	 */
	public long getEnd() {
		return end;
	}

	/**
	 * Get the current block reader.
	 *
	 * @return Ethereum block reader
	 */
	public EthereumBlockReader getEbr() {
		return this.ebr;
	}

	/*
	 * Returns how much of the file has been processed in terms of bytes
	 *
	 * @return progress as a value between 0.0 and 1.0
	 *
	 * @throws java.io.IOException in case of errors reading from the file stream provided by Hadoop
	 */
	@Override
	public synchronized float getProgress() throws IOException {
		if (start == end) {
			return 0.0f;
		} else {
			return Math.min(1.0f, (getFilePosition() - start) / (float) (end - start));
		}
	}

	/*
	 * Determines if the input is compressed or not
	 *
	 * @return true if compressed, false if not
	 */
	private boolean isCompressedInput() {
		return codec != null;
	}

	/*
	 * Get current position in the stream
	 *
	 * @return position
	 *
	 * @throws java.io.IOException in case of errors reading from the file stream provided by Hadoop
	 */
	@Override
	public synchronized long getPos() throws IOException {
		return filePosition.getPos();
	}

	/*
	 * Clean up InputStream and Decompressor after use
	 *
	 * @throws java.io.IOException in case of errors reading from the file stream provided by Hadoop
	 */
	@Override
	public synchronized void close() throws IOException {
		try {
			if (ebr != null) {
				ebr.close();
			}
		} finally {
			if (decompressor != null) {
				CodecPool.returnDecompressor(decompressor);
				decompressor = null;
			}
		}
	}
}