package com.data.big.mlib;

import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.api.java.function.Function;


public class ScalaTest {
	public static void main( String[] args ){
		String inputFile = "data/dummy.txt";
		SparkConf configuration = new SparkConf().setMaster("local[4]").setAppName("My App");
		JavaSparkContext sparkContext = new JavaSparkContext(configuration);
		JavaRDD<String> logData = sparkContext.textFile(inputFile).cache();

		long numberA = logData.filter(new Function<String,Boolean>(){
			private static final long serialVersionUID = 1L;
			public Boolean call(String s){
				return s.length() == 0;
			}
		}).count();
		sparkContext.close();
		System.out.println("Empty Lines: " + numberA);
	}
}