Scala source code of SparkPredictionTrainer

Project: smart-meter (GitHub Link)

smart-meter-master
- dockerfile-app_prometheus
  - Dockerfile.tpl
  - _docker_build.sh.tpl
  - LICENSE
  - prometheus.yml.tpl
- docker-down.sh
- excel
  - smartmert_data.xlsx
  - cassandra.dsn
- set_properties_to_dockerfile_templates.sh
- dockerfile-app_metrics
  - NATS Servers.json
  - gatling + max voltage - swarm.json
  - gatling + max voltage.json
  - LICENSE
  - graphite
    - conf
      - storage-schemas.conf
      - relay-rules.conf
      - dashboard.conf
      - carbon.amqp.conf
      - storage-aggregation.conf
      - blacklist.conf
      - aggregation-rules.conf
      - whitelist.conf
      - carbon.conf
      - graphTemplates.conf
      - rewrite-rules.conf
  - data_sources
    - influxdb.json
    - graphite.json
    - prometheus.json
  - _Active Containers Panel
  - smartmeter - containers.json
- build_push_remote-pull.sh
- docker-local-cluster-up.sh
- docker-up.sh
- docker-compose_telegraf-cassandra_write_count.yml
- docker-local-down.sh
- docker-remote-single-up.sh
- logs.sh
- build_push_LATEST.sh
- dockerfile-app_compose
  - Dockerfile.tpl
  - properties
    - configuration-application.properties.tpl
    - properties_app.yml
    - configuration-additional.properties
    - properties_branch.yml
  - _docker_build.sh.tpl
  - services_hierarchies.sh
  - compose
    - docker-compose-inject-cluster.yml
    - docker-compose-prediction-secrets.yml
    - docker-compose-prediction-metrics.yml
    - docker-compose-test-secrets.yml
    - docker-compose-cassandra_inject-secrets.yml
    - docker-compose-streaming_metrics-no_secrets.yml
    - docker-compose-cassandra_inject-no_secrets.yml
    - docker-compose-streaming.yml
    - docker-compose-streaming-secrets.yml
    - docker-compose-prediction-metrics-no_secrets.yml
    - docker-compose-monitoring.yml
    - docker-compose-inject-secrets.yml
    - docker-compose-cassandra_inject_metrics.yml
    - docker-compose-monitoring-secrets.yml
    - docker-compose-cassandra_inject-single.yml
    - docker-compose-test.yml
    - docker-compose-inject_metrics.yml
    - docker-compose-prediction-no_secrets.yml
    - docker-compose-streaming_metrics-secrets.yml
    - docker-compose-streaming_metrics.yml
    - docker-compose-inject-no_secrets.yml
    - docker-compose-cassandra_inject-cluster.yml
    - docker-compose-hadoop.yml
    - docker-compose-inject.yml
    - docker-compose-cassandra_inject.yml
    - docker-compose-test-no_secrets.yml
    - docker-compose-prediction-metrics-secrets.yml
    - docker-compose-streaming-no_secrets.yml
    - docker-compose-prediction.yml
    - docker-compose-inject-single.yml
    - docker-compose-monitoring-no_secrets.yml
    - docker-compose-cassandra-image.yml
- clean.sh
- docker-remote-cluster-up.sh
- build_push_DEV.sh
- images
  - SmartMeter-Full.umd
  - SmartMeter-Inject.umd
  - SmartMeter-Batch.umd
  - SmartMeter-Training.umd
  - SmartMeter.umd
- properties
  - configuration-location-local-debug.properties
  - configuration-telegraf-max_voltage.properties
  - configuration-telegraf-temperature.properties
  - configuration-telegraf-docker.properties
  - configuration-telegraf-cassandra_count.properties
  - configuration-mode-single.properties
  - configuration-telegraf-cassandra_write_count.properties
  - configuration-mode-cluster-debug.properties
  - configuration-telegraf-debug.properties
  - configuration-mode-single-debug.properties
  - configuration-location-remote.properties
  - configuration.properties
  - configuration-mode-cluster.properties
  - configuration-telegraf.properties
  - configuration-location-remote-debug.properties
  - _configuration-telegraf-cassandra_count.properties
  - configuration-telegraf-cassandra.properties
  - configuration-telegraf-prediction.properties
  - configuration-location-local.properties
- dockerfile-app_monitor
  - src
    - main
      - scala
        com
        logimethods
        nats
        connector
        spark
        monitor
        NatsOutputMonitor.scala
      - java
        com
        logimethods
        nats
        connector
        spark
        monitor
        NatsStreamingOutputMonitor.java
  - Dockerfile.tpl
  - LICENSE
  - project
    - build.sbt
    - plugins.sbt
  - pom.xml.tpl
  - build.sbt
  - entrypoint_insert.sh
- stop.sh
- sub_nats.sh
- service_logs.sh
- docker-remote-down.sh
- devsecrets
  - nats_password_secret
  - nats_cluster_username_secret
  - nats_cluster_password_secret
  - nats_username_secret
- dockerfile-app_cassandra
  - Dockerfile.tpl
  - _docker_build.sh.tpl
  - LICENSE
  - entrypoint_finalize.sh
  - cql
    - create-timeseries.cql
- docker-DEV-remote-cluster-up.sh
- LICENSE
- docker-DEV-local-single-up.sh
- build_DEV.sh
- build_functions.sh
- dockerfile-app_streaming
  - src
    - main
      - scala
        com
        logimethods
        nats
        connector
        spark
        app
        SparkPredictionProcessor.scala
        SparkPredictionAccuracy.scala
        SparkProcessor.scala
        SparkPredictionTrainer.scala
        SparkPredictionOracle.scala
        SparkAlertProcessor.scala
        SparkTemperatureProcessor.scala
        DummyNatsTransmiter.scala
        SparkMaxProcessor.scala
  - Dockerfile.tpl
  - _docker_build.sh.tpl
  - LICENSE
  - project
    - build.sbt
    - plugins.sbt
  - spark
    - conf
      - log4j.properties
  - pom.xml.tpl
  - build.sbt
  - .dockerignore
  - entrypoint_insert.sh
- pull.sh
- concourse
  - credentials-template.yml
  - smart_meter-pipeline-FULL.yml
  - smart_meter-pipeline.yml
  - README.md
- cassandra-cluster.sh
- start-services.py
- export_grafana_datasources.sh
- XXX_build_push_remote.sh
- cqlsh.sh
- docker-local-single-up.sh
- read_from_cassandra.txt
- cassandra-shell.sh
- import_grafana_datasources.sh
- start-services_exec.sh
- wercker.yml
- README.md
- ruby_nats.sh
- scripts
  - compose_deploy.sh
  - compose_test.sh
  - docker_build.sh
  - complete_templates.sh
  - alt_properties
    - configuration-application.properties
  - compose_classic.sh
- run_spark_shell.sh
- cassandra-run.sh
- cassandra-inject.sh
- dockerfile-app_telegraf
  - Dockerfile.tpl
  - entrypoint_prepare.sh
  - script
    - cfstats.sh
    - collect_cfstats.sh
    - cassandra_count.sh
  - _docker_build.sh.tpl
  - LICENSE
  - conf
    - prediction.conf
    - cassandra_count.conf
    - temperature.conf
    - _cassandra_count.conf
    - max_voltage.conf
    - cassandra.conf
    - telegraf-complete.conf
    - cassandra_write_count.conf
- dockerfile-app_inject
  - src
    - main
      - scala
        com
        logimethods
        smartmeter
        generate
        Profile.scala
        TemperatureProvider.scala
        TimeProvider.scala
        ValueProvider.scala
        InterpolatedProfile.scala
    - test
      - scala
        com
        logimethods
        smartmeter
        generate
        TimeProviderTest.scala
        TemperatureProviderTest.scala
        ValueProviderTest.scala
  - biasPerDay.xlsx
  - Dockerfile.tpl
  - user-files
    - simulations
      - nats
        NatsStreamingInjection.scala
        NatsInjection.scala
  - Dockerfile_post
  - LICENSE
  - project
    - build.sbt
    - plugins.sbt
  - pom.xml.tpl
  - Dockerfile_pre
  - build.sbt
  - .gitignore
  - conf
    - gatling.conf
  - entrypoint_insert.sh
- .gitignore
- app_cassandra_inject
  - go
    - src
      - app
        main.go
    - convert.txt
  - LICENSE
  - Dockerfile
  - entrypoint_insert.sh
- aws
  - Docker for AWS 1.13.1 (ga-2) - FIXED.tmpl
  - Docker for AWS 1.13.1 (ga-2).tmpl
- build.sh
- docker-cassandra-compose.yml
- docker-compose.yml
- build_LATEST.sh
- dockerfile-app_batch
  - src
    - main
      - resources
        log4j.properties
      - scala
        com
        logimethods
        nats
        connector
        spark
        app
        SparkBatch.scala
  - Dockerfile.tpl
  - LICENSE
  - project
    - assembly.sbt
    - build.sbt
    - plugins.sbt
  - build.sbt

/*******************************************************************************
 * Copyright (c) 2016 Logimethods
 * All rights reserved. This program and the accompanying materials
 * are made available under the terms of the MIT License (MIT)
 * which accompanies this distribution, and is available at
 * http://opensource.org/licenses/MIT
 *******************************************************************************/

package com.logimethods.nats.connector.spark.app

import java.util.Properties;
import java.io.File
import java.io.Serializable

import org.apache.spark.SparkConf
import org.apache.spark.SparkContext
import org.apache.spark.storage.StorageLevel;
import org.apache.spark.streaming._

import io.nats.client.ConnectionFactory._
import java.nio.ByteBuffer

import org.apache.log4j.{Level, LogManager, PropertyConfigurator}

import com.logimethods.connector.nats.to_spark._
import com.logimethods.scala.connector.spark.to_nats._

import org.apache.spark.ml.classification.MultilayerPerceptronClassifier
import org.apache.spark.ml.evaluation.MulticlassClassificationEvaluator

import java.util.function._

import java.time.{LocalDateTime, ZoneOffset}
import java.time.DayOfWeek._

import org.apache.spark.ml.classification.MultilayerPerceptronClassificationModel

/**
 * Application entry point that keeps retraining the prediction model in the background.
 *
 * At start-up it calls `setup(args)` and reads the `STREAMING_DURATION` environment variable
 * (used as a pause in milliseconds, default "2000"). It then starts a thread that loops forever:
 *
 *  1. fetches the training data with `SparkPredictionProcessor.getData(sc, THRESHOLD)`,
 *  2. fits `trainer` on that data,
 *  3. overwrites the model saved at `PREDICTION_MODEL_PATH`,
 *  4. pauses for `streamingDuration` milliseconds.
 *
 * `log`, `setup`, `trainer`, `THRESHOLD` and `PREDICTION_MODEL_PATH` are not defined in this file;
 * presumably they are inherited from `SparkPredictionProcessor` -- confirm against that trait.
 */
object SparkPredictionTrainer extends App with SparkPredictionProcessor {
  import scala.util.control.NonFatal

  log.setLevel(Level.WARN)

  val (properties, targets, logLevel, sc, inputNatsStreaming, inputSubject, outputSubject, clusterId, outputNatsStreaming, natsUrl) = setup(args)

  // Pause between two training rounds, in milliseconds (it is handed to Thread.sleep below).
  val streamingDuration = scala.util.Properties.envOrElse("STREAMING_DURATION", "2000").toInt
  println("STREAMING_DURATION = " + streamingDuration)

  new Thread(new Runnable {
    override def run(): Unit = {
      while (true) {
        try {
          val data = SparkPredictionProcessor.getData(sc, THRESHOLD)
          val model = trainer.fit(data)
          model.write.overwrite.save(PREDICTION_MODEL_PATH)
          println("New model of size " + data.count() + " trained: " + model.uid)
        } catch {
          // Only recoverable failures are absorbed so that the next round can retry.
          // Fatal JVM errors and thread interruption are allowed to terminate the thread.
          // Passing the exception as second argument keeps its stack trace in the log.
          case NonFatal(e) => log.error("Training of the prediction model failed", e)
        }
        // The pause is outside the try so that a failing round is throttled as well,
        // instead of being retried immediately in a tight loop.
        Thread.sleep(streamingDuration)
      }
    }
  }).start()
}