import os
# os.environ["CUDA_DEVICE_ORDER"]="0000:02:00.0"
# os.environ["CUDA_VISIBLE_DEVICES"] = "0"

from tensorflow.python.client import device_lib

print(device_lib.list_local_devices())

import os.path
import scipy.io as sio
import numpy as np
import math
import keras
from keras.layers import Input
import keras.backend as K
from keras.layers import Conv2D
from keras.layers import Conv3D
from keras.layers import BatchNormalization
from keras.layers import GlobalAveragePooling2D
from keras.layers import GlobalAveragePooling3D
from keras.layers.core import Dense, Activation, Flatten
from keras.models import Model
from keras.models import Sequential
from keras.layers.convolutional import Convolution2D
from keras.callbacks import EarlyStopping
from keras.callbacks import LearningRateScheduler
from keras.callbacks import ReduceLROnPlateau
from keras.callbacks import ModelCheckpoint
from keras.models import model_from_json
from keras.regularizers import l2  # , activity_l2

from keras.optimizers import SGD
from networks.multiclass.SENets.deep_residual_learning_blocks import *
from DLart.Constants_DLart import *
from utils.image_preprocessing import ImageDataGenerator
from utils.LivePlotCallback import LivePlotCallback
from matplotlib import pyplot as plt

from networks.multiclass.SENets.densely_connected_cnn_blocks import *


def createModel(patchSize, numClasses):
    if K.image_data_format() == 'channels_last':
        bn_axis = -1
    else:
        bn_axis = 1

    growthRate_k = 12
    compressionFactor = 0.5
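
    # Filter bookkeeping (assuming the standard DenseNet behavior of the imported
    # dense_block_3D / transition_SE_layer_3D helpers): each dense block with
    # numLayers=7 and growthRate_k=12 adds 7 * 12 = 84 feature maps, and each
    # transition layer halves the count (compressionFactor=0.5), e.g.
    # 16 + 84 = 100 maps after block 1 -> 50 maps after its transition layer.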

    input_tensor = Input(shape=(patchSize[0], patchSize[1], patchSize[2], 1))

    # first conv layer
    x = Conv3D(16, (3, 3, 3), strides=(1, 1, 1), padding='same', kernel_initializer='he_normal')(input_tensor)

    # 1. Dense Block
    x, numFilters = dense_block_3D(x, numInputFilters=16, numLayers=7, growthRate_k=growthRate_k,
                                   bottleneck_enabled=True)

    # Transition Layer
    x, numFilters = transition_SE_layer_3D(x, numFilters, compressionFactor=compressionFactor, se_ratio=8)

    # 2. Dense Block
    x, numFilters = dense_block_3D(x, numInputFilters=numFilters, numLayers=7, growthRate_k=growthRate_k,
                                   bottleneck_enabled=True)

    # Transition Layer
    x, numFilters = transition_SE_layer_3D(x, numFilters, compressionFactor=compressionFactor, se_ratio=8)

    # 3. Dense Block
    x, numFilters = dense_block_3D(x, numInputFilters=numFilters, numLayers=7, growthRate_k=growthRate_k,
                                   bottleneck_enabled=True)

    # SE Block
    x = squeeze_excitation_block_3D(x, ratio=16)

    x = BatchNormalization(axis=bn_axis)(x)
    x = Activation('relu')(x)

    # global average pooling
    x = GlobalAveragePooling3D(data_format='channels_last')(x)

    # fully-connected layer
    output = Dense(units=numClasses,
                   activation='softmax',
                   kernel_initializer='he_normal',
                   name='fully-connected')(x)

    # create model
    sModelName = '3D-DenseNet-34'
    cnn = Model(input_tensor, output, name=sModelName)

    return cnn, sModelName
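

# Example (sketch, hypothetical shapes): building the network for 32x32x16
# patches with 3 output classes and printing the layer summary.
#   model, name = createModel(patchSize=[32, 32, 16], numClasses=3)
#   model.summary()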


def fTrain(X_train=None, y_train=None, X_valid=None, y_valid=None, X_test=None, y_test=None, sOutPath=None, patchSize=0,
           batchSizes=None, learningRates=None, iEpochs=None, dlart_handle=None):
    # grid search over batch sizes and learning rates is currently disabled
    # (see the commented loop below); only the first entry of each list is used
    batchSize = batchSizes[0]
    learningRate = learningRates[0]

    # add a color-channel dimension -> a single channel for grayscale patches
    X_train = np.expand_dims(X_train, axis=-1)
    X_test = np.expand_dims(X_test, axis=-1)

    if X_valid is not None and y_valid is not None:
        X_valid = np.expand_dims(X_valid, axis=-1)

    # y_train = np.asarray([y_train[:], np.abs(np.asarray(y_train[:], dtype=np.float32) - 1)]).T
    # y_test = np.asarray([y_test[:], np.abs(np.asarray(y_test[:], dtype=np.float32) - 1)]).T

    # number of classes
    numClasses = np.shape(y_train)[1]

    # create cnn model
    cnn, sModelName = createModel(patchSize=patchSize, numClasses=numClasses)

    fTrainInner(cnn,
                sModelName,
                X_train=X_train,
                y_train=y_train,
                X_valid=X_valid,
                y_valid=y_valid,
                X_test=X_test,
                y_test=y_test,
                sOutPath=sOutPath,
                patchSize=patchSize,
                batchSize=batchSize,
                learningRate=learningRate,
                iEpochs=iEpochs,
                dlart_handle=dlart_handle)

    # release the TensorFlow graph/session memory before a potential next run
    K.clear_session()

    # for iBatch in batchSizes:
    #     for iLearn in learningRates:
    #         fTrainInner(cnn,
    #                     sModelName,
    #                     X_train=X_train,
    #                     y_train=y_train,
    #                     X_valid=X_valid,
    #                     y_valid=y_valid,
    #                     X_test=X_test,
    #                     y_test=y_test,
    #                     sOutPath=sOutPath,
    #                     patchSize=patchSize,
    #                     batchSize=iBatch,
    #                     learningRate=iLearn,
    #                     iEpochs=iEpochs,
    #                     dlart_handle=dlart_handle)
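

# Example (sketch, hypothetical values): a single training run; `handle` is
# assumed to be a configured DLart handle providing the optimizer choice and
# augmentation settings.
#   fTrain(X_train, y_train, X_valid, y_valid, X_test, y_test,
#          sOutPath='./output', patchSize=[40, 40, 10], batchSizes=[64],
#          learningRates=[0.01], iEpochs=300, dlart_handle=handle)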


def fTrainInner(cnn, modelName, X_train=None, y_train=None, X_valid=None, y_valid=None, X_test=None, y_test=None,
                sOutPath=None, patchSize=0, batchSize=None, learningRate=None, iEpochs=None, dlart_handle=None):
    print('Training CNN')
    print('with lr = ' + str(learningRate) + ' , batchSize = ' + str(batchSize))

    # save names
    _, sPath = os.path.splitdrive(sOutPath)
    sPath, sFilename = os.path.split(sPath)
    sFilename, sExt = os.path.splitext(sFilename)

    model_name = sOutPath + os.sep + sFilename + '_lr_' + str(learningRate) + '_bs_' + str(batchSize)
    weight_name = model_name + '_weights.h5'
    model_json = model_name + '.json'
    model_all = model_name + '_model.h5'
    model_mat = model_name + '.mat'

    if os.path.isfile(model_mat):  # no training if the output file already exists
        print('------- already trained -> go to next')
        return

    # create optimizer
    if dlart_handle is not None:
        if dlart_handle.getOptimizer() == SGD_OPTIMIZER:
            opti = keras.optimizers.SGD(lr=learningRate,
                                        momentum=dlart_handle.getMomentum(),
                                        decay=dlart_handle.getWeightDecay(),
                                        nesterov=dlart_handle.getNesterovEnabled())
        elif dlart_handle.getOptimizer() == RMS_PROP_OPTIMIZER:
            opti = keras.optimizers.RMSprop(lr=learningRate, decay=dlart_handle.getWeightDecay())
        elif dlart_handle.getOptimizer() == ADAGRAD_OPTIMIZER:
            opti = keras.optimizers.Adagrad(lr=learningRate, epsilon=None, decay=dlart_handle.getWeightDecay())
        elif dlart_handle.getOptimizer() == ADADELTA_OPTIMIZER:
            opti = keras.optimizers.Adadelta(lr=learningRate, rho=0.95, epsilon=None,
                                             decay=dlart_handle.getWeightDecay())
        elif dlart_handle.getOptimizer() == ADAM_OPTIMIZER:
            opti = keras.optimizers.Adam(lr=learningRate, beta_1=0.9, beta_2=0.999, epsilon=None,
                                         decay=dlart_handle.getWeightDecay())
        else:
            raise ValueError("Unknown Optimizer!")
    else:
        # opti = SGD(lr=learningRate, momentum=1e-8, decay=0.1, nesterov=True)
        # opti = keras.optimizers.Adagrad(lr=0.01, epsilon=1e-06)
        opti = keras.optimizers.Adam(lr=learningRate, beta_1=0.9, beta_2=0.999, epsilon=1e-08, decay=0.0)

    cnn.summary()

    # compile model
    cnn.compile(loss='categorical_crossentropy', optimizer=opti, metrics=['accuracy'])

    # callbacks
    callback_earlyStopping = EarlyStopping(monitor='val_loss', patience=10, verbose=1)
    # callback_tensorBoard = keras.callbacks.TensorBoard(log_dir=dlart_handle.getLearningOutputPath() + '/logs',
    #                                                    histogram_freq=2,
    #                                                    batch_size=batchSize,
    #                                                    write_graph=True,
    #                                                    write_grads=True,
    #                                                    write_images=True,
    #                                                    embeddings_freq=0,
    #                                                    embeddings_layer_names=None,
    #                                                    embeddings_metadata=None)

    callbacks = [callback_earlyStopping,
                 ModelCheckpoint(sOutPath + os.sep + 'checkpoints' + os.sep + 'checker.hdf5',
                                 monitor='val_acc',
                                 verbose=0,
                                 period=1,
                                 save_best_only=True),
                 LearningRateScheduler(schedule=step_decay, verbose=1),
                 LivePlotCallback(dlart_handle)]
    # callbacks.append(ReduceLROnPlateau(monitor='loss', factor=0.1, patience=5, min_lr=1e-4, verbose=1))

    # data augmentation
    if dlart_handle is not None and dlart_handle.getDataAugmentationEnabled():
        # Initialize Image Generator
        # all shifted and rotated images are filled with zero padded pixels
        datagen = ImageDataGenerator(
            featurewise_center=False,
            samplewise_center=False,
            featurewise_std_normalization=False,
            samplewise_std_normalization=False,
            zca_whitening=dlart_handle.getZCA_Whitening(),
            zca_epsilon=1e-6,
            rotation_range=dlart_handle.getRotation(),
            width_shift_range=dlart_handle.getWidthShift(),
            height_shift_range=dlart_handle.getHeightShift(),
            shear_range=0.,
            zoom_range=dlart_handle.getZoom(),
            channel_shift_range=0.,
            fill_mode='constant',
            cval=0.,
            horizontal_flip=dlart_handle.getHorizontalFlip(),
            vertical_flip=dlart_handle.getVerticalFlip(),
            rescale=None,
            histogram_equalization=dlart_handle.getHistogramEqualization(),
            contrast_stretching=dlart_handle.getContrastStretching(),
            adaptive_equalization=dlart_handle.getAdaptiveEqualization(),
            preprocessing_function=None,
            data_format=K.image_data_format()
        )

        # fit parameters from dataset
        datagen.fit(X_train)

        # fetch one augmented batch and preview the first 9 patches
        for x_batch, y_batch in datagen.flow(X_train, y_train, batch_size=9):
            for i in range(9):
                plt.subplot(330 + 1 + i)
                # x_batch has shape (batch, x, y, z, 1); show the central z-slice
                plt.imshow(x_batch[i, :, :, x_batch.shape[3] // 2, 0], cmap='gray')
            plt.show()
            break

        if X_valid is not None and y_valid is not None:
            # fit model on data
            # use validation/test split
            result = cnn.fit_generator(datagen.flow(X_train, y_train, batch_size=batchSize),
                                       steps_per_epoch=X_train.shape[0] // batchSize,
                                       epochs=iEpochs,
                                       validation_data=(X_valid, y_valid),
                                       callbacks=callbacks,
                                       workers=1,
                                       use_multiprocessing=False)
        else:
            # fit model on data
            # fall back to the test data for validation
            result = cnn.fit_generator(datagen.flow(X_train, y_train, batch_size=batchSize),
                                       steps_per_epoch=X_train.shape[0] // batchSize,
                                       epochs=iEpochs,
                                       validation_data=(X_test, y_test),
                                       callbacks=callbacks,
                                       workers=1,
                                       use_multiprocessing=False)

    else:
        if X_valid is None or y_valid is None:
            # no validation datasets -> validate on the test data
            result = cnn.fit(X_train,
                             y_train,
                             validation_data=(X_test, y_test),
                             epochs=iEpochs,
                             batch_size=batchSize,
                             callbacks=callbacks,
                             verbose=1)
        else:
            # using validation datasets
            result = cnn.fit(X_train,
                             y_train,
                             validation_data=(X_valid, y_valid),
                             epochs=iEpochs,
                             batch_size=batchSize,
                             callbacks=callbacks,
                             verbose=1)

    # return the loss value and metrics values for the model in test mode
    score_test, acc_test = cnn.evaluate(X_test, y_test, batch_size=batchSize, verbose=1)

    prob_test = cnn.predict(X_test, batch_size=batchSize, verbose=0)

    # save model
    json_string = cnn.to_json()
    with open(model_json, 'w') as jsonFile:
        jsonFile.write(json_string)

    # wei = cnn.get_weights()
    cnn.save_weights(weight_name, overwrite=True)
    cnn.save(model_all)  # keras > v0.7
    model_png_dir = sOutPath + os.sep + "model.png"
    from keras.utils import plot_model
    plot_model(cnn, to_file=model_png_dir, show_shapes=True, show_layer_names=True)

    # matlab
    acc = result.history['acc']
    loss = result.history['loss']
    val_acc = result.history['val_acc']
    val_loss = result.history['val_loss']

    print('Saving results: ' + model_name)
    sio.savemat(model_name, {'model_settings': model_json,
                             'model': model_all,
                             'weights': weight_name,
                             'acc': acc,
                             'loss': loss,
                             'val_acc': val_acc,
                             'val_loss': val_loss,
                             'score_test': score_test,
                             'acc_test': acc_test,
                             'prob_test': prob_test})
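
    # the saved .mat file can be inspected later, e.g.:
    #   stats = sio.loadmat(model_name)  # '.mat' is appended automatically
    #   print(stats['acc_test'])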


def step_decay(epoch, lr):
    # drop the learning rate by a factor of 10 at epochs 10, 20, 30 and 40
    drop = 0.1
    epochs_drop = 10
    print("Current learning rate: " + str(lr))
    if epoch in (epochs_drop, 2 * epochs_drop, 3 * epochs_drop, 4 * epochs_drop):
        lr = drop * lr
        print("Reducing learning rate by a factor of 10 to " + str(lr))

    return lr
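

# Worked example: with an initial learning rate of 0.01 the schedule yields
#   epochs  0-9 : 0.01
#   epochs 10-19: 0.001
#   epochs 20-29: 0.0001
# and a further 10x drop at epochs 30 and 40.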


def fPredict(X, y, sModelPath, sOutPath, batchSize=64):
    """Takes an already trained model and computes the loss and Accuracy over the samples X with their Labels y
    Input: X: Samples to predict on. The shape of X should fit to the input shape of the model y: Labels for the
    Samples. Number of Samples should be equal to the number of samples in X sModelPath: (String) full path to a
    trained keras model. It should be *_json.txt file. there has to be a corresponding *_weights.h5 file in the same
    directory! sOutPath: (String) full path for the Output. It is a *.mat file with the computed loss and accuracy
    stored. The Output file has the Path 'sOutPath'+ the filename of sModelPath without the '_json.txt' added the
    suffix '_pred.mat' batchSize: Batchsize, number of samples that are processed at once """
    sModelPath = sModelPath.replace("_json.txt", "")
    weight_name = sModelPath + '_weights.h5'
    model_json = sModelPath + '_json.txt'
    model_all = sModelPath + '_model.h5'

    # load the architecture from JSON, then the weights
    with open(model_json, 'r') as jsonFile:
        model_string = jsonFile.read()
    model = model_from_json(model_string)

    model.compile(loss='categorical_crossentropy', optimizer=keras.optimizers.Adam(), metrics=['accuracy'])
    model.load_weights(weight_name)

    score_test, acc_test = model.evaluate(X, y, batch_size=batchSize)
    print('loss: ' + str(score_test) + '   acc: ' + str(acc_test))
    prob_pre = model.predict(X, batch_size=batchSize, verbose=1)
    print(prob_pre[0:14, :])
    _, sModelFileSave = os.path.split(sModelPath)

    modelSave = sOutPath + os.sep + sModelFileSave + '_pred.mat'
    print('saving Model:{}'.format(modelSave))
    sio.savemat(modelSave, {'prob_pre': prob_pre, 'score_test': score_test, 'acc_test': acc_test})
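

# Example (sketch, hypothetical paths): evaluating a stored model on held-out data.
#   fPredict(X_test, y_test,
#            sModelPath='./output/model_lr_0.0001_bs_64_json.txt',
#            sOutPath='./output')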


###############################################################################
## OPTIMIZATIONS ##
###############################################################################
def fHyperasTrain(X_train, Y_train, X_test, Y_test, patchSize):
    # explicitly stated here instead of cnn = createModel() to allow optimization
    # (ported to the Keras 2 API; the channels-last input shape assumes 2D
    # grayscale patches with patchSize given as a 1xN matrix, as in the
    # commented block below)
    cnn = Sequential()
    #    cnn.add(Conv2D(32,
    #                   (14, 14),
    #                   kernel_initializer='normal',
    #                   # activation='sigmoid',
    #                   padding='valid',
    #                   strides=(1, 1),
    #                   kernel_regularizer=l2(1e-6),
    #                   input_shape=(patchSize[0, 0], patchSize[0, 1], 1)))
    #    cnn.add(Activation('relu'))

    cnn.add(Conv2D(32,  # 64
                   (7, 7),
                   kernel_initializer='normal',
                   # activation='sigmoid',
                   padding='valid',
                   strides=(1, 1),
                   kernel_regularizer=l2(1e-6),
                   input_shape=(patchSize[0, 0], patchSize[0, 1], 1)))
    cnn.add(Activation('relu'))

    cnn.add(Conv2D(64,  # learning rate: 0.1 -> 76%
                   (3, 3),
                   kernel_initializer='normal',
                   # activation='sigmoid',
                   padding='valid',
                   strides=(1, 1),
                   kernel_regularizer=l2(1e-6)))
    cnn.add(Activation('relu'))

    cnn.add(Conv2D(128,  # learning rate: 0.1 -> 76%
                   (3, 3),
                   kernel_initializer='normal',
                   # activation='sigmoid',
                   padding='valid',
                   strides=(1, 1),
                   kernel_regularizer=l2(1e-6)))
    cnn.add(Activation('relu'))

    # cnn.add(MaxPooling2D(pool_size=(2, 2), strides=None, padding='valid'))

    cnn.add(Flatten())
    # cnn.add(Dense(units=100,
    #               kernel_initializer='normal',
    #               # activation='sigmoid',
    #               kernel_regularizer='l2'))
    # cnn.add(Activation('sigmoid'))
    cnn.add(Dense(units=2,
                  kernel_initializer='normal',
                  # activation = 'sigmoid',
                  kernel_regularizer='l2'))
    cnn.add(Activation('softmax'))

    # opti = SGD(lr={{choice([0.1, 0.01, 0.05, 0.005, 0.001])}}, momentum=1e-8, decay=0.1, nesterov=True)
    opti = SGD(lr=0.01, momentum=1e-8, decay=0.1, nesterov=True)  # fixed lr; see search space above
    cnn.compile(loss='categorical_crossentropy', optimizer=opti, metrics=['accuracy'])

    epochs = 300

    result = cnn.fit(X_train, Y_train,
                     batch_size=128,  # {{choice([64, 128])}}
                     epochs=epochs,
                     verbose=2,
                     validation_data=(X_test, Y_test))
    score_test, acc_test = cnn.evaluate(X_test, Y_test, verbose=0)

    # return {'loss': -acc_test, 'status': STATUS_OK, 'model': cnn, 'trainresult': result, 'score_test': score_test}


## helper functions
def drange(start, stop, step):
    # yield start, start + step, ... while the value is below stop
    r = start
    while r < stop:
        yield r
        r += step
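

# Example: list(drange(0.0, 0.5, 0.1)) yields [0.0, 0.1, 0.2, ...]; repeated
# float addition accumulates rounding error in the later values.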