Python source code of benchmark_empirical_kde

Project: Conditional_Density_Estimation (GitHub Link)

Conditional_Density_Estimation-master
- cde
  - utils
    - misc.py
    - serializable.py
    - tf_utils
      - map_inference.py
      - layers_powered.py
      - adamW.py
      - layers.py
      - __init__.py
      - tensor_utils.py
      - network.py
      - parameterized.py
    - optimizers.py
    - distribution.py
    - center_point_select.py
    - io.py
    - __init__.py
    - async_executor.py
    - integration.py
  - model_fitting
    - GoodnessOfFit.py
    - GoodnessOfFitSingleResult.py
    - sim_eval.py
    - GoodnessOfFitLogProb.py
    - plotting.py
    - __init__.py
    - GoodnessOfFitResults.py
    - ConfigRunner.py
    - divergences.py
    - ConfigRunnerLogProb.py
  - evaluation
    - simulation_eval
      - question5_regularisation_KMN.py
      - hyperparam_sweep_nonparametrics.py
      - question8_benchmark.py
      - question4_benchmark_econ_density.py
      - question4_benchmark_arma_jump.py
      - question4_benchmark_student5dim.py
      - question5_regularisation_MDN.py
      - question7_regularization_logprobs.py
      - question4_benchmark_student10dim.py
      - question3_NNvsCKDE_Arma_Skew.py
      - question3_NNvsCKDE_Econ_GMM.py
      - question1_noise_reg_xy.py
      - base_experiment.py
      - question4_benchmark_skew.py
      - __init__.py
      - hyperparam_sweep.py
      - question5_regularisation_NF.py
      - plotting
        - question5_plots.py
        - hyperparam_sweep_plots.py
        - question2_plots.py
        - question8_plots.py
        - question4_plots.py
        - question1_plots.py
        - question6_plots.py
        - question7_plots.py
        - question3_plots.py
        - question1_v1_plots.py
      - question2_entropy_reg.py
      - question6_noise_schedules.py
    - eurostoxx_eval
      - empirical_benchmark.py
      - load_dataset.py
      - noise_reg_plots.py
      - underest_of_variance.py
      - fit_density.py
      - __init__.py
      - feature_selection.py
      - moments_time_series.py
    - empirical_eval
      - benchmark_empirical_kde.py
      - datasets.py
      - __init__.py
      - experiment_util.py
      - regularization_empirical.py
      - benchmark_empirical.py
    - __init__.py
  - BaseConditionalDensity.py
  - density_simulation
    - JumpDiffusionModel.py
    - LinearGaussian.py
    - BaseConditionalDensitySimulation.py
    - ArmaJump.py
    - __init__.py
    - toy_densities.py
    - LinearStudentT.py
    - EconDensity.py
    - SkewNormal.py
    - GMM.py
  - __init__.py
  - density_estimator
    - NF.py
    - BaseNNMixtureEstimator.py
    - LSCDE.py
    - CKDE.py
    - BaseDensityEstimator.py
    - NKDE.py
    - normalizing_flows
      - IdentityFlow.py
      - BaseNormalizingFlow.py
      - PlanarFlow.py
      - AffineFlow.py
      - __init__.py
      - RadialFlow.py
    - BaseNNEstimator.py
    - KMN.py
    - __init__.py
    - MDN.py
- notes.txt
- config.py
- LICENSE
- demo.py
- .gitattributes
- setup.py
- .travis.yml
- README.md
- tests
  - unittests_simulations.py
  - unittests_evaluations.py
  - unittests_utils.py
  - unittests_configrunner.py
  - unittests_io.py
  - dummies.py
  - unittests_normalizing_flows.py
  - __init__.py
  - unittests_estimators.py
- requirements.txt
- .gitignore
- docs
  - Makefile
  - source
    - density_simulation
      - skew_normal.rst
      - density_simulation.rst
      - arma_jump.rst
      - jump_diff.rst
      - gmm.rst
      - linear_gaussian.rst
      - econ_density.rst
    - density_estimator
      - ckde.rst
      - mdn.rst
      - lscde.rst
      - nf.rst
      - density_estimator.rst
      - normalizing_flows
        - identity.rst
        - radial.rst
        - affine.rst
        - planar.rst
      - nkde.rst
      - kmn.rst
    - index.rst
    - conf.py
  - .nojekyll
  - index.html
  - docs
    - html
      - .nojekyll
      - _sources
        index.rst.txt
        density_simulation
        econ_density.rst.txt
        linear_gaussian.rst.txt
        arma_jump.rst.txt
        gmm.rst.txt
        skew_normal.rst.txt
        jump_diff.rst.txt
        density_simulation.rst.txt
        density_estimator
        kmn.rst.txt
        ckde.rst.txt
        mdn.rst.txt
        nkde.rst.txt
        nf.rst.txt
        normalizing_flows
        radial.rst.txt
        affine.rst.txt
        planar.rst.txt
        identity.rst.txt
        density_estimator.rst.txt
        lscde.rst.txt
      - searchindex.js
      - _modules
        cde
        utils
        tf_utils
        layers_powered.html
        BaseConditionalDensity.html
        density_simulation
        EconDensity.html
        BaseConditionalDensitySimulation.html
        ArmaJump.html
        JumpDiffusionModel.html
        GMM.html
        LinearGaussian.html
        SkewNormal.html
        density_estimator
        CKDE.html
        BaseDensityEstimator.html
        BaseNNEstimator.html
        NF.html
        LSCDE.html
        KMN.html
        NKDE.html
        normalizing_flows
        RadialFlow.html
        IdentityFlow.html
        PlanarFlow.html
        AffineFlow.html
        MDN.html
        BaseNNMixtureEstimator.html
        sklearn
        base.html
        index.html
        tensorflow
        python
        ops
        distributions
        bijector_impl.html
      - _images
      - .buildinfo
      - objects.inv
      - genindex.html
      - density_simulation
        gmm.html
        linear_gaussian.html
        skew_normal.html
        density_simulation.html
        econ_density.html
        jump_diff.html
        arma_jump.html
      - py-modindex.html
      - density_estimator
        nkde.html
        ckde.html
        mdn.html
        lscde.html
        nf.html
        normalizing_flows
        radial.html
        planar.html
        affine.html
        identity.html
        kmn.html
        density_estimator.html
      - index.html
      - search.html
      - _static
        jquery.js
        basic.css
        pygments.css
        searchtools.js
        documentation_options.js
        language_data.js
        doctools.js
        fonts
        fontawesome-webfont.woff2
        fontawesome-webfont.woff
        fontawesome-webfont.eot
        RobotoSlab-Bold.ttf
        Lato
        lato-bold.woff2
        lato-bolditalic.woff2
        lato-italic.woff2
        lato-regular.woff2
        RobotoSlab
        roboto-slab-v7-bold.woff2
        roboto-slab-v7-regular.eot
        roboto-slab-v7-bold.ttf
        roboto-slab-v7-bold.eot
        roboto-slab-v7-regular.woff
        roboto-slab-v7-bold.woff
        roboto-slab-v7-regular.ttf
        roboto-slab-v7-regular.woff2
        Inconsolata.ttf
        Inconsolata-Bold.ttf
        RobotoSlab-Regular.ttf
        fontawesome-webfont.ttf
        Inconsolata-Regular.ttf
        underscore-1.3.1.js
        js
        theme.js
        modernizr.min.js
        underscore.js
        css
        badge_only.css
        theme.css

from cde.evaluation.empirical_eval.experiment_util import run_benchmark_train_test_fit_cv, run_benchmark_train_test_fit_cv_ml
import cde.evaluation.empirical_eval.datasets as datasets
from ml_logger import logger
import config
import pandas as pd

# Prefix handed to ``logger.configure`` for this experiment's log output.
EXP_PREFIX = 'benchmark_empirical_kde'


# Benchmark configurations keyed by a short model label. Every entry names the
# estimator together with the selection rule ('cv_ml' or 'normal_reference');
# note that CKDE takes it under 'bandwidth' and NKDE under 'param_selection'.
model_dict = dict(
    CKDE_cv_ml=dict(
        estimator='ConditionalKernelDensityEstimation',
        bandwidth='cv_ml',
    ),
    CKDE_normal_ref=dict(
        estimator='ConditionalKernelDensityEstimation',
        bandwidth='normal_reference',
    ),
    NKDE_cv_ml=dict(
        estimator='NeighborKernelDensityEstimation',
        param_selection='cv_ml',
    ),
    NKDE_normal_ref=dict(
        estimator='NeighborKernelDensityEstimation',
        param_selection='normal_reference',
    ),
)

def experiment():
    """Benchmark the KDE-based estimators on the empirical datasets.

    Configures the logger, runs ``run_benchmark_train_test_fit_cv_ml`` with
    every configuration in ``model_dict`` on EuroStoxx50, on the NYC taxi
    drop-off dataset and on the UCI datasets, concatenates the per-dataset
    results into a single frame and logs its string representation.
    """
    logger.configure(log_directory=config.DATA_DIR, prefix=EXP_PREFIX, color='green')

    # 1) EuroStoxx -- the only dataset whose splits are not shuffled
    dataset = datasets.EuroStoxx50()
    result_df = run_benchmark_train_test_fit_cv_ml(dataset, model_dict, n_train_valid_splits=3, shuffle_splits=False, seed=22)

    # 2) NYC Taxi
    # The benchmark call and the concat live inside the loop so that every
    # listed sample size is evaluated, not just the last one.
    for n_samples in [10000]:
        dataset = datasets.NCYTaxiDropoffPredict(n_samples=n_samples)
        df = run_benchmark_train_test_fit_cv_ml(dataset, model_dict, n_train_valid_splits=3, shuffle_splits=True, seed=22)
        result_df = pd.concat([result_df, df], ignore_index=True)

    # 3) UCI
    for dataset_class in [datasets.BostonHousing, datasets.Conrete, datasets.Energy]:
        dataset = dataset_class()
        df = run_benchmark_train_test_fit_cv_ml(dataset, model_dict, n_train_valid_splits=3, shuffle_splits=True, seed=22)
        result_df = pd.concat([result_df, df], ignore_index=True)

    logger.log('\n', str(result_df))

# Run the benchmark only when this file is executed as a script, not on import.
if __name__ == "__main__":
    experiment()