python source code of mnist

sagemaker-python-sdk-master
- NOTICE.txt
- .github
  - PULL_REQUEST_TEMPLATE.md
  - ISSUE_TEMPLATE
    - documentation-request.md
    - feature_request.md
    - bug_report.md
    - config.yml
- src
  - sagemaker
    - predictor.py
    - debugger.py
    - sparkml
      - model.py
      - __init__.py
    - analytics.py
    - estimator.py
    - transformer.py
    - exceptions.py
    - pipeline.py
    - vpc_utils.py
    - multidatamodel.py
    - mxnet
      - estimator.py
      - model.py
      - __init__.py
      - defaults.py
    - job.py
    - algorithm.py
    - cli
      - mxnet.py
      - common.py
      - __init__.py
      - main.py
      - tensorflow.py
    - workflow
      - README.rst
      - __init__.py
      - airflow.py
    - tuner.py
    - inputs.py
    - automl
      - README.rst
      - automl.py
      - __init__.py
      - candidate_estimator.py
    - processing.py
    - rl
      - estimator.py
      - __init__.py
    - pytorch
      - estimator.py
      - model.py
      - __init__.py
      - defaults.py
    - amazon
      - object2vec.py
      - ipinsights.py
      - ntm.py
      - amazon_estimator.py
      - linear_learner.py
      - record_pb2.py
      - validation.py
      - README.rst
      - lda.py
      - common.py
      - __init__.py
      - hyperparameter.py
      - knn.py
      - randomcutforest.py
      - kmeans.py
      - factorization_machines.py
      - pca.py
    - xgboost
      - estimator.py
      - README.rst
      - model.py
      - __init__.py
      - defaults.py
    - s3.py
    - fw_utils.py
    - model.py
    - git_utils.py
    - sklearn
      - estimator.py
      - processing.py
      - model.py
      - __init__.py
      - defaults.py
    - __init__.py
    - utils.py
    - parameter.py
    - local
      - data.py
      - entities.py
      - image.py
      - local_session.py
      - __init__.py
      - utils.py
    - fw_registry.py
    - user_agent.py
    - model_monitor
      - monitoring_files.py
      - cron_expression_generator.py
      - dataset_format.py
      - data_capture_config.py
      - model_monitoring.py
      - __init__.py
    - tensorflow
      - predictor.py
      - tensorflow_serving
        apis
        prediction_service_pb2.py
        model_service_pb2.py
        input_pb2.py
        predict_pb2.py
        get_model_metadata_pb2.py
        inference_pb2.py
        regression_pb2.py
        model_pb2.py
        model_service_pb2_grpc.py
        __init__.py
        classification_pb2.py
        __init__.py
      - estimator.py
      - deploying_tensorflow_serving.rst
      - model.py
      - serving.py
      - __init__.py
      - defaults.py
    - session.py
    - content_types.py
    - chainer
      - estimator.py
      - model.py
      - __init__.py
      - defaults.py
    - network.py
    - logs.py
- buildspec-deploy.yml
- branding
  - icon
- .coveragerc
- examples
  - cli
    - train
      - hyperparameters.json
      - script.py
      - download_training_data.py
      - data
        training
        train-labels-idx1-ubyte.gz
        t10k-labels-idx1-ubyte.gz
      - run_training_example.sh
    - host
      - run_hosting_example.sh
      - script.py
      - data
        model.json
- buildspec-unittests.yml
- buildspec.yml
- .readthedocs.yml
- CONTRIBUTING.md
- .flake8
- CHANGELOG.md
- README.rst
- .pylintrc
- setup.py
- VERSION
- buildspec-localmodetests.yml
- setup.cfg
- buildspec-notebooktests.yml
- tests
  - integ
    - test_inference_pipeline.py
    - test_model_monitor.py
    - test_airflow_config.py
    - test_pytorch_train.py
    - test_data_upload.py
    - test_sparkml_serving.py
    - test_local_mode.py
    - test_object2vec.py
    - test_tf_efs_fsx.py
    - test_multidatamodel.py
    - test_marketplace.py
    - test_knn.py
    - test_processing.py
    - test_s3.py
    - auto_ml_utils.py
    - test_monitoring_files.py
    - test_data_capture_config.py
    - test_tuner_multi_algo.py
    - test_rl.py
    - test_chainer_train.py
    - test_kmeans_efs_fsx.py
    - test_ntm.py
    - test_pca.py
    - test_transformer.py
    - kms_utils.py
    - test_horovod.py
    - test_ipinsights.py
    - vpc_test_utils.py
    - test_lda.py
    - test_neo_mxnet.py
    - test_experiments_analytics.py
    - file_system_input_utils.py
    - test_record_set.py
    - test_linear_learner.py
    - timeout.py
    - record_set.py
    - test_multi_variant_endpoint.py
    - test_session.py
    - test_auto_ml.py
    - test_source_dirs.py
    - __init__.py
    - test_randomcutforest.py
    - test_debugger.py
    - test_kmeans.py
    - retry.py
    - test_sklearn_train.py
    - marketplace_utils.py
    - test_mxnet_train.py
    - test_tfs.py
    - test_git.py
    - test_factorization_machines.py
    - test_byo_estimator.py
    - s3_utils.py
    - lock.py
    - test_tuner.py
    - test_tf_script_mode.py
  - data
    - ipinsights
      - train.csv
    - with_integers.csv
    - chainer_mnist
      - mnist.py
      - test
      - train
      - distributed_mnist.py
    - protobuf_data
    - sparkml_xgboost_pipeline
      - valid_input.csv
      - invalid_input.csv
    - ray_cartpole
      - train_ray.py
    - one_p_mnist
      - transform_input.csv
      - first_10_rows_recordio
    - pytorch_eia
      - empty_inference_script.py
      - model_mnist.tar.gz
    - xgboost_model
      - xgb_model.tar.gz
    - pytorch_source_dirs
      - train.py
    - marketplace
      - training
        iris.csv
      - transform
        batchtransform_test.csv
    - sparkml_model
      - mleap_model.tar.gz
    - upload_data_tests
      - file2.py
      - file1.py
      - nested_dir
        file3.py
        file4.py
    - sklearn_mnist
      - mnist.py
      - test
      - failure_script.py
      - __init__.py
      - train
    - automl
      - data
        iris_test.csv
        iris_transform.csv
        iris_training.csv
    - tensorflow_mnist
      - mnist.py
      - data
        eval_labels.npy
        train_labels.npy
      - transform
        data.csv
    - dummy_input.txt
    - ntm
    - coach_cartpole
      - mxnet_deploy.py
      - preset_cartpole_clippedppo.py
      - train_coach.py
    - object2vec
      - train.jsonl
    - tensorflow-serving-test-model.tar.gz
    - monitor
      - constraint_violations.json
      - statistics.json
      - baseline_dataset.csv
      - preprocessor.py
      - postprocessor.py
      - constraints.json
      - captured-data.jsonl
    - mxnet_mnist
      - mnist_gluon.py
      - my_custom_rule.py
      - mnist_neo.py
      - mnist.py
      - test
        labels.gz
      - failure_script.py
      - model
        symbol
      - train
        labels.gz
      - mnist_hosting_with_custom_handlers.py
      - transform
        data.csv
    - iris
      - iris-dnn-classifier.py
      - failure_script.py
      - data
        iris_test.csv
        iris_training.csv
    - tf-iris-model.tar.gz
    - sagemaker_rl
      - coach_launcher.py
      - configuration_list.py
      - __init__.py
    - pytorch_mnist
      - training
        MNIST
        processed
      - mnist.py
      - packed_model.tar.gz
      - model.tar.gz
      - transform
    - dummy_script.py
    - tfs
      - tfs-test-entrypoint-with-handler
        training.py
        123
        variables
        variables.data-00000-of-00001
        variables.index
        saved_model.pb
        assets
        foo.txt
        inference.py
      - tfs-test-model-with-inference
        code
        inference.py
        00000123
        variables
        variables.data-00000-of-00001
        variables.index
        saved_model.pb
        assets
        foo.txt
      - tfs-test-entrypoint-and-dependencies
        inference.py
        dependency.py
    - horovod
      - launcher.sh
      - hvd_basic.py
    - dummy_requirements.txt
    - multimodel
      - container
        model_handler.py
        dockerd-entrypoint.py
        Dockerfile
    - lda
  - __init__.py
  - component
    - test_mxnet_estimator.py
    - __init__.py
    - test_tf_estimator.py
  - scripts
    - run-notebook-test.sh
    - fs_mount_setup.sh
  - unit
    - test_predictor.py
    - test_chainer.py
    - output_capturer.py
    - test_fm.py
    - test_utils.py
    - test_exception_on_bad_status.py
    - test_vpc_utils.py
    - test_sparkml_serving.py
    - test_amazon_estimator.py
    - test_fw_utils.py
    - test_upload_string_as_file_body.py
    - test_local_utils.py
    - test_object2vec.py
    - test_algorithm.py
    - test_endpoint_from_job.py
    - test_job.py
    - sagemaker
      - automl
        test_auto_ml.py
      - monitor
        test_data_capture_config.py
        test_cron_expression_generator.py
        __init__.py
        test_model_monitoring.py
      - __init__.py
      - model
        test_framework_model.py
        test_model_package.py
        test_model.py
        test_deploy.py
        test_neo.py
    - test_sync_directories.py
    - test_multidatamodel.py
    - test_endpoint_from_model_data.py
    - test_local_data.py
    - test_analytics.py
    - test_knn.py
    - test_processing.py
    - test_s3.py
    - test_git_utils.py
    - test_local_entities.py
    - test_rl.py
    - test_image.py
    - test_estimator.py
    - test_ntm.py
    - test_airflow.py
    - test_pca.py
    - test_transformer.py
    - test_hyperparameter.py
    - test_ipinsights.py
    - test_lda.py
    - test_inputs.py
    - test_init.py
    - test_common.py
    - test_xgboost.py
    - test_experiments_analytics.py
    - test_local_session.py
    - test_sklearn.py
    - test_linear_learner.py
    - test_default_bucket.py
    - test_create_deploy_entities.py
    - test_tf_predictor.py
    - test_session.py
    - test_cli.py
    - test_fw_registry.py
    - test_mxnet.py
    - __init__.py
    - test_randomcutforest.py
    - tuner_test_utils.py
    - test_upload_data.py
    - test_kmeans.py
    - test_timeout.py
    - test_pipeline_model.py
    - test_tf_estimator.py
    - test_pytorch.py
    - test_tfs.py
    - test_tuner.py
  - conftest.py
- CODE_OF_CONDUCT.md
- bin
  - README
  - sagemaker-submit
- .codecov.yml
- .gitignore
- LICENSE.txt
- buildspec-release.yml
- MANIFEST.in
- ci-scripts
  - queue_build.py
  - displaytime.sh
- doc
  - Makefile
  - make.bat
  - amazon_sagemaker_debugger.rst
  - amazon_sagemaker_model_monitoring.rst
  - amazon_sagemaker_processing.rst
  - api
    - training
      - analytics.rst
      - estimators.rst
      - debugger.rst
      - parameter.rst
      - automl.rst
      - index.rst
      - algorithm.rst
      - processing.rst
      - tuner.rst
    - utility
      - inputs.rst
      - session.rst
      - index.rst
      - s3.rst
      - network.rst
    - index.rst
    - inference
      - multi_data_model.rst
      - transformer.rst
      - predictors.rst
      - index.rst
      - model_monitor.rst
      - model.rst
      - pipeline.rst
  - algorithms
    - linear_learner.rst
    - sagemaker.amazon.amazon_estimator.rst
    - factorization_machines.rst
    - knn.rst
    - ipinsights.rst
    - pca.rst
    - lda.rst
    - ntm.rst
    - index.rst
    - object2vec.rst
    - randomcutforest.rst
    - kmeans.rst
  - overview.rst
  - frameworks
    - sparkml
      - index.rst
      - sagemaker.sparkml.rst
    - mxnet
      - sagemaker.mxnet.rst
      - index.rst
      - using_mxnet.rst
    - rl
      - sagemaker.rl.rst
      - using_rl.rst
      - index.rst
    - pytorch
      - sagemaker.pytorch.rst
      - using_pytorch.rst
      - index.rst
    - xgboost
      - index.rst
      - xgboost.rst
      - using_xgboost.rst
    - sklearn
      - using_sklearn.rst
      - sagemaker.sklearn.rst
      - index.rst
    - index.rst
    - tensorflow
      - sagemaker.tensorflow.rst
      - using_tf.rst
      - index.rst
    - chainer
      - using_chainer.rst
      - sagemaker.chainer.rst
      - index.rst
  - workflows
    - airflow
      - sagemaker.workflow.airflow.rst
      - index.rst
      - using_workflow.rst
    - step_functions
      - index.rst
    - index.rst
    - kubernetes
      - amazon_sagemaker_components_for_kubeflow_pipelines.rst
      - using_amazon_sagemaker_components.rst
      - amazon_sagemaker_jobs.rst
      - amazon_sagemaker_operators_for_kubernetes.rst
      - index.rst
  - requirements.txt
  - index.rst
  - conf.py
  - _static
    - js
      - analytics.js
- tox.ini

# Standard Library
import argparse
import random

# Third Party
import mxnet as mx
import numpy as np
from mxnet import autograd, gluon
from mxnet.gluon import nn


def _str_to_bool(value):
    """Convert a command-line string into a bool for use as an argparse ``type``.

    ``type=bool`` must not be used for this: argparse calls ``bool()`` on the
    raw string, and every non-empty string (including ``"False"``) is truthy.

    Args:
        value: The raw argument string (a bool is passed through unchanged).

    Returns:
        bool: The parsed value.

    Raises:
        argparse.ArgumentTypeError: If the string is not a recognized boolean.
    """
    if isinstance(value, bool):
        return value
    normalized = value.strip().lower()
    if normalized in ("true", "t", "yes", "y", "on", "1"):
        return True
    # The empty string stays False, matching what ``bool("")`` used to yield.
    if normalized in ("false", "f", "no", "n", "off", "0", ""):
        return False
    raise argparse.ArgumentTypeError("Expected a boolean value, got %r" % (value,))


def parse_args():
    """Parse the command-line options of the training script.

    Returns:
        argparse.Namespace: With attributes ``batch_size`` (int, default 256),
        ``epochs`` (int, default 1), ``learning_rate`` (float, default 0.1),
        ``context`` (str, default ``"cpu"``) and ``validate`` (bool, default True).
    """
    parser = argparse.ArgumentParser(
        description="Train a mxnet gluon model for MNIST dataset"
    )
    parser.add_argument("--batch-size", type=int, default=256, help="Batch size")
    parser.add_argument("--epochs", type=int, default=1, help="Number of Epochs")
    parser.add_argument("--learning_rate", type=float, default=0.1)
    parser.add_argument(
        "--context", type=str, default="cpu", help="Context can be either cpu or gpu"
    )
    # Use an explicit converter so that "--validate False" really yields False.
    parser.add_argument(
        "--validate",
        type=_str_to_bool,
        default=True,
        help="Run validation if running with smdebug",
    )

    return parser.parse_args()


def test(ctx, net, val_data):
    """Evaluate ``net`` over ``val_data`` and return the accumulated accuracy.

    Args:
        ctx: Context each batch and its labels are moved to before the forward pass.
        net: Callable model producing the outputs for a batch.
        val_data: Iterable yielding ``(data, label)`` pairs.

    Returns:
        The result of ``mx.metric.Accuracy().get()`` after all batches were seen
        (callers in this file unpack it as ``name, value``).
    """
    accuracy = mx.metric.Accuracy()
    for batch, targets in val_data:
        batch = batch.as_in_context(ctx)
        targets = targets.as_in_context(ctx)
        predictions = net(batch)
        accuracy.update([targets], [predictions])
    return accuracy.get()


def train_model(net, epochs, ctx, learning_rate, momentum, train_data, val_data):
    """Train ``net`` with SGD, printing training and validation accuracy per epoch.

    Args:
        net: Gluon model to train; its parameters are Xavier-initialized here on ``ctx``.
        epochs: Number of passes over ``train_data``.
        ctx: Context the parameters, batches and labels are placed on.
        learning_rate: Learning rate handed to the SGD trainer.
        momentum: Momentum handed to the SGD trainer.
        train_data: Iterable yielding ``(data, label)`` training batches.
        val_data: Iterable yielding ``(data, label)`` batches, evaluated via ``test``
            at the end of every epoch.
    """
    # Initialize every parameter of the network (and its children) on ctx.
    net.initialize(mx.init.Xavier(magnitude=2.24), ctx=ctx)

    # The trainer applies the gradient updates to the collected parameters.
    optimizer_params = {"learning_rate": learning_rate, "momentum": momentum}
    trainer = gluon.Trainer(net.collect_params(), "sgd", optimizer_params)
    train_accuracy = mx.metric.Accuracy()
    loss_fn = gluon.loss.SoftmaxCrossEntropyLoss()

    for epoch in range(epochs):
        # Accuracy is tracked per epoch, so start each epoch from a clean metric.
        train_accuracy.reset()
        for batch_idx, (data, label) in enumerate(train_data):
            # Move the batch to the target context if it is not already there.
            data = data.as_in_context(ctx)
            label = label.as_in_context(ctx)
            # Record the forward pass so the loss can be differentiated.
            with autograd.record():
                output = net(data)
                batch_loss = loss_fn(output, label)
                batch_loss.backward()
            # Gradient step, normalized by the number of samples in this batch.
            trainer.step(data.shape[0])
            train_accuracy.update([label], [output])

            # Progress report every 100 batches (skipping the very first one).
            if batch_idx > 0 and batch_idx % 100 == 0:
                metric_name, metric_value = train_accuracy.get()
                print(
                    "[Epoch %d Batch %d] Training: %s=%f"
                    % (epoch, batch_idx, metric_name, metric_value)
                )

        train_name, train_acc = train_accuracy.get()
        print("[Epoch %d] Training: %s=%f" % (epoch, train_name, train_acc))
        val_name, val_acc = test(ctx, net, val_data)
        print("[Epoch %d] Validation: %s=%f" % (epoch, val_name, val_acc))


def transformer(data, label):
    """Flatten a sample to 1-D float32 and divide it by 255; the label is untouched.

    Args:
        data: Array-like sample supporting ``reshape`` and ``astype``
            (presumably 8-bit image pixels, hence the 255 divisor -- confirm).
        label: Label belonging to the sample, returned as-is.

    Returns:
        tuple: ``(scaled_data, label)``.
    """
    flattened = data.reshape((-1,))
    scaled = flattened.astype(np.float32) / 255
    return scaled, label


def prepare_data(batch_size, root="/tmp"):
    """Create the MNIST training and validation data loaders.

    Args:
        batch_size: Number of samples per batch for both loaders.
        root: Directory handed to ``gluon.data.vision.MNIST`` as the dataset
            location. Defaults to ``"/tmp"``, the previously hard-coded value.

    Returns:
        tuple: ``(train_data, val_data)``. The training loader shuffles and
        discards the last incomplete batch; the validation loader does neither.
    """
    train_data = gluon.data.DataLoader(
        gluon.data.vision.MNIST(root, train=True, transform=transformer),
        batch_size=batch_size,
        shuffle=True,
        last_batch="discard",
    )

    val_data = gluon.data.DataLoader(
        gluon.data.vision.MNIST(root, train=False, transform=transformer),
        batch_size=batch_size,
        shuffle=False,
    )
    return train_data, val_data


# Create a model using the Gluon API. The hook currently
# supports MXNet Gluon models only.
def create_gluon_model():
    """Build the network: Dense(128, relu) -> Dense(64, relu) -> Dense(10).

    Returns:
        nn.Sequential: The assembled model; parameters are not initialized here.
    """
    model = nn.Sequential()
    with model.name_scope():
        # Hidden layers, added in order from widest to narrowest.
        for units in (128, 64):
            model.add(nn.Dense(units, activation="relu"))
        # Output layer: 10 units, no activation.
        model.add(nn.Dense(10))
    return model


def main():
    """Script entry point: parse options, seed the RNGs, build and train the model."""
    options = parse_args()

    # Fixed seeds for the MXNet, Python and NumPy random number generators.
    mx.random.seed(128)
    random.seed(12)
    np.random.seed(2)

    # Anything other than "cpu" (case-insensitive) selects the GPU context.
    if options.context.lower() == "cpu":
        device = mx.cpu()
    else:
        device = mx.gpu()

    # Build the Gluon model.
    model = create_gluon_model()

    # Load the data and run the training.
    train_loader, val_loader = prepare_data(options.batch_size)
    train_model(
        net=model,
        epochs=options.epochs,
        ctx=device,
        learning_rate=options.learning_rate,
        momentum=0.9,
        train_data=train_loader,
        val_data=val_loader,
    )


# Run the training only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()