python source code of imagenet

tpu_models-master
- LICENSE
- models
  - samples
    - core
      - get_started
        custom_tpuestimator.py
        iris_data_tpu.py
  - official
    - squeezenet
      - data_pipeline.py
      - squeezenet_model.py
      - squeezenet_main.py
      - configs
        squeezenet_config.py
        __init__.py
    - densenet
      - vgg_preprocessing.py
      - densenet_model.py
      - README.md
      - densenet_imagenet.py
    - unet3d
      - input_reader.py
      - tpu_executor.py
      - unet_model.py
      - metrics.py
      - params_dict.py
      - data_preprocess
        convert_lits.py
        convert_lits_nii_to_npy.py
      - unet_config.py
      - unet_main.py
      - README.md
      - requirements.txt
      - export_saved_model.py
      - saved_model_inference.py
    - detection
      - utils
        autoaugment_utils.py
        input_utils.py
        spatial_transform.py
        __init__.py
        object_detection
        balanced_positive_negative_sampler.py
        region_similarity_calculator.py
        ops.py
        visualization_utils.py
        shape_utils.py
        target_assigner.py
        preprocessor.py
        minibatch_sampler.py
        box_list_ops.py
        box_list.py
        faster_rcnn_box_coder.py
        argmax_matcher.py
        matcher.py
        box_coder.py
        __init__.py
        box_utils.py
        segm_utils.py
      - modeling
        retinanet_model.py
        learning_rates.py
        factory.py
        base_model.py
        postprocess.py
        losses.py
        architecture
        efficientnet_builder.py
        efficientnet_model.py
        fpn.py
        identity.py
        factory.py
        seresnext.py
        resnet.py
        heads.py
        nasfpn.py
        __init__.py
        utils.py
        nn_ops.py
        serving.py
        __init__.py
        checkpoint_utils.py
        model_builder.py
      - executor
        tpu_executor.py
        __init__.py
      - dataloader
        input_reader.py
        anchor.py
        retinanet_parser.py
        factory.py
        __init__.py
        tf_example_decoder.py
        shapemask_parser.py
        mode_keys.py
      - evaluation
        factory.py
        coco_utils.py
        __init__.py
        coco_evaluator.py
      - k8s
        retinanet_k8s.yaml
      - configs
        yaml
        4.8.14_r152_pretrained_640_feat_300_drop_0.9_aug3.yaml
        2.0.5_nasfpn_resnet50_shorter.yaml
        4.1.1_effnet_b5_45k_90k_1024_feat_300.yaml
        2.6.1_r50_features_250_drop_0.7.yaml
        3.1.0_balanced_resnet50_step_45k.yaml
        2.3.1b_efficientnet_b5_resumed.yaml
        2.6.4_r50_features_250_drop_0.85.yaml
        1.0.0_retinanet.yaml
        4.2.2_effnet_b7_45k_90k_1024_feat_256_drop_0.9.yaml
        2.6.5_r50_features_300_drop_0.85.yaml
        2.0.0_nasfpn_resnet50.yaml
        4.5.5_effnet_b6_45k_90k_1024_feat_256_drop_0.85.yaml
        2.4.7_r50_cosine_10k_300_feat_drop_0.5.yaml
        4.1.0_effnet_b5_45k_90k_1024_batch_32.yaml
        2.1.0_nasfpn_resnet200_aug_v1.yaml
        2.6.10_r50_features_400_drop_0.5_1024.yaml
        4.1.10_effnet_b5_45k_90k_1024_feat_350_drop_0.9.yaml
        4.9.1_r101_step_45k_60k_feat_300_drop_0.9_aug0.yaml
        2.5.2_effnet_b5_cosine_10k_frozen_15.yaml
        2.0.4_nasfpn_resnet50_aug_v3.yaml
        2.2.0_nasfpn_seresnext50.yaml
        1.0.4_1024x768.yaml
        4.8.4_r50_step_45k_90k_1024.yaml
        4.0.3_r200_step_45k_90k_1024_drop_0.9.yaml
        4.1.6_effnet_b5_45k_90k_1024_feat_256_drop_0.9.yaml
        2.5.0_effnet_b5_cosine_10k.yaml
        4.5.7_effnet_b6_45k_90k_1024_feat_300_drop_0.85.yaml
        2.4.4_r50_cosine_10k_1024x1024.yaml
        4.8.0_r200_step_45k_90k_640_drop_0.9_aug1.yaml
        2.1.1_nasfpn_resnet200_aug_v3.yaml
        2.3.2_nasfpn_effnet_b7_clr.yaml
        4.8.5_r50_step_45k_90k_feat_300_drop_0.9.yaml
        2.4.5_r50_cosine_10k_128_feat.yaml
        2.4.6_r50_cosine_10k_384_feat.yaml
        4.3.0_effnet_b5_45k_90k_1024_frozen_25.yaml
        4.8.1_r152_step_45k_90k_800_drop_0.9_feat_300.yaml
        4.1.9_effnet_b5_45k_90k_1024_feat_350_drop_0.85.yaml
        4.5.9_effnet_b6_45k_90k_1024_feat_350_drop_0.85.yaml
        retinanet_autoaugment.yaml
        4.4.4_effnet_b7_45k_90k_1024_feat_300_drop_0.85.yaml
        2.6.0_r50_step_45k.yaml
        2.0.6_nasfpn_resnet50_cosine_lr1.yaml
        4.9.2_r200_pretrained_640_drop_0.9_aug1.yaml
        2.0.3_nasfpn_resnet200.yaml
        4.1.3_effnet_b5_45k_90k_1024_feat_400.yaml
        4.5.0_effnet_b6_45k_90k_1024_batch_32.yaml
        2.3.1_efficientnet_b5_pretrain.yaml
        4.5.1_effnet_b6_45k_90k_1024_feat_300.yaml
        4.1.5_effnet_b5_45k_90k_1024_feat_256_drop_0.85.yaml
        2.6.9_r50_features_512_drop_0.7_1024.yaml
        retinanet_nasfpn.yaml
        2.0.9a_nasfpn_resnet50_cosine_lr5.yaml
        4.0.2_r152_step_45k_90k_1024_drop_0.9.yaml
        4.8.8_r200_pretrained_640_drop_0.9_aug1.yaml
        1.1.0_added_lr_schedule.yaml
        4.8.9_r152_pretrained_640_drop_0.9_aug3.yaml
        2.3.3a_nasfpn_effnet_b7_resumed.yaml
        4.8.11_r101_pretrained_1024_feat_300_aug2.yaml
        4.2.3_effnet_b7_45k_90k_1024_feat_300_drop_0.9.yaml
        2.4.3_r50_cosine_10k_separable_aug_v3.yaml
        2.0.9_nasfpn_resnet50_cosine_lr4.yaml
        1.0.5_1024x1024.yaml
        2.6.7_r50_features_400_drop_0.7_1024.yaml
        1.3.1_resnet152.yaml
        2.3.3_nasfpn_effnet_b7_batch_32.yaml
        1.3.2_resnet200.yaml
        4.7.1_r50_cosine_10k_feat_300_drop_0.7.yaml
        4.0.0_r50_step_45k_90k_1024.yaml
        1.0.2_changed_schedule.yaml
        4.9.4_r152_pretrained_640_feat_300_drop_0.9_aug2.yaml
        2.1.4_nasfpn_resnet200_1024_aug_v3.yaml
        2.0.1_nasfpn_resnet101.yaml
        1.3.0_resnet101.yaml
        4.9.0_r50_step_45k_60k_feat_300_drop_0.9_aug2.yaml
        2.4.2_r50_cosine_10k_separable_aug_v1.yaml
        3.0.1_balanced_resnet50_cosine_20k.yaml
        3.0.2_balanced_resnet50_cosine_30k.yaml
        2.0.8_nasfpn_resnet50_cosine_lr3.yaml
        4.8.13_r200_pretrained_640_feat_300_drop_0.9_aug1.yaml
        4.7.0_r50_cosine_10k_1024.yaml
        4.8.6_r50_step_45k_90k_feat_300_drop_0.9_aug2.yaml
        4.6.0_r50_step_45k_60k_1024.yaml
        4.1.4_effnet_b5_45k_90k_1024_separable.yaml
        4.1.2_effnet_b5_45k_90k_1024_feat_350.yaml
        1.2.1_autoaugment_v1.yaml
        3.1.1_balanced_resnet50_step_30k.yaml
        4.9.3_r152_pretrained_640_drop_0.9_aug3.yaml
        2.6.2_r50_features_300_drop_0.7.yaml
        4.4.5_effnet_b7_45k_90k_1024_feat_350_drop_0.9.yaml
        2.5.1_effnet_b5_cosine_10k_frozen_10.yaml
        4.8.10_r101_pretrained_1024_feat_350_aug3.yaml
        2.5.4_effnet_b5_cosine_10k_frozen_15_640.yaml
        4.8.12_r200_pretrained_feat_300_aug3.yaml
        4.8.3_r101_step_45k_90k_1024_feat_300_aug2.yaml
        2.4.8_r50_cosine_10k_300_feat_drop_0.7.yaml
        2.5.5_effnet_b5_cosine_10k_frozen_15_640_sep.yaml
        1.2.0_autoaugment_v0.yaml
        2.1.2_nasfpn_resnet200_1024.yaml
        4.1.7_effnet_b5_45k_90k_1024_feat_300_drop_0.85.yaml
        4.8.2_r101_step_45k_90k_1024_feat_350_aug3.yaml
        4.5.4_effnet_b6_45k_90k_1024_separable.yaml
        4.5.3_effnet_b6_45k_90k_1024_feat_400.yaml
        2.3.0_nasfpn_efficientnet_b5.yaml
        3.0.0_balanced_resnet50_cosine_10k.yaml
        4.5.6_effnet_b6_45k_90k_1024_feat_256_drop_0.9.yaml
        2.6.6_r50_features_400_drop_0.85.yaml
        4.6.1_r50_step_45k_60k_1024_drop_0.9.yaml
        2.0.7_nasfpn_resnet50_cosine_lr2.yaml
        1.2.2_autoaugment_v2.yaml
        4.2.4_effnet_b7_45k_90k_1024_frozen_25.yaml
        2.5.3_effnet_b5_cosine_10k_frozen_20.yaml
        1.2.3_autoaugment_v3.yaml
        2.4.1_r50_cosine_10k_separable_aug_v0.yaml
        2.5.6_effnet_b5_cosine_10k_frozen_15_640_sep_drop.yaml
        4.5.2_effnet_b6_45k_90k_1024_feat_350.yaml
        4.4.2_effnet_b7_45k_90k_1024_feat_256_drop_0.85.yaml
        4.4.3_effnet_b7_45k_90k_1024_feat_300_drop_0.9.yaml
        4.1.8_effnet_b5_45k_90k_1024_feat_300_drop_0.9.yaml
        4.4.1_effnet_b7_45k_90k_1024_feat_256_drop_0.9.yaml
        2.6.3_r50_features_400_drop_0.7.yaml
        1.0.1_fixed_val_batch.yaml
        4.0.1_r101_step_45k_90k_1024_drop_0.9.yaml
        4.5.10_effnet_b6_45k_90k_1024_feat_350_drop_0.9.yaml
        2.4.0_r50_cosine_10k.yaml
        4.8.7_r50_step_45k_90k_feat_350_drop_0.85_aug0.yaml
        2.0.2_nasfpn_resnet152.yaml
        4.4.0_effnet_b7_45k_90k_1024_batch_32.yaml
        4.2.1_effnet_b7_45k_90k_1024_frozen_20.yaml
        4.5.8_effnet_b6_45k_90k_1024_feat_300_drop_0.9.yaml
        4.4.6_effnet_b7_45k_90k_1024_feat_350_drop_0.85.yaml
        4.2.0_effnet_b7_45k_90k_1024.yaml
        1.0.3_constant.yaml
        2.1.3_nasfpn_resnet200_1024_aug_v1.yaml
        2.6.8_r50_features_400_drop_0.85_1024.yaml
        factory.py
        retinanet_config.py
        __init__.py
      - main.py
      - README.md
      - export_saved_model.py
    - transformer
      - README.md
    - mask_rcnn
      - learning_rates.py
      - postprocess_ops.py
      - fpn.py
      - evaluation.py
      - mask_rcnn_main.py
      - anchors.py
      - mask_rcnn_model.py
      - losses.py
      - resnet.py
      - distributed_executer.py
      - dataloader.py
      - coco_utils.py
      - tpu_normalization.py
      - heads.py
      - training_ops.py
      - spatial_transform_ops.py
      - serving.py
      - configs
        mask_rcnn_config.py
        cloud
        v2-128.yaml
        v3-128.yaml
        v3-8.yaml
        v2-32.yaml
        v3-32.yaml
        v2-8.yaml
        __init__.py
      - README.md
      - mask_rcnn_k8s.yaml
      - object_detection
        balanced_positive_negative_sampler.py
        region_similarity_calculator.py
        ops.py
        visualization_utils.py
        shape_utils.py
        target_assigner.py
        preprocessor.py
        minibatch_sampler.py
        box_list.py
        faster_rcnn_box_coder.py
        argmax_matcher.py
        matcher.py
        box_coder.py
        __init__.py
        tf_example_decoder.py
      - box_utils.py
      - export_saved_model.py
      - preprocess_ops.py
      - roi_ops.py
      - coco_metric.py
    - resnet
      - imagenet_input.py
      - lars_util.py
      - resnet_preprocessing.py
      - resnet_k8s.yaml
      - resnet_model_test.py
      - resnet_model.py
      - configs
        resnet101.yaml
        resnet_config.py
        resnet152.yaml
        cloud
        v2-128.yaml
        v3-1024.yaml
        v3-128.yaml
        v3-8.yaml
        v2-32.yaml
        v3-512.yaml
        v3-64.yaml
        v3-32.yaml
        v2-8.yaml
        v2-512.yaml
        v3-2048.yaml
        v3-256.yaml
        v2-256.yaml
        __init__.py
        resnet200.yaml
      - __init__.py
      - README.md
      - resnet_main.py
      - benchmark
        read_training_time.py
        resnet_benchmark.py
        __init__.py
        README.md
    - amoeba_net
      - amoeba_net.py
      - inception_preprocessing.py
      - network_utils_test.py
      - amoeba_net_k8s.yaml
      - amoeba_net_model.py
      - README.md
      - tf_hub.py
      - model_specs.py
      - model_builder.py
      - network_utils.py
    - retinanet
      - retinanet_model.py
      - retinanet_segmentation_main.py
      - retinanet_segmentation_model.py
      - retinanet_architecture.py
      - evaluation.py
      - anchors.py
      - postprocess.py
      - retinanet_k8s.yaml
      - dataloader.py
      - retinanet_tensorrt.py
      - README.md
      - object_detection
        region_similarity_calculator.py
        shape_utils.py
        target_assigner.py
        preprocessor.py
        box_list.py
        faster_rcnn_box_coder.py
        argmax_matcher.py
        matcher.py
        box_coder.py
        __init__.py
        tf_example_decoder.py
      - retinanet_main.py
      - coco_metric.py
    - mobilenet
      - vgg_preprocessing.py
      - mobilenet_model.py
      - mobilenet.py
      - inception_preprocessing.py
      - configs
        mobilenet_config.py
        cloud
        v2-128.yaml
        v3-1024.yaml
        v3-128.yaml
        v3-8.yaml
        v2-32.yaml
        v3-512.yaml
        v3-64.yaml
        v3-32.yaml
        v2-8.yaml
        v2-512.yaml
        v3-2048.yaml
        v3-256.yaml
        v2-256.yaml
        __init__.py
      - README.md
      - supervised_images.py
    - __init__.py
    - mnist
      - mnist_tpu.py
      - README.md
    - efficientnet
      - eval_ckpt_main.py
      - autoaugment.py
      - edgetpu
        efficientnet_edgetpu_builder.py
        __init__.py
        README.md
      - efficientnet_builder.py
      - efficientnet_model.py
      - g3doc
      - imagenet_input.py
      - preprocessing.py
      - main.py
      - README.md
      - utils.py
      - export_model.py
    - mnasnet
      - eval_ckpt_main.py
      - mnasnet_models.py
      - post_quantization.py
      - g3doc
      - imagenet_input.py
      - mixnet
        g3doc
        mixnet_builder.py
        custom_layers.py
        __init__.py
        README.md
        mixnet_model.py
      - preprocessing.py
      - mnasnet_main.py
      - configs
        mnasnet_config.py
        cloud
        v3-8.yaml
        v2-32.yaml
        v3-32.yaml
        v2-8.yaml
        gpu.yaml
        __init__.py
      - README.md
      - mnas_utils.py
      - mnasnet_model.py
  - common
    - tpu_profiler_hook.py
    - inference_warmup.py
    - __init__.py
    - imagenet.py
  - setup.py
  - hyperparameters
    - flags_to_params.py
    - common_hparams_flags.py
    - params_dict.py
    - common_tpu_flags.py
    - __init__.py
  - experimental
    - mnist_keras
      - mnist.py
    - keras_colab
      - shakespeare_lstm.py
      - README.md
    - keras_application
      - application_model.py
    - dcgan
      - dcgan_main.py
      - mnist_input.py
      - cifar_model.py
      - mnist_model.py
      - README.md
      - cifar_input.py
    - qanet
      - data.py
      - preprocess.py
      - run.py
      - run_lib.py
      - testdata
        train-v1.1.json
        vocab.vec
        train_0000
      - model.py
      - README.md
      - utils.py
    - distribution_strategy
      - imagenet_input.py
      - resnet_preprocessing.py
      - resnet_model.py
      - resnet_estimator.py
    - resnet50_keras
      - resnet50_tf2.py
      - model_saving_utils.py
      - resnet50.py
      - imagenet_input.py
      - resnet_preprocessing.py
      - resnet50_ctl_tf1.py
      - resnet50_ctl_tf2.py
      - resnet_model.py
      - README.md
      - resnet50_test.py
    - cifar_keras
      - README.md
      - cifar_keras.py
    - inception
      - inception_v3.py
      - inception_v2_tpu_model.py
      - vgg_preprocessing.py
      - inception_v4_model.py
      - inception_v3_old.py
      - inception_preprocessing.py
      - inception_v3_k8s.yaml
      - inception_v2.py
      - inception_v4.py
      - imagenet.py
    - densenet_keras
      - densenet_keras_model.py
      - vgg_preprocessing.py
      - densenet_keras_imagenet.py
      - README.md
    - inference
      - setup-pool.sh
      - load_test_client.py
      - api_config.yaml
      - openapi.yaml
      - api_descriptor.pb
    - ncf
      - ncf_main.py
      - README.md
    - deeplab
      - data_pipeline.py
      - model.py
      - main.py
      - README.md
    - show_and_tell
      - show_and_tell_tpu_test.py
      - README
      - show_and_tell_model.py
      - inputs.py
      - image_processing.py
      - train.py
      - configuration.py
      - image_embedding.py
    - mnist_jupyter
      - launch.sh
- benchmarks
  - ResNet-50_v1.5_Performance_Comparison_TensorFlow_1.12_GCP.md
- README.md
- scripts
  - train_on_fold.sh
  - prepare_folds.sh
  - add_extra_data.sh
  - export_fold.sh
  - prepare_tfrecords_v3_balanced.sh
  - prepare_tfrecords_v1.sh
  - train_on_dataset.sh
  - build_validation.py
  - filter_dataset.py
  - prepare_datasets.sh
  - extra
    - class-ids-human-body-parts-and-mammal.txt
  - upload_files_to_gcs.sh
  - prepare_tfrecords_v2_removed_crowd.sh
  - kfold_split.py
  - gen_tfrecords.py
  - split_classes.py
  - prepare_tfrecords_v4_pseudo_labels.sh
  - export_saved_model.sh
  - blacklist.txt
  - build_leaf_classes_list.py
  - prepare_tfrecords_v5_balanced_pseudo_labels.sh
  - inference
    - merge_all_subs.sh
    - trim_sub_by_threshold.py
    - add_parents.py
    - ready_models.txt
    - gen_sub.py
    - cloud_inference.py
    - docker_run.sh
    - partial_inference.py
    - docker_build.sh
    - all_models.yml
    - gen_all_subs.sh
    - drop_parents.py
    - soft_nms.pyx
    - merge_subs.py
    - join_subs.py
    - trim_sub_decimal_digits.py
    - inference.py
    - trim_sub_by_num_of_predicts.py
    - join_predicted_parts.py
    - requirements.txt
    - Dockerfile
  - export_models.py
  - export_all_folds.sh
  - .gitignore
  - gen_coco_val_json.py
  - debug.py
  - add_data_from_testset.py
- tools
  - diagnostics
    - diagnostics.py
  - datasets
    - download_and_preprocess_coco.sh
    - download_and_preprocess_coco_k8s.yaml
    - create_coco_tf_record.py
    - imagenet_to_gcs.py
    - tfrecords_to_bigtable.py
    - README.md
    - imagenet_to_gcs_k8s.yaml
    - jpeg_to_tf_record.py
  - ctpu
    - ctrl
      - resourcemgmt.go
      - gce_test.go
      - ctrl_test.go
      - gcloud_cli_test.go
      - tpu_test.go
      - servicemgmt.go
      - ctrl.go
      - gcloud_cli.go
      - tpu.go
      - resourcemgmt_test.go
      - gce.go
    - commands
      - status.go
      - common.go
      - status_test.go
      - tpu_locations.go
      - config_cmd.go
      - tpu_size_test.go
      - list_test.go
      - pause_test.go
      - delete.go
      - quota.go
      - common_test.go
      - up_test.go
      - pause.go
      - list.go
      - up.go
      - auth_test.go
      - delete_test.go
      - tpu_size.go
      - version.go
      - tf_versions.go
      - restart.go
      - auth.go
      - tpu_locations_test.go
      - restart_test.go
    - config
      - config_gce.go
      - config.go
      - devshell_test.go
      - testdata
        gcloud
        corrupted2
        application_default_credentials.json
        README.md
        active_config
        corrupted
        application_default_credentials.json
        README.md
        active_config
        configurations
        config_default
        clean
        application_default_credentials.json
        README.md
        active_config
        configurations
        config_ctpu9
        no_config
        README.md
        incomplete
        application_default_credentials.json
        README.md
        active_config
        configurations
        config_ctpu9
        no_app_creds
        README.md
        active_config
        configurations
        config_ctpu9
      - config_gcloud_test.go
      - config_gcloud.go
      - config_test.go
      - devshell.go
    - tutorial.md
    - README.md
    - main.go
    - .gitignore
  - docker
    - Dockerfile.util
    - Dockerfile
  - colab
    - BUILD
  - kubernetes
    - tensorboard_k8s.yaml
    - tpu_profiler_k8s.yaml
- .gitignore

# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Efficient ImageNet input pipeline using tf.data.Dataset."""

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import abc
from collections import namedtuple
import functools
import os
import tensorflow as tf

import preprocessing


# Per-channel RGB mean and standard deviation. The input tensor holds values
# in [0, 255], so each fractional statistic is scaled by 255 to match.
MEAN_RGB = [
    255 * 0.485,
    255 * 0.456,
    255 * 0.406,
]
STDDEV_RGB = [
    255 * 0.229,
    255 * 0.224,
    255 * 0.225,
]


def build_image_serving_input_fn(image_size):
  """Creates a serving input function that consumes raw image strings.

  Args:
    image_size: value forwarded as `image_size` to
        `preprocessing.preprocess_image` for every incoming image.

  Returns:
    A zero-argument callable that, when invoked, builds a string placeholder
    plus the preprocessing graph and returns a
    `tf.estimator.export.ServingInputReceiver`.
  """

  def _image_serving_input_fn():
    """Builds the placeholder, preprocessing ops and serving receiver."""
    # One string per image; the leading dimension is left unspecified.
    image_bytes_list = tf.placeholder(shape=[None], dtype=tf.string)

    def _preprocess_image(image_bytes):
      """Runs evaluation-mode preprocessing on a single raw image."""
      return preprocessing.preprocess_image(
          image_bytes=image_bytes, is_training=False, image_size=image_size)

    # Apply the per-image preprocessing across the batch; no gradients needed.
    images = tf.map_fn(
        _preprocess_image,
        image_bytes_list,
        back_prop=False,
        dtype=tf.float32)

    receiver_tensors = {'image_bytes': image_bytes_list}
    return tf.estimator.export.ServingInputReceiver(images, receiver_tensors)

  return _image_serving_input_fn


class ImageNetTFExampleInput(object):
  """Base class that turns serialized ImageNet TFExamples into an input_fn.

  Subclasses provide the raw records via `make_source_dataset`; this class
  parses, batches, optionally transposes and prefetches them in `input_fn`.

  Args:
    is_training: `bool` for whether the input is for training
    use_bfloat16: If True, use bfloat16 precision; else use float32.
    num_cores: `int` for the number of TPU cores; also used as the parallelism
        level for batching and for the transpose map.
    image_size: `int` for image size (both width and height).
    transpose_input: 'bool' for whether to use the double transpose trick
  """
  # Python 2 style metaclass declaration. NOTE: on Python 3 this attribute is
  # not interpreted as a metaclass, so abstract methods are not enforced there.
  __metaclass__ = abc.ABCMeta

  def __init__(self,
               is_training,
               use_bfloat16,
               num_cores=8,
               image_size=224,
               transpose_input=False):
    # Configuration flags.
    self.is_training = is_training
    self.use_bfloat16 = use_bfloat16
    self.transpose_input = transpose_input
    # Sizing parameters.
    self.num_cores = num_cores
    self.image_size = image_size
    # Per-image preprocessing used by `dataset_parser`.
    self.image_preprocessing_fn = preprocessing.preprocess_image

  def set_shapes(self, batch_size, images, labels):
    """Statically sets the batch dimension on a batch of images and labels.

    Args:
      batch_size: static batch size to record on the tensors.
      images: batched image tensor; the batch axis is last when
          `self.transpose_input` is set and first otherwise.
      labels: batched label tensor with the batch as its only axis.

    Returns:
      The same `(images, labels)` tensors, with their static shapes refined.
    """
    if self.transpose_input:
      image_batch_shape = tf.TensorShape([None, None, None, batch_size])
    else:
      image_batch_shape = tf.TensorShape([batch_size, None, None, None])
    label_batch_shape = tf.TensorShape([batch_size])

    images.set_shape(images.get_shape().merge_with(image_batch_shape))
    labels.set_shape(labels.get_shape().merge_with(label_batch_shape))
    return images, labels

  def dataset_parser(self, value):
    """Decodes one serialized TFExample into a preprocessed image and label.

    Args:
      value: serialized string containing an ImageNet TFExample.

    Returns:
      A tuple of (image, label) from the TFExample.
    """
    feature_spec = {
        'image/encoded': tf.FixedLenFeature((), tf.string, ''),
        'image/class/label': tf.FixedLenFeature([], tf.int64, -1),
    }
    example = tf.parse_single_example(value, feature_spec)

    encoded_image = tf.reshape(example['image/encoded'], shape=[])
    image = self.image_preprocessing_fn(
        image_bytes=encoded_image,
        is_training=self.is_training,
        image_size=self.image_size,
        use_bfloat16=self.use_bfloat16)

    # Stored labels are shifted down by one so that they fall in [0, 1000).
    raw_label = tf.reshape(example['image/class/label'], shape=[])
    label = tf.cast(raw_label, dtype=tf.int32) - 1

    return image, label

  @abc.abstractmethod
  def make_source_dataset(self, index, num_hosts):
    """Makes dataset of serialized TFExamples.

    The dataset yields `tf.string` tensors; each string is a serialized
    `TFExample` record that `dataset_parser` will parse.

    If self.is_training, the dataset should be infinite.

    Args:
      index: current host index.
      num_hosts: total number of hosts.

    Returns:
      A `tf.data.Dataset` object.
    """
    return None

  def input_fn(self, params):
    """Input function which provides a single batch for train or eval.

    Args:
      params: `dict` of parameters passed from the `TPUEstimator`.
          `params['batch_size']` is always provided and should be used as the
          effective batch size.

    Returns:
      A `tf.data.Dataset` object.
    """
    # Batch size for the current shard. The number of shards depends on the
    # input pipeline deployment; see tf.contrib.tpu.RunConfig for details.
    batch_size = params['batch_size']

    # Without a TPU context, behave as a single host.
    current_host, num_hosts = 0, 1
    if 'context' in params:
      tpu_context = params['context']
      current_host = tpu_context.current_input_fn_deployment()[1]
      num_hosts = tpu_context.num_hosts

    source = self.make_source_dataset(current_host, num_hosts)

    # Parse and batch with the fused map-and-batch operation.
    #
    # XLA requires fixed shapes. The training source repeats indefinitely, so
    # `drop_remainder=True` yields fixed-size batches without losing any
    # training examples.
    #
    # For evaluation, `drop_remainder=True` drops a final partial batch, which
    # prevents accidentally evaluating the same image twice. As long as the
    # validation batch size stays consistent, exactly the same images are used.
    parse_and_batch = tf.contrib.data.map_and_batch(
        self.dataset_parser,
        batch_size=batch_size,
        num_parallel_batches=self.num_cores,
        drop_remainder=True)
    batched = source.apply(parse_and_batch)

    # Transpose for performance on TPU: move the batch axis to the end.
    if self.transpose_input:

      def _batch_axis_last(images, labels):
        return tf.transpose(images, [1, 2, 3, 0]), labels

      batched = batched.map(_batch_axis_last, num_parallel_calls=self.num_cores)

    # Assign static batch size dimension.
    def _with_static_batch(images, labels):
      return self.set_shapes(batch_size, images, labels)

    batched = batched.map(_with_static_batch)

    # Prefetch overlaps in-feed with training.
    return batched.prefetch(tf.contrib.data.AUTOTUNE)


class ImageNetInput(ImageNetTFExampleInput):
  """Generates ImageNet input_fn from a series of TFRecord files.

  Training data is expected as TFRecords whose keys match those read by
  `dataset_parser`, sharded across 1024 sequentially named files:

      train-00000-of-01024
      train-00001-of-01024
      ...
      train-01023-of-01024

  Validation data uses the same format but is sharded into 128 files.

  The format of the data required is created by the script at:
      https://github.com/tensorflow/tpu/blob/master/tools/datasets/imagenet_to_gcs.py
  """

  def __init__(self,
               is_training,
               use_bfloat16,
               transpose_input,
               data_dir,
               image_size=224,
               num_parallel_calls=64,
               cache=False):
    """Create an input from TFRecord files.

    Args:
      is_training: `bool` for whether the input is for training
      use_bfloat16: If True, use bfloat16 precision; else use float32.
      transpose_input: 'bool' for whether to use the double transpose trick
      data_dir: `str` for the directory of the training and validation data;
          if 'null' (the literal string 'null') or implicitly False
          then construct a null pipeline, consisting of empty images
          and blank labels.
      image_size: `int` for image size (both width and height).
      num_parallel_calls: concurrency level to use when reading data from disk.
      cache: if true, fill the dataset by repeating from its cache
    """
    super(ImageNetInput, self).__init__(
        is_training=is_training,
        image_size=image_size,
        use_bfloat16=use_bfloat16,
        transpose_input=transpose_input)
    # Both the literal string 'null' and any falsy value select the null
    # pipeline, which is represented internally by `None`.
    has_real_data = bool(data_dir) and data_dir != 'null'
    self.data_dir = data_dir if has_real_data else None
    self.num_parallel_calls = num_parallel_calls
    self.cache = cache

  def _get_null_input(self, data):
    """Returns a null image (all black pixels).

    Args:
      data: dataset element; ignored, because the null image is the same for
          every element.

    Returns:
      a tensor representing a null image.
    """
    del data  # Unused since output is constant regardless of input
    dtype = tf.bfloat16 if self.use_bfloat16 else tf.float32
    return tf.zeros([self.image_size, self.image_size, 3], dtype)

  def dataset_parser(self, value):
    """See base class."""
    if self.data_dir:
      return super(ImageNetInput, self).dataset_parser(value)
    # Null pipeline: `value` is already an image, pair it with a blank label.
    return value, tf.constant(0, tf.int32)

  def make_source_dataset(self, index, num_hosts):
    """See base class."""
    if not self.data_dir:
      tf.logging.info('Undefined data_dir implies null input')
      null_source = tf.data.Dataset.range(1).repeat()
      return null_source.map(self._get_null_input)

    split_glob = 'train-*' if self.is_training else 'validation-*'
    file_pattern = os.path.join(self.data_dir, split_glob)

    # Filenames are listed without shuffling so that, for multi-host training,
    # each host always processes the same subset of files. Each host only sees
    # a subset of the entire dataset, allowing larger datasets to be cached in
    # memory.
    filenames = tf.data.Dataset.list_files(file_pattern, shuffle=False)
    filenames = filenames.shard(num_hosts, index)

    # When caching, repetition happens after the cache instead (see below).
    if self.is_training and not self.cache:
      filenames = filenames.repeat()

    def _read_tfrecords(filename):
      """Opens one TFRecord file with an 8 MiB read buffer."""
      return tf.data.TFRecordDataset(filename, buffer_size=8 * 1024 * 1024)

    # Read the data from disk in parallel
    interleave = tf.contrib.data.parallel_interleave(
        _read_tfrecords, cycle_length=self.num_parallel_calls, sloppy=True)
    records = filenames.apply(interleave)

    if not self.cache:
      return records.shuffle(1024)
    return records.cache().apply(
        tf.contrib.data.shuffle_and_repeat(1024 * 16))


# Describes which slice of a Cloud Bigtable to read: where the table lives
# (project, instance, table), the prefix to scan, and the column to fetch
# (column_family, column_qualifier).
_BIGTABLE_SELECTION_FIELDS = (
    'project',
    'instance',
    'table',
    'prefix',
    'column_family',
    'column_qualifier',
)
BigtableSelection = namedtuple('BigtableSelection', _BIGTABLE_SELECTION_FIELDS)


class ImageNetBigtableInput(ImageNetTFExampleInput):
  """Generates ImageNet input_fn from a Bigtable for training or evaluation.
  """

  def __init__(self, is_training, use_bfloat16, transpose_input, selection,
               image_size=224):
    """Constructs an ImageNet input from a BigtableSelection.

    Args:
      is_training: `bool` for whether the input is for training
      use_bfloat16: If True, use bfloat16 precision; else use float32.
      transpose_input: 'bool' for whether to use the double transpose trick
      selection: a BigtableSelection specifying a part of a Bigtable.
      image_size: `int` for image size (both width and height). Defaults to
          224, the value that was previously always used for Bigtable input.
    """
    super(ImageNetBigtableInput, self).__init__(
        is_training=is_training,
        use_bfloat16=use_bfloat16,
        image_size=image_size,
        transpose_input=transpose_input)
    self.selection = selection

  def make_source_dataset(self, index, num_hosts):
    """See base class.

    Args:
      index: current host index; not used by this implementation.
      num_hosts: total number of hosts; not used by this implementation.

    Returns:
      A `tf.data.Dataset` of the selected column's values, repeated
      indefinitely when `self.is_training` is set.
    """
    # The scan is not partitioned by host: every host reads the same prefix.
    del index, num_hosts  # Unused.

    selection = self.selection
    client = tf.contrib.cloud.BigtableClient(selection.project,
                                             selection.instance)
    table = client.table(selection.table)
    scanned = table.parallel_scan_prefix(
        selection.prefix,
        columns=[(selection.column_family, selection.column_qualifier)])

    # The Bigtable datasets will have the shape (row_key, data); keep only the
    # data, which holds the serialized example.
    serialized = scanned.map(lambda row_key, contents: contents)

    if self.is_training:
      serialized = serialized.repeat()

    return serialized