python source code of model

ros_people_object_detection_tensorflow-master
- .github
  - stale.yml
- src
  - cob_people_object_detection_tensorflow.py
  - sort
  - face_recognizer.py
  - cob_people_object_detection_tensorflow
    - detector.py
    - __init__.py
    - utils.py
  - tracker.py
  - object_detection
    - BUILD
    - matchers
      - BUILD
      - bipartite_matcher_test.py
      - argmax_matcher.py
      - __init__.py
      - argmax_matcher_test.py
      - bipartite_matcher.py
    - object_detection_tutorial.ipynb
    - create_pascal_tf_record_test.py
    - evaluator.py
    - samples
      - cloud
        cloud.yml
      - configs
        faster_rcnn_resnet101_voc07.config
        faster_rcnn_inception_resnet_v2_atrous_oid.config
        faster_rcnn_resnet101_pets.config
        faster_rcnn_nas_coco.config
        ssd_mobilenet_v2_coco.config
        faster_rcnn_resnet101_kitti.config
        ssd_mobilenet_v1_coco.config
        ssd_mobilenet_v1_focal_loss_pets.config
        faster_rcnn_resnet50_pets.config
        ssd_inception_v2_pets.config
        faster_rcnn_resnet152_coco.config
        mask_rcnn_resnet101_atrous_coco.config
        mask_rcnn_resnet101_pets.config
        ssd_inception_v2_coco.config
        mask_rcnn_inception_resnet_v2_atrous_coco.config
        faster_rcnn_inception_resnet_v2_atrous_cosine_lr_coco.config
        ssd_mobilenet_v1_focal_loss_coco.config
        faster_rcnn_resnet101_atrous_coco.config
        faster_rcnn_inception_v2_coco.config
        mask_rcnn_inception_v2_coco.config
        rfcn_resnet101_pets.config
        ssd_inception_v3_pets.config
        faster_rcnn_inception_v2_pets.config
        faster_rcnn_resnet152_pets.config
        faster_rcnn_inception_resnet_v2_atrous_coco.config
        embedded_ssd_mobilenet_v1_coco.config
        ssd_mobilenet_v1_pets.config
        faster_rcnn_inception_resnet_v2_atrous_pets.config
        faster_rcnn_resnet101_coco.config
        mask_rcnn_resnet50_atrous_coco.config
        faster_rcnn_resnet50_coco.config
        rfcn_resnet101_coco.config
    - utils
      - json_utils_test.py
      - BUILD
      - np_mask_ops.py
      - np_box_mask_list_ops.py
      - label_map_util_test.py
      - test_utils.py
      - np_mask_ops_test.py
      - np_box_list_test.py
      - ops.py
      - metrics_test.py
      - config_util_test.py
      - np_box_mask_list_test.py
      - config_util.py
      - metrics.py
      - category_util.py
      - visualization_utils.py
      - shape_utils.py
      - label_map_util.py
      - dataset_util.py
      - variables_helper.py
      - test_utils_test.py
      - np_box_list_ops.py
      - category_util_test.py
      - learning_schedules.py
      - np_box_mask_list.py
      - static_shape.py
      - np_box_ops.py
      - dataset_util_test.py
      - variables_helper_test.py
      - test_case.py
      - visualization_utils_test.py
      - learning_schedules_test.py
      - __init__.py
      - static_shape_test.py
      - shape_utils_test.py
      - ops_test.py
      - per_image_evaluation.py
      - np_box_list_ops_test.py
      - np_box_ops_test.py
      - np_box_list.py
      - np_box_mask_list_ops_test.py
      - object_detection_evaluation_test.py
      - json_utils.py
      - per_image_evaluation_test.py
      - object_detection_evaluation.py
    - test_images
      - image_info.txt
    - eval.py
    - g3doc
      - running_on_cloud.md
      - instance_segmentation.md
      - running_pets.md
      - configuring_jobs.md
      - faq.md
      - img
      - defining_your_own_model.md
      - running_locally.md
      - running_notebook.md
      - installation.md
      - using_your_own_dataset.md
      - detection_model_zoo.md
      - preparing_inputs.md
      - oid_inference_and_evaluation.md
      - evaluation_protocols.md
      - exporting_models.md
    - model_tpu.py
    - test_ckpt
    - builders
      - anchor_generator_builder.py
      - BUILD
      - optimizer_builder_test.py
      - image_resizer_builder_test.py
      - anchor_generator_builder_test.py
      - post_processing_builder_test.py
      - region_similarity_calculator_builder_test.py
      - preprocessor_builder_test.py
      - box_coder_builder.py
      - optimizer_builder.py
      - losses_builder_test.py
      - hyperparams_builder.py
      - matcher_builder.py
      - image_resizer_builder.py
      - post_processing_builder.py
      - box_predictor_builder.py
      - box_predictor_builder_test.py
      - input_reader_builder_test.py
      - hyperparams_builder_test.py
      - model_builder_test.py
      - losses_builder.py
      - __init__.py
      - input_reader_builder.py
      - dataset_builder.py
      - dataset_builder_test.py
      - preprocessor_builder.py
      - matcher_builder_test.py
      - box_coder_builder_test.py
      - region_similarity_calculator_builder.py
      - model_builder.py
    - model_test.py
    - inputs_test.py
    - create_pet_tf_record.py
    - protos
      - bipartite_matcher.proto
      - matcher_pb2.py
      - mean_stddev_box_coder_pb2.py
      - BUILD
      - faster_rcnn_box_coder.proto
      - train.proto
      - ssd_pb2.py
      - model.proto
      - faster_rcnn.proto
      - eval.proto
      - string_int_label_map.proto
      - keypoint_box_coder.proto
      - preprocessor.proto
      - region_similarity_calculator_pb2.py
      - hyperparams.proto
      - train_pb2.py
      - box_predictor_pb2.py
      - region_similarity_calculator.proto
      - image_resizer.proto
      - hyperparams_pb2.py
      - input_reader_pb2.py
      - ssd_anchor_generator.proto
      - keypoint_box_coder_pb2.py
      - multiscale_anchor_generator_pb2.py
      - model_pb2.py
      - argmax_matcher_pb2.py
      - input_reader.proto
      - faster_rcnn_box_coder_pb2.py
      - grid_anchor_generator_pb2.py
      - post_processing_pb2.py
      - pipeline.proto
      - string_int_label_map_pb2.py
      - square_box_coder.proto
      - optimizer_pb2.py
      - eval_pb2.py
      - optimizer.proto
      - image_resizer_pb2.py
      - argmax_matcher.proto
      - losses.proto
      - box_predictor.proto
      - __init__.py
      - pipeline_pb2.py
      - square_box_coder_pb2.py
      - matcher.proto
      - losses_pb2.py
      - post_processing.proto
      - ssd_anchor_generator_pb2.py
      - ssd.proto
      - anchor_generator_pb2.py
      - multiscale_anchor_generator.proto
      - box_coder.proto
      - grid_anchor_generator.proto
      - preprocessor_pb2.py
      - faster_rcnn_pb2.py
      - box_coder_pb2.py
      - anchor_generator.proto
      - bipartite_matcher_pb2.py
      - mean_stddev_box_coder.proto
    - models
      - faster_rcnn_inception_v2_feature_extractor.py
      - faster_rcnn_inception_resnet_v2_feature_extractor_test.py
      - feature_map_generators.py
      - BUILD
      - ssd_inception_v3_feature_extractor.py
      - faster_rcnn_mobilenet_v1_feature_extractor_test.py
      - ssd_resnet_v1_fpn_feature_extractor_test.py
      - ssd_inception_v3_feature_extractor_test.py
      - ssd_feature_extractor_test.py
      - ssd_mobilenet_v2_feature_extractor.py
      - faster_rcnn_resnet_v1_feature_extractor_test.py
      - ssd_inception_v2_feature_extractor_test.py
      - ssd_inception_v2_feature_extractor.py
      - embedded_ssd_mobilenet_v1_feature_extractor_test.py
      - faster_rcnn_resnet_v1_feature_extractor.py
      - feature_map_generators_test.py
      - faster_rcnn_inception_v2_feature_extractor_test.py
      - ssd_mobilenet_v2_feature_extractor_test.py
      - ssd_resnet_v1_fpn_feature_extractor.py
      - ssd_mobilenet_v1_feature_extractor_test.py
      - __init__.py
      - faster_rcnn_mobilenet_v1_feature_extractor.py
      - faster_rcnn_nas_feature_extractor.py
      - embedded_ssd_mobilenet_v1_feature_extractor.py
      - ssd_mobilenet_v1_feature_extractor.py
      - faster_rcnn_inception_resnet_v2_feature_extractor.py
      - faster_rcnn_nas_feature_extractor_test.py
      - ssd_resnet_v1_fpn_feature_extractor_testbase.py
    - inputs.py
    - CONTRIBUTING.md
    - dataset_tools
      - create_pascal_tf_record_test.py
      - create_coco_tf_record_test.py
      - create_kitti_tf_record.py
      - download_and_preprocess_mscoco.sh
      - create_coco_tf_record.py
      - oid_tfrecord_creation_test.py
      - create_pet_tf_record.py
      - create_oid_tf_record.py
      - create_kitti_tf_record_test.py
      - __init__.py
      - create_pascal_tf_record.py
      - oid_tfrecord_creation.py
    - anchor_generators
      - BUILD
      - multiple_grid_anchor_generator.py
      - multiscale_grid_anchor_generator_test.py
      - multiple_grid_anchor_generator_test.py
      - __init__.py
      - grid_anchor_generator_test.py
      - multiscale_grid_anchor_generator.py
      - grid_anchor_generator.py
    - exporter.py
    - test_data
    - export_inference_graph.py
    - .ipynb_checkpoints
    - model.py
    - data
      - pascal_label_map.pbtxt
      - kitti_label_map.pbtxt
      - oid_bbox_trainable_label_map.pbtxt
      - pet_label_map.pbtxt
      - mscoco_label_map.pbtxt
    - eval_util_test.py
    - model_test_util.py
    - meta_architectures
      - BUILD
      - faster_rcnn_meta_arch.py
      - faster_rcnn_meta_arch_test_lib.py
      - ssd_meta_arch.py
      - rfcn_meta_arch.py
      - faster_rcnn_meta_arch_test.py
      - __init__.py
      - rfcn_meta_arch_test.py
      - ssd_meta_arch_test.py
    - train.py
    - __init__.py
    - eval_util.py
    - README.md
    - core
      - BUILD
      - box_predictor_test.py
      - balanced_positive_negative_sampler.py
      - preprocessor_cache.py
      - prefetcher.py
      - region_similarity_calculator.py
      - batcher.py
      - box_list_test.py
      - post_processing_test.py
      - matcher_test.py
      - minibatch_sampler_test.py
      - target_assigner.py
      - preprocessor.py
      - minibatch_sampler.py
      - data_decoder.py
      - keypoint_ops.py
      - keypoint_ops_test.py
      - losses.py
      - box_predictor.py
      - post_processing.py
      - box_list_ops.py
      - box_list.py
      - balanced_positive_negative_sampler_test.py
      - box_list_ops_test.py
      - model.py
      - matcher.py
      - standard_fields.py
      - region_similarity_calculator_test.py
      - box_coder.py
      - __init__.py
      - box_coder_test.py
      - preprocessor_test.py
      - target_assigner_test.py
      - batcher_test.py
      - data_parser.py
      - anchor_generator.py
      - prefetcher_test.py
      - losses_test.py
    - inference
      - infer_detections.py
      - detection_inference.py
      - __init__.py
      - detection_inference_test.py
    - trainer_test.py
    - trainer.py
    - metrics
      - offline_eval_map_corloc_test.py
      - offline_eval_map_corloc.py
      - __init__.py
      - tf_example_parser.py
      - coco_tools_test.py
      - tf_example_parser_test.py
      - coco_evaluation_test.py
      - coco_tools.py
      - coco_evaluation.py
    - create_pascal_tf_record.py
    - box_coders
      - BUILD
      - keypoint_box_coder.py
      - square_box_coder_test.py
      - faster_rcnn_box_coder_test.py
      - mean_stddev_box_coder.py
      - mean_stddev_box_coder_test.py
      - keypoint_box_coder_test.py
      - faster_rcnn_box_coder.py
      - __init__.py
      - square_box_coder.py
    - data_decoders
      - BUILD
      - tf_example_decoder_test.py
      - __init__.py
      - tf_example_decoder.py
    - ssd_mobilenet_v1_coco_2017_11_17
    - model_hparams.py
    - exporter_test.py
  - action_recognition.py
  - projection.py
- images
- .gitmodules
- LICENSE
- package.xml
- docker
  - cob_people_object_detection
    - Dockerfile
  - astra_docker
    - Dockerfile
  - docker-compose.yml
- people
- CMakeLists.txt
- action_recognition
  - labels.txt
- README.md
- .gitignore
- launch
  - cob_face_recognizer_params.yaml
  - action_recognition_params.yaml
  - alltogether.launch
  - projection.launch
  - cob_people_object_detection_tensorflow_params.yaml
  - projection_params.yaml
  - action_recognition.launch
  - cob_face_recognizer.launch
  - cob_people_object_tracker.launch
  - cob_people_object_detection_tensorflow.launch
  - cob_people_object_tracker_params.yaml

# Copyright 2017 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
r"""Creates and runs `Experiment` for object detection model.

This uses the TF.learn framework to define and run an object detection model
wrapped in an `Estimator`.
Note that this module is only compatible with SSD Meta architecture at the
moment.
"""

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import functools
import os

import tensorflow as tf

from google.protobuf import text_format
from tensorflow.contrib.learn.python.learn import learn_runner
from tensorflow.contrib.tpu.python.tpu import tpu_optimizer
from tensorflow.python.lib.io import file_io
from object_detection import eval_util
from object_detection import inputs
from object_detection import model_hparams
from object_detection.builders import model_builder
from object_detection.builders import optimizer_builder
from object_detection.core import standard_fields as fields
from object_detection.utils import config_util
from object_detection.utils import label_map_util
from object_detection.utils import shape_utils
from object_detection.utils import variables_helper
from object_detection.utils import visualization_utils as vis_utils

# Command-line flags. `model_dir` and `pipeline_config_path` default to None
# and are marked as required inside main().
tf.flags.DEFINE_string('model_dir', None, 'Path to output model directory '
                       'where event and checkpoint files will be written.')
tf.flags.DEFINE_string('pipeline_config_path', None, 'Path to pipeline config '
                       'file.')
tf.flags.DEFINE_integer('num_train_steps', 500000, 'Number of train steps.')
# The help text previously read "Number of train steps." (copy-paste slip).
tf.flags.DEFINE_integer('num_eval_steps', 10000, 'Number of eval steps.')
FLAGS = tf.flags.FLAGS


# Name -> callable registry of the helpers used to build the model.
# populate_experiment() resolves its config and input-function helpers through
# this map instead of calling them directly.
MODEL_BUILD_UTIL_MAP = dict(
    get_configs_from_pipeline_file=(
        config_util.get_configs_from_pipeline_file),
    create_pipeline_proto_from_configs=(
        config_util.create_pipeline_proto_from_configs),
    merge_external_params_with_configs=(
        config_util.merge_external_params_with_configs),
    create_train_input_fn=inputs.create_train_input_fn,
    create_eval_input_fn=inputs.create_eval_input_fn,
    create_predict_input_fn=inputs.create_predict_input_fn,
)


def _get_groundtruth_data(detection_model, class_agnostic):
  """Collects the first image's groundtruth tensors from `detection_model`.

  Only element 0 of each groundtruth list held by the model is read.

  Args:
    detection_model: A `DetectionModel` object that has already been given
      groundtruth.
    class_agnostic: Whether the detections are class_agnostic. When True the
      model's class groundtruth is ignored and every box gets class 1.

  Returns:
    A dictionary keyed by `fields.InputDataFields` names:
      'groundtruth_boxes': [num_boxes, 4] float32 tensor of boxes, in
        normalized coordinates.
      'groundtruth_classes': [num_boxes] int64 tensor of 1-indexed classes.
      'groundtruth_instance_masks': 3D float32 tensor of instance masks (only
        present if the model has mask groundtruth).
  """
  input_data_fields = fields.InputDataFields()
  box_fields = fields.BoxListFields

  groundtruth_boxes = detection_model.groundtruth_lists(box_fields.boxes)[0]

  if not class_agnostic:
    classes_one_hot = detection_model.groundtruth_lists(
        box_fields.classes)[0]
  else:
    # With a single (agnostic) class the one-hot encoding degenerates to a
    # [num_boxes, 1] column of ones.
    num_boxes = tf.shape(groundtruth_boxes)[0]
    classes_one_hot = tf.ones([num_boxes, 1])

  # argmax yields 0-based ids; shift to 1-based label ids (b/63711816).
  label_id_offset = 1
  groundtruth_classes = tf.argmax(classes_one_hot, axis=1) + label_id_offset

  groundtruth = {}
  groundtruth[input_data_fields.groundtruth_boxes] = groundtruth_boxes
  groundtruth[input_data_fields.groundtruth_classes] = groundtruth_classes

  if detection_model.groundtruth_has_field(box_fields.masks):
    instance_masks = detection_model.groundtruth_lists(box_fields.masks)[0]
    groundtruth[input_data_fields.groundtruth_instance_masks] = instance_masks
  return groundtruth


def unstack_batch(tensor_dict, unpad_groundtruth_tensors=True):
  """Splits every batched tensor in `tensor_dict` into a per-example list.

  Each tensor is unstacked along dimension 0, so every value of the returned
  dictionary is a list with one tensor per batch element.

  Tensors in the `tensor_dict` are expected to be of one of the three shapes:
  1. [batch_size]
  2. [batch_size, height, width, channels]
  3. [batch_size, num_boxes, d1, d2, ... dn]

  With `unpad_groundtruth_tensors` enabled, the unstacked tensors of form 3
  are additionally cropped along their `num_boxes` dimension to the count
  stored under fields.InputDataFields.num_groundtruth_boxes.

  Note that the set of padded fields is hard-coded below and has to be kept in
  sync with the InputDataFields defined in core/standard_fields.py.

  Args:
    tensor_dict: A dictionary of batched groundtruth tensors.
    unpad_groundtruth_tensors: Whether to remove padding along `num_boxes`
      dimension of the groundtruth tensors.

  Returns:
    A dictionary where the keys are from fields.InputDataFields and values are
    a list of unstacked (optionally unpadded) tensors.

  Raises:
    ValueError: If `unpad_groundtruth_tensors` is True and `tensor_dict` does
      not contain the `num_groundtruth_boxes` tensor.
  """
  unbatched_tensor_dict = {}
  for name, batched_tensor in tensor_dict.items():
    unbatched_tensor_dict[name] = tf.unstack(batched_tensor)

  if not unpad_groundtruth_tensors:
    return unbatched_tensor_dict

  num_boxes_key = fields.InputDataFields.num_groundtruth_boxes
  if num_boxes_key not in unbatched_tensor_dict:
    raise ValueError('`num_groundtruth_boxes` not found in tensor_dict. '
                     'Keys available: {}'.format(
                         unbatched_tensor_dict.keys()))

  # Input data fields that are padded along the num_boxes dimension. Keep in
  # sync with InputDataFields in standard_fields.py.
  padded_fields = set([
      fields.InputDataFields.groundtruth_instance_masks,
      fields.InputDataFields.groundtruth_classes,
      fields.InputDataFields.groundtruth_boxes,
      fields.InputDataFields.groundtruth_keypoints,
      fields.InputDataFields.groundtruth_group_of,
      fields.InputDataFields.groundtruth_difficult,
      fields.InputDataFields.groundtruth_is_crowd,
      fields.InputDataFields.groundtruth_area,
      fields.InputDataFields.groundtruth_weights
  ])
  # Only fields actually present in the input need unpadding.
  keys_to_unpad = padded_fields.intersection(
      set(unbatched_tensor_dict.keys()))

  unpadded_by_key = {}
  for key in keys_to_unpad:
    per_example = []
    examples = zip(unbatched_tensor_dict[num_boxes_key],
                   unbatched_tensor_dict[key])
    for num_gt, padded_tensor in examples:
      tensor_shape = shape_utils.combined_static_and_dynamic_shape(
          padded_tensor)
      # Start at the origin; keep `num_gt` rows and the full extent of every
      # remaining dimension.
      slice_begin = tf.zeros([len(tensor_shape)], dtype=tf.int32)
      trailing_dims = [-1 if dim is None else dim for dim in tensor_shape[1:]]
      slice_size = tf.stack([num_gt] + trailing_dims)
      per_example.append(tf.slice(padded_tensor, slice_begin, slice_size))
    unpadded_by_key[key] = per_example

  unbatched_tensor_dict.update(unpadded_by_key)
  return unbatched_tensor_dict


def create_model_fn(detection_model_fn, configs, hparams, use_tpu=False):
  """Creates a model function for `Estimator`.

  Args:
    detection_model_fn: Function that returns a `DetectionModel` instance.
      It is called with `is_training` and `add_summaries` keyword arguments.
    configs: Dictionary of pipeline config objects. The 'train_config',
      'eval_input_config' and 'eval_config' entries are read.
    hparams: `HParams` object. Only `hparams.load_pretrained` is read here.
    use_tpu: Boolean indicating whether model should be constructed for
        use on TPU. When True, summaries are suppressed and a
        `TPUEstimatorSpec` is returned from the model function.

  Returns:
    `model_fn` for `Estimator`.
  """
  train_config = configs['train_config']
  eval_input_config = configs['eval_input_config']
  eval_config = configs['eval_config']

  def model_fn(features, labels, mode, params=None):
    """Constructs the object detection model.

    Args:
      features: Dictionary of feature tensors, returned from `input_fn`.
      labels: Dictionary of groundtruth tensors if mode is TRAIN or EVAL,
        otherwise None.
      mode: Mode key from tf.estimator.ModeKeys.
      params: Parameter dictionary passed from the estimator.

    Returns:
      An `EstimatorSpec` that encapsulates the model and its serving
        configurations.
    """
    params = params or {}
    total_loss, train_op, detections, export_outputs = None, None, None, None
    is_training = mode == tf.estimator.ModeKeys.TRAIN
    detection_model = detection_model_fn(is_training=is_training,
                                         add_summaries=(not use_tpu))
    scaffold_fn = None

    # Convert the batched label tensors into per-image lists. Padding is only
    # (optionally) stripped for training; eval keeps the padded tensors.
    if mode == tf.estimator.ModeKeys.TRAIN:
      labels = unstack_batch(
          labels,
          unpad_groundtruth_tensors=train_config.unpad_groundtruth_tensors)
    elif mode == tf.estimator.ModeKeys.EVAL:
      labels = unstack_batch(labels, unpad_groundtruth_tensors=False)

    if mode in (tf.estimator.ModeKeys.TRAIN, tf.estimator.ModeKeys.EVAL):
      gt_boxes_list = labels[fields.InputDataFields.groundtruth_boxes]
      gt_classes_list = labels[fields.InputDataFields.groundtruth_classes]
      # Masks and keypoints are optional groundtruth fields.
      gt_masks_list = None
      if fields.InputDataFields.groundtruth_instance_masks in labels:
        gt_masks_list = labels[
            fields.InputDataFields.groundtruth_instance_masks]
      gt_keypoints_list = None
      if fields.InputDataFields.groundtruth_keypoints in labels:
        gt_keypoints_list = labels[fields.InputDataFields.groundtruth_keypoints]
      detection_model.provide_groundtruth(
          groundtruth_boxes_list=gt_boxes_list,
          groundtruth_classes_list=gt_classes_list,
          groundtruth_masks_list=gt_masks_list,
          groundtruth_keypoints_list=gt_keypoints_list)

    # Forward pass and postprocessing are built for every mode.
    preprocessed_images = features[fields.InputDataFields.image]
    prediction_dict = detection_model.predict(
        preprocessed_images, features[fields.InputDataFields.true_image_shape])
    detections = detection_model.postprocess(
        prediction_dict, features[fields.InputDataFields.true_image_shape])

    if mode == tf.estimator.ModeKeys.TRAIN:
      if not train_config.fine_tune_checkpoint_type:
        # train_config.from_detection_checkpoint field is deprecated. For
        # backward compatibility, sets finetune_checkpoint_type based on
        # from_detection_checkpoint.
        if train_config.from_detection_checkpoint:
          train_config.fine_tune_checkpoint_type = 'detection'
        else:
          train_config.fine_tune_checkpoint_type = 'classification'
      if train_config.fine_tune_checkpoint and hparams.load_pretrained:
        # fine_tune_checkpoint_type is guaranteed to be set by the fallback
        # above, so it does not need to be re-derived here.
        asg_map = detection_model.restore_map(
            fine_tune_checkpoint_type=train_config.fine_tune_checkpoint_type,
            load_all_detection_checkpoint_vars=(
                train_config.load_all_detection_checkpoint_vars))
        available_var_map = (
            variables_helper.get_variables_available_in_checkpoint(
                asg_map, train_config.fine_tune_checkpoint,
                include_global_step=False))
        if use_tpu:
          # On TPU the checkpoint initialization is deferred into the
          # scaffold function handed to TPUEstimatorSpec.
          def tpu_scaffold():
            tf.train.init_from_checkpoint(train_config.fine_tune_checkpoint,
                                          available_var_map)
            return tf.train.Scaffold()
          scaffold_fn = tpu_scaffold
        else:
          tf.train.init_from_checkpoint(train_config.fine_tune_checkpoint,
                                        available_var_map)

    if mode in (tf.estimator.ModeKeys.TRAIN, tf.estimator.ModeKeys.EVAL):
      losses_dict = detection_model.loss(
          prediction_dict, features[fields.InputDataFields.true_image_shape])
      # `dict.itervalues()` only exists on Python 2; `values()` works on both
      # Python 2 and 3. A real list is needed because it may be appended to.
      losses = list(losses_dict.values())
      if train_config.add_regularization_loss:
        regularization_losses = tf.get_collection(
            tf.GraphKeys.REGULARIZATION_LOSSES)
        if regularization_losses:
          regularization_loss = tf.add_n(regularization_losses,
                                         name='regularization_loss')
          losses.append(regularization_loss)
          if not use_tpu:
            tf.summary.scalar('regularization_loss', regularization_loss)
      total_loss = tf.add_n(losses, name='total_loss')

    if mode == tf.estimator.ModeKeys.TRAIN:
      global_step = tf.train.get_or_create_global_step()
      training_optimizer, optimizer_summary_vars = optimizer_builder.build(
          train_config.optimizer)

      if use_tpu:
        training_optimizer = tpu_optimizer.CrossShardOptimizer(
            training_optimizer)

      # Optionally freeze some layers by excluding their variables from the
      # set handed to the optimizer.
      trainable_variables = None
      if train_config.freeze_variables:
        trainable_variables = tf.contrib.framework.filter_variables(
            tf.trainable_variables(),
            exclude_patterns=train_config.freeze_variables)

      clip_gradients_value = None
      if train_config.gradient_clipping_by_norm > 0:
        clip_gradients_value = train_config.gradient_clipping_by_norm

      if not use_tpu:
        for var in optimizer_summary_vars:
          tf.summary.scalar(var.op.name, var)
      # An empty list disables optimize_loss summaries on TPU; None keeps the
      # optimize_loss defaults.
      summaries = [] if use_tpu else None
      train_op = tf.contrib.layers.optimize_loss(
          loss=total_loss,
          global_step=global_step,
          learning_rate=None,
          clip_gradients=clip_gradients_value,
          optimizer=training_optimizer,
          variables=trainable_variables,
          summaries=summaries,
          name='')  # Preventing scope prefix on all variables.

    if mode == tf.estimator.ModeKeys.PREDICT:
      export_outputs = {
          tf.saved_model.signature_constants.PREDICT_METHOD_NAME:
              tf.estimator.export.PredictOutput(detections)
      }

    eval_metric_ops = None
    if mode == tf.estimator.ModeKeys.EVAL:
      # Detection summaries during eval.
      # Detections without a classes field are treated as class agnostic.
      class_agnostic = (fields.DetectionResultFields.detection_classes
                        not in detections)
      groundtruth = _get_groundtruth_data(detection_model, class_agnostic)
      use_original_images = fields.InputDataFields.original_image in features
      eval_images = (
          features[fields.InputDataFields.original_image] if use_original_images
          else features[fields.InputDataFields.image])
      # Only the first image of the batch (and its hash key) is evaluated.
      eval_dict = eval_util.result_dict_for_single_example(
          eval_images[0:1],
          features[inputs.HASH_KEY][0],
          detections,
          groundtruth,
          class_agnostic=class_agnostic,
          scale_to_absolute=False)

      if class_agnostic:
        category_index = label_map_util.create_class_agnostic_category_index()
      else:
        category_index = label_map_util.create_category_index_from_labelmap(
            eval_input_config.label_map_path)
      if not use_tpu and use_original_images:
        detection_and_groundtruth = (
            vis_utils.draw_side_by_side_evaluation_image(
                eval_dict, category_index, max_boxes_to_draw=20,
                min_score_thresh=0.2))
        tf.summary.image('Detections_Left_Groundtruth_Right',
                         detection_and_groundtruth)

      # Eval metrics on a single image.
      eval_metrics = eval_config.metrics_set
      if not eval_metrics:
        eval_metrics = ['coco_detection_metrics']
      # Materialize the categories as a list so the evaluators receive a real
      # sequence (not a dict view) on Python 3.
      eval_metric_ops = eval_util.get_eval_metric_ops_for_evaluators(
          eval_metrics, list(category_index.values()), eval_dict,
          include_metrics_per_category=False)

    if use_tpu:
      # NOTE(review): `TPUEstimatorSpec.eval_metrics` appears to expect a
      # `(metric_fn, tensors)` tuple rather than a dict of metric ops --
      # confirm that EVAL mode is actually supported on TPU.
      return tf.contrib.tpu.TPUEstimatorSpec(
          mode=mode,
          scaffold_fn=scaffold_fn,
          predictions=detections,
          loss=total_loss,
          train_op=train_op,
          eval_metrics=eval_metric_ops,
          export_outputs=export_outputs)
    else:
      return tf.estimator.EstimatorSpec(
          mode=mode,
          predictions=detections,
          loss=total_loss,
          train_op=train_op,
          eval_metric_ops=eval_metric_ops,
          export_outputs=export_outputs)

  return model_fn


def build_experiment_fn(train_steps, eval_steps):
  """Returns a function that creates an `Experiment`.

  Args:
    train_steps: Number of training steps forwarded to `populate_experiment`.
    eval_steps: Number of evaluation steps forwarded to
      `populate_experiment`.

  Returns:
    A callable taking `(run_config, hparams)` and returning an `Experiment`.
  """

  def build_experiment(run_config, hparams):
    """Creates the `Experiment` for the given run config and hyperparameters.

    The pipeline config path is read from `FLAGS.pipeline_config_path` when
    this function is called.

    Args:
      run_config: A `RunConfig`.
      hparams: A `HParams`.

    Returns:
      An `Experiment` object.
    """
    return populate_experiment(
        run_config,
        hparams,
        pipeline_config_path=FLAGS.pipeline_config_path,
        train_steps=train_steps,
        eval_steps=eval_steps)

  return build_experiment


def populate_experiment(run_config,
                        hparams,
                        pipeline_config_path,
                        train_steps=None,
                        eval_steps=None,
                        model_fn_creator=create_model_fn,
                        **kwargs):
  """Builds the `Experiment` for an object detection pipeline.

  Loads the pipeline config, merges in the external overrides, creates the
  input functions, export strategy and `Estimator`, and (on the chief worker)
  writes the final merged config to `<model_dir>/pipeline.config`.

  Args:
    run_config: A `RunConfig`.
    hparams: A `HParams`.
    pipeline_config_path: A path to a pipeline config file.
    train_steps: Number of training steps. If None, the number of training steps
      is set from the `TrainConfig` proto.
    eval_steps: Number of evaluation steps per evaluation cycle. If None, the
      number of evaluation steps is set from the `EvalConfig` proto.
    model_fn_creator: A function that creates a `model_fn` for `Estimator`.
      Follows the signature:

      * Args:
        * `detection_model_fn`: Function that returns `DetectionModel` instance.
        * `configs`: Dictionary of pipeline config objects.
        * `hparams`: `HParams` object.
      * Returns:
        `model_fn` for `Estimator`.

    **kwargs: Additional keyword arguments for configuration override.

  Returns:
    An `Experiment` that defines all aspects of training, evaluation, and
    export.
  """
  # Resolve every helper up front through the module-level registry.
  (load_configs,
   configs_to_pipeline_proto,
   merge_overrides,
   make_train_input_fn,
   make_eval_input_fn,
   make_predict_input_fn) = [
       MODEL_BUILD_UTIL_MAP[helper_name] for helper_name in (
           'get_configs_from_pipeline_file',
           'create_pipeline_proto_from_configs',
           'merge_external_params_with_configs',
           'create_train_input_fn',
           'create_eval_input_fn',
           'create_predict_input_fn')
   ]

  configs = merge_overrides(
      load_configs(pipeline_config_path),
      hparams,
      train_steps=train_steps,
      eval_steps=eval_steps,
      **kwargs)
  model_config = configs['model']
  train_config = configs['train_config']
  train_input_config = configs['train_input_config']
  eval_config = configs['eval_config']
  eval_input_config = configs['eval_input_config']

  # Fall back to the step counts stored in the protos when none were given.
  if train_steps is None and train_config.num_steps:
    train_steps = train_config.num_steps
  if eval_steps is None and eval_config.num_examples:
    eval_steps = eval_config.num_examples

  detection_model_fn = functools.partial(
      model_builder.build, model_config=model_config)

  # Input functions for TRAIN and EVAL.
  train_input_fn = make_train_input_fn(
      train_config=train_config,
      train_input_config=train_input_config,
      model_config=model_config)
  eval_input_fn = make_eval_input_fn(
      eval_config=eval_config,
      eval_input_config=eval_input_config,
      model_config=model_config)

  # Export strategy built around the PREDICT serving input function.
  serving_input_fn = make_predict_input_fn(model_config=model_config)
  export_strategies = [
      tf.contrib.learn.utils.saved_model_export_utils.make_export_strategy(
          serving_input_fn=serving_input_fn)
  ]

  model_fn = model_fn_creator(detection_model_fn, configs, hparams)
  estimator = tf.estimator.Estimator(model_fn=model_fn, config=run_config)

  if run_config.is_chief:
    # Store the final pipeline config for traceability.
    final_pipeline_proto = configs_to_pipeline_proto(configs)
    if not file_io.file_exists(estimator.model_dir):
      file_io.recursive_create_dir(estimator.model_dir)
    final_config_path = os.path.join(estimator.model_dir, 'pipeline.config')
    final_config_text = text_format.MessageToString(final_pipeline_proto)
    with tf.gfile.Open(final_config_path, 'wb') as config_file:
      tf.logging.info('Writing as-run pipeline config file to %s',
                      final_config_path)
      config_file.write(final_config_text)

  return tf.contrib.learn.Experiment(
      estimator=estimator,
      train_input_fn=train_input_fn,
      eval_input_fn=eval_input_fn,
      train_steps=train_steps,
      eval_steps=eval_steps,
      export_strategies=export_strategies,
      eval_delay_secs=120)


def main(unused_argv):
  """Entry point: marks the required flags and launches the experiment.

  Args:
    unused_argv: Command-line arguments passed by `tf.app.run`; ignored.
  """
  for required_flag in ('model_dir', 'pipeline_config_path'):
    tf.flags.mark_flag_as_required(required_flag)

  run_config = tf.contrib.learn.RunConfig(model_dir=FLAGS.model_dir)
  experiment_fn = build_experiment_fn(FLAGS.num_train_steps,
                                      FLAGS.num_eval_steps)
  learn_runner.run(
      experiment_fn=experiment_fn,
      run_config=run_config,
      hparams=model_hparams.create_hparams())


if __name__ == '__main__':
  # tf.app.run() parses the flags and then invokes main().
  tf.app.run()