Python source code of ssd_resnet_v1_fpn_feature_extractor.py

Traffic-Rule-Violation-Detection-System-master
- BUILD
- matchers
  - BUILD
  - bipartite_matcher_test.py
  - argmax_matcher.py
  - __init__.py
  - argmax_matcher_test.py
  - bipartite_matcher.py
- object_detection_tutorial.ipynb
- evaluator.py
- samples
  - cloud
    - cloud.yml
  - configs
    - faster_rcnn_resnet101_voc07.config
    - faster_rcnn_inception_resnet_v2_atrous_oid.config
    - BUILD
    - faster_rcnn_resnet101_pets.config
    - faster_rcnn_nas_coco.config
    - faster_rcnn_resnet101_kitti.config
    - ssd_mobilenet_v1_coco.config
    - ssd_mobilenet_v1_focal_loss_pets.config
    - faster_rcnn_resnet50_pets.config
    - ssd_inception_v2_pets.config
    - faster_rcnn_resnet152_coco.config
    - mask_rcnn_resnet101_atrous_coco.config
    - mask_rcnn_resnet101_pets.config
    - ssd_inception_v2_coco.config
    - mask_rcnn_inception_resnet_v2_atrous_coco.config
    - faster_rcnn_inception_resnet_v2_atrous_cosine_lr_coco.config
    - ssd_mobilenet_v1_focal_loss_coco.config
    - faster_rcnn_resnet101_atrous_coco.config
    - faster_rcnn_inception_v2_coco.config
    - mask_rcnn_inception_v2_coco.config
    - rfcn_resnet101_pets.config
    - ssd_inception_v3_pets.config
    - faster_rcnn_inception_v2_pets.config
    - faster_rcnn_resnet152_pets.config
    - faster_rcnn_inception_resnet_v2_atrous_coco.config
    - embedded_ssd_mobilenet_v1_coco.config
    - ssd_mobilenet_v1_pets.config
    - faster_rcnn_inception_resnet_v2_atrous_pets.config
    - faster_rcnn_resnet101_coco.config
    - mask_rcnn_resnet50_atrous_coco.config
    - faster_rcnn_resnet50_coco.config
    - rfcn_resnet101_coco.config
- utils
  - json_utils_test.py
  - BUILD
  - np_mask_ops.py
  - np_box_mask_list_ops.py
  - label_map_util_test.py
  - test_utils.py
  - np_mask_ops_test.py
  - np_box_list_test.py
  - ops.py
  - metrics_test.py
  - config_util_test.py
  - np_box_mask_list_test.py
  - config_util.py
  - metrics.py
  - category_util.py
  - visualization_utils.py
  - shape_utils.py
  - label_map_util.py
  - dataset_util.py
  - variables_helper.py
  - test_utils_test.py
  - np_box_list_ops.py
  - category_util_test.py
  - learning_schedules.py
  - np_box_mask_list.py
  - static_shape.py
  - np_box_ops.py
  - dataset_util_test.py
  - variables_helper_test.py
  - test_case.py
  - visualization_utils_test.py
  - learning_schedules_test.py
  - __init__.py
  - static_shape_test.py
  - shape_utils_test.py
  - ops_test.py
  - per_image_evaluation.py
  - np_box_list_ops_test.py
  - np_box_ops_test.py
  - np_box_list.py
  - np_box_mask_list_ops_test.py
  - object_detection_evaluation_test.py
  - json_utils.py
  - per_image_evaluation_test.py
  - object_detection_evaluation.py
- test_images
  - BUILD
  - image_info.txt
- eval.py
- jsoner.py
- g3doc
  - running_on_cloud.md
  - instance_segmentation.md
  - running_pets.md
  - configuring_jobs.md
  - img
  - defining_your_own_model.md
  - running_locally.md
  - running_notebook.md
  - installation.md
  - using_your_own_dataset.md
  - detection_model_zoo.md
  - preparing_inputs.md
  - oid_inference_and_evaluation.md
  - evaluation_protocols.md
  - exporting_models.md
- LicensePlate_detection_tutorial.py
- model_tpu.py
- test_ckpt
- tesser.py
- builders
  - anchor_generator_builder.py
  - BUILD
  - optimizer_builder_test.py
  - image_resizer_builder_test.py
  - anchor_generator_builder_test.py
  - post_processing_builder_test.py
  - region_similarity_calculator_builder_test.py
  - preprocessor_builder_test.py
  - box_coder_builder.py
  - optimizer_builder.py
  - losses_builder_test.py
  - hyperparams_builder.py
  - matcher_builder.py
  - image_resizer_builder.py
  - post_processing_builder.py
  - box_predictor_builder.py
  - box_predictor_builder_test.py
  - input_reader_builder_test.py
  - hyperparams_builder_test.py
  - model_builder_test.py
  - losses_builder.py
  - __init__.py
  - input_reader_builder.py
  - dataset_builder.py
  - dataset_builder_test.py
  - preprocessor_builder.py
  - matcher_builder_test.py
  - box_coder_builder_test.py
  - region_similarity_calculator_builder.py
  - model_builder.py
- model_test.py
- inputs_test.py
- LICENSE
- protos
  - bipartite_matcher.proto
  - matcher_pb2.py
  - mean_stddev_box_coder_pb2.py
  - BUILD
  - faster_rcnn_box_coder.proto
  - train.proto
  - ssd_pb2.py
  - model.proto
  - faster_rcnn.proto
  - eval.proto
  - string_int_label_map.proto
  - keypoint_box_coder.proto
  - preprocessor.proto
  - region_similarity_calculator_pb2.py
  - hyperparams.proto
  - train_pb2.py
  - box_predictor_pb2.py
  - region_similarity_calculator.proto
  - image_resizer.proto
  - hyperparams_pb2.py
  - input_reader_pb2.py
  - ssd_anchor_generator.proto
  - keypoint_box_coder_pb2.py
  - multiscale_anchor_generator_pb2.py
  - model_pb2.py
  - argmax_matcher_pb2.py
  - input_reader.proto
  - faster_rcnn_box_coder_pb2.py
  - grid_anchor_generator_pb2.py
  - post_processing_pb2.py
  - pipeline.proto
  - string_int_label_map_pb2.py
  - square_box_coder.proto
  - optimizer_pb2.py
  - eval_pb2.py
  - optimizer.proto
  - image_resizer_pb2.py
  - argmax_matcher.proto
  - losses.proto
  - box_predictor.proto
  - __init__.py
  - pipeline_pb2.py
  - square_box_coder_pb2.py
  - matcher.proto
  - losses_pb2.py
  - post_processing.proto
  - ssd_anchor_generator_pb2.py
  - ssd.proto
  - anchor_generator_pb2.py
  - multiscale_anchor_generator.proto
  - box_coder.proto
  - grid_anchor_generator.proto
  - preprocessor_pb2.py
  - faster_rcnn_pb2.py
  - box_coder_pb2.py
  - anchor_generator.proto
  - bipartite_matcher_pb2.py
  - mean_stddev_box_coder.proto
- object_detection_tutorial.py
- models
  - faster_rcnn_inception_v2_feature_extractor.py
  - faster_rcnn_inception_resnet_v2_feature_extractor_test.py
  - feature_map_generators.py
  - BUILD
  - ssd_inception_v3_feature_extractor.py
  - ssd_resnet_v1_fpn_feature_extractor_test.py
  - ssd_inception_v3_feature_extractor_test.py
  - ssd_feature_extractor_test.py
  - faster_rcnn_resnet_v1_feature_extractor_test.py
  - ssd_inception_v2_feature_extractor_test.py
  - ssd_inception_v2_feature_extractor.py
  - embedded_ssd_mobilenet_v1_feature_extractor_test.py
  - faster_rcnn_resnet_v1_feature_extractor.py
  - feature_map_generators_test.py
  - faster_rcnn_inception_v2_feature_extractor_test.py
  - ssd_resnet_v1_fpn_feature_extractor.py
  - ssd_mobilenet_v1_feature_extractor_test.py
  - __init__.py
  - faster_rcnn_nas_feature_extractor.py
  - embedded_ssd_mobilenet_v1_feature_extractor.py
  - ssd_mobilenet_v1_feature_extractor.py
  - faster_rcnn_inception_resnet_v2_feature_extractor.py
  - faster_rcnn_nas_feature_extractor_test.py
  - ssd_resnet_v1_fpn_feature_extractor_testbase.py
- detector.py
- inputs.py
- CONTRIBUTING.md
- dataset_tools
  - BUILD
  - create_pascal_tf_record_test.py
  - create_coco_tf_record_test.py
  - create_kitti_tf_record.py
  - download_and_preprocess_mscoco.sh
  - create_coco_tf_record.py
  - oid_tfrecord_creation_test.py
  - create_pet_tf_record.py
  - create_oid_tf_record.py
  - create_kitti_tf_record_test.py
  - __init__.py
  - create_pascal_tf_record.py
  - oid_tfrecord_creation.py
- VehicleMoniter.py
- anchor_generators
  - BUILD
  - multiple_grid_anchor_generator.py
  - multiscale_grid_anchor_generator_test.py
  - multiple_grid_anchor_generator_test.py
  - __init__.py
  - grid_anchor_generator_test.py
  - multiscale_grid_anchor_generator.py
  - grid_anchor_generator.py
- exporter.py
- Cars
  - car_label_map.pbtxt
  - ssd_inception_v2_car.config
- export_inference_graph.py
- model.py
- downsample.py
- data
  - BUILD
  - pascal_label_map.pbtxt
  - kitti_label_map.pbtxt
  - train_labels.csv
  - oid_bbox_trainable_label_map.pbtxt
  - pet_label_map.pbtxt
  - License-Plate-Detection.pbtxt
  - test_labels.csv
  - mscoco_label_map.pbtxt
- model_test_util.py
- meta_architectures
  - BUILD
  - faster_rcnn_meta_arch.py
  - faster_rcnn_meta_arch_test_lib.py
  - ssd_meta_arch.py
  - rfcn_meta_arch.py
  - faster_rcnn_meta_arch_test.py
  - __init__.py
  - rfcn_meta_arch_test.py
  - ssd_meta_arch_test.py
- testoutput.avi
- train.py
- __init__.py
- eval_util.py
- lp.py
- README.md
- core
  - BUILD
  - box_predictor_test.py
  - balanced_positive_negative_sampler.py
  - preprocessor_cache.py
  - prefetcher.py
  - region_similarity_calculator.py
  - batcher.py
  - box_list_test.py
  - post_processing_test.py
  - matcher_test.py
  - minibatch_sampler_test.py
  - target_assigner.py
  - preprocessor.py
  - minibatch_sampler.py
  - data_decoder.py
  - keypoint_ops.py
  - keypoint_ops_test.py
  - losses.py
  - box_predictor.py
  - post_processing.py
  - box_list_ops.py
  - box_list.py
  - balanced_positive_negative_sampler_test.py
  - box_list_ops_test.py
  - model.py
  - matcher.py
  - standard_fields.py
  - region_similarity_calculator_test.py
  - box_coder.py
  - __init__.py
  - box_coder_test.py
  - preprocessor_test.py
  - target_assigner_test.py
  - batcher_test.py
  - data_parser.py
  - anchor_generator.py
  - prefetcher_test.py
  - losses_test.py
- inference
  - BUILD
  - infer_detections.py
  - detection_inference.py
  - __init__.py
  - detection_inference_test.py
- trainer_test.py
- trainer.py
- metrics
  - offline_eval_map_corloc_test.py
  - BUILD
  - offline_eval_map_corloc.py
  - __init__.py
  - tf_example_parser.py
  - coco_tools_test.py
  - tf_example_parser_test.py
  - coco_evaluation_test.py
  - coco_tools.py
  - coco_evaluation.py
- vehicle.py
- Rule Breakers
  - rules.txt
- LP
- .gitignore
- box_coders
  - BUILD
  - keypoint_box_coder.py
  - square_box_coder_test.py
  - faster_rcnn_box_coder_test.py
  - mean_stddev_box_coder.py
  - mean_stddev_box_coder_test.py
  - keypoint_box_coder_test.py
  - faster_rcnn_box_coder.py
  - __init__.py
  - square_box_coder.py
- data_decoders
  - BUILD
  - tf_example_decoder_test.py
  - __init__.py
  - tf_example_decoder.py
- model_hparams.py
- exporter_test.py

"""SSD Feature Pyramid Network (FPN) feature extractors based on Resnet v1.

See https://arxiv.org/abs/1708.02002 for details.
"""

import tensorflow as tf

from object_detection.meta_architectures import ssd_meta_arch
from object_detection.models import feature_map_generators
from object_detection.utils import ops
from object_detection.utils import shape_utils
from nets import resnet_v1

slim = tf.contrib.slim


class _SSDResnetV1FpnFeatureExtractor(ssd_meta_arch.SSDFeatureExtractor):
  """SSD FPN feature extractor based on Resnet v1 architecture.

  Runs the configured Resnet v1 base network, keeps its `block2`, `block3` and
  `block4` endpoints, stacks two extra stride-2 3x3 convolutions on top of
  `block4`, and feeds all five maps to
  `feature_map_generators.fpn_top_down_feature_maps`.
  """

  def __init__(self,
               is_training,
               depth_multiplier,
               min_depth,
               pad_to_multiple,
               conv_hyperparams,
               resnet_base_fn,
               resnet_scope_name,
               fpn_scope_name,
               batch_norm_trainable=True,
               reuse_weights=None,
               use_explicit_padding=False,
               use_depthwise=False):
    """SSD FPN feature extractor based on Resnet v1 architecture.

    Args:
      is_training: whether the network is in training mode.
      depth_multiplier: float depth multiplier for feature extractor.
        UNUSED currently; only 1.0 is accepted.
      min_depth: minimum feature extractor depth. UNUSED Currently.
      pad_to_multiple: the nearest multiple to zero pad the input height and
        width dimensions to.
      conv_hyperparams: tf slim arg_scope for conv2d and separable_conv2d ops.
      resnet_base_fn: base resnet network to use.
      resnet_scope_name: scope name under which to construct resnet
      fpn_scope_name: scope name under which to construct the feature pyramid
        network.
      batch_norm_trainable: Whether to update batch norm parameters during
        training or not. When training with a small batch size
        (e.g. 1), it is desirable to disable batch norm update and use
        pretrained batch norm params.
      reuse_weights: Whether to reuse variables. Default is None.
      use_explicit_padding: Whether to use explicit padding when extracting
        features. Default is False. UNUSED currently; a truthy value is
        rejected.
      use_depthwise: Whether to use depthwise convolutions. UNUSED currently;
        it is accepted but not forwarded to the base class.

    Raises:
      ValueError: if `depth_multiplier` is not 1.0 or `use_explicit_padding`
        is set.
    """
    super(_SSDResnetV1FpnFeatureExtractor, self).__init__(
        is_training, depth_multiplier, min_depth, pad_to_multiple,
        conv_hyperparams, batch_norm_trainable, reuse_weights,
        use_explicit_padding)
    if self._depth_multiplier != 1.0:
      raise ValueError('Only depth 1.0 is supported, found: {}'.
                       format(self._depth_multiplier))
    # Truthiness check instead of `is True` so that any enabled value is
    # rejected, not only the exact singleton `True`.
    if self._use_explicit_padding:
      raise ValueError('Explicit padding is not a valid option.')
    self._resnet_base_fn = resnet_base_fn
    self._resnet_scope_name = resnet_scope_name
    self._fpn_scope_name = fpn_scope_name

  def preprocess(self, resized_inputs):
    """SSD preprocessing.

    VGG style channel mean subtraction as described here:
    https://gist.github.com/ksimonyan/211839e770f7b538e2d8#file-readme-mdnge.

    Args:
      resized_inputs: a [batch, height, width, channels] float tensor
        representing a batch of images.

    Returns:
      preprocessed_inputs: a [batch, height, width, channels] float tensor
        representing a batch of images.
    """
    channel_means = [123.68, 116.779, 103.939]
    # The nested list gives the means shape [1, 1, 3] so they broadcast over
    # the batch, height and width dimensions.
    return resized_inputs - [[channel_means]]

  def _filter_features(self, image_features):
    """Keeps only the resnet endpoints consumed by the feature pyramid.

    Args:
      image_features: dict mapping scoped endpoint names (components separated
        by '/') to feature tensors.

    Returns:
      A new dict keyed by the last scope component, holding only the
      'block2', 'block3' and 'block4' entries.
    """
    # TODO: Change resnet endpoint to strip scope prefixes instead
    # of munging the scope here.
    wanted_endpoints = ('block2', 'block3', 'block4')
    filtered_image_features = {}
    for key, feature in image_features.items():
      feature_name = key.split('/')[-1]
      if feature_name in wanted_endpoints:
        filtered_image_features[feature_name] = feature
    return filtered_image_features

  def extract_features(self, preprocessed_inputs):
    """Extract features from preprocessed inputs.

    Args:
      preprocessed_inputs: a [batch, height, width, channels] float tensor
        representing a batch of images.

    Returns:
      feature_maps: a list of tensors where the ith tensor has shape
        [batch, height_i, width_i, depth_i]

    Raises:
      ValueError: depth multiplier is not supported.
    """
    if self._depth_multiplier != 1.0:
      raise ValueError('Depth multiplier not supported.')

    # Pass the inputs through the minimum-image-dimension check (129).
    preprocessed_inputs = shape_utils.check_min_image_dim(
        129, preprocessed_inputs)

    with tf.variable_scope(
        self._resnet_scope_name, reuse=self._reuse_weights) as scope:
      with slim.arg_scope(resnet_v1.resnet_arg_scope()):
        # The resnet is put in training mode only when the extractor is
        # training AND batch norm updates are enabled.
        _, image_features = self._resnet_base_fn(
            inputs=ops.pad_to_multiple(preprocessed_inputs,
                                       self._pad_to_multiple),
            num_classes=None,
            is_training=self._is_training and self._batch_norm_trainable,
            global_pool=False,
            output_stride=None,
            store_non_strided_activations=True,
            scope=scope)
      image_features = self._filter_features(image_features)
      last_feature_map = image_features['block4']
    with tf.variable_scope(self._fpn_scope_name, reuse=self._reuse_weights):
      with slim.arg_scope(self._conv_hyperparams):
        # Extend the bottom-up pathway with two extra stride-2 levels
        # ('bottomup_5' and 'bottomup_6'), each built on the previous one.
        for i in range(5, 7):
          last_feature_map = slim.conv2d(
              last_feature_map,
              num_outputs=256,
              kernel_size=[3, 3],
              stride=2,
              padding='SAME',
              scope='block{}'.format(i))
          image_features['bottomup_{}'.format(i)] = last_feature_map
        feature_maps = feature_map_generators.fpn_top_down_feature_maps(
            [
                image_features[key] for key in
                ['block2', 'block3', 'block4', 'bottomup_5', 'bottomup_6']
            ],
            depth=256,
            scope='top_down_features')
    # Materialize the values: on Python 3 `.values()` is a view that cannot be
    # indexed, whereas the documented contract is a list.
    return list(feature_maps.values())


class SSDResnet50V1FpnFeatureExtractor(_SSDResnetV1FpnFeatureExtractor):
  """SSD FPN feature extractor that uses `resnet_v1.resnet_v1_50` as its base."""

  def __init__(self,
               is_training,
               depth_multiplier,
               min_depth,
               pad_to_multiple,
               conv_hyperparams,
               batch_norm_trainable=True,
               reuse_weights=None,
               use_explicit_padding=False,
               use_depthwise=False):
    """Builds the Resnet50 v1 FPN feature extractor for SSD models.

    The resnet is constructed under the 'resnet_v1_50' scope and the feature
    pyramid under the 'fpn' scope.

    Args:
      is_training: whether the network is in training mode.
      depth_multiplier: float depth multiplier for feature extractor.
      min_depth: minimum feature extractor depth.
      pad_to_multiple: the nearest multiple to zero pad the input height and
        width dimensions to.
      conv_hyperparams: tf slim arg_scope for conv2d and separable_conv2d ops.
      batch_norm_trainable: Whether to update batch norm parameters during
        training or not. When training with a small batch size
        (e.g. 1), it is desirable to disable batch norm update and use
        pretrained batch norm params.
      reuse_weights: Whether to reuse variables. Default is None.
      use_explicit_padding: Whether to use explicit padding when extracting
        features. Default is False. UNUSED currently.
      use_depthwise: Whether to use depthwise convolutions. UNUSED currently;
        it is not forwarded to the base class.
    """
    super(SSDResnet50V1FpnFeatureExtractor, self).__init__(
        is_training=is_training,
        depth_multiplier=depth_multiplier,
        min_depth=min_depth,
        pad_to_multiple=pad_to_multiple,
        conv_hyperparams=conv_hyperparams,
        resnet_base_fn=resnet_v1.resnet_v1_50,
        resnet_scope_name='resnet_v1_50',
        fpn_scope_name='fpn',
        batch_norm_trainable=batch_norm_trainable,
        reuse_weights=reuse_weights,
        use_explicit_padding=use_explicit_padding)


class SSDResnet101V1FpnFeatureExtractor(_SSDResnetV1FpnFeatureExtractor):
  """SSD FPN feature extractor that uses `resnet_v1.resnet_v1_101` as its base."""

  def __init__(self,
               is_training,
               depth_multiplier,
               min_depth,
               pad_to_multiple,
               conv_hyperparams,
               batch_norm_trainable=True,
               reuse_weights=None,
               use_explicit_padding=False,
               use_depthwise=False):
    """Builds the Resnet101 v1 FPN feature extractor for SSD models.

    The resnet is constructed under the 'resnet_v1_101' scope and the feature
    pyramid under the 'fpn' scope.

    Args:
      is_training: whether the network is in training mode.
      depth_multiplier: float depth multiplier for feature extractor.
      min_depth: minimum feature extractor depth.
      pad_to_multiple: the nearest multiple to zero pad the input height and
        width dimensions to.
      conv_hyperparams: tf slim arg_scope for conv2d and separable_conv2d ops.
      batch_norm_trainable: Whether to update batch norm parameters during
        training or not. When training with a small batch size
        (e.g. 1), it is desirable to disable batch norm update and use
        pretrained batch norm params.
      reuse_weights: Whether to reuse variables. Default is None.
      use_explicit_padding: Whether to use explicit padding when extracting
        features. Default is False. UNUSED currently.
      use_depthwise: Whether to use depthwise convolutions. UNUSED currently;
        it is not forwarded to the base class.
    """
    super(SSDResnet101V1FpnFeatureExtractor, self).__init__(
        is_training=is_training,
        depth_multiplier=depth_multiplier,
        min_depth=min_depth,
        pad_to_multiple=pad_to_multiple,
        conv_hyperparams=conv_hyperparams,
        resnet_base_fn=resnet_v1.resnet_v1_101,
        resnet_scope_name='resnet_v1_101',
        fpn_scope_name='fpn',
        batch_norm_trainable=batch_norm_trainable,
        reuse_weights=reuse_weights,
        use_explicit_padding=use_explicit_padding)


class SSDResnet152V1FpnFeatureExtractor(_SSDResnetV1FpnFeatureExtractor):
  """SSD FPN feature extractor that uses `resnet_v1.resnet_v1_152` as its base."""

  def __init__(self,
               is_training,
               depth_multiplier,
               min_depth,
               pad_to_multiple,
               conv_hyperparams,
               batch_norm_trainable=True,
               reuse_weights=None,
               use_explicit_padding=False,
               use_depthwise=False):
    """Builds the Resnet152 v1 FPN feature extractor for SSD models.

    The resnet is constructed under the 'resnet_v1_152' scope and the feature
    pyramid under the 'fpn' scope.

    Args:
      is_training: whether the network is in training mode.
      depth_multiplier: float depth multiplier for feature extractor.
      min_depth: minimum feature extractor depth.
      pad_to_multiple: the nearest multiple to zero pad the input height and
        width dimensions to.
      conv_hyperparams: tf slim arg_scope for conv2d and separable_conv2d ops.
      batch_norm_trainable: Whether to update batch norm parameters during
        training or not. When training with a small batch size
        (e.g. 1), it is desirable to disable batch norm update and use
        pretrained batch norm params.
      reuse_weights: Whether to reuse variables. Default is None.
      use_explicit_padding: Whether to use explicit padding when extracting
        features. Default is False. UNUSED currently.
      use_depthwise: Whether to use depthwise convolutions. UNUSED currently;
        it is not forwarded to the base class.
    """
    super(SSDResnet152V1FpnFeatureExtractor, self).__init__(
        is_training=is_training,
        depth_multiplier=depth_multiplier,
        min_depth=min_depth,
        pad_to_multiple=pad_to_multiple,
        conv_hyperparams=conv_hyperparams,
        resnet_base_fn=resnet_v1.resnet_v1_152,
        resnet_scope_name='resnet_v1_152',
        fpn_scope_name='fpn',
        batch_norm_trainable=batch_norm_trainable,
        reuse_weights=reuse_weights,
        use_explicit_padding=use_explicit_padding)