# Copyright (c) 2017-present, Facebook, Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
##############################################################################

"""Construct minibatches for Fast R-CNN training. Handles the minibatch blobs
that are specific to Fast R-CNN. Other blobs that are generic to RPN, etc.
are handled by their respective roi_data modules.
"""

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
from __future__ import unicode_literals

import logging
import numpy as np
import numpy.random as npr

from core.config import cfg
import modeling.FPN as fpn
import roi_data.keypoint_rcnn
import roi_data.mask_rcnn
import utils.blob as blob_utils
import utils.boxes as box_utils

logger = logging.getLogger(__name__)


def get_fast_rcnn_blob_names(is_training=True):
    """Fast R-CNN blob names."""
    # rois blob: holds R regions of interest, each is a 5-tuple
    # (batch_idx, x1, y1, x2, y2) specifying an image batch index and a
    # rectangle (x1, y1, x2, y2)
    blob_names = ['rois']
    if is_training:
        # labels_int32 blob: R categorical labels in [0, ..., K] for K
        # foreground classes plus background
        blob_names += ['labels_int32']
        # bbox_targets blob: R bounding-box regression targets with 4
        # targets per class
        blob_names += ['bbox_targets']
        # bbox_inside_weights blob: At most 4 targets per roi are active;
        # this binary vector specifies the subset of active targets
        blob_names += ['bbox_inside_weights']
        blob_names += ['bbox_outside_weights']
    if is_training and cfg.MODEL.MASK_ON:
        # 'mask_rois': RoIs sampled for training the mask prediction branch.
        # Shape is (#masks, 5) in format (batch_idx, x1, y1, x2, y2).
        blob_names += ['mask_rois']
        # 'roi_has_mask_int32': binary labels for the RoIs specified in 'rois'
        # indicating if each RoI has a mask or not. Note that a *bg* RoI will
        # have an all -1 (ignore) mask associated with it when no fg RoIs can
        # be sampled. Shape is (#rois).
        blob_names += ['roi_has_mask_int32']
        # 'masks_int32' holds binary masks for the RoIs specified in
        # 'mask_rois'. Shape is (#fg, M * M) where M is the ground truth
        # mask size.
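        # (e.g. if M were 28, each row would hold 28 * 28 = 784 binary values)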
        blob_names += ['masks_int32']
    if is_training and cfg.MODEL.KEYPOINTS_ON:
        # 'keypoint_rois': RoIs sampled for training the keypoint prediction
        # branch. Shape is (#instances, 5) in format (batch_idx, x1, y1, x2,
        # y2).
        blob_names += ['keypoint_rois']
        # 'keypoint_locations_int32': index of keypoint in
        # KRCNN.HEATMAP_SIZE**2 sized array. Shape is (#instances). Used in
        # SoftmaxWithLoss.
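        # (e.g. if cfg.KRCNN.HEATMAP_SIZE were 56, each entry would be a
        # flattened index into a 56 x 56 heatmap, i.e. a value in [0, 3136))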
        blob_names += ['keypoint_locations_int32']
        # 'keypoint_weights': weight assigned to each target in
        # 'keypoint_locations_int32'. Shape is (#instances). Used in
        # SoftmaxWithLoss.
        blob_names += ['keypoint_weights']
        # 'keypoint_loss_normalizer': optional normalization factor to use if
        # cfg.KRCNN.NORMALIZE_BY_VISIBLE_KEYPOINTS is False.
        blob_names += ['keypoint_loss_normalizer']
    if cfg.FPN.FPN_ON and cfg.FPN.MULTILEVEL_ROIS:
        # Support for FPN multi-level rois without bbox reg isn't
        # implemented (... and may never be implemented)
        k_max = cfg.FPN.ROI_MAX_LEVEL
        k_min = cfg.FPN.ROI_MIN_LEVEL
        # Same format as rois blob, but one per FPN level
        for lvl in range(k_min, k_max + 1):
            blob_names += ['rois_fpn' + str(lvl)]
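        # 'rois_idx_restore_int32': permutation used downstream to restore the
        # original RoI ordering after the per-level blobs are concatenated
        # (see modeling.FPN.add_multilevel_roi_blobs)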
        blob_names += ['rois_idx_restore_int32']
        if is_training:
            if cfg.MODEL.MASK_ON:
                for lvl in range(k_min, k_max + 1):
                    blob_names += ['mask_rois_fpn' + str(lvl)]
                blob_names += ['mask_rois_idx_restore_int32']
            if cfg.MODEL.KEYPOINTS_ON:
                for lvl in range(k_min, k_max + 1):
                    blob_names += ['keypoint_rois_fpn' + str(lvl)]
                blob_names += ['keypoint_rois_idx_restore_int32']
    return blob_names


def add_fast_rcnn_blobs(blobs, im_scales, roidb):
    """Add blobs needed for training Fast R-CNN style models."""
    # Sample training RoIs from each image and append them to the blob lists
    for im_i, entry in enumerate(roidb):
        frcn_blobs = _sample_rois(entry, im_scales[im_i], im_i)
        for k, v in frcn_blobs.items():
            blobs[k].append(v)
    # Concat the training blob lists into tensors
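    # (blobs that are not per-image lists, or whose lists are empty, are left
    # untouched)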
    for k, v in blobs.items():
        if isinstance(v, list) and len(v) > 0:
            blobs[k] = np.concatenate(v)
    # Add FPN multilevel training RoIs, if configured
    if cfg.FPN.FPN_ON and cfg.FPN.MULTILEVEL_ROIS:
        _add_multilevel_rois(blobs)

    # Perform any final work and validity checks after collating the blobs for
    # all minibatch images
    valid = True
    if cfg.MODEL.KEYPOINTS_ON:
        valid = roi_data.keypoint_rcnn.finalize_keypoint_minibatch(blobs, valid)

    return valid


def _sample_rois(roidb, im_scale, batch_idx):
    """Generate a random sample of RoIs comprising foreground and background
    examples.
    """
    rois_per_image = int(cfg.TRAIN.BATCH_SIZE_PER_IM)
    fg_rois_per_image = int(np.round(cfg.TRAIN.FG_FRACTION * rois_per_image))
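    # For example, with cfg.TRAIN.BATCH_SIZE_PER_IM = 512 and
    # cfg.TRAIN.FG_FRACTION = 0.25, at most 128 of the 512 RoIs sampled from
    # this image will be foreground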
    max_overlaps = roidb['max_overlaps']

    # Select foreground RoIs as those with >= FG_THRESH overlap
    fg_inds = np.where(max_overlaps >= cfg.TRAIN.FG_THRESH)[0]
    # Guard against the case when an image has fewer than fg_rois_per_image
    # foreground RoIs
    fg_rois_per_this_image = np.minimum(fg_rois_per_image, fg_inds.size)
    # Sample foreground regions without replacement
    if fg_inds.size > 0:
        fg_inds = npr.choice(
            fg_inds, size=fg_rois_per_this_image, replace=False
        )

    # Select background RoIs as those within [BG_THRESH_LO, BG_THRESH_HI)
    bg_inds = np.where(
        (max_overlaps < cfg.TRAIN.BG_THRESH_HI) &
        (max_overlaps >= cfg.TRAIN.BG_THRESH_LO)
    )[0]
    # Compute number of background RoIs to take from this image (guarding
    # against there being fewer than desired)
    bg_rois_per_this_image = rois_per_image - fg_rois_per_this_image
    bg_rois_per_this_image = np.minimum(bg_rois_per_this_image, bg_inds.size)
    # Sample background regions without replacement
    if bg_inds.size > 0:
        bg_inds = npr.choice(
            bg_inds, size=bg_rois_per_this_image, replace=False
        )

    # The indices that we're selecting (both fg and bg)
    keep_inds = np.append(fg_inds, bg_inds)
    # Label is the class each RoI has max overlap with
    sampled_labels = roidb['max_classes'][keep_inds]
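    # fg indices come first in keep_inds, so entries from position
    # fg_rois_per_this_image onward correspond to background RoIs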
    sampled_labels[fg_rois_per_this_image:] = 0  # Label bg RoIs with class 0
    sampled_boxes = roidb['boxes'][keep_inds]

    if 'bbox_targets' not in roidb:
        gt_inds = np.where(roidb['gt_classes'] > 0)[0]
        gt_boxes = roidb['boxes'][gt_inds, :]
        gt_assignments = gt_inds[roidb['box_to_gt_ind_map'][keep_inds]]
        bbox_targets = _compute_targets(
            sampled_boxes, gt_boxes[gt_assignments, :], sampled_labels
        )
        bbox_targets, bbox_inside_weights = _expand_bbox_targets(bbox_targets)
    else:
        bbox_targets, bbox_inside_weights = _expand_bbox_targets(
            roidb['bbox_targets'][keep_inds, :]
        )

    bbox_outside_weights = np.array(
        bbox_inside_weights > 0, dtype=bbox_inside_weights.dtype
    )
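    # (i.e. bbox_outside_weights is a binary 0/1 mask over the same 4K
    # columns, marking exactly the targets activated by bbox_inside_weights)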

    # Scale rois and format as (batch_idx, x1, y1, x2, y2)
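    # (e.g. an (R, 4) array of boxes in original image coordinates becomes an
    # (R, 5) array of rows in the scaled, network-input coordinate frame)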
    sampled_rois = sampled_boxes * im_scale
    repeated_batch_idx = batch_idx * blob_utils.ones((sampled_rois.shape[0], 1))
    sampled_rois = np.hstack((repeated_batch_idx, sampled_rois))

    # Base Fast R-CNN blobs
    blob_dict = dict(
        labels_int32=sampled_labels.astype(np.int32, copy=False),
        rois=sampled_rois,
        bbox_targets=bbox_targets,
        bbox_inside_weights=bbox_inside_weights,
        bbox_outside_weights=bbox_outside_weights
    )

    # Optionally add Mask R-CNN blobs
    if cfg.MODEL.MASK_ON:
        roi_data.mask_rcnn.add_mask_rcnn_blobs(
            blob_dict, sampled_boxes, roidb, im_scale, batch_idx
        )

    # Optionally add Keypoint R-CNN blobs
    if cfg.MODEL.KEYPOINTS_ON:
        roi_data.keypoint_rcnn.add_keypoint_rcnn_blobs(
            blob_dict, roidb, fg_rois_per_image, fg_inds, im_scale, batch_idx
        )

    return blob_dict


def _compute_targets(ex_rois, gt_rois, labels):
    """Compute bounding-box regression targets for an image."""

    assert ex_rois.shape[0] == gt_rois.shape[0]
    assert ex_rois.shape[1] == 4
    assert gt_rois.shape[1] == 4

    targets = box_utils.bbox_transform_inv(
        ex_rois, gt_rois, cfg.MODEL.BBOX_REG_WEIGHTS
    )
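    # (targets holds per-RoI (dx, dy, dw, dh) deltas that map each example box
    # onto its matched ground-truth box; box_utils.bbox_transform_inv scales
    # them by cfg.MODEL.BBOX_REG_WEIGHTS)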
    return np.hstack((labels[:, np.newaxis], targets)).astype(
        np.float32, copy=False
    )


def _expand_bbox_targets(bbox_target_data):
    """Bounding-box regression targets are stored in a compact form in the
    roidb.

    This function expands those targets into the 4-of-4*K representation used
    by the network (i.e. only one class has non-zero targets). The loss weights
    are similarly expanded.

    Returns:
        bbox_target_data (ndarray): N x 4K blob of regression targets
        bbox_inside_weights (ndarray): N x 4K blob of loss weights
    """
    num_bbox_reg_classes = cfg.MODEL.NUM_CLASSES
    if cfg.MODEL.CLS_AGNOSTIC_BBOX_REG:
        num_bbox_reg_classes = 2  # bg and fg

    clss = bbox_target_data[:, 0]
    bbox_targets = blob_utils.zeros((clss.size, 4 * num_bbox_reg_classes))
    bbox_inside_weights = blob_utils.zeros(bbox_targets.shape)
    inds = np.where(clss > 0)[0]
    for ind in inds:
        cls = int(clss[ind])
        start = 4 * cls
        end = start + 4
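        # e.g. with class-specific regression, a RoI labeled class 3 writes
        # its 4 targets into columns 12:16 of the N x 4K blob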
        bbox_targets[ind, start:end] = bbox_target_data[ind, 1:]
        bbox_inside_weights[ind, start:end] = (1.0, 1.0, 1.0, 1.0)
    return bbox_targets, bbox_inside_weights


def _add_multilevel_rois(blobs):
    """By default training RoIs are added for a single feature map level only.
    When using FPN, the RoIs must be distributed over different FPN levels
    according to the level assignment heuristic (see
    modeling.FPN.map_rois_to_fpn_levels).
    """
    lvl_min = cfg.FPN.ROI_MIN_LEVEL
    lvl_max = cfg.FPN.ROI_MAX_LEVEL

    def _distribute_rois_over_fpn_levels(rois_blob_name):
        """Distribute rois over the different FPN levels."""
        # Get target level for each roi
        # Recall blob rois are in (batch_idx, x1, y1, x2, y2) format, hence take
        # the box coordinates from columns 1:5
        target_lvls = fpn.map_rois_to_fpn_levels(
            blobs[rois_blob_name][:, 1:5], lvl_min, lvl_max
        )
        # Add per FPN level roi blobs named like: <rois_blob_name>_fpn<lvl>
        fpn.add_multilevel_roi_blobs(
            blobs, rois_blob_name, blobs[rois_blob_name], target_lvls, lvl_min,
            lvl_max
        )

    _distribute_rois_over_fpn_levels('rois')
    if cfg.MODEL.MASK_ON:
        _distribute_rois_over_fpn_levels('mask_rois')
    if cfg.MODEL.KEYPOINTS_ON:
        _distribute_rois_over_fpn_levels('keypoint_rois')