python source code of ilsvrc

gluon-cv-master
- Makefile
- .gitmodules
- LICENSE
- setup.py
- README.md
- tests
  - lint.py
  - unittests
    - test_data_dataloader.py
    - test_utils_bbox.py
    - test_utils_parallel.py
    - test_model_zoo.py
    - test_data_datasets.py
    - common.py
    - test_data_transforms.py
    - test_utils_segmentation.py
    - test_lr_scheduler.py
    - test_utils_block.py
    - test_nn.py
    - test_utils_export.py
    - test_utils_viz.py
    - test_utils_metric.py
  - py3.yml
  - pylint.yml
  - pylintrc
  - py2.yml
- scripts
  - action-recognition
    - train_recognizer.py
    - test_recognizer.py
    - README.md
    - inference.py
    - feat_extract.py
  - datasets
    - kinetics400.py
    - ade20k.py
    - hmdb51.py
    - lsun.py
    - mscoco.py
    - ucf101.py
    - ilsvrc_vid.py
    - coco_tracking.py
    - ilsvrc_det.py
    - cityscapes.py
    - README.md
    - somethingsomethingv2.py
    - pascal_voc.py
    - market1501.py
    - mhp_v1.py
    - imagenet.py
  - instance
    - mask_rcnn
      - train_mask_rcnn.py
      - demo_mask_rcnn.py
      - README.md
      - eval_mask_rcnn.py
      - benchmark
        README.md
        ompi_bind_DGX1.sh
    - README.md
  - segmentation
    - train.py
    - README.md
    - test.py
  - detection
    - center_net
      - demo_center_net.py
      - train_center_net.py
      - eval_center_net.py
    - faster_rcnn
      - eval_faster_rcnn.py
      - README.md
      - demo_faster_rcnn.py
      - train_faster_rcnn.py
    - yolo
      - eval_yolo.py
      - train_yolo3.py
      - README.md
      - demo_yolo.py
    - demo_webcam_run.py
    - README.md
    - ssd
      - demo_ssd.py
      - eval_ssd.py
      - README.md
      - train_ssd.py
  - classification
    - cifar
      - train_cifar10.py
      - demo_cifar10.py
      - train_mixup_cifar10.py
      - README.md
    - finetune
      - prepare_minc.py
      - finetune_minc.py
    - imagenet
      - train_imagenet.py
      - verify_pretrained.py
      - train_imagenet_nasnet.py
      - train_horovod.py
      - imagenet_labels.txt
      - README.md
      - demo_imagenet.py
  - re-id
    - baseline
      - networks
        resnet.py
        __init__.py
      - train.py
      - README.md
      - test.py
  - pose
    - simple_pose
      - coco.sh
      - validate.py
      - demo.py
      - validate.sh
      - cam_demo.py
      - README.md
      - train_simple_pose.py
    - alpha_pose
      - coco.sh
      - validate.py
      - demo.py
      - train_alpha_pose.py
      - validate.sh
      - validate_tools.py
      - cam_demo.py
      - coco_dpg.sh
  - deployment
    - cpp-inference
      - src
        detect.cpp
        common.hpp
      - CMakeLists.txt
      - README.md
      - .gitignore
    - export
      - README.md
      - export_pretrained.py
      - .gitignore
    - README.md
  - gan
    - srgan
      - demo_srgan.py
      - download_dataset.py
      - __init__.py
      - README.md
      - train_srgan.py
    - wgan
      - lsun.py
      - train_wgan.py
      - README.md
    - cycle_gan
      - train_cgan.py
      - download_dataset.py
      - README.md
      - demo_cycle_gan.py
  - README.md
  - tracking
    - demo.py
    - train.py
    - test.py
    - benchmark.py
- gluoncv
  - utils
    - lr_scheduler.py
    - viz
      - keypoints.py
      - image.py
      - mask.py
      - bbox.py
      - __init__.py
      - segmentation.py
      - network.py
    - download.py
    - filesystem.py
    - compress_json.py
    - version.py
    - random.py
    - block.py
    - bbox.py
    - data
      - tracking.py
    - export_helper.py
    - __init__.py
    - metrics
      - heatmap_accuracy.py
      - coco_keypoints.py
      - coco_detection.py
      - tracking.py
      - accuracy.py
      - voc_detection.py
      - __init__.py
      - rcnn.py
      - segmentation.py
      - coco_instance.py
    - plot_history.py
    - parallel.py
    - transforms.py
    - sync_loader_helper.py
  - loss.py
  - nn
    - predictor.py
    - dropblock.py
    - sampler.py
    - block.py
    - coder.py
    - cython_bbox.pyx
    - gn.py
    - bbox.py
    - matcher.py
    - __init__.py
    - splat.py
    - feature.py
  - data
    - market1501
      - data_read.py
      - label_read.py
      - __init__.py
    - mixup
      - detection.py
      - __init__.py
    - pascal_voc
      - detection.py
      - __init__.py
      - segmentation.py
    - sampler.py
    - mscoco
      - keypoints.py
      - detection.py
      - instance.py
      - __init__.py
      - utils.py
      - segmentation.py
    - visdrone
      - detection.py
      - __init__.py
    - segbase.py
    - pascal_aug
      - __init__.py
      - segmentation.py
    - video_custom
      - classification.py
      - __init__.py
    - recordio
      - detection.py
      - __init__.py
    - somethingsomethingv2
      - classification.py
      - __init__.py
    - dataloader.py
    - hmdb51
      - classification.py
      - __init__.py
    - mhp.py
    - batchify.py
    - cityscapes.py
    - otb
      - tracking.py
      - __init__.py
    - __init__.py
    - ade20k
      - __init__.py
      - segmentation.py
    - ucf101
      - classification.py
      - __init__.py
    - lst
      - detection.py
      - __init__.py
    - tracking_data
      - __init__.py
      - track.py
    - imagenet
      - classification.py
      - __init__.py
    - transforms
      - image.py
      - presets
        simple_pose.py
        yolo.py
        __init__.py
        rcnn.py
        center_net.py
        segmentation.py
        imagenet.py
        alpha_pose.py
        ssd.py
      - block.py
      - pose.py
      - mask.py
      - bbox.py
      - video.py
      - __init__.py
      - experimental
        image.py
        bbox.py
        __init__.py
      - track.py
    - base.py
    - kinetics400
      - classification.py
      - __init__.py
  - __init__.py
  - model_zoo
    - center_net
      - deconv_resnet.py
      - deconv_dla.py
      - duc_mobilenet.py
      - __init__.py
      - target_generator.py
      - center_net.py
    - vgg.py
    - quantized
      - ssd_512_vgg16_atrous_voc_int8-symbol.json
      - mobilenet1.0_int8-symbol.json
      - ssd_300_vgg16_atrous_voc_int8-symbol.json
      - __init__.py
    - resnetv1b.py
    - alexnet.py
    - icnet.py
    - rcnn
      - faster_rcnn
        predefined_models.py
        rcnn_target.py
        data_parallel.py
        faster_rcnn.py
        __init__.py
      - mask_rcnn
        predefined_models.py
        rcnn_target.py
        data_parallel.py
        __init__.py
        mask_rcnn.py
      - __init__.py
      - rcnn.py
      - rpn
        anchor.py
        rpn.py
        rpn_target.py
        bbox_clip.py
        proposal.py
        __init__.py
        cython_rpn_target.pyx
    - fastscnn.py
    - resnest.py
    - mobilenetv3.py
    - pruned_resnet
      - resnet50_v1d_8.8x.json
      - resnetv1b_pruned.py
      - resnet101_v1d_1.9x.json
      - resnet18_v1b_2.6x.json
      - resnet50_v1d_5.9x.json
      - resnet50_v1d_3.6x.json
      - __init__.py
      - resnet50_v1d_1.8x.json
      - resnet101_v1d_2.2x.json
    - mobilenet.py
    - segbase.py
    - fcn.py
    - hrnet.py
    - cifarresnext.py
    - squeezenet.py
    - residual_attentionnet.py
    - deeplabv3_plus.py
    - xception.py
    - se_resnet.py
    - yolo
      - yolo3.py
      - yolo_target.py
      - darknet.py
      - __init__.py
    - pspnet.py
    - attention.py
    - cifarresnet.py
    - resnet.py
    - nasnet.py
    - wideresnet.py
    - siamrpn
      - siam_net.py
      - siam_alexnet.py
      - siamrpn_tracker.py
      - siam_rpn.py
      - __init__.py
    - simple_pose
      - pose_target.py
      - simple_pose_resnet.py
      - __init__.py
      - mobile_pose.py
    - googlenet.py
    - model_zoo.py
    - densenet.py
    - deeplabv3b_plus.py
    - dla.py
    - action_recognition
      - actionrec_inceptionv1.py
      - i3d_inceptionv3.py
      - actionrec_vgg16.py
      - p3d.py
      - i3d_resnet.py
      - c3d.py
      - slowfast.py
      - actionrec_resnetv1b.py
      - i3d_inceptionv1.py
      - __init__.py
      - actionrec_inceptionv3.py
      - r2plus1d.py
      - non_local.py
    - __init__.py
    - model_store.py
    - cifarwideresnet.py
    - danet.py
    - resnext.py
    - deeplabv3.py
    - inception.py
    - alpha_pose
      - __init__.py
      - utils.py
      - fast_pose.py
    - ssd
      - anchor.py
      - resnet_v1b_ssd.py
      - target.py
      - vgg_atrous.py
      - __init__.py
      - presets.py
      - ssd.py
    - senet.py
- .gitignore
- Jenkinsfile
- docs
  - install.rst
  - Makefile
  - slides.md
  - .nojekyll
  - Doxyfile
  - api
    - nn.rst
    - data.transforms.rst
    - data.datasets.rst
    - utils.rst
    - model_zoo.rst
    - loss.rst
    - data.batchify.rst
    - index.rst
  - how_to
    - support.rst
    - contribute.md
    - index.rst
  - build.yml
  - README.txt
  - tutorials
    - datasets
      - kinetics400.py
      - ade20k.py
      - hmdb51.py
      - mscoco.py
      - ucf101.py
      - README.txt
      - detection_custom.py
      - cityscapes.py
      - somethingsomethingv2.py
      - pascal_voc.py
      - mhp_v1.py
      - imagenet.py
      - .gitignore
      - recordio.py
    - instance
      - demo_mask_rcnn.py
      - train_mask_rcnn_coco.py
      - README.txt
      - .gitignore
    - distributed
      - README.txt
      - distributed_slowfast.py
    - segmentation
      - demo_deeplab.py
      - train_fcn.py
      - demo_icnet.py
      - demo_psp.py
      - README.txt
      - demo_fcn.py
      - train_psp.py
      - .gitignore
      - voc_sota.py
    - detection
      - demo_ssd.py
      - skip_fintune.py
      - demo_webcam.py
      - train_yolo_v3.py
      - demo_jetson.py
      - train_ssd_voc.py
      - README.txt
      - demo_center_net.py
      - train_ssd_advanced.py
      - finetune_detection.py
      - demo_faster_rcnn.py
      - demo_yolo.py
      - .gitignore
      - train_faster_rcnn_voc.py
    - classification
      - dive_deep_cifar10.py
      - dive_deep_imagenet.py
      - demo_cifar10.py
      - transfer_learning_minc.py
      - README.txt
      - demo_imagenet.py
    - pose
      - demo_alpha_pose.py
      - dive_deep_simple_pose.py
      - demo_simple_pose.py
      - README.txt
      - cam_demo.py
    - deployment
      - cpp_inference.py
      - export_network.py
      - README.txt
      - int8_inference.py
      - .gitignore
    - action_recognition
      - demo_slowfast_kinetics400.py
      - feat_custom.py
      - demo_i3d_kinetics400.py
      - dive_deep_i3d_kinetics400.py
      - decord_loader.py
      - README.txt
      - dive_deep_slowfast_kinetics400.py
      - finetune_custom.py
      - demo_tsn_ucf101.py
      - dive_deep_tsn_ucf101.py
      - demo_custom.py
    - index.rst
    - tracking
      - demo_SiamRPN.py
      - README.txt
  - contents.rst
  - install
    - install-include.rst
    - install-more.rst
  - conf.py
  - model_zoo
    - pose.rst
    - detection.rst
    - classification.rst
    - action_recognition.rst
    - index.rst
    - segmentation.rst
  - .gitignore
  - _templates
    - layout.html
    - index.html
  - _static
    - install-options.js
    - logos
      - embed.html
    - applications.html
    - gluon-logo.svg
    - hidebib.js
    - apache2.svg
    - google_analytics.js
    - imagenet_banner.jpeg
    - js
      - jquery.min.js
      - slides.min.js
    - gluon.ico
    - css
      - material_icon.css
      - slides.min.css
      - custom.css
    - pose-estimation.svg
    - assets
      - svg
        video-icon.svg
        icons.svg
        video-icon-dark.svg
        play.svg
      - img
        background
- MANIFEST.in

"""this script is used to prepare DET dataset for tracking,
which is the object detection task of the Large Scale Visual Recognition Challenge 2015 (ILSVRC2015).
Code adapted from https://github.com/STVIR/pysot"""
import argparse
import tarfile
import os
import glob
try:
    import xml.etree.cElementTree as ET
except ImportError:
    import xml.etree.ElementTree as ET
import json
import time
from concurrent import futures
import numpy as np
from gluoncv.utils.filesystem import try_import_cv2
from gluoncv.utils import download, makedirs
from gluoncv.utils.data.tracking import crop_like_SiamFC, printProgress

def parse_args():
    """Parse the command-line options used to prepare the DET dataset.

    Returns
    -------
    argparse.Namespace
        Holds ``download_dir`` (with a leading ``~`` expanded),
        ``instance_size`` and ``num_threads``.
    """
    arg_parser = argparse.ArgumentParser(
        description='Download DET dataset and prepare for tracking')
    # One row per supported option: (flag, type, default, help text).
    option_specs = (
        ('--download-dir', str, '~/.mxnet/datasets/det/', 'dataset directory on disk'),
        ('--instance-size', int, 511, 'instance image size'),
        ('--num-threads', int, 12, 'threads number'),
    )
    for flag, value_type, default_value, help_text in option_specs:
        arg_parser.add_argument(flag, type=value_type, default=default_value, help=help_text)
    parsed = arg_parser.parse_args()
    # Expand "~" so later os.path calls receive a real directory path.
    parsed.download_dir = os.path.expanduser(parsed.download_dir)
    return parsed

def download_det(args, overwrite=False):
    """Download the DET archive and unpack it under ``args.download_dir``.

    After extraction, an ``ILSVRC2015`` directory found in the download
    directory is renamed to ``ILSVRC``, which is the name the other steps of
    this script look for.

    Parameters
    ----------
    args : argparse.Namespace
        Parsed options; only ``download_dir`` is read.
    overwrite : bool, default False
        Forwarded to ``download``. When it is False and the renamed ``ILSVRC``
        directory already exists, extraction is skipped so the script can be
        re-run. When it is True the archive is always extracted again; the
        final ``os.rename`` may then raise ``OSError`` if an ``ILSVRC``
        directory from an earlier run is still present.
    """
    _DOWNLOAD_URLS = [
        ('http://image-net.org/image/ILSVRC2015/ILSVRC2015_DET.tar.gz',
         'cbf602d89f2877fa8843392a1ffde03450a18d38'),
    ]
    extracted_dir = os.path.join(args.download_dir, 'ILSVRC2015')
    target_dir = os.path.join(args.download_dir, 'ILSVRC')
    if not os.path.isdir(args.download_dir):
        makedirs(args.download_dir)
    for url, checksum in _DOWNLOAD_URLS:
        filename = download(url, path=args.download_dir, overwrite=overwrite, sha1_hash=checksum)
        print(' dataset has already download completed')
        if os.path.isdir(target_dir) and not overwrite:
            # A previous run already extracted and renamed the data. Extracting
            # again would recreate ILSVRC2015 and make the rename below fail
            # because its destination exists.
            continue
        with tarfile.open(filename) as tar:
            tar.extractall(path=args.download_dir)
    if os.path.isdir(extracted_dir):
        os.rename(extracted_dir, target_dir)

def crop_xml(args, xml, sub_set_crop_path, instance_size=511):
    """
    Dataset curation: crop one image around every object annotated in ``xml``.

    For each ``object`` element, the two crops returned by ``crop_like_SiamFC``
    are written to ``<sub_set_crop_path>/<xml stem>/`` as
    ``000000.<idx>.z.jpg`` and ``000000.<idx>.x.jpg``.

    Parameters
    ----------
    args: argparse.Namespace, parsed options (kept for interface
        compatibility; output paths are derived from ``sub_set_crop_path``)
    xml: str, path of the annotation xml file
    sub_set_crop_path: str, directory that receives this subset's crops
    instance_size: int, instance_size forwarded to ``crop_like_SiamFC``

    Raises
    ------
    IOError
        If the image that belongs to ``xml`` cannot be read.
    """
    cv2 = try_import_cv2()
    objects = ET.parse(xml).findall('object')

    frame_crop_base_path = os.path.join(sub_set_crop_path, xml.split('/')[-1].split('.')[0])
    if not os.path.isdir(frame_crop_base_path):
        makedirs(frame_crop_base_path)

    # Derive the image path from the annotation path. Only the file extension
    # and the last 'Annotations' path part are rewritten, so a download
    # directory whose name contains 'xml' or 'Annotations' is left intact.
    stem, _ = os.path.splitext(xml)
    img_path = 'Data'.join((stem + '.JPEG').rsplit('Annotations', 1))
    im = cv2.imread(img_path)
    if im is None:
        # cv2.imread signals a missing/unreadable file by returning None.
        raise IOError('cannot read image {} for annotation {}'.format(img_path, xml))
    # Per-channel mean colour, used as padding by the crop helper.
    avg_chans = np.mean(im, axis=(0, 1))

    for obj_idx, object_iter in enumerate(objects):
        bndbox = object_iter.find('bndbox')
        bbox = [int(bndbox.find('xmin').text), int(bndbox.find('ymin').text),
                int(bndbox.find('xmax').text), int(bndbox.find('ymax').text)]
        z, x = crop_like_SiamFC(im, bbox, instance_size=instance_size, padding=avg_chans)
        # Write into the directory created above. Prefixing args.download_dir
        # again would point at a non-existent directory whenever the download
        # directory is a relative path.
        cv2.imwrite(os.path.join(frame_crop_base_path, '{:06d}.{:02d}.z.jpg'.format(0, obj_idx)), z)
        cv2.imwrite(os.path.join(frame_crop_base_path, '{:06d}.{:02d}.x.jpg'.format(0, obj_idx)), x)

def par_crop(args):
    """
    Dataset curation: crop every annotated image of every subset in parallel.

    Annotation files are collected from
    ``<download_dir>/ILSVRC/Annotations/DET/train/<subset>`` and each one is
    handed to ``crop_xml`` in a process pool of ``args.num_threads`` workers.
    Crops go to ``<download_dir>/crop<instance_size>/<subset>``.

    Parameters
    ----------
    args : argparse.Namespace
        Parsed options; ``download_dir``, ``instance_size`` and ``num_threads``
        are read.
    """
    crop_path = os.path.join(args.download_dir, './crop{:d}'.format(args.instance_size))
    if not os.path.isdir(crop_path):
        makedirs(crop_path)
    VID_base_path = os.path.join(args.download_dir, './ILSVRC')
    ann_base_path = os.path.join(VID_base_path, 'Annotations/DET/train/')
    sub_sets = ('a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i')
    for sub_set in sub_sets:
        sub_set_base_path = os.path.join(ann_base_path, sub_set)
        if 'a' == sub_set:
            # Subset 'a' keeps its xml files one directory level deeper.
            xmls = sorted(glob.glob(os.path.join(sub_set_base_path, '*', '*.xml')))
        else:
            xmls = sorted(glob.glob(os.path.join(sub_set_base_path, '*.xml')))
        n_imgs = len(xmls)
        sub_set_crop_path = os.path.join(crop_path, sub_set)
        failures = []
        with futures.ProcessPoolExecutor(max_workers=args.num_threads) as executor:
            # Remember which xml each future belongs to so failures can be named.
            fs = {executor.submit(crop_xml, args, xml, sub_set_crop_path, args.instance_size): xml
                  for xml in xmls}
            # Count finished tasks from 1 so the last update reaches n_imgs.
            # NOTE(review): assumes printProgress takes a completed-task count
            # as its first argument - confirm against the helper.
            for done, f in enumerate(futures.as_completed(fs), 1):
                error = f.exception()
                if error is not None:
                    # An exception raised in a worker stays inside its future
                    # unless it is read here; collect it instead of losing it.
                    failures.append((fs[f], error))
                printProgress(done, n_imgs, prefix=sub_set, suffix='Done ', barLength=80)
        if failures:
            print('subset {}: {:d} of {:d} annotation files could not be cropped'.format(
                sub_set, len(failures), n_imgs))
            for failed_xml, error in failures[:10]:
                print('  {}: {!r}'.format(failed_xml, error))

def gen_json(args):
    """Convert the XML annotations into ``train.json`` and ``val.json``.

    Every annotation file under
    ``<download_dir>/ILSVRC/Annotations/DET/train/<subset>`` becomes one entry
    keyed ``<subset>/<xml stem>``. Each entry maps a two-digit object index to
    ``{'000000': [xmin, ymin, xmax, ymax]}``. Entries whose key contains
    ``'i/'`` (subset ``i``) are written to ``val.json``, all others to
    ``train.json``, both inside ``args.download_dir``.

    Parameters
    ----------
    args : argparse.Namespace
        Parsed options; only ``download_dir`` is read.
    """
    js = {}
    VID_base_path = os.path.join(args.download_dir, './ILSVRC')
    ann_base_path = os.path.join(VID_base_path, 'Annotations/DET/train/')
    sub_sets = ('a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i')
    for sub_set in sub_sets:
        sub_set_base_path = os.path.join(ann_base_path, sub_set)
        if 'a' == sub_set:
            # Subset 'a' keeps its xml files one directory level deeper.
            xmls = sorted(glob.glob(os.path.join(sub_set_base_path, '*', '*.xml')))
        else:
            xmls = sorted(glob.glob(os.path.join(sub_set_base_path, '*.xml')))
        n_imgs = len(xmls)
        for f, xml in enumerate(xmls):
            print('subset: {} frame id: {:08d} / {:08d}'.format(sub_set, f, n_imgs))
            objects = ET.parse(xml).findall('object')

            video = os.path.join(sub_set, xml.split('/')[-1].split('.')[0])

            for obj_idx, object_iter in enumerate(objects):
                bndbox = object_iter.find('bndbox')
                bbox = [int(bndbox.find(tag).text) for tag in ('xmin', 'ymin', 'xmax', 'ymax')]
                # Each image is treated as a one-frame video, so the frame id is always 0.
                frame = '%06d' % (0)
                obj = '%02d' % (obj_idx)
                js.setdefault(video, {}).setdefault(obj, {})[frame] = bbox

    train = {k: v for (k, v) in js.items() if 'i/' not in k}
    val = {k: v for (k, v) in js.items() if 'i/' in k}
    # Context managers make sure both files are flushed and closed.
    with open(os.path.join(args.download_dir, 'train.json'), 'w') as train_file:
        json.dump(train, train_file, indent=4, sort_keys=True)
    with open(os.path.join(args.download_dir, 'val.json'), 'w') as val_file:
        json.dump(val, val_file, indent=4, sort_keys=True)

def symlink(args):
    """Create the short subset links ``a`` .. ``i`` inside the DET tree.

    Under both ``ILSVRC/Annotations/DET`` and ``ILSVRC/Data/DET`` (relative to
    ``args.download_dir``) the following links are created in ``train/``:
    ``a`` -> ``train/ILSVRC2013_train``, ``b`` .. ``h`` ->
    ``train/ILSVRC2014_train_0000`` .. ``_0006`` and ``i`` -> ``val``.

    Parameters
    ----------
    args : argparse.Namespace
        Parsed options; only ``download_dir`` is read.
    """
    def per_symlink(src, dst):
        """Link ``dst`` to ``src``; both are relative to the download dir."""
        # A relative link target is resolved against the directory holding the
        # link, not the working directory. Store an absolute target so the
        # link stays valid when download_dir is a relative path.
        src = os.path.abspath(os.path.join(args.download_dir, src))
        dst = os.path.join(args.download_dir, dst)
        if os.path.isdir(dst):
            return
        if os.path.islink(dst):
            # A link that does not resolve to a directory (e.g. left dangling
            # by an earlier run) would make os.symlink fail; replace it.
            os.remove(dst)
        os.symlink(src, dst)

    # (link name, source directory relative to the DET root)
    subset_sources = (
        ('a', 'train/ILSVRC2013_train'),
        ('b', 'train/ILSVRC2014_train_0000'),
        ('c', 'train/ILSVRC2014_train_0001'),
        ('d', 'train/ILSVRC2014_train_0002'),
        ('e', 'train/ILSVRC2014_train_0003'),
        ('f', 'train/ILSVRC2014_train_0004'),
        ('g', 'train/ILSVRC2014_train_0005'),
        ('h', 'train/ILSVRC2014_train_0006'),
        ('i', 'val'),
    )
    for kind in ('Annotations', 'Data'):
        det_root = 'ILSVRC/{}/DET'.format(kind)
        for subset, source in subset_sources:
            per_symlink('{}/{}'.format(det_root, source),
                        '{}/train/{}'.format(det_root, subset))


def main(args):
    """Run the DET preparation steps in order: download, link, crop, index.

    Parameters
    ----------
    args : argparse.Namespace
        Options produced by ``parse_args``; passed unchanged to every step.
    """
    # Each stage is paired with the message printed once it returns
    # (None for a stage that reports nothing).
    pipeline = (
        (download_det, 'DET dataset has already download completed'),
        (symlink, None),
        (par_crop, 'DET dataset has already crop completed'),
        (gen_json, 'DET dataset has already generat completed'),
    )
    for stage, done_message in pipeline:
        stage(args)
        if done_message is not None:
            print(done_message)

if __name__ == '__main__':
    # Time the whole run and report it as whole minutes plus seconds.
    since = time.time()
    args = parse_args()
    main(args)
    time_elapsed = time.time() - since
    minutes, seconds = divmod(time_elapsed, 60)
    print('Total complete in {:.0f}m {:.0f}s'.format(minutes, seconds))