remote_sensing_object_detection_2019-master
- environment.yaml
- demo
  - predictor.py
  - polygon_wrapper.py
  - __pycache__
    - predictor.cpython-36.pyc
    - __init__.cpython-36.pyc
  - link_boxes.py
  - RRPN_Demo.py
  - rrpn_e2e_infer.py
  - webcam.py
  - ICDAR_demo.py
  - __init__.py
  - README.md
- libs
  - __pycache__
    - __init__.cpython-36.pyc
    - __init__.cpython-37.pyc
  - __init__.pyc
  - setup.py
  - __init__.py
  - box_utils
    - iou_rotate.py
    - rbbox_overlaps.pyx
    - boxes_utils.py
    - build
      - temp.linux-x86_64-3.6
        rotate_polygon_nms_kernel.o
        rbbox_overlaps_kernel.o
    - __pycache__
      - __init__.cpython-36.pyc
    - show_box_in_tensor.pyc
    - rotate_polygon_nms_kernel.cu
    - boxes_utils.pyc
    - tf_ops.py
    - iou_cpu.pyx
    - rotate_polygon_nms.pyx
    - iou.py
    - __init__.pyc
    - coordinate_convert.py
    - rotate_gpu_nms.hpp
    - cython_utils
      - nms.pyx
      - Makefile
      - build
        temp.linux-x86_64-3.6
      - __init__.pyc
      - setup.py
      - __init__.py
      - bbox.pyx
    - setup.py
    - encode_and_decode.pyc
    - anchor_utils.pyc
    - __init__.py
    - draw_box_in_img.py
    - nms_rotate.pyc
    - rbbox_overlaps_kernel.cu
    - show_box_in_tensor.py
    - nms.py
    - rotate_polygon_nms.hpp
    - nms_rotate.py
    - rbbox_overlaps.hpp
    - encode_and_decode.py
    - coordinate_convert.pyc
    - anchor_utils.py
- dist
- LICENSE
- RRPN.egg-info
  - top_level.txt
  - dependency_links.txt
  - PKG-INFO
  - SOURCES.txt
- screenshot
- maskrcnn_benchmark.egg-info
  - top_level.txt
  - dependency_links.txt
  - PKG-INFO
  - SOURCES.txt
- rotation
  - rotate_cpython_nms.pyx
  - rotate_gpu_nms.pyx
  - rbbox_overlaps.pyx
  - __pycache__
    - __init__.cpython-36.pyc
  - rotate_polygon_nms_kernel.cu
  - rotate_polygon_nms.pyx
  - rotate_circle_nms.pyx
  - rotate_nms_kernel.cu
  - rotate_gpu_nms.hpp
  - __init__.py
  - rbbox_overlaps_kernel.cu
  - rotate_cpu_nms.py
  - rotate_polygon_nms.hpp
  - rbbox_overlaps.hpp
  - rotate_cython_nms.pyx
- setup.py
- docker
  - docker-jupyter
    - jupyter_notebook_config.py
    - Dockerfile
  - Dockerfile
- configs
  - pascal_voc
    - e2e_faster_rcnn_R_50_C4_1x_4_gpu_voc.yaml
    - e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml
    - e2e_faster_rcnn_R_50_C4_1x_1_gpu_voc.yaml
  - e2e_rrpn_R_50_C4_1x_ICDAR13_15_trial.yaml
  - e2e_mask_rcnn_R_50_FPN_1x.yaml
  - e2e_faster_rcnn_R_50_C4_1x_ICDAR13.yaml
  - quick_schedules
    - rpn_R_50_FPN_quick.yaml
    - e2e_mask_rcnn_R_50_FPN_quick.yaml
    - e2e_faster_rcnn_R_50_C4_quick.yaml
    - rpn_R_50_C4_quick.yaml
    - e2e_mask_rcnn_X_101_32x8d_FPN_quick.yaml
    - e2e_faster_rcnn_X_101_32x8d_FPN_quick.yaml
    - e2e_faster_rcnn_R_50_FPN_quick.yaml
    - e2e_mask_rcnn_R_50_C4_quick.yaml
  - e2e_mask_rcnn_R_50_C4_1x.yaml
  - e2e_faster_rcnn_R_50_C4_1x.yaml
  - e2e_faster_rcnn_R_101_FPN_1x.yaml
  - rrpn
    - e2e_rrpn_R_50_C4_1x_ICDAR13_15_17_trial.yaml
    - e2e_rrpn_R_50_C4_1x_ICDAR13_15_17_trial_again_test.yaml
    - e2e_rrpn_X_101_32x8d_FPN_1x_DOTA.yaml
  - e2e_faster_rcnn_R_50_C4_1x_ICDAR13_test.yaml
  - caffe2
    - e2e_faster_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml
    - e2e_faster_rcnn_R_101_FPN_1x_caffe2.yaml
    - e2e_mask_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml
    - e2e_faster_rcnn_R_50_C4_1x_caffe2.yaml
    - e2e_faster_rcnn_R_50_FPN_1x_caffe2.yaml
    - e2e_mask_rcnn_R_101_FPN_1x_caffe2.yaml
    - e2e_mask_rcnn_R_50_C4_1x_caffe2.yaml
    - e2e_mask_rcnn_R_50_FPN_1x_caffe2.yaml
  - e2e_faster_rcnn_R_50_FPN_1x.yaml
  - e2e_faster_rcnn_X_101_32x8d_FPN_1x.yaml
  - e2e_mask_rcnn_R_101_FPN_1x.yaml
  - cityscapes
    - e2e_faster_rcnn_R_50_FPN_1x_cocostyle.yaml
    - e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml
  - gn_baselines
    - scratch_e2e_faster_rcnn_R_50_FPN_3x_gn.yaml
    - scratch_e2e_faster_rcnn_R_50_FPN_Xconv1fc_3x_gn.yaml
    - e2e_mask_rcnn_R_50_FPN_Xconv1fc_1x_gn.yaml
    - scratch_e2e_mask_rcnn_R_50_FPN_Xconv1fc_3x_gn.yaml
    - e2e_faster_rcnn_R_50_FPN_Xconv1fc_1x_gn.yaml
    - e2e_faster_rcnn_R_50_FPN_1x_gn.yaml
    - scratch_e2e_mask_rcnn_R_50_FPN_3x_gn.yaml
    - e2e_mask_rcnn_R_50_FPN_1x_gn.yaml
  - e2e_mask_rcnn_X_101_32x8d_FPN_1x.yaml
  - e2e_rrpn_R_50_C4_1x_ICDAR13_toy.yaml
  - e2e_rrpn_R_50_C4_1x_ICDAR13_test.yaml
- README.md
- MODEL_ZOO.md
- tests
  - test_data_samplers.py
  - test_metric_logger.py
  - checkpoint.py
- tools
  - test_net.py
  - train_net.py
  - cityscapes
    - instances2dict_with_polygons.py
    - convert_cityscapes_to_coco.py
- rotation_setup.py
- INSTALL.md
- maskrcnn_benchmark
  - solver
    - build.py
    - lr_scheduler.py
    - __pycache__
      - build.cpython-36.pyc
      - __init__.cpython-36.pyc
      - __init__.cpython-37.pyc
      - lr_scheduler.cpython-37.pyc
      - lr_scheduler.cpython-36.pyc
      - build.cpython-37.pyc
    - __init__.py
  - utils
    - env.py
    - metric_logger.py
    - comm.py
    - c2_model_loading.py
    - __pycache__
      - miscellaneous.cpython-37.pyc
      - miscellaneous.cpython-36.pyc
      - rec_utils.cpython-37.pyc
      - registry.cpython-36.pyc
      - comm.cpython-37.pyc
      - registry.cpython-37.pyc
      - visualize.cpython-37.pyc
      - logger.cpython-37.pyc
      - c2_model_loading.cpython-36.pyc
      - comm.cpython-36.pyc
      - model_serialization.cpython-36.pyc
      - logger.cpython-36.pyc
      - metric_logger.cpython-37.pyc
      - visualize.cpython-36.pyc
      - __init__.cpython-36.pyc
      - __init__.cpython-37.pyc
      - checkpoint.cpython-37.pyc
      - cv2_util.cpython-36.pyc
      - c2_model_loading.cpython-37.pyc
      - env.cpython-37.pyc
      - model_zoo.cpython-36.pyc
      - collect_env.cpython-37.pyc
      - imports.cpython-37.pyc
      - env.cpython-36.pyc
      - collect_env.cpython-36.pyc
      - checkpoint.cpython-36.pyc
      - model_zoo.cpython-37.pyc
      - rec_utils.cpython-36.pyc
      - metric_logger.cpython-36.pyc
      - imports.cpython-36.pyc
      - model_serialization.cpython-37.pyc
    - checkpoint.py
    - logger.py
    - registry.py
    - model_zoo.py
    - __init__.py
    - README.md
    - imports.py
    - miscellaneous.py
    - visualize.py
    - cv2_util.py
    - model_serialization.py
    - collect_env.py
    - rec_utils.py
  - modeling
    - balanced_positive_negative_sampler.py
    - __pycache__
      - box_coder.cpython-37.pyc
      - registry.cpython-36.pyc
      - registry.cpython-37.pyc
      - rbox_coder.cpython-36.pyc
      - make_layers.cpython-36.pyc
      - poolers.cpython-36.pyc
      - rbox_coder.cpython-37.pyc
      - __init__.cpython-36.pyc
      - __init__.cpython-37.pyc
      - balanced_positive_negative_sampler.cpython-37.pyc
      - matcher.cpython-37.pyc
      - utils.cpython-36.pyc
      - utils.cpython-37.pyc
      - matcher.cpython-36.pyc
      - poolers.cpython-37.pyc
      - box_coder.cpython-36.pyc
      - make_layers.cpython-37.pyc
      - balanced_positive_negative_sampler.cpython-36.pyc
    - rrpn
      - __pycache__
        anchor_generator.cpython-36.pyc
        inference.cpython-36.pyc
        anchor_generator.cpython-37.pyc
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        loss.cpython-36.pyc
        loss.cpython-37.pyc
        rrpn.cpython-36.pyc
        rrpn.cpython-37.pyc
        inference.cpython-37.pyc
      - loss.py
      - rrpn.py
      - __init__.py
      - inference.py
      - anchor_generator.py
    - make_layers.py
    - detector
      - detectors.py
      - __pycache__
        generalized_rcnn.cpython-36.pyc
        generalized_rrpn_rcnn.cpython-37.pyc
        detectors.cpython-37.pyc
        __init__.cpython-36.pyc
        generalized_rrpn_rcnn.cpython-36.pyc
        __init__.cpython-37.pyc
        generalized_rcnn.cpython-37.pyc
        detectors.cpython-36.pyc
      - generalized_rcnn.py
      - __init__.py
      - generalized_rrpn_rcnn.py
    - backbone
      - backbone.py
      - __pycache__
        fpn.cpython-37.pyc
        fpn.cpython-36.pyc
        backbone.cpython-36.pyc
        resnet.cpython-36.pyc
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        backbone.cpython-37.pyc
        resnet.cpython-37.pyc
      - fpn.py
      - resnet.py
      - __init__.py
    - roi_heads
      - rmask_head
        roi_mask_feature_extractors.py
        roi_mask_predictors.py
        __pycache__
        roi_mask_predictors.cpython-36.pyc
        inference.cpython-36.pyc
        roi_mask_predictors.cpython-37.pyc
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        mask_head.cpython-37.pyc
        loss.cpython-36.pyc
        loss.cpython-37.pyc
        roi_mask_feature_extractors.cpython-37.pyc
        roi_mask_feature_extractors.cpython-36.pyc
        mask_head.cpython-36.pyc
        inference.cpython-37.pyc
        loss.py
        mask_head.py
        __init__.py
        inference.py
      - rbox_head
        __pycache__
        box_head.cpython-37.pyc
        inference.cpython-36.pyc
        roi_box_predictors.cpython-36.pyc
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        loss.cpython-36.pyc
        loss.cpython-37.pyc
        roi_box_predictors.cpython-37.pyc
        box_head.cpython-36.pyc
        roi_box_feature_extractors.cpython-36.pyc
        roi_box_feature_extractors.cpython-37.pyc
        inference.cpython-37.pyc
        loss.py
        box_head.py
        __init__.py
        inference.py
        roi_box_feature_extractors.py
        roi_box_predictors.py
      - __pycache__
        roi_heads.cpython-36.pyc
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        roi_heads.cpython-37.pyc
        rroi_heads.cpython-36.pyc
        rroi_heads.cpython-37.pyc
      - roi_heads.py
      - rroi_heads.py
      - mask_head
        roi_mask_feature_extractors.py
        roi_mask_predictors.py
        __pycache__
        roi_mask_predictors.cpython-36.pyc
        inference.cpython-36.pyc
        roi_mask_predictors.cpython-37.pyc
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        mask_head.cpython-37.pyc
        loss.cpython-36.pyc
        loss.cpython-37.pyc
        roi_mask_feature_extractors.cpython-37.pyc
        roi_mask_feature_extractors.cpython-36.pyc
        mask_head.cpython-36.pyc
        inference.cpython-37.pyc
        loss.py
        mask_head.py
        __init__.py
        inference.py
      - rec_head
        roi_rec_feature_extractors.py
        rec_head.py
        __pycache__
        inference.cpython-36.pyc
        roi_rec_feature_extractors.cpython-36.pyc
        roi_rec_feature_extractors.cpython-37.pyc
        roi_rec_predictors.cpython-36.pyc
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        loss.cpython-36.pyc
        rec_head.cpython-37.pyc
        loss.cpython-37.pyc
        rec_head.cpython-36.pyc
        inference.cpython-37.pyc
        roi_rec_predictors.cpython-37.pyc
        loss.py
        roi_rec_predictors.py
        __init__.py
        inference.py
      - __init__.py
      - box_head
        __pycache__
        box_head.cpython-37.pyc
        inference.cpython-36.pyc
        roi_box_predictors.cpython-36.pyc
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        loss.cpython-36.pyc
        loss.cpython-37.pyc
        roi_box_predictors.cpython-37.pyc
        box_head.cpython-36.pyc
        roi_box_feature_extractors.cpython-36.pyc
        roi_box_feature_extractors.cpython-37.pyc
        inference.cpython-37.pyc
        loss.py
        box_head.py
        __init__.py
        inference.py
        roi_box_feature_extractors.py
        roi_box_predictors.py
    - registry.py
    - matcher.py
    - poolers.py
    - box_coder.py
    - __init__.py
    - arpn
      - rpn.py
      - loss.py
      - __init__.py
      - inference.py
      - anchor_generator.py
    - utils.py
    - rbox_coder.py
    - rpn
      - __pycache__
        anchor_generator.cpython-36.pyc
        inference.cpython-36.pyc
        rpn.cpython-37.pyc
        anchor_generator.cpython-37.pyc
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        loss.cpython-36.pyc
        loss.cpython-37.pyc
        rpn.cpython-36.pyc
        inference.cpython-37.pyc
      - rpn.py
      - loss.py
      - __init__.py
      - inference.py
      - anchor_generator.py
  - layers
    - roi_align.py
    - misc.py
    - __pycache__
      - smooth_l1_loss.cpython-36.pyc
      - roi_pool.cpython-36.pyc
      - __init__.cpython-36.pyc
      - __init__.cpython-37.pyc
      - misc.cpython-37.pyc
      - rroi_align.cpython-37.pyc
      - smooth_l1_loss.cpython-37.pyc
      - roi_pool.cpython-37.pyc
      - roi_align.cpython-36.pyc
      - batch_norm.cpython-36.pyc
      - rroi_align.cpython-36.pyc
      - roi_align.cpython-37.pyc
      - batch_norm.cpython-37.pyc
      - nms.cpython-37.pyc
      - nms.cpython-36.pyc
      - misc.cpython-36.pyc
    - batch_norm.py
    - roi_pool.py
    - _utils.py
    - smooth_l1_loss.py
    - __init__.py
    - rroi_align.py
    - nms.py
    - rroi_pool.py
  - __pycache__
    - __init__.cpython-36.pyc
    - __init__.cpython-37.pyc
  - structures
    - bounding_box.py
    - __pycache__
      - segmentation_for_rbox.cpython-36.pyc
      - bounding_box.cpython-37.pyc
      - image_list.cpython-36.pyc
      - segmentation_for_rbox.cpython-37.pyc
      - rboxlist_ops.cpython-37.pyc
      - __init__.cpython-36.pyc
      - __init__.cpython-37.pyc
      - boxlist_ops.cpython-36.pyc
      - image_list.cpython-37.pyc
      - segmentation_mask.cpython-36.pyc
      - bounding_box.cpython-36.pyc
      - boxlist_ops.cpython-37.pyc
      - segmentation_mask.cpython-37.pyc
      - rboxlist_ops.cpython-36.pyc
    - segmentation_for_rbox.py
    - segmentation_mask.py
    - rboxlist_ops.py
    - __init__.py
    - boxlist_ops.py
    - image_list.py
  - config
    - paths_catalog.py
    - __pycache__
      - paths_catalog.cpython-37.pyc
      - __init__.cpython-36.pyc
      - __init__.cpython-37.pyc
      - paths_catalog.cpython-36.pyc
      - defaults.cpython-36.pyc
      - defaults.cpython-37.pyc
    - __init__.py
    - defaults.py
  - engine
    - __pycache__
      - inference.cpython-36.pyc
      - trainer.cpython-36.pyc
      - __init__.cpython-36.pyc
      - __init__.cpython-37.pyc
      - trainer.cpython-37.pyc
      - inference.cpython-37.pyc
    - __init__.py
    - inference.py
    - trainer.py
  - data
    - build.py
    - datasets
      - coco.py
      - rrpn_e2e_series.py
      - concat_dataset.py
      - __pycache__
        coco.cpython-37.pyc
        rotation_mask_datasets.cpython-36.pyc
        rotation_series.cpython-36.pyc
        rotation_mask_datasets.cpython-37.pyc
        rrpn_e2e_series.cpython-37.pyc
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        voc.cpython-37.pyc
        rotation_series.cpython-37.pyc
        voc.cpython-36.pyc
        icdar_series.cpython-37.pyc
        rrpn_e2e_series.cpython-36.pyc
        coco.cpython-36.pyc
        concat_dataset.cpython-36.pyc
        icdar_series.cpython-36.pyc
        concat_dataset.cpython-37.pyc
      - list_dataset.py
      - rotation_mask_datasets.py
      - icdar_series.py
      - evaluation
        __pycache__
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        __init__.py
        coco
        coco_eval.py
        __pycache__
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        coco_eval.cpython-37.pyc
        coco_eval.cpython-36.pyc
        __init__.py
        voc
        __pycache__
        voc_eval.cpython-37.pyc
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        voc_eval.cpython-36.pyc
        voc_eval.py
        __init__.py
      - __init__.py
      - voc.py
      - coco_origin.py
      - rotation_series.py
    - __pycache__
      - collate_batch.cpython-36.pyc
      - collate_batch.cpython-37.pyc
      - build.cpython-36.pyc
      - __init__.cpython-36.pyc
      - __init__.cpython-37.pyc
      - build.cpython-37.pyc
    - icdar_series.py
    - collate_batch.py
    - __init__.py
    - README.md
    - samplers
      - __pycache__
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        iteration_based_batch_sampler.cpython-37.pyc
        distributed.cpython-37.pyc
        iteration_based_batch_sampler.cpython-36.pyc
        grouped_batch_sampler.cpython-36.pyc
        distributed.cpython-36.pyc
        grouped_batch_sampler.cpython-37.pyc
      - distributed.py
      - iteration_based_batch_sampler.py
      - grouped_batch_sampler.py
      - __init__.py
    - transforms
      - build.py
      - __pycache__
        transforms.cpython-37.pyc
        transforms.cpython-36.pyc
        build.cpython-36.pyc
        __init__.cpython-36.pyc
        __init__.cpython-37.pyc
        build.cpython-37.pyc
      - __init__.py
      - transforms.py
  - __init__.py
  - csrc
    - ROIAlign.h
    - cuda
      - ROIPool_cuda.cu
      - ROIAlign_cuda.cu
      - vision.h
      - nms.cu
      - RROIAlign_cuda.cu
    - ROIPool.h
    - cpu
      - vision.h
      - ROIAlign_cpu.cpp
      - nms_cpu.cpp
    - RROIAlign.h
    - vision.cpp
    - nms.h

2019年遥感图像稀疏表征与智能分析竞赛 - 目标检测主题

比赛官网： http://rscup.bjxintong.com.cn/#/theme/2

使用RRPN模型，ResNeXt-101-FPN作为backbone,mAP达到0.336（单模，由于最后时间不够未加任何trick）。模型主要参考：https://github.com/mjq11302010044/RRPN_pytorch ，需要针对本项目进行一定的修改。

环境搭建

# first, make sure that your conda is set up properly with the right environment
# for that, check that `which conda`, `which pip` and `which python` point to the
# right path. From a clean conda env, this is what you need to do
conda create -n rrpn_pytorch python=3.6
conda activate rrpn_pytorch

# this installs the right pip and dependencies for the fresh python
conda install ipython

# maskrcnn_benchmark and coco api dependencies
# 可以先用 which pip 确认 pip 属于当前环境
pip install ninja yacs cython matplotlib tqdm opencv-python

# follow PyTorch installation in https://pytorch.org/get-started/locally
# 注意：这里一定要写 =1.0 或 1.1，否则默认安装 1.2 版本，后面会出现一堆问题。
# cudatoolkit 的版本可以用 nvcc -V 查看 CUDA 编译器的版本，这两个最好一致！
# 另外注意：如果是 RTX 等图灵架构系列显卡，一定不要用 9.0 版本的 cudatoolkit，必须重装 10.0，否则后面执行 train_net.py 时会报错。
conda install -c pytorch pytorch-nightly=1.0 torchvision=0.2.1 cudatoolkit=10.0

# install pycocotools
cd ~/github
git clone https://github.com/cocodataset/cocoapi.git
cd cocoapi/PythonAPI
python setup.py build_ext install

# install RRPN
git clone https://github.com/clw5180/remote_sensing_object_detection_2019.git
cd remote_sensing_object_detection_2019
# the following will install the lib with
# symbolic links, so that you can modify
# the files if you want and won't need to
# re-build it
# 一定注意：后期若修改了 maskrcnn_benchmark 文件夹下的代码，一定要用这条命令重新编译！目的是同步 build 文件夹下的内容
python setup.py build develop

# 后面这几步是RRPN项目特有的
python rotation_setup.py install
# 如果 python 版本不是 3.6，就把路径中的 3.6 改成对应的版本号
mv build/lib.linux-x86_64-3.6/rotation/*.so ./rotation

# or if you are on macOS
# MACOSX_DEPLOYMENT_TARGET=10.9 CC=clang CXX=clang++ python setup.py build develop

坑比较多，可以参考：

https://github.com/facebookresearch/maskrcnn-benchmark

https://zhuanlan.zhihu.com/p/64605565

数据预处理

采用800x800的crop，overlap取256，大约生成25000张图片。注意crop的同时要转换出对应的txt文件，放在labelTxt下。具体实现可以参考我的github，位置：Python_Practice/常用数据预处理脚本/超大图片crop/2019遥感_Step1_train_crop切图.py

训练

1、在maskrcnn_benchmark/config/paths_catalog.py根据个人数据集的路径进行修改

        "RRPN_train": 
        { 
            'dataset_list':
            {
                 # 这里根据个人数据集的路径进行修改，该路径下含有labelTxt和images两个文件夹，分别存放标注数据和图片
                 # 这两个文件夹的名称可以在maskrcnn_benchmark/data/datasets/rotation_series.py中修改，见最后
                'DOTA': '/media/clwclw/Elements/deep_learning/competion/2019yaogan/train/train_crop_800/'                         
            },
            "split": 'train'
        },

2、tools文件夹下，执行python train_net.py

预测

在demo文件夹下，执行python RRPN_Demo.py

主要是增加了在线crop，对bbox进行坐标变换，再用nms去掉overlap的重复检测框。

常见错误

1、invalid value encountered in greater overlaps[overlaps > 1.00000001] = 0.0 解决办法：（1）删除小于16x16（保险起见建议8x8）的bbox；（2）在代码中找到T.RandomRotation，注释掉。

其他注意事项

如果需要作一定修改，或者遇到问题，需要注意几点： 1、我这里首先在maskrcnn_benchmark/data/datasets/rotation_series.py里自己写了一个获取数据集标注的方法get_DOTA()，主要是为了将DOTA数据集（也就是本次比赛的数据集）的标注数据以一定格式读进来，即下面的im_infos；

        im_info = {
            'gt_classes': gt_classes,
            'max_classes': max_classes,
            'image': im_path,
            'boxes': gt_boxes,
            'gt_words': gt_words,
            'flipped': False,
            'gt_overlaps': overlaps,
            'seg_areas': seg_areas,
            'height': im.shape[0],
            'width': im.shape[1],
            'max_overlaps': max_overlaps,
            'rotated': True
        }
        im_infos.append(im_info)
        ...
        return im_infos

同时也会将im_infos转换成pkl格式文件，然后保存在tools/data_cache下，

    f_save_pkl = open(cache_pkl, 'wb')
    pickle.dump(im_infos, f_save_pkl)
    f_save_pkl.close()
    print("Save pickle done.")

以便下一次再训练的时候可以直接读入：

    if os.path.isfile(cache_pkl):
        return pickle.load(open(cache_pkl, 'rb'))

这里我首先删掉了50kB以上的txt及对应的images（因为比如small-vehicle这个类别，在一张800x800的切图中最多能达到2500+的个数，所以很容易就会OOM），然后过滤掉了训练集中小于8x8的bbox（会在训练中引起一些overlap的错误或loss=nan的现象，另外这么小的尺度，下采样几次之后在feature map基本就找不到了，因此也没必要保留）。

        elif "RRPN_train" in name:
            data_dir = DatasetCatalog.DATA_DIR
            attrs = DatasetCatalog.DATASETS['RRPN_train']
            args = dict(
                database=attrs["dataset_list"],
            )
            return dict(
                factory="RotationDataset",
                args=args,
            )

当然也可以将数据集转化为COCO官方提供的json格式，只需要在maskrcnn_benchmark/config/paths_catalog.py中增加如下内容：

        "DOTA_train": { 
            "img_dir": '/media/clwclw/Elements/deep_learning/competion/2019yaogan/train/train_crop_800/images/',
            "ann_file": '/media/clwclw/Elements/deep_learning/competion/2019yaogan/train/train_crop_800/train.json',
            "split": 'train'
        },

        elif "DOTA_train" in name:
            data_dir = DatasetCatalog.DATA_DIR
            attrs = DatasetCatalog.DATASETS[name]
            args = dict(
                root=os.path.join(data_dir, attrs["img_dir"]),
                ann_file=os.path.join(data_dir, attrs["ann_file"]),
            )
            return dict(
                factory="COCODataset",    # 通过官方API导入json格式数据
                args=args,
            )

此外如果使用其他数据集进行训练，还有几个地方需要修改：

1、配置文件e2e_rrpn_X_101_32x8d_FPN_1x_DOTA.yaml需要根据情况进行修改：

DATASETS:
  TRAIN: ("RRPN_train", )

    ......
  ROI_BOX_HEAD:
    NUM_CLASSES: 19 # 18类物体 + 1背景

OUTPUT_DIR: './models/DOTA/'

2、tools/train_net.py中，需要根据情况修改成自己的.yaml配置文件，如default="../configs/rrpn/e2e_rrpn_X_101_32x8d_FPN_1x_DOTA.yaml"

3、在maskrcnn_benchmark/config/paths_catalog.py中添加自己的数据集，如

"XXXX_train": {  
"img_dir":'/home/xxx/2019yaogan/train_data/images/',    
"ann_file":'/home/xxx/2019yaogan/train_data/Annotations/train.json',   
"split": 'train'
},

4、在maskrcnn_benchmark/data/datasets/rotation_series.py中需要修改的地方

def get_DOTA(mode, dataset_dir):
    DATASET_DIR = dataset_dir
    print('clw:在get_DOTA中, dataset_dir = ', dataset_dir)

    # 如果dataset_dir下存放标注数据和图片的文件夹名称不是images和labelTxt,可以在下面进行修改
    img_dir = "/images/"  
    gt_dir = "/labelTxt/"

DATASET = {
    'IC13':get_ICDAR2013,
    'IC15':get_ICDAR2015_RRC_PICK_TRAIN,
    'IC17mlt':get_ICDAR2017_mlt,
    'LSVT':get_ICDAR_LSVT_full,
    'ArT':get_ICDAR_ArT,
    'ReCTs':get_ICDAR_ReCTs_full,
    'DOTA':get_DOTA,   # 增加自己的数据集名称及对应获取数据的方法
}

class RotationDataset(torch.utils.data.Dataset):
    CLASSES = (
        "__background__ ", #"background",
        "roundabout",
        "tennis-court",
        "swimming-pool",
        "storage-tank",
        "soccer-ball-field",
        "small-vehicle",
        "ship",
        "plane",
        "large-vehicle",
        "helicopter",
        "harbor",
        "ground-track-field",
        "bridge",
        "basketball-court",
        "baseball-diamond",
        "helipad",
        "airport",
        "container-crane"  # 修改自己的类别
    )

结果如下：

这里随便写文字

写得比较仓促，如有遗漏或遇到问题欢迎提出宝贵issue，我会及时修正。欢迎star！