├── .gitignore
├── IP
    ├── experiments
    │   ├── .ipynb_checkpoints
    │   │   ├── exp_0-checkpoint.py
    │   │   ├── exp_1-checkpoint.py
    │   │   ├── exp_2-checkpoint.py
    │   │   ├── exp_3-checkpoint.py
    │   │   ├── exp_4-checkpoint.py
    │   │   ├── exp_5-checkpoint.py
    │   │   └── exp_6-checkpoint.py
    │   ├── exp_0.py
    │   ├── exp_1.py
    │   ├── exp_2.py
    │   ├── exp_3.py
    │   ├── exp_4.py
    │   ├── exp_5.py
    │   └── exp_6.py
    ├── experiments_aux
    │   ├── .ipynb_checkpoints
    │   │   ├── exp_0-checkpoint.py
    │   │   ├── exp_1-checkpoint.py
    │   │   ├── exp_2-checkpoint.py
    │   │   ├── exp_3-checkpoint.py
    │   │   ├── exp_4-checkpoint.py
    │   │   ├── exp_5-checkpoint.py
    │   │   └── exp_6-checkpoint.py
    │   ├── exp_0.py
    │   ├── exp_1.py
    │   ├── exp_2.py
    │   ├── exp_3.py
    │   ├── exp_4.py
    │   ├── exp_5.py
    │   └── exp_6.py
    ├── gen_teaser.py
    ├── models
    │   ├── __init__.py
    │   ├── graph.py
    │   ├── inception.py
    │   ├── resnet.py
    │   └── utils.py
    ├── optimize_hyperparams.py
    ├── run_ablation_experiments.py
    ├── utils
    │   ├── .ipynb_checkpoints
    │   │   ├── intersections-checkpoint.py
    │   │   ├── metrics-checkpoint.py
    │   │   ├── optimizer-checkpoint.py
    │   │   ├── optimizer_BACKUP_29_AUG-checkpoint.py
    │   │   ├── optimizer_checkpoint_JUNE-checkpoint.py
    │   │   └── utils-checkpoint.py
    │   ├── QP.py
    │   ├── __init__.py
    │   ├── intersections.py
    │   ├── metrics.py
    │   ├── optimizer.py
    │   ├── optimizer_BACKUP_29_AUG.py
    │   ├── optimizer_checkpoint.py
    │   ├── optimizer_checkpoint_JUNE.py
    │   ├── optimizer_heuristic.py
    │   ├── plotter.py
    │   └── utils.py
    └── visualize.py
├── PC_and_CE_inference
    ├── .ipynb_checkpoints
    │   └── run_experiments-checkpoint.py
    ├── README.md
    ├── _init_paths.py
    ├── datasets
    │   ├── .ipynb_checkpoints
    │   │   ├── config-checkpoint.py
    │   │   ├── junction-checkpoint.py
    │   │   └── utils-checkpoint.py
    │   ├── __init__.py
    │   ├── config.py
    │   ├── generate_cell_anchors.py
    │   ├── junction.py
    │   ├── plotter.py
    │   └── utils.py
    ├── hypes
    │   ├── 1.json
    │   ├── 2.json
    │   └── 3.json
    ├── loss
    │   ├── balance_loss.py
    │   └── normal_loss.py
    ├── main.py
    ├── model
    │   ├── __init__.py
    │   ├── graph.py
    │   ├── inception.py
    │   ├── networks
    │   │   ├── __init__.py
    │   │   ├── active
    │   │   │   ├── anchor_target_layer.py
    │   │   │   ├── bbox_transform.py
    │   │   │   ├── ee.py
    │   │   │   ├── generate_anchors.py
    │   │   │   ├── inception.py
    │   │   │   ├── inception_part.py
    │   │   │   ├── proposal_target_layer_cascade.bk.py
    │   │   │   ├── proposal_target_layer_cascade.py
    │   │   │   ├── rr.py
    │   │   │   └── stackedHG.py
    │   │   ├── generate_cell_anchors.py
    │   │   ├── inception_v2.py
    │   │   └── junction_decoder.py
    │   ├── resnet.py
    │   └── utils.py
    ├── opts.py
    ├── process_cities.py
    ├── ref.py
    ├── requirements.txt
    ├── trainer
    │   ├── .ipynb_checkpoints
    │   │   └── balance_junction_trainer-checkpoint.py
    │   ├── balance_junction_trainer.py
    │   └── junction_trainer.py
    └── utils
    │   ├── .ipynb_checkpoints
    │       └── optimizer-checkpoint.py
    │   ├── __init__.py
    │   ├── intersections.py
    │   ├── metrics.py
    │   ├── plotter.py
    │   └── utils.py
├── PE_inference
    ├── dataset
    │   ├── .ipynb_checkpoints
    │   │   └── custom_dataloader-checkpoint.py
    │   ├── __init__.py
    │   ├── custom_dataloader.py
    │   └── metrics.py
    ├── detect.py
    ├── model
    │   ├── __init__.py
    │   ├── drn.py
    │   ├── mymodel.py
    │   └── utils.py
    ├── train.py
    └── utils
    │   ├── __init__.py
    │   ├── losses.py
    │   └── utils.py
├── PR_inference
    ├── LICENSE
    ├── README.md
    ├── configs
    │   ├── .ipynb_checkpoints
    │   │   └── buildings_mask_rcnn_R_50_FPN_1x-checkpoint.yaml
    │   ├── buildings_mask_rcnn_R_50_FPN_1x.yaml
    │   ├── caffe2
    │   │   ├── e2e_faster_rcnn_R_101_FPN_1x_caffe2.yaml
    │   │   ├── e2e_faster_rcnn_R_50_C4_1x_caffe2.yaml
    │   │   ├── e2e_faster_rcnn_R_50_FPN_1x_caffe2.yaml
    │   │   ├── e2e_faster_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml
    │   │   ├── e2e_keypoint_rcnn_R_50_FPN_1x_caffe2.yaml
    │   │   ├── e2e_mask_rcnn_R_101_FPN_1x_caffe2.yaml
    │   │   ├── e2e_mask_rcnn_R_50_C4_1x_caffe2.yaml
    │   │   ├── e2e_mask_rcnn_R_50_FPN_1x_caffe2.yaml
    │   │   ├── e2e_mask_rcnn_X-152-32x8d-FPN-IN5k_1.44x_caffe2.yaml
    │   │   └── e2e_mask_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml
    │   ├── cityscapes
    │   │   ├── e2e_faster_rcnn_R_50_FPN_1x_cocostyle.yaml
    │   │   └── e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml
    │   ├── gn_baselines
    │   │   ├── README.md
    │   │   ├── e2e_faster_rcnn_R_50_FPN_1x_gn.yaml
    │   │   ├── e2e_faster_rcnn_R_50_FPN_Xconv1fc_1x_gn.yaml
    │   │   ├── e2e_mask_rcnn_R_50_FPN_1x_gn.yaml
    │   │   ├── e2e_mask_rcnn_R_50_FPN_Xconv1fc_1x_gn.yaml
    │   │   ├── scratch_e2e_faster_rcnn_R_50_FPN_3x_gn.yaml
    │   │   ├── scratch_e2e_faster_rcnn_R_50_FPN_Xconv1fc_3x_gn.yaml
    │   │   ├── scratch_e2e_mask_rcnn_R_50_FPN_3x_gn.yaml
    │   │   └── scratch_e2e_mask_rcnn_R_50_FPN_Xconv1fc_3x_gn.yaml
    │   ├── pascal_voc
    │   │   ├── e2e_faster_rcnn_R_50_C4_1x_1_gpu_voc.yaml
    │   │   ├── e2e_faster_rcnn_R_50_C4_1x_4_gpu_voc.yaml
    │   │   └── e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml
    │   ├── quick_schedules
    │   │   ├── e2e_faster_rcnn_R_50_C4_quick.yaml
    │   │   ├── e2e_faster_rcnn_R_50_FPN_quick.yaml
    │   │   ├── e2e_faster_rcnn_X_101_32x8d_FPN_quick.yaml
    │   │   ├── e2e_keypoint_rcnn_R_50_FPN_quick.yaml
    │   │   ├── e2e_mask_rcnn_R_50_C4_quick.yaml
    │   │   ├── e2e_mask_rcnn_R_50_FPN_quick.yaml
    │   │   ├── e2e_mask_rcnn_X_101_32x8d_FPN_quick.yaml
    │   │   ├── rpn_R_50_C4_quick.yaml
    │   │   └── rpn_R_50_FPN_quick.yaml
    │   └── retinanet
    │   │   ├── retinanet_R-101-FPN_1x.yaml
    │   │   ├── retinanet_R-101-FPN_P5_1x.yaml
    │   │   ├── retinanet_R-50-FPN_1x.yaml
    │   │   ├── retinanet_R-50-FPN_1x_quick.yaml
    │   │   ├── retinanet_R-50-FPN_P5_1x.yaml
    │   │   └── retinanet_X_101_32x8d_FPN_1x.yaml
    ├── docker
    │   ├── Dockerfile
    │   └── docker-jupyter
    │   │   ├── Dockerfile
    │   │   └── jupyter_notebook_config.py
    ├── inference
    │   └── buildings_val
    │   │   └── predictions.pth
    ├── last_checkpoint
    ├── maskrcnn_benchmark
    │   ├── __init__.py
    │   ├── config
    │   │   ├── .ipynb_checkpoints
    │   │   │   ├── defaults-checkpoint.py
    │   │   │   └── paths_catalog-checkpoint.py
    │   │   ├── __init__.py
    │   │   ├── defaults.py
    │   │   └── paths_catalog.py
    │   ├── csrc
    │   │   ├── ROIAlign.h
    │   │   ├── ROIPool.h
    │   │   ├── SigmoidFocalLoss.h
    │   │   ├── cpu
    │   │   │   ├── ROIAlign_cpu.cpp
    │   │   │   ├── nms_cpu.cpp
    │   │   │   └── vision.h
    │   │   ├── cuda
    │   │   │   ├── ROIAlign_cuda.cu
    │   │   │   ├── ROIPool_cuda.cu
    │   │   │   ├── SigmoidFocalLoss_cuda.cu
    │   │   │   ├── nms.cu
    │   │   │   └── vision.h
    │   │   ├── nms.h
    │   │   └── vision.cpp
    │   ├── data
    │   │   ├── .ipynb_checkpoints
    │   │   │   └── README-checkpoint.md
    │   │   ├── README.md
    │   │   ├── __init__.py
    │   │   ├── build.py
    │   │   ├── collate_batch.py
    │   │   ├── datasets
    │   │   │   ├── .ipynb_checkpoints
    │   │   │   │   └── buildings-checkpoint.py
    │   │   │   ├── __init__.py
    │   │   │   ├── buildings.py
    │   │   │   ├── coco.py
    │   │   │   ├── concat_dataset.py
    │   │   │   ├── evaluation
    │   │   │   │   ├── __init__.py
    │   │   │   │   ├── buildings
    │   │   │   │   │   ├── .ipynb_checkpoints
    │   │   │   │   │   │   └── buildings_eval-checkpoint.py
    │   │   │   │   │   ├── __init__.py
    │   │   │   │   │   └── buildings_eval.py
    │   │   │   │   ├── coco
    │   │   │   │   │   ├── __init__.py
    │   │   │   │   │   └── coco_eval.py
    │   │   │   │   └── voc
    │   │   │   │   │   ├── __init__.py
    │   │   │   │   │   └── voc_eval.py
    │   │   │   ├── list_dataset.py
    │   │   │   └── voc.py
    │   │   ├── samplers
    │   │   │   ├── __init__.py
    │   │   │   ├── distributed.py
    │   │   │   ├── grouped_batch_sampler.py
    │   │   │   └── iteration_based_batch_sampler.py
    │   │   └── transforms
    │   │   │   ├── __init__.py
    │   │   │   ├── build.py
    │   │   │   └── transforms.py
    │   ├── engine
    │   │   ├── __init__.py
    │   │   ├── inference.py
    │   │   └── trainer.py
    │   ├── layers
    │   │   ├── __init__.py
    │   │   ├── _utils.py
    │   │   ├── batch_norm.py
    │   │   ├── misc.py
    │   │   ├── nms.py
    │   │   ├── roi_align.py
    │   │   ├── roi_pool.py
    │   │   ├── sigmoid_focal_loss.py
    │   │   └── smooth_l1_loss.py
    │   ├── modeling
    │   │   ├── __init__.py
    │   │   ├── backbone
    │   │   │   ├── __init__.py
    │   │   │   ├── backbone.py
    │   │   │   ├── fbnet.py
    │   │   │   ├── fbnet_builder.py
    │   │   │   ├── fbnet_modeldef.py
    │   │   │   ├── fpn.py
    │   │   │   └── resnet.py
    │   │   ├── balanced_positive_negative_sampler.py
    │   │   ├── box_coder.py
    │   │   ├── detector
    │   │   │   ├── __init__.py
    │   │   │   ├── detectors.py
    │   │   │   └── generalized_rcnn.py
    │   │   ├── make_layers.py
    │   │   ├── matcher.py
    │   │   ├── poolers.py
    │   │   ├── registry.py
    │   │   ├── roi_heads
    │   │   │   ├── __init__.py
    │   │   │   ├── box_head
    │   │   │   │   ├── __init__.py
    │   │   │   │   ├── box_head.py
    │   │   │   │   ├── inference.py
    │   │   │   │   ├── loss.py
    │   │   │   │   ├── roi_box_feature_extractors.py
    │   │   │   │   └── roi_box_predictors.py
    │   │   │   ├── keypoint_head
    │   │   │   │   ├── __init__.py
    │   │   │   │   ├── inference.py
    │   │   │   │   ├── keypoint_head.py
    │   │   │   │   ├── loss.py
    │   │   │   │   ├── roi_keypoint_feature_extractors.py
    │   │   │   │   └── roi_keypoint_predictors.py
    │   │   │   ├── mask_head
    │   │   │   │   ├── __init__.py
    │   │   │   │   ├── inference.py
    │   │   │   │   ├── loss.py
    │   │   │   │   ├── mask_head.py
    │   │   │   │   ├── roi_mask_feature_extractors.py
    │   │   │   │   └── roi_mask_predictors.py
    │   │   │   └── roi_heads.py
    │   │   ├── rpn
    │   │   │   ├── __init__.py
    │   │   │   ├── anchor_generator.py
    │   │   │   ├── inference.py
    │   │   │   ├── loss.py
    │   │   │   ├── retinanet
    │   │   │   │   ├── __init__.py
    │   │   │   │   ├── inference.py
    │   │   │   │   ├── loss.py
    │   │   │   │   └── retinanet.py
    │   │   │   ├── rpn.py
    │   │   │   └── utils.py
    │   │   └── utils.py
    │   ├── solver
    │   │   ├── __init__.py
    │   │   ├── build.py
    │   │   └── lr_scheduler.py
    │   ├── structures
    │   │   ├── __init__.py
    │   │   ├── bounding_box.py
    │   │   ├── boxlist_ops.py
    │   │   ├── image_list.py
    │   │   ├── keypoint.py
    │   │   └── segmentation_mask.py
    │   └── utils
    │   │   ├── .ipynb_checkpoints
    │   │       └── model_serialization-checkpoint.py
    │   │   ├── README.md
    │   │   ├── __init__.py
    │   │   ├── c2_model_loading.py
    │   │   ├── checkpoint.py
    │   │   ├── collect_env.py
    │   │   ├── comm.py
    │   │   ├── cv2_util.py
    │   │   ├── env.py
    │   │   ├── imports.py
    │   │   ├── logger.py
    │   │   ├── metric_logger.py
    │   │   ├── miscellaneous.py
    │   │   ├── model_serialization.py
    │   │   ├── model_zoo.py
    │   │   ├── registry.py
    │   │   └── timer.py
    ├── requirements.txt
    ├── setup.py
    ├── tests
    │   ├── checkpoint.py
    │   ├── env_tests
    │   │   └── env.py
    │   ├── test_backbones.py
    │   ├── test_box_coder.py
    │   ├── test_configs.py
    │   ├── test_data_samplers.py
    │   ├── test_detectors.py
    │   ├── test_fbnet.py
    │   ├── test_feature_extractors.py
    │   ├── test_metric_logger.py
    │   ├── test_nms.py
    │   ├── test_predictors.py
    │   ├── test_rpn_heads.py
    │   ├── test_segmentation_mask.py
    │   └── utils.py
    └── tools
    │   ├── cityscapes
    │       ├── convert_cityscapes_to_coco.py
    │       └── instances2dict_with_polygons.py
    │   ├── test_net.py
    │   └── train_net.py
├── README.md
├── RR_inference
    ├── LICENSE
    ├── MODEL_ZOO.md
    ├── README.md
    ├── configs
    │   ├── .ipynb_checkpoints
    │   │   └── buildings_mask_rcnn_R_50_FPN_1x-checkpoint.yaml
    │   ├── buildings_mask_rcnn_R_50_FPN_1x.yaml
    │   ├── caffe2
    │   │   ├── e2e_faster_rcnn_R_101_FPN_1x_caffe2.yaml
    │   │   ├── e2e_faster_rcnn_R_50_C4_1x_caffe2.yaml
    │   │   ├── e2e_faster_rcnn_R_50_FPN_1x_caffe2.yaml
    │   │   ├── e2e_faster_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml
    │   │   ├── e2e_keypoint_rcnn_R_50_FPN_1x_caffe2.yaml
    │   │   ├── e2e_mask_rcnn_R_101_FPN_1x_caffe2.yaml
    │   │   ├── e2e_mask_rcnn_R_50_C4_1x_caffe2.yaml
    │   │   ├── e2e_mask_rcnn_R_50_FPN_1x_caffe2.yaml
    │   │   ├── e2e_mask_rcnn_X-152-32x8d-FPN-IN5k_1.44x_caffe2.yaml
    │   │   └── e2e_mask_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml
    │   ├── cityscapes
    │   │   ├── e2e_faster_rcnn_R_50_FPN_1x_cocostyle.yaml
    │   │   └── e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml
    │   ├── gn_baselines
    │   │   ├── README.md
    │   │   ├── e2e_faster_rcnn_R_50_FPN_1x_gn.yaml
    │   │   ├── e2e_faster_rcnn_R_50_FPN_Xconv1fc_1x_gn.yaml
    │   │   ├── e2e_mask_rcnn_R_50_FPN_1x_gn.yaml
    │   │   ├── e2e_mask_rcnn_R_50_FPN_Xconv1fc_1x_gn.yaml
    │   │   ├── scratch_e2e_faster_rcnn_R_50_FPN_3x_gn.yaml
    │   │   ├── scratch_e2e_faster_rcnn_R_50_FPN_Xconv1fc_3x_gn.yaml
    │   │   ├── scratch_e2e_mask_rcnn_R_50_FPN_3x_gn.yaml
    │   │   └── scratch_e2e_mask_rcnn_R_50_FPN_Xconv1fc_3x_gn.yaml
    │   ├── pascal_voc
    │   │   ├── e2e_faster_rcnn_R_50_C4_1x_1_gpu_voc.yaml
    │   │   ├── e2e_faster_rcnn_R_50_C4_1x_4_gpu_voc.yaml
    │   │   └── e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml
    │   ├── quick_schedules
    │   │   ├── e2e_faster_rcnn_R_50_C4_quick.yaml
    │   │   ├── e2e_faster_rcnn_R_50_FPN_quick.yaml
    │   │   ├── e2e_faster_rcnn_X_101_32x8d_FPN_quick.yaml
    │   │   ├── e2e_keypoint_rcnn_R_50_FPN_quick.yaml
    │   │   ├── e2e_mask_rcnn_R_50_C4_quick.yaml
    │   │   ├── e2e_mask_rcnn_R_50_FPN_quick.yaml
    │   │   ├── e2e_mask_rcnn_X_101_32x8d_FPN_quick.yaml
    │   │   ├── rpn_R_50_C4_quick.yaml
    │   │   └── rpn_R_50_FPN_quick.yaml
    │   └── retinanet
    │   │   ├── retinanet_R-101-FPN_1x.yaml
    │   │   ├── retinanet_R-101-FPN_P5_1x.yaml
    │   │   ├── retinanet_R-50-FPN_1x.yaml
    │   │   ├── retinanet_R-50-FPN_1x_quick.yaml
    │   │   ├── retinanet_R-50-FPN_P5_1x.yaml
    │   │   └── retinanet_X_101_32x8d_FPN_1x.yaml
    ├── docker
    │   ├── Dockerfile
    │   └── docker-jupyter
    │   │   ├── Dockerfile
    │   │   └── jupyter_notebook_config.py
    ├── inference
    │   └── buildings_val
    │   │   └── predictions.pth
    ├── last_checkpoint
    ├── maskrcnn_benchmark
    │   ├── .ipynb_checkpoints
    │   │   └── __init__-checkpoint.py
    │   ├── __init__.py
    │   ├── config
    │   │   ├── .ipynb_checkpoints
    │   │   │   ├── defaults-checkpoint.py
    │   │   │   └── paths_catalog-checkpoint.py
    │   │   ├── __init__.py
    │   │   ├── defaults.py
    │   │   └── paths_catalog.py
    │   ├── csrc
    │   │   ├── ROIAlign.h
    │   │   ├── ROIPool.h
    │   │   ├── SigmoidFocalLoss.h
    │   │   ├── cpu
    │   │   │   ├── ROIAlign_cpu.cpp
    │   │   │   ├── nms_cpu.cpp
    │   │   │   └── vision.h
    │   │   ├── cuda
    │   │   │   ├── ROIAlign_cuda.cu
    │   │   │   ├── ROIPool_cuda.cu
    │   │   │   ├── SigmoidFocalLoss_cuda.cu
    │   │   │   ├── nms.cu
    │   │   │   └── vision.h
    │   │   ├── nms.h
    │   │   └── vision.cpp
    │   ├── data
    │   │   ├── .ipynb_checkpoints
    │   │   │   └── README-checkpoint.md
    │   │   ├── README.md
    │   │   ├── __init__.py
    │   │   ├── build.py
    │   │   ├── collate_batch.py
    │   │   ├── datasets
    │   │   │   ├── .ipynb_checkpoints
    │   │   │   │   ├── buildings-checkpoint.py
    │   │   │   │   └── buildings_test-checkpoint.py
    │   │   │   ├── __init__.py
    │   │   │   ├── buildings _BACKUP.py
    │   │   │   ├── buildings.py
    │   │   │   ├── buildings_test.py
    │   │   │   ├── coco.py
    │   │   │   ├── concat_dataset.py
    │   │   │   ├── evaluation
    │   │   │   │   ├── __init__.py
    │   │   │   │   ├── buildings
    │   │   │   │   │   ├── .ipynb_checkpoints
    │   │   │   │   │   │   └── buildings_eval-checkpoint.py
    │   │   │   │   │   ├── __init__.py
    │   │   │   │   │   └── buildings_eval.py
    │   │   │   │   ├── coco
    │   │   │   │   │   ├── __init__.py
    │   │   │   │   │   └── coco_eval.py
    │   │   │   │   └── voc
    │   │   │   │   │   ├── __init__.py
    │   │   │   │   │   └── voc_eval.py
    │   │   │   ├── list_dataset.py
    │   │   │   └── voc.py
    │   │   ├── samplers
    │   │   │   ├── __init__.py
    │   │   │   ├── distributed.py
    │   │   │   ├── grouped_batch_sampler.py
    │   │   │   └── iteration_based_batch_sampler.py
    │   │   └── transforms
    │   │   │   ├── __init__.py
    │   │   │   ├── build.py
    │   │   │   └── transforms.py
    │   ├── engine
    │   │   ├── __init__.py
    │   │   ├── inference.py
    │   │   └── trainer.py
    │   ├── layers
    │   │   ├── __init__.py
    │   │   ├── _utils.py
    │   │   ├── batch_norm.py
    │   │   ├── misc.py
    │   │   ├── nms.py
    │   │   ├── roi_align.py
    │   │   ├── roi_pool.py
    │   │   ├── sigmoid_focal_loss.py
    │   │   └── smooth_l1_loss.py
    │   ├── modeling
    │   │   ├── __init__.py
    │   │   ├── backbone
    │   │   │   ├── .ipynb_checkpoints
    │   │   │   │   └── backbone-checkpoint.py
    │   │   │   ├── __init__.py
    │   │   │   ├── backbone.py
    │   │   │   ├── fbnet.py
    │   │   │   ├── fbnet_builder.py
    │   │   │   ├── fbnet_modeldef.py
    │   │   │   ├── fpn.py
    │   │   │   └── resnet.py
    │   │   ├── balanced_positive_negative_sampler.py
    │   │   ├── box_coder.py
    │   │   ├── detector
    │   │   │   ├── .ipynb_checkpoints
    │   │   │   │   ├── detectors-checkpoint.py
    │   │   │   │   └── generalized_rcnn-checkpoint.py
    │   │   │   ├── __init__.py
    │   │   │   ├── detectors.py
    │   │   │   └── generalized_rcnn.py
    │   │   ├── make_layers.py
    │   │   ├── matcher.py
    │   │   ├── poolers.py
    │   │   ├── registry.py
    │   │   ├── roi_heads
    │   │   │   ├── __init__.py
    │   │   │   ├── box_head
    │   │   │   │   ├── __init__.py
    │   │   │   │   ├── box_head.py
    │   │   │   │   ├── inference.py
    │   │   │   │   ├── loss.py
    │   │   │   │   ├── roi_box_feature_extractors.py
    │   │   │   │   └── roi_box_predictors.py
    │   │   │   ├── keypoint_head
    │   │   │   │   ├── __init__.py
    │   │   │   │   ├── inference.py
    │   │   │   │   ├── keypoint_head.py
    │   │   │   │   ├── loss.py
    │   │   │   │   ├── roi_keypoint_feature_extractors.py
    │   │   │   │   └── roi_keypoint_predictors.py
    │   │   │   ├── mask_head
    │   │   │   │   ├── __init__.py
    │   │   │   │   ├── inference.py
    │   │   │   │   ├── loss.py
    │   │   │   │   ├── mask_head.py
    │   │   │   │   ├── roi_mask_feature_extractors.py
    │   │   │   │   └── roi_mask_predictors.py
    │   │   │   └── roi_heads.py
    │   │   ├── rpn
    │   │   │   ├── __init__.py
    │   │   │   ├── anchor_generator.py
    │   │   │   ├── inference.py
    │   │   │   ├── loss.py
    │   │   │   ├── retinanet
    │   │   │   │   ├── __init__.py
    │   │   │   │   ├── inference.py
    │   │   │   │   ├── loss.py
    │   │   │   │   └── retinanet.py
    │   │   │   ├── rpn.py
    │   │   │   └── utils.py
    │   │   └── utils.py
    │   ├── solver
    │   │   ├── __init__.py
    │   │   ├── build.py
    │   │   └── lr_scheduler.py
    │   ├── structures
    │   │   ├── __init__.py
    │   │   ├── bounding_box.py
    │   │   ├── boxlist_ops.py
    │   │   ├── image_list.py
    │   │   ├── keypoint.py
    │   │   └── segmentation_mask.py
    │   └── utils
    │   │   ├── .ipynb_checkpoints
    │   │       ├── checkpoint-checkpoint.py
    │   │       └── model_serialization-checkpoint.py
    │   │   ├── README.md
    │   │   ├── __init__.py
    │   │   ├── c2_model_loading.py
    │   │   ├── checkpoint.py
    │   │   ├── collect_env.py
    │   │   ├── comm.py
    │   │   ├── cv2_util.py
    │   │   ├── env.py
    │   │   ├── imports.py
    │   │   ├── logger.py
    │   │   ├── metric_logger.py
    │   │   ├── miscellaneous.py
    │   │   ├── model_serialization.py
    │   │   ├── model_zoo.py
    │   │   ├── registry.py
    │   │   └── timer.py
    ├── preprocess_per_region_pair.py
    ├── requirements.txt
    ├── setup.py
    ├── tests
    │   ├── checkpoint.py
    │   ├── env_tests
    │   │   └── env.py
    │   ├── test_backbones.py
    │   ├── test_box_coder.py
    │   ├── test_configs.py
    │   ├── test_data_samplers.py
    │   ├── test_detectors.py
    │   ├── test_fbnet.py
    │   ├── test_feature_extractors.py
    │   ├── test_metric_logger.py
    │   ├── test_nms.py
    │   ├── test_predictors.py
    │   ├── test_rpn_heads.py
    │   ├── test_segmentation_mask.py
    │   └── utils.py
    └── tools
    │   ├── cityscapes
    │       ├── convert_cityscapes_to_coco.py
    │       └── instances2dict_with_polygons.py
    │   ├── test_net.py
    │   └── train_net.py
└── refs
    └── raw.jpg


/.gitignore:
--------------------------------------------------------------------------------
1 | *.so
2 | *pycache*
3 | *.pyc
4 | */.git*
5 | 


--------------------------------------------------------------------------------
/IP/experiments/.ipynb_checkpoints/exp_0-checkpoint.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Baseline - Trust on junctions orientations and optimize the number of edges
 9 | def run_experiment_0(cs, edge_map, th_filtered, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	# Run experiment
12 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
13 | 														use_junctions=True,
14 | 														thetas=th_filtered,
15 | 														angle_thresh=5,
16 | 														intersection_constraint=True,
17 | 														post_process=True)
18 | 
19 | 	# Draw output image
20 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_0.svg'.format(_id), (128, 128))
21 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
22 | 	draw_building(dwg, junctions, juncs_on, lines_on)
23 | 	dwg.save()
24 | 
25 | 	# Update metric
26 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
27 | 
28 | 	return


--------------------------------------------------------------------------------
/IP/experiments/.ipynb_checkpoints/exp_1-checkpoint.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Experiment I - Weighted edges indicator variables using edges confidence
 9 | def run_experiment_1(cs, edge_map, th_filtered, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
12 | 																use_junctions=True,
13 | 																thetas=th_filtered,
14 | 																angle_thresh=5,
15 | 																edge_threshold=0.5,
16 | 																with_edge_confidence=True,
17 | 																use_edge_classifier=False,
18 | 																edge_map_weight=10.0,
19 | 																intersection_constraint=True,
20 | 																post_process=True)
21 | 
22 | 	# Draw output image
23 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_1.svg'.format(_id), (128, 128))
24 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
25 | 	draw_building(dwg, junctions, juncs_on, lines_on)
26 | 	dwg.save()
27 | 
28 | 	# Update metric
29 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
30 | 
31 | 	return


--------------------------------------------------------------------------------
/IP/experiments/.ipynb_checkpoints/exp_2-checkpoint.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Experiment II - Weights as combined junctions and edges confidence
 9 | def run_experiment_2(cs, cs_c, edge_map, th_filtered, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	# Run experiment
12 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
13 | 																use_junctions=True,
14 | 																thetas=th_filtered,
15 | 																angle_thresh=5,
16 | 																with_corner_edge_confidence=True,
17 | 																corner_confs=cs_c,
18 | 																corner_edge_thresh=0.125,
19 | 																edge_map_weight=10.0,
20 | 																intersection_constraint=True,
21 | 																post_process=True)
22 | 
23 | 	# Draw output image
24 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_2.svg'.format(_id), (128, 128))
25 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
26 | 	draw_building(dwg, junctions, juncs_on, lines_on)
27 | 	dwg.save()
28 | 
29 | 	# Update metric
30 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
31 | 
32 | 	return metric
33 | 
34 | 


--------------------------------------------------------------------------------
/IP/experiments/.ipynb_checkpoints/exp_3-checkpoint.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Experiment III - Maximizing weighted sum of junction directions
 9 | def run_experiment_3(cs, cs_c, edge_map, th, th_c, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	# Run experiment
12 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
13 | 																use_junctions_with_var=True,
14 | 																thetas=th,
15 | 																angle_thresh=5,
16 | 																with_corner_edge_confidence=True,
17 | 																corner_confs=cs_c,
18 | 																theta_confs=th_c,
19 | 																theta_threshold=0.25,
20 | 																corner_edge_thresh=0.125,
21 | 																edge_map_weight=10.0,
22 | 																intersection_constraint=True,
23 | 																post_process=True)
24 | 
25 | 	# Draw output image
26 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_3.svg'.format(_id), (128, 128))
27 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
28 | 	draw_building(dwg, junctions, juncs_on, lines_on)
29 | 	dwg.save()
30 | 
31 | 	# Update metric
32 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
33 | 
34 | 	return metric


--------------------------------------------------------------------------------
/IP/experiments/exp_0.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Baseline - Trust on junctions orientations and optimize the number of edges
 9 | def run_experiment_0(cs, edge_map, th_filtered, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	# Run experiment
12 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
13 | 														use_junctions=True,
14 | 														thetas=th_filtered,
15 | 														angle_thresh=5,
16 | 														intersection_constraint=True,
17 | 														post_process=True)
18 | 
19 | 	# Draw output image
20 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_0.svg'.format(_id), (128, 128))
21 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
22 | 	draw_building(dwg, junctions, juncs_on, lines_on)
23 | 	dwg.save()
24 | 
25 | 	# Update metric
26 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
27 | 
28 | 	return


--------------------------------------------------------------------------------
/IP/experiments/exp_1.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Experiment I - Weighted edges indicator variables using edges confidence
 9 | def run_experiment_1(cs, edge_map, th_filtered, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
12 | 																use_junctions=True,
13 | 																thetas=th_filtered,
14 | 																angle_thresh=5,
15 | 																edge_threshold=0.5,
16 | 																with_edge_confidence=True,
17 | 																use_edge_classifier=False,
18 | 																edge_map_weight=10.0,
19 | 																intersection_constraint=True,
20 | 																post_process=True)
21 | 
22 | 	# Draw output image
23 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_1.svg'.format(_id), (128, 128))
24 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
25 | 	draw_building(dwg, junctions, juncs_on, lines_on)
26 | 	dwg.save()
27 | 
28 | 	# Update metric
29 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
30 | 
31 | 	return


--------------------------------------------------------------------------------
/IP/experiments/exp_2.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Experiment II - Weights as combined junctions and edges confidence
 9 | def run_experiment_2(cs, cs_c, edge_map, th_filtered, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	# Run experiment
12 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
13 | 																use_junctions=True,
14 | 																thetas=th_filtered,
15 | 																angle_thresh=5,
16 | 																with_corner_edge_confidence=True,
17 | 																corner_confs=cs_c,
18 | 																corner_edge_thresh=0.125,
19 | 																edge_map_weight=10.0,
20 | 																intersection_constraint=True,
21 | 																post_process=True)
22 | 
23 | 	# Draw output image
24 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_2.svg'.format(_id), (128, 128))
25 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
26 | 	draw_building(dwg, junctions, juncs_on, lines_on)
27 | 	dwg.save()
28 | 
29 | 	# Update metric
30 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
31 | 
32 | 	return metric
33 | 
34 | 


--------------------------------------------------------------------------------
/IP/experiments/exp_3.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Experiment III - Maximizing weighted sum of junction directions
 9 | def run_experiment_3(cs, cs_c, edge_map, th, th_c, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	# Run experiment
12 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
13 | 																use_junctions_with_var=True,
14 | 																thetas=th,
15 | 																angle_thresh=5,
16 | 																with_corner_edge_confidence=True,
17 | 																corner_confs=cs_c,
18 | 																theta_confs=th_c,
19 | 																theta_threshold=0.25,
20 | 																corner_edge_thresh=0.125,
21 | 																edge_map_weight=10.0,
22 | 																intersection_constraint=True,
23 | 																post_process=True)
24 | 
25 | 	# Draw output image
26 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_3.svg'.format(_id), (128, 128))
27 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
28 | 	draw_building(dwg, junctions, juncs_on, lines_on)
29 | 	dwg.save()
30 | 
31 | 	# Update metric
32 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
33 | 
34 | 	return metric


--------------------------------------------------------------------------------
/IP/experiments_aux/.ipynb_checkpoints/exp_0-checkpoint.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Baseline - Trust on junctions orientations and optimize the number of edges
 9 | def run_experiment_0(cs, edge_map, th_filtered, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	# Run experiment
12 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
13 | 														edge_threshold=0.5,
14 | 														with_edge_confidence=True, # edges
15 | 														edge_map_weight=10.0, # edges
16 | 														intersection_constraint=True, # intersection 
17 | 														with_corner_variables=True, # connectivity
18 | 														corner_min_degree_constraint=True, # degree
19 | 														post_process=True)
20 | 
21 | 	# Draw output image
22 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_0.svg'.format(_id), (128, 128))
23 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
24 | 	draw_building(dwg, junctions, juncs_on, lines_on)
25 | 	dwg.save()
26 | 
27 | 	# Update metric
28 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
29 | 
30 | 	return


--------------------------------------------------------------------------------
/IP/experiments_aux/.ipynb_checkpoints/exp_1-checkpoint.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Experiment I - Weighted edges indicator variables using edges confidence
 9 | def run_experiment_1(cs, cs_c, edge_map, th_filtered, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
12 | 																corner_confs=cs_c,
13 | 																with_corner_edge_confidence=True, # corners + edges
14 | 																corner_edge_thresh=0.125, # corners + edges
15 | 																edge_map_weight=10.0, # edges
16 | 																intersection_constraint=True, # intersection 
17 | 																with_corner_variables=True, # connectivity
18 | 																corner_min_degree_constraint=True, # degree
19 | 																post_process=True)
20 | 
21 |     
22 | 
23 |                                 
24 | 	# Draw output image
25 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_1.svg'.format(_id), (128, 128))
26 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
27 | 	draw_building(dwg, junctions, juncs_on, lines_on)
28 | 	dwg.save()
29 | 
30 | 	# Update metric
31 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
32 | 
33 | 	return


--------------------------------------------------------------------------------
/IP/experiments_aux/.ipynb_checkpoints/exp_2-checkpoint.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Experiment II - Weights as combined junctions and edges confidence
 9 | def run_experiment_2(cs, cs_c, edge_map, th, th_c, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	# Run experiment
12 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
13 | 																coner_to_edge_constraint=True, # corner-to-edge
14 | 																thetas=th, # corner-to-edge
15 | 																angle_thresh=5, # corner-to-edge
16 | 																with_corner_edge_confidence=True, # corners + edges
17 | 																corner_edge_thresh=0.125, # corners + edges        
18 | 																edge_map_weight=10.0, # edges           
19 |                                                         
20 | 																corner_confs=cs_c, # corners
21 | 																theta_confs=th_c, # corner-to-edge
22 | 																theta_threshold=0.25, # corner-to-edge
23 | 
24 | 																intersection_constraint=True, # intersection 
25 | 																with_corner_variables=True, # connectivity
26 | 																corner_min_degree_constraint=True, # degree
27 | 																post_process=True)
28 | 
29 | 	# Draw output image
30 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_2.svg'.format(_id), (128, 128))
31 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
32 | 	draw_building(dwg, junctions, juncs_on, lines_on)
33 | 	dwg.save()
34 | 
35 | 	# Update metric
36 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
37 | 
38 | 	return metric
39 | 
40 | 


--------------------------------------------------------------------------------
/IP/experiments_aux/.ipynb_checkpoints/exp_3-checkpoint.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Experiment III - Maximizing weighted sum of junction directions
 9 | def run_experiment_3(cs, cs_c, edge_map, th, th_c, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	# Run experiment
12 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
13 | 																use_junctions_with_var=True,
14 | 																thetas=th,
15 | 																angle_thresh=5,
16 | 																with_corner_edge_confidence=True,
17 | 																corner_confs=cs_c,
18 | 																theta_confs=th_c,
19 | 																theta_threshold=0.25,
20 | 																corner_edge_thresh=0.125,
21 | 																edge_map_weight=10.0,
22 | 																intersection_constraint=True,
23 | 																post_process=True)
24 | 
25 | 	# Draw output image
26 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_3.svg'.format(_id), (128, 128))
27 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
28 | 	draw_building(dwg, junctions, juncs_on, lines_on)
29 | 	dwg.save()
30 | 
31 | 	# Update metric
32 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
33 | 
34 | 	return metric


--------------------------------------------------------------------------------
/IP/experiments_aux/exp_0.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Baseline - Trust on junctions orientations and optimize the number of edges
 9 | def run_experiment_0(cs, edge_map, th_filtered, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	# Run experiment
12 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
13 | 														edge_threshold=0.5,
14 | 														with_edge_confidence=True, # edges
15 | 														edge_map_weight=10.0, # edges
16 | 														intersection_constraint=True, # intersection 
17 | 														with_corner_variables=True, # connectivity
18 | 														corner_min_degree_constraint=True, # degree
19 | 														post_process=True)
20 | 
21 | 	# Draw output image
22 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_0.svg'.format(_id), (128, 128))
23 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
24 | 	draw_building(dwg, junctions, juncs_on, lines_on)
25 | 	dwg.save()
26 | 
27 | 	# Update metric
28 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
29 | 
30 | 	return


--------------------------------------------------------------------------------
/IP/experiments_aux/exp_1.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Experiment I - Weighted edges indicator variables using edges confidence
 9 | def run_experiment_1(cs, cs_c, edge_map, th_filtered, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
12 | 																corner_confs=cs_c,
13 | 																with_corner_edge_confidence=True, # corners + edges
14 | 																corner_edge_thresh=0.125, # corners + edges
15 | 																edge_map_weight=10.0, # edges
16 | 																intersection_constraint=True, # intersection 
17 | 																with_corner_variables=True, # connectivity
18 | 																corner_min_degree_constraint=True, # degree
19 | 																post_process=True)
20 | 
21 |     
22 | 
23 |                                 
24 | 	# Draw output image
25 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_1.svg'.format(_id), (128, 128))
26 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
27 | 	draw_building(dwg, junctions, juncs_on, lines_on)
28 | 	dwg.save()
29 | 
30 | 	# Update metric
31 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
32 | 
33 | 	return


--------------------------------------------------------------------------------
/IP/experiments_aux/exp_2.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Experiment II - Weights as combined junctions and edges confidence
 9 | def run_experiment_2(cs, cs_c, edge_map, th, th_c, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	# Run experiment
12 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
13 | 																coner_to_edge_constraint=True, # corner-to-edge
14 | 																thetas=th, # corner-to-edge
15 | 																angle_thresh=5, # corner-to-edge
16 | 																with_corner_edge_confidence=True, # corners + edges
17 | 																corner_edge_thresh=0.125, # corners + edges        
18 | 																edge_map_weight=10.0, # edges           
19 |                                                         
20 | 																corner_confs=cs_c, # corners
21 | 																theta_confs=th_c, # corner-to-edge
22 | 																theta_threshold=0.25, # corner-to-edge
23 | 
24 | 																intersection_constraint=True, # intersection 
25 | 																with_corner_variables=True, # connectivity
26 | 																corner_min_degree_constraint=True, # degree
27 | 																post_process=True)
28 | 
29 | 	# Draw output image
30 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_2.svg'.format(_id), (128, 128))
31 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
32 | 	draw_building(dwg, junctions, juncs_on, lines_on)
33 | 	dwg.save()
34 | 
35 | 	# Update metric
36 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
37 | 
38 | 	return metric
39 | 
40 | 


--------------------------------------------------------------------------------
/IP/experiments_aux/exp_3.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import random
 3 | import svgwrite
 4 | from PIL import Image, ImageDraw
 5 | from utils.utils import *
 6 | from utils.optimizer import reconstructBuilding
 7 | 
 8 | # Experiment III - Maximizing weighted sum of junction directions
 9 | def run_experiment_3(cs, cs_c, edge_map, th, th_c, metric, graph_annot, rgb_dir, _id):
10 | 
11 | 	# Run experiment
12 | 	junctions, juncs_on, lines_on = reconstructBuilding(cs, edge_map,
13 | 																use_junctions_with_var=True,
14 | 																thetas=th,
15 | 																angle_thresh=5,
16 | 																with_corner_edge_confidence=True,
17 | 																corner_confs=cs_c,
18 | 																theta_confs=th_c,
19 | 																theta_threshold=0.25,
20 | 																corner_edge_thresh=0.125,
21 | 																edge_map_weight=10.0,
22 | 																intersection_constraint=True,
23 | 																post_process=True)
24 | 
25 | 	# Draw output image
26 | 	dwg = svgwrite.Drawing('../results/svg_regions/{}_3.svg'.format(_id), (128, 128))
27 | 	im_path = os.path.join(rgb_dir, _id + '.jpg')
28 | 	draw_building(dwg, junctions, juncs_on, lines_on)
29 | 	dwg.save()
30 | 
31 | 	# Update metric
32 | 	metric.forward(graph_annot, junctions, juncs_on, lines_on, _id)
33 | 
34 | 	return metric


--------------------------------------------------------------------------------
/IP/models/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/IP/models/__init__.py


--------------------------------------------------------------------------------
/IP/models/graph.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | import torch.nn as nn
 3 | import torch.nn.functional as F
 4 | from torch.autograd import Variable
 5 | 
 6 | # GNN - Graph Neural Network
 7 | class EdgeClassifier(nn.Module):
 8 |     def __init__(self, base):
 9 |         super(EdgeClassifier, self).__init__()
10 |         self.base = base
11 |         self.fc1 = nn.Linear(1000, 512, bias=True)
12 |         self.fc2 = nn.Linear(512, 1, bias=True)
13 |         self.relu = nn.ReLU(inplace=True)
14 | 
15 |     def forward(self, x):
16 | 
17 |         # apply backbone
18 |         x = self.relu(self.base(x))
19 | 
20 |         # classifier head
21 |         x = self.relu(self.fc1(x))
22 |         z = F.sigmoid(self.fc2(x)).view(-1)
23 | 
24 |         return  z
25 | 


--------------------------------------------------------------------------------
/IP/models/inception.py:
--------------------------------------------------------------------------------
 1 | import random
 2 | import torch
 3 | import torch.nn as nn
 4 | import torch.nn.functional as F
 5 | from torch.autograd import Variable, gradcheck
 6 | from torch.autograd.gradcheck import gradgradcheck
 7 | import torchvision.models as models
 8 | from torch.autograd import Variable
 9 | 
10 | import numpy as np
11 | import time
12 | import pdb
13 | import importlib
14 | 
15 | from model.networks.inception_v2 import inception_v2
16 | 
17 | 
18 | class inception(nn.Module):
19 |     def __init__(self, classes, opt):
20 |         super(inception, self).__init__()
21 |         self.classes = classes
22 |         self.n_classes = 2
23 |     
24 |         decoder_module = importlib.import_module('model.networks.{}_decoder'.format(opt.decoder))
25 | 
26 |         self.decoder_ = decoder_module.DecodeNet(opt, 'train')
27 |         self.base_net = inception_v2(num_classes = 2, with_bn=opt.hype.get('batchnorm', True))
28 |         
29 |     def forward(self, im_data, junc_conf, junc_res, bin_conf, bin_res):
30 |         # junc_conf, junc_res, bin_conf, bin_res
31 |         """ input includes:
32 |             im_data
33 |             gt_junctions
34 |             junc_conf
35 |             junc_residual
36 |             bin_conf
37 |             bin_residual
38 | 	    """
39 | 
40 |         batch_size = im_data.size(0)
41 |         base_feat = self.base_net(im_data)
42 |         preds = self.decoder_(base_feat)
43 |         return preds
44 | 


--------------------------------------------------------------------------------
/IP/models/utils.py:
--------------------------------------------------------------------------------
1 | try:
2 |     from torch.hub import load_state_dict_from_url
3 | except ImportError:
4 |     from torch.utils.model_zoo import load_url as load_state_dict_from_url
5 | 


--------------------------------------------------------------------------------
/IP/utils/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/IP/utils/__init__.py


--------------------------------------------------------------------------------
/PC_and_CE_inference/README.md:
--------------------------------------------------------------------------------
 1 | # Code for training junction detector.
 2 | ## Downloading Data
 3 | 
 4 | 
 5 | ## Preprocess
 6 | - install requirements in python3.
 7 | - put hype-parameter config file in hypes/EXPNAME.json, follow the example.
 8 | - preprocess dataset
 9 | ```
10 | python main.py --exp 1 --json --create_dataset
11 | ```
12 | 
13 | ## Training
14 | - train junction detector.
15 | ```
16 |   python3 main.py --exp 1 --json --gpu 0
17 | ```
18 | - testing.
19 | ```
20 |    python3 main.py --exp 1 --json --test --checkepoch 16 --gpu 0
21 | ```
22 | 


--------------------------------------------------------------------------------
/PC_and_CE_inference/_init_paths.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | import sys
 3 | 
 4 | def add_path(path):
 5 |     if path not in sys.path:
 6 |         sys.path.insert(0, path)
 7 | 
 8 | this_dir = os.path.dirname(__file__)
 9 | 
10 | # Add lib to PYTHONPATH
11 | lib_path = os.path.join(this_dir)
12 | add_path(lib_path)
13 | 


--------------------------------------------------------------------------------
/PC_and_CE_inference/datasets/.ipynb_checkpoints/config-checkpoint.py:
--------------------------------------------------------------------------------
 1 | import numpy as np
 2 | # 0 menas no rotation.
 3 | #rotation_angles = [i * 30. for i in range(12)] 
 4 | rotation_angles = [0, 180] 
 5 | # [0, 30, 60, 90, 120, 150, ..., 330]
 6 | 
 7 | crop_ration = [(0.25, 0.25, 0.75, 0.75)]
 8 | 
 9 | #pixel_mean = np.array([116.46479065, 126.95309567,  137.88588786], dtype=np.float32)
10 | 
11 | #pixel_mean = np.array([115.9839754, 126.63120922, 137.73309306], dtype=np.float32)
12 | #pixel_mean = np.array([116.465, 126.953, 137.886], dtype=np.float32)
13 | pixel_mean = np.array([116., 127., 138.], dtype=np.float32)
14 | 


--------------------------------------------------------------------------------
/PC_and_CE_inference/datasets/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PC_and_CE_inference/datasets/__init__.py


--------------------------------------------------------------------------------
/PC_and_CE_inference/datasets/config.py:
--------------------------------------------------------------------------------
 1 | import numpy as np
 2 | # 0 menas no rotation.
 3 | #rotation_angles = [i * 30. for i in range(12)] 
 4 | rotation_angles = [0, 180] 
 5 | # [0, 30, 60, 90, 120, 150, ..., 330]
 6 | 
 7 | crop_ration = [(0.25, 0.25, 0.75, 0.75)]
 8 | 
 9 | #pixel_mean = np.array([116.46479065, 126.95309567,  137.88588786], dtype=np.float32)
10 | 
11 | #pixel_mean = np.array([115.9839754, 126.63120922, 137.73309306], dtype=np.float32)
12 | #pixel_mean = np.array([116.465, 126.953, 137.886], dtype=np.float32)
13 | pixel_mean = np.array([116., 127., 138.], dtype=np.float32)
14 | 


--------------------------------------------------------------------------------
/PC_and_CE_inference/hypes/1.json:
--------------------------------------------------------------------------------
 1 | { "trainlst":"",
 2 |   "batchnorm": true,
 3 |   "solver": {
 4 |   	"batch_size": 1,
 5 |     "opt": "SGD", 
 6 |     "rnd_seed": 1, 
 7 |     "epsilon": 1e-05, 
 8 |   	"clip_norm": 1.0,
 9 | 	"momentum": 0.9
10 |   }, 
11 |   
12 |   "max_epochs": 20,
13 |   "steppoints": [8, 12, 16],
14 |   "num_classes": 2,
15 |   "focus_size": 1.5, 
16 |   "image_size": 480,
17 |   "grid_size": 60,
18 |   "region_size": 8, 
19 |   "max_len": 1, 
20 |   "num_bin": 15,
21 |   "loss_weights": [1.0, 0.1, 1.0, 0.1]
22 | }
23 | 


--------------------------------------------------------------------------------
/PC_and_CE_inference/hypes/2.json:
--------------------------------------------------------------------------------
 1 | { "trainlst":"",
 2 |   "batchnorm": true,
 3 |   "solver": {
 4 |   	"batch_size": 1,
 5 |     "opt": "SGD", 
 6 |     "rnd_seed": 1, 
 7 |     "epsilon": 1e-05, 
 8 |   	"clip_norm": 1.0,
 9 | 	"momentum": 0.9
10 |   }, 
11 |   
12 |   "max_epochs": 20,
13 |   "steppoints": [8, 12, 16],
14 |   "num_classes": 2,
15 |   "focus_size": 1.5, 
16 |   "image_size": 480,
17 |   "grid_size": 60,
18 |   "region_size": 8, 
19 |   "max_len": 1, 
20 |   "num_bin": 15,
21 |   "loss_weights": [1.0, 0.1, 1.0, 0.1]
22 | }
23 | 


--------------------------------------------------------------------------------
/PC_and_CE_inference/hypes/3.json:
--------------------------------------------------------------------------------
 1 | { "trainlst":"",
 2 |   "batchnorm": true,
 3 |   "solver": {
 4 |   	"batch_size": 10,
 5 |     "opt": "adam", 
 6 |     "rnd_seed": 1, 
 7 |     "epsilon": 1e-05, 
 8 |   	"clip_norm": 1.0,
 9 | 	"momentum": 0.9
10 |   }, 
11 |   
12 |   "max_epochs": 1000,
13 |   "steppoints": [100],
14 |   "num_classes": 2,
15 |   "focus_size": 1.5, 
16 |   "image_size": 256,
17 |   "grid_size": 32,
18 |   "region_size": 8, 
19 |   "max_len": 1, 
20 |   "num_bin": 15,
21 |   "loss_weights": [1.0, 0.1, 1.0, 0.1]
22 | }
23 | 


--------------------------------------------------------------------------------
/PC_and_CE_inference/model/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PC_and_CE_inference/model/__init__.py


--------------------------------------------------------------------------------
/PC_and_CE_inference/model/graph.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | import torch.nn as nn
 3 | import torch.nn.functional as F
 4 | from torch.autograd import Variable
 5 | 
 6 | # GNN - Graph Neural Network
 7 | class EdgeClassifier(nn.Module):
 8 |     def __init__(self, base):
 9 |         super(EdgeClassifier, self).__init__()
10 |         self.base = base
11 |         self.fc1 = nn.Linear(1000, 512, bias=True)
12 |         self.fc2 = nn.Linear(512, 1, bias=True)
13 |         self.relu = nn.ReLU(inplace=True)
14 | 
15 |     def forward(self, x):
16 | 
17 |         # apply backbone
18 |         x = self.relu(self.base(x))
19 | 
20 |         # classifier head
21 |         x = self.relu(self.fc1(x))
22 |         z = F.sigmoid(self.fc2(x)).view(-1)
23 | 
24 |         return  z
25 | 


--------------------------------------------------------------------------------
/PC_and_CE_inference/model/inception.py:
--------------------------------------------------------------------------------
 1 | import random
 2 | import torch
 3 | import torch.nn as nn
 4 | import torch.nn.functional as F
 5 | from torch.autograd import Variable, gradcheck
 6 | from torch.autograd.gradcheck import gradgradcheck
 7 | import torchvision.models as models
 8 | from torch.autograd import Variable
 9 | 
10 | import numpy as np
11 | import time
12 | import pdb
13 | import importlib
14 | 
15 | from model.networks.inception_v2 import inception_v2
16 | 
17 | 
18 | class inception(nn.Module):
19 |     def __init__(self, classes, opt):
20 |         super(inception, self).__init__()
21 |         self.classes = classes
22 |         self.n_classes = 2
23 |     
24 |         decoder_module = importlib.import_module('model.networks.{}_decoder'.format(opt.decoder))
25 | 
26 |         self.decoder_ = decoder_module.DecodeNet(opt, 'train')
27 |         self.base_net = inception_v2(num_classes = 2, with_bn=opt.hype.get('batchnorm', True))
28 |         
29 |     def forward(self, im_data, junc_conf, junc_res, bin_conf, bin_res):
30 |         # junc_conf, junc_res, bin_conf, bin_res
31 |         """ input includes:
32 |             im_data
33 |             gt_junctions
34 |             junc_conf
35 |             junc_residual
36 |             bin_conf
37 |             bin_residual
38 | 	    """
39 | 
40 |         batch_size = im_data.size(0)
41 |         base_feat = self.base_net(im_data)
42 |         preds = self.decoder_(base_feat)
43 |         return preds
44 | 


--------------------------------------------------------------------------------
/PC_and_CE_inference/model/networks/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PC_and_CE_inference/model/networks/__init__.py


--------------------------------------------------------------------------------
/PC_and_CE_inference/model/utils.py:
--------------------------------------------------------------------------------
1 | try:
2 |     from torch.hub import load_state_dict_from_url
3 | except ImportError:
4 |     from torch.utils.model_zoo import load_url as load_state_dict_from_url
5 | 


--------------------------------------------------------------------------------
/PC_and_CE_inference/ref.py:
--------------------------------------------------------------------------------
 1 | import numpy as np
 2 | from pathlib import Path
 3 | import os
 4 | 
 5 | home = Path.home()
 6 | 
 7 | eps = 1e-6
 8 | momentum = 0.9
 9 | weightDecay = 0.0
10 | alpha = 0.99
11 | epsilon = 1e-8
12 | 
13 | nThreads = 4
14 | pixel_mean = np.array([115.9839754, 126.63120922, 137.73309306], dtype=np.float32)
15 | 
16 | ext = '.pickle'
17 | #ext = '.pk'
18 | data_dir = Path('/home/nelson/Workspace/cities_dataset')
19 | root_dir = Path(os.getcwd()) / '..'
20 | data_root = data_dir
21 | junc_data_root = data_root / 'PC_and_CE_inference'
22 | output_root = root_dir / "output/"
23 | result_dir = root_dir / 'result' / 'PC_and_CE_inference'
24 | hypeDir = root_dir / 'PC_and_CE_inference/hypes'
25 | logdir = root_dir / 'logs'
26 | 


--------------------------------------------------------------------------------
/PC_and_CE_inference/requirements.txt:
--------------------------------------------------------------------------------
 1 | tqdm
 2 | joblib
 3 | scipy
 4 | numpy
 5 | opencv
 6 | dominate
 7 | easydict
 8 | plotly
 9 | progress
10 | 


--------------------------------------------------------------------------------
/PC_and_CE_inference/utils/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PC_and_CE_inference/utils/__init__.py


--------------------------------------------------------------------------------
/PE_inference/dataset/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PE_inference/dataset/__init__.py


--------------------------------------------------------------------------------
/PE_inference/model/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PE_inference/model/__init__.py


--------------------------------------------------------------------------------
/PE_inference/model/utils.py:
--------------------------------------------------------------------------------
1 | try:
2 |     from torch.hub import load_state_dict_from_url
3 | except ImportError:
4 |     from torch.utils.model_zoo import load_url as load_state_dict_from_url
5 | 


--------------------------------------------------------------------------------
/PE_inference/utils/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PE_inference/utils/__init__.py


--------------------------------------------------------------------------------
/PE_inference/utils/losses.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | import torch.nn as nn
 3 | import torch.nn.functional as F
 4 | 
 5 | def balanced_binary_cross_entropy(pred, gt, pos_w=2.0, neg_w=1.0):
 6 | 
 7 |     # flatten vectors
 8 |     pred = pred.view(-1)
 9 |     gt = gt.view(-1)
10 | 
11 |     # select postive/nevative samples
12 |     pos_ind = gt.nonzero().squeeze(-1)
13 |     neg_ind = (gt == 0).nonzero().squeeze(-1)
14 | 
15 |     # compute weighted loss
16 |     pos_loss = pos_w*F.binary_cross_entropy(pred[pos_ind], gt[pos_ind], size_average=True)
17 |     neg_loss = neg_w*F.binary_cross_entropy(pred[neg_ind], gt[neg_ind], size_average=True)
18 | 
19 |     return pos_loss + neg_loss
20 | 
21 | def mse(coords, coords_gt, prob_gt):
22 | 
23 |     # flatten vectors
24 |     coords = coords.view(-1, 2)
25 |     coords_gt = coords_gt.view(-1, 2)
26 |     prob_gt = prob_gt.view(-1)
27 | 
28 |     # select positive samples
29 |     pos_ind = prob_gt.nonzero().squeeze(-1)
30 |     pos_coords = coords[pos_ind, :]
31 |     pos_coords_gt = coords_gt[pos_ind, :]
32 | 
33 |     return F.mse_loss(pos_coords, pos_coords_gt)


--------------------------------------------------------------------------------
/PE_inference/utils/utils.py:
--------------------------------------------------------------------------------
 1 | import numpy as np
 2 | from PIL import Image
 3 | 
 4 | def compose_im(im_arr, alpha, shape=256):
 5 |     for i in range(shape):
 6 |         for j in range(shape):
 7 |             im_arr[i, j, :] = (1-alpha[i, j])*im_arr[i, j, :] + alpha[i, j]*np.array([0., 255., 0.])
 8 |     im_cmp = Image.fromarray(im_arr.astype('uint8')).resize((shape, shape))
 9 |     return im_cmp
10 | 
11 | def nms(dets, probs, embs=None, top_n=100, lim=0.0):
12 | 
13 |     if embs is None:
14 |         dets = np.concatenate([dets, probs[:, np.newaxis]], axis=-1)
15 |     else:
16 |         dets = np.concatenate([dets, probs[:, np.newaxis], embs], axis=-1)
17 |     dets = np.array(sorted(dets, key=lambda x: x[2], reverse=True))[:top_n, :]
18 |     for i in range(dets.shape[0]):
19 |         for j in range(i, dets.shape[0]):
20 |             if (dets[i, 2] != -1) and (dets[j, 2] != -1) and (i != j):
21 |                 dist = np.linalg.norm(dets[i, :2]-dets[j, :2])
22 |                 if dist <= lim:
23 |                     dets[j, 2] = -1
24 | 
25 |     to_keep = (dets[:, 2] != -1)
26 |     new_probs = dets[to_keep, 2]
27 |     new_dets = dets[to_keep, :2]
28 |     if embs is not None:
29 |         embs = dets[to_keep, 3:]
30 |     return new_dets, new_probs, embs
31 | 
32 |     


--------------------------------------------------------------------------------
/PR_inference/LICENSE:
--------------------------------------------------------------------------------
 1 | MIT License
 2 | 
 3 | Copyright (c) 2018 Facebook
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/PR_inference/README.md:
--------------------------------------------------------------------------------
1 | # Faster R-CNN and Mask R-CNN in PyTorch 1.0
2 | Refer to https://github.com/facebookresearch/maskrcnn-benchmark
3 | 


--------------------------------------------------------------------------------
/PR_inference/configs/.ipynb_checkpoints/buildings_mask_rcnn_R_50_FPN_1x-checkpoint.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |   ROI_MASK_HEAD:
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
26 |     PREDICTOR: "MaskRCNNC4Predictor"
27 |     POOLER_RESOLUTION: 14
28 |     POOLER_SAMPLING_RATIO: 2
29 |     RESOLUTION: 28
30 |     SHARE_BOX_FEATURE_EXTRACTOR: False
31 |   MASK_ON: True
32 | DATASETS:
33 |   TRAIN: ("buildings_train",)
34 |   TEST: ("buildings_val",)
35 | DATALOADER:
36 |   SIZE_DIVISIBILITY: 32
37 | SOLVER:
38 |   BASE_LR: 0.02
39 |   WEIGHT_DECAY: 0.0001
40 |   STEPS: (60000, 80000)
41 |   MAX_ITER: 90000


--------------------------------------------------------------------------------
/PR_inference/configs/buildings_mask_rcnn_R_50_FPN_1x.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |   ROI_MASK_HEAD:
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
26 |     PREDICTOR: "MaskRCNNC4Predictor"
27 |     POOLER_RESOLUTION: 14
28 |     POOLER_SAMPLING_RATIO: 2
29 |     RESOLUTION: 28
30 |     SHARE_BOX_FEATURE_EXTRACTOR: False
31 |   MASK_ON: True
32 | DATASETS:
33 |   TRAIN: ("buildings_train",)
34 |   TEST: ("buildings_val",)
35 | DATALOADER:
36 |   SIZE_DIVISIBILITY: 32
37 | SOLVER:
38 |   BASE_LR: 0.02
39 |   WEIGHT_DECAY: 0.0001
40 |   STEPS: (60000, 80000)
41 |   MAX_ITER: 90000


--------------------------------------------------------------------------------
/PR_inference/configs/caffe2/e2e_faster_rcnn_R_101_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/35857890/e2e_faster_rcnn_R-101-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-101-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 | DATASETS:
24 |   TEST: ("coco_2014_minival",)
25 | DATALOADER:
26 |   SIZE_DIVISIBILITY: 32
27 | 


--------------------------------------------------------------------------------
/PR_inference/configs/caffe2/e2e_faster_rcnn_R_50_C4_1x_caffe2.yaml:
--------------------------------------------------------------------------------
1 | MODEL:
2 |   META_ARCHITECTURE: "GeneralizedRCNN"
3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/35857197/e2e_faster_rcnn_R-50-C4_1x"
4 | DATASETS:
5 |   TEST: ("coco_2014_minival",)
6 | 


--------------------------------------------------------------------------------
/PR_inference/configs/caffe2/e2e_faster_rcnn_R_50_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/35857345/e2e_faster_rcnn_R-50-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 | DATASETS:
24 |   TEST: ("coco_2014_minival",)
25 | DATALOADER:
26 |   SIZE_DIVISIBILITY: 32
27 | 


--------------------------------------------------------------------------------
/PR_inference/configs/caffe2/e2e_faster_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/36761737/e2e_faster_rcnn_X-101-32x8d-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-101-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |     STRIDE_IN_1X1: False
 9 |     NUM_GROUPS: 32
10 |     WIDTH_PER_GROUP: 8
11 |   RPN:
12 |     USE_FPN: True
13 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
14 |     PRE_NMS_TOP_N_TRAIN: 2000
15 |     PRE_NMS_TOP_N_TEST: 1000
16 |     POST_NMS_TOP_N_TEST: 1000
17 |     FPN_POST_NMS_TOP_N_TEST: 1000
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |   ROI_BOX_HEAD:
21 |     POOLER_RESOLUTION: 7
22 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
23 |     POOLER_SAMPLING_RATIO: 2
24 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
25 |     PREDICTOR: "FPNPredictor"
26 | DATASETS:
27 |   TEST: ("coco_2014_minival",)
28 | DATALOADER:
29 |   SIZE_DIVISIBILITY: 32
30 | 


--------------------------------------------------------------------------------
/PR_inference/configs/caffe2/e2e_keypoint_rcnn_R_50_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/37697547/e2e_keypoint_rcnn_R-50-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |     NUM_CLASSES: 2
24 |   ROI_KEYPOINT_HEAD:
25 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
26 |     FEATURE_EXTRACTOR: "KeypointRCNNFeatureExtractor"
27 |     PREDICTOR: "KeypointRCNNPredictor"
28 |     POOLER_RESOLUTION: 14
29 |     POOLER_SAMPLING_RATIO: 2
30 |     RESOLUTION: 56
31 |     SHARE_BOX_FEATURE_EXTRACTOR: False
32 |   KEYPOINT_ON: True
33 | DATASETS:
34 |   TRAIN: ("keypoints_coco_2014_train", "keypoints_coco_2014_valminusminival",)
35 |   TEST: ("keypoints_coco_2014_minival",)
36 | INPUT:
37 |   MIN_SIZE_TRAIN: (640, 672, 704, 736, 768, 800)
38 | DATALOADER:
39 |   SIZE_DIVISIBILITY: 32
40 | SOLVER:
41 |   BASE_LR: 0.02
42 |   WEIGHT_DECAY: 0.0001
43 |   STEPS: (60000, 80000)
44 |   MAX_ITER: 90000
45 | 


--------------------------------------------------------------------------------
/PR_inference/configs/caffe2/e2e_mask_rcnn_R_101_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/35861795/e2e_mask_rcnn_R-101-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-101-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |   ROI_MASK_HEAD:
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
26 |     PREDICTOR: "MaskRCNNC4Predictor"
27 |     POOLER_RESOLUTION: 14
28 |     POOLER_SAMPLING_RATIO: 2
29 |     RESOLUTION: 28
30 |     SHARE_BOX_FEATURE_EXTRACTOR: False
31 |   MASK_ON: True
32 | DATASETS:
33 |   TEST: ("coco_2014_minival",)
34 | DATALOADER:
35 |   SIZE_DIVISIBILITY: 32
36 | 


--------------------------------------------------------------------------------
/PR_inference/configs/caffe2/e2e_mask_rcnn_R_50_C4_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/35858791/e2e_mask_rcnn_R-50-C4_1x"
 4 |   ROI_MASK_HEAD:
 5 |     PREDICTOR: "MaskRCNNC4Predictor"
 6 |     SHARE_BOX_FEATURE_EXTRACTOR: True
 7 |   MASK_ON: True
 8 | DATASETS:
 9 |   TEST: ("coco_2014_minival",)
10 | 


--------------------------------------------------------------------------------
/PR_inference/configs/caffe2/e2e_mask_rcnn_R_50_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/35858933/e2e_mask_rcnn_R-50-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |   ROI_MASK_HEAD:
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
26 |     PREDICTOR: "MaskRCNNC4Predictor"
27 |     POOLER_RESOLUTION: 14
28 |     POOLER_SAMPLING_RATIO: 2
29 |     RESOLUTION: 28
30 |     SHARE_BOX_FEATURE_EXTRACTOR: False
31 |   MASK_ON: True
32 | DATASETS:
33 |   TEST: ("coco_2014_minival",)
34 | DATALOADER:
35 |   SIZE_DIVISIBILITY: 32
36 | 


--------------------------------------------------------------------------------
/PR_inference/configs/caffe2/e2e_mask_rcnn_X-152-32x8d-FPN-IN5k_1.44x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/37129812/e2e_mask_rcnn_X-152-32x8d-FPN-IN5k_1.44x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-152-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |     STRIDE_IN_1X1: False
 9 |     NUM_GROUPS: 32
10 |     WIDTH_PER_GROUP: 8
11 |   RPN:
12 |     USE_FPN: True
13 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
14 |     PRE_NMS_TOP_N_TRAIN: 2000
15 |     PRE_NMS_TOP_N_TEST: 1000
16 |     POST_NMS_TOP_N_TEST: 1000
17 |     FPN_POST_NMS_TOP_N_TEST: 1000
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |   ROI_BOX_HEAD:
21 |     POOLER_RESOLUTION: 7
22 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
23 |     POOLER_SAMPLING_RATIO: 2
24 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
25 |     PREDICTOR: "FPNPredictor"
26 |   ROI_MASK_HEAD:
27 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
28 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
29 |     PREDICTOR: "MaskRCNNC4Predictor"
30 |     POOLER_RESOLUTION: 14
31 |     POOLER_SAMPLING_RATIO: 2
32 |     RESOLUTION: 28
33 |     SHARE_BOX_FEATURE_EXTRACTOR: False
34 |   MASK_ON: True
35 | DATASETS:
36 |   TEST: ("coco_2014_minival",)
37 | DATALOADER:
38 |   SIZE_DIVISIBILITY: 32
39 | 


--------------------------------------------------------------------------------
/PR_inference/configs/caffe2/e2e_mask_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/36761843/e2e_mask_rcnn_X-101-32x8d-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-101-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |     STRIDE_IN_1X1: False
 9 |     NUM_GROUPS: 32
10 |     WIDTH_PER_GROUP: 8
11 |   RPN:
12 |     USE_FPN: True
13 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
14 |     PRE_NMS_TOP_N_TRAIN: 2000
15 |     PRE_NMS_TOP_N_TEST: 1000
16 |     POST_NMS_TOP_N_TEST: 1000
17 |     FPN_POST_NMS_TOP_N_TEST: 1000
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |   ROI_BOX_HEAD:
21 |     POOLER_RESOLUTION: 7
22 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
23 |     POOLER_SAMPLING_RATIO: 2
24 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
25 |     PREDICTOR: "FPNPredictor"
26 |   ROI_MASK_HEAD:
27 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
28 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
29 |     PREDICTOR: "MaskRCNNC4Predictor"
30 |     POOLER_RESOLUTION: 14
31 |     POOLER_SAMPLING_RATIO: 2
32 |     RESOLUTION: 28
33 |     SHARE_BOX_FEATURE_EXTRACTOR: False
34 |   MASK_ON: True
35 | DATASETS:
36 |   TEST: ("coco_2014_minival",)
37 | DATALOADER:
38 |   SIZE_DIVISIBILITY: 32
39 | 


--------------------------------------------------------------------------------
/PR_inference/configs/cityscapes/e2e_faster_rcnn_R_50_FPN_1x_cocostyle.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |     NUM_CLASSES: 9
24 | DATASETS:
25 |   TRAIN: ("cityscapes_fine_instanceonly_seg_train_cocostyle",)
26 |   TEST: ("cityscapes_fine_instanceonly_seg_val_cocostyle",)
27 | DATALOADER:
28 |   SIZE_DIVISIBILITY: 32
29 | SOLVER:
30 |   BASE_LR: 0.01
31 |   WEIGHT_DECAY: 0.0001
32 |   STEPS: (18000,)
33 |   MAX_ITER: 24000
34 | 


--------------------------------------------------------------------------------
/PR_inference/configs/cityscapes/e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |     NUM_CLASSES: 9
24 |   ROI_MASK_HEAD:
25 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
26 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
27 |     PREDICTOR: "MaskRCNNC4Predictor"
28 |     POOLER_RESOLUTION: 14
29 |     POOLER_SAMPLING_RATIO: 2
30 |     RESOLUTION: 28
31 |     SHARE_BOX_FEATURE_EXTRACTOR: False
32 |   MASK_ON: True
33 | DATASETS:
34 |   TRAIN: ("cityscapes_fine_instanceonly_seg_train_cocostyle",)
35 |   TEST: ("cityscapes_fine_instanceonly_seg_val_cocostyle",)
36 | DATALOADER:
37 |   SIZE_DIVISIBILITY: 32
38 | SOLVER:
39 |   BASE_LR: 0.01
40 |   WEIGHT_DECAY: 0.0001
41 |   STEPS: (18000,)
42 |   MAX_ITER: 24000
43 | 


--------------------------------------------------------------------------------
/PR_inference/configs/gn_baselines/README.md:
--------------------------------------------------------------------------------
 1 | ### Group Normalization
 2 | 1 [Group Normalization](https://arxiv.org/abs/1803.08494)  
 3 | 2 [Rethinking ImageNet Pre-training](https://arxiv.org/abs/1811.08883)  
 4 | 3 [official code](https://github.com/facebookresearch/Detectron/blob/master/projects/GN/README.md)  
 5 | 
 6 | 
 7 | ### Performance
 8 | |      case                  |    Type      |  lr schd  |  im/gpu | bbox AP | mask AP |
 9 | |----------------------------|:------------:|:---------:|:-------:|:-------:|:-------:|
10 | |   R-50-FPN, GN (paper)     | finetune     |    2x     |   2     |   40.3  |  35.7   |
11 | |   R-50-FPN, GN (implement) | finetune     |    2x     |   2     |   40.2  |  36.0   |
12 | |   R-50-FPN, GN (paper)     | from scratch |    3x     |   2     |   39.5  |  35.2   |
13 | |   R-50-FPN, GN (implement) | from scratch |    3x     |   2     |   38.9  |  35.1   |
14 | 


--------------------------------------------------------------------------------
/PR_inference/configs/gn_baselines/e2e_faster_rcnn_R_50_FPN_1x_gn.yaml:
--------------------------------------------------------------------------------
 1 | INPUT:
 2 |   MIN_SIZE_TRAIN: (800,)
 3 |   MAX_SIZE_TRAIN: 1333
 4 |   MIN_SIZE_TEST: 800
 5 |   MAX_SIZE_TEST: 1333
 6 | MODEL:
 7 |   META_ARCHITECTURE: "GeneralizedRCNN"
 8 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50-GN"
 9 |   BACKBONE:
10 |     CONV_BODY: "R-50-FPN"
11 |   RESNETS: # use GN for backbone
12 |     BACKBONE_OUT_CHANNELS: 256
13 |     STRIDE_IN_1X1: False
14 |     TRANS_FUNC: "BottleneckWithGN"
15 |     STEM_FUNC: "StemWithGN"
16 |   FPN:
17 |     USE_GN: True # use GN for FPN
18 |   RPN:
19 |     USE_FPN: True
20 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
21 |     PRE_NMS_TOP_N_TRAIN: 2000
22 |     PRE_NMS_TOP_N_TEST: 1000
23 |     POST_NMS_TOP_N_TEST: 1000
24 |     FPN_POST_NMS_TOP_N_TEST: 1000
25 |   ROI_HEADS:
26 |     USE_FPN: True
27 |     BATCH_SIZE_PER_IMAGE: 512
28 |     POSITIVE_FRACTION: 0.25
29 |   ROI_BOX_HEAD:
30 |     USE_GN: True # use GN for bbox head
31 |     POOLER_RESOLUTION: 7
32 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
33 |     POOLER_SAMPLING_RATIO: 2
34 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
35 |     PREDICTOR: "FPNPredictor"
36 | DATASETS:
37 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
38 |   TEST: ("coco_2014_minival",)
39 | DATALOADER:
40 |   SIZE_DIVISIBILITY: 32
41 | SOLVER:
42 |   # Assume 8 gpus
43 |   BASE_LR: 0.02
44 |   WEIGHT_DECAY: 0.0001
45 |   STEPS: (60000, 80000)
46 |   MAX_ITER: 90000
47 |   IMS_PER_BATCH: 16
48 | TEST:
49 |   IMS_PER_BATCH: 8
50 | 


--------------------------------------------------------------------------------
/PR_inference/configs/gn_baselines/e2e_faster_rcnn_R_50_FPN_Xconv1fc_1x_gn.yaml:
--------------------------------------------------------------------------------
 1 | INPUT:
 2 |   MIN_SIZE_TRAIN: (800,)
 3 |   MAX_SIZE_TRAIN: 1333
 4 |   MIN_SIZE_TEST: 800
 5 |   MAX_SIZE_TEST: 1333
 6 | MODEL:
 7 |   META_ARCHITECTURE: "GeneralizedRCNN"
 8 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50-GN"
 9 |   BACKBONE:
10 |     CONV_BODY: "R-50-FPN"
11 |   RESNETS: # use GN for backbone
12 |     BACKBONE_OUT_CHANNELS: 256
13 |     STRIDE_IN_1X1: False
14 |     TRANS_FUNC: "BottleneckWithGN"
15 |     STEM_FUNC: "StemWithGN"
16 |   FPN:
17 |     USE_GN: True # use GN for FPN
18 |   RPN:
19 |     USE_FPN: True
20 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
21 |     PRE_NMS_TOP_N_TRAIN: 2000
22 |     PRE_NMS_TOP_N_TEST: 1000
23 |     POST_NMS_TOP_N_TEST: 1000
24 |     FPN_POST_NMS_TOP_N_TEST: 1000
25 |   ROI_HEADS:
26 |     USE_FPN: True
27 |     BATCH_SIZE_PER_IMAGE: 512
28 |     POSITIVE_FRACTION: 0.25
29 |   ROI_BOX_HEAD:
30 |     USE_GN: True # use GN for bbox head
31 |     POOLER_RESOLUTION: 7
32 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
33 |     POOLER_SAMPLING_RATIO: 2
34 |     CONV_HEAD_DIM: 256
35 |     NUM_STACKED_CONVS: 4
36 |     FEATURE_EXTRACTOR: "FPNXconv1fcFeatureExtractor"
37 |     PREDICTOR: "FPNPredictor"
38 | DATASETS:
39 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
40 |   TEST: ("coco_2014_minival",)
41 | DATALOADER:
42 |   SIZE_DIVISIBILITY: 32
43 | SOLVER:
44 |   # Assume 8 gpus
45 |   BASE_LR: 0.02
46 |   WEIGHT_DECAY: 0.0001
47 |   STEPS: (60000, 80000)
48 |   MAX_ITER: 90000
49 |   IMS_PER_BATCH: 16
50 | TEST:
51 |   IMS_PER_BATCH: 8
52 | 


--------------------------------------------------------------------------------
/PR_inference/configs/gn_baselines/scratch_e2e_faster_rcnn_R_50_FPN_3x_gn.yaml:
--------------------------------------------------------------------------------
 1 | INPUT:
 2 |   MIN_SIZE_TRAIN: (800,)
 3 |   MAX_SIZE_TRAIN: 1333
 4 |   MIN_SIZE_TEST: 800
 5 |   MAX_SIZE_TEST: 1333
 6 | MODEL:
 7 |   META_ARCHITECTURE: "GeneralizedRCNN"
 8 |   WEIGHT: "" # no pretrained model
 9 |   BACKBONE:
10 |     CONV_BODY: "R-50-FPN"
11 |     FREEZE_CONV_BODY_AT: 0 # finetune all layers
12 |   RESNETS: # use GN for backbone
13 |     BACKBONE_OUT_CHANNELS: 256
14 |     STRIDE_IN_1X1: False
15 |     TRANS_FUNC: "BottleneckWithGN"
16 |     STEM_FUNC: "StemWithGN"
17 |   FPN:
18 |     USE_GN: True # use GN for FPN
19 |   RPN:
20 |     USE_FPN: True
21 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
22 |     PRE_NMS_TOP_N_TRAIN: 2000
23 |     PRE_NMS_TOP_N_TEST: 1000
24 |     POST_NMS_TOP_N_TEST: 1000
25 |     FPN_POST_NMS_TOP_N_TEST: 1000
26 |   ROI_HEADS:
27 |     USE_FPN: True
28 |     BATCH_SIZE_PER_IMAGE: 512
29 |     POSITIVE_FRACTION: 0.25
30 |   ROI_BOX_HEAD:
31 |     USE_GN: True # use GN for bbox head
32 |     POOLER_RESOLUTION: 7
33 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
34 |     POOLER_SAMPLING_RATIO: 2
35 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
36 |     PREDICTOR: "FPNPredictor"
37 | DATASETS:
38 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
39 |   TEST: ("coco_2014_minival",)
40 | DATALOADER:
41 |   SIZE_DIVISIBILITY: 32
42 | SOLVER:
43 |   # Assume 8 gpus
44 |   BASE_LR: 0.02
45 |   WEIGHT_DECAY: 0.0001
46 |   STEPS: (210000, 250000)
47 |   MAX_ITER: 270000
48 |   IMS_PER_BATCH: 16
49 | TEST:
50 |   IMS_PER_BATCH: 8
51 | 


--------------------------------------------------------------------------------
/PR_inference/configs/gn_baselines/scratch_e2e_faster_rcnn_R_50_FPN_Xconv1fc_3x_gn.yaml:
--------------------------------------------------------------------------------
 1 | INPUT:
 2 |   MIN_SIZE_TRAIN: (800,)
 3 |   MAX_SIZE_TRAIN: 1333
 4 |   MIN_SIZE_TEST: 800
 5 |   MAX_SIZE_TEST: 1333
 6 | MODEL:
 7 |   META_ARCHITECTURE: "GeneralizedRCNN"
 8 |   WEIGHT: "" # no pretrained model
 9 |   BACKBONE:
10 |     CONV_BODY: "R-50-FPN"
11 |     FREEZE_CONV_BODY_AT: 0 # finetune all layers
12 |   RESNETS: # use GN for backbone
13 |     BACKBONE_OUT_CHANNELS: 256
14 |     STRIDE_IN_1X1: False
15 |     TRANS_FUNC: "BottleneckWithGN"
16 |     STEM_FUNC: "StemWithGN"
17 |   FPN:
18 |     USE_GN: True # use GN for FPN
19 |   RPN:
20 |     USE_FPN: True
21 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
22 |     PRE_NMS_TOP_N_TRAIN: 2000
23 |     PRE_NMS_TOP_N_TEST: 1000
24 |     POST_NMS_TOP_N_TEST: 1000
25 |     FPN_POST_NMS_TOP_N_TEST: 1000
26 |   ROI_HEADS:
27 |     USE_FPN: True
28 |     BATCH_SIZE_PER_IMAGE: 512
29 |     POSITIVE_FRACTION: 0.25
30 |   ROI_BOX_HEAD:
31 |     USE_GN: True # use GN for bbox head
32 |     POOLER_RESOLUTION: 7
33 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
34 |     POOLER_SAMPLING_RATIO: 2
35 |     CONV_HEAD_DIM: 256
36 |     NUM_STACKED_CONVS: 4
37 |     FEATURE_EXTRACTOR: "FPNXconv1fcFeatureExtractor"
38 |     PREDICTOR: "FPNPredictor"
39 | DATASETS:
40 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
41 |   TEST: ("coco_2014_minival",)
42 | DATALOADER:
43 |   SIZE_DIVISIBILITY: 32
44 | SOLVER:
45 |   # Assume 8 gpus
46 |   BASE_LR: 0.02
47 |   WEIGHT_DECAY: 0.0001
48 |   STEPS: (210000, 250000)
49 |   MAX_ITER: 270000
50 |   IMS_PER_BATCH: 16
51 | TEST:
52 |   IMS_PER_BATCH: 8
53 | 


--------------------------------------------------------------------------------
/PR_inference/configs/pascal_voc/e2e_faster_rcnn_R_50_C4_1x_1_gpu_voc.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN:
 5 |     PRE_NMS_TOP_N_TEST: 6000
 6 |     POST_NMS_TOP_N_TEST: 300
 7 |     ANCHOR_SIZES: (128, 256, 512)
 8 |   ROI_BOX_HEAD:
 9 |     NUM_CLASSES: 21
10 | DATASETS:
11 |   TRAIN: ("voc_2007_train", "voc_2007_val")
12 |   TEST: ("voc_2007_test",)
13 | SOLVER:
14 |   BASE_LR: 0.001
15 |   WEIGHT_DECAY: 0.0001
16 |   STEPS: (50000, )
17 |   MAX_ITER: 70000
18 |   IMS_PER_BATCH: 1
19 | TEST:
20 |   IMS_PER_BATCH: 1
21 | 


--------------------------------------------------------------------------------
/PR_inference/configs/pascal_voc/e2e_faster_rcnn_R_50_C4_1x_4_gpu_voc.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN:
 5 |     PRE_NMS_TOP_N_TEST: 6000
 6 |     POST_NMS_TOP_N_TEST: 300
 7 |     ANCHOR_SIZES: (128, 256, 512)
 8 |   ROI_BOX_HEAD:
 9 |     NUM_CLASSES: 21
10 | DATASETS:
11 |   TRAIN: ("voc_2007_train", "voc_2007_val")
12 |   TEST: ("voc_2007_test",)
13 | SOLVER:
14 |   BASE_LR: 0.004
15 |   WEIGHT_DECAY: 0.0001
16 |   STEPS: (12500, )
17 |   MAX_ITER: 17500
18 |   IMS_PER_BATCH: 4
19 | TEST:
20 |   IMS_PER_BATCH: 4
21 | 


--------------------------------------------------------------------------------
/PR_inference/configs/pascal_voc/e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |     NUM_CLASSES: 21
24 |   ROI_MASK_HEAD:
25 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
26 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
27 |     PREDICTOR: "MaskRCNNC4Predictor"
28 |     POOLER_RESOLUTION: 14
29 |     POOLER_SAMPLING_RATIO: 2
30 |     RESOLUTION: 28
31 |     SHARE_BOX_FEATURE_EXTRACTOR: False
32 |   MASK_ON: True
33 | DATASETS:
34 |   TRAIN: ("voc_2012_train_cocostyle",)
35 |   TEST: ("voc_2012_val_cocostyle",)
36 | DATALOADER:
37 |   SIZE_DIVISIBILITY: 32
38 | SOLVER:
39 |   BASE_LR: 0.01
40 |   WEIGHT_DECAY: 0.0001
41 |   STEPS: (18000,)
42 |   MAX_ITER: 24000
43 | 


--------------------------------------------------------------------------------
/PR_inference/configs/quick_schedules/e2e_faster_rcnn_R_50_C4_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN:
 5 |     PRE_NMS_TOP_N_TEST: 6000
 6 |     POST_NMS_TOP_N_TEST: 1000
 7 |   ROI_HEADS:
 8 |     BATCH_SIZE_PER_IMAGE: 256
 9 | DATASETS:
10 |   TRAIN: ("coco_2014_minival",)
11 |   TEST: ("coco_2014_minival",)
12 | INPUT:
13 |   MIN_SIZE_TRAIN: (600,)
14 |   MAX_SIZE_TRAIN: 1000
15 |   MIN_SIZE_TEST: 800
16 |   MAX_SIZE_TEST: 1000
17 | SOLVER:
18 |   BASE_LR: 0.005
19 |   WEIGHT_DECAY: 0.0001
20 |   STEPS: (1500,)
21 |   MAX_ITER: 2000
22 |   IMS_PER_BATCH: 2
23 | TEST:
24 |   IMS_PER_BATCH: 2
25 | 


--------------------------------------------------------------------------------
/PR_inference/configs/quick_schedules/e2e_faster_rcnn_R_50_FPN_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |     BATCH_SIZE_PER_IMAGE: 256
18 |   ROI_BOX_HEAD:
19 |     POOLER_RESOLUTION: 7
20 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
21 |     POOLER_SAMPLING_RATIO: 2
22 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
23 |     PREDICTOR: "FPNPredictor"
24 | DATASETS:
25 |   TRAIN: ("coco_2014_minival",)
26 |   TEST: ("coco_2014_minival",)
27 | INPUT:
28 |   MIN_SIZE_TRAIN: (600,)
29 |   MAX_SIZE_TRAIN: 1000
30 |   MIN_SIZE_TEST: 800
31 |   MAX_SIZE_TEST: 1000
32 | DATALOADER:
33 |   SIZE_DIVISIBILITY: 32
34 | SOLVER:
35 |   BASE_LR: 0.005
36 |   WEIGHT_DECAY: 0.0001
37 |   STEPS: (1500,)
38 |   MAX_ITER: 2000
39 |   IMS_PER_BATCH: 4
40 | TEST:
41 |   IMS_PER_BATCH: 2
42 | 


--------------------------------------------------------------------------------
/PR_inference/configs/quick_schedules/e2e_faster_rcnn_X_101_32x8d_FPN_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-101-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |     STRIDE_IN_1X1: False
 9 |     NUM_GROUPS: 32
10 |     WIDTH_PER_GROUP: 8
11 |   RPN:
12 |     USE_FPN: True
13 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
14 |     PRE_NMS_TOP_N_TRAIN: 2000
15 |     PRE_NMS_TOP_N_TEST: 1000
16 |     POST_NMS_TOP_N_TEST: 1000
17 |     FPN_POST_NMS_TOP_N_TEST: 1000
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |     BATCH_SIZE_PER_IMAGE: 256
21 |   ROI_BOX_HEAD:
22 |     POOLER_RESOLUTION: 7
23 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
24 |     POOLER_SAMPLING_RATIO: 2
25 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
26 |     PREDICTOR: "FPNPredictor"
27 | DATASETS:
28 |   TRAIN: ("coco_2014_minival",)
29 |   TEST: ("coco_2014_minival",)
30 | INPUT:
31 |   MIN_SIZE_TRAIN: (600,)
32 |   MAX_SIZE_TRAIN: 1000
33 |   MIN_SIZE_TEST: 800
34 |   MAX_SIZE_TEST: 1000
35 | DATALOADER:
36 |   SIZE_DIVISIBILITY: 32
37 | SOLVER:
38 |   BASE_LR: 0.005
39 |   WEIGHT_DECAY: 0.0001
40 |   STEPS: (1500,)
41 |   MAX_ITER: 2000
42 |   IMS_PER_BATCH: 2
43 | TEST:
44 |   IMS_PER_BATCH: 2
45 | 


--------------------------------------------------------------------------------
/PR_inference/configs/quick_schedules/e2e_keypoint_rcnn_R_50_FPN_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |     BATCH_SIZE_PER_IMAGE: 256
18 |   ROI_BOX_HEAD:
19 |     POOLER_RESOLUTION: 7
20 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
21 |     POOLER_SAMPLING_RATIO: 2
22 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
23 |     PREDICTOR: "FPNPredictor"
24 |     NUM_CLASSES: 2
25 |   ROI_KEYPOINT_HEAD:
26 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
27 |     FEATURE_EXTRACTOR: "KeypointRCNNFeatureExtractor"
28 |     PREDICTOR: "KeypointRCNNPredictor"
29 |     POOLER_RESOLUTION: 14
30 |     POOLER_SAMPLING_RATIO: 2
31 |     RESOLUTION: 56
32 |     SHARE_BOX_FEATURE_EXTRACTOR: False
33 |   KEYPOINT_ON: True
34 | DATASETS:
35 |   TRAIN: ("keypoints_coco_2014_minival",)
36 |   TEST: ("keypoints_coco_2014_minival",)
37 | INPUT:
38 |   MIN_SIZE_TRAIN: (640, 672, 704, 736, 768, 800)
39 |   MAX_SIZE_TRAIN: 1000
40 |   MIN_SIZE_TEST: 800
41 |   MAX_SIZE_TEST: 1000
42 | DATALOADER:
43 |   SIZE_DIVISIBILITY: 32
44 | SOLVER:
45 |   BASE_LR: 0.005
46 |   WEIGHT_DECAY: 0.0001
47 |   STEPS: (1500,)
48 |   MAX_ITER: 2000
49 |   IMS_PER_BATCH: 4
50 | TEST:
51 |   IMS_PER_BATCH: 2
52 | 


--------------------------------------------------------------------------------
/PR_inference/configs/quick_schedules/e2e_mask_rcnn_R_50_C4_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN:
 5 |     PRE_NMS_TOP_N_TEST: 6000
 6 |     POST_NMS_TOP_N_TEST: 1000
 7 |   ROI_HEADS:
 8 |     BATCH_SIZE_PER_IMAGE: 256
 9 |   ROI_MASK_HEAD:
10 |     PREDICTOR: "MaskRCNNC4Predictor"
11 |     SHARE_BOX_FEATURE_EXTRACTOR: True
12 |   MASK_ON: True
13 | DATASETS:
14 |   TRAIN: ("coco_2014_minival",)
15 |   TEST: ("coco_2014_minival",)
16 | INPUT:
17 |   MIN_SIZE_TRAIN: (600,)
18 |   MAX_SIZE_TRAIN: 1000
19 |   MIN_SIZE_TEST: 800
20 |   MAX_SIZE_TEST: 1000
21 | SOLVER:
22 |   BASE_LR: 0.005
23 |   WEIGHT_DECAY: 0.0001
24 |   STEPS: (1500,)
25 |   MAX_ITER: 2000
26 |   IMS_PER_BATCH: 4
27 | TEST:
28 |   IMS_PER_BATCH: 2
29 | 


--------------------------------------------------------------------------------
/PR_inference/configs/quick_schedules/e2e_mask_rcnn_R_50_FPN_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |     BATCH_SIZE_PER_IMAGE: 256
18 |   ROI_BOX_HEAD:
19 |     POOLER_RESOLUTION: 7
20 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
21 |     POOLER_SAMPLING_RATIO: 2
22 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
23 |     PREDICTOR: "FPNPredictor"
24 |   ROI_MASK_HEAD:
25 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
26 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
27 |     PREDICTOR: "MaskRCNNC4Predictor"
28 |     POOLER_RESOLUTION: 14
29 |     POOLER_SAMPLING_RATIO: 2
30 |     RESOLUTION: 28
31 |     SHARE_BOX_FEATURE_EXTRACTOR: False
32 |   MASK_ON: True
33 | DATASETS:
34 |   TRAIN: ("coco_2014_minival",)
35 |   TEST: ("coco_2014_minival",)
36 | INPUT:
37 |   MIN_SIZE_TRAIN: (600,)
38 |   MAX_SIZE_TRAIN: 1000
39 |   MIN_SIZE_TEST: 800
40 |   MAX_SIZE_TEST: 1000
41 | DATALOADER:
42 |   SIZE_DIVISIBILITY: 32
43 | SOLVER:
44 |   BASE_LR: 0.005
45 |   WEIGHT_DECAY: 0.0001
46 |   STEPS: (1500,)
47 |   MAX_ITER: 2000
48 |   IMS_PER_BATCH: 4
49 | TEST:
50 |   IMS_PER_BATCH: 2
51 | 


--------------------------------------------------------------------------------
/PR_inference/configs/quick_schedules/e2e_mask_rcnn_X_101_32x8d_FPN_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-101-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |     STRIDE_IN_1X1: False
 9 |     NUM_GROUPS: 32
10 |     WIDTH_PER_GROUP: 8
11 |   RPN:
12 |     USE_FPN: True
13 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
14 |     PRE_NMS_TOP_N_TRAIN: 2000
15 |     PRE_NMS_TOP_N_TEST: 1000
16 |     POST_NMS_TOP_N_TEST: 1000
17 |     FPN_POST_NMS_TOP_N_TEST: 1000
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |     BATCH_SIZE_PER_IMAGE: 256
21 |   ROI_BOX_HEAD:
22 |     POOLER_RESOLUTION: 7
23 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
24 |     POOLER_SAMPLING_RATIO: 2
25 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
26 |     PREDICTOR: "FPNPredictor"
27 |   ROI_MASK_HEAD:
28 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
29 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
30 |     PREDICTOR: "MaskRCNNC4Predictor"
31 |     POOLER_RESOLUTION: 14
32 |     POOLER_SAMPLING_RATIO: 2
33 |     RESOLUTION: 28
34 |     SHARE_BOX_FEATURE_EXTRACTOR: False
35 |   MASK_ON: True
36 | DATASETS:
37 |   TRAIN: ("coco_2014_minival",)
38 |   TEST: ("coco_2014_minival",)
39 | INPUT:
40 |   MIN_SIZE_TRAIN: (600,)
41 |   MAX_SIZE_TRAIN: 1000
42 |   MIN_SIZE_TEST: 800
43 |   MAX_SIZE_TEST: 1000
44 | DATALOADER:
45 |   SIZE_DIVISIBILITY: 32
46 | SOLVER:
47 |   BASE_LR: 0.005
48 |   WEIGHT_DECAY: 0.0001
49 |   STEPS: (1500,)
50 |   MAX_ITER: 2000
51 |   IMS_PER_BATCH: 2
52 | TEST:
53 |   IMS_PER_BATCH: 2
54 | 


--------------------------------------------------------------------------------
/PR_inference/configs/quick_schedules/rpn_R_50_C4_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN_ONLY: True
 5 |   RPN:
 6 |     PRE_NMS_TOP_N_TEST: 12000
 7 |     POST_NMS_TOP_N_TEST: 2000
 8 | DATASETS:
 9 |   TRAIN: ("coco_2014_minival",)
10 |   TEST: ("coco_2014_minival",)
11 | INPUT:
12 |   MIN_SIZE_TRAIN: (600,)
13 |   MAX_SIZE_TRAIN: 1000
14 |   MIN_SIZE_TEST: 800
15 |   MAX_SIZE_TEST: 1000
16 | SOLVER:
17 |   BASE_LR: 0.005
18 |   WEIGHT_DECAY: 0.0001
19 |   STEPS: (1500,)
20 |   MAX_ITER: 2000
21 |   IMS_PER_BATCH: 4
22 | TEST:
23 |   IMS_PER_BATCH: 2
24 | 


--------------------------------------------------------------------------------
/PR_inference/configs/quick_schedules/rpn_R_50_FPN_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN_ONLY: True
 5 |   BACKBONE:
 6 |     CONV_BODY: "R-50-FPN"
 7 |   RESNETS:
 8 |     BACKBONE_OUT_CHANNELS: 256
 9 |   RPN:
10 |     USE_FPN: True
11 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 2000
14 |     FPN_POST_NMS_TOP_N_TEST: 2000
15 | DATASETS:
16 |   TRAIN: ("coco_2014_minival",)
17 |   TEST: ("coco_2014_minival",)
18 | INPUT:
19 |   MIN_SIZE_TRAIN: (600,)
20 |   MAX_SIZE_TRAIN: 1000
21 |   MIN_SIZE_TEST: 800
22 |   MAX_SIZE_TEST: 1000
23 | DATALOADER:
24 |   SIZE_DIVISIBILITY: 32
25 | SOLVER:
26 |   BASE_LR: 0.005
27 |   WEIGHT_DECAY: 0.0001
28 |   STEPS: (1500,)
29 |   MAX_ITER: 2000
30 |   IMS_PER_BATCH: 4
31 | TEST:
32 |   IMS_PER_BATCH: 2
33 | 


--------------------------------------------------------------------------------
/PR_inference/configs/retinanet/retinanet_R-101-FPN_1x.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-101"
 4 |   RPN_ONLY: True
 5 |   RETINANET_ON: True
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-101-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   RPN:
11 |     USE_FPN: True
12 |     FG_IOU_THRESHOLD: 0.5
13 |     BG_IOU_THRESHOLD: 0.4
14 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
15 |     PRE_NMS_TOP_N_TRAIN: 2000
16 |     PRE_NMS_TOP_N_TEST: 1000
17 |     POST_NMS_TOP_N_TEST: 1000
18 |     FPN_POST_NMS_TOP_N_TEST: 1000
19 |   ROI_HEADS:
20 |     USE_FPN: True
21 |     BATCH_SIZE_PER_IMAGE: 256
22 |   ROI_BOX_HEAD:
23 |     POOLER_RESOLUTION: 7
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     POOLER_SAMPLING_RATIO: 2
26 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
27 |     PREDICTOR: "FPNPredictor"
28 |   RETINANET:
29 |     SCALES_PER_OCTAVE: 3
30 |     STRADDLE_THRESH: -1
31 |     FG_IOU_THRESHOLD: 0.5
32 |     BG_IOU_THRESHOLD: 0.4
33 | DATASETS:
34 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
35 |   TEST: ("coco_2014_minival",)
36 | INPUT:
37 |   MIN_SIZE_TRAIN: (800, )
38 |   MAX_SIZE_TRAIN: 1333
39 |   MIN_SIZE_TEST: 800
40 |   MAX_SIZE_TEST: 1333
41 | DATALOADER:
42 |   SIZE_DIVISIBILITY: 32
43 | SOLVER:
44 |   # Assume 4 gpus
45 |   BASE_LR: 0.005
46 |   WEIGHT_DECAY: 0.0001
47 |   STEPS: (120000, 160000)
48 |   MAX_ITER: 180000
49 |   IMS_PER_BATCH: 8
50 | 


--------------------------------------------------------------------------------
/PR_inference/configs/retinanet/retinanet_R-101-FPN_P5_1x.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-101"
 4 |   RPN_ONLY: True
 5 |   RETINANET_ON: True
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-101-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   RPN:
11 |     USE_FPN: True
12 |     FG_IOU_THRESHOLD: 0.5
13 |     BG_IOU_THRESHOLD: 0.4
14 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
15 |     PRE_NMS_TOP_N_TRAIN: 2000
16 |     PRE_NMS_TOP_N_TEST: 1000
17 |     POST_NMS_TOP_N_TEST: 1000
18 |     FPN_POST_NMS_TOP_N_TEST: 1000
19 |   ROI_HEADS:
20 |     USE_FPN: True
21 |     BATCH_SIZE_PER_IMAGE: 256
22 |   ROI_BOX_HEAD:
23 |     POOLER_RESOLUTION: 7
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     POOLER_SAMPLING_RATIO: 2
26 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
27 |     PREDICTOR: "FPNPredictor"
28 |   RETINANET:
29 |     SCALES_PER_OCTAVE: 3
30 |     STRADDLE_THRESH: -1
31 |     USE_C5: False
32 |     FG_IOU_THRESHOLD: 0.5
33 |     BG_IOU_THRESHOLD: 0.4
34 | DATASETS:
35 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
36 |   TEST: ("coco_2014_minival",)
37 | INPUT:
38 |   MIN_SIZE_TRAIN: (800, )
39 |   MAX_SIZE_TRAIN: 1333
40 |   MIN_SIZE_TEST: 800
41 |   MAX_SIZE_TEST: 1333
42 | DATALOADER:
43 |   SIZE_DIVISIBILITY: 32
44 | SOLVER:
45 |   # Assume 4 gpus
46 |   BASE_LR: 0.005
47 |   WEIGHT_DECAY: 0.0001
48 |   STEPS: (120000, 160000)
49 |   MAX_ITER: 180000
50 |   IMS_PER_BATCH: 8
51 | 


--------------------------------------------------------------------------------
/PR_inference/configs/retinanet/retinanet_R-50-FPN_1x.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN_ONLY: True
 5 |   RETINANET_ON: True
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-50-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   RPN:
11 |     USE_FPN: True
12 |     FG_IOU_THRESHOLD: 0.5
13 |     BG_IOU_THRESHOLD: 0.4
14 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
15 |     PRE_NMS_TOP_N_TRAIN: 2000
16 |     PRE_NMS_TOP_N_TEST: 1000
17 |     POST_NMS_TOP_N_TEST: 1000
18 |     FPN_POST_NMS_TOP_N_TEST: 1000
19 |   ROI_HEADS:
20 |     USE_FPN: True
21 |     BATCH_SIZE_PER_IMAGE: 256
22 |   ROI_BOX_HEAD:
23 |     POOLER_RESOLUTION: 7
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     POOLER_SAMPLING_RATIO: 2
26 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
27 |     PREDICTOR: "FPNPredictor"
28 |   RETINANET:
29 |     SCALES_PER_OCTAVE: 3
30 |     STRADDLE_THRESH: -1
31 |     FG_IOU_THRESHOLD: 0.5
32 |     BG_IOU_THRESHOLD: 0.4
33 | DATASETS:
34 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
35 |   TEST: ("coco_2014_minival",)
36 | INPUT:
37 |   MIN_SIZE_TRAIN: (800,)
38 |   MAX_SIZE_TRAIN: 1333
39 |   MIN_SIZE_TEST: 800
40 |   MAX_SIZE_TEST: 1333
41 | DATALOADER:
42 |   SIZE_DIVISIBILITY: 32
43 | SOLVER:
44 |   # Assume 4 gpus
45 |   BASE_LR: 0.005
46 |   WEIGHT_DECAY: 0.0001
47 |   STEPS: (120000, 160000)
48 |   MAX_ITER: 180000
49 |   IMS_PER_BATCH: 8
50 | 


--------------------------------------------------------------------------------
/PR_inference/configs/retinanet/retinanet_R-50-FPN_1x_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN_ONLY: True
 5 |   RETINANET_ON: True
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-50-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   RPN:
11 |     USE_FPN: True
12 |     FG_IOU_THRESHOLD: 0.5
13 |     BG_IOU_THRESHOLD: 0.4
14 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
15 |     PRE_NMS_TOP_N_TRAIN: 2000
16 |     PRE_NMS_TOP_N_TEST: 1000
17 |     POST_NMS_TOP_N_TEST: 1000
18 |     FPN_POST_NMS_TOP_N_TEST: 1000
19 |   ROI_HEADS:
20 |     USE_FPN: True
21 |     BATCH_SIZE_PER_IMAGE: 256
22 |   ROI_BOX_HEAD:
23 |     POOLER_RESOLUTION: 7
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     POOLER_SAMPLING_RATIO: 2
26 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
27 |     PREDICTOR: "FPNPredictor"
28 |   RETINANET:
29 |     SCALES_PER_OCTAVE: 3
30 |     STRADDLE_THRESH: -1
31 |     FG_IOU_THRESHOLD: 0.5
32 |     BG_IOU_THRESHOLD: 0.4
33 | DATASETS:
34 |   TRAIN: ("coco_2014_minival",)
35 |   TEST: ("coco_2014_minival",)
36 | INPUT:
37 |   MIN_SIZE_TRAIN: (600,)
38 |   MAX_SIZE_TRAIN: 1000
39 |   MIN_SIZE_TEST: 800
40 |   MAX_SIZE_TEST: 1000
41 | DATALOADER:
42 |   SIZE_DIVISIBILITY: 32
43 | SOLVER:
44 |   BASE_LR: 0.005
45 |   WEIGHT_DECAY: 0.0001
46 |   STEPS: (3500,)
47 |   MAX_ITER: 4000
48 |   IMS_PER_BATCH: 4
49 | 


--------------------------------------------------------------------------------
/PR_inference/configs/retinanet/retinanet_R-50-FPN_P5_1x.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN_ONLY: True
 5 |   RETINANET_ON: True
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-50-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   RPN:
11 |     USE_FPN: True
12 |     FG_IOU_THRESHOLD: 0.5
13 |     BG_IOU_THRESHOLD: 0.4
14 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
15 |     PRE_NMS_TOP_N_TRAIN: 2000
16 |     PRE_NMS_TOP_N_TEST: 1000
17 |     POST_NMS_TOP_N_TEST: 1000
18 |     FPN_POST_NMS_TOP_N_TEST: 1000
19 |   ROI_HEADS:
20 |     USE_FPN: True
21 |     BATCH_SIZE_PER_IMAGE: 256
22 |   ROI_BOX_HEAD:
23 |     POOLER_RESOLUTION: 7
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     POOLER_SAMPLING_RATIO: 2
26 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
27 |     PREDICTOR: "FPNPredictor"
28 |   RETINANET:
29 |     SCALES_PER_OCTAVE: 3
30 |     STRADDLE_THRESH: -1
31 |     USE_C5: False
32 |     FG_IOU_THRESHOLD: 0.5
33 |     BG_IOU_THRESHOLD: 0.4
34 | DATASETS:
35 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
36 |   TEST: ("coco_2014_minival",)
37 | INPUT:
38 |   MIN_SIZE_TRAIN: (800,)
39 |   MAX_SIZE_TRAIN: 1333
40 |   MIN_SIZE_TEST: 800
41 |   MAX_SIZE_TEST: 1333
42 | DATALOADER:
43 |   SIZE_DIVISIBILITY: 32
44 | SOLVER:
45 |   # Assume 4 gpus
46 |   BASE_LR: 0.005
47 |   WEIGHT_DECAY: 0.0001
48 |   STEPS: (120000, 160000)
49 |   MAX_ITER: 180000
50 |   IMS_PER_BATCH: 8
51 | 


--------------------------------------------------------------------------------
/PR_inference/configs/retinanet/retinanet_X_101_32x8d_FPN_1x.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d"
 4 |   RPN_ONLY: True
 5 |   RETINANET_ON: True
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-101-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |     STRIDE_IN_1X1: False
11 |     NUM_GROUPS: 32
12 |     WIDTH_PER_GROUP: 8
13 |   RPN:
14 |     USE_FPN: True
15 |     FG_IOU_THRESHOLD: 0.5
16 |     BG_IOU_THRESHOLD: 0.4
17 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
18 |     PRE_NMS_TOP_N_TRAIN: 2000
19 |     PRE_NMS_TOP_N_TEST: 1000
20 |     POST_NMS_TOP_N_TEST: 1000
21 |     FPN_POST_NMS_TOP_N_TEST: 1000
22 |   ROI_HEADS:
23 |     USE_FPN: True
24 |     BATCH_SIZE_PER_IMAGE: 256
25 |   ROI_BOX_HEAD:
26 |     POOLER_RESOLUTION: 7
27 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
28 |     POOLER_SAMPLING_RATIO: 2
29 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
30 |     PREDICTOR: "FPNPredictor"
31 |   RETINANET:
32 |     SCALES_PER_OCTAVE: 3
33 |     STRADDLE_THRESH: -1
34 |     FG_IOU_THRESHOLD: 0.5
35 |     BG_IOU_THRESHOLD: 0.4
36 | DATASETS:
37 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
38 |   TEST: ("coco_2014_minival",)
39 | INPUT:
40 |   MIN_SIZE_TRAIN: (800, )
41 |   MAX_SIZE_TRAIN: 1333
42 |   MIN_SIZE_TEST: 800
43 |   MAX_SIZE_TEST: 1333
44 | DATALOADER:
45 |   SIZE_DIVISIBILITY: 32
46 | SOLVER:
47 |   # Assume 4 gpus
48 |   BASE_LR: 0.0025
49 |   WEIGHT_DECAY: 0.0001
50 |   STEPS: (240000, 320000)
51 |   MAX_ITER: 360000
52 |   IMS_PER_BATCH: 4
53 | 


--------------------------------------------------------------------------------
/PR_inference/docker/docker-jupyter/jupyter_notebook_config.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | from IPython.lib import passwd
 3 | 
 4 | #c = c  # pylint:disable=undefined-variable
 5 | c = get_config()
 6 | c.NotebookApp.ip = '0.0.0.0'
 7 | c.NotebookApp.port = int(os.getenv('PORT', 8888))
 8 | c.NotebookApp.open_browser = False
 9 | 
10 | # sets a password if PASSWORD is set in the environment
11 | if 'PASSWORD' in os.environ:
12 |   password = os.environ['PASSWORD']
13 |   if password:
14 |     c.NotebookApp.password = passwd(password)
15 |   else:
16 |     c.NotebookApp.password = ''
17 |     c.NotebookApp.token = ''
18 |   del os.environ['PASSWORD']
19 | 


--------------------------------------------------------------------------------
/PR_inference/inference/buildings_val/predictions.pth:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PR_inference/inference/buildings_val/predictions.pth


--------------------------------------------------------------------------------
/PR_inference/last_checkpoint:
--------------------------------------------------------------------------------
1 | ./model_0027500.pth


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/config/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .defaults import _C as cfg
3 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/csrc/ROIPool.h:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #pragma once
 3 | 
 4 | #include "cpu/vision.h"
 5 | 
 6 | #ifdef WITH_CUDA
 7 | #include "cuda/vision.h"
 8 | #endif
 9 | 
10 | 
11 | std::tuple<at::Tensor, at::Tensor> ROIPool_forward(const at::Tensor& input,
12 |                                 const at::Tensor& rois,
13 |                                 const float spatial_scale,
14 |                                 const int pooled_height,
15 |                                 const int pooled_width) {
16 |   if (input.type().is_cuda()) {
17 | #ifdef WITH_CUDA
18 |     return ROIPool_forward_cuda(input, rois, spatial_scale, pooled_height, pooled_width);
19 | #else
20 |     AT_ERROR("Not compiled with GPU support");
21 | #endif
22 |   }
23 |   AT_ERROR("Not implemented on the CPU");
24 | }
25 | 
26 | at::Tensor ROIPool_backward(const at::Tensor& grad,
27 |                                  const at::Tensor& input,
28 |                                  const at::Tensor& rois,
29 |                                  const at::Tensor& argmax,
30 |                                  const float spatial_scale,
31 |                                  const int pooled_height,
32 |                                  const int pooled_width,
33 |                                  const int batch_size,
34 |                                  const int channels,
35 |                                  const int height,
36 |                                  const int width) {
37 |   if (grad.type().is_cuda()) {
38 | #ifdef WITH_CUDA
39 |     return ROIPool_backward_cuda(grad, input, rois, argmax, spatial_scale, pooled_height, pooled_width, batch_size, channels, height, width);
40 | #else
41 |     AT_ERROR("Not compiled with GPU support");
42 | #endif
43 |   }
44 |   AT_ERROR("Not implemented on the CPU");
45 | }
46 | 
47 | 
48 | 
49 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/csrc/SigmoidFocalLoss.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include "cpu/vision.h"
 4 | 
 5 | #ifdef WITH_CUDA
 6 | #include "cuda/vision.h"
 7 | #endif
 8 | 
 9 | // Interface for Python
10 | at::Tensor SigmoidFocalLoss_forward(
11 | 		const at::Tensor& logits,
12 |                 const at::Tensor& targets,
13 | 		const int num_classes, 
14 | 		const float gamma, 
15 | 		const float alpha) {
16 |   if (logits.type().is_cuda()) {
17 | #ifdef WITH_CUDA
18 |     return SigmoidFocalLoss_forward_cuda(logits, targets, num_classes, gamma, alpha);
19 | #else
20 |     AT_ERROR("Not compiled with GPU support");
21 | #endif
22 |   }
23 |   AT_ERROR("Not implemented on the CPU");
24 | }
25 | 
26 | at::Tensor SigmoidFocalLoss_backward(
27 | 			     const at::Tensor& logits,
28 |                              const at::Tensor& targets,
29 | 			     const at::Tensor& d_losses,
30 | 			     const int num_classes,
31 | 			     const float gamma,
32 | 			     const float alpha) {
33 |   if (logits.type().is_cuda()) {
34 | #ifdef WITH_CUDA
35 |     return SigmoidFocalLoss_backward_cuda(logits, targets, d_losses, num_classes, gamma, alpha);
36 | #else
37 |     AT_ERROR("Not compiled with GPU support");
38 | #endif
39 |   }
40 |   AT_ERROR("Not implemented on the CPU");
41 | }
42 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/csrc/cpu/vision.h:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #pragma once
 3 | #include <torch/extension.h>
 4 | 
 5 | 
 6 | at::Tensor ROIAlign_forward_cpu(const at::Tensor& input,
 7 |                                 const at::Tensor& rois,
 8 |                                 const float spatial_scale,
 9 |                                 const int pooled_height,
10 |                                 const int pooled_width,
11 |                                 const int sampling_ratio);
12 | 
13 | 
14 | at::Tensor nms_cpu(const at::Tensor& dets,
15 |                    const at::Tensor& scores,
16 |                    const float threshold);
17 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/csrc/nms.h:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #pragma once
 3 | #include "cpu/vision.h"
 4 | 
 5 | #ifdef WITH_CUDA
 6 | #include "cuda/vision.h"
 7 | #endif
 8 | 
 9 | 
10 | at::Tensor nms(const at::Tensor& dets,
11 |                const at::Tensor& scores,
12 |                const float threshold) {
13 | 
14 |   if (dets.type().is_cuda()) {
15 | #ifdef WITH_CUDA
16 |     // TODO raise error if not compiled with CUDA
17 |     if (dets.numel() == 0)
18 |       return at::empty({0}, dets.options().dtype(at::kLong).device(at::kCPU));
19 |     auto b = at::cat({dets, scores.unsqueeze(1)}, 1);
20 |     return nms_cuda(b, threshold);
21 | #else
22 |     AT_ERROR("Not compiled with GPU support");
23 | #endif
24 |   }
25 | 
26 |   at::Tensor result = nms_cpu(dets, scores, threshold);
27 |   return result;
28 | }
29 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/csrc/vision.cpp:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #include "nms.h"
 3 | #include "ROIAlign.h"
 4 | #include "ROIPool.h"
 5 | #include "SigmoidFocalLoss.h"
 6 | 
 7 | PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
 8 |   m.def("nms", &nms, "non-maximum suppression");
 9 |   m.def("roi_align_forward", &ROIAlign_forward, "ROIAlign_forward");
10 |   m.def("roi_align_backward", &ROIAlign_backward, "ROIAlign_backward");
11 |   m.def("roi_pool_forward", &ROIPool_forward, "ROIPool_forward");
12 |   m.def("roi_pool_backward", &ROIPool_backward, "ROIPool_backward");
13 |   m.def("sigmoid_focalloss_forward", &SigmoidFocalLoss_forward, "SigmoidFocalLoss_forward");
14 |   m.def("sigmoid_focalloss_backward", &SigmoidFocalLoss_backward, "SigmoidFocalLoss_backward");
15 | }
16 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .build import make_data_loader
3 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/collate_batch.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from maskrcnn_benchmark.structures.image_list import to_image_list
 3 | 
 4 | 
 5 | class BatchCollator(object):
 6 |     """
 7 |     From a list of samples from the dataset,
 8 |     returns the batched images and targets.
 9 |     This should be passed to the DataLoader
10 |     """
11 | 
12 |     def __init__(self, size_divisible=0):
13 |         self.size_divisible = size_divisible
14 | 
15 |     def __call__(self, batch):
16 |         transposed_batch = list(zip(*batch))
17 |         images = to_image_list(transposed_batch[0], self.size_divisible)
18 |         targets = transposed_batch[1]
19 |         img_ids = transposed_batch[2]
20 |         return images, targets, img_ids
21 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/datasets/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .coco import COCODataset
3 | from .voc import PascalVOCDataset
4 | from .buildings import BuildingsDataset
5 | from .concat_dataset import ConcatDataset
6 | 
7 | __all__ = ["COCODataset", "ConcatDataset", "PascalVOCDataset", "BuildingsDataset"]
8 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/datasets/concat_dataset.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import bisect
 3 | 
 4 | from torch.utils.data.dataset import ConcatDataset as _ConcatDataset
 5 | 
 6 | 
 7 | class ConcatDataset(_ConcatDataset):
 8 |     """
 9 |     Same as torch.utils.data.dataset.ConcatDataset, but exposes an extra
10 |     method for querying the sizes of the image
11 |     """
12 | 
13 |     def get_idxs(self, idx):
14 |         dataset_idx = bisect.bisect_right(self.cumulative_sizes, idx)
15 |         if dataset_idx == 0:
16 |             sample_idx = idx
17 |         else:
18 |             sample_idx = idx - self.cumulative_sizes[dataset_idx - 1]
19 |         return dataset_idx, sample_idx
20 | 
21 |     def get_img_info(self, idx):
22 |         dataset_idx, sample_idx = self.get_idxs(idx)
23 |         return self.datasets[dataset_idx].get_img_info(sample_idx)
24 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/datasets/evaluation/__init__.py:
--------------------------------------------------------------------------------
 1 | from maskrcnn_benchmark.data import datasets
 2 | 
 3 | from .coco import coco_evaluation
 4 | from .voc import voc_evaluation
 5 | from .buildings import buildings_evaluation
 6 | 
 7 | def evaluate(dataset, predictions, output_folder, **kwargs):
 8 |     """evaluate dataset using different methods based on dataset type.
 9 |     Args:
10 |         dataset: Dataset object
11 |         predictions(list[BoxList]): each item in the list represents the
12 |             prediction results for one image.
13 |         output_folder: output folder, to save evaluation files or results.
14 |         **kwargs: other args.
15 |     Returns:
16 |         evaluation result
17 |     """
18 |     args = dict(
19 |         dataset=dataset, predictions=predictions, output_folder=output_folder, **kwargs
20 |     )
21 |     if isinstance(dataset, datasets.COCODataset):
22 |         return coco_evaluation(**args)
23 |     elif isinstance(dataset, datasets.PascalVOCDataset):
24 |         return voc_evaluation(**args)
25 |     elif isinstance(dataset, datasets.BuildingsDataset):
26 |         return buildings_evaluation(**args)
27 |     else:
28 |         dataset_name = dataset.__class__.__name__
29 |         raise NotImplementedError("Unsupported dataset type {}.".format(dataset_name))
30 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/datasets/evaluation/buildings/__init__.py:
--------------------------------------------------------------------------------
 1 | from .buildings_eval import do_buildings_evaluation
 2 | 
 3 | 
 4 | def buildings_evaluation(
 5 |     dataset,
 6 |     predictions,
 7 |     output_folder,
 8 |     box_only,
 9 |     iou_types,
10 |     expected_results,
11 |     expected_results_sigma_tol,
12 | ):
13 |     return do_buildings_evaluation(
14 |         dataset=dataset,
15 |         predictions=predictions,
16 |         box_only=box_only,
17 |         output_folder=output_folder,
18 |         iou_types=iou_types,
19 |         expected_results=expected_results,
20 |         expected_results_sigma_tol=expected_results_sigma_tol
21 |     )
22 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/datasets/evaluation/coco/__init__.py:
--------------------------------------------------------------------------------
 1 | from .coco_eval import do_coco_evaluation
 2 | 
 3 | 
 4 | def coco_evaluation(
 5 |     dataset,
 6 |     predictions,
 7 |     output_folder,
 8 |     box_only,
 9 |     iou_types,
10 |     expected_results,
11 |     expected_results_sigma_tol,
12 | ):
13 |     return do_coco_evaluation(
14 |         dataset=dataset,
15 |         predictions=predictions,
16 |         box_only=box_only,
17 |         output_folder=output_folder,
18 |         iou_types=iou_types,
19 |         expected_results=expected_results,
20 |         expected_results_sigma_tol=expected_results_sigma_tol,
21 |     )
22 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/datasets/evaluation/voc/__init__.py:
--------------------------------------------------------------------------------
 1 | import logging
 2 | 
 3 | from .voc_eval import do_voc_evaluation
 4 | 
 5 | 
 6 | def voc_evaluation(dataset, predictions, output_folder, box_only, **_):
 7 |     logger = logging.getLogger("maskrcnn_benchmark.inference")
 8 |     if box_only:
 9 |         logger.warning("voc evaluation doesn't support box_only, ignored.")
10 |     logger.info("performing voc evaluation, ignored iou_types.")
11 |     return do_voc_evaluation(
12 |         dataset=dataset,
13 |         predictions=predictions,
14 |         output_folder=output_folder,
15 |         logger=logger,
16 |     )
17 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/datasets/list_dataset.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | """
 3 | Simple dataset class that wraps a list of path names
 4 | """
 5 | 
 6 | from PIL import Image
 7 | 
 8 | from maskrcnn_benchmark.structures.bounding_box import BoxList
 9 | 
10 | 
11 | class ListDataset(object):
12 |     def __init__(self, image_lists, transforms=None):
13 |         self.image_lists = image_lists
14 |         self.transforms = transforms
15 | 
16 |     def __getitem__(self, item):
17 |         img = Image.open(self.image_lists[item]).convert("RGB")
18 | 
19 |         # dummy target
20 |         w, h = img.size
21 |         target = BoxList([[0, 0, w, h]], img.size, mode="xyxy")
22 | 
23 |         if self.transforms is not None:
24 |             img, target = self.transforms(img, target)
25 | 
26 |         return img, target
27 | 
28 |     def __len__(self):
29 |         return len(self.image_lists)
30 | 
31 |     def get_img_info(self, item):
32 |         """
33 |         Return the image dimensions for the image, without
34 |         loading and pre-processing it
35 |         """
36 |         pass
37 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/samplers/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .distributed import DistributedSampler
3 | from .grouped_batch_sampler import GroupedBatchSampler
4 | from .iteration_based_batch_sampler import IterationBasedBatchSampler
5 | 
6 | __all__ = ["DistributedSampler", "GroupedBatchSampler", "IterationBasedBatchSampler"]
7 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/samplers/iteration_based_batch_sampler.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from torch.utils.data.sampler import BatchSampler
 3 | 
 4 | 
 5 | class IterationBasedBatchSampler(BatchSampler):
 6 |     """
 7 |     Wraps a BatchSampler, resampling from it until
 8 |     a specified number of iterations have been sampled
 9 |     """
10 | 
11 |     def __init__(self, batch_sampler, num_iterations, start_iter=0):
12 |         self.batch_sampler = batch_sampler
13 |         self.num_iterations = num_iterations
14 |         self.start_iter = start_iter
15 | 
16 |     def __iter__(self):
17 |         iteration = self.start_iter
18 |         while iteration <= self.num_iterations:
19 |             # if the underlying sampler has a set_epoch method, like
20 |             # DistributedSampler, used for making each process see
21 |             # a different split of the dataset, then set it
22 |             if hasattr(self.batch_sampler.sampler, "set_epoch"):
23 |                 self.batch_sampler.sampler.set_epoch(iteration)
24 |             for batch in self.batch_sampler:
25 |                 iteration += 1
26 |                 if iteration > self.num_iterations:
27 |                     break
28 |                 yield batch
29 | 
30 |     def __len__(self):
31 |         return self.num_iterations
32 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/transforms/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .transforms import Compose
3 | from .transforms import Resize
4 | from .transforms import RandomHorizontalFlip
5 | from .transforms import ToTensor
6 | from .transforms import Normalize
7 | 
8 | from .build import build_transforms
9 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/data/transforms/build.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from . import transforms as T
 3 | 
 4 | 
 5 | def build_transforms(cfg, is_train=True):
 6 |     if is_train:
 7 |         min_size = cfg.INPUT.MIN_SIZE_TRAIN
 8 |         max_size = cfg.INPUT.MAX_SIZE_TRAIN
 9 |         flip_prob = 0.5  # cfg.INPUT.FLIP_PROB_TRAIN
10 |     else:
11 |         min_size = cfg.INPUT.MIN_SIZE_TEST
12 |         max_size = cfg.INPUT.MAX_SIZE_TEST
13 |         flip_prob = 0
14 | 
15 |     to_bgr255 = cfg.INPUT.TO_BGR255
16 |     normalize_transform = T.Normalize(
17 |         mean=cfg.INPUT.PIXEL_MEAN, std=cfg.INPUT.PIXEL_STD, to_bgr255=to_bgr255
18 |     )
19 | 
20 |     transform = T.Compose(
21 |         [
22 |             T.Resize(min_size, max_size),
23 |             T.RandomHorizontalFlip(flip_prob),
24 |             T.ToTensor(),
25 |             normalize_transform,
26 |         ]
27 |     )
28 |     return transform
29 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/engine/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/layers/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | from .batch_norm import FrozenBatchNorm2d
 5 | from .misc import Conv2d
 6 | from .misc import ConvTranspose2d
 7 | from .misc import BatchNorm2d
 8 | from .misc import interpolate
 9 | from .nms import nms
10 | from .roi_align import ROIAlign
11 | from .roi_align import roi_align
12 | from .roi_pool import ROIPool
13 | from .roi_pool import roi_pool
14 | from .smooth_l1_loss import smooth_l1_loss
15 | from .sigmoid_focal_loss import SigmoidFocalLoss
16 | 
17 | __all__ = ["nms", "roi_align", "ROIAlign", "roi_pool", "ROIPool",
18 |            "smooth_l1_loss", "Conv2d", "ConvTranspose2d", "interpolate",
19 |            "BatchNorm2d", "FrozenBatchNorm2d", "SigmoidFocalLoss"
20 |           ]
21 | 
22 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/layers/_utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import glob
 3 | import os.path
 4 | 
 5 | import torch
 6 | 
 7 | try:
 8 |     from torch.utils.cpp_extension import load as load_ext
 9 |     from torch.utils.cpp_extension import CUDA_HOME
10 | except ImportError:
11 |     raise ImportError("The cpp layer extensions requires PyTorch 0.4 or higher")
12 | 
13 | 
14 | def _load_C_extensions():
15 |     this_dir = os.path.dirname(os.path.abspath(__file__))
16 |     this_dir = os.path.dirname(this_dir)
17 |     this_dir = os.path.join(this_dir, "csrc")
18 | 
19 |     main_file = glob.glob(os.path.join(this_dir, "*.cpp"))
20 |     source_cpu = glob.glob(os.path.join(this_dir, "cpu", "*.cpp"))
21 |     source_cuda = glob.glob(os.path.join(this_dir, "cuda", "*.cu"))
22 | 
23 |     source = main_file + source_cpu
24 | 
25 |     extra_cflags = []
26 |     if torch.cuda.is_available() and CUDA_HOME is not None:
27 |         source.extend(source_cuda)
28 |         extra_cflags = ["-DWITH_CUDA"]
29 |     source = [os.path.join(this_dir, s) for s in source]
30 |     extra_include_paths = [this_dir]
31 |     return load_ext(
32 |         "torchvision",
33 |         source,
34 |         extra_cflags=extra_cflags,
35 |         extra_include_paths=extra_include_paths,
36 |     )
37 | 
38 | 
39 | _C = _load_C_extensions()
40 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/layers/batch_norm.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | from torch import nn
 4 | 
 5 | 
 6 | class FrozenBatchNorm2d(nn.Module):
 7 |     """
 8 |     BatchNorm2d where the batch statistics and the affine parameters
 9 |     are fixed
10 |     """
11 | 
12 |     def __init__(self, n):
13 |         super(FrozenBatchNorm2d, self).__init__()
14 |         self.register_buffer("weight", torch.ones(n))
15 |         self.register_buffer("bias", torch.zeros(n))
16 |         self.register_buffer("running_mean", torch.zeros(n))
17 |         self.register_buffer("running_var", torch.ones(n))
18 | 
19 |     def forward(self, x):
20 |         scale = self.weight * self.running_var.rsqrt()
21 |         bias = self.bias - self.running_mean * scale
22 |         scale = scale.reshape(1, -1, 1, 1)
23 |         bias = bias.reshape(1, -1, 1, 1)
24 |         return x * scale + bias
25 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/layers/nms.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | # from ._utils import _C
3 | from maskrcnn_benchmark import _C
4 | 
5 | nms = _C.nms
6 | # nms.__doc__ = """
7 | # This function performs Non-maximum suppresion"""
8 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/layers/smooth_l1_loss.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | 
 5 | # TODO maybe push this to nn?
 6 | def smooth_l1_loss(input, target, beta=1. / 9, size_average=True):
 7 |     """
 8 |     very similar to the smooth_l1_loss from pytorch, but with
 9 |     the extra beta parameter
10 |     """
11 |     n = torch.abs(input - target)
12 |     cond = n < beta
13 |     loss = torch.where(cond, 0.5 * n ** 2 / beta, n - 0.5 * beta)
14 |     if size_average:
15 |         return loss.mean()
16 |     return loss.sum()
17 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PR_inference/maskrcnn_benchmark/modeling/__init__.py


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/backbone/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .backbone import build_backbone
3 | from . import fbnet
4 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/detector/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .detectors import build_detection_model
3 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/detector/detectors.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from .generalized_rcnn import GeneralizedRCNN
 3 | 
 4 | 
 5 | _DETECTION_META_ARCHITECTURES = {"GeneralizedRCNN": GeneralizedRCNN}
 6 | 
 7 | 
 8 | def build_detection_model(cfg):
 9 |     meta_arch = _DETECTION_META_ARCHITECTURES[cfg.MODEL.META_ARCHITECTURE]
10 |     return meta_arch(cfg)
11 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/registry.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | from maskrcnn_benchmark.utils.registry import Registry
 4 | 
 5 | BACKBONES = Registry()
 6 | RPN_HEADS = Registry()
 7 | ROI_BOX_FEATURE_EXTRACTORS = Registry()
 8 | ROI_BOX_PREDICTOR = Registry()
 9 | ROI_KEYPOINT_FEATURE_EXTRACTORS = Registry()
10 | ROI_KEYPOINT_PREDICTOR = Registry()
11 | ROI_MASK_FEATURE_EXTRACTORS = Registry()
12 | ROI_MASK_PREDICTOR = Registry()
13 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/roi_heads/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PR_inference/maskrcnn_benchmark/modeling/roi_heads/__init__.py


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/roi_heads/box_head/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PR_inference/maskrcnn_benchmark/modeling/roi_heads/box_head/__init__.py


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/roi_heads/keypoint_head/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PR_inference/maskrcnn_benchmark/modeling/roi_heads/keypoint_head/__init__.py


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/roi_heads/keypoint_head/roi_keypoint_predictors.py:
--------------------------------------------------------------------------------
 1 | from torch import nn
 2 | 
 3 | from maskrcnn_benchmark import layers
 4 | from maskrcnn_benchmark.modeling import registry
 5 | 
 6 | 
 7 | @registry.ROI_KEYPOINT_PREDICTOR.register("KeypointRCNNPredictor")
 8 | class KeypointRCNNPredictor(nn.Module):
 9 |     def __init__(self, cfg, in_channels):
10 |         super(KeypointRCNNPredictor, self).__init__()
11 |         input_features = in_channels
12 |         num_keypoints = cfg.MODEL.ROI_KEYPOINT_HEAD.NUM_CLASSES
13 |         deconv_kernel = 4
14 |         self.kps_score_lowres = layers.ConvTranspose2d(
15 |             input_features,
16 |             num_keypoints,
17 |             deconv_kernel,
18 |             stride=2,
19 |             padding=deconv_kernel // 2 - 1,
20 |         )
21 |         nn.init.kaiming_normal_(
22 |             self.kps_score_lowres.weight, mode="fan_out", nonlinearity="relu"
23 |         )
24 |         nn.init.constant_(self.kps_score_lowres.bias, 0)
25 |         self.up_scale = 2
26 |         self.out_channels = num_keypoints
27 | 
28 |     def forward(self, x):
29 |         x = self.kps_score_lowres(x)
30 |         x = layers.interpolate(
31 |             x, scale_factor=self.up_scale, mode="bilinear", align_corners=False
32 |         )
33 |         return x
34 | 
35 | 
36 | def make_roi_keypoint_predictor(cfg, in_channels):
37 |     func = registry.ROI_KEYPOINT_PREDICTOR[cfg.MODEL.ROI_KEYPOINT_HEAD.PREDICTOR]
38 |     return func(cfg, in_channels)
39 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/roi_heads/mask_head/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PR_inference/maskrcnn_benchmark/modeling/roi_heads/mask_head/__init__.py


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/rpn/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | # from .rpn import build_rpn
3 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/rpn/retinanet/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PR_inference/maskrcnn_benchmark/modeling/rpn/retinanet/__init__.py


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/modeling/utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | """
 3 | Miscellaneous utility functions
 4 | """
 5 | 
 6 | import torch
 7 | 
 8 | 
 9 | def cat(tensors, dim=0):
10 |     """
11 |     Efficient version of torch.cat that avoids a copy if there is only a single element in a list
12 |     """
13 |     assert isinstance(tensors, (list, tuple))
14 |     if len(tensors) == 1:
15 |         return tensors[0]
16 |     return torch.cat(tensors, dim)
17 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/solver/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .build import make_optimizer
3 | from .build import make_lr_scheduler
4 | from .lr_scheduler import WarmupMultiStepLR
5 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/solver/build.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | from .lr_scheduler import WarmupMultiStepLR
 5 | 
 6 | 
 7 | def make_optimizer(cfg, model):
 8 |     params = []
 9 |     for key, value in model.named_parameters():
10 |         if not value.requires_grad:
11 |             continue
12 |         lr = cfg.SOLVER.BASE_LR
13 |         weight_decay = cfg.SOLVER.WEIGHT_DECAY
14 |         if "bias" in key:
15 |             lr = cfg.SOLVER.BASE_LR * cfg.SOLVER.BIAS_LR_FACTOR
16 |             weight_decay = cfg.SOLVER.WEIGHT_DECAY_BIAS
17 |         params += [{"params": [value], "lr": lr, "weight_decay": weight_decay}]
18 | 
19 |     optimizer = torch.optim.SGD(params, lr, momentum=cfg.SOLVER.MOMENTUM)
20 |     return optimizer
21 | 
22 | 
23 | def make_lr_scheduler(cfg, optimizer):
24 |     return WarmupMultiStepLR(
25 |         optimizer,
26 |         cfg.SOLVER.STEPS,
27 |         cfg.SOLVER.GAMMA,
28 |         warmup_factor=cfg.SOLVER.WARMUP_FACTOR,
29 |         warmup_iters=cfg.SOLVER.WARMUP_ITERS,
30 |         warmup_method=cfg.SOLVER.WARMUP_METHOD,
31 |     )
32 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/structures/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PR_inference/maskrcnn_benchmark/structures/__init__.py


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/utils/README.md:
--------------------------------------------------------------------------------
1 | # Utility functions
2 | 
3 | This folder contain utility functions that are not used in the
4 | core library, but are useful for building models or training
5 | code using the config system.
6 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/utils/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/PR_inference/maskrcnn_benchmark/utils/__init__.py


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/utils/collect_env.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import PIL
 3 | 
 4 | from torch.utils.collect_env import get_pretty_env_info
 5 | 
 6 | 
 7 | def get_pil_version():
 8 |     return "\n        Pillow ({})".format(PIL.__version__)
 9 | 
10 | 
11 | def collect_env_info():
12 |     env_str = get_pretty_env_info()
13 |     env_str += get_pil_version()
14 |     return env_str
15 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/utils/cv2_util.py:
--------------------------------------------------------------------------------
 1 | """
 2 | Module for cv2 utility functions and maintaining version compatibility
 3 | between 3.x and 4.x
 4 | """
 5 | import cv2
 6 | 
 7 | 
 8 | def findContours(*args, **kwargs):
 9 |     """
10 |     Wraps cv2.findContours to maintain compatiblity between versions
11 |     3 and 4
12 | 
13 |     Returns:
14 |         contours, hierarchy
15 |     """
16 |     if cv2.__version__.startswith('4'):
17 |         contours, hierarchy = cv2.findContours(*args, **kwargs)
18 |     elif cv2.__version__.startswith('3'):
19 |         _, contours, hierarchy = cv2.findContours(*args, **kwargs)
20 |     else:
21 |         raise AssertionError(
22 |             'cv2 must be either version 3 or 4 to call this method')
23 | 
24 |     return contours, hierarchy
25 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/utils/env.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import os
 3 | 
 4 | from maskrcnn_benchmark.utils.imports import import_file
 5 | 
 6 | 
 7 | def setup_environment():
 8 |     """Perform environment setup work. The default setup is a no-op, but this
 9 |     function allows the user to specify a Python source file that performs
10 |     custom setup work that may be necessary to their computing environment.
11 |     """
12 |     custom_module_path = os.environ.get("TORCH_DETECTRON_ENV_MODULE")
13 |     if custom_module_path:
14 |         setup_custom_environment(custom_module_path)
15 |     else:
16 |         # The default setup is a no-op
17 |         pass
18 | 
19 | 
20 | def setup_custom_environment(custom_module_path):
21 |     """Load custom environment setup from a Python source file and run the setup
22 |     function.
23 |     """
24 |     module = import_file("maskrcnn_benchmark.utils.env.custom_module", custom_module_path)
25 |     assert hasattr(module, "setup_environment") and callable(
26 |         module.setup_environment
27 |     ), (
28 |         "Custom environment module defined in {} does not have the "
29 |         "required callable attribute 'setup_environment'."
30 |     ).format(
31 |         custom_module_path
32 |     )
33 |     module.setup_environment()
34 | 
35 | 
36 | # Force environment setup when this module is imported
37 | setup_environment()
38 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/utils/imports.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | if torch._six.PY3:
 5 |     import importlib
 6 |     import importlib.util
 7 |     import sys
 8 | 
 9 | 
10 |     # from https://stackoverflow.com/questions/67631/how-to-import-a-module-given-the-full-path?utm_medium=organic&utm_source=google_rich_qa&utm_campaign=google_rich_qa
11 |     def import_file(module_name, file_path, make_importable=False):
12 |         spec = importlib.util.spec_from_file_location(module_name, file_path)
13 |         module = importlib.util.module_from_spec(spec)
14 |         spec.loader.exec_module(module)
15 |         if make_importable:
16 |             sys.modules[module_name] = module
17 |         return module
18 | else:
19 |     import imp
20 | 
21 |     def import_file(module_name, file_path, make_importable=None):
22 |         module = imp.load_source(module_name, file_path)
23 |         return module
24 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/utils/logger.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import logging
 3 | import os
 4 | import sys
 5 | 
 6 | 
 7 | def setup_logger(name, save_dir, distributed_rank, filename="log.txt"):
 8 |     logger = logging.getLogger(name)
 9 |     logger.setLevel(logging.DEBUG)
10 |     # don't log results for the non-master process
11 |     if distributed_rank > 0:
12 |         return logger
13 |     ch = logging.StreamHandler(stream=sys.stdout)
14 |     ch.setLevel(logging.DEBUG)
15 |     formatter = logging.Formatter("%(asctime)s %(name)s %(levelname)s: %(message)s")
16 |     ch.setFormatter(formatter)
17 |     logger.addHandler(ch)
18 | 
19 |     if save_dir:
20 |         fh = logging.FileHandler(os.path.join(save_dir, filename))
21 |         fh.setLevel(logging.DEBUG)
22 |         fh.setFormatter(formatter)
23 |         logger.addHandler(fh)
24 | 
25 |     return logger
26 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/utils/miscellaneous.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import errno
 3 | import os
 4 | 
 5 | 
 6 | def mkdir(path):
 7 |     try:
 8 |         os.makedirs(path)
 9 |     except OSError as e:
10 |         if e.errno != errno.EEXIST:
11 |             raise
12 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/utils/registry.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | 
 4 | def _register_generic(module_dict, module_name, module):
 5 |     assert module_name not in module_dict
 6 |     module_dict[module_name] = module
 7 | 
 8 | 
 9 | class Registry(dict):
10 |     '''
11 |     A helper class for managing registering modules, it extends a dictionary
12 |     and provides a register functions.
13 | 
14 |     Eg. creeting a registry:
15 |         some_registry = Registry({"default": default_module})
16 | 
17 |     There're two ways of registering new modules:
18 |     1): normal way is just calling register function:
19 |         def foo():
20 |             ...
21 |         some_registry.register("foo_module", foo)
22 |     2): used as decorator when declaring the module:
23 |         @some_registry.register("foo_module")
24 |         @some_registry.register("foo_modeul_nickname")
25 |         def foo():
26 |             ...
27 | 
28 |     Access of module is just like using a dictionary, eg:
29 |         f = some_registry["foo_modeul"]
30 |     '''
31 |     def __init__(self, *args, **kwargs):
32 |         super(Registry, self).__init__(*args, **kwargs)
33 | 
34 |     def register(self, module_name, module=None):
35 |         # used as function call
36 |         if module is not None:
37 |             _register_generic(self, module_name, module)
38 |             return
39 | 
40 |         # used as decorator
41 |         def register_fn(fn):
42 |             _register_generic(self, module_name, fn)
43 |             return fn
44 | 
45 |         return register_fn
46 | 


--------------------------------------------------------------------------------
/PR_inference/maskrcnn_benchmark/utils/timer.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | 
 4 | import time
 5 | import datetime
 6 | 
 7 | 
 8 | class Timer(object):
 9 |     def __init__(self):
10 |         self.reset()
11 | 
12 |     @property
13 |     def average_time(self):
14 |         return self.total_time / self.calls if self.calls > 0 else 0.0
15 | 
16 |     def tic(self):
17 |         # using time.time instead of time.clock because time time.clock
18 |         # does not normalize for multithreading
19 |         self.start_time = time.time()
20 | 
21 |     def toc(self, average=True):
22 |         self.add(time.time() - self.start_time)
23 |         if average:
24 |             return self.average_time
25 |         else:
26 |             return self.diff
27 | 
28 |     def add(self, time_diff):
29 |         self.diff = time_diff
30 |         self.total_time += self.diff
31 |         self.calls += 1
32 | 
33 |     def reset(self):
34 |         self.total_time = 0.0
35 |         self.calls = 0
36 |         self.start_time = 0.0
37 |         self.diff = 0.0
38 | 
39 |     def avg_time_str(self):
40 |         time_str = str(datetime.timedelta(seconds=self.average_time))
41 |         return time_str
42 | 
43 | 
44 | def get_time_str(time_diff):
45 |     time_str = str(datetime.timedelta(seconds=time_diff))
46 |     return time_str
47 | 


--------------------------------------------------------------------------------
/PR_inference/requirements.txt:
--------------------------------------------------------------------------------
1 | ninja
2 | yacs
3 | cython
4 | matplotlib
5 | tqdm
6 | 


--------------------------------------------------------------------------------
/PR_inference/tests/env_tests/env.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | import os
 4 | 
 5 | 
 6 | def get_config_root_path():
 7 |     ''' Path to configs for unit tests '''
 8 |     # cur_file_dir is root/tests/env_tests
 9 |     cur_file_dir = os.path.dirname(os.path.abspath(os.path.realpath(__file__)))
10 |     ret = os.path.dirname(os.path.dirname(cur_file_dir))
11 |     ret = os.path.join(ret, "configs")
12 |     return ret
13 | 


--------------------------------------------------------------------------------
/PR_inference/tests/test_configs.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | import unittest
 4 | import glob
 5 | import os
 6 | import utils
 7 | 
 8 | 
 9 | class TestConfigs(unittest.TestCase):
10 |     def test_configs_load(self):
11 |         ''' Make sure configs are loadable '''
12 | 
13 |         cfg_root_path = utils.get_config_root_path()
14 |         files = glob.glob(
15 |             os.path.join(cfg_root_path, "./**/*.yaml"), recursive=True)
16 |         self.assertGreater(len(files), 0)
17 | 
18 |         for fn in files:
19 |             print('Loading {}...'.format(fn))
20 |             utils.load_config_from_file(fn)
21 | 
22 | 
23 | if __name__ == "__main__":
24 |     unittest.main()
25 | 


--------------------------------------------------------------------------------
/PR_inference/tests/test_metric_logger.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import unittest
 3 | 
 4 | from maskrcnn_benchmark.utils.metric_logger import MetricLogger
 5 | 
 6 | 
 7 | class TestMetricLogger(unittest.TestCase):
 8 |     def test_update(self):
 9 |         meter = MetricLogger()
10 |         for i in range(10):
11 |             meter.update(metric=float(i))
12 |         
13 |         m = meter.meters["metric"]
14 |         self.assertEqual(m.count, 10)
15 |         self.assertEqual(m.total, 45)
16 |         self.assertEqual(m.median, 4)
17 |         self.assertEqual(m.avg, 4.5)
18 | 
19 |     def test_no_attr(self):
20 |         meter = MetricLogger()
21 |         _ = meter.meters
22 |         _ = meter.delimiter
23 |         def broken():
24 |             _ = meter.not_existent
25 |         self.assertRaises(AttributeError, broken)
26 | 
27 | if __name__ == "__main__":
28 |     unittest.main()
29 | 


--------------------------------------------------------------------------------
/PR_inference/tests/utils.py:
--------------------------------------------------------------------------------
 1 | from __future__ import absolute_import, division, print_function, unicode_literals
 2 | 
 3 | # Set up custom environment before nearly anything else is imported
 4 | # NOTE: this should be the first import (no not reorder)
 5 | from maskrcnn_benchmark.utils.env import setup_environment  # noqa F401 isort:skip
 6 | import env_tests.env as env_tests
 7 | 
 8 | import os
 9 | import copy
10 | 
11 | from maskrcnn_benchmark.config import cfg as g_cfg
12 | 
13 | 
14 | def get_config_root_path():
15 |     return env_tests.get_config_root_path()
16 | 
17 | 
18 | def load_config(rel_path):
19 |     ''' Load config from file path specified as path relative to config_root '''
20 |     cfg_path = os.path.join(env_tests.get_config_root_path(), rel_path)
21 |     return load_config_from_file(cfg_path)
22 | 
23 | 
24 | def load_config_from_file(file_path):
25 |     ''' Load config from file path specified as absolute path '''
26 |     ret = copy.deepcopy(g_cfg)
27 |     ret.merge_from_file(file_path)
28 |     return ret
29 | 


--------------------------------------------------------------------------------
/RR_inference/LICENSE:
--------------------------------------------------------------------------------
 1 | MIT License
 2 | 
 3 | Copyright (c) 2018 Facebook
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/RR_inference/README.md:
--------------------------------------------------------------------------------
1 | # Faster R-CNN and Mask R-CNN in PyTorch 1.0
2 | Refer to https://github.com/facebookresearch/maskrcnn-benchmark
3 | 


--------------------------------------------------------------------------------
/RR_inference/configs/.ipynb_checkpoints/buildings_mask_rcnn_R_50_FPN_1x-checkpoint.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |   ROI_MASK_HEAD:
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
26 |     PREDICTOR: "MaskRCNNC4Predictor"
27 |     POOLER_RESOLUTION: 14
28 |     POOLER_SAMPLING_RATIO: 2
29 |     RESOLUTION: 28
30 |     SHARE_BOX_FEATURE_EXTRACTOR: False
31 |   MASK_ON: True
32 | DATASETS:
33 |   TRAIN: ("buildings_train",)
34 |   TEST: ("buildings_val",)
35 | DATALOADER:
36 |   SIZE_DIVISIBILITY: 32
37 | SOLVER:
38 |   BASE_LR: 0.001
39 |   WEIGHT_DECAY: 0.0001
40 |   STEPS: (60000, 80000)
41 |   MAX_ITER: 90000
42 | 


--------------------------------------------------------------------------------
/RR_inference/configs/buildings_mask_rcnn_R_50_FPN_1x.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |   ROI_MASK_HEAD:
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
26 |     PREDICTOR: "MaskRCNNC4Predictor"
27 |     POOLER_RESOLUTION: 14
28 |     POOLER_SAMPLING_RATIO: 2
29 |     RESOLUTION: 28
30 |     SHARE_BOX_FEATURE_EXTRACTOR: False
31 |   MASK_ON: True
32 | DATASETS:
33 |   TRAIN: ("buildings_train",)
34 |   TEST: ("buildings_val",)
35 | DATALOADER:
36 |   SIZE_DIVISIBILITY: 32
37 | SOLVER:
38 |   BASE_LR: 0.001
39 |   WEIGHT_DECAY: 0.0001
40 |   STEPS: (60000, 80000)
41 |   MAX_ITER: 90000
42 | 


--------------------------------------------------------------------------------
/RR_inference/configs/caffe2/e2e_faster_rcnn_R_101_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/35857890/e2e_faster_rcnn_R-101-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-101-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 | DATASETS:
24 |   TEST: ("coco_2014_minival",)
25 | DATALOADER:
26 |   SIZE_DIVISIBILITY: 32
27 | 


--------------------------------------------------------------------------------
/RR_inference/configs/caffe2/e2e_faster_rcnn_R_50_C4_1x_caffe2.yaml:
--------------------------------------------------------------------------------
1 | MODEL:
2 |   META_ARCHITECTURE: "GeneralizedRCNN"
3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/35857197/e2e_faster_rcnn_R-50-C4_1x"
4 | DATASETS:
5 |   TEST: ("coco_2014_minival",)
6 | 


--------------------------------------------------------------------------------
/RR_inference/configs/caffe2/e2e_faster_rcnn_R_50_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/35857345/e2e_faster_rcnn_R-50-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 | DATASETS:
24 |   TEST: ("coco_2014_minival",)
25 | DATALOADER:
26 |   SIZE_DIVISIBILITY: 32
27 | 


--------------------------------------------------------------------------------
/RR_inference/configs/caffe2/e2e_faster_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/36761737/e2e_faster_rcnn_X-101-32x8d-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-101-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |     STRIDE_IN_1X1: False
 9 |     NUM_GROUPS: 32
10 |     WIDTH_PER_GROUP: 8
11 |   RPN:
12 |     USE_FPN: True
13 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
14 |     PRE_NMS_TOP_N_TRAIN: 2000
15 |     PRE_NMS_TOP_N_TEST: 1000
16 |     POST_NMS_TOP_N_TEST: 1000
17 |     FPN_POST_NMS_TOP_N_TEST: 1000
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |   ROI_BOX_HEAD:
21 |     POOLER_RESOLUTION: 7
22 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
23 |     POOLER_SAMPLING_RATIO: 2
24 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
25 |     PREDICTOR: "FPNPredictor"
26 | DATASETS:
27 |   TEST: ("coco_2014_minival",)
28 | DATALOADER:
29 |   SIZE_DIVISIBILITY: 32
30 | 


--------------------------------------------------------------------------------
/RR_inference/configs/caffe2/e2e_keypoint_rcnn_R_50_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/37697547/e2e_keypoint_rcnn_R-50-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |     NUM_CLASSES: 2
24 |   ROI_KEYPOINT_HEAD:
25 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
26 |     FEATURE_EXTRACTOR: "KeypointRCNNFeatureExtractor"
27 |     PREDICTOR: "KeypointRCNNPredictor"
28 |     POOLER_RESOLUTION: 14
29 |     POOLER_SAMPLING_RATIO: 2
30 |     RESOLUTION: 56
31 |     SHARE_BOX_FEATURE_EXTRACTOR: False
32 |   KEYPOINT_ON: True
33 | DATASETS:
34 |   TRAIN: ("keypoints_coco_2014_train", "keypoints_coco_2014_valminusminival",)
35 |   TEST: ("keypoints_coco_2014_minival",)
36 | INPUT:
37 |   MIN_SIZE_TRAIN: (640, 672, 704, 736, 768, 800)
38 | DATALOADER:
39 |   SIZE_DIVISIBILITY: 32
40 | SOLVER:
41 |   BASE_LR: 0.02
42 |   WEIGHT_DECAY: 0.0001
43 |   STEPS: (60000, 80000)
44 |   MAX_ITER: 90000
45 | 


--------------------------------------------------------------------------------
/RR_inference/configs/caffe2/e2e_mask_rcnn_R_101_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/35861795/e2e_mask_rcnn_R-101-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-101-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |   ROI_MASK_HEAD:
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
26 |     PREDICTOR: "MaskRCNNC4Predictor"
27 |     POOLER_RESOLUTION: 14
28 |     POOLER_SAMPLING_RATIO: 2
29 |     RESOLUTION: 28
30 |     SHARE_BOX_FEATURE_EXTRACTOR: False
31 |   MASK_ON: True
32 | DATASETS:
33 |   TEST: ("coco_2014_minival",)
34 | DATALOADER:
35 |   SIZE_DIVISIBILITY: 32
36 | 


--------------------------------------------------------------------------------
/RR_inference/configs/caffe2/e2e_mask_rcnn_R_50_C4_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/35858791/e2e_mask_rcnn_R-50-C4_1x"
 4 |   ROI_MASK_HEAD:
 5 |     PREDICTOR: "MaskRCNNC4Predictor"
 6 |     SHARE_BOX_FEATURE_EXTRACTOR: True
 7 |   MASK_ON: True
 8 | DATASETS:
 9 |   TEST: ("coco_2014_minival",)
10 | 


--------------------------------------------------------------------------------
/RR_inference/configs/caffe2/e2e_mask_rcnn_R_50_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/35858933/e2e_mask_rcnn_R-50-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |   ROI_MASK_HEAD:
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
26 |     PREDICTOR: "MaskRCNNC4Predictor"
27 |     POOLER_RESOLUTION: 14
28 |     POOLER_SAMPLING_RATIO: 2
29 |     RESOLUTION: 28
30 |     SHARE_BOX_FEATURE_EXTRACTOR: False
31 |   MASK_ON: True
32 | DATASETS:
33 |   TEST: ("coco_2014_minival",)
34 | DATALOADER:
35 |   SIZE_DIVISIBILITY: 32
36 | 


--------------------------------------------------------------------------------
/RR_inference/configs/caffe2/e2e_mask_rcnn_X-152-32x8d-FPN-IN5k_1.44x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/37129812/e2e_mask_rcnn_X-152-32x8d-FPN-IN5k_1.44x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-152-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |     STRIDE_IN_1X1: False
 9 |     NUM_GROUPS: 32
10 |     WIDTH_PER_GROUP: 8
11 |   RPN:
12 |     USE_FPN: True
13 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
14 |     PRE_NMS_TOP_N_TRAIN: 2000
15 |     PRE_NMS_TOP_N_TEST: 1000
16 |     POST_NMS_TOP_N_TEST: 1000
17 |     FPN_POST_NMS_TOP_N_TEST: 1000
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |   ROI_BOX_HEAD:
21 |     POOLER_RESOLUTION: 7
22 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
23 |     POOLER_SAMPLING_RATIO: 2
24 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
25 |     PREDICTOR: "FPNPredictor"
26 |   ROI_MASK_HEAD:
27 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
28 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
29 |     PREDICTOR: "MaskRCNNC4Predictor"
30 |     POOLER_RESOLUTION: 14
31 |     POOLER_SAMPLING_RATIO: 2
32 |     RESOLUTION: 28
33 |     SHARE_BOX_FEATURE_EXTRACTOR: False
34 |   MASK_ON: True
35 | DATASETS:
36 |   TEST: ("coco_2014_minival",)
37 | DATALOADER:
38 |   SIZE_DIVISIBILITY: 32
39 | 


--------------------------------------------------------------------------------
/RR_inference/configs/caffe2/e2e_mask_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://Caffe2Detectron/COCO/36761843/e2e_mask_rcnn_X-101-32x8d-FPN_1x"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-101-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |     STRIDE_IN_1X1: False
 9 |     NUM_GROUPS: 32
10 |     WIDTH_PER_GROUP: 8
11 |   RPN:
12 |     USE_FPN: True
13 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
14 |     PRE_NMS_TOP_N_TRAIN: 2000
15 |     PRE_NMS_TOP_N_TEST: 1000
16 |     POST_NMS_TOP_N_TEST: 1000
17 |     FPN_POST_NMS_TOP_N_TEST: 1000
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |   ROI_BOX_HEAD:
21 |     POOLER_RESOLUTION: 7
22 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
23 |     POOLER_SAMPLING_RATIO: 2
24 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
25 |     PREDICTOR: "FPNPredictor"
26 |   ROI_MASK_HEAD:
27 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
28 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
29 |     PREDICTOR: "MaskRCNNC4Predictor"
30 |     POOLER_RESOLUTION: 14
31 |     POOLER_SAMPLING_RATIO: 2
32 |     RESOLUTION: 28
33 |     SHARE_BOX_FEATURE_EXTRACTOR: False
34 |   MASK_ON: True
35 | DATASETS:
36 |   TEST: ("coco_2014_minival",)
37 | DATALOADER:
38 |   SIZE_DIVISIBILITY: 32
39 | 


--------------------------------------------------------------------------------
/RR_inference/configs/cityscapes/e2e_faster_rcnn_R_50_FPN_1x_cocostyle.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |     NUM_CLASSES: 9
24 | DATASETS:
25 |   TRAIN: ("cityscapes_fine_instanceonly_seg_train_cocostyle",)
26 |   TEST: ("cityscapes_fine_instanceonly_seg_val_cocostyle",)
27 | DATALOADER:
28 |   SIZE_DIVISIBILITY: 32
29 | SOLVER:
30 |   BASE_LR: 0.01
31 |   WEIGHT_DECAY: 0.0001
32 |   STEPS: (18000,)
33 |   MAX_ITER: 24000
34 | 


--------------------------------------------------------------------------------
/RR_inference/configs/cityscapes/e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |     NUM_CLASSES: 9
24 |   ROI_MASK_HEAD:
25 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
26 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
27 |     PREDICTOR: "MaskRCNNC4Predictor"
28 |     POOLER_RESOLUTION: 14
29 |     POOLER_SAMPLING_RATIO: 2
30 |     RESOLUTION: 28
31 |     SHARE_BOX_FEATURE_EXTRACTOR: False
32 |   MASK_ON: True
33 | DATASETS:
34 |   TRAIN: ("cityscapes_fine_instanceonly_seg_train_cocostyle",)
35 |   TEST: ("cityscapes_fine_instanceonly_seg_val_cocostyle",)
36 | DATALOADER:
37 |   SIZE_DIVISIBILITY: 32
38 | SOLVER:
39 |   BASE_LR: 0.01
40 |   WEIGHT_DECAY: 0.0001
41 |   STEPS: (18000,)
42 |   MAX_ITER: 24000
43 | 


--------------------------------------------------------------------------------
/RR_inference/configs/gn_baselines/README.md:
--------------------------------------------------------------------------------
 1 | ### Group Normalization
 2 | 1 [Group Normalization](https://arxiv.org/abs/1803.08494)  
 3 | 2 [Rethinking ImageNet Pre-training](https://arxiv.org/abs/1811.08883)  
 4 | 3 [official code](https://github.com/facebookresearch/Detectron/blob/master/projects/GN/README.md)  
 5 | 
 6 | 
 7 | ### Performance
 8 | |      case                  |    Type      |  lr schd  |  im/gpu | bbox AP | mask AP |
 9 | |----------------------------|:------------:|:---------:|:-------:|:-------:|:-------:|
10 | |   R-50-FPN, GN (paper)     | finetune     |    2x     |   2     |   40.3  |  35.7   |
11 | |   R-50-FPN, GN (implement) | finetune     |    2x     |   2     |   40.2  |  36.0   |
12 | |   R-50-FPN, GN (paper)     | from scratch |    3x     |   2     |   39.5  |  35.2   |
13 | |   R-50-FPN, GN (implement) | from scratch |    3x     |   2     |   38.9  |  35.1   |
14 | 


--------------------------------------------------------------------------------
/RR_inference/configs/gn_baselines/e2e_faster_rcnn_R_50_FPN_1x_gn.yaml:
--------------------------------------------------------------------------------
 1 | INPUT:
 2 |   MIN_SIZE_TRAIN: (800,)
 3 |   MAX_SIZE_TRAIN: 1333
 4 |   MIN_SIZE_TEST: 800
 5 |   MAX_SIZE_TEST: 1333
 6 | MODEL:
 7 |   META_ARCHITECTURE: "GeneralizedRCNN"
 8 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50-GN"
 9 |   BACKBONE:
10 |     CONV_BODY: "R-50-FPN"
11 |   RESNETS: # use GN for backbone
12 |     BACKBONE_OUT_CHANNELS: 256
13 |     STRIDE_IN_1X1: False
14 |     TRANS_FUNC: "BottleneckWithGN"
15 |     STEM_FUNC: "StemWithGN"
16 |   FPN:
17 |     USE_GN: True # use GN for FPN
18 |   RPN:
19 |     USE_FPN: True
20 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
21 |     PRE_NMS_TOP_N_TRAIN: 2000
22 |     PRE_NMS_TOP_N_TEST: 1000
23 |     POST_NMS_TOP_N_TEST: 1000
24 |     FPN_POST_NMS_TOP_N_TEST: 1000
25 |   ROI_HEADS:
26 |     USE_FPN: True
27 |     BATCH_SIZE_PER_IMAGE: 512
28 |     POSITIVE_FRACTION: 0.25
29 |   ROI_BOX_HEAD:
30 |     USE_GN: True # use GN for bbox head
31 |     POOLER_RESOLUTION: 7
32 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
33 |     POOLER_SAMPLING_RATIO: 2
34 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
35 |     PREDICTOR: "FPNPredictor"
36 | DATASETS:
37 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
38 |   TEST: ("coco_2014_minival",)
39 | DATALOADER:
40 |   SIZE_DIVISIBILITY: 32
41 | SOLVER:
42 |   # Assume 8 gpus
43 |   BASE_LR: 0.02
44 |   WEIGHT_DECAY: 0.0001
45 |   STEPS: (60000, 80000)
46 |   MAX_ITER: 90000
47 |   IMS_PER_BATCH: 16
48 | TEST:
49 |   IMS_PER_BATCH: 8
50 | 


--------------------------------------------------------------------------------
/RR_inference/configs/gn_baselines/e2e_faster_rcnn_R_50_FPN_Xconv1fc_1x_gn.yaml:
--------------------------------------------------------------------------------
 1 | INPUT:
 2 |   MIN_SIZE_TRAIN: (800,)
 3 |   MAX_SIZE_TRAIN: 1333
 4 |   MIN_SIZE_TEST: 800
 5 |   MAX_SIZE_TEST: 1333
 6 | MODEL:
 7 |   META_ARCHITECTURE: "GeneralizedRCNN"
 8 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50-GN"
 9 |   BACKBONE:
10 |     CONV_BODY: "R-50-FPN"
11 |   RESNETS: # use GN for backbone
12 |     BACKBONE_OUT_CHANNELS: 256
13 |     STRIDE_IN_1X1: False
14 |     TRANS_FUNC: "BottleneckWithGN"
15 |     STEM_FUNC: "StemWithGN"
16 |   FPN:
17 |     USE_GN: True # use GN for FPN
18 |   RPN:
19 |     USE_FPN: True
20 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
21 |     PRE_NMS_TOP_N_TRAIN: 2000
22 |     PRE_NMS_TOP_N_TEST: 1000
23 |     POST_NMS_TOP_N_TEST: 1000
24 |     FPN_POST_NMS_TOP_N_TEST: 1000
25 |   ROI_HEADS:
26 |     USE_FPN: True
27 |     BATCH_SIZE_PER_IMAGE: 512
28 |     POSITIVE_FRACTION: 0.25
29 |   ROI_BOX_HEAD:
30 |     USE_GN: True # use GN for bbox head
31 |     POOLER_RESOLUTION: 7
32 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
33 |     POOLER_SAMPLING_RATIO: 2
34 |     CONV_HEAD_DIM: 256
35 |     NUM_STACKED_CONVS: 4
36 |     FEATURE_EXTRACTOR: "FPNXconv1fcFeatureExtractor"
37 |     PREDICTOR: "FPNPredictor"
38 | DATASETS:
39 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
40 |   TEST: ("coco_2014_minival",)
41 | DATALOADER:
42 |   SIZE_DIVISIBILITY: 32
43 | SOLVER:
44 |   # Assume 8 gpus
45 |   BASE_LR: 0.02
46 |   WEIGHT_DECAY: 0.0001
47 |   STEPS: (60000, 80000)
48 |   MAX_ITER: 90000
49 |   IMS_PER_BATCH: 16
50 | TEST:
51 |   IMS_PER_BATCH: 8
52 | 


--------------------------------------------------------------------------------
/RR_inference/configs/gn_baselines/scratch_e2e_faster_rcnn_R_50_FPN_3x_gn.yaml:
--------------------------------------------------------------------------------
 1 | INPUT:
 2 |   MIN_SIZE_TRAIN: (800,)
 3 |   MAX_SIZE_TRAIN: 1333
 4 |   MIN_SIZE_TEST: 800
 5 |   MAX_SIZE_TEST: 1333
 6 | MODEL:
 7 |   META_ARCHITECTURE: "GeneralizedRCNN"
 8 |   WEIGHT: "" # no pretrained model
 9 |   BACKBONE:
10 |     CONV_BODY: "R-50-FPN"
11 |     FREEZE_CONV_BODY_AT: 0 # finetune all layers
12 |   RESNETS: # use GN for backbone
13 |     BACKBONE_OUT_CHANNELS: 256
14 |     STRIDE_IN_1X1: False
15 |     TRANS_FUNC: "BottleneckWithGN"
16 |     STEM_FUNC: "StemWithGN"
17 |   FPN:
18 |     USE_GN: True # use GN for FPN
19 |   RPN:
20 |     USE_FPN: True
21 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
22 |     PRE_NMS_TOP_N_TRAIN: 2000
23 |     PRE_NMS_TOP_N_TEST: 1000
24 |     POST_NMS_TOP_N_TEST: 1000
25 |     FPN_POST_NMS_TOP_N_TEST: 1000
26 |   ROI_HEADS:
27 |     USE_FPN: True
28 |     BATCH_SIZE_PER_IMAGE: 512
29 |     POSITIVE_FRACTION: 0.25
30 |   ROI_BOX_HEAD:
31 |     USE_GN: True # use GN for bbox head
32 |     POOLER_RESOLUTION: 7
33 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
34 |     POOLER_SAMPLING_RATIO: 2
35 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
36 |     PREDICTOR: "FPNPredictor"
37 | DATASETS:
38 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
39 |   TEST: ("coco_2014_minival",)
40 | DATALOADER:
41 |   SIZE_DIVISIBILITY: 32
42 | SOLVER:
43 |   # Assume 8 gpus
44 |   BASE_LR: 0.02
45 |   WEIGHT_DECAY: 0.0001
46 |   STEPS: (210000, 250000)
47 |   MAX_ITER: 270000
48 |   IMS_PER_BATCH: 16
49 | TEST:
50 |   IMS_PER_BATCH: 8
51 | 


--------------------------------------------------------------------------------
/RR_inference/configs/gn_baselines/scratch_e2e_faster_rcnn_R_50_FPN_Xconv1fc_3x_gn.yaml:
--------------------------------------------------------------------------------
 1 | INPUT:
 2 |   MIN_SIZE_TRAIN: (800,)
 3 |   MAX_SIZE_TRAIN: 1333
 4 |   MIN_SIZE_TEST: 800
 5 |   MAX_SIZE_TEST: 1333
 6 | MODEL:
 7 |   META_ARCHITECTURE: "GeneralizedRCNN"
 8 |   WEIGHT: "" # no pretrained model
 9 |   BACKBONE:
10 |     CONV_BODY: "R-50-FPN"
11 |     FREEZE_CONV_BODY_AT: 0 # finetune all layers
12 |   RESNETS: # use GN for backbone
13 |     BACKBONE_OUT_CHANNELS: 256
14 |     STRIDE_IN_1X1: False
15 |     TRANS_FUNC: "BottleneckWithGN"
16 |     STEM_FUNC: "StemWithGN"
17 |   FPN:
18 |     USE_GN: True # use GN for FPN
19 |   RPN:
20 |     USE_FPN: True
21 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
22 |     PRE_NMS_TOP_N_TRAIN: 2000
23 |     PRE_NMS_TOP_N_TEST: 1000
24 |     POST_NMS_TOP_N_TEST: 1000
25 |     FPN_POST_NMS_TOP_N_TEST: 1000
26 |   ROI_HEADS:
27 |     USE_FPN: True
28 |     BATCH_SIZE_PER_IMAGE: 512
29 |     POSITIVE_FRACTION: 0.25
30 |   ROI_BOX_HEAD:
31 |     USE_GN: True # use GN for bbox head
32 |     POOLER_RESOLUTION: 7
33 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
34 |     POOLER_SAMPLING_RATIO: 2
35 |     CONV_HEAD_DIM: 256
36 |     NUM_STACKED_CONVS: 4
37 |     FEATURE_EXTRACTOR: "FPNXconv1fcFeatureExtractor"
38 |     PREDICTOR: "FPNPredictor"
39 | DATASETS:
40 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
41 |   TEST: ("coco_2014_minival",)
42 | DATALOADER:
43 |   SIZE_DIVISIBILITY: 32
44 | SOLVER:
45 |   # Assume 8 gpus
46 |   BASE_LR: 0.02
47 |   WEIGHT_DECAY: 0.0001
48 |   STEPS: (210000, 250000)
49 |   MAX_ITER: 270000
50 |   IMS_PER_BATCH: 16
51 | TEST:
52 |   IMS_PER_BATCH: 8
53 | 


--------------------------------------------------------------------------------
/RR_inference/configs/pascal_voc/e2e_faster_rcnn_R_50_C4_1x_1_gpu_voc.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN:
 5 |     PRE_NMS_TOP_N_TEST: 6000
 6 |     POST_NMS_TOP_N_TEST: 300
 7 |     ANCHOR_SIZES: (128, 256, 512)
 8 |   ROI_BOX_HEAD:
 9 |     NUM_CLASSES: 21
10 | DATASETS:
11 |   TRAIN: ("voc_2007_train", "voc_2007_val")
12 |   TEST: ("voc_2007_test",)
13 | SOLVER:
14 |   BASE_LR: 0.001
15 |   WEIGHT_DECAY: 0.0001
16 |   STEPS: (50000, )
17 |   MAX_ITER: 70000
18 |   IMS_PER_BATCH: 1
19 | TEST:
20 |   IMS_PER_BATCH: 1
21 | 


--------------------------------------------------------------------------------
/RR_inference/configs/pascal_voc/e2e_faster_rcnn_R_50_C4_1x_4_gpu_voc.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN:
 5 |     PRE_NMS_TOP_N_TEST: 6000
 6 |     POST_NMS_TOP_N_TEST: 300
 7 |     ANCHOR_SIZES: (128, 256, 512)
 8 |   ROI_BOX_HEAD:
 9 |     NUM_CLASSES: 21
10 | DATASETS:
11 |   TRAIN: ("voc_2007_train", "voc_2007_val")
12 |   TEST: ("voc_2007_test",)
13 | SOLVER:
14 |   BASE_LR: 0.004
15 |   WEIGHT_DECAY: 0.0001
16 |   STEPS: (12500, )
17 |   MAX_ITER: 17500
18 |   IMS_PER_BATCH: 4
19 | TEST:
20 |   IMS_PER_BATCH: 4
21 | 


--------------------------------------------------------------------------------
/RR_inference/configs/pascal_voc/e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |   ROI_BOX_HEAD:
18 |     POOLER_RESOLUTION: 7
19 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
20 |     POOLER_SAMPLING_RATIO: 2
21 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
22 |     PREDICTOR: "FPNPredictor"
23 |     NUM_CLASSES: 21
24 |   ROI_MASK_HEAD:
25 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
26 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
27 |     PREDICTOR: "MaskRCNNC4Predictor"
28 |     POOLER_RESOLUTION: 14
29 |     POOLER_SAMPLING_RATIO: 2
30 |     RESOLUTION: 28
31 |     SHARE_BOX_FEATURE_EXTRACTOR: False
32 |   MASK_ON: True
33 | DATASETS:
34 |   TRAIN: ("voc_2012_train_cocostyle",)
35 |   TEST: ("voc_2012_val_cocostyle",)
36 | DATALOADER:
37 |   SIZE_DIVISIBILITY: 32
38 | SOLVER:
39 |   BASE_LR: 0.01
40 |   WEIGHT_DECAY: 0.0001
41 |   STEPS: (18000,)
42 |   MAX_ITER: 24000
43 | 


--------------------------------------------------------------------------------
/RR_inference/configs/quick_schedules/e2e_faster_rcnn_R_50_C4_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN:
 5 |     PRE_NMS_TOP_N_TEST: 6000
 6 |     POST_NMS_TOP_N_TEST: 1000
 7 |   ROI_HEADS:
 8 |     BATCH_SIZE_PER_IMAGE: 256
 9 | DATASETS:
10 |   TRAIN: ("coco_2014_minival",)
11 |   TEST: ("coco_2014_minival",)
12 | INPUT:
13 |   MIN_SIZE_TRAIN: (600,)
14 |   MAX_SIZE_TRAIN: 1000
15 |   MIN_SIZE_TEST: 800
16 |   MAX_SIZE_TEST: 1000
17 | SOLVER:
18 |   BASE_LR: 0.005
19 |   WEIGHT_DECAY: 0.0001
20 |   STEPS: (1500,)
21 |   MAX_ITER: 2000
22 |   IMS_PER_BATCH: 2
23 | TEST:
24 |   IMS_PER_BATCH: 2
25 | 


--------------------------------------------------------------------------------
/RR_inference/configs/quick_schedules/e2e_faster_rcnn_R_50_FPN_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |     BATCH_SIZE_PER_IMAGE: 256
18 |   ROI_BOX_HEAD:
19 |     POOLER_RESOLUTION: 7
20 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
21 |     POOLER_SAMPLING_RATIO: 2
22 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
23 |     PREDICTOR: "FPNPredictor"
24 | DATASETS:
25 |   TRAIN: ("coco_2014_minival",)
26 |   TEST: ("coco_2014_minival",)
27 | INPUT:
28 |   MIN_SIZE_TRAIN: (600,)
29 |   MAX_SIZE_TRAIN: 1000
30 |   MIN_SIZE_TEST: 800
31 |   MAX_SIZE_TEST: 1000
32 | DATALOADER:
33 |   SIZE_DIVISIBILITY: 32
34 | SOLVER:
35 |   BASE_LR: 0.005
36 |   WEIGHT_DECAY: 0.0001
37 |   STEPS: (1500,)
38 |   MAX_ITER: 2000
39 |   IMS_PER_BATCH: 4
40 | TEST:
41 |   IMS_PER_BATCH: 2
42 | 


--------------------------------------------------------------------------------
/RR_inference/configs/quick_schedules/e2e_faster_rcnn_X_101_32x8d_FPN_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-101-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |     STRIDE_IN_1X1: False
 9 |     NUM_GROUPS: 32
10 |     WIDTH_PER_GROUP: 8
11 |   RPN:
12 |     USE_FPN: True
13 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
14 |     PRE_NMS_TOP_N_TRAIN: 2000
15 |     PRE_NMS_TOP_N_TEST: 1000
16 |     POST_NMS_TOP_N_TEST: 1000
17 |     FPN_POST_NMS_TOP_N_TEST: 1000
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |     BATCH_SIZE_PER_IMAGE: 256
21 |   ROI_BOX_HEAD:
22 |     POOLER_RESOLUTION: 7
23 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
24 |     POOLER_SAMPLING_RATIO: 2
25 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
26 |     PREDICTOR: "FPNPredictor"
27 | DATASETS:
28 |   TRAIN: ("coco_2014_minival",)
29 |   TEST: ("coco_2014_minival",)
30 | INPUT:
31 |   MIN_SIZE_TRAIN: (600,)
32 |   MAX_SIZE_TRAIN: 1000
33 |   MIN_SIZE_TEST: 800
34 |   MAX_SIZE_TEST: 1000
35 | DATALOADER:
36 |   SIZE_DIVISIBILITY: 32
37 | SOLVER:
38 |   BASE_LR: 0.005
39 |   WEIGHT_DECAY: 0.0001
40 |   STEPS: (1500,)
41 |   MAX_ITER: 2000
42 |   IMS_PER_BATCH: 2
43 | TEST:
44 |   IMS_PER_BATCH: 2
45 | 


--------------------------------------------------------------------------------
/RR_inference/configs/quick_schedules/e2e_keypoint_rcnn_R_50_FPN_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |     BATCH_SIZE_PER_IMAGE: 256
18 |   ROI_BOX_HEAD:
19 |     POOLER_RESOLUTION: 7
20 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
21 |     POOLER_SAMPLING_RATIO: 2
22 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
23 |     PREDICTOR: "FPNPredictor"
24 |     NUM_CLASSES: 2
25 |   ROI_KEYPOINT_HEAD:
26 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
27 |     FEATURE_EXTRACTOR: "KeypointRCNNFeatureExtractor"
28 |     PREDICTOR: "KeypointRCNNPredictor"
29 |     POOLER_RESOLUTION: 14
30 |     POOLER_SAMPLING_RATIO: 2
31 |     RESOLUTION: 56
32 |     SHARE_BOX_FEATURE_EXTRACTOR: False
33 |   KEYPOINT_ON: True
34 | DATASETS:
35 |   TRAIN: ("keypoints_coco_2014_minival",)
36 |   TEST: ("keypoints_coco_2014_minival",)
37 | INPUT:
38 |   MIN_SIZE_TRAIN: (640, 672, 704, 736, 768, 800)
39 |   MAX_SIZE_TRAIN: 1000
40 |   MIN_SIZE_TEST: 800
41 |   MAX_SIZE_TEST: 1000
42 | DATALOADER:
43 |   SIZE_DIVISIBILITY: 32
44 | SOLVER:
45 |   BASE_LR: 0.005
46 |   WEIGHT_DECAY: 0.0001
47 |   STEPS: (1500,)
48 |   MAX_ITER: 2000
49 |   IMS_PER_BATCH: 4
50 | TEST:
51 |   IMS_PER_BATCH: 2
52 | 


--------------------------------------------------------------------------------
/RR_inference/configs/quick_schedules/e2e_mask_rcnn_R_50_C4_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN:
 5 |     PRE_NMS_TOP_N_TEST: 6000
 6 |     POST_NMS_TOP_N_TEST: 1000
 7 |   ROI_HEADS:
 8 |     BATCH_SIZE_PER_IMAGE: 256
 9 |   ROI_MASK_HEAD:
10 |     PREDICTOR: "MaskRCNNC4Predictor"
11 |     SHARE_BOX_FEATURE_EXTRACTOR: True
12 |   MASK_ON: True
13 | DATASETS:
14 |   TRAIN: ("coco_2014_minival",)
15 |   TEST: ("coco_2014_minival",)
16 | INPUT:
17 |   MIN_SIZE_TRAIN: (600,)
18 |   MAX_SIZE_TRAIN: 1000
19 |   MIN_SIZE_TEST: 800
20 |   MAX_SIZE_TEST: 1000
21 | SOLVER:
22 |   BASE_LR: 0.005
23 |   WEIGHT_DECAY: 0.0001
24 |   STEPS: (1500,)
25 |   MAX_ITER: 2000
26 |   IMS_PER_BATCH: 4
27 | TEST:
28 |   IMS_PER_BATCH: 2
29 | 


--------------------------------------------------------------------------------
/RR_inference/configs/quick_schedules/e2e_mask_rcnn_R_50_FPN_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-50-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |   RPN:
 9 |     USE_FPN: True
10 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
11 |     PRE_NMS_TOP_N_TRAIN: 2000
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 1000
14 |     FPN_POST_NMS_TOP_N_TEST: 1000
15 |   ROI_HEADS:
16 |     USE_FPN: True
17 |     BATCH_SIZE_PER_IMAGE: 256
18 |   ROI_BOX_HEAD:
19 |     POOLER_RESOLUTION: 7
20 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
21 |     POOLER_SAMPLING_RATIO: 2
22 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
23 |     PREDICTOR: "FPNPredictor"
24 |   ROI_MASK_HEAD:
25 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
26 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
27 |     PREDICTOR: "MaskRCNNC4Predictor"
28 |     POOLER_RESOLUTION: 14
29 |     POOLER_SAMPLING_RATIO: 2
30 |     RESOLUTION: 28
31 |     SHARE_BOX_FEATURE_EXTRACTOR: False
32 |   MASK_ON: True
33 | DATASETS:
34 |   TRAIN: ("coco_2014_minival",)
35 |   TEST: ("coco_2014_minival",)
36 | INPUT:
37 |   MIN_SIZE_TRAIN: (600,)
38 |   MAX_SIZE_TRAIN: 1000
39 |   MIN_SIZE_TEST: 800
40 |   MAX_SIZE_TEST: 1000
41 | DATALOADER:
42 |   SIZE_DIVISIBILITY: 32
43 | SOLVER:
44 |   BASE_LR: 0.005
45 |   WEIGHT_DECAY: 0.0001
46 |   STEPS: (1500,)
47 |   MAX_ITER: 2000
48 |   IMS_PER_BATCH: 4
49 | TEST:
50 |   IMS_PER_BATCH: 2
51 | 


--------------------------------------------------------------------------------
/RR_inference/configs/quick_schedules/e2e_mask_rcnn_X_101_32x8d_FPN_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d"
 4 |   BACKBONE:
 5 |     CONV_BODY: "R-101-FPN"
 6 |   RESNETS:
 7 |     BACKBONE_OUT_CHANNELS: 256
 8 |     STRIDE_IN_1X1: False
 9 |     NUM_GROUPS: 32
10 |     WIDTH_PER_GROUP: 8
11 |   RPN:
12 |     USE_FPN: True
13 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
14 |     PRE_NMS_TOP_N_TRAIN: 2000
15 |     PRE_NMS_TOP_N_TEST: 1000
16 |     POST_NMS_TOP_N_TEST: 1000
17 |     FPN_POST_NMS_TOP_N_TEST: 1000
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |     BATCH_SIZE_PER_IMAGE: 256
21 |   ROI_BOX_HEAD:
22 |     POOLER_RESOLUTION: 7
23 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
24 |     POOLER_SAMPLING_RATIO: 2
25 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
26 |     PREDICTOR: "FPNPredictor"
27 |   ROI_MASK_HEAD:
28 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
29 |     FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor"
30 |     PREDICTOR: "MaskRCNNC4Predictor"
31 |     POOLER_RESOLUTION: 14
32 |     POOLER_SAMPLING_RATIO: 2
33 |     RESOLUTION: 28
34 |     SHARE_BOX_FEATURE_EXTRACTOR: False
35 |   MASK_ON: True
36 | DATASETS:
37 |   TRAIN: ("coco_2014_minival",)
38 |   TEST: ("coco_2014_minival",)
39 | INPUT:
40 |   MIN_SIZE_TRAIN: (600,)
41 |   MAX_SIZE_TRAIN: 1000
42 |   MIN_SIZE_TEST: 800
43 |   MAX_SIZE_TEST: 1000
44 | DATALOADER:
45 |   SIZE_DIVISIBILITY: 32
46 | SOLVER:
47 |   BASE_LR: 0.005
48 |   WEIGHT_DECAY: 0.0001
49 |   STEPS: (1500,)
50 |   MAX_ITER: 2000
51 |   IMS_PER_BATCH: 2
52 | TEST:
53 |   IMS_PER_BATCH: 2
54 | 


--------------------------------------------------------------------------------
/RR_inference/configs/quick_schedules/rpn_R_50_C4_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN_ONLY: True
 5 |   RPN:
 6 |     PRE_NMS_TOP_N_TEST: 12000
 7 |     POST_NMS_TOP_N_TEST: 2000
 8 | DATASETS:
 9 |   TRAIN: ("coco_2014_minival",)
10 |   TEST: ("coco_2014_minival",)
11 | INPUT:
12 |   MIN_SIZE_TRAIN: (600,)
13 |   MAX_SIZE_TRAIN: 1000
14 |   MIN_SIZE_TEST: 800
15 |   MAX_SIZE_TEST: 1000
16 | SOLVER:
17 |   BASE_LR: 0.005
18 |   WEIGHT_DECAY: 0.0001
19 |   STEPS: (1500,)
20 |   MAX_ITER: 2000
21 |   IMS_PER_BATCH: 4
22 | TEST:
23 |   IMS_PER_BATCH: 2
24 | 


--------------------------------------------------------------------------------
/RR_inference/configs/quick_schedules/rpn_R_50_FPN_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN_ONLY: True
 5 |   BACKBONE:
 6 |     CONV_BODY: "R-50-FPN"
 7 |   RESNETS:
 8 |     BACKBONE_OUT_CHANNELS: 256
 9 |   RPN:
10 |     USE_FPN: True
11 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
12 |     PRE_NMS_TOP_N_TEST: 1000
13 |     POST_NMS_TOP_N_TEST: 2000
14 |     FPN_POST_NMS_TOP_N_TEST: 2000
15 | DATASETS:
16 |   TRAIN: ("coco_2014_minival",)
17 |   TEST: ("coco_2014_minival",)
18 | INPUT:
19 |   MIN_SIZE_TRAIN: (600,)
20 |   MAX_SIZE_TRAIN: 1000
21 |   MIN_SIZE_TEST: 800
22 |   MAX_SIZE_TEST: 1000
23 | DATALOADER:
24 |   SIZE_DIVISIBILITY: 32
25 | SOLVER:
26 |   BASE_LR: 0.005
27 |   WEIGHT_DECAY: 0.0001
28 |   STEPS: (1500,)
29 |   MAX_ITER: 2000
30 |   IMS_PER_BATCH: 4
31 | TEST:
32 |   IMS_PER_BATCH: 2
33 | 


--------------------------------------------------------------------------------
/RR_inference/configs/retinanet/retinanet_R-101-FPN_1x.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-101"
 4 |   RPN_ONLY: True
 5 |   RETINANET_ON: True
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-101-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   RPN:
11 |     USE_FPN: True
12 |     FG_IOU_THRESHOLD: 0.5
13 |     BG_IOU_THRESHOLD: 0.4
14 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
15 |     PRE_NMS_TOP_N_TRAIN: 2000
16 |     PRE_NMS_TOP_N_TEST: 1000
17 |     POST_NMS_TOP_N_TEST: 1000
18 |     FPN_POST_NMS_TOP_N_TEST: 1000
19 |   ROI_HEADS:
20 |     USE_FPN: True
21 |     BATCH_SIZE_PER_IMAGE: 256
22 |   ROI_BOX_HEAD:
23 |     POOLER_RESOLUTION: 7
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     POOLER_SAMPLING_RATIO: 2
26 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
27 |     PREDICTOR: "FPNPredictor"
28 |   RETINANET:
29 |     SCALES_PER_OCTAVE: 3
30 |     STRADDLE_THRESH: -1
31 |     FG_IOU_THRESHOLD: 0.5
32 |     BG_IOU_THRESHOLD: 0.4
33 | DATASETS:
34 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
35 |   TEST: ("coco_2014_minival",)
36 | INPUT:
37 |   MIN_SIZE_TRAIN: (800, )
38 |   MAX_SIZE_TRAIN: 1333
39 |   MIN_SIZE_TEST: 800
40 |   MAX_SIZE_TEST: 1333
41 | DATALOADER:
42 |   SIZE_DIVISIBILITY: 32
43 | SOLVER:
44 |   # Assume 4 gpus
45 |   BASE_LR: 0.005
46 |   WEIGHT_DECAY: 0.0001
47 |   STEPS: (120000, 160000)
48 |   MAX_ITER: 180000
49 |   IMS_PER_BATCH: 8
50 | 


--------------------------------------------------------------------------------
/RR_inference/configs/retinanet/retinanet_R-101-FPN_P5_1x.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-101"
 4 |   RPN_ONLY: True
 5 |   RETINANET_ON: True
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-101-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   RPN:
11 |     USE_FPN: True
12 |     FG_IOU_THRESHOLD: 0.5
13 |     BG_IOU_THRESHOLD: 0.4
14 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
15 |     PRE_NMS_TOP_N_TRAIN: 2000
16 |     PRE_NMS_TOP_N_TEST: 1000
17 |     POST_NMS_TOP_N_TEST: 1000
18 |     FPN_POST_NMS_TOP_N_TEST: 1000
19 |   ROI_HEADS:
20 |     USE_FPN: True
21 |     BATCH_SIZE_PER_IMAGE: 256
22 |   ROI_BOX_HEAD:
23 |     POOLER_RESOLUTION: 7
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     POOLER_SAMPLING_RATIO: 2
26 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
27 |     PREDICTOR: "FPNPredictor"
28 |   RETINANET:
29 |     SCALES_PER_OCTAVE: 3
30 |     STRADDLE_THRESH: -1
31 |     USE_C5: False
32 |     FG_IOU_THRESHOLD: 0.5
33 |     BG_IOU_THRESHOLD: 0.4
34 | DATASETS:
35 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
36 |   TEST: ("coco_2014_minival",)
37 | INPUT:
38 |   MIN_SIZE_TRAIN: (800, )
39 |   MAX_SIZE_TRAIN: 1333
40 |   MIN_SIZE_TEST: 800
41 |   MAX_SIZE_TEST: 1333
42 | DATALOADER:
43 |   SIZE_DIVISIBILITY: 32
44 | SOLVER:
45 |   # Assume 4 gpus
46 |   BASE_LR: 0.005
47 |   WEIGHT_DECAY: 0.0001
48 |   STEPS: (120000, 160000)
49 |   MAX_ITER: 180000
50 |   IMS_PER_BATCH: 8
51 | 


--------------------------------------------------------------------------------
/RR_inference/configs/retinanet/retinanet_R-50-FPN_1x.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN_ONLY: True
 5 |   RETINANET_ON: True
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-50-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   RPN:
11 |     USE_FPN: True
12 |     FG_IOU_THRESHOLD: 0.5
13 |     BG_IOU_THRESHOLD: 0.4
14 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
15 |     PRE_NMS_TOP_N_TRAIN: 2000
16 |     PRE_NMS_TOP_N_TEST: 1000
17 |     POST_NMS_TOP_N_TEST: 1000
18 |     FPN_POST_NMS_TOP_N_TEST: 1000
19 |   ROI_HEADS:
20 |     USE_FPN: True
21 |     BATCH_SIZE_PER_IMAGE: 256
22 |   ROI_BOX_HEAD:
23 |     POOLER_RESOLUTION: 7
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     POOLER_SAMPLING_RATIO: 2
26 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
27 |     PREDICTOR: "FPNPredictor"
28 |   RETINANET:
29 |     SCALES_PER_OCTAVE: 3
30 |     STRADDLE_THRESH: -1
31 |     FG_IOU_THRESHOLD: 0.5
32 |     BG_IOU_THRESHOLD: 0.4
33 | DATASETS:
34 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
35 |   TEST: ("coco_2014_minival",)
36 | INPUT:
37 |   MIN_SIZE_TRAIN: (800,)
38 |   MAX_SIZE_TRAIN: 1333
39 |   MIN_SIZE_TEST: 800
40 |   MAX_SIZE_TEST: 1333
41 | DATALOADER:
42 |   SIZE_DIVISIBILITY: 32
43 | SOLVER:
44 |   # Assume 4 gpus
45 |   BASE_LR: 0.005
46 |   WEIGHT_DECAY: 0.0001
47 |   STEPS: (120000, 160000)
48 |   MAX_ITER: 180000
49 |   IMS_PER_BATCH: 8
50 | 


--------------------------------------------------------------------------------
/RR_inference/configs/retinanet/retinanet_R-50-FPN_1x_quick.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN_ONLY: True
 5 |   RETINANET_ON: True
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-50-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   RPN:
11 |     USE_FPN: True
12 |     FG_IOU_THRESHOLD: 0.5
13 |     BG_IOU_THRESHOLD: 0.4
14 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
15 |     PRE_NMS_TOP_N_TRAIN: 2000
16 |     PRE_NMS_TOP_N_TEST: 1000
17 |     POST_NMS_TOP_N_TEST: 1000
18 |     FPN_POST_NMS_TOP_N_TEST: 1000
19 |   ROI_HEADS:
20 |     USE_FPN: True
21 |     BATCH_SIZE_PER_IMAGE: 256
22 |   ROI_BOX_HEAD:
23 |     POOLER_RESOLUTION: 7
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     POOLER_SAMPLING_RATIO: 2
26 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
27 |     PREDICTOR: "FPNPredictor"
28 |   RETINANET:
29 |     SCALES_PER_OCTAVE: 3
30 |     STRADDLE_THRESH: -1
31 |     FG_IOU_THRESHOLD: 0.5
32 |     BG_IOU_THRESHOLD: 0.4
33 | DATASETS:
34 |   TRAIN: ("coco_2014_minival",)
35 |   TEST: ("coco_2014_minival",)
36 | INPUT:
37 |   MIN_SIZE_TRAIN: (600,)
38 |   MAX_SIZE_TRAIN: 1000
39 |   MIN_SIZE_TEST: 800
40 |   MAX_SIZE_TEST: 1000
41 | DATALOADER:
42 |   SIZE_DIVISIBILITY: 32
43 | SOLVER:
44 |   BASE_LR: 0.005
45 |   WEIGHT_DECAY: 0.0001
46 |   STEPS: (3500,)
47 |   MAX_ITER: 4000
48 |   IMS_PER_BATCH: 4
49 | 


--------------------------------------------------------------------------------
/RR_inference/configs/retinanet/retinanet_R-50-FPN_P5_1x.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   RPN_ONLY: True
 5 |   RETINANET_ON: True
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-50-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   RPN:
11 |     USE_FPN: True
12 |     FG_IOU_THRESHOLD: 0.5
13 |     BG_IOU_THRESHOLD: 0.4
14 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
15 |     PRE_NMS_TOP_N_TRAIN: 2000
16 |     PRE_NMS_TOP_N_TEST: 1000
17 |     POST_NMS_TOP_N_TEST: 1000
18 |     FPN_POST_NMS_TOP_N_TEST: 1000
19 |   ROI_HEADS:
20 |     USE_FPN: True
21 |     BATCH_SIZE_PER_IMAGE: 256
22 |   ROI_BOX_HEAD:
23 |     POOLER_RESOLUTION: 7
24 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
25 |     POOLER_SAMPLING_RATIO: 2
26 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
27 |     PREDICTOR: "FPNPredictor"
28 |   RETINANET:
29 |     SCALES_PER_OCTAVE: 3
30 |     STRADDLE_THRESH: -1
31 |     USE_C5: False
32 |     FG_IOU_THRESHOLD: 0.5
33 |     BG_IOU_THRESHOLD: 0.4
34 | DATASETS:
35 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
36 |   TEST: ("coco_2014_minival",)
37 | INPUT:
38 |   MIN_SIZE_TRAIN: (800,)
39 |   MAX_SIZE_TRAIN: 1333
40 |   MIN_SIZE_TEST: 800
41 |   MAX_SIZE_TEST: 1333
42 | DATALOADER:
43 |   SIZE_DIVISIBILITY: 32
44 | SOLVER:
45 |   # Assume 4 gpus
46 |   BASE_LR: 0.005
47 |   WEIGHT_DECAY: 0.0001
48 |   STEPS: (120000, 160000)
49 |   MAX_ITER: 180000
50 |   IMS_PER_BATCH: 8
51 | 


--------------------------------------------------------------------------------
/RR_inference/configs/retinanet/retinanet_X_101_32x8d_FPN_1x.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d"
 4 |   RPN_ONLY: True
 5 |   RETINANET_ON: True
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-101-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |     STRIDE_IN_1X1: False
11 |     NUM_GROUPS: 32
12 |     WIDTH_PER_GROUP: 8
13 |   RPN:
14 |     USE_FPN: True
15 |     FG_IOU_THRESHOLD: 0.5
16 |     BG_IOU_THRESHOLD: 0.4
17 |     ANCHOR_STRIDE: (4, 8, 16, 32, 64)
18 |     PRE_NMS_TOP_N_TRAIN: 2000
19 |     PRE_NMS_TOP_N_TEST: 1000
20 |     POST_NMS_TOP_N_TEST: 1000
21 |     FPN_POST_NMS_TOP_N_TEST: 1000
22 |   ROI_HEADS:
23 |     USE_FPN: True
24 |     BATCH_SIZE_PER_IMAGE: 256
25 |   ROI_BOX_HEAD:
26 |     POOLER_RESOLUTION: 7
27 |     POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125)
28 |     POOLER_SAMPLING_RATIO: 2
29 |     FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor"
30 |     PREDICTOR: "FPNPredictor"
31 |   RETINANET:
32 |     SCALES_PER_OCTAVE: 3
33 |     STRADDLE_THRESH: -1
34 |     FG_IOU_THRESHOLD: 0.5
35 |     BG_IOU_THRESHOLD: 0.4
36 | DATASETS:
37 |   TRAIN: ("coco_2014_train", "coco_2014_valminusminival")
38 |   TEST: ("coco_2014_minival",)
39 | INPUT:
40 |   MIN_SIZE_TRAIN: (800, )
41 |   MAX_SIZE_TRAIN: 1333
42 |   MIN_SIZE_TEST: 800
43 |   MAX_SIZE_TEST: 1333
44 | DATALOADER:
45 |   SIZE_DIVISIBILITY: 32
46 | SOLVER:
47 |   # Assume 4 gpus
48 |   BASE_LR: 0.0025
49 |   WEIGHT_DECAY: 0.0001
50 |   STEPS: (240000, 320000)
51 |   MAX_ITER: 360000
52 |   IMS_PER_BATCH: 4
53 | 


--------------------------------------------------------------------------------
/RR_inference/docker/docker-jupyter/jupyter_notebook_config.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | from IPython.lib import passwd
 3 | 
 4 | #c = c  # pylint:disable=undefined-variable
 5 | c = get_config()
 6 | c.NotebookApp.ip = '0.0.0.0'
 7 | c.NotebookApp.port = int(os.getenv('PORT', 8888))
 8 | c.NotebookApp.open_browser = False
 9 | 
10 | # sets a password if PASSWORD is set in the environment
11 | if 'PASSWORD' in os.environ:
12 |   password = os.environ['PASSWORD']
13 |   if password:
14 |     c.NotebookApp.password = passwd(password)
15 |   else:
16 |     c.NotebookApp.password = ''
17 |     c.NotebookApp.token = ''
18 |   del os.environ['PASSWORD']
19 | 


--------------------------------------------------------------------------------
/RR_inference/inference/buildings_val/predictions.pth:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/RR_inference/inference/buildings_val/predictions.pth


--------------------------------------------------------------------------------
/RR_inference/last_checkpoint:
--------------------------------------------------------------------------------
1 | ./model_0037500.pth


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/.ipynb_checkpoints/__init__-checkpoint.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/config/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .defaults import _C as cfg
3 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/csrc/SigmoidFocalLoss.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include "cpu/vision.h"
 4 | 
 5 | #ifdef WITH_CUDA
 6 | #include "cuda/vision.h"
 7 | #endif
 8 | 
 9 | // Interface for Python
10 | at::Tensor SigmoidFocalLoss_forward(
11 | 		const at::Tensor& logits,
12 |                 const at::Tensor& targets,
13 | 		const int num_classes, 
14 | 		const float gamma, 
15 | 		const float alpha) {
16 |   if (logits.type().is_cuda()) {
17 | #ifdef WITH_CUDA
18 |     return SigmoidFocalLoss_forward_cuda(logits, targets, num_classes, gamma, alpha);
19 | #else
20 |     AT_ERROR("Not compiled with GPU support");
21 | #endif
22 |   }
23 |   AT_ERROR("Not implemented on the CPU");
24 | }
25 | 
26 | at::Tensor SigmoidFocalLoss_backward(
27 | 			     const at::Tensor& logits,
28 |                              const at::Tensor& targets,
29 | 			     const at::Tensor& d_losses,
30 | 			     const int num_classes,
31 | 			     const float gamma,
32 | 			     const float alpha) {
33 |   if (logits.type().is_cuda()) {
34 | #ifdef WITH_CUDA
35 |     return SigmoidFocalLoss_backward_cuda(logits, targets, d_losses, num_classes, gamma, alpha);
36 | #else
37 |     AT_ERROR("Not compiled with GPU support");
38 | #endif
39 |   }
40 |   AT_ERROR("Not implemented on the CPU");
41 | }
42 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/csrc/cpu/vision.h:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #pragma once
 3 | #include <torch/extension.h>
 4 | 
 5 | 
 6 | at::Tensor ROIAlign_forward_cpu(const at::Tensor& input,
 7 |                                 const at::Tensor& rois,
 8 |                                 const float spatial_scale,
 9 |                                 const int pooled_height,
10 |                                 const int pooled_width,
11 |                                 const int sampling_ratio);
12 | 
13 | 
14 | at::Tensor nms_cpu(const at::Tensor& dets,
15 |                    const at::Tensor& scores,
16 |                    const float threshold);
17 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/csrc/nms.h:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #pragma once
 3 | #include "cpu/vision.h"
 4 | 
 5 | #ifdef WITH_CUDA
 6 | #include "cuda/vision.h"
 7 | #endif
 8 | 
 9 | 
10 | at::Tensor nms(const at::Tensor& dets,
11 |                const at::Tensor& scores,
12 |                const float threshold) {
13 | 
14 |   if (dets.type().is_cuda()) {
15 | #ifdef WITH_CUDA
16 |     // TODO raise error if not compiled with CUDA
17 |     if (dets.numel() == 0)
18 |       return at::empty({0}, dets.options().dtype(at::kLong).device(at::kCPU));
19 |     auto b = at::cat({dets, scores.unsqueeze(1)}, 1);
20 |     return nms_cuda(b, threshold);
21 | #else
22 |     AT_ERROR("Not compiled with GPU support");
23 | #endif
24 |   }
25 | 
26 |   at::Tensor result = nms_cpu(dets, scores, threshold);
27 |   return result;
28 | }
29 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/csrc/vision.cpp:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #include "nms.h"
 3 | #include "ROIAlign.h"
 4 | #include "ROIPool.h"
 5 | #include "SigmoidFocalLoss.h"
 6 | 
 7 | PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
 8 |   m.def("nms", &nms, "non-maximum suppression");
 9 |   m.def("roi_align_forward", &ROIAlign_forward, "ROIAlign_forward");
10 |   m.def("roi_align_backward", &ROIAlign_backward, "ROIAlign_backward");
11 |   m.def("roi_pool_forward", &ROIPool_forward, "ROIPool_forward");
12 |   m.def("roi_pool_backward", &ROIPool_backward, "ROIPool_backward");
13 |   m.def("sigmoid_focalloss_forward", &SigmoidFocalLoss_forward, "SigmoidFocalLoss_forward");
14 |   m.def("sigmoid_focalloss_backward", &SigmoidFocalLoss_backward, "SigmoidFocalLoss_backward");
15 | }
16 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .build import make_data_loader
3 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/collate_batch.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from maskrcnn_benchmark.structures.image_list import to_image_list
 3 | 
 4 | 
 5 | class BatchCollator(object):
 6 |     """
 7 |     From a list of samples from the dataset,
 8 |     returns the batched images and targets.
 9 |     This should be passed to the DataLoader
10 |     """
11 | 
12 |     def __init__(self, size_divisible=0):
13 |         self.size_divisible = size_divisible
14 | 
15 |     def __call__(self, batch):
16 |         transposed_batch = list(zip(*batch))
17 |         images = to_image_list(transposed_batch[0], self.size_divisible)
18 |         targets = transposed_batch[1]
19 |         img_ids = transposed_batch[2]
20 |         return images, targets, img_ids
21 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/datasets/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .coco import COCODataset
3 | from .voc import PascalVOCDataset
4 | from .buildings import BuildingsDataset
5 | from .buildings_test import BuildingsDatasetTest
6 | from .concat_dataset import ConcatDataset
7 | 
8 | __all__ = ["COCODataset", "ConcatDataset", "PascalVOCDataset", "BuildingsDataset", "BuildingsDatasetTest"]
9 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/datasets/concat_dataset.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import bisect
 3 | 
 4 | from torch.utils.data.dataset import ConcatDataset as _ConcatDataset
 5 | 
 6 | 
 7 | class ConcatDataset(_ConcatDataset):
 8 |     """
 9 |     Same as torch.utils.data.dataset.ConcatDataset, but exposes an extra
10 |     method for querying the sizes of the image
11 |     """
12 | 
13 |     def get_idxs(self, idx):
14 |         dataset_idx = bisect.bisect_right(self.cumulative_sizes, idx)
15 |         if dataset_idx == 0:
16 |             sample_idx = idx
17 |         else:
18 |             sample_idx = idx - self.cumulative_sizes[dataset_idx - 1]
19 |         return dataset_idx, sample_idx
20 | 
21 |     def get_img_info(self, idx):
22 |         dataset_idx, sample_idx = self.get_idxs(idx)
23 |         return self.datasets[dataset_idx].get_img_info(sample_idx)
24 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/datasets/evaluation/__init__.py:
--------------------------------------------------------------------------------
 1 | from maskrcnn_benchmark.data import datasets
 2 | 
 3 | from .coco import coco_evaluation
 4 | from .voc import voc_evaluation
 5 | from .buildings import buildings_evaluation
 6 | 
 7 | def evaluate(dataset, predictions, output_folder, **kwargs):
 8 |     """evaluate dataset using different methods based on dataset type.
 9 |     Args:
10 |         dataset: Dataset object
11 |         predictions(list[BoxList]): each item in the list represents the
12 |             prediction results for one image.
13 |         output_folder: output folder, to save evaluation files or results.
14 |         **kwargs: other args.
15 |     Returns:
16 |         evaluation result
17 |     """
18 |     args = dict(
19 |         dataset=dataset, predictions=predictions, output_folder=output_folder, **kwargs
20 |     )
21 |     if isinstance(dataset, datasets.COCODataset):
22 |         return coco_evaluation(**args)
23 |     elif isinstance(dataset, datasets.PascalVOCDataset):
24 |         return voc_evaluation(**args)
25 |     elif isinstance(dataset, datasets.BuildingsDataset) or isinstance(dataset, datasets.BuildingsDatasetTest):
26 |         return buildings_evaluation(**args)
27 |     else:
28 |         dataset_name = dataset.__class__.__name__
29 |         raise NotImplementedError("Unsupported dataset type {}.".format(dataset_name))
30 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/datasets/evaluation/buildings/__init__.py:
--------------------------------------------------------------------------------
 1 | from .buildings_eval import do_buildings_evaluation
 2 | 
 3 | 
 4 | def buildings_evaluation(
 5 |     dataset,
 6 |     predictions,
 7 |     output_folder,
 8 |     box_only,
 9 |     iou_types,
10 |     expected_results,
11 |     expected_results_sigma_tol,
12 | ):
13 |     return do_buildings_evaluation(
14 |         dataset=dataset,
15 |         predictions=predictions,
16 |         box_only=box_only,
17 |         output_folder=output_folder,
18 |         iou_types=iou_types,
19 |         expected_results=expected_results,
20 |         expected_results_sigma_tol=expected_results_sigma_tol
21 |     )
22 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/datasets/evaluation/coco/__init__.py:
--------------------------------------------------------------------------------
 1 | from .coco_eval import do_coco_evaluation
 2 | 
 3 | 
 4 | def coco_evaluation(
 5 |     dataset,
 6 |     predictions,
 7 |     output_folder,
 8 |     box_only,
 9 |     iou_types,
10 |     expected_results,
11 |     expected_results_sigma_tol,
12 | ):
13 |     return do_coco_evaluation(
14 |         dataset=dataset,
15 |         predictions=predictions,
16 |         box_only=box_only,
17 |         output_folder=output_folder,
18 |         iou_types=iou_types,
19 |         expected_results=expected_results,
20 |         expected_results_sigma_tol=expected_results_sigma_tol,
21 |     )
22 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/datasets/evaluation/voc/__init__.py:
--------------------------------------------------------------------------------
 1 | import logging
 2 | 
 3 | from .voc_eval import do_voc_evaluation
 4 | 
 5 | 
 6 | def voc_evaluation(dataset, predictions, output_folder, box_only, **_):
 7 |     logger = logging.getLogger("maskrcnn_benchmark.inference")
 8 |     if box_only:
 9 |         logger.warning("voc evaluation doesn't support box_only, ignored.")
10 |     logger.info("performing voc evaluation, ignored iou_types.")
11 |     return do_voc_evaluation(
12 |         dataset=dataset,
13 |         predictions=predictions,
14 |         output_folder=output_folder,
15 |         logger=logger,
16 |     )
17 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/datasets/list_dataset.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | """
 3 | Simple dataset class that wraps a list of path names
 4 | """
 5 | 
 6 | from PIL import Image
 7 | 
 8 | from maskrcnn_benchmark.structures.bounding_box import BoxList
 9 | 
10 | 
11 | class ListDataset(object):
12 |     def __init__(self, image_lists, transforms=None):
13 |         self.image_lists = image_lists
14 |         self.transforms = transforms
15 | 
16 |     def __getitem__(self, item):
17 |         img = Image.open(self.image_lists[item]).convert("RGB")
18 | 
19 |         # dummy target
20 |         w, h = img.size
21 |         target = BoxList([[0, 0, w, h]], img.size, mode="xyxy")
22 | 
23 |         if self.transforms is not None:
24 |             img, target = self.transforms(img, target)
25 | 
26 |         return img, target
27 | 
28 |     def __len__(self):
29 |         return len(self.image_lists)
30 | 
31 |     def get_img_info(self, item):
32 |         """
33 |         Return the image dimensions for the image, without
34 |         loading and pre-processing it
35 |         """
36 |         pass
37 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/samplers/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .distributed import DistributedSampler
3 | from .grouped_batch_sampler import GroupedBatchSampler
4 | from .iteration_based_batch_sampler import IterationBasedBatchSampler
5 | 
6 | __all__ = ["DistributedSampler", "GroupedBatchSampler", "IterationBasedBatchSampler"]
7 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/samplers/iteration_based_batch_sampler.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from torch.utils.data.sampler import BatchSampler
 3 | 
 4 | 
 5 | class IterationBasedBatchSampler(BatchSampler):
 6 |     """
 7 |     Wraps a BatchSampler, resampling from it until
 8 |     a specified number of iterations have been sampled
 9 |     """
10 | 
11 |     def __init__(self, batch_sampler, num_iterations, start_iter=0):
12 |         self.batch_sampler = batch_sampler
13 |         self.num_iterations = num_iterations
14 |         self.start_iter = start_iter
15 | 
16 |     def __iter__(self):
17 |         iteration = self.start_iter
18 |         while iteration <= self.num_iterations:
19 |             # if the underlying sampler has a set_epoch method, like
20 |             # DistributedSampler, used for making each process see
21 |             # a different split of the dataset, then set it
22 |             if hasattr(self.batch_sampler.sampler, "set_epoch"):
23 |                 self.batch_sampler.sampler.set_epoch(iteration)
24 |             for batch in self.batch_sampler:
25 |                 iteration += 1
26 |                 if iteration > self.num_iterations:
27 |                     break
28 |                 yield batch
29 | 
30 |     def __len__(self):
31 |         return self.num_iterations
32 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/transforms/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .transforms import Compose
3 | from .transforms import Resize
4 | from .transforms import RandomHorizontalFlip
5 | from .transforms import ToTensor
6 | from .transforms import Normalize
7 | 
8 | from .build import build_transforms
9 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/data/transforms/build.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from . import transforms as T
 3 | 
 4 | 
 5 | def build_transforms(cfg, is_train=True):
 6 |     if is_train:
 7 |         min_size = cfg.INPUT.MIN_SIZE_TRAIN
 8 |         max_size = cfg.INPUT.MAX_SIZE_TRAIN
 9 |         flip_prob = 0.5  # cfg.INPUT.FLIP_PROB_TRAIN
10 |     else:
11 |         min_size = cfg.INPUT.MIN_SIZE_TEST
12 |         max_size = cfg.INPUT.MAX_SIZE_TEST
13 |         flip_prob = 0
14 | 
15 |     to_bgr255 = cfg.INPUT.TO_BGR255
16 |     normalize_transform = T.Normalize(
17 |         mean=cfg.INPUT.PIXEL_MEAN, std=cfg.INPUT.PIXEL_STD, to_bgr255=to_bgr255
18 |     )
19 | 
20 |     transform = T.Compose(
21 |         [
22 |             T.Resize(min_size, max_size),
23 |             T.RandomHorizontalFlip(flip_prob),
24 |             T.ToTensor(),
25 |             normalize_transform,
26 |         ]
27 |     )
28 |     return transform
29 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/engine/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/layers/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | from .batch_norm import FrozenBatchNorm2d
 5 | from .misc import Conv2d
 6 | from .misc import ConvTranspose2d
 7 | from .misc import BatchNorm2d
 8 | from .misc import interpolate
 9 | from .nms import nms
10 | from .roi_align import ROIAlign
11 | from .roi_align import roi_align
12 | from .roi_pool import ROIPool
13 | from .roi_pool import roi_pool
14 | from .smooth_l1_loss import smooth_l1_loss
15 | from .sigmoid_focal_loss import SigmoidFocalLoss
16 | 
17 | __all__ = ["nms", "roi_align", "ROIAlign", "roi_pool", "ROIPool",
18 |            "smooth_l1_loss", "Conv2d", "ConvTranspose2d", "interpolate",
19 |            "BatchNorm2d", "FrozenBatchNorm2d", "SigmoidFocalLoss"
20 |           ]
21 | 
22 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/layers/_utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import glob
 3 | import os.path
 4 | 
 5 | import torch
 6 | 
 7 | try:
 8 |     from torch.utils.cpp_extension import load as load_ext
 9 |     from torch.utils.cpp_extension import CUDA_HOME
10 | except ImportError:
11 |     raise ImportError("The cpp layer extensions requires PyTorch 0.4 or higher")
12 | 
13 | 
14 | def _load_C_extensions():
15 |     this_dir = os.path.dirname(os.path.abspath(__file__))
16 |     this_dir = os.path.dirname(this_dir)
17 |     this_dir = os.path.join(this_dir, "csrc")
18 | 
19 |     main_file = glob.glob(os.path.join(this_dir, "*.cpp"))
20 |     source_cpu = glob.glob(os.path.join(this_dir, "cpu", "*.cpp"))
21 |     source_cuda = glob.glob(os.path.join(this_dir, "cuda", "*.cu"))
22 | 
23 |     source = main_file + source_cpu
24 | 
25 |     extra_cflags = []
26 |     if torch.cuda.is_available() and CUDA_HOME is not None:
27 |         source.extend(source_cuda)
28 |         extra_cflags = ["-DWITH_CUDA"]
29 |     source = [os.path.join(this_dir, s) for s in source]
30 |     extra_include_paths = [this_dir]
31 |     return load_ext(
32 |         "torchvision",
33 |         source,
34 |         extra_cflags=extra_cflags,
35 |         extra_include_paths=extra_include_paths,
36 |     )
37 | 
38 | 
39 | _C = _load_C_extensions()
40 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/layers/batch_norm.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | from torch import nn
 4 | 
 5 | 
 6 | class FrozenBatchNorm2d(nn.Module):
 7 |     """
 8 |     BatchNorm2d where the batch statistics and the affine parameters
 9 |     are fixed
10 |     """
11 | 
12 |     def __init__(self, n):
13 |         super(FrozenBatchNorm2d, self).__init__()
14 |         self.register_buffer("weight", torch.ones(n))
15 |         self.register_buffer("bias", torch.zeros(n))
16 |         self.register_buffer("running_mean", torch.zeros(n))
17 |         self.register_buffer("running_var", torch.ones(n))
18 | 
19 |     def forward(self, x):
20 |         scale = self.weight * self.running_var.rsqrt()
21 |         bias = self.bias - self.running_mean * scale
22 |         scale = scale.reshape(1, -1, 1, 1)
23 |         bias = bias.reshape(1, -1, 1, 1)
24 |         return x * scale + bias
25 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/layers/nms.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | # from ._utils import _C
3 | from maskrcnn_benchmark import _C
4 | 
5 | nms = _C.nms
6 | # nms.__doc__ = """
7 | # This function performs Non-maximum suppresion"""
8 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/layers/smooth_l1_loss.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | 
 5 | # TODO maybe push this to nn?
 6 | def smooth_l1_loss(input, target, beta=1. / 9, size_average=True):
 7 |     """
 8 |     very similar to the smooth_l1_loss from pytorch, but with
 9 |     the extra beta parameter
10 |     """
11 |     n = torch.abs(input - target)
12 |     cond = n < beta
13 |     loss = torch.where(cond, 0.5 * n ** 2 / beta, n - 0.5 * beta)
14 |     if size_average:
15 |         return loss.mean()
16 |     return loss.sum()
17 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/RR_inference/maskrcnn_benchmark/modeling/__init__.py


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/backbone/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .backbone import build_backbone
3 | from . import fbnet
4 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/detector/.ipynb_checkpoints/detectors-checkpoint.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from .generalized_rcnn import GeneralizedRCNN
 3 | 
 4 | 
 5 | _DETECTION_META_ARCHITECTURES = {"GeneralizedRCNN": GeneralizedRCNN}
 6 | 
 7 | 
 8 | def build_detection_model(cfg):
 9 |     meta_arch = _DETECTION_META_ARCHITECTURES[cfg.MODEL.META_ARCHITECTURE]
10 |     return meta_arch(cfg)
11 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/detector/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .detectors import build_detection_model
3 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/detector/detectors.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from .generalized_rcnn import GeneralizedRCNN
 3 | 
 4 | 
 5 | _DETECTION_META_ARCHITECTURES = {"GeneralizedRCNN": GeneralizedRCNN}
 6 | 
 7 | 
 8 | def build_detection_model(cfg):
 9 |     meta_arch = _DETECTION_META_ARCHITECTURES[cfg.MODEL.META_ARCHITECTURE]
10 |     return meta_arch(cfg)
11 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/registry.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | from maskrcnn_benchmark.utils.registry import Registry
 4 | 
 5 | BACKBONES = Registry()
 6 | RPN_HEADS = Registry()
 7 | ROI_BOX_FEATURE_EXTRACTORS = Registry()
 8 | ROI_BOX_PREDICTOR = Registry()
 9 | ROI_KEYPOINT_FEATURE_EXTRACTORS = Registry()
10 | ROI_KEYPOINT_PREDICTOR = Registry()
11 | ROI_MASK_FEATURE_EXTRACTORS = Registry()
12 | ROI_MASK_PREDICTOR = Registry()
13 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/roi_heads/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/RR_inference/maskrcnn_benchmark/modeling/roi_heads/__init__.py


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/roi_heads/box_head/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/RR_inference/maskrcnn_benchmark/modeling/roi_heads/box_head/__init__.py


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/roi_heads/keypoint_head/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/RR_inference/maskrcnn_benchmark/modeling/roi_heads/keypoint_head/__init__.py


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/roi_heads/keypoint_head/roi_keypoint_predictors.py:
--------------------------------------------------------------------------------
 1 | from torch import nn
 2 | 
 3 | from maskrcnn_benchmark import layers
 4 | from maskrcnn_benchmark.modeling import registry
 5 | 
 6 | 
 7 | @registry.ROI_KEYPOINT_PREDICTOR.register("KeypointRCNNPredictor")
 8 | class KeypointRCNNPredictor(nn.Module):
 9 |     def __init__(self, cfg, in_channels):
10 |         super(KeypointRCNNPredictor, self).__init__()
11 |         input_features = in_channels
12 |         num_keypoints = cfg.MODEL.ROI_KEYPOINT_HEAD.NUM_CLASSES
13 |         deconv_kernel = 4
14 |         self.kps_score_lowres = layers.ConvTranspose2d(
15 |             input_features,
16 |             num_keypoints,
17 |             deconv_kernel,
18 |             stride=2,
19 |             padding=deconv_kernel // 2 - 1,
20 |         )
21 |         nn.init.kaiming_normal_(
22 |             self.kps_score_lowres.weight, mode="fan_out", nonlinearity="relu"
23 |         )
24 |         nn.init.constant_(self.kps_score_lowres.bias, 0)
25 |         self.up_scale = 2
26 |         self.out_channels = num_keypoints
27 | 
28 |     def forward(self, x):
29 |         x = self.kps_score_lowres(x)
30 |         x = layers.interpolate(
31 |             x, scale_factor=self.up_scale, mode="bilinear", align_corners=False
32 |         )
33 |         return x
34 | 
35 | 
36 | def make_roi_keypoint_predictor(cfg, in_channels):
37 |     func = registry.ROI_KEYPOINT_PREDICTOR[cfg.MODEL.ROI_KEYPOINT_HEAD.PREDICTOR]
38 |     return func(cfg, in_channels)
39 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/roi_heads/mask_head/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/RR_inference/maskrcnn_benchmark/modeling/roi_heads/mask_head/__init__.py


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/rpn/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | # from .rpn import build_rpn
3 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/rpn/retinanet/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/RR_inference/maskrcnn_benchmark/modeling/rpn/retinanet/__init__.py


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/modeling/utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | """
 3 | Miscellaneous utility functions
 4 | """
 5 | 
 6 | import torch
 7 | 
 8 | 
 9 | def cat(tensors, dim=0):
10 |     """
11 |     Efficient version of torch.cat that avoids a copy if there is only a single element in a list
12 |     """
13 |     assert isinstance(tensors, (list, tuple))
14 |     if len(tensors) == 1:
15 |         return tensors[0]
16 |     return torch.cat(tensors, dim)
17 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/solver/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .build import make_optimizer
3 | from .build import make_lr_scheduler
4 | from .lr_scheduler import WarmupMultiStepLR
5 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/solver/build.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | from .lr_scheduler import WarmupMultiStepLR
 5 | 
 6 | 
 7 | def make_optimizer(cfg, model):
 8 |     params = []
 9 |     for key, value in model.named_parameters():
10 |         if not value.requires_grad:
11 |             continue
12 |         lr = cfg.SOLVER.BASE_LR
13 |         weight_decay = cfg.SOLVER.WEIGHT_DECAY
14 |         if "bias" in key:
15 |             lr = cfg.SOLVER.BASE_LR * cfg.SOLVER.BIAS_LR_FACTOR
16 |             weight_decay = cfg.SOLVER.WEIGHT_DECAY_BIAS
17 |         params += [{"params": [value], "lr": lr, "weight_decay": weight_decay}]
18 | 
19 |     optimizer = torch.optim.SGD(params, lr, momentum=cfg.SOLVER.MOMENTUM)
20 |     return optimizer
21 | 
22 | 
23 | def make_lr_scheduler(cfg, optimizer):
24 |     return WarmupMultiStepLR(
25 |         optimizer,
26 |         cfg.SOLVER.STEPS,
27 |         cfg.SOLVER.GAMMA,
28 |         warmup_factor=cfg.SOLVER.WARMUP_FACTOR,
29 |         warmup_iters=cfg.SOLVER.WARMUP_ITERS,
30 |         warmup_method=cfg.SOLVER.WARMUP_METHOD,
31 |     )
32 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/structures/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/RR_inference/maskrcnn_benchmark/structures/__init__.py


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/utils/README.md:
--------------------------------------------------------------------------------
1 | # Utility functions
2 | 
3 | This folder contain utility functions that are not used in the
4 | core library, but are useful for building models or training
5 | code using the config system.
6 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/utils/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/RR_inference/maskrcnn_benchmark/utils/__init__.py


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/utils/collect_env.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import PIL
 3 | 
 4 | from torch.utils.collect_env import get_pretty_env_info
 5 | 
 6 | 
 7 | def get_pil_version():
 8 |     return "\n        Pillow ({})".format(PIL.__version__)
 9 | 
10 | 
11 | def collect_env_info():
12 |     env_str = get_pretty_env_info()
13 |     env_str += get_pil_version()
14 |     return env_str
15 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/utils/cv2_util.py:
--------------------------------------------------------------------------------
 1 | """
 2 | Module for cv2 utility functions and maintaining version compatibility
 3 | between 3.x and 4.x
 4 | """
 5 | import cv2
 6 | 
 7 | 
 8 | def findContours(*args, **kwargs):
 9 |     """
10 |     Wraps cv2.findContours to maintain compatiblity between versions
11 |     3 and 4
12 | 
13 |     Returns:
14 |         contours, hierarchy
15 |     """
16 |     if cv2.__version__.startswith('4'):
17 |         contours, hierarchy = cv2.findContours(*args, **kwargs)
18 |     elif cv2.__version__.startswith('3'):
19 |         _, contours, hierarchy = cv2.findContours(*args, **kwargs)
20 |     else:
21 |         raise AssertionError(
22 |             'cv2 must be either version 3 or 4 to call this method')
23 | 
24 |     return contours, hierarchy
25 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/utils/env.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import os
 3 | 
 4 | from maskrcnn_benchmark.utils.imports import import_file
 5 | 
 6 | 
 7 | def setup_environment():
 8 |     """Perform environment setup work. The default setup is a no-op, but this
 9 |     function allows the user to specify a Python source file that performs
10 |     custom setup work that may be necessary to their computing environment.
11 |     """
12 |     custom_module_path = os.environ.get("TORCH_DETECTRON_ENV_MODULE")
13 |     if custom_module_path:
14 |         setup_custom_environment(custom_module_path)
15 |     else:
16 |         # The default setup is a no-op
17 |         pass
18 | 
19 | 
20 | def setup_custom_environment(custom_module_path):
21 |     """Load custom environment setup from a Python source file and run the setup
22 |     function.
23 |     """
24 |     module = import_file("maskrcnn_benchmark.utils.env.custom_module", custom_module_path)
25 |     assert hasattr(module, "setup_environment") and callable(
26 |         module.setup_environment
27 |     ), (
28 |         "Custom environment module defined in {} does not have the "
29 |         "required callable attribute 'setup_environment'."
30 |     ).format(
31 |         custom_module_path
32 |     )
33 |     module.setup_environment()
34 | 
35 | 
36 | # Force environment setup when this module is imported
37 | setup_environment()
38 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/utils/imports.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | if torch._six.PY3:
 5 |     import importlib
 6 |     import importlib.util
 7 |     import sys
 8 | 
 9 | 
10 |     # from https://stackoverflow.com/questions/67631/how-to-import-a-module-given-the-full-path?utm_medium=organic&utm_source=google_rich_qa&utm_campaign=google_rich_qa
11 |     def import_file(module_name, file_path, make_importable=False):
12 |         spec = importlib.util.spec_from_file_location(module_name, file_path)
13 |         module = importlib.util.module_from_spec(spec)
14 |         spec.loader.exec_module(module)
15 |         if make_importable:
16 |             sys.modules[module_name] = module
17 |         return module
18 | else:
19 |     import imp
20 | 
21 |     def import_file(module_name, file_path, make_importable=None):
22 |         module = imp.load_source(module_name, file_path)
23 |         return module
24 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/utils/logger.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import logging
 3 | import os
 4 | import sys
 5 | 
 6 | 
 7 | def setup_logger(name, save_dir, distributed_rank, filename="log.txt"):
 8 |     logger = logging.getLogger(name)
 9 |     logger.setLevel(logging.DEBUG)
10 |     # don't log results for the non-master process
11 |     if distributed_rank > 0:
12 |         return logger
13 |     ch = logging.StreamHandler(stream=sys.stdout)
14 |     ch.setLevel(logging.DEBUG)
15 |     formatter = logging.Formatter("%(asctime)s %(name)s %(levelname)s: %(message)s")
16 |     ch.setFormatter(formatter)
17 |     logger.addHandler(ch)
18 | 
19 |     if save_dir:
20 |         fh = logging.FileHandler(os.path.join(save_dir, filename))
21 |         fh.setLevel(logging.DEBUG)
22 |         fh.setFormatter(formatter)
23 |         logger.addHandler(fh)
24 | 
25 |     return logger
26 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/utils/miscellaneous.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import errno
 3 | import os
 4 | 
 5 | 
 6 | def mkdir(path):
 7 |     try:
 8 |         os.makedirs(path)
 9 |     except OSError as e:
10 |         if e.errno != errno.EEXIST:
11 |             raise
12 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/utils/registry.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | 
 4 | def _register_generic(module_dict, module_name, module):
 5 |     assert module_name not in module_dict
 6 |     module_dict[module_name] = module
 7 | 
 8 | 
 9 | class Registry(dict):
10 |     '''
11 |     A helper class for managing registering modules, it extends a dictionary
12 |     and provides a register functions.
13 | 
14 |     Eg. creeting a registry:
15 |         some_registry = Registry({"default": default_module})
16 | 
17 |     There're two ways of registering new modules:
18 |     1): normal way is just calling register function:
19 |         def foo():
20 |             ...
21 |         some_registry.register("foo_module", foo)
22 |     2): used as decorator when declaring the module:
23 |         @some_registry.register("foo_module")
24 |         @some_registry.register("foo_modeul_nickname")
25 |         def foo():
26 |             ...
27 | 
28 |     Access of module is just like using a dictionary, eg:
29 |         f = some_registry["foo_modeul"]
30 |     '''
31 |     def __init__(self, *args, **kwargs):
32 |         super(Registry, self).__init__(*args, **kwargs)
33 | 
34 |     def register(self, module_name, module=None):
35 |         # used as function call
36 |         if module is not None:
37 |             _register_generic(self, module_name, module)
38 |             return
39 | 
40 |         # used as decorator
41 |         def register_fn(fn):
42 |             _register_generic(self, module_name, fn)
43 |             return fn
44 | 
45 |         return register_fn
46 | 


--------------------------------------------------------------------------------
/RR_inference/maskrcnn_benchmark/utils/timer.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | 
 4 | import time
 5 | import datetime
 6 | 
 7 | 
 8 | class Timer(object):
 9 |     def __init__(self):
10 |         self.reset()
11 | 
12 |     @property
13 |     def average_time(self):
14 |         return self.total_time / self.calls if self.calls > 0 else 0.0
15 | 
16 |     def tic(self):
17 |         # using time.time instead of time.clock because time time.clock
18 |         # does not normalize for multithreading
19 |         self.start_time = time.time()
20 | 
21 |     def toc(self, average=True):
22 |         self.add(time.time() - self.start_time)
23 |         if average:
24 |             return self.average_time
25 |         else:
26 |             return self.diff
27 | 
28 |     def add(self, time_diff):
29 |         self.diff = time_diff
30 |         self.total_time += self.diff
31 |         self.calls += 1
32 | 
33 |     def reset(self):
34 |         self.total_time = 0.0
35 |         self.calls = 0
36 |         self.start_time = 0.0
37 |         self.diff = 0.0
38 | 
39 |     def avg_time_str(self):
40 |         time_str = str(datetime.timedelta(seconds=self.average_time))
41 |         return time_str
42 | 
43 | 
44 | def get_time_str(time_diff):
45 |     time_str = str(datetime.timedelta(seconds=time_diff))
46 |     return time_str
47 | 


--------------------------------------------------------------------------------
/RR_inference/requirements.txt:
--------------------------------------------------------------------------------
1 | ninja
2 | yacs
3 | cython
4 | matplotlib
5 | tqdm
6 | 


--------------------------------------------------------------------------------
/RR_inference/tests/env_tests/env.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | import os
 4 | 
 5 | 
 6 | def get_config_root_path():
 7 |     ''' Path to configs for unit tests '''
 8 |     # cur_file_dir is root/tests/env_tests
 9 |     cur_file_dir = os.path.dirname(os.path.abspath(os.path.realpath(__file__)))
10 |     ret = os.path.dirname(os.path.dirname(cur_file_dir))
11 |     ret = os.path.join(ret, "configs")
12 |     return ret
13 | 


--------------------------------------------------------------------------------
/RR_inference/tests/test_configs.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | import unittest
 4 | import glob
 5 | import os
 6 | import utils
 7 | 
 8 | 
 9 | class TestConfigs(unittest.TestCase):
10 |     def test_configs_load(self):
11 |         ''' Make sure configs are loadable '''
12 | 
13 |         cfg_root_path = utils.get_config_root_path()
14 |         files = glob.glob(
15 |             os.path.join(cfg_root_path, "./**/*.yaml"), recursive=True)
16 |         self.assertGreater(len(files), 0)
17 | 
18 |         for fn in files:
19 |             print('Loading {}...'.format(fn))
20 |             utils.load_config_from_file(fn)
21 | 
22 | 
23 | if __name__ == "__main__":
24 |     unittest.main()
25 | 


--------------------------------------------------------------------------------
/RR_inference/tests/test_metric_logger.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import unittest
 3 | 
 4 | from maskrcnn_benchmark.utils.metric_logger import MetricLogger
 5 | 
 6 | 
 7 | class TestMetricLogger(unittest.TestCase):
 8 |     def test_update(self):
 9 |         meter = MetricLogger()
10 |         for i in range(10):
11 |             meter.update(metric=float(i))
12 |         
13 |         m = meter.meters["metric"]
14 |         self.assertEqual(m.count, 10)
15 |         self.assertEqual(m.total, 45)
16 |         self.assertEqual(m.median, 4)
17 |         self.assertEqual(m.avg, 4.5)
18 | 
19 |     def test_no_attr(self):
20 |         meter = MetricLogger()
21 |         _ = meter.meters
22 |         _ = meter.delimiter
23 |         def broken():
24 |             _ = meter.not_existent
25 |         self.assertRaises(AttributeError, broken)
26 | 
27 | if __name__ == "__main__":
28 |     unittest.main()
29 | 


--------------------------------------------------------------------------------
/RR_inference/tests/utils.py:
--------------------------------------------------------------------------------
 1 | from __future__ import absolute_import, division, print_function, unicode_literals
 2 | 
 3 | # Set up custom environment before nearly anything else is imported
 4 | # NOTE: this should be the first import (no not reorder)
 5 | from maskrcnn_benchmark.utils.env import setup_environment  # noqa F401 isort:skip
 6 | import env_tests.env as env_tests
 7 | 
 8 | import os
 9 | import copy
10 | 
11 | from maskrcnn_benchmark.config import cfg as g_cfg
12 | 
13 | 
14 | def get_config_root_path():
15 |     return env_tests.get_config_root_path()
16 | 
17 | 
18 | def load_config(rel_path):
19 |     ''' Load config from file path specified as path relative to config_root '''
20 |     cfg_path = os.path.join(env_tests.get_config_root_path(), rel_path)
21 |     return load_config_from_file(cfg_path)
22 | 
23 | 
24 | def load_config_from_file(file_path):
25 |     ''' Load config from file path specified as absolute path '''
26 |     ret = copy.deepcopy(g_cfg)
27 |     ret.merge_from_file(file_path)
28 |     return ret
29 | 


--------------------------------------------------------------------------------
/refs/raw.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ennauata/buildings2vec/c4cc103aec1aece08c86dfd945753405abb1ad3d/refs/raw.jpg


--------------------------------------------------------------------------------