├── .gitignore
├── ABSTRACTIONS.md
├── CODE_OF_CONDUCT.md
├── DATASET.md
├── INSTALL.md
├── LICENSE
├── MODELZOO.md
├── README.md
├── TROUBLESHOOTING.md
├── cmd.cache
├── configs
├── arichived
│   ├── caffe2
│   │   ├── e2e_faster_rcnn_R_101_FPN_1x_caffe2.yaml
│   │   ├── e2e_faster_rcnn_R_50_C4_1x_caffe2.yaml
│   │   ├── e2e_faster_rcnn_R_50_FPN_1x_caffe2.yaml
│   │   ├── e2e_faster_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml
│   │   ├── e2e_keypoint_rcnn_R_50_FPN_1x_caffe2.yaml
│   │   ├── e2e_mask_rcnn_R_101_FPN_1x_caffe2.yaml
│   │   ├── e2e_mask_rcnn_R_50_C4_1x_caffe2.yaml
│   │   ├── e2e_mask_rcnn_R_50_FPN_1x_caffe2.yaml
│   │   ├── e2e_mask_rcnn_X-152-32x8d-FPN-IN5k_1.44x_caffe2.yaml
│   │   └── e2e_mask_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml
│   ├── cityscapes
│   │   ├── README.md
│   │   ├── e2e_faster_rcnn_R_50_FPN_1x_cocostyle.yaml
│   │   └── e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml
│   ├── dcn
│   │   ├── README.md
│   │   ├── e2e_faster_rcnn_dconv_R_50_FPN_1x.yaml
│   │   ├── e2e_faster_rcnn_mdconv_R_50_FPN_1x.yaml
│   │   ├── e2e_mask_rcnn_dconv_R_50_FPN_1x.yaml
│   │   └── e2e_mask_rcnn_mdconv_R_50_FPN_1x.yaml
│   ├── gn_baselines
│   │   ├── README.md
│   │   ├── e2e_faster_rcnn_R_50_FPN_1x_gn.yaml
│   │   ├── e2e_faster_rcnn_R_50_FPN_Xconv1fc_1x_gn.yaml
│   │   ├── e2e_mask_rcnn_R_50_FPN_1x_gn.yaml
│   │   ├── e2e_mask_rcnn_R_50_FPN_Xconv1fc_1x_gn.yaml
│   │   ├── scratch_e2e_faster_rcnn_R_50_FPN_3x_gn.yaml
│   │   ├── scratch_e2e_faster_rcnn_R_50_FPN_Xconv1fc_3x_gn.yaml
│   │   ├── scratch_e2e_mask_rcnn_R_50_FPN_3x_gn.yaml
│   │   └── scratch_e2e_mask_rcnn_R_50_FPN_Xconv1fc_3x_gn.yaml
│   ├── maskrcnn_benchmark_models
│   │   ├── e2e_faster_rcnn_R_101_FPN_1x.yaml
│   │   ├── e2e_faster_rcnn_R_50_C4_1x.yaml
│   │   ├── e2e_faster_rcnn_R_50_FPN_1x.yaml
│   │   ├── e2e_faster_rcnn_X_101_32x8d_FPN_1x.yaml
│   │   ├── e2e_faster_rcnn_fbnet.yaml
│   │   ├── e2e_faster_rcnn_fbnet_600.yaml
│   │   ├── e2e_faster_rcnn_fbnet_chamv1a_600.yaml
│   │   ├── e2e_keypoint_rcnn_R_50_FPN_1x.yaml
│   │   ├── e2e_mask_rcnn_R_101_FPN_1x.yaml
│   │   ├── e2e_mask_rcnn_R_50_C4_1x.yaml
│   │   ├── e2e_mask_rcnn_R_50_FPN_1x.yaml
│   │   ├── e2e_mask_rcnn_X_101_32x8d_FPN_1x.yaml
│   │   ├── e2e_mask_rcnn_fbnet.yaml
│   │   ├── e2e_mask_rcnn_fbnet_600.yaml
│   │   ├── e2e_mask_rcnn_fbnet_xirb16d_dsmask.yaml
│   │   ├── e2e_mask_rcnn_fbnet_xirb16d_dsmask_600.yaml
│   │   ├── rpn_R_101_FPN_1x.yaml
│   │   ├── rpn_R_50_C4_1x.yaml
│   │   ├── rpn_R_50_FPN_1x.yaml
│   │   └── rpn_X_101_32x8d_FPN_1x.yaml
│   ├── pascal_voc
│   │   ├── e2e_faster_rcnn_R_50_C4_1x_1_gpu_voc.yaml
│   │   ├── e2e_faster_rcnn_R_50_C4_1x_4_gpu_voc.yaml
│   │   └── e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml
│   ├── quick_schedules
│   │   ├── e2e_faster_rcnn_R_50_C4_quick.yaml
│   │   ├── e2e_faster_rcnn_R_50_FPN_quick.yaml
│   │   ├── e2e_faster_rcnn_X_101_32x8d_FPN_quick.yaml
│   │   ├── e2e_keypoint_rcnn_R_50_FPN_quick.yaml
│   │   ├── e2e_mask_rcnn_R_50_C4_quick.yaml
│   │   ├── e2e_mask_rcnn_R_50_FPN_quick.yaml
│   │   ├── e2e_mask_rcnn_X_101_32x8d_FPN_quick.yaml
│   │   ├── rpn_R_50_C4_quick.yaml
│   │   └── rpn_R_50_FPN_quick.yaml
│   ├── retinanet
│   │   ├── retinanet_R-101-FPN_1x.yaml
│   │   ├── retinanet_R-101-FPN_P5_1x.yaml
│   │   ├── retinanet_R-50-FPN_1x.yaml
│   │   ├── retinanet_R-50-FPN_1x_quick.yaml
│   │   ├── retinanet_R-50-FPN_P5_1x.yaml
│   │   └── retinanet_X_101_32x8d_FPN_1x.yaml
│   └── test_time_aug
│   │   └── e2e_mask_rcnn_R_50_FPN_1x.yaml
├── e2e_relBGNN_oiv4.yaml
├── e2e_relBGNN_oiv6.yaml
├── e2e_relBGNN_vg.yaml
├── e2e_relation_R_101_FPN_1x.yaml
├── e2e_relation_R_50_C4_1x.yaml
├── e2e_relation_R_50_C4_1x_motifs.yaml
├── e2e_relation_R_50_C4_1x_msdn.yaml
├── e2e_relation_R_50_C4_1x_naive_model.yaml
├── e2e_relation_VGG16_1x.yaml
├── e2e_relation_X_101_32_8_FPN_1x.yaml
├── e2e_relation_det_R_50_C4_1x.yaml
├── e2e_relation_detector_R_101_FPN_1x.yaml
├── e2e_relation_detector_VGG16_1x.yaml
├── e2e_relation_detector_X_101_32_8_FPN_1x.yaml
└── e2e_relation_non_graph.yaml
├── demo
├── .gitignore
├── README.md
├── TDE_Results1.png
├── TDE_Results2.png
├── TDE_Results3.png
├── demo_e2e_mask_rcnn_R_50_FPN_1x.png
├── demo_e2e_mask_rcnn_X_101_32x8d_FPN_1x.png
├── output_format.png
├── predictor.py
├── relation_head.png
├── teaser_figure.png
├── vis_demo
│   ├── __init__.py
│   ├── manage.py
│   ├── settings.py
│   ├── thesis_demo
│   │   ├── __init__.py
│   │   ├── admin.py
│   │   ├── apps.py
│   │   ├── cfgs
│   │   │   └── config.yml
│   │   ├── migrations
│   │   │   └── __init__.py
│   │   ├── models.py
│   │   ├── my_tranform.py
│   │   ├── templates
│   │   │   ├── res_vis.html
│   │   │   └── upload.html
│   │   ├── tests.py
│   │   ├── urls.py
│   │   ├── views.py
│   │   └── vrd_demo.py
│   ├── urls.py
│   ├── vis_demo
│   │   ├── __init__.py
│   │   ├── settings.py
│   │   ├── urls.py
│   │   └── wsgi.py
│   └── wsgi.py
└── webcam.py
├── docker
├── Dockerfile
└── docker-jupyter
│   ├── Dockerfile
│   └── jupyter_notebook_config.py
├── pysgg
├── __init__.py
├── config
│   ├── __init__.py
│   ├── defaults.py
│   └── paths_catalog.py
├── csrc
│   ├── ROIAlign.h
│   ├── ROIPool.h
│   ├── SigmoidFocalLoss.h
│   ├── cpu
│   │   ├── ROIAlign_cpu.cpp
│   │   ├── nms_cpu.cpp
│   │   └── vision.h
│   ├── cuda
│   │   ├── ROIAlign_cuda.cu
│   │   ├── ROIPool_cuda.cu
│   │   ├── SigmoidFocalLoss_cuda.cu
│   │   ├── deform_conv_cuda.cu
│   │   ├── deform_conv_kernel_cuda.cu
│   │   ├── deform_pool_cuda.cu
│   │   ├── deform_pool_kernel_cuda.cu
│   │   ├── nms.cu
│   │   └── vision.h
│   ├── deform_conv.h
│   ├── deform_pool.h
│   ├── nms.h
│   └── vision.cpp
├── data
│   ├── README.md
│   ├── __init__.py
│   ├── build.py
│   ├── collate_batch.py
│   ├── datasets
│   │   ├── __init__.py
│   │   ├── bi_lvl_rsmp.py
│   │   ├── coco.py
│   │   ├── concat_dataset.py
│   │   ├── evaluation
│   │   │   ├── __init__.py
│   │   │   ├── coco
│   │   │   │   ├── __init__.py
│   │   │   │   └── coco_eval.py
│   │   │   ├── oi
│   │   │   │   ├── __init__.py
│   │   │   │   ├── ap_eval_rel.py
│   │   │   │   └── oi_evaluation.py
│   │   │   ├── vg
│   │   │   │   ├── __init__.py
│   │   │   │   ├── sgg_eval.py
│   │   │   │   ├── vg_capgraphs_anno.json
│   │   │   │   ├── vg_eval.py
│   │   │   │   ├── vg_stage_eval_utils.py
│   │   │   │   ├── vg_test_capgraph_anno.json
│   │   │   │   ├── vg_test_caption_anno.json
│   │   │   │   └── zeroshot_triplet.pytorch
│   │   │   └── voc
│   │   │   │   ├── __init__.py
│   │   │   │   └── voc_eval.py
│   │   ├── list_dataset.py
│   │   ├── open_image.py
│   │   ├── visual_genome.py
│   │   └── voc.py
│   ├── samplers
│   │   ├── __init__.py
│   │   ├── distributed.py
│   │   ├── grouped_batch_sampler.py
│   │   └── iteration_based_batch_sampler.py
│   └── transforms
│   │   ├── __init__.py
│   │   ├── build.py
│   │   └── transforms.py
├── engine
│   ├── __init__.py
│   ├── bbox_aug.py
│   ├── inference.py
│   └── trainer.py
├── image_retrieval
│   ├── S2G-RETRIEVAL.md
│   ├── __init__.py
│   ├── dataloader.py
│   ├── evaluation.py
│   ├── model.py
│   ├── modelv2.py
│   └── preprocessing.py
├── layers
│   ├── __init__.py
│   ├── _utils.py
│   ├── batch_norm.py
│   ├── dcn
│   │   ├── __init__.py
│   │   ├── deform_conv_func.py
│   │   ├── deform_conv_module.py
│   │   ├── deform_pool_func.py
│   │   └── deform_pool_module.py
│   ├── entropy_loss.py
│   ├── kl_div_loss.py
│   ├── label_smoothing_loss.py
│   ├── misc.py
│   ├── nms.py
│   ├── roi_align.py
│   ├── roi_pool.py
│   ├── sigmoid_focal_loss.py
│   └── smooth_l1_loss.py
├── modeling
│   ├── __init__.py
│   ├── backbone
│   │   ├── __init__.py
│   │   ├── backbone.py
│   │   ├── fbnet.py
│   │   ├── fbnet_builder.py
│   │   ├── fbnet_modeldef.py
│   │   ├── fpn.py
│   │   ├── resnet.py
│   │   └── vgg.py
│   ├── balanced_positive_negative_sampler.py
│   ├── box_coder.py
│   ├── detector
│   │   ├── __init__.py
│   │   ├── detectors.py
│   │   └── generalized_rcnn.py
│   ├── make_layers.py
│   ├── matcher.py
│   ├── poolers.py
│   ├── registry.py
│   ├── roi_heads
│   │   ├── __init__.py
│   │   ├── attribute_head
│   │   │   ├── __init__.py
│   │   │   ├── attribute_head.py
│   │   │   ├── loss.py
│   │   │   ├── roi_attribute_feature_extractors.py
│   │   │   └── roi_attribute_predictors.py
│   │   ├── box_head
│   │   │   ├── __init__.py
│   │   │   ├── box_head.py
│   │   │   ├── inference.py
│   │   │   ├── loss.py
│   │   │   ├── roi_box_feature_extractors.py
│   │   │   ├── roi_box_predictors.py
│   │   │   └── sampling.py
│   │   ├── keypoint_head
│   │   │   ├── __init__.py
│   │   │   ├── inference.py
│   │   │   ├── keypoint_head.py
│   │   │   ├── loss.py
│   │   │   ├── roi_keypoint_feature_extractors.py
│   │   │   └── roi_keypoint_predictors.py
│   │   ├── mask_head
│   │   │   ├── __init__.py
│   │   │   ├── inference.py
│   │   │   ├── loss.py
│   │   │   ├── mask_head.py
│   │   │   ├── roi_mask_feature_extractors.py
│   │   │   └── roi_mask_predictors.py
│   │   ├── relation_head
│   │   │   ├── __init__.py
│   │   │   ├── classifier.py
│   │   │   ├── inference.py
│   │   │   ├── loss.py
│   │   │   ├── model_agcn.py
│   │   │   ├── model_bgnn.py
│   │   │   ├── model_gpsnet.py
│   │   │   ├── model_kern.py
│   │   │   ├── model_motifs.py
│   │   │   ├── model_motifs_with_attribute.py
│   │   │   ├── model_msdn.py
│   │   │   ├── model_msg_passing.py
│   │   │   ├── model_naive.py
│   │   │   ├── model_transformer.py
│   │   │   ├── model_vctree.py
│   │   │   ├── model_vtranse.py
│   │   │   ├── rel_proposal_network
│   │   │   │   ├── __init__.py
│   │   │   │   ├── loss.py
│   │   │   │   └── models.py
│   │   │   ├── relation_head.py
│   │   │   ├── roi_relation_feature_extractors.py
│   │   │   ├── roi_relation_predictors.py
│   │   │   ├── sampling.py
│   │   │   ├── utils_motifs.py
│   │   │   ├── utils_relation.py
│   │   │   ├── utils_treelstm.py
│   │   │   └── utils_vctree.py
│   │   └── roi_heads.py
│   ├── rpn
│   │   ├── __init__.py
│   │   ├── anchor_generator.py
│   │   ├── inference.py
│   │   ├── loss.py
│   │   ├── retinanet
│   │   │   ├── __init__.py
│   │   │   ├── inference.py
│   │   │   ├── loss.py
│   │   │   └── retinanet.py
│   │   ├── rpn.py
│   │   └── utils.py
│   └── utils.py
├── solver
│   ├── __init__.py
│   ├── build.py
│   └── lr_scheduler.py
├── structures
│   ├── __init__.py
│   ├── bounding_box.py
│   ├── boxlist_ops.py
│   ├── image_list.py
│   ├── keypoint.py
│   └── segmentation_mask.py
└── utils
│   ├── README.md
│   ├── __init__.py
│   ├── c2_model_loading.py
│   ├── checkpoint.py
│   ├── collect_env.py
│   ├── comm.py
│   ├── cv2_util.py
│   ├── env.py
│   ├── global_buffer.py
│   ├── imports.py
│   ├── logger.py
│   ├── metric_logger.py
│   ├── miscellaneous.py
│   ├── model_serialization.py
│   ├── model_zoo.py
│   ├── registry.py
│   ├── timer.py
│   └── visualize_graph.py
├── requirements.txt
├── scripts
├── rel_test.sh
├── rel_train_BGNN_oiv4.sh
├── rel_train_BGNN_oiv6.sh
├── rel_train_BGNN_vg.sh
└── rel_train_BGNN_vg_predcls.sh
├── setup.py
├── tests
├── checkpoint.py
├── env_tests
│   └── env.py
├── test_backbones.py
├── test_box_coder.py
├── test_configs.py
├── test_data_samplers.py
├── test_detectors.py
├── test_fbnet.py
├── test_feature_extractors.py
├── test_metric_logger.py
├── test_nms.py
├── test_predictors.py
├── test_rpn_heads.py
├── test_segmentation_mask.py
└── utils.py
└── tools
├── cityscapes
├── convert_cityscapes_to_coco.py
└── instances2dict_with_polygons.py
├── detector_pretest_net.py
├── detector_pretrain_net.py
├── image_retrieval_main.py
├── relation_test_net.py
├── relation_train_net.py
├── runner.py
└── visualize_bbox.ipynb
/.gitignore: -------------------------------------------------------------------------------- 1 | # compilation and distribution 2 | __pycache__ 3 | _ext 4 | *.pyc 5 | *.so 6 | maskrcnn_benchmark.egg-info/ 7 | pysgg.egg-info/ 8 |
build/ 9 | dist/ 10 | 11 | # ipython/jupyter notebooks 12 | #*.ipynb 13 | **/.ipynb_checkpoints/ 14 | 15 | # Editor temporaries 16 | *.swn 17 | *.swo 18 | *.swp 19 | *~ 20 | 21 | # Pycharm editor settings 22 | .idea 23 | 24 | # vscode editor settings 25 | .vscode 26 | .github 27 | 28 | .flake8 29 | 30 | # MacOS 31 | .DS_Store 32 | 33 | scripts/* 34 | 35 | pymp-* 36 | 37 | jupyter 38 | 39 | .nfs* 40 | 41 | /datasets 42 | /checkpoints 43 | 44 | 45 | .vsub 46 | service*.out.node* 47 | --------------------------------------------------------------------------------
/CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- 1 | # Code of Conduct 2 | 3 | Facebook has adopted a Code of Conduct that we expect project participants to adhere to. 4 | Please read the [full text](https://code.fb.com/codeofconduct/) 5 | so that you can understand what actions will and will not be tolerated. 6 | --------------------------------------------------------------------------------
/INSTALL.md: -------------------------------------------------------------------------------- 1 | ## Installation 2 | 3 | Most of the requirements of this project are exactly the same as [maskrcnn-benchmark](https://github.com/facebookresearch/maskrcnn-benchmark). If you have any problems with your environment, you should check their [issues page](https://github.com/facebookresearch/maskrcnn-benchmark/issues) first; you will likely find the answer there. 4 | 5 | ### Requirements: 6 | - PyTorch >= 1.4 7 | - torchvision >= 0.4 8 | - cocoapi 9 | - yacs 10 | - matplotlib 11 | - GCC >= 4.9 12 | - OpenCV 13 | 14 | 15 | ### Step-by-step installation 16 | 17 | ```bash 18 | # first, make sure that your conda is set up properly with the right environment 19 | # for that, check that `which conda`, `which pip` and `which python` point to the 20 | # right paths.
From a clean conda env, this is what you need to do 21 | 22 | conda create -y --name pysgg 23 | conda activate pysgg 24 | 25 | # this installs the right pip and dependencies for the fresh python 26 | conda install -y ipython scipy h5py 27 | 28 | # scene_graph_benchmark and coco api dependencies 29 | pip install ninja yacs cython matplotlib tqdm opencv-python overrides gpustat gitpython ipdb graphviz tensorboardx termcolor scikit-learn==0.23.1 30 | 31 | # follow the PyTorch installation instructions at https://pytorch.org/get-started/locally/ 32 | conda install pytorch==1.4.0 torchvision==0.5.0 cudatoolkit=10.1 -c pytorch 33 | 34 | export INSTALL_DIR=$PWD 35 | 36 | # install pycocotools 37 | cd $INSTALL_DIR 38 | git clone https://github.com/cocodataset/cocoapi.git 39 | cd cocoapi/PythonAPI 40 | python setup.py build_ext install 41 | 42 | # install apex 43 | cd $INSTALL_DIR 44 | git clone https://github.com/NVIDIA/apex.git 45 | cd apex 46 | git checkout f37fdf07367a71521bd14fec66153e0996ad128c 47 | python setup.py install --cuda_ext --cpp_ext 48 | 49 | # install PyTorch Detection 50 | cd $INSTALL_DIR 51 | git clone https://github.com/KaihuaTang/Scene-Graph-Benchmark.pytorch.git 52 | cd Scene-Graph-Benchmark.pytorch  # i.e. the cloned repo root (the directory containing setup.py) 53 | 54 | # the following will install the lib with 55 | # symbolic links, so that you can modify 56 | # the files if you want and won't need to 57 | # re-build it 58 | python setup.py build develop 59 | 60 | 61 | unset INSTALL_DIR 62 | ``` --------------------------------------------------------------------------------
/LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | The code is directly modified from facebook/maskrcnn-benchmark. I don't know what kind of license should be used here. --------------------------------------------------------------------------------
/MODELZOO.md: -------------------------------------------------------------------------------- 1 | # Model Zoo 2 | 3 | ## Evaluation Metrics 4 | We follow the same evaluation protocols and metrics as [Scene-Graph-Benchmark.pytorch](https://github.com/KaihuaTang/Scene-Graph-Benchmark.pytorch/blob/master/METRICS.md) (Visual Genome dataset) and [Graphical Contrastive Losses for Scene Graph Parsing](https://github.com/NVIDIA/ContrastiveLosses4VRD) (OpenImages V4/V6). 5 | 6 | 7 | ## Reported Results 8 | 9 | Here we list the SGGen results that can be produced by our codebase with the X-101-FPN backbone. 10 | We reimplemented these methods according to the official implementations released by their authors. 11 | 12 | ∗ denotes that LVIS resampling is applied to the model.
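To make the tables below easier to read: R@K is the fraction of ground-truth ⟨subject, predicate, object⟩ triplets recovered among an image's top-K predictions, while mR@K first computes recall per predicate class and then averages over classes, so rare ("tail") predicates weigh as much as frequent ("head") ones. The snippet below is only an illustrative sketch of that bookkeeping, not the evaluation code of this repo (the real implementation, including box IoU matching, lives in pysgg/data/datasets/evaluation/vg/sgg_eval.py); it assumes predicted triplets are already matched to ground-truth boxes and sorted by confidence.

```python
# Illustrative sketch of R@K and mR@K; see sgg_eval.py for the real metrics.
from collections import defaultdict

def recall_at_k(gt, pred, k):
    """R@K for one image. gt/pred are lists of (subj, predicate, obj)
    label triplets; pred must be sorted by decreasing confidence."""
    hits = set(pred[:k]) & set(gt)
    return len(hits) / max(len(gt), 1)

def mean_recall_at_k(gt_per_image, pred_per_image, k):
    """mR@K over a dataset: recall per predicate class, averaged over classes."""
    n_gt, n_hit = defaultdict(int), defaultdict(int)
    for gt, pred in zip(gt_per_image, pred_per_image):
        top_k = set(pred[:k])
        for triplet in gt:
            n_gt[triplet[1]] += 1              # GT instances per predicate
            n_hit[triplet[1]] += triplet in top_k
    return sum(n_hit[p] / n_gt[p] for p in n_gt) / max(len(n_gt), 1)

# toy usage
gt = [("man", "riding", "horse"), ("man", "wearing", "hat")]
pred = [("man", "riding", "horse"), ("man", "on", "horse"), ("man", "near", "hat")]
print(recall_at_k(gt, pred, 2))  # 0.5: one of the two GT triplets is in the top-2
```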
13 | 14 | ### VG 15 | | Model(SGGen) | mR@50 | mR@100 | R@50 | R@100 | head | body | tail | 16 | |--------------|:-----:|:------:|:----:|:-----:|------|------|------| 17 | | RelDN | 6.0 | 7.3 | 31.4 | 35.9 | 34.1 | 6.6 | 1.1 | 18 | | Motifs | 5.5 | 6.8 | 32.1 | 36.9 | 36.1 | 7.0| 0.0 | 19 | | Motifs∗ | 7.7 | 9.4 | 31.7 | 35.8 | 34.2 | 8.6 | 2.1 | 20 | | VCTree | 10.9 | 13.5 | 29.8 | 34.6 | -| - | -| 21 | | G-RCNN | 5.8 | 6.7 | 29.78 | 32.8 | 28.6 | 6.5 | 0.1 | 22 | | MSDN | 6.1 | 7.2 | 31.9 | 36.6 | 35.1 | 5.5 | 0.0 | 23 | | Unbiased | 9.3 | 11.1 | 19.4 | 23.2 | 24.5 | 13.9 | 0.1 | 24 | | GPS-Net | 6.79 | 8.6 | 31.1 | 35.9 | 34.5 | 7.0 | 1.0 | 25 | | GPS-Net* | 7.4 | 9.5 | 27.8 | 32.1 | 30.4 | 8.5 | 3.8 | 26 | | BGNN | 10.9 | 13.55 | 29.8 | 34.6 | 33.4 | 13.4 | 6.4 | 27 | 28 | 29 | ### OIv6 30 | | Model(SGGen) | mR@50 | R@50 | wmAP_rel | wmAP_phr | score_wtd | 31 | |---|:---:|:---:|:---:|:---:|---| 32 | | RelDN | 33.98 | 73.08 | 32.16 | 33.39 | 40.84 33 | | RelDN* | 37.20 | 75.34 | 33.21 | 34.31 | 41.97 34 | | VCTree | 33.91 | 74.08 | 34.16 | 33.11 | 40.21 35 | | G-RCNN | 34.04 | 74.51 | 33.15 | 34.21 | 41.84 36 | | Motifs | 32.68 | 71.63 | 29.91 | 31.59 | 38.93 37 | | Unbiased | 35.47 | 69.30 | 30.74 | 32.80 | 39.27 38 | | GPS-Net | 35.26 | 74.81 | 32.85 | 33.98 | 41.69 39 | | GPS-Net* | 38.93 | 74.74 | 32.77 | 33.87 | 41.60 40 | | BGNN | 41.71 | 74.96 | 33.83 | 34.87 | 42.47 | 41 | 42 | -------------------------------------------------------------------------------- /configs/arichived/caffe2/e2e_faster_rcnn_R_101_FPN_1x_caffe2.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://Caffe2Detectron/COCO/35857890/e2e_faster_rcnn_R-101-FPN_1x" 4 | BACKBONE: 5 | CONV_BODY: "R-101-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | DATASETS: 24 | TEST: ("coco_2014_minival",) 25 | DATALOADER: 26 | SIZE_DIVISIBILITY: 32 27 | -------------------------------------------------------------------------------- /configs/arichived/caffe2/e2e_faster_rcnn_R_50_C4_1x_caffe2.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://Caffe2Detectron/COCO/35857197/e2e_faster_rcnn_R-50-C4_1x" 4 | DATASETS: 5 | TEST: ("coco_2014_minival",) 6 | -------------------------------------------------------------------------------- /configs/arichived/caffe2/e2e_faster_rcnn_R_50_FPN_1x_caffe2.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://Caffe2Detectron/COCO/35857345/e2e_faster_rcnn_R-50-FPN_1x" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 
0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | DATASETS: 24 | TEST: ("coco_2014_minival",) 25 | DATALOADER: 26 | SIZE_DIVISIBILITY: 32 27 | -------------------------------------------------------------------------------- /configs/arichived/caffe2/e2e_faster_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://Caffe2Detectron/COCO/36761737/e2e_faster_rcnn_X-101-32x8d-FPN_1x" 4 | BACKBONE: 5 | CONV_BODY: "R-101-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | STRIDE_IN_1X1: False 9 | NUM_GROUPS: 32 10 | WIDTH_PER_GROUP: 8 11 | RPN: 12 | USE_FPN: True 13 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 14 | PRE_NMS_TOP_N_TRAIN: 2000 15 | PRE_NMS_TOP_N_TEST: 1000 16 | POST_NMS_TOP_N_TEST: 1000 17 | FPN_POST_NMS_TOP_N_TEST: 1000 18 | ROI_HEADS: 19 | USE_FPN: True 20 | ROI_BOX_HEAD: 21 | POOLER_RESOLUTION: 7 22 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 23 | POOLER_SAMPLING_RATIO: 2 24 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 25 | PREDICTOR: "FPNPredictor" 26 | DATASETS: 27 | TEST: ("coco_2014_minival",) 28 | DATALOADER: 29 | SIZE_DIVISIBILITY: 32 30 | -------------------------------------------------------------------------------- /configs/arichived/caffe2/e2e_keypoint_rcnn_R_50_FPN_1x_caffe2.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://Caffe2Detectron/COCO/37697547/e2e_keypoint_rcnn_R-50-FPN_1x" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | NUM_CLASSES: 2 24 | ROI_KEYPOINT_HEAD: 25 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 26 | FEATURE_EXTRACTOR: "KeypointRCNNFeatureExtractor" 27 | PREDICTOR: "KeypointRCNNPredictor" 28 | POOLER_RESOLUTION: 14 29 | POOLER_SAMPLING_RATIO: 2 30 | RESOLUTION: 56 31 | SHARE_BOX_FEATURE_EXTRACTOR: False 32 | KEYPOINT_ON: True 33 | DATASETS: 34 | TRAIN: ("keypoints_coco_2014_train", "keypoints_coco_2014_valminusminival",) 35 | TEST: ("keypoints_coco_2014_minival",) 36 | INPUT: 37 | MIN_SIZE_TRAIN: (640, 672, 704, 736, 768, 800) 38 | DATALOADER: 39 | SIZE_DIVISIBILITY: 32 40 | SOLVER: 41 | BASE_LR: 0.02 42 | WEIGHT_DECAY: 0.0001 43 | STEPS: (60000, 80000) 44 | MAX_ITER: 90000 45 | -------------------------------------------------------------------------------- /configs/arichived/caffe2/e2e_mask_rcnn_R_101_FPN_1x_caffe2.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://Caffe2Detectron/COCO/35861795/e2e_mask_rcnn_R-101-FPN_1x" 4 | BACKBONE: 5 | CONV_BODY: "R-101-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | 
ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | ROI_MASK_HEAD: 24 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 25 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 26 | PREDICTOR: "MaskRCNNC4Predictor" 27 | POOLER_RESOLUTION: 14 28 | POOLER_SAMPLING_RATIO: 2 29 | RESOLUTION: 28 30 | SHARE_BOX_FEATURE_EXTRACTOR: False 31 | MASK_ON: True 32 | DATASETS: 33 | TEST: ("coco_2014_minival",) 34 | DATALOADER: 35 | SIZE_DIVISIBILITY: 32 36 | -------------------------------------------------------------------------------- /configs/arichived/caffe2/e2e_mask_rcnn_R_50_C4_1x_caffe2.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://Caffe2Detectron/COCO/35858791/e2e_mask_rcnn_R-50-C4_1x" 4 | ROI_MASK_HEAD: 5 | PREDICTOR: "MaskRCNNC4Predictor" 6 | SHARE_BOX_FEATURE_EXTRACTOR: True 7 | MASK_ON: True 8 | DATASETS: 9 | TEST: ("coco_2014_minival",) 10 | -------------------------------------------------------------------------------- /configs/arichived/caffe2/e2e_mask_rcnn_R_50_FPN_1x_caffe2.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://Caffe2Detectron/COCO/35858933/e2e_mask_rcnn_R-50-FPN_1x" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | ROI_MASK_HEAD: 24 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 25 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 26 | PREDICTOR: "MaskRCNNC4Predictor" 27 | POOLER_RESOLUTION: 14 28 | POOLER_SAMPLING_RATIO: 2 29 | RESOLUTION: 28 30 | SHARE_BOX_FEATURE_EXTRACTOR: False 31 | MASK_ON: True 32 | DATASETS: 33 | TEST: ("coco_2014_minival",) 34 | DATALOADER: 35 | SIZE_DIVISIBILITY: 32 36 | -------------------------------------------------------------------------------- /configs/arichived/caffe2/e2e_mask_rcnn_X-152-32x8d-FPN-IN5k_1.44x_caffe2.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://Caffe2Detectron/COCO/37129812/e2e_mask_rcnn_X-152-32x8d-FPN-IN5k_1.44x" 4 | BACKBONE: 5 | CONV_BODY: "R-152-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | STRIDE_IN_1X1: False 9 | NUM_GROUPS: 32 10 | WIDTH_PER_GROUP: 8 11 | RPN: 12 | USE_FPN: True 13 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 14 | PRE_NMS_TOP_N_TRAIN: 2000 15 | PRE_NMS_TOP_N_TEST: 1000 16 | POST_NMS_TOP_N_TEST: 1000 17 | FPN_POST_NMS_TOP_N_TEST: 1000 18 | ROI_HEADS: 19 | USE_FPN: True 20 | ROI_BOX_HEAD: 21 | POOLER_RESOLUTION: 7 22 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 23 | POOLER_SAMPLING_RATIO: 2 24 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 25 | PREDICTOR: "FPNPredictor" 26 | ROI_MASK_HEAD: 27 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 28 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 29 | PREDICTOR: "MaskRCNNC4Predictor" 30 | 
POOLER_RESOLUTION: 14 31 | POOLER_SAMPLING_RATIO: 2 32 | RESOLUTION: 28 33 | SHARE_BOX_FEATURE_EXTRACTOR: False 34 | MASK_ON: True 35 | DATASETS: 36 | TEST: ("coco_2014_minival",) 37 | DATALOADER: 38 | SIZE_DIVISIBILITY: 32 39 | -------------------------------------------------------------------------------- /configs/arichived/caffe2/e2e_mask_rcnn_X_101_32x8d_FPN_1x_caffe2.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://Caffe2Detectron/COCO/36761843/e2e_mask_rcnn_X-101-32x8d-FPN_1x" 4 | BACKBONE: 5 | CONV_BODY: "R-101-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | STRIDE_IN_1X1: False 9 | NUM_GROUPS: 32 10 | WIDTH_PER_GROUP: 8 11 | RPN: 12 | USE_FPN: True 13 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 14 | PRE_NMS_TOP_N_TRAIN: 2000 15 | PRE_NMS_TOP_N_TEST: 1000 16 | POST_NMS_TOP_N_TEST: 1000 17 | FPN_POST_NMS_TOP_N_TEST: 1000 18 | ROI_HEADS: 19 | USE_FPN: True 20 | ROI_BOX_HEAD: 21 | POOLER_RESOLUTION: 7 22 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 23 | POOLER_SAMPLING_RATIO: 2 24 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 25 | PREDICTOR: "FPNPredictor" 26 | ROI_MASK_HEAD: 27 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 28 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 29 | PREDICTOR: "MaskRCNNC4Predictor" 30 | POOLER_RESOLUTION: 14 31 | POOLER_SAMPLING_RATIO: 2 32 | RESOLUTION: 28 33 | SHARE_BOX_FEATURE_EXTRACTOR: False 34 | MASK_ON: True 35 | DATASETS: 36 | TEST: ("coco_2014_minival",) 37 | DATALOADER: 38 | SIZE_DIVISIBILITY: 32 39 | -------------------------------------------------------------------------------- /configs/arichived/cityscapes/e2e_faster_rcnn_R_50_FPN_1x_cocostyle.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | NUM_CLASSES: 9 24 | DATASETS: 25 | TRAIN: ("cityscapes_fine_instanceonly_seg_train_cocostyle",) 26 | TEST: ("cityscapes_fine_instanceonly_seg_val_cocostyle",) 27 | DATALOADER: 28 | SIZE_DIVISIBILITY: 32 29 | SOLVER: 30 | BASE_LR: 0.01 31 | WEIGHT_DECAY: 0.0001 32 | STEPS: (18000,) 33 | MAX_ITER: 24000 34 | -------------------------------------------------------------------------------- /configs/arichived/cityscapes/e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | 
FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | NUM_CLASSES: 9 24 | ROI_MASK_HEAD: 25 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 26 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 27 | PREDICTOR: "MaskRCNNC4Predictor" 28 | POOLER_RESOLUTION: 14 29 | POOLER_SAMPLING_RATIO: 2 30 | RESOLUTION: 28 31 | SHARE_BOX_FEATURE_EXTRACTOR: False 32 | MASK_ON: True 33 | DATASETS: 34 | TRAIN: ("cityscapes_fine_instanceonly_seg_train_cocostyle",) 35 | TEST: ("cityscapes_fine_instanceonly_seg_val_cocostyle",) 36 | DATALOADER: 37 | SIZE_DIVISIBILITY: 32 38 | SOLVER: 39 | BASE_LR: 0.01 40 | WEIGHT_DECAY: 0.0001 41 | STEPS: (18000,) 42 | MAX_ITER: 24000 43 | -------------------------------------------------------------------------------- /configs/arichived/dcn/README.md: -------------------------------------------------------------------------------- 1 | ### Reference 2 | 1 [Deformable ConvNets v2: More Deformable, Better Results](https://arxiv.org/pdf/1811.11168.pdf) 3 | 2 third-party: [mmdetection](https://github.com/open-mmlab/mmdetection/tree/master/configs/dcn) 4 | 5 | ### Performance 6 | | case | bbox AP | mask AP | 7 | |----------------------------:|--------:|:-------:| 8 | | R-50-FPN-dcn (implement) | 39.8 | - | 9 | | R-50-FPN-dcn (mmdetection) | 40.0 | - | 10 | | R-50-FPN-mdcn (implement) | 40.0 | - | 11 | | R-50-FPN-mdcn (mmdetection) | 40.3 | - | 12 | | R-50-FPN-dcn (implement) | 40.8 | 36.8 | 13 | | R-50-FPN-dcn (mmdetection) | 41.1 | 37.2 | 14 | | R-50-FPN-dcn (implement) | 40.7 | 36.7 | 15 | | R-50-FPN-dcn (mmdetection) | 41.4 | 37.4 | 16 | 17 | 18 | ### Note 19 | see [dcn-v2](https://github.com/open-mmlab/mmdetection/blob/master/MODEL_ZOO.md#deformable-convolution-v2) in `mmdetection` for more details. 20 | 21 | 22 | ### Usage 23 | add these three lines 24 | ``` 25 | MODEL: 26 | RESNETS: 27 | # corresponding to C2,C3,C4,C5 28 | STAGE_WITH_DCN: (False, True, True, True) 29 | WITH_MODULATED_DCN: True 30 | DEFORMABLE_GROUPS: 1 31 | ``` -------------------------------------------------------------------------------- /configs/arichived/dcn/e2e_faster_rcnn_dconv_R_50_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (800,) 3 | MAX_SIZE_TRAIN: 1333 4 | MIN_SIZE_TEST: 800 5 | MAX_SIZE_TEST: 1333 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 9 | BACKBONE: 10 | CONV_BODY: "R-50-FPN" 11 | RESNETS: 12 | BACKBONE_OUT_CHANNELS: 256 13 | STAGE_WITH_DCN: (False, True, True, True) 14 | WITH_MODULATED_DCN: False 15 | DEFORMABLE_GROUPS: 1 16 | RPN: 17 | USE_FPN: True 18 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 19 | PRE_NMS_TOP_N_TRAIN: 2000 20 | PRE_NMS_TOP_N_TEST: 1000 21 | POST_NMS_TOP_N_TEST: 1000 22 | FPN_POST_NMS_TOP_N_TEST: 1000 23 | ROI_HEADS: 24 | USE_FPN: True 25 | ROI_BOX_HEAD: 26 | POOLER_RESOLUTION: 7 27 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 28 | POOLER_SAMPLING_RATIO: 2 29 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 30 | PREDICTOR: "FPNPredictor" 31 | DATASETS: 32 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 33 | TEST: ("coco_2014_minival",) 34 | DATALOADER: 35 | SIZE_DIVISIBILITY: 32 36 | SOLVER: 37 | # Assume 8 gpus 38 | BASE_LR: 0.02 39 | WEIGHT_DECAY: 0.0001 40 | STEPS: (60000, 80000) 41 | MAX_ITER: 90000 42 | IMS_PER_BATCH: 16 43 | TEST: 44 | IMS_PER_BATCH: 8 45 | -------------------------------------------------------------------------------- 
/configs/arichived/dcn/e2e_faster_rcnn_mdconv_R_50_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (800,) 3 | MAX_SIZE_TRAIN: 1333 4 | MIN_SIZE_TEST: 800 5 | MAX_SIZE_TEST: 1333 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 9 | BACKBONE: 10 | CONV_BODY: "R-50-FPN" 11 | RESNETS: 12 | BACKBONE_OUT_CHANNELS: 256 13 | STAGE_WITH_DCN: (False, True, True, True) 14 | WITH_MODULATED_DCN: True 15 | DEFORMABLE_GROUPS: 1 16 | RPN: 17 | USE_FPN: True 18 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 19 | PRE_NMS_TOP_N_TRAIN: 2000 20 | PRE_NMS_TOP_N_TEST: 1000 21 | POST_NMS_TOP_N_TEST: 1000 22 | FPN_POST_NMS_TOP_N_TEST: 1000 23 | ROI_HEADS: 24 | USE_FPN: True 25 | ROI_BOX_HEAD: 26 | POOLER_RESOLUTION: 7 27 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 28 | POOLER_SAMPLING_RATIO: 2 29 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 30 | PREDICTOR: "FPNPredictor" 31 | DATASETS: 32 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 33 | TEST: ("coco_2014_minival",) 34 | DATALOADER: 35 | SIZE_DIVISIBILITY: 32 36 | SOLVER: 37 | # Assume 8 gpus 38 | BASE_LR: 0.02 39 | WEIGHT_DECAY: 0.0001 40 | STEPS: (60000, 80000) 41 | MAX_ITER: 90000 42 | IMS_PER_BATCH: 16 43 | TEST: 44 | IMS_PER_BATCH: 8 45 | -------------------------------------------------------------------------------- /configs/arichived/dcn/e2e_mask_rcnn_dconv_R_50_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (800,) 3 | MAX_SIZE_TRAIN: 1333 4 | MIN_SIZE_TEST: 800 5 | MAX_SIZE_TEST: 1333 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 9 | BACKBONE: 10 | CONV_BODY: "R-50-FPN" 11 | RESNETS: 12 | BACKBONE_OUT_CHANNELS: 256 13 | STAGE_WITH_DCN: (False, True, True, True) 14 | WITH_MODULATED_DCN: False 15 | DEFORMABLE_GROUPS: 1 16 | RPN: 17 | USE_FPN: True 18 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 19 | PRE_NMS_TOP_N_TRAIN: 2000 20 | PRE_NMS_TOP_N_TEST: 1000 21 | POST_NMS_TOP_N_TEST: 1000 22 | FPN_POST_NMS_TOP_N_TEST: 1000 23 | ROI_HEADS: 24 | USE_FPN: True 25 | ROI_BOX_HEAD: 26 | POOLER_RESOLUTION: 7 27 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 28 | POOLER_SAMPLING_RATIO: 2 29 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 30 | PREDICTOR: "FPNPredictor" 31 | ROI_MASK_HEAD: 32 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 33 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 34 | PREDICTOR: "MaskRCNNC4Predictor" 35 | POOLER_RESOLUTION: 14 36 | POOLER_SAMPLING_RATIO: 2 37 | RESOLUTION: 28 38 | SHARE_BOX_FEATURE_EXTRACTOR: False 39 | MASK_ON: True 40 | DATASETS: 41 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 42 | TEST: ("coco_2014_minival",) 43 | DATALOADER: 44 | SIZE_DIVISIBILITY: 32 45 | SOLVER: 46 | # Assume 8 gpus 47 | BASE_LR: 0.02 48 | WEIGHT_DECAY: 0.0001 49 | STEPS: (60000, 80000) 50 | MAX_ITER: 90000 51 | IMS_PER_BATCH: 16 52 | TEST: 53 | IMS_PER_BATCH: 8 54 | 55 | -------------------------------------------------------------------------------- /configs/arichived/dcn/e2e_mask_rcnn_mdconv_R_50_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (800,) 3 | MAX_SIZE_TRAIN: 1333 4 | MIN_SIZE_TEST: 800 5 | MAX_SIZE_TEST: 1333 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 9 | BACKBONE: 10 | CONV_BODY: "R-50-FPN" 11 | RESNETS: 12 | 
BACKBONE_OUT_CHANNELS: 256 13 | STAGE_WITH_DCN: (False, True, True, True) 14 | WITH_MODULATED_DCN: True 15 | DEFORMABLE_GROUPS: 1 16 | RPN: 17 | USE_FPN: True 18 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 19 | PRE_NMS_TOP_N_TRAIN: 2000 20 | PRE_NMS_TOP_N_TEST: 1000 21 | POST_NMS_TOP_N_TEST: 1000 22 | FPN_POST_NMS_TOP_N_TEST: 1000 23 | ROI_HEADS: 24 | USE_FPN: True 25 | ROI_BOX_HEAD: 26 | POOLER_RESOLUTION: 7 27 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 28 | POOLER_SAMPLING_RATIO: 2 29 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 30 | PREDICTOR: "FPNPredictor" 31 | ROI_MASK_HEAD: 32 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 33 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 34 | PREDICTOR: "MaskRCNNC4Predictor" 35 | POOLER_RESOLUTION: 14 36 | POOLER_SAMPLING_RATIO: 2 37 | RESOLUTION: 28 38 | SHARE_BOX_FEATURE_EXTRACTOR: False 39 | MASK_ON: True 40 | DATASETS: 41 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 42 | TEST: ("coco_2014_minival",) 43 | DATALOADER: 44 | SIZE_DIVISIBILITY: 32 45 | SOLVER: 46 | # Assume 8 gpus 47 | BASE_LR: 0.02 48 | WEIGHT_DECAY: 0.0001 49 | STEPS: (60000, 80000) 50 | MAX_ITER: 90000 51 | IMS_PER_BATCH: 16 52 | TEST: 53 | IMS_PER_BATCH: 8 54 | -------------------------------------------------------------------------------- /configs/arichived/gn_baselines/README.md: -------------------------------------------------------------------------------- 1 | ### Group Normalization 2 | 1 [Group Normalization](https://arxiv.org/abs/1803.08494) 3 | 2 [Rethinking ImageNet Pre-training](https://arxiv.org/abs/1811.08883) 4 | 3 [official code](https://github.com/facebookresearch/Detectron/blob/master/projects/GN/README.md) 5 | 6 | 7 | ### Performance 8 | | case | Type | lr schd | im/gpu | bbox AP | mask AP | 9 | |----------------------------|:------------:|:---------:|:-------:|:-------:|:-------:| 10 | | R-50-FPN, GN (paper) | finetune | 2x | 2 | 40.3 | 35.7 | 11 | | R-50-FPN, GN (implement) | finetune | 2x | 2 | 40.2 | 36.0 | 12 | | R-50-FPN, GN (paper) | from scratch | 3x | 2 | 39.5 | 35.2 | 13 | | R-50-FPN, GN (implement) | from scratch | 3x | 2 | 38.9 | 35.1 | 14 | -------------------------------------------------------------------------------- /configs/arichived/gn_baselines/e2e_faster_rcnn_R_50_FPN_1x_gn.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (800,) 3 | MAX_SIZE_TRAIN: 1333 4 | MIN_SIZE_TEST: 800 5 | MAX_SIZE_TEST: 1333 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50-GN" 9 | BACKBONE: 10 | CONV_BODY: "R-50-FPN" 11 | RESNETS: # use GN for backbone 12 | BACKBONE_OUT_CHANNELS: 256 13 | STRIDE_IN_1X1: False 14 | TRANS_FUNC: "BottleneckWithGN" 15 | STEM_FUNC: "StemWithGN" 16 | FPN: 17 | USE_GN: True # use GN for FPN 18 | RPN: 19 | USE_FPN: True 20 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 21 | PRE_NMS_TOP_N_TRAIN: 2000 22 | PRE_NMS_TOP_N_TEST: 1000 23 | POST_NMS_TOP_N_TEST: 1000 24 | FPN_POST_NMS_TOP_N_TEST: 1000 25 | ROI_HEADS: 26 | USE_FPN: True 27 | BATCH_SIZE_PER_IMAGE: 512 28 | POSITIVE_FRACTION: 0.25 29 | ROI_BOX_HEAD: 30 | USE_GN: True # use GN for bbox head 31 | POOLER_RESOLUTION: 7 32 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 33 | POOLER_SAMPLING_RATIO: 2 34 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 35 | PREDICTOR: "FPNPredictor" 36 | DATASETS: 37 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 38 | TEST: ("coco_2014_minival",) 39 | DATALOADER: 40 | SIZE_DIVISIBILITY: 32 41 | SOLVER: 42 | # Assume 8 
gpus 43 | BASE_LR: 0.02 44 | WEIGHT_DECAY: 0.0001 45 | STEPS: (60000, 80000) 46 | MAX_ITER: 90000 47 | IMS_PER_BATCH: 16 48 | TEST: 49 | IMS_PER_BATCH: 8 50 | -------------------------------------------------------------------------------- /configs/arichived/gn_baselines/e2e_faster_rcnn_R_50_FPN_Xconv1fc_1x_gn.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (800,) 3 | MAX_SIZE_TRAIN: 1333 4 | MIN_SIZE_TEST: 800 5 | MAX_SIZE_TEST: 1333 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50-GN" 9 | BACKBONE: 10 | CONV_BODY: "R-50-FPN" 11 | RESNETS: # use GN for backbone 12 | BACKBONE_OUT_CHANNELS: 256 13 | STRIDE_IN_1X1: False 14 | TRANS_FUNC: "BottleneckWithGN" 15 | STEM_FUNC: "StemWithGN" 16 | FPN: 17 | USE_GN: True # use GN for FPN 18 | RPN: 19 | USE_FPN: True 20 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 21 | PRE_NMS_TOP_N_TRAIN: 2000 22 | PRE_NMS_TOP_N_TEST: 1000 23 | POST_NMS_TOP_N_TEST: 1000 24 | FPN_POST_NMS_TOP_N_TEST: 1000 25 | ROI_HEADS: 26 | USE_FPN: True 27 | BATCH_SIZE_PER_IMAGE: 512 28 | POSITIVE_FRACTION: 0.25 29 | ROI_BOX_HEAD: 30 | USE_GN: True # use GN for bbox head 31 | POOLER_RESOLUTION: 7 32 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 33 | POOLER_SAMPLING_RATIO: 2 34 | CONV_HEAD_DIM: 256 35 | NUM_STACKED_CONVS: 4 36 | FEATURE_EXTRACTOR: "FPNXconv1fcFeatureExtractor" 37 | PREDICTOR: "FPNPredictor" 38 | DATASETS: 39 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 40 | TEST: ("coco_2014_minival",) 41 | DATALOADER: 42 | SIZE_DIVISIBILITY: 32 43 | SOLVER: 44 | # Assume 8 gpus 45 | BASE_LR: 0.02 46 | WEIGHT_DECAY: 0.0001 47 | STEPS: (60000, 80000) 48 | MAX_ITER: 90000 49 | IMS_PER_BATCH: 16 50 | TEST: 51 | IMS_PER_BATCH: 8 52 | -------------------------------------------------------------------------------- /configs/arichived/gn_baselines/e2e_mask_rcnn_R_50_FPN_1x_gn.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (800,) 3 | MAX_SIZE_TRAIN: 1333 4 | MIN_SIZE_TEST: 800 5 | MAX_SIZE_TEST: 1333 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50-GN" 9 | BACKBONE: 10 | CONV_BODY: "R-50-FPN" 11 | RESNETS: # use GN for backbone 12 | BACKBONE_OUT_CHANNELS: 256 13 | STRIDE_IN_1X1: False 14 | TRANS_FUNC: "BottleneckWithGN" 15 | STEM_FUNC: "StemWithGN" 16 | FPN: 17 | USE_GN: True # use GN for FPN 18 | RPN: 19 | USE_FPN: True 20 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 21 | PRE_NMS_TOP_N_TRAIN: 2000 22 | PRE_NMS_TOP_N_TEST: 1000 23 | POST_NMS_TOP_N_TEST: 1000 24 | FPN_POST_NMS_TOP_N_TEST: 1000 25 | ROI_HEADS: 26 | USE_FPN: True 27 | BATCH_SIZE_PER_IMAGE: 512 28 | POSITIVE_FRACTION: 0.25 29 | ROI_BOX_HEAD: 30 | USE_GN: True # use GN for bbox head 31 | POOLER_RESOLUTION: 7 32 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 33 | POOLER_SAMPLING_RATIO: 2 34 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 35 | PREDICTOR: "FPNPredictor" 36 | ROI_MASK_HEAD: 37 | USE_GN: True # use GN for mask head 38 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 39 | CONV_LAYERS: (256, 256, 256, 256) 40 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 41 | PREDICTOR: "MaskRCNNC4Predictor" 42 | POOLER_RESOLUTION: 14 43 | POOLER_SAMPLING_RATIO: 2 44 | RESOLUTION: 28 45 | SHARE_BOX_FEATURE_EXTRACTOR: False 46 | MASK_ON: True 47 | DATASETS: 48 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 49 | TEST: ("coco_2014_minival",) 50 | DATALOADER: 51 | 
SIZE_DIVISIBILITY: 32 52 | SOLVER: 53 | # Assume 8 gpus 54 | BASE_LR: 0.02 55 | WEIGHT_DECAY: 0.0001 56 | STEPS: (60000, 80000) 57 | MAX_ITER: 90000 58 | IMS_PER_BATCH: 16 59 | TEST: 60 | IMS_PER_BATCH: 8 61 | -------------------------------------------------------------------------------- /configs/arichived/gn_baselines/e2e_mask_rcnn_R_50_FPN_Xconv1fc_1x_gn.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (800,) 3 | MAX_SIZE_TRAIN: 1333 4 | MIN_SIZE_TEST: 800 5 | MAX_SIZE_TEST: 1333 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50-GN" 9 | BACKBONE: 10 | CONV_BODY: "R-50-FPN" 11 | RESNETS: # use GN for backbone 12 | BACKBONE_OUT_CHANNELS: 256 13 | STRIDE_IN_1X1: False 14 | TRANS_FUNC: "BottleneckWithGN" 15 | STEM_FUNC: "StemWithGN" 16 | FPN: 17 | USE_GN: True # use GN for FPN 18 | RPN: 19 | USE_FPN: True 20 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 21 | PRE_NMS_TOP_N_TRAIN: 2000 22 | PRE_NMS_TOP_N_TEST: 1000 23 | POST_NMS_TOP_N_TEST: 1000 24 | FPN_POST_NMS_TOP_N_TEST: 1000 25 | ROI_HEADS: 26 | USE_FPN: True 27 | BATCH_SIZE_PER_IMAGE: 512 28 | POSITIVE_FRACTION: 0.25 29 | ROI_BOX_HEAD: 30 | USE_GN: True # use GN for bbox head 31 | POOLER_RESOLUTION: 7 32 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 33 | POOLER_SAMPLING_RATIO: 2 34 | CONV_HEAD_DIM: 256 35 | NUM_STACKED_CONVS: 4 36 | FEATURE_EXTRACTOR: "FPNXconv1fcFeatureExtractor" 37 | PREDICTOR: "FPNPredictor" 38 | ROI_MASK_HEAD: 39 | USE_GN: True # use GN for mask head 40 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 41 | CONV_LAYERS: (256, 256, 256, 256) 42 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 43 | PREDICTOR: "MaskRCNNC4Predictor" 44 | POOLER_RESOLUTION: 14 45 | POOLER_SAMPLING_RATIO: 2 46 | RESOLUTION: 28 47 | SHARE_BOX_FEATURE_EXTRACTOR: False 48 | MASK_ON: True 49 | DATASETS: 50 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 51 | TEST: ("coco_2014_minival",) 52 | DATALOADER: 53 | SIZE_DIVISIBILITY: 32 54 | SOLVER: 55 | # Assume 8 gpus 56 | BASE_LR: 0.02 57 | WEIGHT_DECAY: 0.0001 58 | STEPS: (60000, 80000) 59 | MAX_ITER: 90000 60 | IMS_PER_BATCH: 16 61 | TEST: 62 | IMS_PER_BATCH: 8 63 | -------------------------------------------------------------------------------- /configs/arichived/gn_baselines/scratch_e2e_faster_rcnn_R_50_FPN_3x_gn.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (800,) 3 | MAX_SIZE_TRAIN: 1333 4 | MIN_SIZE_TEST: 800 5 | MAX_SIZE_TEST: 1333 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "" # no pretrained model 9 | BACKBONE: 10 | CONV_BODY: "R-50-FPN" 11 | FREEZE_CONV_BODY_AT: 0 # finetune all layers 12 | RESNETS: # use GN for backbone 13 | BACKBONE_OUT_CHANNELS: 256 14 | STRIDE_IN_1X1: False 15 | TRANS_FUNC: "BottleneckWithGN" 16 | STEM_FUNC: "StemWithGN" 17 | FPN: 18 | USE_GN: True # use GN for FPN 19 | RPN: 20 | USE_FPN: True 21 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 22 | PRE_NMS_TOP_N_TRAIN: 2000 23 | PRE_NMS_TOP_N_TEST: 1000 24 | POST_NMS_TOP_N_TEST: 1000 25 | FPN_POST_NMS_TOP_N_TEST: 1000 26 | ROI_HEADS: 27 | USE_FPN: True 28 | BATCH_SIZE_PER_IMAGE: 512 29 | POSITIVE_FRACTION: 0.25 30 | ROI_BOX_HEAD: 31 | USE_GN: True # use GN for bbox head 32 | POOLER_RESOLUTION: 7 33 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 34 | POOLER_SAMPLING_RATIO: 2 35 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 36 | PREDICTOR: "FPNPredictor" 37 | DATASETS: 38 | TRAIN: ("coco_2014_train", 
"coco_2014_valminusminival") 39 | TEST: ("coco_2014_minival",) 40 | DATALOADER: 41 | SIZE_DIVISIBILITY: 32 42 | SOLVER: 43 | # Assume 8 gpus 44 | BASE_LR: 0.02 45 | WEIGHT_DECAY: 0.0001 46 | STEPS: (210000, 250000) 47 | MAX_ITER: 270000 48 | IMS_PER_BATCH: 16 49 | TEST: 50 | IMS_PER_BATCH: 8 51 | -------------------------------------------------------------------------------- /configs/arichived/gn_baselines/scratch_e2e_faster_rcnn_R_50_FPN_Xconv1fc_3x_gn.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (800,) 3 | MAX_SIZE_TRAIN: 1333 4 | MIN_SIZE_TEST: 800 5 | MAX_SIZE_TEST: 1333 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "" # no pretrained model 9 | BACKBONE: 10 | CONV_BODY: "R-50-FPN" 11 | FREEZE_CONV_BODY_AT: 0 # finetune all layers 12 | RESNETS: # use GN for backbone 13 | BACKBONE_OUT_CHANNELS: 256 14 | STRIDE_IN_1X1: False 15 | TRANS_FUNC: "BottleneckWithGN" 16 | STEM_FUNC: "StemWithGN" 17 | FPN: 18 | USE_GN: True # use GN for FPN 19 | RPN: 20 | USE_FPN: True 21 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 22 | PRE_NMS_TOP_N_TRAIN: 2000 23 | PRE_NMS_TOP_N_TEST: 1000 24 | POST_NMS_TOP_N_TEST: 1000 25 | FPN_POST_NMS_TOP_N_TEST: 1000 26 | ROI_HEADS: 27 | USE_FPN: True 28 | BATCH_SIZE_PER_IMAGE: 512 29 | POSITIVE_FRACTION: 0.25 30 | ROI_BOX_HEAD: 31 | USE_GN: True # use GN for bbox head 32 | POOLER_RESOLUTION: 7 33 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 34 | POOLER_SAMPLING_RATIO: 2 35 | CONV_HEAD_DIM: 256 36 | NUM_STACKED_CONVS: 4 37 | FEATURE_EXTRACTOR: "FPNXconv1fcFeatureExtractor" 38 | PREDICTOR: "FPNPredictor" 39 | DATASETS: 40 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 41 | TEST: ("coco_2014_minival",) 42 | DATALOADER: 43 | SIZE_DIVISIBILITY: 32 44 | SOLVER: 45 | # Assume 8 gpus 46 | BASE_LR: 0.02 47 | WEIGHT_DECAY: 0.0001 48 | STEPS: (210000, 250000) 49 | MAX_ITER: 270000 50 | IMS_PER_BATCH: 16 51 | TEST: 52 | IMS_PER_BATCH: 8 53 | -------------------------------------------------------------------------------- /configs/arichived/gn_baselines/scratch_e2e_mask_rcnn_R_50_FPN_3x_gn.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (800,) 3 | MAX_SIZE_TRAIN: 1333 4 | MIN_SIZE_TEST: 800 5 | MAX_SIZE_TEST: 1333 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "" # no pretrained model 9 | BACKBONE: 10 | CONV_BODY: "R-50-FPN" 11 | FREEZE_CONV_BODY_AT: 0 # finetune all layers 12 | RESNETS: # use GN for backbone 13 | BACKBONE_OUT_CHANNELS: 256 14 | STRIDE_IN_1X1: False 15 | TRANS_FUNC: "BottleneckWithGN" 16 | STEM_FUNC: "StemWithGN" 17 | FPN: 18 | USE_GN: True # use GN for FPN 19 | RPN: 20 | USE_FPN: True 21 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 22 | PRE_NMS_TOP_N_TRAIN: 2000 23 | PRE_NMS_TOP_N_TEST: 1000 24 | POST_NMS_TOP_N_TEST: 1000 25 | FPN_POST_NMS_TOP_N_TEST: 1000 26 | ROI_HEADS: 27 | USE_FPN: True 28 | BATCH_SIZE_PER_IMAGE: 512 29 | POSITIVE_FRACTION: 0.25 30 | ROI_BOX_HEAD: 31 | USE_GN: True # use GN for bbox head 32 | POOLER_RESOLUTION: 7 33 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 34 | POOLER_SAMPLING_RATIO: 2 35 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 36 | PREDICTOR: "FPNPredictor" 37 | ROI_MASK_HEAD: 38 | USE_GN: True # use GN for mask head 39 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 40 | CONV_LAYERS: (256, 256, 256, 256) 41 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 42 | PREDICTOR: "MaskRCNNC4Predictor" 43 | POOLER_RESOLUTION: 14 44 | POOLER_SAMPLING_RATIO: 2 45 | 
RESOLUTION: 28 46 | SHARE_BOX_FEATURE_EXTRACTOR: False 47 | MASK_ON: True 48 | DATASETS: 49 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 50 | TEST: ("coco_2014_minival",) 51 | DATALOADER: 52 | SIZE_DIVISIBILITY: 32 53 | SOLVER: 54 | # Assume 8 gpus 55 | BASE_LR: 0.02 56 | WEIGHT_DECAY: 0.0001 57 | STEPS: (210000, 250000) 58 | MAX_ITER: 270000 59 | IMS_PER_BATCH: 16 60 | TEST: 61 | IMS_PER_BATCH: 8 62 | -------------------------------------------------------------------------------- /configs/arichived/gn_baselines/scratch_e2e_mask_rcnn_R_50_FPN_Xconv1fc_3x_gn.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (800,) 3 | MAX_SIZE_TRAIN: 1333 4 | MIN_SIZE_TEST: 800 5 | MAX_SIZE_TEST: 1333 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "" # no pretrained model 9 | BACKBONE: 10 | CONV_BODY: "R-50-FPN" 11 | FREEZE_CONV_BODY_AT: 0 # finetune all layers 12 | RESNETS: # use GN for backbone 13 | BACKBONE_OUT_CHANNELS: 256 14 | STRIDE_IN_1X1: False 15 | TRANS_FUNC: "BottleneckWithGN" 16 | STEM_FUNC: "StemWithGN" 17 | FPN: 18 | USE_GN: True # use GN for FPN 19 | RPN: 20 | USE_FPN: True 21 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 22 | PRE_NMS_TOP_N_TRAIN: 2000 23 | PRE_NMS_TOP_N_TEST: 1000 24 | POST_NMS_TOP_N_TEST: 1000 25 | FPN_POST_NMS_TOP_N_TEST: 1000 26 | ROI_HEADS: 27 | USE_FPN: True 28 | BATCH_SIZE_PER_IMAGE: 512 29 | POSITIVE_FRACTION: 0.25 30 | ROI_BOX_HEAD: 31 | USE_GN: True # use GN for bbox head 32 | POOLER_RESOLUTION: 7 33 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 34 | POOLER_SAMPLING_RATIO: 2 35 | CONV_HEAD_DIM: 256 36 | NUM_STACKED_CONVS: 4 37 | FEATURE_EXTRACTOR: "FPNXconv1fcFeatureExtractor" 38 | PREDICTOR: "FPNPredictor" 39 | ROI_MASK_HEAD: 40 | USE_GN: True # use GN for mask head 41 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 42 | CONV_LAYERS: (256, 256, 256, 256) 43 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 44 | PREDICTOR: "MaskRCNNC4Predictor" 45 | POOLER_RESOLUTION: 14 46 | POOLER_SAMPLING_RATIO: 2 47 | RESOLUTION: 28 48 | SHARE_BOX_FEATURE_EXTRACTOR: False 49 | MASK_ON: True 50 | DATASETS: 51 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 52 | TEST: ("coco_2014_minival",) 53 | DATALOADER: 54 | SIZE_DIVISIBILITY: 32 55 | SOLVER: 56 | # Assume 8 gpus 57 | BASE_LR: 0.02 58 | WEIGHT_DECAY: 0.0001 59 | STEPS: (210000, 250000) 60 | MAX_ITER: 270000 61 | IMS_PER_BATCH: 16 62 | TEST: 63 | IMS_PER_BATCH: 8 64 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_faster_rcnn_R_101_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-101" 4 | BACKBONE: 5 | CONV_BODY: "R-101-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | DATASETS: 24 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 25 | TEST: ("coco_2014_minival",) 26 | DATALOADER: 27 | SIZE_DIVISIBILITY: 32 28 | SOLVER: 29 | BASE_LR: 0.02 30 | WEIGHT_DECAY: 0.0001 
31 | STEPS: (60000, 80000) 32 | MAX_ITER: 90000 33 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_faster_rcnn_R_50_C4_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN: 5 | PRE_NMS_TOP_N_TEST: 6000 6 | POST_NMS_TOP_N_TEST: 1000 7 | DATASETS: 8 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 9 | TEST: ("coco_2014_minival",) 10 | SOLVER: 11 | BASE_LR: 0.01 12 | WEIGHT_DECAY: 0.0001 13 | STEPS: (120000, 160000) 14 | MAX_ITER: 180000 15 | IMS_PER_BATCH: 8 16 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_faster_rcnn_R_50_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | DATASETS: 24 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 25 | TEST: ("coco_2014_minival",) 26 | DATALOADER: 27 | SIZE_DIVISIBILITY: 32 28 | SOLVER: 29 | BASE_LR: 0.02 30 | WEIGHT_DECAY: 0.0001 31 | STEPS: (60000, 80000) 32 | MAX_ITER: 90000 33 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_faster_rcnn_X_101_32x8d_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d" 4 | BACKBONE: 5 | CONV_BODY: "R-101-FPN" 6 | RPN: 7 | USE_FPN: True 8 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 9 | PRE_NMS_TOP_N_TRAIN: 2000 10 | PRE_NMS_TOP_N_TEST: 1000 11 | POST_NMS_TOP_N_TEST: 1000 12 | FPN_POST_NMS_TOP_N_TEST: 1000 13 | ROI_HEADS: 14 | USE_FPN: True 15 | ROI_BOX_HEAD: 16 | POOLER_RESOLUTION: 7 17 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 18 | POOLER_SAMPLING_RATIO: 2 19 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 20 | PREDICTOR: "FPNPredictor" 21 | RESNETS: 22 | BACKBONE_OUT_CHANNELS: 256 23 | STRIDE_IN_1X1: False 24 | NUM_GROUPS: 32 25 | WIDTH_PER_GROUP: 8 26 | DATASETS: 27 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 28 | TEST: ("coco_2014_minival",) 29 | DATALOADER: 30 | SIZE_DIVISIBILITY: 32 31 | SOLVER: 32 | BASE_LR: 0.01 33 | WEIGHT_DECAY: 0.0001 34 | STEPS: (120000, 160000) 35 | MAX_ITER: 180000 36 | IMS_PER_BATCH: 8 37 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_faster_rcnn_fbnet.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | BACKBONE: 4 | CONV_BODY: FBNet 5 | FBNET: 6 | ARCH: "default" 7 | BN_TYPE: "bn" 8 | WIDTH_DIVISOR: 8 9 | DW_CONV_SKIP_BN: True 10 | DW_CONV_SKIP_RELU: True 11 | RPN: 12 | 
ANCHOR_SIZES: (16, 32, 64, 128, 256) 13 | ANCHOR_STRIDE: (16, ) 14 | BATCH_SIZE_PER_IMAGE: 256 15 | PRE_NMS_TOP_N_TRAIN: 6000 16 | PRE_NMS_TOP_N_TEST: 6000 17 | POST_NMS_TOP_N_TRAIN: 2000 18 | POST_NMS_TOP_N_TEST: 100 19 | RPN_HEAD: FBNet.rpn_head 20 | ROI_HEADS: 21 | BATCH_SIZE_PER_IMAGE: 512 22 | ROI_BOX_HEAD: 23 | POOLER_RESOLUTION: 6 24 | FEATURE_EXTRACTOR: FBNet.roi_head 25 | NUM_CLASSES: 81 26 | DATASETS: 27 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 28 | TEST: ("coco_2014_minival",) 29 | SOLVER: 30 | BASE_LR: 0.06 31 | WARMUP_FACTOR: 0.1 32 | WEIGHT_DECAY: 0.0001 33 | STEPS: (60000, 80000) 34 | MAX_ITER: 90000 35 | IMS_PER_BATCH: 128 # for 8GPUs 36 | # TEST: 37 | # IMS_PER_BATCH: 8 38 | INPUT: 39 | MIN_SIZE_TRAIN: (320, ) 40 | MAX_SIZE_TRAIN: 640 41 | MIN_SIZE_TEST: 320 42 | MAX_SIZE_TEST: 640 43 | PIXEL_MEAN: [103.53, 116.28, 123.675] 44 | PIXEL_STD: [57.375, 57.12, 58.395] 45 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_faster_rcnn_fbnet_600.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | BACKBONE: 4 | CONV_BODY: FBNet 5 | FBNET: 6 | ARCH: "default" 7 | BN_TYPE: "bn" 8 | WIDTH_DIVISOR: 8 9 | DW_CONV_SKIP_BN: True 10 | DW_CONV_SKIP_RELU: True 11 | RPN: 12 | ANCHOR_SIZES: (32, 64, 128, 256, 512) 13 | ANCHOR_STRIDE: (16, ) 14 | BATCH_SIZE_PER_IMAGE: 256 15 | PRE_NMS_TOP_N_TRAIN: 6000 16 | PRE_NMS_TOP_N_TEST: 6000 17 | POST_NMS_TOP_N_TRAIN: 2000 18 | POST_NMS_TOP_N_TEST: 200 19 | RPN_HEAD: FBNet.rpn_head 20 | ROI_HEADS: 21 | BATCH_SIZE_PER_IMAGE: 256 22 | ROI_BOX_HEAD: 23 | POOLER_RESOLUTION: 6 24 | FEATURE_EXTRACTOR: FBNet.roi_head 25 | NUM_CLASSES: 81 26 | DATASETS: 27 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 28 | TEST: ("coco_2014_minival",) 29 | SOLVER: 30 | BASE_LR: 0.06 31 | WARMUP_FACTOR: 0.1 32 | WEIGHT_DECAY: 0.0001 33 | STEPS: (60000, 80000) 34 | MAX_ITER: 90000 35 | IMS_PER_BATCH: 128 # for 8GPUs 36 | # TEST: 37 | # IMS_PER_BATCH: 8 38 | INPUT: 39 | MIN_SIZE_TRAIN: (600, ) 40 | MAX_SIZE_TRAIN: 1000 41 | MIN_SIZE_TEST: 600 42 | MAX_SIZE_TEST: 1000 43 | PIXEL_MEAN: [103.53, 116.28, 123.675] 44 | PIXEL_STD: [57.375, 57.12, 58.395] 45 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_faster_rcnn_fbnet_chamv1a_600.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | BACKBONE: 4 | CONV_BODY: FBNet 5 | FBNET: 6 | ARCH: "cham_v1a" 7 | BN_TYPE: "bn" 8 | WIDTH_DIVISOR: 8 9 | DW_CONV_SKIP_BN: True 10 | DW_CONV_SKIP_RELU: True 11 | RPN: 12 | ANCHOR_SIZES: (32, 64, 128, 256, 512) 13 | ANCHOR_STRIDE: (16, ) 14 | BATCH_SIZE_PER_IMAGE: 256 15 | PRE_NMS_TOP_N_TRAIN: 6000 16 | PRE_NMS_TOP_N_TEST: 6000 17 | POST_NMS_TOP_N_TRAIN: 2000 18 | POST_NMS_TOP_N_TEST: 200 19 | RPN_HEAD: FBNet.rpn_head 20 | ROI_HEADS: 21 | BATCH_SIZE_PER_IMAGE: 128 22 | ROI_BOX_HEAD: 23 | POOLER_RESOLUTION: 6 24 | FEATURE_EXTRACTOR: FBNet.roi_head 25 | NUM_CLASSES: 81 26 | DATASETS: 27 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 28 | TEST: ("coco_2014_minival",) 29 | SOLVER: 30 | BASE_LR: 0.045 31 | WARMUP_FACTOR: 0.1 32 | WEIGHT_DECAY: 0.0001 33 | STEPS: (90000, 120000) 34 | MAX_ITER: 135000 35 | IMS_PER_BATCH: 96 # for 8GPUs 36 | # TEST: 37 | # IMS_PER_BATCH: 8 38 | INPUT: 39 | MIN_SIZE_TRAIN: (600, ) 40 | MAX_SIZE_TRAIN: 
1000 41 | MIN_SIZE_TEST: 600 42 | MAX_SIZE_TEST: 1000 43 | PIXEL_MEAN: [103.53, 116.28, 123.675] 44 | PIXEL_STD: [57.375, 57.12, 58.395] 45 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_keypoint_rcnn_R_50_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | NUM_CLASSES: 2 24 | ROI_KEYPOINT_HEAD: 25 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 26 | FEATURE_EXTRACTOR: "KeypointRCNNFeatureExtractor" 27 | PREDICTOR: "KeypointRCNNPredictor" 28 | POOLER_RESOLUTION: 14 29 | POOLER_SAMPLING_RATIO: 2 30 | RESOLUTION: 56 31 | SHARE_BOX_FEATURE_EXTRACTOR: False 32 | KEYPOINT_ON: True 33 | DATASETS: 34 | TRAIN: ("keypoints_coco_2014_train", "keypoints_coco_2014_valminusminival",) 35 | TEST: ("keypoints_coco_2014_minival",) 36 | INPUT: 37 | MIN_SIZE_TRAIN: (640, 672, 704, 736, 768, 800) 38 | DATALOADER: 39 | SIZE_DIVISIBILITY: 32 40 | SOLVER: 41 | BASE_LR: 0.02 42 | WEIGHT_DECAY: 0.0001 43 | STEPS: (60000, 80000) 44 | MAX_ITER: 90000 45 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_mask_rcnn_R_101_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-101" 4 | BACKBONE: 5 | CONV_BODY: "R-101-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | ROI_MASK_HEAD: 24 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 25 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 26 | PREDICTOR: "MaskRCNNC4Predictor" 27 | POOLER_RESOLUTION: 14 28 | POOLER_SAMPLING_RATIO: 2 29 | RESOLUTION: 28 30 | SHARE_BOX_FEATURE_EXTRACTOR: False 31 | MASK_ON: True 32 | DATASETS: 33 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 34 | TEST: ("coco_2014_minival",) 35 | DATALOADER: 36 | SIZE_DIVISIBILITY: 32 37 | SOLVER: 38 | BASE_LR: 0.02 39 | WEIGHT_DECAY: 0.0001 40 | STEPS: (60000, 80000) 41 | MAX_ITER: 90000 42 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_mask_rcnn_R_50_C4_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN: 5 | PRE_NMS_TOP_N_TEST: 6000 6 | POST_NMS_TOP_N_TEST: 1000 7 | 
ROI_MASK_HEAD: 8 | PREDICTOR: "MaskRCNNC4Predictor" 9 | SHARE_BOX_FEATURE_EXTRACTOR: True 10 | MASK_ON: True 11 | DATASETS: 12 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 13 | TEST: ("coco_2014_minival",) 14 | SOLVER: 15 | BASE_LR: 0.01 16 | WEIGHT_DECAY: 0.0001 17 | STEPS: (120000, 160000) 18 | MAX_ITER: 180000 19 | IMS_PER_BATCH: 8 20 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_mask_rcnn_R_50_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | ROI_MASK_HEAD: 24 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 25 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 26 | PREDICTOR: "MaskRCNNC4Predictor" 27 | POOLER_RESOLUTION: 14 28 | POOLER_SAMPLING_RATIO: 2 29 | RESOLUTION: 28 30 | SHARE_BOX_FEATURE_EXTRACTOR: False 31 | MASK_ON: True 32 | DATASETS: 33 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 34 | TEST: ("coco_2014_minival",) 35 | DATALOADER: 36 | SIZE_DIVISIBILITY: 32 37 | SOLVER: 38 | BASE_LR: 0.02 39 | WEIGHT_DECAY: 0.0001 40 | STEPS: (60000, 80000) 41 | MAX_ITER: 90000 42 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_mask_rcnn_X_101_32x8d_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d" 4 | BACKBONE: 5 | CONV_BODY: "R-101-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | STRIDE_IN_1X1: False 9 | NUM_GROUPS: 32 10 | WIDTH_PER_GROUP: 8 11 | RPN: 12 | USE_FPN: True 13 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 14 | PRE_NMS_TOP_N_TRAIN: 2000 15 | PRE_NMS_TOP_N_TEST: 1000 16 | POST_NMS_TOP_N_TEST: 1000 17 | FPN_POST_NMS_TOP_N_TEST: 1000 18 | ROI_HEADS: 19 | USE_FPN: True 20 | ROI_BOX_HEAD: 21 | POOLER_RESOLUTION: 7 22 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 23 | POOLER_SAMPLING_RATIO: 2 24 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 25 | PREDICTOR: "FPNPredictor" 26 | ROI_MASK_HEAD: 27 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 28 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 29 | PREDICTOR: "MaskRCNNC4Predictor" 30 | POOLER_RESOLUTION: 14 31 | POOLER_SAMPLING_RATIO: 2 32 | RESOLUTION: 28 33 | SHARE_BOX_FEATURE_EXTRACTOR: False 34 | MASK_ON: True 35 | DATASETS: 36 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 37 | TEST: ("coco_2014_minival",) 38 | DATALOADER: 39 | SIZE_DIVISIBILITY: 32 40 | SOLVER: 41 | BASE_LR: 0.01 42 | WEIGHT_DECAY: 0.0001 43 | STEPS: (120000, 160000) 44 | MAX_ITER: 180000 45 | IMS_PER_BATCH: 8 46 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_mask_rcnn_fbnet.yaml: 
-------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | BACKBONE: 4 | CONV_BODY: FBNet 5 | FBNET: 6 | ARCH: "default" 7 | BN_TYPE: "bn" 8 | WIDTH_DIVISOR: 8 9 | DW_CONV_SKIP_BN: True 10 | DW_CONV_SKIP_RELU: True 11 | DET_HEAD_LAST_SCALE: 0.0 12 | RPN: 13 | ANCHOR_SIZES: (16, 32, 64, 128, 256) 14 | ANCHOR_STRIDE: (16, ) 15 | BATCH_SIZE_PER_IMAGE: 256 16 | PRE_NMS_TOP_N_TRAIN: 6000 17 | PRE_NMS_TOP_N_TEST: 6000 18 | POST_NMS_TOP_N_TRAIN: 2000 19 | POST_NMS_TOP_N_TEST: 100 20 | RPN_HEAD: FBNet.rpn_head 21 | ROI_HEADS: 22 | BATCH_SIZE_PER_IMAGE: 256 23 | ROI_BOX_HEAD: 24 | POOLER_RESOLUTION: 6 25 | FEATURE_EXTRACTOR: FBNet.roi_head 26 | NUM_CLASSES: 81 27 | ROI_MASK_HEAD: 28 | POOLER_RESOLUTION: 6 29 | FEATURE_EXTRACTOR: FBNet.roi_head_mask 30 | PREDICTOR: "MaskRCNNConv1x1Predictor" 31 | RESOLUTION: 12 32 | SHARE_BOX_FEATURE_EXTRACTOR: False 33 | MASK_ON: True 34 | DATASETS: 35 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 36 | TEST: ("coco_2014_minival",) 37 | SOLVER: 38 | BASE_LR: 0.06 39 | WARMUP_FACTOR: 0.1 40 | WEIGHT_DECAY: 0.0001 41 | STEPS: (60000, 80000) 42 | MAX_ITER: 90000 43 | IMS_PER_BATCH: 128 # for 8GPUs 44 | # TEST: 45 | # IMS_PER_BATCH: 8 46 | INPUT: 47 | MIN_SIZE_TRAIN: (320, ) 48 | MAX_SIZE_TRAIN: 640 49 | MIN_SIZE_TEST: 320 50 | MAX_SIZE_TEST: 640 51 | PIXEL_MEAN: [103.53, 116.28, 123.675] 52 | PIXEL_STD: [57.375, 57.12, 58.395] 53 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_mask_rcnn_fbnet_600.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | BACKBONE: 4 | CONV_BODY: FBNet 5 | FBNET: 6 | ARCH: "default" 7 | BN_TYPE: "bn" 8 | WIDTH_DIVISOR: 8 9 | DW_CONV_SKIP_BN: True 10 | DW_CONV_SKIP_RELU: True 11 | DET_HEAD_LAST_SCALE: 0.0 12 | RPN: 13 | ANCHOR_SIZES: (32, 64, 128, 256, 512) 14 | ANCHOR_STRIDE: (16, ) 15 | BATCH_SIZE_PER_IMAGE: 256 16 | PRE_NMS_TOP_N_TRAIN: 6000 17 | PRE_NMS_TOP_N_TEST: 6000 18 | POST_NMS_TOP_N_TRAIN: 2000 19 | POST_NMS_TOP_N_TEST: 200 20 | RPN_HEAD: FBNet.rpn_head 21 | ROI_HEADS: 22 | BATCH_SIZE_PER_IMAGE: 256 23 | ROI_BOX_HEAD: 24 | POOLER_RESOLUTION: 6 25 | FEATURE_EXTRACTOR: FBNet.roi_head 26 | NUM_CLASSES: 81 27 | ROI_MASK_HEAD: 28 | POOLER_RESOLUTION: 6 29 | FEATURE_EXTRACTOR: FBNet.roi_head_mask 30 | PREDICTOR: "MaskRCNNConv1x1Predictor" 31 | RESOLUTION: 12 32 | SHARE_BOX_FEATURE_EXTRACTOR: False 33 | MASK_ON: True 34 | DATASETS: 35 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 36 | TEST: ("coco_2014_minival",) 37 | SOLVER: 38 | BASE_LR: 0.06 39 | WARMUP_FACTOR: 0.1 40 | WEIGHT_DECAY: 0.0001 41 | STEPS: (60000, 80000) 42 | MAX_ITER: 90000 43 | IMS_PER_BATCH: 128 # for 8GPUs 44 | # TEST: 45 | # IMS_PER_BATCH: 8 46 | INPUT: 47 | MIN_SIZE_TRAIN: (600, ) 48 | MAX_SIZE_TRAIN: 1000 49 | MIN_SIZE_TEST: 600 50 | MAX_SIZE_TEST: 1000 51 | PIXEL_MEAN: [103.53, 116.28, 123.675] 52 | PIXEL_STD: [57.375, 57.12, 58.395] 53 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_mask_rcnn_fbnet_xirb16d_dsmask.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | BACKBONE: 4 | CONV_BODY: FBNet 5 | FBNET: 6 | ARCH: "xirb16d_dsmask" 7 | BN_TYPE: "bn" 8 | WIDTH_DIVISOR: 8 9 | DW_CONV_SKIP_BN: True 10 | DW_CONV_SKIP_RELU: 
True 11 | DET_HEAD_LAST_SCALE: -1.0 12 | RPN: 13 | ANCHOR_SIZES: (16, 32, 64, 128, 256) 14 | ANCHOR_STRIDE: (16, ) 15 | BATCH_SIZE_PER_IMAGE: 256 16 | PRE_NMS_TOP_N_TRAIN: 6000 17 | PRE_NMS_TOP_N_TEST: 6000 18 | POST_NMS_TOP_N_TRAIN: 2000 19 | POST_NMS_TOP_N_TEST: 100 20 | RPN_HEAD: FBNet.rpn_head 21 | ROI_HEADS: 22 | BATCH_SIZE_PER_IMAGE: 512 23 | ROI_BOX_HEAD: 24 | POOLER_RESOLUTION: 6 25 | FEATURE_EXTRACTOR: FBNet.roi_head 26 | NUM_CLASSES: 81 27 | ROI_MASK_HEAD: 28 | POOLER_RESOLUTION: 6 29 | FEATURE_EXTRACTOR: FBNet.roi_head_mask 30 | PREDICTOR: "MaskRCNNConv1x1Predictor" 31 | RESOLUTION: 12 32 | SHARE_BOX_FEATURE_EXTRACTOR: False 33 | MASK_ON: True 34 | DATASETS: 35 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 36 | TEST: ("coco_2014_minival",) 37 | SOLVER: 38 | BASE_LR: 0.06 39 | WARMUP_FACTOR: 0.1 40 | WEIGHT_DECAY: 0.0001 41 | STEPS: (60000, 80000) 42 | MAX_ITER: 90000 43 | IMS_PER_BATCH: 128 # for 8GPUs 44 | # TEST: 45 | # IMS_PER_BATCH: 8 46 | INPUT: 47 | MIN_SIZE_TRAIN: (320, ) 48 | MAX_SIZE_TRAIN: 640 49 | MIN_SIZE_TEST: 320 50 | MAX_SIZE_TEST: 640 51 | PIXEL_MEAN: [103.53, 116.28, 123.675] 52 | PIXEL_STD: [57.375, 57.12, 58.395] 53 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/e2e_mask_rcnn_fbnet_xirb16d_dsmask_600.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | BACKBONE: 4 | CONV_BODY: FBNet 5 | FBNET: 6 | ARCH: "xirb16d_dsmask" 7 | BN_TYPE: "bn" 8 | WIDTH_DIVISOR: 8 9 | DW_CONV_SKIP_BN: True 10 | DW_CONV_SKIP_RELU: True 11 | DET_HEAD_LAST_SCALE: 0.0 12 | RPN: 13 | ANCHOR_SIZES: (32, 64, 128, 256, 512) 14 | ANCHOR_STRIDE: (16, ) 15 | BATCH_SIZE_PER_IMAGE: 256 16 | PRE_NMS_TOP_N_TRAIN: 6000 17 | PRE_NMS_TOP_N_TEST: 6000 18 | POST_NMS_TOP_N_TRAIN: 2000 19 | POST_NMS_TOP_N_TEST: 200 20 | RPN_HEAD: FBNet.rpn_head 21 | ROI_HEADS: 22 | BATCH_SIZE_PER_IMAGE: 256 23 | ROI_BOX_HEAD: 24 | POOLER_RESOLUTION: 6 25 | FEATURE_EXTRACTOR: FBNet.roi_head 26 | NUM_CLASSES: 81 27 | ROI_MASK_HEAD: 28 | POOLER_RESOLUTION: 6 29 | FEATURE_EXTRACTOR: FBNet.roi_head_mask 30 | PREDICTOR: "MaskRCNNConv1x1Predictor" 31 | RESOLUTION: 12 32 | SHARE_BOX_FEATURE_EXTRACTOR: False 33 | MASK_ON: True 34 | DATASETS: 35 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 36 | TEST: ("coco_2014_minival",) 37 | SOLVER: 38 | BASE_LR: 0.06 39 | WARMUP_FACTOR: 0.1 40 | WEIGHT_DECAY: 0.0001 41 | STEPS: (60000, 80000) 42 | MAX_ITER: 90000 43 | IMS_PER_BATCH: 128 # for 8GPUs 44 | # TEST: 45 | # IMS_PER_BATCH: 8 46 | INPUT: 47 | MIN_SIZE_TRAIN: (600, ) 48 | MAX_SIZE_TRAIN: 1000 49 | MIN_SIZE_TEST: 600 50 | MAX_SIZE_TEST: 1000 51 | PIXEL_MEAN: [103.53, 116.28, 123.675] 52 | PIXEL_STD: [57.375, 57.12, 58.395] 53 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/rpn_R_101_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-101" 4 | RPN_ONLY: True 5 | BACKBONE: 6 | CONV_BODY: "R-101-FPN" 7 | RESNETS: 8 | BACKBONE_OUT_CHANNELS: 256 9 | RPN: 10 | USE_FPN: True 11 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 2000 14 | FPN_POST_NMS_TOP_N_TEST: 2000 15 | DATASETS: 16 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 17 | TEST: ("coco_2014_minival",) 18 | DATALOADER: 
19 | SIZE_DIVISIBILITY: 32 20 | SOLVER: 21 | BASE_LR: 0.02 22 | WEIGHT_DECAY: 0.0001 23 | STEPS: (60000, 80000) 24 | MAX_ITER: 90000 25 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/rpn_R_50_C4_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN_ONLY: True 5 | RPN: 6 | PRE_NMS_TOP_N_TEST: 12000 7 | POST_NMS_TOP_N_TEST: 2000 8 | DATASETS: 9 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 10 | TEST: ("coco_2014_minival",) 11 | SOLVER: 12 | BASE_LR: 0.02 13 | WEIGHT_DECAY: 0.0001 14 | STEPS: (60000, 80000) 15 | MAX_ITER: 90000 16 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/rpn_R_50_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN_ONLY: True 5 | BACKBONE: 6 | CONV_BODY: "R-50-FPN" 7 | RESNETS: 8 | BACKBONE_OUT_CHANNELS: 256 9 | RPN: 10 | USE_FPN: True 11 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 2000 14 | FPN_POST_NMS_TOP_N_TEST: 2000 15 | DATASETS: 16 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 17 | TEST: ("coco_2014_minival",) 18 | DATALOADER: 19 | SIZE_DIVISIBILITY: 32 20 | SOLVER: 21 | BASE_LR: 0.02 22 | WEIGHT_DECAY: 0.0001 23 | STEPS: (60000, 80000) 24 | MAX_ITER: 90000 25 | -------------------------------------------------------------------------------- /configs/arichived/maskrcnn_benchmark_models/rpn_X_101_32x8d_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d" 4 | RPN_ONLY: True 5 | BACKBONE: 6 | CONV_BODY: "R-101-FPN" 7 | RESNETS: 8 | BACKBONE_OUT_CHANNELS: 256 9 | STRIDE_IN_1X1: False 10 | NUM_GROUPS: 32 11 | WIDTH_PER_GROUP: 8 12 | RPN: 13 | USE_FPN: True 14 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 15 | PRE_NMS_TOP_N_TEST: 1000 16 | POST_NMS_TOP_N_TEST: 2000 17 | FPN_POST_NMS_TOP_N_TEST: 2000 18 | DATASETS: 19 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 20 | TEST: ("coco_2014_minival",) 21 | DATALOADER: 22 | SIZE_DIVISIBILITY: 32 23 | SOLVER: 24 | BASE_LR: 0.02 25 | WEIGHT_DECAY: 0.0001 26 | STEPS: (60000, 80000) 27 | MAX_ITER: 90000 28 | -------------------------------------------------------------------------------- /configs/arichived/pascal_voc/e2e_faster_rcnn_R_50_C4_1x_1_gpu_voc.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN: 5 | PRE_NMS_TOP_N_TEST: 6000 6 | POST_NMS_TOP_N_TEST: 300 7 | ANCHOR_SIZES: (128, 256, 512) 8 | ROI_BOX_HEAD: 9 | NUM_CLASSES: 21 10 | DATASETS: 11 | TRAIN: ("voc_2007_train", "voc_2007_val") 12 | TEST: ("voc_2007_test",) 13 | SOLVER: 14 | BASE_LR: 0.001 15 | WEIGHT_DECAY: 0.0001 16 | STEPS: (50000, ) 17 | MAX_ITER: 70000 18 | IMS_PER_BATCH: 1 19 | TEST: 20 | IMS_PER_BATCH: 1 21 | -------------------------------------------------------------------------------- /configs/arichived/pascal_voc/e2e_faster_rcnn_R_50_C4_1x_4_gpu_voc.yaml: 
-------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN: 5 | PRE_NMS_TOP_N_TEST: 6000 6 | POST_NMS_TOP_N_TEST: 300 7 | ANCHOR_SIZES: (128, 256, 512) 8 | ROI_BOX_HEAD: 9 | NUM_CLASSES: 21 10 | DATASETS: 11 | TRAIN: ("voc_2007_train", "voc_2007_val") 12 | TEST: ("voc_2007_test",) 13 | SOLVER: 14 | BASE_LR: 0.004 15 | WEIGHT_DECAY: 0.0001 16 | STEPS: (12500, ) 17 | MAX_ITER: 17500 18 | IMS_PER_BATCH: 4 19 | TEST: 20 | IMS_PER_BATCH: 4 21 | -------------------------------------------------------------------------------- /configs/arichived/pascal_voc/e2e_mask_rcnn_R_50_FPN_1x_cocostyle.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | NUM_CLASSES: 21 24 | ROI_MASK_HEAD: 25 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 26 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 27 | PREDICTOR: "MaskRCNNC4Predictor" 28 | POOLER_RESOLUTION: 14 29 | POOLER_SAMPLING_RATIO: 2 30 | RESOLUTION: 28 31 | SHARE_BOX_FEATURE_EXTRACTOR: False 32 | MASK_ON: True 33 | DATASETS: 34 | TRAIN: ("voc_2012_train_cocostyle",) 35 | TEST: ("voc_2012_val_cocostyle",) 36 | DATALOADER: 37 | SIZE_DIVISIBILITY: 32 38 | SOLVER: 39 | BASE_LR: 0.01 40 | WEIGHT_DECAY: 0.0001 41 | STEPS: (18000,) 42 | MAX_ITER: 24000 43 | -------------------------------------------------------------------------------- /configs/arichived/quick_schedules/e2e_faster_rcnn_R_50_C4_quick.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN: 5 | PRE_NMS_TOP_N_TEST: 6000 6 | POST_NMS_TOP_N_TEST: 1000 7 | ROI_HEADS: 8 | BATCH_SIZE_PER_IMAGE: 256 9 | DATASETS: 10 | TRAIN: ("coco_2014_minival",) 11 | TEST: ("coco_2014_minival",) 12 | INPUT: 13 | MIN_SIZE_TRAIN: (600,) 14 | MAX_SIZE_TRAIN: 1000 15 | MIN_SIZE_TEST: 800 16 | MAX_SIZE_TEST: 1000 17 | SOLVER: 18 | BASE_LR: 0.005 19 | WEIGHT_DECAY: 0.0001 20 | STEPS: (1500,) 21 | MAX_ITER: 2000 22 | IMS_PER_BATCH: 2 23 | TEST: 24 | IMS_PER_BATCH: 2 25 | -------------------------------------------------------------------------------- /configs/arichived/quick_schedules/e2e_faster_rcnn_R_50_FPN_quick.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | BATCH_SIZE_PER_IMAGE: 256 18 | ROI_BOX_HEAD: 19 | POOLER_RESOLUTION: 7 20 | 
POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 21 | POOLER_SAMPLING_RATIO: 2 22 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 23 | PREDICTOR: "FPNPredictor" 24 | DATASETS: 25 | TRAIN: ("coco_2014_minival",) 26 | TEST: ("coco_2014_minival",) 27 | INPUT: 28 | MIN_SIZE_TRAIN: (600,) 29 | MAX_SIZE_TRAIN: 1000 30 | MIN_SIZE_TEST: 800 31 | MAX_SIZE_TEST: 1000 32 | DATALOADER: 33 | SIZE_DIVISIBILITY: 32 34 | SOLVER: 35 | BASE_LR: 0.005 36 | WEIGHT_DECAY: 0.0001 37 | STEPS: (1500,) 38 | MAX_ITER: 2000 39 | IMS_PER_BATCH: 4 40 | TEST: 41 | IMS_PER_BATCH: 2 42 | -------------------------------------------------------------------------------- /configs/arichived/quick_schedules/e2e_faster_rcnn_X_101_32x8d_FPN_quick.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d" 4 | BACKBONE: 5 | CONV_BODY: "R-101-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | STRIDE_IN_1X1: False 9 | NUM_GROUPS: 32 10 | WIDTH_PER_GROUP: 8 11 | RPN: 12 | USE_FPN: True 13 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 14 | PRE_NMS_TOP_N_TRAIN: 2000 15 | PRE_NMS_TOP_N_TEST: 1000 16 | POST_NMS_TOP_N_TEST: 1000 17 | FPN_POST_NMS_TOP_N_TEST: 1000 18 | ROI_HEADS: 19 | USE_FPN: True 20 | BATCH_SIZE_PER_IMAGE: 256 21 | ROI_BOX_HEAD: 22 | POOLER_RESOLUTION: 7 23 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 24 | POOLER_SAMPLING_RATIO: 2 25 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 26 | PREDICTOR: "FPNPredictor" 27 | DATASETS: 28 | TRAIN: ("coco_2014_minival",) 29 | TEST: ("coco_2014_minival",) 30 | INPUT: 31 | MIN_SIZE_TRAIN: (600,) 32 | MAX_SIZE_TRAIN: 1000 33 | MIN_SIZE_TEST: 800 34 | MAX_SIZE_TEST: 1000 35 | DATALOADER: 36 | SIZE_DIVISIBILITY: 32 37 | SOLVER: 38 | BASE_LR: 0.005 39 | WEIGHT_DECAY: 0.0001 40 | STEPS: (1500,) 41 | MAX_ITER: 2000 42 | IMS_PER_BATCH: 2 43 | TEST: 44 | IMS_PER_BATCH: 2 45 | -------------------------------------------------------------------------------- /configs/arichived/quick_schedules/e2e_keypoint_rcnn_R_50_FPN_quick.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | BATCH_SIZE_PER_IMAGE: 256 18 | ROI_BOX_HEAD: 19 | POOLER_RESOLUTION: 7 20 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 21 | POOLER_SAMPLING_RATIO: 2 22 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 23 | PREDICTOR: "FPNPredictor" 24 | NUM_CLASSES: 2 25 | ROI_KEYPOINT_HEAD: 26 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 27 | FEATURE_EXTRACTOR: "KeypointRCNNFeatureExtractor" 28 | PREDICTOR: "KeypointRCNNPredictor" 29 | POOLER_RESOLUTION: 14 30 | POOLER_SAMPLING_RATIO: 2 31 | RESOLUTION: 56 32 | SHARE_BOX_FEATURE_EXTRACTOR: False 33 | KEYPOINT_ON: True 34 | DATASETS: 35 | TRAIN: ("keypoints_coco_2014_minival",) 36 | TEST: ("keypoints_coco_2014_minival",) 37 | INPUT: 38 | MIN_SIZE_TRAIN: (640, 672, 704, 736, 768, 800) 39 | MAX_SIZE_TRAIN: 1000 40 | MIN_SIZE_TEST: 800 41 | MAX_SIZE_TEST: 1000 42 | DATALOADER: 43 | SIZE_DIVISIBILITY: 32 44 | SOLVER: 45 | BASE_LR: 0.005 46 | WEIGHT_DECAY: 0.0001 47 | STEPS: (1500,) 48 | MAX_ITER: 2000 49 
| IMS_PER_BATCH: 4 50 | TEST: 51 | IMS_PER_BATCH: 2 52 | -------------------------------------------------------------------------------- /configs/arichived/quick_schedules/e2e_mask_rcnn_R_50_C4_quick.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN: 5 | PRE_NMS_TOP_N_TEST: 6000 6 | POST_NMS_TOP_N_TEST: 1000 7 | ROI_HEADS: 8 | BATCH_SIZE_PER_IMAGE: 256 9 | ROI_MASK_HEAD: 10 | PREDICTOR: "MaskRCNNC4Predictor" 11 | SHARE_BOX_FEATURE_EXTRACTOR: True 12 | MASK_ON: True 13 | DATASETS: 14 | TRAIN: ("coco_2014_minival",) 15 | TEST: ("coco_2014_minival",) 16 | INPUT: 17 | MIN_SIZE_TRAIN: (600,) 18 | MAX_SIZE_TRAIN: 1000 19 | MIN_SIZE_TEST: 800 20 | MAX_SIZE_TEST: 1000 21 | SOLVER: 22 | BASE_LR: 0.005 23 | WEIGHT_DECAY: 0.0001 24 | STEPS: (1500,) 25 | MAX_ITER: 2000 26 | IMS_PER_BATCH: 4 27 | TEST: 28 | IMS_PER_BATCH: 2 29 | -------------------------------------------------------------------------------- /configs/arichived/quick_schedules/e2e_mask_rcnn_R_50_FPN_quick.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | BATCH_SIZE_PER_IMAGE: 256 18 | ROI_BOX_HEAD: 19 | POOLER_RESOLUTION: 7 20 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 21 | POOLER_SAMPLING_RATIO: 2 22 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 23 | PREDICTOR: "FPNPredictor" 24 | ROI_MASK_HEAD: 25 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 26 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 27 | PREDICTOR: "MaskRCNNC4Predictor" 28 | POOLER_RESOLUTION: 14 29 | POOLER_SAMPLING_RATIO: 2 30 | RESOLUTION: 28 31 | SHARE_BOX_FEATURE_EXTRACTOR: False 32 | MASK_ON: True 33 | DATASETS: 34 | TRAIN: ("coco_2014_minival",) 35 | TEST: ("coco_2014_minival",) 36 | INPUT: 37 | MIN_SIZE_TRAIN: (600,) 38 | MAX_SIZE_TRAIN: 1000 39 | MIN_SIZE_TEST: 800 40 | MAX_SIZE_TEST: 1000 41 | DATALOADER: 42 | SIZE_DIVISIBILITY: 32 43 | SOLVER: 44 | BASE_LR: 0.005 45 | WEIGHT_DECAY: 0.0001 46 | STEPS: (1500,) 47 | MAX_ITER: 2000 48 | IMS_PER_BATCH: 4 49 | TEST: 50 | IMS_PER_BATCH: 2 51 | -------------------------------------------------------------------------------- /configs/arichived/quick_schedules/e2e_mask_rcnn_X_101_32x8d_FPN_quick.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d" 4 | BACKBONE: 5 | CONV_BODY: "R-101-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | STRIDE_IN_1X1: False 9 | NUM_GROUPS: 32 10 | WIDTH_PER_GROUP: 8 11 | RPN: 12 | USE_FPN: True 13 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 14 | PRE_NMS_TOP_N_TRAIN: 2000 15 | PRE_NMS_TOP_N_TEST: 1000 16 | POST_NMS_TOP_N_TEST: 1000 17 | FPN_POST_NMS_TOP_N_TEST: 1000 18 | ROI_HEADS: 19 | USE_FPN: True 20 | BATCH_SIZE_PER_IMAGE: 256 21 | ROI_BOX_HEAD: 22 | POOLER_RESOLUTION: 7 23 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 24 | POOLER_SAMPLING_RATIO: 2 25 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 26 | PREDICTOR: "FPNPredictor" 27 | 
ROI_MASK_HEAD: 28 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 29 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 30 | PREDICTOR: "MaskRCNNC4Predictor" 31 | POOLER_RESOLUTION: 14 32 | POOLER_SAMPLING_RATIO: 2 33 | RESOLUTION: 28 34 | SHARE_BOX_FEATURE_EXTRACTOR: False 35 | MASK_ON: True 36 | DATASETS: 37 | TRAIN: ("coco_2014_minival",) 38 | TEST: ("coco_2014_minival",) 39 | INPUT: 40 | MIN_SIZE_TRAIN: (600,) 41 | MAX_SIZE_TRAIN: 1000 42 | MIN_SIZE_TEST: 800 43 | MAX_SIZE_TEST: 1000 44 | DATALOADER: 45 | SIZE_DIVISIBILITY: 32 46 | SOLVER: 47 | BASE_LR: 0.005 48 | WEIGHT_DECAY: 0.0001 49 | STEPS: (1500,) 50 | MAX_ITER: 2000 51 | IMS_PER_BATCH: 2 52 | TEST: 53 | IMS_PER_BATCH: 2 54 | -------------------------------------------------------------------------------- /configs/arichived/quick_schedules/rpn_R_50_C4_quick.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN_ONLY: True 5 | RPN: 6 | PRE_NMS_TOP_N_TEST: 12000 7 | POST_NMS_TOP_N_TEST: 2000 8 | DATASETS: 9 | TRAIN: ("coco_2014_minival",) 10 | TEST: ("coco_2014_minival",) 11 | INPUT: 12 | MIN_SIZE_TRAIN: (600,) 13 | MAX_SIZE_TRAIN: 1000 14 | MIN_SIZE_TEST: 800 15 | MAX_SIZE_TEST: 1000 16 | SOLVER: 17 | BASE_LR: 0.005 18 | WEIGHT_DECAY: 0.0001 19 | STEPS: (1500,) 20 | MAX_ITER: 2000 21 | IMS_PER_BATCH: 4 22 | TEST: 23 | IMS_PER_BATCH: 2 24 | -------------------------------------------------------------------------------- /configs/arichived/quick_schedules/rpn_R_50_FPN_quick.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN_ONLY: True 5 | BACKBONE: 6 | CONV_BODY: "R-50-FPN" 7 | RESNETS: 8 | BACKBONE_OUT_CHANNELS: 256 9 | RPN: 10 | USE_FPN: True 11 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 2000 14 | FPN_POST_NMS_TOP_N_TEST: 2000 15 | DATASETS: 16 | TRAIN: ("coco_2014_minival",) 17 | TEST: ("coco_2014_minival",) 18 | INPUT: 19 | MIN_SIZE_TRAIN: (600,) 20 | MAX_SIZE_TRAIN: 1000 21 | MIN_SIZE_TEST: 800 22 | MAX_SIZE_TEST: 1000 23 | DATALOADER: 24 | SIZE_DIVISIBILITY: 32 25 | SOLVER: 26 | BASE_LR: 0.005 27 | WEIGHT_DECAY: 0.0001 28 | STEPS: (1500,) 29 | MAX_ITER: 2000 30 | IMS_PER_BATCH: 4 31 | TEST: 32 | IMS_PER_BATCH: 2 33 | -------------------------------------------------------------------------------- /configs/arichived/retinanet/retinanet_R-101-FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-101" 4 | RPN_ONLY: True 5 | RETINANET_ON: True 6 | BACKBONE: 7 | CONV_BODY: "R-101-FPN-RETINANET" 8 | RESNETS: 9 | BACKBONE_OUT_CHANNELS: 256 10 | RPN: 11 | USE_FPN: True 12 | FG_IOU_THRESHOLD: 0.5 13 | BG_IOU_THRESHOLD: 0.4 14 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 15 | PRE_NMS_TOP_N_TRAIN: 2000 16 | PRE_NMS_TOP_N_TEST: 1000 17 | POST_NMS_TOP_N_TEST: 1000 18 | FPN_POST_NMS_TOP_N_TEST: 1000 19 | ROI_HEADS: 20 | USE_FPN: True 21 | BATCH_SIZE_PER_IMAGE: 256 22 | ROI_BOX_HEAD: 23 | POOLER_RESOLUTION: 7 24 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 25 | POOLER_SAMPLING_RATIO: 2 26 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 27 | PREDICTOR: "FPNPredictor" 28 | RETINANET: 29 | SCALES_PER_OCTAVE: 3 30 | STRADDLE_THRESH: -1 31 | FG_IOU_THRESHOLD: 0.5 32 | 
BG_IOU_THRESHOLD: 0.4 33 | DATASETS: 34 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 35 | TEST: ("coco_2014_minival",) 36 | INPUT: 37 | MIN_SIZE_TRAIN: (800, ) 38 | MAX_SIZE_TRAIN: 1333 39 | MIN_SIZE_TEST: 800 40 | MAX_SIZE_TEST: 1333 41 | DATALOADER: 42 | SIZE_DIVISIBILITY: 32 43 | SOLVER: 44 | # Assume 4 gpus 45 | BASE_LR: 0.005 46 | WEIGHT_DECAY: 0.0001 47 | STEPS: (120000, 160000) 48 | MAX_ITER: 180000 49 | IMS_PER_BATCH: 8 50 | -------------------------------------------------------------------------------- /configs/arichived/retinanet/retinanet_R-101-FPN_P5_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-101" 4 | RPN_ONLY: True 5 | RETINANET_ON: True 6 | BACKBONE: 7 | CONV_BODY: "R-101-FPN-RETINANET" 8 | RESNETS: 9 | BACKBONE_OUT_CHANNELS: 256 10 | RPN: 11 | USE_FPN: True 12 | FG_IOU_THRESHOLD: 0.5 13 | BG_IOU_THRESHOLD: 0.4 14 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 15 | PRE_NMS_TOP_N_TRAIN: 2000 16 | PRE_NMS_TOP_N_TEST: 1000 17 | POST_NMS_TOP_N_TEST: 1000 18 | FPN_POST_NMS_TOP_N_TEST: 1000 19 | ROI_HEADS: 20 | USE_FPN: True 21 | BATCH_SIZE_PER_IMAGE: 256 22 | ROI_BOX_HEAD: 23 | POOLER_RESOLUTION: 7 24 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 25 | POOLER_SAMPLING_RATIO: 2 26 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 27 | PREDICTOR: "FPNPredictor" 28 | RETINANET: 29 | SCALES_PER_OCTAVE: 3 30 | STRADDLE_THRESH: -1 31 | USE_C5: False 32 | FG_IOU_THRESHOLD: 0.5 33 | BG_IOU_THRESHOLD: 0.4 34 | DATASETS: 35 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 36 | TEST: ("coco_2014_minival",) 37 | INPUT: 38 | MIN_SIZE_TRAIN: (800, ) 39 | MAX_SIZE_TRAIN: 1333 40 | MIN_SIZE_TEST: 800 41 | MAX_SIZE_TEST: 1333 42 | DATALOADER: 43 | SIZE_DIVISIBILITY: 32 44 | SOLVER: 45 | # Assume 4 gpus 46 | BASE_LR: 0.005 47 | WEIGHT_DECAY: 0.0001 48 | STEPS: (120000, 160000) 49 | MAX_ITER: 180000 50 | IMS_PER_BATCH: 8 51 | -------------------------------------------------------------------------------- /configs/arichived/retinanet/retinanet_R-50-FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN_ONLY: True 5 | RETINANET_ON: True 6 | BACKBONE: 7 | CONV_BODY: "R-50-FPN-RETINANET" 8 | RESNETS: 9 | BACKBONE_OUT_CHANNELS: 256 10 | RPN: 11 | USE_FPN: True 12 | FG_IOU_THRESHOLD: 0.5 13 | BG_IOU_THRESHOLD: 0.4 14 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 15 | PRE_NMS_TOP_N_TRAIN: 2000 16 | PRE_NMS_TOP_N_TEST: 1000 17 | POST_NMS_TOP_N_TEST: 1000 18 | FPN_POST_NMS_TOP_N_TEST: 1000 19 | ROI_HEADS: 20 | USE_FPN: True 21 | BATCH_SIZE_PER_IMAGE: 256 22 | ROI_BOX_HEAD: 23 | POOLER_RESOLUTION: 7 24 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 25 | POOLER_SAMPLING_RATIO: 2 26 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 27 | PREDICTOR: "FPNPredictor" 28 | RETINANET: 29 | SCALES_PER_OCTAVE: 3 30 | STRADDLE_THRESH: -1 31 | FG_IOU_THRESHOLD: 0.5 32 | BG_IOU_THRESHOLD: 0.4 33 | DATASETS: 34 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 35 | TEST: ("coco_2014_minival",) 36 | INPUT: 37 | MIN_SIZE_TRAIN: (800,) 38 | MAX_SIZE_TRAIN: 1333 39 | MIN_SIZE_TEST: 800 40 | MAX_SIZE_TEST: 1333 41 | DATALOADER: 42 | SIZE_DIVISIBILITY: 32 43 | SOLVER: 44 | # Assume 4 gpus 45 | BASE_LR: 0.005 46 | WEIGHT_DECAY: 0.0001 47 | STEPS: (120000, 160000) 48 | MAX_ITER: 180000 49 | IMS_PER_BATCH: 8 50 | 
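An aside on how YAML files like the RetinaNet config above are consumed: they are not standalone, but deltas merged over the library's default options. Below is a minimal sketch of that flow, assuming the yacs-style `cfg` node that `pysgg/config/defaults.py` implies; the `pysgg.config` import path is an assumption carried over from the maskrcnn-benchmark lineage, not verified against this repo.

```python
# Hedged sketch: merging a config delta over the library defaults with yacs.
# The `pysgg.config.cfg` import path is assumed from the maskrcnn-benchmark
# lineage this repo derives from; adjust if the package layout differs.
from pysgg.config import cfg

cfg.merge_from_file("configs/arichived/retinanet/retinanet_R-50-FPN_1x.yaml")
# Flat KEY, VALUE pairs override individual options, mirroring the "opts"
# tail these detection frameworks usually accept on the command line:
cfg.merge_from_list(["SOLVER.IMS_PER_BATCH", 2, "SOLVER.BASE_LR", 0.00125])
cfg.freeze()  # make the merged config immutable before building the model

print(cfg.MODEL.RETINANET_ON)  # True, set by the file above
print(cfg.SOLVER.STEPS)        # (120000, 160000)
```

The `# Assume 4 gpus` comments go with the linear scaling convention these configs follow: when `IMS_PER_BATCH` shrinks by some factor, `BASE_LR` is usually shrunk by the same factor (and `STEPS`/`MAX_ITER` stretched accordingly), which is what the single-GPU override above does.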
-------------------------------------------------------------------------------- /configs/arichived/retinanet/retinanet_R-50-FPN_1x_quick.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN_ONLY: True 5 | RETINANET_ON: True 6 | BACKBONE: 7 | CONV_BODY: "R-50-FPN-RETINANET" 8 | RESNETS: 9 | BACKBONE_OUT_CHANNELS: 256 10 | RPN: 11 | USE_FPN: True 12 | FG_IOU_THRESHOLD: 0.5 13 | BG_IOU_THRESHOLD: 0.4 14 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 15 | PRE_NMS_TOP_N_TRAIN: 2000 16 | PRE_NMS_TOP_N_TEST: 1000 17 | POST_NMS_TOP_N_TEST: 1000 18 | FPN_POST_NMS_TOP_N_TEST: 1000 19 | ROI_HEADS: 20 | USE_FPN: True 21 | BATCH_SIZE_PER_IMAGE: 256 22 | ROI_BOX_HEAD: 23 | POOLER_RESOLUTION: 7 24 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 25 | POOLER_SAMPLING_RATIO: 2 26 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 27 | PREDICTOR: "FPNPredictor" 28 | RETINANET: 29 | SCALES_PER_OCTAVE: 3 30 | STRADDLE_THRESH: -1 31 | FG_IOU_THRESHOLD: 0.5 32 | BG_IOU_THRESHOLD: 0.4 33 | DATASETS: 34 | TRAIN: ("coco_2014_minival",) 35 | TEST: ("coco_2014_minival",) 36 | INPUT: 37 | MIN_SIZE_TRAIN: (600,) 38 | MAX_SIZE_TRAIN: 1000 39 | MIN_SIZE_TEST: 800 40 | MAX_SIZE_TEST: 1000 41 | DATALOADER: 42 | SIZE_DIVISIBILITY: 32 43 | SOLVER: 44 | BASE_LR: 0.005 45 | WEIGHT_DECAY: 0.0001 46 | STEPS: (3500,) 47 | MAX_ITER: 4000 48 | IMS_PER_BATCH: 4 49 | -------------------------------------------------------------------------------- /configs/arichived/retinanet/retinanet_R-50-FPN_P5_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | RPN_ONLY: True 5 | RETINANET_ON: True 6 | BACKBONE: 7 | CONV_BODY: "R-50-FPN-RETINANET" 8 | RESNETS: 9 | BACKBONE_OUT_CHANNELS: 256 10 | RPN: 11 | USE_FPN: True 12 | FG_IOU_THRESHOLD: 0.5 13 | BG_IOU_THRESHOLD: 0.4 14 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 15 | PRE_NMS_TOP_N_TRAIN: 2000 16 | PRE_NMS_TOP_N_TEST: 1000 17 | POST_NMS_TOP_N_TEST: 1000 18 | FPN_POST_NMS_TOP_N_TEST: 1000 19 | ROI_HEADS: 20 | USE_FPN: True 21 | BATCH_SIZE_PER_IMAGE: 256 22 | ROI_BOX_HEAD: 23 | POOLER_RESOLUTION: 7 24 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 25 | POOLER_SAMPLING_RATIO: 2 26 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 27 | PREDICTOR: "FPNPredictor" 28 | RETINANET: 29 | SCALES_PER_OCTAVE: 3 30 | STRADDLE_THRESH: -1 31 | USE_C5: False 32 | FG_IOU_THRESHOLD: 0.5 33 | BG_IOU_THRESHOLD: 0.4 34 | DATASETS: 35 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 36 | TEST: ("coco_2014_minival",) 37 | INPUT: 38 | MIN_SIZE_TRAIN: (800,) 39 | MAX_SIZE_TRAIN: 1333 40 | MIN_SIZE_TEST: 800 41 | MAX_SIZE_TEST: 1333 42 | DATALOADER: 43 | SIZE_DIVISIBILITY: 32 44 | SOLVER: 45 | # Assume 4 gpus 46 | BASE_LR: 0.005 47 | WEIGHT_DECAY: 0.0001 48 | STEPS: (120000, 160000) 49 | MAX_ITER: 180000 50 | IMS_PER_BATCH: 8 51 | -------------------------------------------------------------------------------- /configs/arichived/retinanet/retinanet_X_101_32x8d_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d" 4 | RPN_ONLY: True 5 | RETINANET_ON: True 6 | BACKBONE: 7 | CONV_BODY: "R-101-FPN-RETINANET" 8 | RESNETS: 9 | BACKBONE_OUT_CHANNELS: 256 10 | STRIDE_IN_1X1: False 11 | 
NUM_GROUPS: 32 12 | WIDTH_PER_GROUP: 8 13 | RPN: 14 | USE_FPN: True 15 | FG_IOU_THRESHOLD: 0.5 16 | BG_IOU_THRESHOLD: 0.4 17 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 18 | PRE_NMS_TOP_N_TRAIN: 2000 19 | PRE_NMS_TOP_N_TEST: 1000 20 | POST_NMS_TOP_N_TEST: 1000 21 | FPN_POST_NMS_TOP_N_TEST: 1000 22 | ROI_HEADS: 23 | USE_FPN: True 24 | BATCH_SIZE_PER_IMAGE: 256 25 | ROI_BOX_HEAD: 26 | POOLER_RESOLUTION: 7 27 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 28 | POOLER_SAMPLING_RATIO: 2 29 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 30 | PREDICTOR: "FPNPredictor" 31 | RETINANET: 32 | SCALES_PER_OCTAVE: 3 33 | STRADDLE_THRESH: -1 34 | FG_IOU_THRESHOLD: 0.5 35 | BG_IOU_THRESHOLD: 0.4 36 | DATASETS: 37 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 38 | TEST: ("coco_2014_minival",) 39 | INPUT: 40 | MIN_SIZE_TRAIN: (800, ) 41 | MAX_SIZE_TRAIN: 1333 42 | MIN_SIZE_TEST: 800 43 | MAX_SIZE_TEST: 1333 44 | DATALOADER: 45 | SIZE_DIVISIBILITY: 32 46 | SOLVER: 47 | # Assume 4 gpus 48 | BASE_LR: 0.0025 49 | WEIGHT_DECAY: 0.0001 50 | STEPS: (240000, 320000) 51 | MAX_ITER: 360000 52 | IMS_PER_BATCH: 4 53 | -------------------------------------------------------------------------------- /configs/arichived/test_time_aug/e2e_mask_rcnn_R_50_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | BACKBONE: 5 | CONV_BODY: "R-50-FPN" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 256 8 | RPN: 9 | USE_FPN: True 10 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 11 | PRE_NMS_TOP_N_TRAIN: 2000 12 | PRE_NMS_TOP_N_TEST: 1000 13 | POST_NMS_TOP_N_TEST: 1000 14 | FPN_POST_NMS_TOP_N_TEST: 1000 15 | ROI_HEADS: 16 | USE_FPN: True 17 | ROI_BOX_HEAD: 18 | POOLER_RESOLUTION: 7 19 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 20 | POOLER_SAMPLING_RATIO: 2 21 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 22 | PREDICTOR: "FPNPredictor" 23 | ROI_MASK_HEAD: 24 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 25 | FEATURE_EXTRACTOR: "MaskRCNNFPNFeatureExtractor" 26 | PREDICTOR: "MaskRCNNC4Predictor" 27 | POOLER_RESOLUTION: 14 28 | POOLER_SAMPLING_RATIO: 2 29 | RESOLUTION: 28 30 | SHARE_BOX_FEATURE_EXTRACTOR: False 31 | MASK_ON: True 32 | DATASETS: 33 | TRAIN: ("coco_2014_train", "coco_2014_valminusminival") 34 | TEST: ("coco_2014_minival",) 35 | DATALOADER: 36 | SIZE_DIVISIBILITY: 32 37 | SOLVER: 38 | BASE_LR: 0.02 39 | WEIGHT_DECAY: 0.0001 40 | STEPS: (60000, 80000) 41 | MAX_ITER: 90000 42 | TEST: 43 | BBOX_AUG: 44 | ENABLED: True 45 | H_FLIP: True 46 | SCALES: (400, 500, 600, 700, 900, 1000, 1100, 1200) 47 | MAX_SIZE: 2000 48 | SCALE_H_FLIP: True 49 | -------------------------------------------------------------------------------- /configs/e2e_relation_det_R_50_C4_1x.yaml: -------------------------------------------------------------------------------- 1 | MODEL: 2 | META_ARCHITECTURE: "GeneralizedRCNN" 3 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50" 4 | BACKBONE: 5 | CONV_BODY: "R-50-C4" 6 | RESNETS: 7 | BACKBONE_OUT_CHANNELS: 1024 8 | FLIP_AUG: True 9 | RELATION_ON: False 10 | RPN: 11 | ANCHOR_SIZES: (35.54447264, 65.97050352, 115.4708024, 201.64208208, 363.3643696) # from neural-motifs 12 | ANCHOR_STRIDE: (16, ) 13 | ASPECT_RATIOS: (0.23232838, 0.63365731, 1.28478321, 3.15089189) # from neural-motifs 14 | BATCH_SIZE_PER_IMAGE: 256 15 | BG_IOU_THRESHOLD: 0.3 16 | FG_IOU_THRESHOLD: 0.7 17 | MIN_SIZE: 0 18 | NMS_THRESH: 0.7 19 | POSITIVE_FRACTION: 0.5 20 | POST_NMS_TOP_N_TEST: 1000 21 | 
POST_NMS_TOP_N_TRAIN: 2000 22 | PRE_NMS_TOP_N_TEST: 6000 23 | PRE_NMS_TOP_N_TRAIN: 12000 24 | RPN_HEAD: SingleConvRPNHead 25 | RPN_MID_CHANNEL: 1024 26 | STRADDLE_THRESH: 0 27 | USE_FPN: False 28 | ROI_HEADS: 29 | USE_FPN: False 30 | POSITIVE_FRACTION: 0.3 31 | BG_IOU_THRESHOLD: 0.5 32 | FG_IOU_THRESHOLD: 0.5 33 | BATCH_SIZE_PER_IMAGE: 256 34 | DETECTIONS_PER_IMG: 256 35 | ROI_BOX_HEAD: 36 | POOLER_RESOLUTION: 7 37 | POOLER_SCALES: (0.0625, ) 38 | POOLER_SAMPLING_RATIO: 0 39 | FEATURE_EXTRACTOR: "ResNet50Conv5ROIFeatureExtractor" 40 | PREDICTOR: "FastRCNNPredictor" 41 | NUM_CLASSES: 151 # 151 for VG, 1201 for GQA 42 | MLP_HEAD_DIM: 2048 43 | DATASETS: 44 | TRAIN: ("VG_stanford_filtered_with_attribute_train",) 45 | VAL: ("VG_stanford_filtered_with_attribute_val",) 46 | TEST: ("VG_stanford_filtered_with_attribute_test",) 47 | DATALOADER: 48 | SIZE_DIVISIBILITY: 32 49 | SOLVER: 50 | BASE_LR: 0.01 51 | WEIGHT_DECAY: 0.0001 52 | WARMUP_FACTOR: 0.1 53 | MOMENTUM: 0.9 54 | GRAD_NORM_CLIP: 5.0 55 | STEPS: (90000, 120000) 56 | MAX_ITER: 180000 57 | PRINT_GRAD_FREQ: 5000 58 | OUTPUT_DIR: './output/relation_baseline' 59 | -------------------------------------------------------------------------------- /configs/e2e_relation_detector_R_101_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (600,) 3 | MAX_SIZE_TRAIN: 1000 4 | MIN_SIZE_TEST: 600 5 | MAX_SIZE_TEST: 1000 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "catalog://ImageNetPretrained/MSRA/R-101" 9 | BACKBONE: 10 | CONV_BODY: "R-101-FPN" 11 | RESNETS: 12 | BACKBONE_OUT_CHANNELS: 512 13 | RELATION_ON: False 14 | ATTRIBUTE_ON: False 15 | FLIP_AUG: False 16 | RPN: 17 | USE_FPN: True 18 | ANCHOR_SIZES: (32, 64, 128, 256, 512) 19 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 20 | ASPECT_RATIOS: (0.23232838, 0.63365731, 1.28478321, 3.15089189) # from neural-motifs 21 | PRE_NMS_TOP_N_TRAIN: 12000 22 | PRE_NMS_TOP_N_TEST: 6000 23 | POST_NMS_TOP_N_TRAIN: 2000 24 | POST_NMS_TOP_N_TEST: 1000 25 | FPN_POST_NMS_TOP_N_TRAIN: 2000 26 | FPN_POST_NMS_TOP_N_TEST: 2000 27 | FPN_POST_NMS_PER_BATCH: False 28 | RPN_MID_CHANNEL: 512 29 | ROI_HEADS: 30 | USE_FPN: True 31 | POSITIVE_FRACTION: 0.5 32 | BG_IOU_THRESHOLD: 0.3 33 | BATCH_SIZE_PER_IMAGE: 256 34 | DETECTIONS_PER_IMG: 256 35 | ROI_BOX_HEAD: 36 | POOLER_RESOLUTION: 7 37 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 38 | POOLER_SAMPLING_RATIO: 2 39 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 40 | PREDICTOR: "FPNPredictor" 41 | NUM_CLASSES: 151 # 151 for VG, 1201 for GQA 42 | MLP_HEAD_DIM: 4096 43 | ROI_ATTRIBUTE_HEAD: 44 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 45 | PREDICTOR: "FPNPredictor" 46 | USE_BINARY_LOSS: True # choose binary, because the cross_entropy loss deteriorates the box head, even with a 0.1 weight 47 | POS_WEIGHT: 50.0 48 | ATTRIBUTE_LOSS_WEIGHT: 1.0 49 | NUM_ATTRIBUTES: 201 # 201 for VG, 501 for GQA 50 | MAX_ATTRIBUTES: 10 51 | ATTRIBUTE_BGFG_SAMPLE: True 52 | ATTRIBUTE_BGFG_RATIO: 3 53 | DATASETS: 54 | TRAIN: ("VG_stanford_filtered_with_attribute_train",) 55 | VAL: ("VG_stanford_filtered_with_attribute_val",) 56 | TEST: ("VG_stanford_filtered_with_attribute_test",) 57 | DATALOADER: 58 | SIZE_DIVISIBILITY: 32 59 | SOLVER: 60 | BASE_LR: 0.001 61 | WEIGHT_DECAY: 0.0001 62 | WARMUP_FACTOR: 0.1 63 | MOMENTUM: 0.9 64 | GRAD_NORM_CLIP: 5.0 65 | STEPS: (90000, 120000) 66 | MAX_ITER: 180000 67 | PRINT_GRAD_FREQ: 5000 68 | OUTPUT_DIR: './checkpoints' 69 | 70 |
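The SOLVER blocks in these relation-detector configs (BASE_LR, WARMUP_FACTOR, STEPS, MAX_ITER) describe a linear-warmup, multi-step decay schedule. Below is a minimal sketch of the resulting learning-rate rule, assuming the GAMMA=0.1 decay and 500-iteration warmup defaults of the maskrcnn-benchmark lineage — assumptions, not values read from these files.

```python
# Hedged sketch of the warmup multi-step schedule the SOLVER blocks imply.
# gamma=0.1 and warmup_iters=500 are the usual defaults in the
# maskrcnn-benchmark lineage; treat them as assumptions, not repo facts.
from bisect import bisect_right

def lr_at(iteration, base_lr=0.001, steps=(90000, 120000),
          warmup_factor=0.1, warmup_iters=500, gamma=0.1):
    """Learning rate at a given iteration: linear warmup, then step decay."""
    if iteration < warmup_iters:
        alpha = iteration / warmup_iters
        warmup = warmup_factor * (1 - alpha) + alpha  # ramps linearly to 1.0
    else:
        warmup = 1.0
    # gamma is applied once per STEPS milestone already passed
    return base_lr * warmup * gamma ** bisect_right(steps, iteration)

print(lr_at(0))       # 0.0001  (BASE_LR * WARMUP_FACTOR)
print(lr_at(10000))   # 0.001   (warmup finished, before the first milestone)
print(lr_at(100000))  # 0.0001  (after the 90000-iteration milestone)
```

So under the config above, training warms up from 1e-4 to 1e-3 over the first iterations, then drops tenfold at iterations 90000 and 120000 and runs at 1e-5 until MAX_ITER 180000.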
-------------------------------------------------------------------------------- /configs/e2e_relation_detector_VGG16_1x.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (600,) 3 | MAX_SIZE_TRAIN: 1000 4 | MIN_SIZE_TEST: 600 5 | MAX_SIZE_TEST: 1000 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | BACKBONE: 9 | CONV_BODY: "VGG-16" 10 | RESNETS: 11 | BACKBONE_OUT_CHANNELS: 512 12 | RELATION_ON: False 13 | ATTRIBUTE_ON: False 14 | FLIP_AUG: False 15 | RPN: 16 | USE_FPN: False 17 | ANCHOR_SIZES: (32, 64, 128, 256, 512) 18 | ANCHOR_STRIDE: (16,) 19 | ASPECT_RATIOS: (0.23232838, 0.63365731, 1.28478321, 3.15089189) # from neural-motifs 20 | PRE_NMS_TOP_N_TRAIN: 12000 21 | PRE_NMS_TOP_N_TEST: 6000 22 | POST_NMS_TOP_N_TRAIN: 2000 23 | POST_NMS_TOP_N_TEST: 1000 24 | FPN_POST_NMS_TOP_N_TRAIN: 2000 25 | FPN_POST_NMS_TOP_N_TEST: 2000 26 | FPN_POST_NMS_PER_BATCH: False 27 | RPN_MID_CHANNEL: 512 28 | ROI_HEADS: 29 | USE_FPN: True 30 | POSITIVE_FRACTION: 0.5 31 | BG_IOU_THRESHOLD: 0.3 32 | BATCH_SIZE_PER_IMAGE: 256 33 | DETECTIONS_PER_IMG: 256 34 | ROI_BOX_HEAD: 35 | POOLER_RESOLUTION: 7 36 | POOLER_SCALES: (0.0625,) 37 | POOLER_SAMPLING_RATIO: 2 38 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 39 | PREDICTOR: "FPNPredictor" 40 | NUM_CLASSES: 151 # 151 for VG, 1201 for GQA 41 | MLP_HEAD_DIM: 2048 42 | ROI_ATTRIBUTE_HEAD: 43 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 44 | PREDICTOR: "FPNPredictor" 45 | USE_BINARY_LOSS: True # choose binary, because the cross_entropy loss deteriorates the box head, even with a 0.1 weight 46 | POS_WEIGHT: 50.0 47 | ATTRIBUTE_LOSS_WEIGHT: 1.0 48 | NUM_ATTRIBUTES: 201 # 201 for VG, 501 for GQA 49 | MAX_ATTRIBUTES: 10 50 | ATTRIBUTE_BGFG_SAMPLE: True 51 | ATTRIBUTE_BGFG_RATIO: 3 52 | DATASETS: 53 | TRAIN: ("VG_stanford_filtered_with_attribute_train",) 54 | VAL: ("VG_stanford_filtered_with_attribute_val",) 55 | TEST: ("VG_stanford_filtered_with_attribute_test",) 56 | DATALOADER: 57 | SIZE_DIVISIBILITY: 32 58 | SOLVER: 59 | BASE_LR: 0.001 60 | WEIGHT_DECAY: 0.0001 61 | WARMUP_FACTOR: 0.1 62 | MOMENTUM: 0.9 63 | GRAD_NORM_CLIP: 5.0 64 | STEPS: (30000, 45000) 65 | MAX_ITER: 90000 66 | PRINT_GRAD_FREQ: 5000 67 | OUTPUT_DIR: './output/relation_baseline' 68 | 69 | -------------------------------------------------------------------------------- /configs/e2e_relation_detector_X_101_32_8_FPN_1x.yaml: -------------------------------------------------------------------------------- 1 | INPUT: 2 | MIN_SIZE_TRAIN: (600,) 3 | MAX_SIZE_TRAIN: 1000 4 | MIN_SIZE_TEST: 600 5 | MAX_SIZE_TEST: 1000 6 | MODEL: 7 | META_ARCHITECTURE: "GeneralizedRCNN" 8 | WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d" 9 | BACKBONE: 10 | CONV_BODY: "R-101-FPN" 11 | RESNETS: 12 | BACKBONE_OUT_CHANNELS: 256 13 | STRIDE_IN_1X1: False 14 | NUM_GROUPS: 32 15 | WIDTH_PER_GROUP: 8 16 | RELATION_ON: False 17 | ATTRIBUTE_ON: False 18 | FLIP_AUG: False 19 | RPN: 20 | USE_FPN: True 21 | ANCHOR_SIZES: (32, 64, 128, 256, 512) 22 | ANCHOR_STRIDE: (4, 8, 16, 32, 64) 23 | ASPECT_RATIOS: (0.23232838, 0.63365731, 1.28478321, 3.15089189) # from neural-motifs 24 | PRE_NMS_TOP_N_TRAIN: 12000 25 | PRE_NMS_TOP_N_TEST: 6000 26 | POST_NMS_TOP_N_TRAIN: 2000 27 | POST_NMS_TOP_N_TEST: 1000 28 | FPN_POST_NMS_TOP_N_TRAIN: 2000 29 | FPN_POST_NMS_TOP_N_TEST: 2000 30 | FPN_POST_NMS_PER_BATCH: False 31 | RPN_MID_CHANNEL: 256 32 | ROI_HEADS: 33 | USE_FPN: True 34 | POSITIVE_FRACTION: 0.5 35 | BG_IOU_THRESHOLD: 0.3 36 | BATCH_SIZE_PER_IMAGE: 256 37 |
DETECTIONS_PER_IMG: 256 38 | ROI_BOX_HEAD: 39 | POOLER_RESOLUTION: 7 40 | POOLER_SCALES: (0.25, 0.125, 0.0625, 0.03125) 41 | POOLER_SAMPLING_RATIO: 2 42 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 43 | PREDICTOR: "FPNPredictor" 44 | NUM_CLASSES: 151 # 151 for VG, 1201 for GQA 45 | MLP_HEAD_DIM: 4096 46 | ROI_ATTRIBUTE_HEAD: 47 | FEATURE_EXTRACTOR: "FPN2MLPFeatureExtractor" 48 | PREDICTOR: "FPNPredictor" 49 | USE_BINARY_LOSS: True # choose binary, because the cross_entropy loss deteriorates the box head, even with a 0.1 weight 50 | POS_WEIGHT: 50.0 51 | ATTRIBUTE_LOSS_WEIGHT: 1.0 52 | NUM_ATTRIBUTES: 201 # 201 for VG, 501 for GQA 53 | MAX_ATTRIBUTES: 10 54 | ATTRIBUTE_BGFG_SAMPLE: True 55 | ATTRIBUTE_BGFG_RATIO: 3 56 | DATASETS: 57 | TRAIN: ("VG_stanford_filtered_with_attribute_train",) 58 | VAL: ("VG_stanford_filtered_with_attribute_val",) 59 | TEST: ("VG_stanford_filtered_with_attribute_test",) 60 | DATALOADER: 61 | SIZE_DIVISIBILITY: 32 62 | SOLVER: 63 | BASE_LR: 0.001 64 | WEIGHT_DECAY: 0.0001 65 | WARMUP_FACTOR: 0.1 66 | MOMENTUM: 0.9 67 | GRAD_NORM_CLIP: 5.0 68 | STEPS: (90000, 120000) 69 | MAX_ITER: 180000 70 | PRINT_GRAD_FREQ: 5000 71 | OUTPUT_DIR: './output/relation_baseline' 72 | 73 | -------------------------------------------------------------------------------- /demo/.gitignore: -------------------------------------------------------------------------------- 1 | cache 2 | static 3 | *.pyc 4 | __pycache__ 5 | db.sqlite3 6 | -------------------------------------------------------------------------------- /demo/README.md: -------------------------------------------------------------------------------- 1 | ## Webcam and Jupyter notebook demo 2 | 3 | This folder contains a simple webcam demo that illustrates how you can use `maskrcnn_benchmark` for inference.
4 | 5 | 6 | ### With your preferred environment 7 | 8 | You can start the demo from this folder using one of the following commands: 9 | ```bash 10 | # by default, it runs on the GPU 11 | # for best results, use min-image-size 800 12 | python webcam.py --min-image-size 800 13 | # can also run it on the CPU 14 | python webcam.py --min-image-size 300 MODEL.DEVICE cpu 15 | # or change the model that you want to use 16 | python webcam.py --config-file ../configs/caffe2/e2e_mask_rcnn_R_101_FPN_1x_caffe2.yaml --min-image-size 300 MODEL.DEVICE cpu 17 | # in order to see the probability heatmaps, pass --show-mask-heatmaps 18 | python webcam.py --min-image-size 300 --show-mask-heatmaps MODEL.DEVICE cpu 19 | ``` 20 | 21 | ### With Docker 22 | 23 | Build the image with the tag `maskrcnn-benchmark` (check [INSTALL.md](../INSTALL.md) for instructions). 24 | 25 | Adjust the permissions of the X server host (be careful with this step; refer to 26 | [here](http://wiki.ros.org/docker/Tutorials/GUI) for alternatives): 27 | 28 | ```bash 29 | xhost + 30 | ``` 31 | 32 | Then run a container with the demo: 33 | 34 | ``` 35 | docker run --rm -it \ 36 | -e DISPLAY=${DISPLAY} \ 37 | --privileged \ 38 | -v /tmp/.X11-unix:/tmp/.X11-unix \ 39 | --device=/dev/video0:/dev/video0 \ 40 | --ipc=host maskrcnn-benchmark \ 41 | python demo/webcam.py --min-image-size 300 \ 42 | --config-file configs/caffe2/e2e_mask_rcnn_R_50_FPN_1x_caffe2.yaml 43 | ``` 44 | 45 | **DISCLAIMER:** *This was tested on an Ubuntu 16.04 machine; 46 | the volume mapping may vary depending on your platform.* 47 | -------------------------------------------------------------------------------- /demo/TDE_Results1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/demo/TDE_Results1.png -------------------------------------------------------------------------------- /demo/TDE_Results2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/demo/TDE_Results2.png -------------------------------------------------------------------------------- /demo/TDE_Results3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/demo/TDE_Results3.png -------------------------------------------------------------------------------- /demo/demo_e2e_mask_rcnn_R_50_FPN_1x.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/demo/demo_e2e_mask_rcnn_R_50_FPN_1x.png -------------------------------------------------------------------------------- /demo/demo_e2e_mask_rcnn_X_101_32x8d_FPN_1x.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/demo/demo_e2e_mask_rcnn_X_101_32x8d_FPN_1x.png -------------------------------------------------------------------------------- /demo/output_format.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/demo/output_format.png --------------------------------------------------------------------------------
/demo/relation_head.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/demo/relation_head.png -------------------------------------------------------------------------------- /demo/teaser_figure.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/demo/teaser_figure.png -------------------------------------------------------------------------------- /demo/vis_demo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/demo/vis_demo/__init__.py -------------------------------------------------------------------------------- /demo/vis_demo/manage.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python 2 | """Django's command-line utility for administrative tasks.""" 3 | import os 4 | import sys 5 | 6 | 7 | def main(): 8 | os.environ.setdefault('DJANGO_SETTINGS_MODULE', 'vis_demo.settings') 9 | try: 10 | from django.core.management import execute_from_command_line 11 | except ImportError as exc: 12 | raise ImportError( 13 | "Couldn't import Django. Are you sure it's installed and " 14 | "available on your PYTHONPATH environment variable? Did you " 15 | "forget to activate a virtual environment?" 16 | ) from exc 17 | execute_from_command_line(sys.argv) 18 | 19 | 20 | if __name__ == '__main__': 21 | main() 22 | -------------------------------------------------------------------------------- /demo/vis_demo/thesis_demo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/demo/vis_demo/thesis_demo/__init__.py -------------------------------------------------------------------------------- /demo/vis_demo/thesis_demo/admin.py: -------------------------------------------------------------------------------- 1 | from django.contrib import admin 2 | 3 | # Register your models here. 4 | -------------------------------------------------------------------------------- /demo/vis_demo/thesis_demo/apps.py: -------------------------------------------------------------------------------- 1 | from django.apps import AppConfig 2 | 3 | 4 | class ThesisDemoConfig(AppConfig): 5 | name = 'thesis_demo' 6 | -------------------------------------------------------------------------------- /demo/vis_demo/thesis_demo/migrations/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/demo/vis_demo/thesis_demo/migrations/__init__.py -------------------------------------------------------------------------------- /demo/vis_demo/thesis_demo/models.py: -------------------------------------------------------------------------------- 1 | from django.db import models 2 | 3 | # Create your models here. 
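The `vis_demo` application above is a standard Django project, so it can be served with the usual development workflow. A sketch, assuming the Python dependencies are installed and the app's config under `thesis_demo/cfgs/` points at a trained checkpoint:

```bash
# From demo/vis_demo/ -- the project targets the Django 2.2-era APIs
# referenced in its settings and URL configuration.
pip install "Django>=2.2,<3"
python manage.py runserver 0.0.0.0:8000
# then open http://localhost:8000 and upload a .jpg/.png/.jpeg image
```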
4 | -------------------------------------------------------------------------------- /demo/vis_demo/thesis_demo/my_tranform.py: -------------------------------------------------------------------------------- 1 | from torchvision.transforms import functional as TF 2 | 3 | 4 | class Compose(object): 5 | def __init__(self, transforms): 6 | self.transforms = transforms 7 | 8 | def __call__(self, image): 9 | for t in self.transforms: 10 | image = t(image) 11 | return image 12 | 13 | def __repr__(self): 14 | format_string = self.__class__.__name__ + "(" 15 | for t in self.transforms: 16 | format_string += "\n" 17 | format_string += " {0}".format(t) 18 | format_string += "\n)" 19 | return format_string 20 | 21 | 22 | class Resize(object): 23 | def __init__(self, min_size, max_size): 24 | self.min_size = min_size 25 | self.max_size = max_size 26 | 27 | # modified from torchvision to add support for max size 28 | def get_size(self, image_size): 29 | w, h = image_size 30 | size = self.min_size 31 | max_size = self.max_size 32 | if max_size is not None: 33 | min_original_size = float(min((w, h))) 34 | max_original_size = float(max((w, h))) 35 | if max_original_size / min_original_size * size > max_size: 36 | size = int(round(max_size * min_original_size / max_original_size)) 37 | 38 | if (w <= h and w == size) or (h <= w and h == size): 39 | return (h, w) 40 | 41 | if w < h: 42 | ow = size 43 | oh = int(size * h / w) 44 | else: 45 | oh = size 46 | ow = int(size * w / h) 47 | 48 | return (oh, ow) 49 | 50 | def __call__(self, image): 51 | size = self.get_size(image.size) 52 | image = TF.resize(image, size) 53 | return image 54 | 55 | 56 | class Normalize(object): 57 | def __init__(self, mean, std, to_bgr255=True): 58 | self.mean = mean 59 | self.std = std 60 | self.to_bgr255 = to_bgr255 61 | 62 | def __call__(self, image): 63 | if self.to_bgr255: 64 | image = image[[2, 1, 0]] * 255 65 | image = TF.normalize(image, mean=self.mean, std=self.std) 66 | return image 67 | 68 | 69 | class ToTensor(object): 70 | def __call__(self, image): 71 | return TF.to_tensor(image) 72 | -------------------------------------------------------------------------------- /demo/vis_demo/thesis_demo/tests.py: -------------------------------------------------------------------------------- 1 | from django.test import TestCase 2 | 3 | # Create your tests here. 4 | -------------------------------------------------------------------------------- /demo/vis_demo/thesis_demo/urls.py: -------------------------------------------------------------------------------- 1 | from django.urls import path 2 | 3 | from . import views 4 | 5 | urlpatterns = [ 6 | path('', views.upload, name='upload'), 7 | ] -------------------------------------------------------------------------------- /demo/vis_demo/thesis_demo/views.py: -------------------------------------------------------------------------------- 1 | import json 2 | import os 3 | import time 4 | 5 | from django.core.files.storage import FileSystemStorage 6 | from django.shortcuts import render 7 | 8 | 9 | from . 
import vrd_demo 10 | detector = vrd_demo.VRDPredictor("thesis_demo") 11 | 12 | 13 | def show(request, img_dir): 14 | print(img_dir) 15 | start = time.time() 16 | det_res = detector.inference(img_dir) 17 | print("cost time: %f" % (time.time() - start)) 18 | context = { 19 | "det_res": json.dumps([det_res]) 20 | } 21 | return render(request, 'res_vis.html', context=context) 22 | 23 | 24 | def upload(request): 25 | context = {} 26 | if request.method == 'POST': 27 | 28 | uploaded_file = request.FILES.get('image') 29 | if uploaded_file is None: 30 | return render(request, 'upload.html', context) 31 | fs = FileSystemStorage() 32 | if uploaded_file.name.split('.')[-1] not in ["jpg", 'png', 'jpeg']: 33 | return render(request, 'upload.html', context) 34 | f_dir = os.path.join('thesis_demo/static/img_cache', uploaded_file.name) 35 | fs.save(f_dir, uploaded_file) 36 | return show(request, f_dir) 37 | 38 | return render(request, 'upload.html', context) 39 | 40 | 41 | -------------------------------------------------------------------------------- /demo/vis_demo/urls.py: -------------------------------------------------------------------------------- 1 | """vis_demo URL Configuration 2 | 3 | The `urlpatterns` list routes URLs to views. For more information please see: 4 | https://docs.djangoproject.com/en/2.2/topics/http/urls/ 5 | Examples: 6 | Function views 7 | 1. Add an import: from my_app import views 8 | 2. Add a URL to urlpatterns: path('', views.home, name='home') 9 | Class-based views 10 | 1. Add an import: from other_app.views import Home 11 | 2. Add a URL to urlpatterns: path('', Home.as_view(), name='home') 12 | Including another URLconf 13 | 1. Import the include() function: from django.urls import include, path 14 | 2. Add a URL to urlpatterns: path('blog/', include('blog.urls')) 15 | """ 16 | from django.contrib import admin 17 | from django.urls import path, include 18 | 19 | urlpatterns = [ 20 | path('admin/', admin.site.urls), 21 | path('', include('thesis_demo.urls')) 22 | ] 23 | -------------------------------------------------------------------------------- /demo/vis_demo/vis_demo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/demo/vis_demo/vis_demo/__init__.py -------------------------------------------------------------------------------- /demo/vis_demo/vis_demo/urls.py: -------------------------------------------------------------------------------- 1 | """vis_demo URL Configuration 2 | 3 | The `urlpatterns` list routes URLs to views. For more information please see: 4 | https://docs.djangoproject.com/en/2.2/topics/http/urls/ 5 | Examples: 6 | Function views 7 | 1. Add an import: from my_app import views 8 | 2. Add a URL to urlpatterns: path('', views.home, name='home') 9 | Class-based views 10 | 1. Add an import: from other_app.views import Home 11 | 2. Add a URL to urlpatterns: path('', Home.as_view(), name='home') 12 | Including another URLconf 13 | 1. Import the include() function: from django.urls import include, path 14 | 2. 
Add a URL to urlpatterns: path('blog/', include('blog.urls')) 15 | """ 16 | from django.contrib import admin 17 | from django.urls import path, include 18 | 19 | urlpatterns = [ 20 | path('admin/', admin.site.urls), 21 | path('', include('thesis_demo.urls')) 22 | ] 23 | -------------------------------------------------------------------------------- /demo/vis_demo/vis_demo/wsgi.py: -------------------------------------------------------------------------------- 1 | """ 2 | WSGI config for vis_demo project. 3 | 4 | It exposes the WSGI callable as a module-level variable named ``application``. 5 | 6 | For more information on this file, see 7 | https://docs.djangoproject.com/en/2.2/howto/deployment/wsgi/ 8 | """ 9 | 10 | import os 11 | 12 | from django.core.wsgi import get_wsgi_application 13 | 14 | os.environ.setdefault('DJANGO_SETTINGS_MODULE', 'vis_demo.settings') 15 | 16 | application = get_wsgi_application() 17 | -------------------------------------------------------------------------------- /demo/vis_demo/wsgi.py: -------------------------------------------------------------------------------- 1 | """ 2 | WSGI config for vis_demo project. 3 | 4 | It exposes the WSGI callable as a module-level variable named ``application``. 5 | 6 | For more information on this file, see 7 | https://docs.djangoproject.com/en/2.2/howto/deployment/wsgi/ 8 | """ 9 | 10 | import os 11 | 12 | from django.core.wsgi import get_wsgi_application 13 | 14 | os.environ.setdefault('DJANGO_SETTINGS_MODULE', 'vis_demo.settings') 15 | 16 | application = get_wsgi_application() 17 | -------------------------------------------------------------------------------- /demo/webcam.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | import argparse 3 | import cv2 4 | 5 | from pysgg.config import cfg 6 | from predictor import COCODemo 7 | 8 | import time 9 | 10 | 11 | def main(): 12 | parser = argparse.ArgumentParser(description="PyTorch Object Detection Webcam Demo") 13 | parser.add_argument( 14 | "--config-file", 15 | default="../configs/caffe2/e2e_mask_rcnn_R_50_FPN_1x_caffe2.yaml", 16 | metavar="FILE", 17 | help="path to config file", 18 | ) 19 | parser.add_argument( 20 | "--confidence-threshold", 21 | type=float, 22 | default=0.7, 23 | help="Minimum score for the prediction to be shown", 24 | ) 25 | parser.add_argument( 26 | "--min-image-size", 27 | type=int, 28 | default=224, 29 | help="Smallest size of the image to feed to the model. 
" 30 | "Model was trained with 800, which gives best results", 31 | ) 32 | parser.add_argument( 33 | "--show-mask-heatmaps", 34 | dest="show_mask_heatmaps", 35 | help="Show a heatmap probability for the top masks-per-dim masks", 36 | action="store_true", 37 | ) 38 | parser.add_argument( 39 | "--masks-per-dim", 40 | type=int, 41 | default=2, 42 | help="Number of heatmaps per dimension to show", 43 | ) 44 | parser.add_argument( 45 | "opts", 46 | help="Modify model config options using the command-line", 47 | default=None, 48 | nargs=argparse.REMAINDER, 49 | ) 50 | 51 | args = parser.parse_args() 52 | 53 | # load config from file and command-line arguments 54 | cfg.merge_from_file(args.config_file) 55 | cfg.merge_from_list(args.opts) 56 | cfg.freeze() 57 | 58 | # prepare object that handles inference plus adds predictions on top of image 59 | coco_demo = COCODemo( 60 | cfg, 61 | confidence_threshold=args.confidence_threshold, 62 | show_mask_heatmaps=args.show_mask_heatmaps, 63 | masks_per_dim=args.masks_per_dim, 64 | min_image_size=args.min_image_size, 65 | ) 66 | 67 | cam = cv2.VideoCapture(0) 68 | while True: 69 | start_time = time.time() 70 | ret_val, img = cam.read() 71 | composite = coco_demo.run_on_opencv_image(img) 72 | print("Time: {:.2f} s / img".format(time.time() - start_time)) 73 | cv2.imshow("COCO detections", composite) 74 | if cv2.waitKey(1) == 27: 75 | break # esc to quit 76 | cv2.destroyAllWindows() 77 | 78 | 79 | if __name__ == "__main__": 80 | main() 81 | -------------------------------------------------------------------------------- /docker/Dockerfile: -------------------------------------------------------------------------------- 1 | ARG CUDA="9.0" 2 | ARG CUDNN="7" 3 | 4 | FROM nvidia/cuda:${CUDA}-cudnn${CUDNN}-devel-ubuntu16.04 5 | 6 | RUN echo 'debconf debconf/frontend select Noninteractive' | debconf-set-selections 7 | 8 | # install basics 9 | RUN apt-get update -y \ 10 | && apt-get install -y apt-utils git curl ca-certificates bzip2 cmake tree htop bmon iotop g++ \ 11 | && apt-get install -y libglib2.0-0 libsm6 libxext6 libxrender-dev 12 | 13 | # Install Miniconda 14 | RUN curl -so /miniconda.sh https://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh \ 15 | && chmod +x /miniconda.sh \ 16 | && /miniconda.sh -b -p /miniconda \ 17 | && rm /miniconda.sh 18 | 19 | ENV PATH=/miniconda/bin:$PATH 20 | 21 | # Create a Python 3.6 environment 22 | RUN /miniconda/bin/conda install -y conda-build \ 23 | && /miniconda/bin/conda create -y --name py36 python=3.6.7 \ 24 | && /miniconda/bin/conda clean -ya 25 | 26 | ENV CONDA_DEFAULT_ENV=py36 27 | ENV CONDA_PREFIX=/miniconda/envs/$CONDA_DEFAULT_ENV 28 | ENV PATH=$CONDA_PREFIX/bin:$PATH 29 | ENV CONDA_AUTO_UPDATE_CONDA=false 30 | 31 | RUN conda install -y ipython 32 | RUN pip install requests ninja yacs cython matplotlib opencv-python tqdm 33 | 34 | # Install PyTorch 1.0 Nightly 35 | ARG CUDA 36 | RUN conda install pytorch-nightly cudatoolkit=${CUDA} -c pytorch \ 37 | && conda clean -ya 38 | 39 | # Install TorchVision master 40 | RUN git clone https://github.com/pytorch/vision.git \ 41 | && cd vision \ 42 | && python setup.py install 43 | 44 | # install pycocotools 45 | RUN git clone https://github.com/cocodataset/cocoapi.git \ 46 | && cd cocoapi/PythonAPI \ 47 | && python setup.py build_ext install 48 | 49 | # install apex 50 | RUN git clone https://github.com/NVIDIA/apex.git \ 51 | && cd apex \ 52 | && python setup.py install --cuda_ext --cpp_ext 53 | 54 | # install PyTorch Detection 55 | ARG FORCE_CUDA="1" 56 | ENV 
FORCE_CUDA=${FORCE_CUDA} 57 | RUN git clone https://github.com/facebookresearch/maskrcnn-benchmark.git \ 58 | && cd maskrcnn-benchmark \ 59 | && python setup.py build develop 60 | 61 | WORKDIR /maskrcnn-benchmark 62 | -------------------------------------------------------------------------------- /docker/docker-jupyter/Dockerfile: -------------------------------------------------------------------------------- 1 | ARG CUDA="9.0" 2 | ARG CUDNN="7" 3 | 4 | FROM nvidia/cuda:${CUDA}-cudnn${CUDNN}-devel-ubuntu16.04 5 | 6 | RUN echo 'debconf debconf/frontend select Noninteractive' | debconf-set-selections 7 | 8 | # install basics 9 | RUN apt-get update -y \ 10 | && apt-get install -y apt-utils git curl ca-certificates bzip2 cmake tree htop bmon iotop g++ 11 | 12 | # Install Miniconda 13 | RUN curl -so /miniconda.sh https://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh \ 14 | && chmod +x /miniconda.sh \ 15 | && /miniconda.sh -b -p /miniconda \ 16 | && rm /miniconda.sh 17 | 18 | ENV PATH=/miniconda/bin:$PATH 19 | 20 | # Create a Python 3.6 environment 21 | RUN /miniconda/bin/conda install -y conda-build \ 22 | && /miniconda/bin/conda create -y --name py36 python=3.6.7 \ 23 | && /miniconda/bin/conda clean -ya 24 | 25 | ENV CONDA_DEFAULT_ENV=py36 26 | ENV CONDA_PREFIX=/miniconda/envs/$CONDA_DEFAULT_ENV 27 | ENV PATH=$CONDA_PREFIX/bin:$PATH 28 | ENV CONDA_AUTO_UPDATE_CONDA=false 29 | 30 | RUN conda install -y ipython 31 | RUN pip install requests ninja yacs cython matplotlib jupyter 32 | 33 | # Install PyTorch 1.0 Nightly and OpenCV 34 | RUN conda install -y pytorch-nightly -c pytorch \ 35 | && conda install -y opencv -c menpo \ 36 | && conda clean -ya 37 | 38 | WORKDIR /root 39 | 40 | USER root 41 | 42 | RUN mkdir /notebooks 43 | 44 | WORKDIR /notebooks 45 | 46 | # Install TorchVision master 47 | RUN git clone https://github.com/pytorch/vision.git \ 48 | && cd vision \ 49 | && python setup.py install 50 | 51 | # install pycocotools 52 | RUN git clone https://github.com/cocodataset/cocoapi.git \ 53 | && cd cocoapi/PythonAPI \ 54 | && python setup.py build_ext install 55 | 56 | # install PyTorch Detection 57 | RUN git clone https://github.com/facebookresearch/maskrcnn-benchmark.git \ 58 | && cd maskrcnn-benchmark \ 59 | && python setup.py build develop 60 | 61 | RUN jupyter notebook --generate-config 62 | 63 | ENV CONFIG_PATH="/root/.jupyter/jupyter_notebook_config.py" 64 | 65 | COPY "jupyter_notebook_config.py" ${CONFIG_PATH} 66 | 67 | ENTRYPOINT ["sh", "-c", "jupyter notebook --allow-root -y --no-browser --ip=0.0.0.0 --config=${CONFIG_PATH}"] 68 | -------------------------------------------------------------------------------- /docker/docker-jupyter/jupyter_notebook_config.py: -------------------------------------------------------------------------------- 1 | import os 2 | from IPython.lib import passwd 3 | 4 | # c = c # pylint:disable=undefined-variable 5 | c = get_config() 6 | c.NotebookApp.ip = '0.0.0.0' 7 | c.NotebookApp.port = int(os.getenv('PORT', 8888)) 8 | c.NotebookApp.open_browser = False 9 | 10 | # sets a password if PASSWORD is set in the environment 11 | if 'PASSWORD' in os.environ: 12 | password = os.environ['PASSWORD'] 13 | if password: 14 | c.NotebookApp.password = passwd(password) 15 | else: 16 | c.NotebookApp.password = '' 17 | c.NotebookApp.token = '' 18 | del os.environ['PASSWORD'] 19 | -------------------------------------------------------------------------------- /pysgg/__init__.py: 
-------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | -------------------------------------------------------------------------------- /pysgg/config/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from .defaults import _C as cfg 3 | -------------------------------------------------------------------------------- /pysgg/csrc/ROIAlign.h: -------------------------------------------------------------------------------- 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | #pragma once 3 | 4 | #include "cpu/vision.h" 5 | 6 | #ifdef WITH_CUDA 7 | #include "cuda/vision.h" 8 | #endif 9 | 10 | // Interface for Python 11 | at::Tensor ROIAlign_forward(const at::Tensor& input, 12 | const at::Tensor& rois, 13 | const float spatial_scale, 14 | const int pooled_height, 15 | const int pooled_width, 16 | const int sampling_ratio) { 17 | if (input.type().is_cuda()) { 18 | #ifdef WITH_CUDA 19 | return ROIAlign_forward_cuda(input, rois, spatial_scale, pooled_height, pooled_width, sampling_ratio); 20 | #else 21 | AT_ERROR("Not compiled with GPU support"); 22 | #endif 23 | } 24 | return ROIAlign_forward_cpu(input, rois, spatial_scale, pooled_height, pooled_width, sampling_ratio); 25 | } 26 | 27 | at::Tensor ROIAlign_backward(const at::Tensor& grad, 28 | const at::Tensor& rois, 29 | const float spatial_scale, 30 | const int pooled_height, 31 | const int pooled_width, 32 | const int batch_size, 33 | const int channels, 34 | const int height, 35 | const int width, 36 | const int sampling_ratio) { 37 | if (grad.type().is_cuda()) { 38 | #ifdef WITH_CUDA 39 | return ROIAlign_backward_cuda(grad, rois, spatial_scale, pooled_height, pooled_width, batch_size, channels, height, width, sampling_ratio); 40 | #else 41 | AT_ERROR("Not compiled with GPU support"); 42 | #endif 43 | } 44 | AT_ERROR("Not implemented on the CPU"); 45 | } 46 | 47 | -------------------------------------------------------------------------------- /pysgg/csrc/ROIPool.h: -------------------------------------------------------------------------------- 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 
2 | #pragma once 3 | 4 | #include "cpu/vision.h" 5 | 6 | #ifdef WITH_CUDA 7 | #include "cuda/vision.h" 8 | #endif 9 | 10 | 11 | std::tuple<at::Tensor, at::Tensor> ROIPool_forward(const at::Tensor& input, 12 | const at::Tensor& rois, 13 | const float spatial_scale, 14 | const int pooled_height, 15 | const int pooled_width) { 16 | if (input.type().is_cuda()) { 17 | #ifdef WITH_CUDA 18 | return ROIPool_forward_cuda(input, rois, spatial_scale, pooled_height, pooled_width); 19 | #else 20 | AT_ERROR("Not compiled with GPU support"); 21 | #endif 22 | } 23 | AT_ERROR("Not implemented on the CPU"); 24 | } 25 | 26 | at::Tensor ROIPool_backward(const at::Tensor& grad, 27 | const at::Tensor& input, 28 | const at::Tensor& rois, 29 | const at::Tensor& argmax, 30 | const float spatial_scale, 31 | const int pooled_height, 32 | const int pooled_width, 33 | const int batch_size, 34 | const int channels, 35 | const int height, 36 | const int width) { 37 | if (grad.type().is_cuda()) { 38 | #ifdef WITH_CUDA 39 | return ROIPool_backward_cuda(grad, input, rois, argmax, spatial_scale, pooled_height, pooled_width, batch_size, channels, height, width); 40 | #else 41 | AT_ERROR("Not compiled with GPU support"); 42 | #endif 43 | } 44 | AT_ERROR("Not implemented on the CPU"); 45 | } 46 | 47 | 48 | 49 | -------------------------------------------------------------------------------- /pysgg/csrc/SigmoidFocalLoss.h: -------------------------------------------------------------------------------- 1 | #pragma once 2 | 3 | #include "cpu/vision.h" 4 | 5 | #ifdef WITH_CUDA 6 | #include "cuda/vision.h" 7 | #endif 8 | 9 | // Interface for Python 10 | at::Tensor SigmoidFocalLoss_forward( 11 | const at::Tensor& logits, 12 | const at::Tensor& targets, 13 | const int num_classes, 14 | const float gamma, 15 | const float alpha) { 16 | if (logits.type().is_cuda()) { 17 | #ifdef WITH_CUDA 18 | return SigmoidFocalLoss_forward_cuda(logits, targets, num_classes, gamma, alpha); 19 | #else 20 | AT_ERROR("Not compiled with GPU support"); 21 | #endif 22 | } 23 | AT_ERROR("Not implemented on the CPU"); 24 | } 25 | 26 | at::Tensor SigmoidFocalLoss_backward( 27 | const at::Tensor& logits, 28 | const at::Tensor& targets, 29 | const at::Tensor& d_losses, 30 | const int num_classes, 31 | const float gamma, 32 | const float alpha) { 33 | if (logits.type().is_cuda()) { 34 | #ifdef WITH_CUDA 35 | return SigmoidFocalLoss_backward_cuda(logits, targets, d_losses, num_classes, gamma, alpha); 36 | #else 37 | AT_ERROR("Not compiled with GPU support"); 38 | #endif 39 | } 40 | AT_ERROR("Not implemented on the CPU"); 41 | } 42 | -------------------------------------------------------------------------------- /pysgg/csrc/cpu/vision.h: -------------------------------------------------------------------------------- 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | #pragma once 3 | #include <torch/extension.h> 4 | 5 | 6 | at::Tensor ROIAlign_forward_cpu(const at::Tensor& input, 7 | const at::Tensor& rois, 8 | const float spatial_scale, 9 | const int pooled_height, 10 | const int pooled_width, 11 | const int sampling_ratio); 12 | 13 | 14 | at::Tensor nms_cpu(const at::Tensor& dets, 15 | const at::Tensor& scores, 16 | const float threshold); 17 | -------------------------------------------------------------------------------- /pysgg/csrc/deform_pool.h: -------------------------------------------------------------------------------- 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | #pragma once 3 | #include "cpu/vision.h" 4 | 5 | #ifdef WITH_CUDA 6 | #include "cuda/vision.h" 7 | #endif 8 | 9 | 10 | // Interface for Python 11 | void deform_psroi_pooling_forward( 12 | at::Tensor input, 13 | at::Tensor bbox, 14 | at::Tensor trans, 15 | at::Tensor out, 16 | at::Tensor top_count, 17 | const int no_trans, 18 | const float spatial_scale, 19 | const int output_dim, 20 | const int group_size, 21 | const int pooled_size, 22 | const int part_size, 23 | const int sample_per_part, 24 | const float trans_std) 25 | { 26 | if (input.type().is_cuda()) { 27 | #ifdef WITH_CUDA 28 | return deform_psroi_pooling_cuda_forward( 29 | input, bbox, trans, out, top_count, 30 | no_trans, spatial_scale, output_dim, group_size, 31 | pooled_size, part_size, sample_per_part, trans_std 32 | ); 33 | #else 34 | AT_ERROR("Not compiled with GPU support"); 35 | #endif 36 | } 37 | AT_ERROR("Not implemented on the CPU"); 38 | } 39 | 40 | 41 | void deform_psroi_pooling_backward( 42 | at::Tensor out_grad, 43 | at::Tensor input, 44 | at::Tensor bbox, 45 | at::Tensor trans, 46 | at::Tensor top_count, 47 | at::Tensor input_grad, 48 | at::Tensor trans_grad, 49 | const int no_trans, 50 | const float spatial_scale, 51 | const int output_dim, 52 | const int group_size, 53 | const int pooled_size, 54 | const int part_size, 55 | const int sample_per_part, 56 | const float trans_std) 57 | { 58 | if (input.type().is_cuda()) { 59 | #ifdef WITH_CUDA 60 | return deform_psroi_pooling_cuda_backward( 61 | out_grad, input, bbox, trans, top_count, input_grad, trans_grad, 62 | no_trans, spatial_scale, output_dim, group_size, pooled_size, 63 | part_size, sample_per_part, trans_std 64 | ); 65 | #else 66 | AT_ERROR("Not compiled with GPU support"); 67 | #endif 68 | } 69 | AT_ERROR("Not implemented on the CPU"); 70 | } 71 | -------------------------------------------------------------------------------- /pysgg/csrc/nms.h: -------------------------------------------------------------------------------- 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | #pragma once 3 | #include "cpu/vision.h" 4 | 5 | #ifdef WITH_CUDA 6 | #include "cuda/vision.h" 7 | #endif 8 | 9 | 10 | at::Tensor nms(const at::Tensor& dets, 11 | const at::Tensor& scores, 12 | const float threshold) { 13 | 14 | if (dets.type().is_cuda()) { 15 | #ifdef WITH_CUDA 16 | // TODO raise error if not compiled with CUDA 17 | if (dets.numel() == 0) 18 | return at::empty({0}, dets.options().dtype(at::kLong).device(at::kCPU)); 19 | auto b = at::cat({dets, scores.unsqueeze(1)}, 1); 20 | return nms_cuda(b, threshold); 21 | #else 22 | AT_ERROR("Not compiled with GPU support"); 23 | #endif 24 | } 25 | 26 | at::Tensor result = nms_cpu(dets, scores, threshold); 27 | return result; 28 | } 29 | -------------------------------------------------------------------------------- /pysgg/csrc/vision.cpp: -------------------------------------------------------------------------------- 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 
2 | #include "nms.h" 3 | #include "ROIAlign.h" 4 | #include "ROIPool.h" 5 | #include "SigmoidFocalLoss.h" 6 | #include "deform_conv.h" 7 | #include "deform_pool.h" 8 | 9 | PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) { 10 | m.def("nms", &nms, "non-maximum suppression"); 11 | m.def("roi_align_forward", &ROIAlign_forward, "ROIAlign_forward"); 12 | m.def("roi_align_backward", &ROIAlign_backward, "ROIAlign_backward"); 13 | m.def("roi_pool_forward", &ROIPool_forward, "ROIPool_forward"); 14 | m.def("roi_pool_backward", &ROIPool_backward, "ROIPool_backward"); 15 | m.def("sigmoid_focalloss_forward", &SigmoidFocalLoss_forward, "SigmoidFocalLoss_forward"); 16 | m.def("sigmoid_focalloss_backward", &SigmoidFocalLoss_backward, "SigmoidFocalLoss_backward"); 17 | // dcn-v2 18 | m.def("deform_conv_forward", &deform_conv_forward, "deform_conv_forward"); 19 | m.def("deform_conv_backward_input", &deform_conv_backward_input, "deform_conv_backward_input"); 20 | m.def("deform_conv_backward_parameters", &deform_conv_backward_parameters, "deform_conv_backward_parameters"); 21 | m.def("modulated_deform_conv_forward", &modulated_deform_conv_forward, "modulated_deform_conv_forward"); 22 | m.def("modulated_deform_conv_backward", &modulated_deform_conv_backward, "modulated_deform_conv_backward"); 23 | m.def("deform_psroi_pooling_forward", &deform_psroi_pooling_forward, "deform_psroi_pooling_forward"); 24 | m.def("deform_psroi_pooling_backward", &deform_psroi_pooling_backward, "deform_psroi_pooling_backward"); 25 | } -------------------------------------------------------------------------------- /pysgg/data/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from .build import make_data_loader, get_dataset_statistics 3 | -------------------------------------------------------------------------------- /pysgg/data/collate_batch.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from pysgg.structures.image_list import to_image_list 3 | 4 | 5 | class BatchCollator(object): 6 | """ 7 | From a list of samples from the dataset, 8 | returns the batched images and targets. 9 | This should be passed to the DataLoader 10 | """ 11 | 12 | def __init__(self, size_divisible=0): 13 | self.size_divisible = size_divisible 14 | 15 | def __call__(self, batch): 16 | transposed_batch = list(zip(*batch)) 17 | images = to_image_list(transposed_batch[0], self.size_divisible) 18 | targets = transposed_batch[1] 19 | img_ids = transposed_batch[2] 20 | return images, targets, img_ids 21 | 22 | 23 | class BBoxAugCollator(object): 24 | """ 25 | From a list of samples from the dataset, 26 | returns the images and targets. 27 | Images should be converted to batched images in `im_detect_bbox_aug` 28 | """ 29 | 30 | def __call__(self, batch): 31 | return list(zip(*batch)) 32 | 33 | -------------------------------------------------------------------------------- /pysgg/data/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 
2 | from .coco import COCODataset 3 | from .voc import PascalVOCDataset 4 | from .concat_dataset import ConcatDataset 5 | from .visual_genome import VGDataset 6 | from .open_image import OIDataset 7 | 8 | __all__ = ["COCODataset", "ConcatDataset", "PascalVOCDataset", "VGDataset", "OIDataset"] 9 | -------------------------------------------------------------------------------- /pysgg/data/datasets/concat_dataset.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | import bisect 3 | 4 | from torch.utils.data.dataset import ConcatDataset as _ConcatDataset 5 | 6 | 7 | class ConcatDataset(_ConcatDataset): 8 | """ 9 | Same as torch.utils.data.dataset.ConcatDataset, but exposes an extra 10 | method for querying the sizes of the images 11 | """ 12 | 13 | def get_idxs(self, idx): 14 | dataset_idx = bisect.bisect_right(self.cumulative_sizes, idx) 15 | if dataset_idx == 0: 16 | sample_idx = idx 17 | else: 18 | sample_idx = idx - self.cumulative_sizes[dataset_idx - 1] 19 | return dataset_idx, sample_idx 20 | 21 | def get_img_info(self, idx): 22 | dataset_idx, sample_idx = self.get_idxs(idx) 23 | return self.datasets[dataset_idx].get_img_info(sample_idx) 24 | -------------------------------------------------------------------------------- /pysgg/data/datasets/evaluation/__init__.py: -------------------------------------------------------------------------------- 1 | from pysgg.data import datasets 2 | 3 | from .coco import coco_evaluation 4 | from .oi import oi_evaluation 5 | from .voc import voc_evaluation 6 | from .vg import vg_evaluation 7 | 8 | 9 | def evaluate(cfg, dataset, predictions, output_folder, logger, **kwargs): 10 | """Evaluate a dataset, choosing the evaluation method based on the dataset type. 11 | Args: 12 | dataset: Dataset object 13 | predictions(list[BoxList]): each item in the list represents the 14 | prediction results for one image. 15 | output_folder: output folder, to save evaluation files or results. 16 | **kwargs: other args.
17 | Returns: 18 | evaluation result 19 | """ 20 | args = dict( 21 | cfg=cfg, dataset=dataset, predictions=predictions, output_folder=output_folder, logger=logger, **kwargs 22 | ) 23 | if isinstance(dataset, datasets.COCODataset): 24 | return coco_evaluation(**args) 25 | elif isinstance(dataset, datasets.PascalVOCDataset): 26 | return voc_evaluation(**args) 27 | elif isinstance(dataset, datasets.VGDataset): 28 | return vg_evaluation(**args) 29 | elif isinstance(dataset, datasets.OIDataset): 30 | return oi_evaluation(**args) 31 | else: 32 | dataset_name = dataset.__class__.__name__ 33 | raise NotImplementedError("Unsupported dataset type {}.".format(dataset_name)) 34 | -------------------------------------------------------------------------------- /pysgg/data/datasets/evaluation/coco/__init__.py: -------------------------------------------------------------------------------- 1 | from .coco_eval import do_coco_evaluation 2 | 3 | 4 | def coco_evaluation( 5 | cfg, 6 | dataset, 7 | predictions, 8 | output_folder, 9 | logger, 10 | box_only, 11 | iou_types, 12 | expected_results, 13 | expected_results_sigma_tol, 14 | ): 15 | return do_coco_evaluation( 16 | dataset=dataset, 17 | predictions=predictions, 18 | box_only=box_only, 19 | output_folder=output_folder, 20 | logger=logger, 21 | iou_types=iou_types, 22 | expected_results=expected_results, 23 | expected_results_sigma_tol=expected_results_sigma_tol, 24 | ) 25 | -------------------------------------------------------------------------------- /pysgg/data/datasets/evaluation/vg/__init__.py: -------------------------------------------------------------------------------- 1 | from .vg_eval import do_vg_evaluation 2 | 3 | 4 | def vg_evaluation( 5 | cfg, 6 | dataset, 7 | predictions, 8 | output_folder, 9 | logger, 10 | iou_types, 11 | **_ 12 | ): 13 | return do_vg_evaluation( 14 | cfg=cfg, 15 | dataset=dataset, 16 | predictions=predictions, 17 | output_folder=output_folder, 18 | logger=logger, 19 | iou_types=iou_types, 20 | ) 21 | -------------------------------------------------------------------------------- /pysgg/data/datasets/evaluation/vg/zeroshot_triplet.pytorch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/pysgg/data/datasets/evaluation/vg/zeroshot_triplet.pytorch -------------------------------------------------------------------------------- /pysgg/data/datasets/evaluation/voc/__init__.py: -------------------------------------------------------------------------------- 1 | import logging 2 | 3 | from .voc_eval import do_voc_evaluation 4 | 5 | 6 | def voc_evaluation(cfg, dataset, predictions, output_folder, logger, box_only, **_): 7 | if box_only: 8 | logger.warning("voc evaluation doesn't support box_only, ignored.") 9 | logger.info("performing voc evaluation, ignored iou_types.") 10 | return do_voc_evaluation( 11 | dataset=dataset, 12 | predictions=predictions, 13 | output_folder=output_folder, 14 | logger=logger, 15 | ) 16 | -------------------------------------------------------------------------------- /pysgg/data/datasets/list_dataset.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 
2 | """ 3 | Simple dataset class that wraps a list of path names 4 | """ 5 | 6 | from PIL import Image 7 | 8 | from pysgg.structures.bounding_box import BoxList 9 | 10 | 11 | class ListDataset(object): 12 | def __init__(self, image_lists, transforms=None): 13 | self.image_lists = image_lists 14 | self.transforms = transforms 15 | 16 | def __getitem__(self, item): 17 | img = Image.open(self.image_lists[item]).convert("RGB") 18 | 19 | # dummy target 20 | w, h = img.size 21 | target = BoxList([[0, 0, w, h]], img.size, mode="xyxy") 22 | 23 | if self.transforms is not None: 24 | img, target = self.transforms(img, target) 25 | 26 | return img, target 27 | 28 | def __len__(self): 29 | return len(self.image_lists) 30 | 31 | def get_img_info(self, item): 32 | """ 33 | Return the image dimensions for the image, without 34 | loading and pre-processing it 35 | """ 36 | pass 37 | -------------------------------------------------------------------------------- /pysgg/data/samplers/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from .distributed import DistributedSampler 3 | from .grouped_batch_sampler import GroupedBatchSampler 4 | from .iteration_based_batch_sampler import IterationBasedBatchSampler 5 | 6 | __all__ = ["DistributedSampler", "GroupedBatchSampler", "IterationBasedBatchSampler"] 7 | -------------------------------------------------------------------------------- /pysgg/data/samplers/iteration_based_batch_sampler.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from torch.utils.data.sampler import BatchSampler 3 | 4 | 5 | class IterationBasedBatchSampler(BatchSampler): 6 | """ 7 | Wraps a BatchSampler, resampling from it until 8 | a specified number of iterations have been sampled 9 | """ 10 | 11 | def __init__(self, batch_sampler, num_iterations, start_iter=0): 12 | self.batch_sampler = batch_sampler 13 | self.num_iterations = num_iterations 14 | self.start_iter = start_iter 15 | 16 | def __iter__(self): 17 | iteration = self.start_iter 18 | while iteration <= self.num_iterations: 19 | # if the underlying sampler has a set_epoch method, like 20 | # DistributedSampler, used for making each process see 21 | # a different split of the dataset, then set it 22 | if hasattr(self.batch_sampler.sampler, "set_epoch"): 23 | self.batch_sampler.sampler.set_epoch(iteration) 24 | for batch in self.batch_sampler: 25 | iteration += 1 26 | if iteration > self.num_iterations: 27 | break 28 | yield batch 29 | 30 | def __len__(self): 31 | return self.num_iterations 32 | -------------------------------------------------------------------------------- /pysgg/data/transforms/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from .transforms import Compose 3 | from .transforms import Resize 4 | from .transforms import RandomHorizontalFlip 5 | from .transforms import ToTensor 6 | from .transforms import Normalize 7 | 8 | from .build import build_transforms 9 | -------------------------------------------------------------------------------- /pysgg/data/transforms/build.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from . 
import transforms as T 3 | 4 | 5 | def build_transforms(cfg, is_train=True): 6 | if is_train: 7 | min_size = cfg.INPUT.MIN_SIZE_TRAIN 8 | max_size = cfg.INPUT.MAX_SIZE_TRAIN 9 | flip_horizontal_prob = 0.5 # cfg.INPUT.FLIP_PROB_TRAIN 10 | flip_vertical_prob = cfg.INPUT.VERTICAL_FLIP_PROB_TRAIN 11 | brightness = cfg.INPUT.BRIGHTNESS 12 | contrast = cfg.INPUT.CONTRAST 13 | saturation = cfg.INPUT.SATURATION 14 | hue = cfg.INPUT.HUE 15 | else: 16 | min_size = cfg.INPUT.MIN_SIZE_TEST 17 | max_size = cfg.INPUT.MAX_SIZE_TEST 18 | flip_horizontal_prob = 0.0 19 | flip_vertical_prob = 0.0 20 | brightness = 0.0 21 | contrast = 0.0 22 | saturation = 0.0 23 | hue = 0.0 24 | 25 | to_bgr255 = cfg.INPUT.TO_BGR255 26 | normalize_transform = T.Normalize( 27 | mean=cfg.INPUT.PIXEL_MEAN, std=cfg.INPUT.PIXEL_STD, to_bgr255=to_bgr255 28 | ) 29 | color_jitter = T.ColorJitter( 30 | brightness=brightness, 31 | contrast=contrast, 32 | saturation=saturation, 33 | hue=hue, 34 | ) 35 | 36 | transform = T.Compose( 37 | [ 38 | color_jitter, 39 | T.Resize(min_size, max_size), 40 | T.RandomHorizontalFlip(flip_horizontal_prob), 41 | T.RandomVerticalFlip(flip_vertical_prob), 42 | T.ToTensor(), 43 | normalize_transform, 44 | ] 45 | ) 46 | return transform 47 | -------------------------------------------------------------------------------- /pysgg/engine/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | -------------------------------------------------------------------------------- /pysgg/engine/trainer.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | import torch 3 | import torch.distributed as dist 4 | 5 | from pysgg.utils.comm import get_world_size 6 | 7 | 8 | def reduce_loss_dict(loss_dict): 9 | """ 10 | Reduce the loss dictionary from all processes so that process with rank 11 | 0 has the averaged results. Returns a dict with the same fields as 12 | loss_dict, after reduction. 13 | """ 14 | world_size = get_world_size() 15 | if world_size < 2: 16 | return loss_dict 17 | with torch.no_grad(): 18 | loss_names = [] 19 | all_losses = [] 20 | for k in sorted(loss_dict.keys()): 21 | loss_names.append(k) 22 | all_losses.append(loss_dict[k]) 23 | all_losses = torch.stack(all_losses, dim=0) 24 | dist.reduce(all_losses, dst=0) 25 | if dist.get_rank() == 0: 26 | # only main process gets accumulated, so only divide by 27 | # world_size in this case 28 | all_losses /= world_size 29 | reduced_losses = {k: v for k, v in zip(loss_names, all_losses)} 30 | return reduced_losses 31 | -------------------------------------------------------------------------------- /pysgg/image_retrieval/S2G-RETRIEVAL.md: -------------------------------------------------------------------------------- 1 | # Sentence-to-Graph Retrieval (S2G) 2 | 3 | Forgive me, this part of the code is ugly and less organized than the rest.
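The "sentence graphs" used throughout this pipeline are textual scene graphs parsed from image captions. As a quick illustration of their shape, here is a sketch using the documented `sng_parser` API of [SceneGraphParser](https://github.com/vacancy/SceneGraphParser); the caption is an arbitrary example, and the exact parse may vary with the parser version:

```python
# pip install SceneGraphParser, plus the spaCy English model it requires.
import sng_parser

graph = sng_parser.parse("A woman is riding a horse on the beach.")

# The result is a dict with "entities" (noun phrases) and "relations"
# (subject/object indices into the entity list plus a relation phrase).
print([entity["head"] for entity in graph["entities"]])  # e.g. ['woman', 'horse', 'beach']
for rel in graph["relations"]:
    print(graph["entities"][rel["subject"]]["head"],
          rel["relation"],
          graph["entities"][rel["object"]]["head"])      # e.g. woman riding horse
```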
4 | 5 | ## Preprocessing 6 | 7 | Run ```maskrcnn_benchmark/image_retrieval/preprocessing.py``` to process the annotations and checkpoints. ```detected_path``` should be set to the checkpoint you want to use; ```vg_data, vg_dict, vg_info``` should already have been downloaded if you followed DATASET.md; ```cap_graph``` contains the ground-truth captions and the generated sentence graphs (you can download it from [here](https://onedrive.live.com/embed?cid=22376FFAD72C4B64&resid=22376FFAD72C4B64%21779999&authkey=AGW0Wxjb1JSDFnc)). We use [SceneGraphParser](https://github.com/vacancy/SceneGraphParser) to generate these sentence graphs. 8 | 9 | You also need to set the ```cap_graph``` PATH and ```vg_dict``` PATH in ```maskrcnn_benchmark/image_retrieval/dataloader.py``` manually. 10 | 11 | ## Training and Evaluation 12 | 13 | Run ```tools/image_retrieval_main.py``` for both training and evaluation. 14 | 15 | To load the generated scene graphs of the given SGG checkpoints, you need to manually set ```sg_train_path``` and ```sg_test_path``` in ```tools/image_retrieval_main.py```, which means you need to evaluate your model on **both the training and testing sets** to get the generated crude scene graphs. Our evaluation code automatically saves the crude scene graphs into ```checkpoints/MODEL_NAME/inference/VG_stanford_filtered_with_attribute_test/``` or ```checkpoints/MODEL_NAME/inference/VG_stanford_filtered_with_attribute_train/```, which are then further processed into the input of ```sg_train_path``` and ```sg_test_path``` by the preprocessing code ```maskrcnn_benchmark/image_retrieval/preprocessing.py```. 16 | 17 | ## Results 18 | 19 | Sentence-to-Graph Retrieval (S2G) results are given in the paper [Unbiased Scene Graph Generation from Biased Training](https://arxiv.org/abs/2002.11949): 20 | 21 | ![alt text](../../demo/TDE_Results3.png "from 'Unbiased Scene Graph Generation from Biased Training'") 22 | -------------------------------------------------------------------------------- /pysgg/image_retrieval/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
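The retrieval evaluation in the next file scores sentence-to-graph retrieval with a rank-based Recall@K: it builds a text-to-image similarity matrix whose diagonal holds each caption's true match, counts how many wrong images score strictly higher than that match, and checks whether the resulting rank is below K. A tiny self-contained sketch of the same computation, with illustrative numbers only:

```python
import torch

# 3 caption embeddings x 3 image embeddings -> similarity matrix;
# row i's ground-truth image is column i (the diagonal).
similarity = torch.tensor([[0.9, 0.2, 0.4],
                           [0.8, 0.5, 0.3],
                           [0.1, 0.7, 0.6]])

# For each caption, count images scoring higher than the true match.
pred_rank = (similarity > similarity.diag().view(-1, 1)).sum(-1)  # tensor([0, 1, 1])

for k in (1, 5):
    recall = float((pred_rank < k).sum()) / similarity.size(0)
    print(f"Recall @ {k}: {recall:.4f}")  # 0.3333 at k=1, 1.0000 at k=5
```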
2 | -------------------------------------------------------------------------------- /pysgg/image_retrieval/evaluation.py: -------------------------------------------------------------------------------- 1 | from pysgg.utils.env import setup_environment # noqa F401 isort:skip 2 | 3 | import argparse 4 | import os 5 | import time 6 | import datetime 7 | import json 8 | import random 9 | 10 | import torch 11 | import torch.nn as nn 12 | import torch.nn.functional as F 13 | from torch.nn.utils import clip_grad_norm_ 14 | import torch.utils.data as data 15 | from torch.nn.utils import weight_norm 16 | from tqdm import tqdm 17 | 18 | from pysgg.config import cfg 19 | from pysgg.data import make_data_loader 20 | from pysgg.solver import make_lr_scheduler 21 | from pysgg.solver import make_optimizer 22 | from pysgg.engine.trainer import reduce_loss_dict 23 | from pysgg.engine.inference import inference 24 | from pysgg.modeling.detector import build_detection_model 25 | from pysgg.utils.checkpoint import DetectronCheckpointer 26 | from pysgg.utils.checkpoint import clip_grad_norm 27 | from pysgg.utils.collect_env import collect_env_info 28 | from pysgg.utils.comm import synchronize, get_rank, all_gather 29 | from pysgg.utils.imports import import_file 30 | from pysgg.utils.miscellaneous import mkdir, save_config 31 | from pysgg.utils.metric_logger import MetricLogger 32 | 33 | def evaluator(logger, input_lists): 34 | cat_data = [] 35 | for item in input_lists: 36 | cat_data.append(item[0]) 37 | # shape [num_image, 2, hidden_dim] 38 | cat_data = torch.cat(cat_data, dim=0).squeeze(2) 39 | 40 | similarity = cat_data[:, 0, :] @ (cat_data[:, 1, :].transpose(0,1)) # img to txt 41 | similarity = similarity.transpose(0,1) # txt to img 42 | 43 | pred_rank = (similarity > similarity.diag().view(-1, 1)).sum(-1) 44 | 45 | num_sample = pred_rank.shape[0] 46 | thres = [1, 5, 10, 20, 50, 100] 47 | for k in thres: 48 | logger.info('Recall @ %d: %.4f; ' % (k, float((pred_rank < k).sum()) / num_sample)) 49 | -------------------------------------------------------------------------------- /pysgg/layers/sigmoid_focal_loss.py: -------------------------------------------------------------------------------- 1 | import torch 2 | from torch import nn 3 | from torch.autograd import Function 4 | from torch.autograd.function import once_differentiable 5 | 6 | from pysgg import _C 7 | 8 | 9 | 10 | # TODO: Use JIT to replace CUDA implementation in the future. 11 | class _SigmoidFocalLoss(Function): 12 | @staticmethod 13 | def forward(ctx, logits, targets, gamma, alpha): 14 | ctx.save_for_backward(logits, targets) 15 | num_classes = logits.shape[1] 16 | ctx.num_classes = num_classes 17 | ctx.gamma = gamma 18 | ctx.alpha = alpha 19 | 20 | losses = _C.sigmoid_focalloss_forward( 21 | logits, targets, num_classes, gamma, alpha 22 | ) 23 | return losses 24 | 25 | @staticmethod 26 | @once_differentiable 27 | def backward(ctx, d_loss): 28 | logits, targets = ctx.saved_tensors 29 | num_classes = ctx.num_classes 30 | gamma = ctx.gamma 31 | alpha = ctx.alpha 32 | d_loss = d_loss.contiguous() 33 | d_logits = _C.sigmoid_focalloss_backward( 34 | logits, targets, d_loss, num_classes, gamma, alpha 35 | ) 36 | return d_logits, None, None, None, None 37 | 38 | 39 | sigmoid_focal_loss_cuda = _SigmoidFocalLoss.apply 40 | 41 | 42 | def sigmoid_focal_loss_cpu(logits, targets, gamma, alpha): 43 | num_classes = logits.shape[1] 44 | dtype = targets.dtype 45 | device = targets.device 46 | class_range = torch.arange(1, num_classes + 1, dtype=dtype, device=device).unsqueeze(0) 47 | 48 | t = targets.unsqueeze(1) 49 | p = torch.sigmoid(logits) 50 | term1 = (1 - p) ** gamma * torch.log(p) 51 | term2 = p ** gamma * torch.log(1 - p) 52 | return -(t == class_range).float() * term1 * alpha - ((t != class_range) * (t >= 0)).float() * term2 * (1 - alpha) 53 | 54 | 55 | class SigmoidFocalLoss(nn.Module): 56 | def __init__(self, gamma, alpha): 57 | super(SigmoidFocalLoss, self).__init__() 58 | self.gamma = gamma 59 | self.alpha = alpha 60 | 61 | def forward(self, logits, targets): 62 | device = logits.device 63 | if logits.is_cuda: 64 | loss_func = sigmoid_focal_loss_cuda 65 | else: 66 | loss_func = sigmoid_focal_loss_cpu 67 | 68 | loss = loss_func(logits, targets, self.gamma, self.alpha) 69 | return loss.sum() 70 | 71 | def __repr__(self): 72 | tmpstr = self.__class__.__name__ + "(" 73 | tmpstr += "gamma=" + str(self.gamma) 74 | tmpstr += ", alpha=" + str(self.alpha) 75 | tmpstr += ")" 76 | return tmpstr 77 | -------------------------------------------------------------------------------- /pysgg/layers/smooth_l1_loss.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | import torch 3 | 4 | 5 | # TODO maybe push this to nn? 6 | def smooth_l1_loss(input, target, beta=1.
/ 9, size_average=True): 7 | """ 8 | very similar to the smooth_l1_loss from pytorch, but with 9 | the extra beta parameter 10 | """ 11 | n = torch.abs(input - target) 12 | cond = n < beta 13 | loss = torch.where(cond, 0.5 * n ** 2 / beta, n - 0.5 * beta) 14 | if size_average: 15 | return loss.mean() 16 | return loss.sum() 17 | 18 | 19 | -------------------------------------------------------------------------------- /pysgg/modeling/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/pysgg/modeling/__init__.py -------------------------------------------------------------------------------- /pysgg/modeling/backbone/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from .backbone import build_backbone 3 | from . import fbnet 4 | -------------------------------------------------------------------------------- /pysgg/modeling/backbone/vgg.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | """ 3 | Variant of the resnet module that takes cfg as an argument. 4 | Example usage. Strings may be specified in the config file. 5 | model = ResNet( 6 | "StemWithFixedBatchNorm", 7 | "BottleneckWithFixedBatchNorm", 8 | "ResNet50StagesTo4", 9 | ) 10 | OR: 11 | model = ResNet( 12 | "StemWithGN", 13 | "BottleneckWithGN", 14 | "ResNet50StagesTo4", 15 | ) 16 | Custom implementations may be written in user code and hooked in via the 17 | `register_*` functions. 18 | """ 19 | from collections import namedtuple 20 | 21 | import torch 22 | import torch.nn.functional as F 23 | from torch import nn 24 | 25 | import torchvision.models as models 26 | from pysgg.layers import FrozenBatchNorm2d 27 | from pysgg.layers import Conv2d 28 | from pysgg.layers import DFConv2d 29 | from pysgg.modeling.make_layers import group_norm 30 | from pysgg.utils.registry import Registry 31 | 32 | 33 | class VGG16(nn.Module): 34 | def __init__(self, cfg): 35 | super(VGG16, self).__init__() 36 | vgg = models.vgg16(pretrained=True) 37 | self.conv_body = nn.Sequential(*list(vgg.features._modules.values())[:-1]) 38 | 39 | def forward(self, x): 40 | output = [] 41 | output.append(self.conv_body(x)) 42 | return output 43 | 44 | -------------------------------------------------------------------------------- /pysgg/modeling/detector/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from .detectors import build_detection_model 3 | -------------------------------------------------------------------------------- /pysgg/modeling/detector/detectors.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 
2 | from .generalized_rcnn import GeneralizedRCNN 3 | 4 | 5 | _DETECTION_META_ARCHITECTURES = {"GeneralizedRCNN": GeneralizedRCNN} 6 | 7 | 8 | def build_detection_model(cfg): 9 | meta_arch = _DETECTION_META_ARCHITECTURES[cfg.MODEL.META_ARCHITECTURE] 10 | return meta_arch(cfg) 11 | -------------------------------------------------------------------------------- /pysgg/modeling/detector/generalized_rcnn.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | """ 3 | Implements the Generalized R-CNN framework 4 | """ 5 | 6 | import torch 7 | from torch import nn 8 | 9 | from pysgg.structures.image_list import to_image_list 10 | 11 | from ..backbone import build_backbone 12 | from ..rpn.rpn import build_rpn 13 | from ..roi_heads.roi_heads import build_roi_heads 14 | 15 | 16 | class GeneralizedRCNN(nn.Module): 17 | """ 18 | Main class for Generalized R-CNN. Currently supports boxes and masks. 19 | It consists of three main parts: 20 | - backbone 21 | - rpn 22 | - heads: takes the features + the proposals from the RPN and computes 23 | detections / masks from it. 24 | """ 25 | 26 | def __init__(self, cfg): 27 | super(GeneralizedRCNN, self).__init__() 28 | self.cfg = cfg.clone() 29 | self.backbone = build_backbone(cfg) 30 | self.rpn = build_rpn(cfg, self.backbone.out_channels) 31 | self.roi_heads = build_roi_heads(cfg, self.backbone.out_channels) 32 | 33 | def forward(self, images, targets=None, logger=None): 34 | """ 35 | Arguments: 36 | images (list[Tensor] or ImageList): images to be processed 37 | targets (list[BoxList]): ground-truth boxes present in the image (optional) 38 | 39 | Returns: 40 | result (list[BoxList] or dict[Tensor]): the output from the model. 41 | During training, it returns a dict[Tensor] which contains the losses. 42 | During testing, it returns a list[BoxList] that contains additional fields 43 | like `scores`, `labels` and `mask` (for Mask R-CNN models). 44 | 45 | """ 46 | if self.training and targets is None: 47 | raise ValueError("In training mode, targets should be passed") 48 | images = to_image_list(images) 49 | features = self.backbone(images.tensors) 50 | proposals, proposal_losses = self.rpn(images, features, targets) 51 | if self.roi_heads: 52 | x, result, detector_losses = self.roi_heads(features, proposals, targets, logger) 53 | else: 54 | # RPN-only models don't have roi_heads 55 | x = features 56 | result = proposals 57 | detector_losses = {} 58 | 59 | if self.training: 60 | losses = {} 61 | losses.update(detector_losses) 62 | if not self.cfg.MODEL.RELATION_ON: 63 | # During the relationship training stage, the rpn_head should be fixed and contribute no loss. 64 | losses.update(proposal_losses) 65 | return losses 66 | 67 | return result 68 | -------------------------------------------------------------------------------- /pysgg/modeling/registry.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | 3 | from pysgg.utils.registry import Registry 4 | 5 | BACKBONES = Registry() 6 | RPN_HEADS = Registry() 7 | ROI_BOX_FEATURE_EXTRACTORS = Registry() 8 | ROI_BOX_PREDICTOR = Registry() 9 | ROI_ATTRIBUTE_FEATURE_EXTRACTORS = Registry() 10 | ROI_ATTRIBUTE_PREDICTOR = Registry() 11 | ROI_KEYPOINT_FEATURE_EXTRACTORS = Registry() 12 | ROI_KEYPOINT_PREDICTOR = Registry() 13 | ROI_MASK_FEATURE_EXTRACTORS = Registry() 14 | ROI_MASK_PREDICTOR = Registry() 15 | ROI_RELATION_FEATURE_EXTRACTORS = Registry() 16 | ROI_RELATION_PREDICTOR = Registry() 17 | RELATION_CONFIDENCE_AWARE_MODULES = Registry() 18 | -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/pysgg/modeling/roi_heads/__init__.py -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/attribute_head/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/pysgg/modeling/roi_heads/attribute_head/__init__.py -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/attribute_head/roi_attribute_predictors.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from torch import nn 3 | 4 | from pysgg.modeling import registry 5 | 6 | 7 | @registry.ROI_ATTRIBUTE_PREDICTOR.register("FastRCNNPredictor") 8 | class FastRCNNPredictor(nn.Module): 9 | def __init__(self, cfg, in_channels): 10 | super(FastRCNNPredictor, self).__init__() 11 | assert in_channels is not None 12 | num_inputs = in_channels 13 | 14 | num_attributes = cfg.MODEL.ROI_ATTRIBUTE_HEAD.NUM_ATTRIBUTES 15 | self.avgpool = nn.AdaptiveAvgPool2d(1) 16 | self.att_score = nn.Linear(num_inputs, num_attributes) 17 | 18 | nn.init.normal_(self.att_score.weight, mean=0, std=0.01) 19 | nn.init.constant_(self.att_score.bias, 0) 20 | 21 | def forward(self, x): 22 | x = self.avgpool(x) 23 | x = x.view(x.size(0), -1) 24 | att_logit = self.att_score(x) 25 | 26 | return att_logit 27 | 28 | 29 | @registry.ROI_ATTRIBUTE_PREDICTOR.register("FPNPredictor") 30 | class FPNPredictor(nn.Module): 31 | def __init__(self, cfg, in_channels): 32 | super(FPNPredictor, self).__init__() 33 | num_attributes = cfg.MODEL.ROI_ATTRIBUTE_HEAD.NUM_ATTRIBUTES 34 | representation_size = in_channels 35 | 36 | self.att_score = nn.Linear(representation_size, num_attributes) 37 | 38 | nn.init.normal_(self.att_score.weight, std=0.01) 39 | nn.init.constant_(self.att_score.bias, 0) 40 | 41 | def forward(self, x): 42 | if x.ndimension() == 4: 43 | assert list(x.shape[2:]) == [1, 1] 44 | x = x.view(x.size(0), -1) 45 | 46 | att_logit = self.att_score(x) 47 | 48 | return att_logit 49 | 50 | 51 | def make_roi_attribute_predictor(cfg, in_channels): 52 | func = registry.ROI_ATTRIBUTE_PREDICTOR[cfg.MODEL.ROI_ATTRIBUTE_HEAD.PREDICTOR] 53 | return func(cfg, in_channels) 54 | -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/box_head/__init__.py: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/pysgg/modeling/roi_heads/box_head/__init__.py -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/box_head/roi_box_predictors.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from torch import nn 3 | 4 | from pysgg.modeling import registry 5 | 6 | 7 | @registry.ROI_BOX_PREDICTOR.register("FastRCNNPredictor") 8 | class FastRCNNPredictor(nn.Module): 9 | def __init__(self, config, in_channels): 10 | super(FastRCNNPredictor, self).__init__() 11 | assert in_channels is not None 12 | num_inputs = in_channels 13 | 14 | num_classes = config.MODEL.ROI_BOX_HEAD.NUM_CLASSES 15 | self.avgpool = nn.AdaptiveAvgPool2d(1) 16 | self.cls_score = nn.Linear(num_inputs, num_classes) 17 | num_bbox_reg_classes = 2 if config.MODEL.CLS_AGNOSTIC_BBOX_REG else num_classes 18 | self.bbox_pred = nn.Linear(num_inputs, num_bbox_reg_classes * 4) 19 | 20 | nn.init.normal_(self.cls_score.weight, mean=0, std=0.01) 21 | nn.init.constant_(self.cls_score.bias, 0) 22 | 23 | nn.init.normal_(self.bbox_pred.weight, mean=0, std=0.001) 24 | nn.init.constant_(self.bbox_pred.bias, 0) 25 | 26 | def forward(self, x): 27 | x = self.avgpool(x) 28 | x = x.view(x.size(0), -1) 29 | cls_logit = self.cls_score(x) 30 | bbox_pred = self.bbox_pred(x) 31 | return cls_logit, bbox_pred 32 | 33 | 34 | @registry.ROI_BOX_PREDICTOR.register("FPNPredictor") 35 | class FPNPredictor(nn.Module): 36 | def __init__(self, cfg, in_channels): 37 | super(FPNPredictor, self).__init__() 38 | num_classes = cfg.MODEL.ROI_BOX_HEAD.NUM_CLASSES 39 | representation_size = in_channels 40 | 41 | self.cls_score = nn.Linear(representation_size, num_classes) 42 | num_bbox_reg_classes = 2 if cfg.MODEL.CLS_AGNOSTIC_BBOX_REG else num_classes 43 | self.bbox_pred = nn.Linear(representation_size, num_bbox_reg_classes * 4) 44 | 45 | nn.init.normal_(self.cls_score.weight, std=0.01) 46 | nn.init.normal_(self.bbox_pred.weight, std=0.001) 47 | for l in [self.cls_score, self.bbox_pred]: 48 | nn.init.constant_(l.bias, 0) 49 | 50 | def forward(self, x): 51 | if x.ndimension() == 4: 52 | assert list(x.shape[2:]) == [1, 1] 53 | x = x.view(x.size(0), -1) 54 | cls_logit = self.cls_score(x) 55 | bbox_pred = self.bbox_pred(x) 56 | 57 | return cls_logit, bbox_pred 58 | 59 | 60 | def make_roi_box_predictor(cfg, in_channels): 61 | func = registry.ROI_BOX_PREDICTOR[cfg.MODEL.ROI_BOX_HEAD.PREDICTOR] 62 | return func(cfg, in_channels) 63 | -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/keypoint_head/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/pysgg/modeling/roi_heads/keypoint_head/__init__.py -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/keypoint_head/keypoint_head.py: -------------------------------------------------------------------------------- 1 | import torch 2 | 3 | from .roi_keypoint_feature_extractors import make_roi_keypoint_feature_extractor 4 | from .roi_keypoint_predictors import make_roi_keypoint_predictor 5 | from .inference import make_roi_keypoint_post_processor 6 | from .loss import make_roi_keypoint_loss_evaluator 7 | 8 | 9 | class ROIKeypointHead(torch.nn.Module): 10 | 
def __init__(self, cfg, in_channels): 11 | super(ROIKeypointHead, self).__init__() 12 | self.cfg = cfg.clone() 13 | self.feature_extractor = make_roi_keypoint_feature_extractor(cfg, in_channels) 14 | self.predictor = make_roi_keypoint_predictor( 15 | cfg, self.feature_extractor.out_channels) 16 | self.post_processor = make_roi_keypoint_post_processor(cfg) 17 | self.loss_evaluator = make_roi_keypoint_loss_evaluator(cfg) 18 | 19 | def forward(self, features, proposals, targets=None): 20 | """ 21 | Arguments: 22 | features (list[Tensor]): feature-maps from possibly several levels 23 | proposals (list[BoxList]): proposal boxes 24 | targets (list[BoxList], optional): the ground-truth targets. 25 | 26 | Returns: 27 | x (Tensor): the result of the feature extractor 28 | proposals (list[BoxList]): during training, the original proposals 29 | are returned. During testing, the predicted boxlists are returned 30 | with the `keypoints` field set 31 | losses (dict[Tensor]): During training, returns the losses for the 32 | head. During testing, returns an empty dict. 33 | """ 34 | if self.training: 35 | with torch.no_grad(): 36 | proposals = self.loss_evaluator.subsample(proposals, targets) 37 | 38 | x = self.feature_extractor(features, proposals) 39 | kp_logits = self.predictor(x) 40 | 41 | if not self.training: 42 | result = self.post_processor(kp_logits, proposals) 43 | return x, result, {} 44 | 45 | loss_kp = self.loss_evaluator(proposals, kp_logits) 46 | 47 | return x, proposals, dict(loss_kp=loss_kp) 48 | 49 | 50 | def build_roi_keypoint_head(cfg, in_channels): 51 | return ROIKeypointHead(cfg, in_channels) 52 | -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/keypoint_head/roi_keypoint_feature_extractors.py: -------------------------------------------------------------------------------- 1 | from torch import nn 2 | from torch.nn import functional as F 3 | 4 | from pysgg.modeling import registry 5 | from pysgg.modeling.poolers import Pooler 6 | 7 | from pysgg.layers import Conv2d 8 | 9 | 10 | @registry.ROI_KEYPOINT_FEATURE_EXTRACTORS.register("KeypointRCNNFeatureExtractor") 11 | class KeypointRCNNFeatureExtractor(nn.Module): 12 | def __init__(self, cfg, in_channels): 13 | super(KeypointRCNNFeatureExtractor, self).__init__() 14 | 15 | resolution = cfg.MODEL.ROI_KEYPOINT_HEAD.POOLER_RESOLUTION 16 | scales = cfg.MODEL.ROI_KEYPOINT_HEAD.POOLER_SCALES 17 | sampling_ratio = cfg.MODEL.ROI_KEYPOINT_HEAD.POOLER_SAMPLING_RATIO 18 | pooler = Pooler( 19 | output_size=(resolution, resolution), 20 | scales=scales, 21 | sampling_ratio=sampling_ratio, 22 | ) 23 | self.pooler = pooler 24 | 25 | input_features = in_channels 26 | layers = cfg.MODEL.ROI_KEYPOINT_HEAD.CONV_LAYERS 27 | next_feature = input_features 28 | self.blocks = [] 29 | for layer_idx, layer_features in enumerate(layers, 1): 30 | layer_name = "conv_fcn{}".format(layer_idx) 31 | module = Conv2d(next_feature, layer_features, 3, stride=1, padding=1) 32 | nn.init.kaiming_normal_(module.weight, mode="fan_out", nonlinearity="relu") 33 | nn.init.constant_(module.bias, 0) 34 | self.add_module(layer_name, module) 35 | next_feature = layer_features 36 | self.blocks.append(layer_name) 37 | self.out_channels = layer_features 38 | 39 | def forward(self, x, proposals): 40 | x = self.pooler(x, proposals) 41 | for layer_name in self.blocks: 42 | x = F.relu(getattr(self, layer_name)(x)) 43 | return x 44 | 45 | 46 | def make_roi_keypoint_feature_extractor(cfg, in_channels): 47 | func =
registry.ROI_KEYPOINT_FEATURE_EXTRACTORS[ 48 | cfg.MODEL.ROI_KEYPOINT_HEAD.FEATURE_EXTRACTOR 49 | ] 50 | return func(cfg, in_channels) 51 | -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/keypoint_head/roi_keypoint_predictors.py: -------------------------------------------------------------------------------- 1 | from torch import nn 2 | 3 | from pysgg import layers 4 | from pysgg.modeling import registry 5 | 6 | 7 | @registry.ROI_KEYPOINT_PREDICTOR.register("KeypointRCNNPredictor") 8 | class KeypointRCNNPredictor(nn.Module): 9 | def __init__(self, cfg, in_channels): 10 | super(KeypointRCNNPredictor, self).__init__() 11 | input_features = in_channels 12 | num_keypoints = cfg.MODEL.ROI_KEYPOINT_HEAD.NUM_CLASSES 13 | deconv_kernel = 4 14 | self.kps_score_lowres = layers.ConvTranspose2d( 15 | input_features, 16 | num_keypoints, 17 | deconv_kernel, 18 | stride=2, 19 | padding=deconv_kernel // 2 - 1, 20 | ) 21 | nn.init.kaiming_normal_( 22 | self.kps_score_lowres.weight, mode="fan_out", nonlinearity="relu" 23 | ) 24 | nn.init.constant_(self.kps_score_lowres.bias, 0) 25 | self.up_scale = 2 26 | self.out_channels = num_keypoints 27 | 28 | def forward(self, x): 29 | x = self.kps_score_lowres(x) 30 | x = layers.interpolate( 31 | x, scale_factor=self.up_scale, mode="bilinear", align_corners=False 32 | ) 33 | return x 34 | 35 | 36 | def make_roi_keypoint_predictor(cfg, in_channels): 37 | func = registry.ROI_KEYPOINT_PREDICTOR[cfg.MODEL.ROI_KEYPOINT_HEAD.PREDICTOR] 38 | return func(cfg, in_channels) 39 | -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/mask_head/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/pysgg/modeling/roi_heads/mask_head/__init__.py -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/mask_head/roi_mask_predictors.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 
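A quick shape sanity check for `KeypointRCNNPredictor` above (a sketch with assumed sizes: 512 input channels and 17 COCO keypoints): the stride-2 deconv with padding `4 // 2 - 1 = 1` doubles the spatial resolution, and the bilinear interpolation doubles it again, so a 14x14 pooled RoI yields 56x56 keypoint logits.

import torch
import torch.nn.functional as F

# deconv output: (14 - 1) * 2 - 2 * 1 + 4 = 28; interpolate x2: 28 -> 56
deconv = torch.nn.ConvTranspose2d(512, 17, 4, stride=2, padding=1)
x = torch.rand(2, 512, 14, 14)
y = F.interpolate(deconv(x), scale_factor=2, mode="bilinear", align_corners=False)
assert y.shape == (2, 17, 56, 56)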
2 | from torch import nn 3 | from torch.nn import functional as F 4 | 5 | from pysgg.layers import Conv2d 6 | from pysgg.layers import ConvTranspose2d 7 | from pysgg.modeling import registry 8 | 9 | 10 | @registry.ROI_MASK_PREDICTOR.register("MaskRCNNC4Predictor") 11 | class MaskRCNNC4Predictor(nn.Module): 12 | def __init__(self, cfg, in_channels): 13 | super(MaskRCNNC4Predictor, self).__init__() 14 | num_classes = cfg.MODEL.ROI_BOX_HEAD.NUM_CLASSES 15 | dim_reduced = cfg.MODEL.ROI_MASK_HEAD.CONV_LAYERS[-1] 16 | num_inputs = in_channels 17 | 18 | self.conv5_mask = ConvTranspose2d(num_inputs, dim_reduced, 2, 2, 0) 19 | self.mask_fcn_logits = Conv2d(dim_reduced, num_classes, 1, 1, 0) 20 | 21 | for name, param in self.named_parameters(): 22 | if "bias" in name: 23 | nn.init.constant_(param, 0) 24 | elif "weight" in name: 25 | # Caffe2 implementation uses MSRAFill, which in fact 26 | # corresponds to kaiming_normal_ in PyTorch 27 | nn.init.kaiming_normal_(param, mode="fan_out", nonlinearity="relu") 28 | 29 | def forward(self, x): 30 | x = F.relu(self.conv5_mask(x)) 31 | return self.mask_fcn_logits(x) 32 | 33 | 34 | @registry.ROI_MASK_PREDICTOR.register("MaskRCNNConv1x1Predictor") 35 | class MaskRCNNConv1x1Predictor(nn.Module): 36 | def __init__(self, cfg, in_channels): 37 | super(MaskRCNNConv1x1Predictor, self).__init__() 38 | num_classes = cfg.MODEL.ROI_BOX_HEAD.NUM_CLASSES 39 | num_inputs = in_channels 40 | 41 | self.mask_fcn_logits = Conv2d(num_inputs, num_classes, 1, 1, 0) 42 | 43 | for name, param in self.named_parameters(): 44 | if "bias" in name: 45 | nn.init.constant_(param, 0) 46 | elif "weight" in name: 47 | # Caffe2 implementation uses MSRAFill, which in fact 48 | # corresponds to kaiming_normal_ in PyTorch 49 | nn.init.kaiming_normal_(param, mode="fan_out", nonlinearity="relu") 50 | 51 | def forward(self, x): 52 | return self.mask_fcn_logits(x) 53 | 54 | 55 | def make_roi_mask_predictor(cfg, in_channels): 56 | func = registry.ROI_MASK_PREDICTOR[cfg.MODEL.ROI_MASK_HEAD.PREDICTOR] 57 | return func(cfg, in_channels) 58 | -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/relation_head/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/pysgg/modeling/roi_heads/relation_head/__init__.py -------------------------------------------------------------------------------- /pysgg/modeling/roi_heads/relation_head/rel_proposal_network/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/pysgg/modeling/roi_heads/relation_head/rel_proposal_network/__init__.py -------------------------------------------------------------------------------- /pysgg/modeling/rpn/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 
2 | # from .rpn import build_rpn 3 | -------------------------------------------------------------------------------- /pysgg/modeling/rpn/retinanet/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/pysgg/modeling/rpn/retinanet/__init__.py -------------------------------------------------------------------------------- /pysgg/modeling/rpn/utils.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | """ 3 | Utility functions for manipulating the prediction layers 4 | """ 5 | 6 | from ..utils import cat 7 | 8 | import torch 9 | 10 | def permute_and_flatten(layer, N, A, C, H, W): 11 | layer = layer.view(N, -1, C, H, W) 12 | layer = layer.permute(0, 3, 4, 1, 2) 13 | layer = layer.reshape(N, -1, C) 14 | return layer 15 | 16 | 17 | def concat_box_prediction_layers(box_cls, box_regression): 18 | box_cls_flattened = [] 19 | box_regression_flattened = [] 20 | # for each feature level, permute the outputs so that they are in the 21 | # same format as the labels. Note that the labels are computed for 22 | # all feature levels concatenated, so we keep the same representation 23 | # for the objectness and the box_regression 24 | for box_cls_per_level, box_regression_per_level in zip( 25 | box_cls, box_regression 26 | ): 27 | N, AxC, H, W = box_cls_per_level.shape 28 | Ax4 = box_regression_per_level.shape[1] 29 | A = Ax4 // 4 30 | C = AxC // A 31 | box_cls_per_level = permute_and_flatten( 32 | box_cls_per_level, N, A, C, H, W 33 | ) 34 | box_cls_flattened.append(box_cls_per_level) 35 | 36 | box_regression_per_level = permute_and_flatten( 37 | box_regression_per_level, N, A, 4, H, W 38 | ) 39 | box_regression_flattened.append(box_regression_per_level) 40 | # concatenate on the first dimension (representing the feature levels), to 41 | # take into account the way the labels were generated (with all feature maps 42 | # being concatenated as well) 43 | box_cls = cat(box_cls_flattened, dim=1).reshape(-1, C) 44 | box_regression = cat(box_regression_flattened, dim=1).reshape(-1, 4) 45 | return box_cls, box_regression 46 | -------------------------------------------------------------------------------- /pysgg/modeling/utils.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | """ 3 | Miscellaneous utility functions 4 | """ 5 | 6 | import torch 7 | 8 | 9 | def cat(tensors, dim=0): 10 | """ 11 | Efficient version of torch.cat that avoids a copy if there is only a single element in a list 12 | """ 13 | assert isinstance(tensors, (list, tuple)) 14 | if len(tensors) == 1: 15 | return tensors[0] 16 | return torch.cat(tensors, dim) 17 | -------------------------------------------------------------------------------- /pysgg/solver/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from .build import make_optimizer 3 | from .build import make_lr_scheduler 4 | from .lr_scheduler import WarmupMultiStepLR, WarmupReduceLROnPlateau 5 | 6 | -------------------------------------------------------------------------------- /pysgg/solver/build.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc.
and its affiliates. All Rights Reserved. 2 | import torch 3 | 4 | from .lr_scheduler import WarmupMultiStepLR, WarmupReduceLROnPlateau 5 | 6 | 7 | def make_optimizer(cfg, model, logger, slow_heads=None, except_weight_decay=None, slow_ratio=5.0, rl_factor=1.0): 8 | params = [] 9 | for key, value in model.named_parameters(): 10 | if not value.requires_grad: 11 | continue 12 | lr = cfg.SOLVER.BASE_LR 13 | weight_decay = cfg.SOLVER.WEIGHT_DECAY 14 | if "bias" in key: 15 | lr = cfg.SOLVER.BASE_LR * cfg.SOLVER.BIAS_LR_FACTOR 16 | weight_decay = cfg.SOLVER.WEIGHT_DECAY_BIAS 17 | 18 | if except_weight_decay is not None: 19 | for item in except_weight_decay: 20 | if item in key: 21 | weight_decay = 0.0 22 | logger.info("NO WEIGHT DECAY: {}.".format(key)) 23 | 24 | if slow_heads is not None: 25 | for item in slow_heads: 26 | if item in key: 27 | logger.info("SLOW HEADS: {} is slowed down by a ratio of {}.".format(key, str(slow_ratio))) 28 | lr = lr / slow_ratio 29 | break 30 | params += [{"params": [value], "lr": lr * rl_factor, "weight_decay": weight_decay}] 31 | 32 | optimizer = torch.optim.SGD(params, lr=cfg.SOLVER.BASE_LR, momentum=cfg.SOLVER.MOMENTUM) 33 | return optimizer 34 | 35 | 36 | def make_lr_scheduler(cfg, optimizer, logger=None): 37 | if cfg.SOLVER.SCHEDULE.TYPE == "WarmupMultiStepLR": 38 | return WarmupMultiStepLR( 39 | optimizer, 40 | cfg.SOLVER.STEPS, 41 | cfg.SOLVER.GAMMA, 42 | warmup_factor=cfg.SOLVER.WARMUP_FACTOR, 43 | warmup_iters=cfg.SOLVER.WARMUP_ITERS, 44 | warmup_method=cfg.SOLVER.WARMUP_METHOD, 45 | ) 46 | 47 | elif cfg.SOLVER.SCHEDULE.TYPE == "WarmupReduceLROnPlateau": 48 | return WarmupReduceLROnPlateau( 49 | optimizer, 50 | cfg.SOLVER.SCHEDULE.FACTOR, 51 | warmup_factor=cfg.SOLVER.WARMUP_FACTOR, 52 | warmup_iters=cfg.SOLVER.WARMUP_ITERS, 53 | warmup_method=cfg.SOLVER.WARMUP_METHOD, 54 | patience=cfg.SOLVER.SCHEDULE.PATIENCE, 55 | threshold=cfg.SOLVER.SCHEDULE.THRESHOLD, 56 | cooldown=cfg.SOLVER.SCHEDULE.COOLDOWN, 57 | logger=logger, 58 | ) 59 | 60 | else: 61 | raise ValueError("Invalid Schedule Type") 62 | -------------------------------------------------------------------------------- /pysgg/structures/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/pysgg/structures/__init__.py -------------------------------------------------------------------------------- /pysgg/utils/README.md: -------------------------------------------------------------------------------- 1 | # Utility functions 2 | 3 | This folder contains utility functions that are not used in the 4 | core library, but are useful for building models or training 5 | code using the config system. 6 | -------------------------------------------------------------------------------- /pysgg/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SHTUPLUS/PySGG/a63942a076932b3756a477cf8919c3b74cd36207/pysgg/utils/__init__.py -------------------------------------------------------------------------------- /pysgg/utils/collect_env.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
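A hedged sketch of how `make_optimizer` and `make_lr_scheduler` above are typically combined (the substrings passed for `slow_heads` and `except_weight_decay` here are hypothetical; real callers pass prefixes that match their model's `named_parameters()` keys):

optimizer = make_optimizer(
    cfg, model, logger,
    slow_heads=["roi_heads.relation"],   # hypothetical prefix: matching params train at lr / slow_ratio
    except_weight_decay=["bn"],          # hypothetical substring: matching params get weight_decay = 0
    slow_ratio=5.0,
    rl_factor=1.0,
)
scheduler = make_lr_scheduler(cfg, optimizer, logger)  # WarmupMultiStepLR or WarmupReduceLROnPlateau, per cfg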
2 | import PIL 3 | 4 | from torch.utils.collect_env import get_pretty_env_info 5 | 6 | 7 | def get_pil_version(): 8 | return "\n        Pillow ({})".format(PIL.__version__) 9 | 10 | 11 | def collect_env_info(): 12 | env_str = get_pretty_env_info() 13 | env_str += get_pil_version() 14 | return env_str 15 | -------------------------------------------------------------------------------- /pysgg/utils/cv2_util.py: -------------------------------------------------------------------------------- 1 | """ 2 | Module for cv2 utility functions and maintaining version compatibility 3 | between 3.x and 4.x 4 | """ 5 | import cv2 6 | 7 | 8 | def findContours(*args, **kwargs): 9 | """ 10 | Wraps cv2.findContours to maintain compatibility between versions 11 | 3 and 4 12 | 13 | Returns: 14 | contours, hierarchy 15 | """ 16 | if cv2.__version__.startswith('4'): 17 | contours, hierarchy = cv2.findContours(*args, **kwargs) 18 | elif cv2.__version__.startswith('3'): 19 | _, contours, hierarchy = cv2.findContours(*args, **kwargs) 20 | else: 21 | raise AssertionError( 22 | 'cv2 must be either version 3 or 4 to call this method') 23 | 24 | return contours, hierarchy 25 | -------------------------------------------------------------------------------- /pysgg/utils/env.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | import os 3 | 4 | from pysgg.utils.imports import import_file 5 | 6 | 7 | def setup_environment(): 8 | """Perform environment setup work. The default setup is a no-op, but this 9 | function allows the user to specify a Python source file that performs 10 | custom setup work that may be necessary to their computing environment. 11 | """ 12 | custom_module_path = os.environ.get("TORCH_DETECTRON_ENV_MODULE") 13 | if custom_module_path: 14 | setup_custom_environment(custom_module_path) 15 | else: 16 | # The default setup is a no-op 17 | pass 18 | 19 | 20 | def setup_custom_environment(custom_module_path): 21 | """Load custom environment setup from a Python source file and run the setup 22 | function. 23 | """ 24 | module = import_file("pysgg.utils.env.custom_module", custom_module_path) 25 | assert hasattr(module, "setup_environment") and callable( 26 | module.setup_environment 27 | ), ( 28 | "Custom environment module defined in {} does not have the " 29 | "required callable attribute 'setup_environment'."
30 | ).format( 31 | custom_module_path 32 | ) 33 | module.setup_environment() 34 | 35 | 36 | # Force environment setup when this module is imported 37 | setup_environment() 38 | -------------------------------------------------------------------------------- /pysgg/utils/global_buffer.py: -------------------------------------------------------------------------------- 1 | from collections import defaultdict 2 | import pickle 3 | import torch 4 | import os 5 | 6 | from pysgg.utils.comm import is_main_process, get_world_size, all_gather, synchronize 7 | from pysgg.config import cfg 8 | 9 | def singleton(cls): 10 | _instance = {} 11 | 12 | def inner(): 13 | if cls not in _instance: 14 | _instance[cls] = cls() 15 | return _instance[cls] 16 | return inner 17 | 18 | 19 | @singleton 20 | class _GlobalBuffer(): 21 | """A singleton buffer for storing data from anywhere in the program. 22 | """ 23 | def __init__(self): 24 | self.multi_proc = (get_world_size() > 1) 25 | self.data = defaultdict(list) 26 | 27 | def add_data(self, key, val): 28 | if not isinstance(val, torch.Tensor): 29 | val = torch.Tensor(val) 30 | else: 31 | val = val.detach() 32 | 33 | val = torch.cat(all_gather(val)) 34 | 35 | if not is_main_process(): 36 | del val 37 | return 38 | self.data[key].append(val.cpu().numpy()) 39 | 40 | def __str__(self): 41 | ret_str = f"Buffer contains data: (key, value type)\n" 42 | for k, v in self.data.items(): 43 | ret_str += f"    {k}, {type(v).__name__}\n" 44 | ret_str += f"id {id(self)}" 45 | return ret_str 46 | 47 | 48 | def store_data(k, v): 49 | if cfg.GLOBAL_BUFFER_ON: 50 | buffer = _GlobalBuffer() 51 | buffer.add_data(k, v) 52 | synchronize() 53 | 54 | 55 | def save_buffer(output_dir): 56 | if cfg.GLOBAL_BUFFER_ON: 57 | if is_main_process(): 58 | buffer = _GlobalBuffer() 59 | with open(os.path.join(output_dir, "inter_data_buffer.pkl"), 'wb') as f: 60 | pickle.dump(buffer.data, f) 61 | 62 | print("save buffer:", str(buffer)) 63 | -------------------------------------------------------------------------------- /pysgg/utils/imports.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | import torch 3 | 4 | if torch._six.PY3: 5 | import importlib 6 | import importlib.util 7 | import sys 8 | 9 | 10 | # from https://stackoverflow.com/questions/67631/how-to-import-a-module-given-the-full-path?utm_medium=organic&utm_source=google_rich_qa&utm_campaign=google_rich_qa 11 | def import_file(module_name, file_path, make_importable=False): 12 | spec = importlib.util.spec_from_file_location(module_name, file_path) 13 | module = importlib.util.module_from_spec(spec) 14 | spec.loader.exec_module(module) 15 | if make_importable: 16 | sys.modules[module_name] = module 17 | return module 18 | else: 19 | import imp 20 | 21 | def import_file(module_name, file_path, make_importable=None): 22 | module = imp.load_source(module_name, file_path) 23 | return module 24 | -------------------------------------------------------------------------------- /pysgg/utils/metric_logger.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | from collections import defaultdict 3 | from collections import deque 4 | 5 | import torch 6 | 7 | 8 | class SmoothedValue(object): 9 | """Track a series of values and provide access to smoothed values over a 10 | window or the global series average.
11 | """ 12 | 13 | def __init__(self, window_size=20): 14 | self.deque = deque(maxlen=window_size) 15 | self.series = [] 16 | self.total = 0.0 17 | self.count = 0 18 | 19 | def update(self, value): 20 | self.deque.append(value) 21 | self.series.append(value) 22 | self.count += 1 23 | self.total += value 24 | 25 | @property 26 | def median(self): 27 | d = torch.tensor(list(self.deque)) 28 | return d.median().item() 29 | 30 | @property 31 | def avg(self): 32 | d = torch.tensor(list(self.deque)) 33 | return d.mean().item() 34 | 35 | @property 36 | def global_avg(self): 37 | return self.total / self.count 38 | 39 | 40 | class MetricLogger(object): 41 | def __init__(self, delimiter="\t"): 42 | self.meters = defaultdict(SmoothedValue) 43 | self.delimiter = delimiter 44 | 45 | def update(self, **kwargs): 46 | for k, v in kwargs.items(): 47 | if isinstance(v, torch.Tensor): 48 | v = v.item() 49 | assert isinstance(v, (float, int)) 50 | self.meters[k].update(v) 51 | 52 | def __getattr__(self, attr): 53 | if attr in self.meters: 54 | return self.meters[attr] 55 | if attr in self.__dict__: 56 | return self.__dict__[attr] 57 | raise AttributeError("'{}' object has no attribute '{}'".format( 58 | type(self).__name__, attr)) 59 | 60 | def __str__(self): 61 | loss_str = [] 62 | for name, meter in self.meters.items(): 63 | loss_str.append( 64 | "{}: {:.4f} ({:.4f})\n".format(name, meter.median, meter.global_avg) 65 | ) 66 | return self.delimiter.join(loss_str) 67 | -------------------------------------------------------------------------------- /pysgg/utils/registry.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | 3 | 4 | def _register_generic(module_dict, module_name, module): 5 | assert module_name not in module_dict 6 | module_dict[module_name] = module 7 | 8 | 9 | class Registry(dict): 10 | ''' 11 | A helper class for managing registering modules, it extends a dictionary 12 | and provides a register functions. 13 | 14 | Eg. creeting a registry: 15 | some_registry = Registry({"default": default_module}) 16 | 17 | There're two ways of registering new modules: 18 | 1): normal way is just calling register function: 19 | def foo(): 20 | ... 21 | some_registry.register("foo_module", foo) 22 | 2): used as decorator when declaring the module: 23 | @some_registry.register("foo_module") 24 | @some_registry.register("foo_modeul_nickname") 25 | def foo(): 26 | ... 27 | 28 | Access of module is just like using a dictionary, eg: 29 | f = some_registry["foo_modeul"] 30 | ''' 31 | def __init__(self, *args, **kwargs): 32 | super(Registry, self).__init__(*args, **kwargs) 33 | 34 | def register(self, module_name, module=None): 35 | # used as function call 36 | if module is not None: 37 | _register_generic(self, module_name, module) 38 | return 39 | 40 | # used as decorator 41 | def register_fn(fn): 42 | _register_generic(self, module_name, fn) 43 | return fn 44 | 45 | return register_fn 46 | -------------------------------------------------------------------------------- /pysgg/utils/timer.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 
2 | 3 | 4 | import time 5 | import datetime 6 | 7 | 8 | class Timer(object): 9 | def __init__(self): 10 | self.reset() 11 | 12 | @property 13 | def average_time(self): 14 | return self.total_time / self.calls if self.calls > 0 else 0.0 15 | 16 | def tic(self): 17 | # using time.time instead of time.clock because time.clock 18 | # does not normalize for multithreading 19 | self.start_time = time.time() 20 | 21 | def toc(self, average=True): 22 | self.add(time.time() - self.start_time) 23 | if average: 24 | return self.average_time 25 | else: 26 | return self.diff 27 | 28 | def add(self, time_diff): 29 | self.diff = time_diff 30 | self.total_time += self.diff 31 | self.calls += 1 32 | 33 | def reset(self): 34 | self.total_time = 0.0 35 | self.calls = 0 36 | self.start_time = 0.0 37 | self.diff = 0.0 38 | 39 | def avg_time_str(self): 40 | time_str = str(datetime.timedelta(seconds=self.average_time)) 41 | return time_str 42 | 43 | 44 | def get_time_str(time_diff): 45 | time_str = str(datetime.timedelta(seconds=time_diff)) 46 | return time_str 47 | -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | # This file may be used to create an environment using: 2 | # $ conda create --name <env> --file <this file> 3 | # platform: linux-64 4 | -------------------------------------------------------------------------------- /scripts/rel_test.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | export OMP_NUM_THREADS=1 4 | export gpu_num=4 5 | export CUDA_VISIBLE_DEVICES="0,1,2,3" 6 | 7 | 8 | archive_dir="/group/rongjie/projects/Scene-Graph-Benchmark.pytorch/checkpoints/predcls-BGNNPredictor/(2021-07-16_08)BGNN-3-3-learnable_scaling(resampling)" 9 | 10 | python -m torch.distributed.launch --master_port 10029 --nproc_per_node=$gpu_num \ 11 | tools/relation_test_net.py \ 12 | --config-file "$archive_dir/config.yml"\ 13 | TEST.IMS_PER_BATCH $[$gpu_num] \ 14 | MODEL.WEIGHT "$archive_dir/model_0020000.pth"\ 15 | MODEL.ROI_RELATION_HEAD.EVALUATE_REL_PROPOSAL False \ 16 | DATASETS.TEST "('VG_stanford_filtered_with_attribute_test', )" 17 | 18 | -------------------------------------------------------------------------------- /scripts/rel_train_BGNN_oiv4.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | 4 | export OMP_NUM_THREADS=1 5 | export gpu_num=4 6 | export CUDA_VISIBLE_DEVICES="0,1,2,3" 7 | 8 | 9 | exp_name="(oiv4)BGNN-3-3" 10 | 11 | python -m torch.distributed.launch --master_port 10028 --nproc_per_node=$gpu_num \ 12 | tools/relation_train_net.py \ 13 | --config-file "configs/e2e_relBGNN_oiv4.yaml" \ 14 | EXPERIMENT_NAME "$exp_name" \ 15 | SOLVER.IMS_PER_BATCH $[3*$gpu_num] \ 16 | TEST.IMS_PER_BATCH $[$gpu_num] \ 17 | SOLVER.VAL_PERIOD 2000 \ 18 | SOLVER.CHECKPOINT_PERIOD 2000 19 | 20 | 21 | -------------------------------------------------------------------------------- /scripts/rel_train_BGNN_oiv6.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | 4 | export OMP_NUM_THREADS=1 5 | export gpu_num=4 6 | export CUDA_VISIBLE_DEVICES="0,1,2,3" 7 | 8 | exp_name="(oiv6)BGNN-3-3-learnable_scaling-inst_drop0.9" 9 | 10 | export CUDA_VISIBLE_DEVICES="0,1,2,3" 11 | 12 | python -m torch.distributed.launch --master_port 10028 --nproc_per_node=$gpu_num \ 13 | tools/relation_train_net.py \ 14 | --config-file
"configs/e2e_relBGNN_oiv6.yaml" \ 15 | EXPERIMENT_NAME "$exp_name" \ 16 | SOLVER.IMS_PER_BATCH $[3*$gpu_num] \ 17 | TEST.IMS_PER_BATCH $[$gpu_num] \ 18 | SOLVER.VAL_PERIOD 2000 \ 19 | SOLVER.CHECKPOINT_PERIOD 2000 20 | 21 | 22 | -------------------------------------------------------------------------------- /scripts/rel_train_BGNN_vg.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | export OMP_NUM_THREADS=1 3 | export gpu_num=4 4 | export CUDA_VISIBLE_DEVICES="0,1,2,3" 5 | 6 | exp_name="BGNN-3-3-learnable_scaling" 7 | 8 | 9 | python -m torch.distributed.launch --master_port 10028 --nproc_per_node=$gpu_num \ 10 | tools/relation_train_net.py \ 11 | --config-file "configs/e2e_relBGNN_vg.yaml" \ 12 | EXPERIMENT_NAME "$exp_name" \ 13 | SOLVER.IMS_PER_BATCH $[3*$gpu_num] \ 14 | TEST.IMS_PER_BATCH $[$gpu_num] \ 15 | SOLVER.VAL_PERIOD 2000 \ 16 | SOLVER.CHECKPOINT_PERIOD 2000 17 | 18 | 19 | -------------------------------------------------------------------------------- /scripts/rel_train_BGNN_vg_predcls.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | export OMP_NUM_THREADS=1 3 | export gpu_num=4 4 | export CUDA_VISIBLE_DEVICES="0,1,2,3" 5 | 6 | exp_name="BGNN-3-3-learnable_scaling" 7 | 8 | 9 | python -m torch.distributed.launch --master_port 10028 --nproc_per_node=$gpu_num \ 10 | tools/relation_train_net.py \ 11 | --config-file "configs/e2e_relBGNN_vg.yaml" \ 12 | DEBUG False\ 13 | MODEL.ROI_RELATION_HEAD.USE_GT_BOX True \ 14 | MODEL.ROI_RELATION_HEAD.USE_GT_OBJECT_LABEL True \ 15 | MODEL.ROI_RELATION_HEAD.DATA_RESAMPLING_PARAM.REPEAT_FACTOR 0.13 \ 16 | MODEL.ROI_RELATION_HEAD.DATA_RESAMPLING_PARAM.INSTANCE_DROP_RATE 1.6 \ 17 | EXPERIMENT_NAME "$exp_name" \ 18 | SOLVER.IMS_PER_BATCH $[3*$gpu_num] \ 19 | TEST.IMS_PER_BATCH $[$gpu_num] \ 20 | SOLVER.VAL_PERIOD 2000 \ 21 | MODEL.PRETRAINED_DETECTOR_CKPT checkpoints/detection/pretrained_faster_rcnn/model_final.pth \ 22 | SOLVER.CHECKPOINT_PERIOD 2000 23 | 24 | 25 | -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 
2 | #!/usr/bin/env python 3 | 4 | import glob 5 | import os 6 | 7 | import torch 8 | from setuptools import find_packages 9 | from setuptools import setup 10 | from torch.utils.cpp_extension import CUDA_HOME 11 | from torch.utils.cpp_extension import CppExtension 12 | from torch.utils.cpp_extension import CUDAExtension 13 | 14 | requirements = ["torch", "torchvision"] 15 | 16 | 17 | def get_extensions(): 18 | this_dir = os.path.dirname(os.path.abspath(__file__)) 19 | extensions_dir = os.path.join(this_dir, "pysgg", "csrc") 20 | 21 | main_file = glob.glob(os.path.join(extensions_dir, "*.cpp")) 22 | source_cpu = glob.glob(os.path.join(extensions_dir, "cpu", "*.cpp")) 23 | source_cuda = glob.glob(os.path.join(extensions_dir, "cuda", "*.cu")) 24 | 25 | sources = main_file + source_cpu 26 | extension = CppExtension 27 | 28 | extra_compile_args = {"cxx": []} 29 | define_macros = [] 30 | 31 | if (torch.cuda.is_available() and CUDA_HOME is not None) or os.getenv("FORCE_CUDA", "0") == "1": 32 | extension = CUDAExtension 33 | sources += source_cuda 34 | define_macros += [("WITH_CUDA", None)] 35 | extra_compile_args["nvcc"] = [ 36 | "-DCUDA_HAS_FP16=1", 37 | "-D__CUDA_NO_HALF_OPERATORS__", 38 | "-D__CUDA_NO_HALF_CONVERSIONS__", 39 | "-D__CUDA_NO_HALF2_OPERATORS__", 40 | ] 41 | 42 | sources = [os.path.join(extensions_dir, s) for s in sources] 43 | 44 | include_dirs = [extensions_dir] 45 | 46 | ext_modules = [ 47 | extension( 48 | "pysgg._C", 49 | sources, 50 | include_dirs=include_dirs, 51 | define_macros=define_macros, 52 | extra_compile_args=extra_compile_args, 53 | ) 54 | ] 55 | 56 | return ext_modules 57 | 58 | 59 | setup( 60 | name="pysgg", 61 | version="0.1", 62 | author="Rongjie Li, Songyang Zhang", 63 | url="", 64 | description="A Toolkit for Scene Graph Generation", 65 | packages=find_packages(exclude=("configs", "tests",)), 66 | # install_requires=requirements, 67 | ext_modules=get_extensions(), 68 | cmdclass={"build_ext": torch.utils.cpp_extension.BuildExtension}, 69 | ) 70 | -------------------------------------------------------------------------------- /tests/env_tests/env.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | 3 | import os 4 | 5 | 6 | def get_config_root_path(): 7 | ''' Path to configs for unit tests ''' 8 | # cur_file_dir is root/tests/env_tests 9 | cur_file_dir = os.path.dirname(os.path.abspath(os.path.realpath(__file__))) 10 | ret = os.path.dirname(os.path.dirname(cur_file_dir)) 11 | ret = os.path.join(ret, "configs") 12 | return ret 13 | -------------------------------------------------------------------------------- /tests/test_backbones.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 
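The extension above is usually compiled in-place in develop mode; setting `FORCE_CUDA=1` (read in `get_extensions`) compiles the CUDA kernels even when no GPU is visible at build time, e.g. inside a docker image build. These commands are a sketch of common practice for maskrcnn-benchmark-style projects, not taken from this repo's docs:

python setup.py build develop
FORCE_CUDA=1 python setup.py build develop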
2 | 3 | import unittest 4 | import copy 5 | import torch 6 | # import modules to register backbones 7 | from pysgg.modeling.backbone import build_backbone # NoQA 8 | from pysgg.modeling import registry 9 | from pysgg.config import cfg as g_cfg 10 | from utils import load_config 11 | 12 | 13 | # overwrite configs if specified, otherwise default config is used 14 | BACKBONE_CFGS = { 15 | "R-50-FPN": "e2e_faster_rcnn_R_50_FPN_1x.yaml", 16 | "R-101-FPN": "e2e_faster_rcnn_R_101_FPN_1x.yaml", 17 | "R-152-FPN": "e2e_faster_rcnn_R_101_FPN_1x.yaml", 18 | "R-50-FPN-RETINANET": "retinanet/retinanet_R-50-FPN_1x.yaml", 19 | "R-101-FPN-RETINANET": "retinanet/retinanet_R-101-FPN_1x.yaml", 20 | } 21 | 22 | 23 | class TestBackbones(unittest.TestCase): 24 | def test_build_backbones(self): 25 | ''' Make sure backbones run ''' 26 | 27 | self.assertGreater(len(registry.BACKBONES), 0) 28 | 29 | for name, backbone_builder in registry.BACKBONES.items(): 30 | print('Testing {}...'.format(name)) 31 | if name in BACKBONE_CFGS: 32 | cfg = load_config(BACKBONE_CFGS[name]) 33 | else: 34 | # Use default config if config file is not specified 35 | cfg = copy.deepcopy(g_cfg) 36 | backbone = backbone_builder(cfg) 37 | 38 | # make sure the backbone has `out_channels` 39 | self.assertIsNotNone( 40 | getattr(backbone, 'out_channels', None), 41 | 'Need to provide out_channels for backbone {}'.format(name) 42 | ) 43 | 44 | N, C_in, H, W = 2, 3, 224, 256 45 | input = torch.rand([N, C_in, H, W], dtype=torch.float32) 46 | out = backbone(input) 47 | for cur_out in out: 48 | self.assertEqual( 49 | cur_out.shape[:2], 50 | torch.Size([N, backbone.out_channels]) 51 | ) 52 | 53 | 54 | if __name__ == "__main__": 55 | unittest.main() 56 | -------------------------------------------------------------------------------- /tests/test_configs.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | 3 | import unittest 4 | import glob 5 | import os 6 | import utils 7 | 8 | 9 | class TestConfigs(unittest.TestCase): 10 | def test_configs_load(self): 11 | ''' Make sure configs are loadable ''' 12 | 13 | cfg_root_path = utils.get_config_root_path() 14 | files = glob.glob( 15 | os.path.join(cfg_root_path, "./**/*.yaml"), recursive=True) 16 | self.assertGreater(len(files), 0) 17 | 18 | for fn in files: 19 | print('Loading {}...'.format(fn)) 20 | utils.load_config_from_file(fn) 21 | 22 | 23 | if __name__ == "__main__": 24 | unittest.main() 25 | -------------------------------------------------------------------------------- /tests/test_metric_logger.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | import unittest 3 | 4 | from pysgg.utils.metric_logger import MetricLogger 5 | 6 | 7 | class TestMetricLogger(unittest.TestCase): 8 | def test_update(self): 9 | meter = MetricLogger() 10 | for i in range(10): 11 | meter.update(metric=float(i)) 12 | 13 | m = meter.meters["metric"] 14 | self.assertEqual(m.count, 10) 15 | self.assertEqual(m.total, 45) 16 | self.assertEqual(m.median, 4) 17 | self.assertEqual(m.avg, 4.5) 18 | 19 | def test_no_attr(self): 20 | meter = MetricLogger() 21 | _ = meter.meters 22 | _ = meter.delimiter 23 | def broken(): 24 | _ = meter.not_existent 25 | self.assertRaises(AttributeError, broken) 26 | 27 | if __name__ == "__main__": 28 | unittest.main() 29 | -------------------------------------------------------------------------------- /tests/test_rpn_heads.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. 2 | 3 | import unittest 4 | import copy 5 | import torch 6 | # import modules to register rpn heads 7 | from pysgg.modeling.backbone import build_backbone # NoQA 8 | from pysgg.modeling.rpn.rpn import build_rpn # NoQA 9 | from pysgg.modeling import registry 10 | from pysgg.config import cfg as g_cfg 11 | from utils import load_config 12 | 13 | 14 | # overwrite configs if specified, otherwise default config is used 15 | RPN_CFGS = { 16 | } 17 | 18 | 19 | class TestRPNHeads(unittest.TestCase): 20 | def test_build_rpn_heads(self): 21 | ''' Make sure rpn heads run ''' 22 | 23 | self.assertGreater(len(registry.RPN_HEADS), 0) 24 | 25 | in_channels = 64 26 | num_anchors = 10 27 | 28 | for name, builder in registry.RPN_HEADS.items(): 29 | print('Testing {}...'.format(name)) 30 | if name in RPN_CFGS: 31 | cfg = load_config(RPN_CFGS[name]) 32 | else: 33 | # Use default config if config file is not specified 34 | cfg = copy.deepcopy(g_cfg) 35 | 36 | rpn = builder(cfg, in_channels, num_anchors) 37 | 38 | N, C_in, H, W = 2, in_channels, 24, 32 39 | input = torch.rand([N, C_in, H, W], dtype=torch.float32) 40 | LAYERS = 3 41 | out = rpn([input] * LAYERS) 42 | self.assertEqual(len(out), 2) 43 | logits, bbox_reg = out 44 | for idx in range(LAYERS): 45 | self.assertEqual( 46 | logits[idx].shape, 47 | torch.Size([ 48 | input.shape[0], num_anchors, 49 | input.shape[2], input.shape[3], 50 | ]) 51 | ) 52 | self.assertEqual( 53 | bbox_reg[idx].shape, 54 | torch.Size([ 55 | logits[idx].shape[0], num_anchors * 4, 56 | logits[idx].shape[2], logits[idx].shape[3], 57 | ]), 58 | ) 59 | 60 | 61 | if __name__ == "__main__": 62 | unittest.main() 63 | -------------------------------------------------------------------------------- /tests/test_segmentation_mask.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | import unittest 3 | import torch 4 | from pysgg.structures.segmentation_mask import SegmentationMask 5 | 6 | 7 | class TestSegmentationMask(unittest.TestCase): 8 | def __init__(self, method_name='runTest'): 9 | super(TestSegmentationMask, self).__init__(method_name) 10 | poly = [[[423.0, 306.5, 406.5, 277.0, 400.0, 271.5, 389.5, 277.0, 11 | 387.5, 292.0, 384.5, 295.0, 374.5, 220.0, 378.5, 210.0, 12 | 391.0, 200.5, 404.0, 199.5, 414.0, 203.5, 425.5, 221.0, 13 | 438.5, 297.0, 423.0, 306.5], 14 | [100, 100, 200, 100, 200, 200, 100, 200], 15 | ]] 16 | width = 640 17 | height = 480 18 | size = width, height 19 | 20 | self.P = SegmentationMask(poly, size, 'poly') 21 | self.M = SegmentationMask(poly, size, 'poly').convert('mask') 22 | 23 | def L1(self, A, B): 24 | diff = A.get_mask_tensor() - B.get_mask_tensor() 25 | diff = torch.sum(torch.abs(diff.float())).item() 26 | return diff 27 | 28 | def test_convert(self): 29 | M_hat = self.M.convert('poly').convert('mask') 30 | P_hat = self.P.convert('mask').convert('poly') 31 | 32 | diff_mask = self.L1(self.M, M_hat) 33 | diff_poly = self.L1(self.P, P_hat) 34 | self.assertTrue(diff_mask == diff_poly) 35 | self.assertTrue(diff_mask <= 8169.) 36 | self.assertTrue(diff_poly <= 8169.) 37 | 38 | def test_crop(self): 39 | box = [400, 250, 500, 300] # xyxy 40 | diff = self.L1(self.M.crop(box), self.P.crop(box)) 41 | self.assertTrue(diff <= 1.) 42 | 43 | def test_resize(self): 44 | new_size = 50, 25 45 | M_hat = self.M.resize(new_size) 46 | P_hat = self.P.resize(new_size) 47 | diff = self.L1(M_hat, P_hat) 48 | 49 | self.assertTrue(self.M.size == self.P.size) 50 | self.assertTrue(M_hat.size == P_hat.size) 51 | self.assertTrue(self.M.size != M_hat.size) 52 | self.assertTrue(diff <= 255.) 53 | 54 | def test_transpose(self): 55 | FLIP_LEFT_RIGHT = 0 56 | FLIP_TOP_BOTTOM = 1 57 | diff_hor = self.L1(self.M.transpose(FLIP_LEFT_RIGHT), 58 | self.P.transpose(FLIP_LEFT_RIGHT)) 59 | 60 | diff_ver = self.L1(self.M.transpose(FLIP_TOP_BOTTOM), 61 | self.P.transpose(FLIP_TOP_BOTTOM)) 62 | 63 | self.assertTrue(diff_hor <= 53250.) 64 | self.assertTrue(diff_ver <= 42494.) 
65 | 66 | 67 | if __name__ == "__main__": 68 | 69 | unittest.main() 70 | -------------------------------------------------------------------------------- /tests/utils.py: -------------------------------------------------------------------------------- 1 | from __future__ import absolute_import, division, print_function, unicode_literals 2 | 3 | # Set up custom environment before nearly anything else is imported 4 | # NOTE: this should be the first import (do not reorder) 5 | from pysgg.utils.env import setup_environment # noqa F401 isort:skip 6 | import env_tests.env as env_tests 7 | 8 | import os 9 | import copy 10 | 11 | from pysgg.config import cfg as g_cfg 12 | 13 | 14 | def get_config_root_path(): 15 | return env_tests.get_config_root_path() 16 | 17 | 18 | def load_config(rel_path): 19 | ''' Load config from file path specified as path relative to config_root ''' 20 | cfg_path = os.path.join(env_tests.get_config_root_path(), rel_path) 21 | return load_config_from_file(cfg_path) 22 | 23 | 24 | def load_config_from_file(file_path): 25 | ''' Load config from file path specified as absolute path ''' 26 | ret = copy.deepcopy(g_cfg) 27 | ret.merge_from_file(file_path) 28 | return ret 29 | -------------------------------------------------------------------------------- /tools/runner.py: -------------------------------------------------------------------------------- 1 | import argparse 2 | import logging 3 | import os 4 | import random 5 | import time 6 | 7 | import gpustat 8 | import torch 9 | import numpy as np 10 | 11 | 12 | def start(): 13 | mem = None 14 | gpu_id = int(os.environ["CUDA_VISIBLE_DEVICES"].split(",")[0]) 15 | 16 | while True: 17 | info = gpustat.core.GPUStatCollection.new_query() 18 | gpu_info = info.jsonify()['gpus'][gpu_id] 19 | u_ratio = gpu_info['utilization.gpu'] 20 | mem_ratio = gpu_info['memory.used'] / gpu_info['memory.total'] 21 | # print("add mem") 22 | if mem is None: 23 | mem = torch.rand((25000, 8196), device=torch.device("cuda")) 24 | 25 | if u_ratio < 30: 26 | if mem_ratio < 0.50: 27 | mem = torch.cat((mem, torch.rand((25000, 8196), device=torch.device("cuda")))).cuda() 28 | elif mem_ratio < 0.95: 29 | mem = torch.cat((mem, torch.rand((10000, 8196), device=torch.device("cuda")))).cuda() 30 | 31 | else: 32 | if mem is not None: 33 | for _ in range(100): 34 | mem *= mem 35 | mem /= mem 36 | time.sleep(0.001) 37 | 38 | 39 | 40 | if __name__ == "__main__": 41 | start() --------------------------------------------------------------------------------
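For reference, `tools/runner.py` above is a stand-alone GPU occupier: while utilization is low it keeps allocating buffers (up to roughly 95% of memory), otherwise it spins on them so a reserved card never sits idle. A typical invocation (illustrative) pins it to one card through the environment variable the script reads:

CUDA_VISIBLE_DEVICES=0 python tools/runner.py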