├── INSTALL.md
├── README.md
├── apex
    ├── .nojekyll
    ├── LICENSE
    ├── README.md
    ├── apex
    │   ├── RNN
    │   │   ├── README.md
    │   │   ├── RNNBackend.py
    │   │   ├── __init__.py
    │   │   ├── cells.py
    │   │   └── models.py
    │   ├── __init__.py
    │   ├── amp
    │   │   ├── README.md
    │   │   ├── __init__.py
    │   │   ├── __version__.py
    │   │   ├── _amp_state.py
    │   │   ├── _initialize.py
    │   │   ├── _process_optimizer.py
    │   │   ├── amp.py
    │   │   ├── compat.py
    │   │   ├── frontend.py
    │   │   ├── handle.py
    │   │   ├── lists
    │   │   │   ├── __init__.py
    │   │   │   ├── __pycache__
    │   │   │   │   ├── __init__.cpython-35.pyc
    │   │   │   │   ├── __init__.cpython-36.pyc
    │   │   │   │   ├── functional_overrides.cpython-35.pyc
    │   │   │   │   ├── functional_overrides.cpython-36.pyc
    │   │   │   │   ├── tensor_overrides.cpython-35.pyc
    │   │   │   │   ├── tensor_overrides.cpython-36.pyc
    │   │   │   │   ├── torch_overrides.cpython-35.pyc
    │   │   │   │   └── torch_overrides.cpython-36.pyc
    │   │   │   ├── functional_overrides.py
    │   │   │   ├── tensor_overrides.py
    │   │   │   └── torch_overrides.py
    │   │   ├── opt.py
    │   │   ├── rnn_compat.py
    │   │   ├── scaler.py
    │   │   ├── utils.py
    │   │   └── wrap.py
    │   ├── fp16_utils
    │   │   ├── README.md
    │   │   ├── __init__.py
    │   │   ├── fp16_optimizer.py
    │   │   ├── fp16util.py
    │   │   └── loss_scaler.py
    │   ├── multi_tensor_apply
    │   │   ├── __init__.py
    │   │   └── multi_tensor_apply.py
    │   ├── normalization
    │   │   ├── __init__.py
    │   │   └── fused_layer_norm.py
    │   ├── optimizers
    │   │   ├── __init__.py
    │   │   ├── fp16_optimizer.py
    │   │   └── fused_adam.py
    │   ├── parallel
    │   │   ├── LARC.py
    │   │   ├── README.md
    │   │   ├── __init__.py
    │   │   ├── distributed.py
    │   │   ├── multiproc.py
    │   │   ├── optimized_sync_batchnorm.py
    │   │   ├── optimized_sync_batchnorm_kernel.py
    │   │   ├── sync_batchnorm.py
    │   │   └── sync_batchnorm_kernel.py
    │   └── reparameterization
    │   │   ├── README.md
    │   │   ├── __init__.py
    │   │   ├── reparameterization.py
    │   │   └── weight_norm.py
    ├── csrc
    │   ├── amp_C_frontend.cpp
    │   ├── flatten_unflatten.cpp
    │   ├── fused_adam_cuda.cpp
    │   ├── fused_adam_cuda_kernel.cu
    │   ├── layer_norm_cuda.cpp
    │   ├── layer_norm_cuda_kernel.cu
    │   ├── multi_tensor_apply.cuh
    │   ├── multi_tensor_axpby_kernel.cu
    │   ├── multi_tensor_l2norm_kernel.cu
    │   ├── multi_tensor_scale_kernel.cu
    │   ├── syncbn.cpp
    │   ├── type_shim.h
    │   └── welford.cu
    ├── docs
    │   ├── Makefile
    │   └── source
    │   │   ├── _static
    │   │       ├── css
    │   │       │   └── pytorch_theme.css
    │   │       └── img
    │   │       │   └── nv-pytorch2.png
    │   │   ├── _templates
    │   │       └── layout.html
    │   │   ├── advanced.rst
    │   │   ├── amp.rst
    │   │   ├── conf.py
    │   │   ├── fp16_utils.rst
    │   │   ├── index.rst
    │   │   ├── layernorm.rst
    │   │   ├── optimizers.rst
    │   │   └── parallel.rst
    ├── examples
    │   ├── README.md
    │   ├── dcgan
    │   │   └── README.md
    │   ├── docker
    │   │   ├── Dockerfile
    │   │   └── README.md
    │   ├── imagenet
    │   │   ├── README.md
    │   │   └── main_amp.py
    │   └── simple
    │   │   └── distributed
    │   │       ├── README.md
    │   │       ├── distributed_data_parallel.py
    │   │       └── run.sh
    ├── setup.py
    └── tests
    │   ├── L0
    │       ├── run_amp
    │       │   ├── __init__.py
    │       │   ├── test_basic_casts.py
    │       │   ├── test_cache.py
    │       │   ├── test_multi_tensor_axpby.py
    │       │   ├── test_multi_tensor_l2norm.py
    │       │   ├── test_multi_tensor_scale.py
    │       │   ├── test_multiple_models_optimizers_losses.py
    │       │   ├── test_promotion.py
    │       │   ├── test_rnn.py
    │       │   └── utils.py
    │       ├── run_fp16util
    │       │   ├── __init__.py
    │       │   └── test_fp16util.py
    │       ├── run_fused_layer_norm
    │       │   └── test_fused_layer_norm.py
    │       ├── run_mixed_adam
    │       │   ├── __init__.py
    │       │   ├── test_fp16_optimizer.py
    │       │   └── test_mixed_adam.py
    │       └── run_test.py
    │   ├── L1
    │       ├── common
    │       │   ├── compare.py
    │       │   ├── main_amp.py
    │       │   └── run_test.sh
    │       ├── cross_product
    │       │   └── run.sh
    │       └── cross_product_distributed
    │       │   └── run.sh
    │   ├── distributed
    │       ├── DDP
    │       │   ├── ddp_race_condition_test.py
    │       │   └── run_race_test.sh
    │       ├── amp_master_params
    │       │   ├── amp_master_params.py
    │       │   ├── compare.py
    │       │   └── run.sh
    │       └── synced_batchnorm
    │       │   ├── single_gpu_unit_test.py
    │       │   ├── test_groups.py
    │       │   ├── two_gpu_unit_test.py
    │       │   └── unit_test.sh
    │   └── docker_extension_builds
    │       └── run.sh
├── configs
    └── rdpnet
    │   ├── r101-isod.yaml
    │   ├── r50-come.yaml
    │   ├── r50-isod-te.yaml
    │   ├── r50-isod.yaml
    │   ├── r50-soc-te.yaml
    │   ├── r50-soc.yaml
    │   └── x101-isod.yaml
├── datasets
    └── PLACE_DATA_HERE
├── demo
    ├── examples
    │   ├── test_10.jpg
    │   ├── test_14.jpg
    │   ├── test_20.jpg
    │   ├── test_23.jpg
    │   ├── test_24.jpg
    │   ├── test_25.jpg
    │   ├── test_3.jpg
    │   ├── test_5.jpg
    │   ├── test_53.jpg
    │   ├── test_6.jpg
    │   └── test_9.jpg
    ├── model_zoo
    ├── predictor.py
    └── visualize.py
├── docker
    ├── Dockerfile
    └── docker-jupyter
    │   ├── Dockerfile
    │   └── jupyter_notebook_config.py
├── maskrcnn_benchmark
    ├── _C.cpython-36m-x86_64-linux-gnu.so
    ├── __init__.py
    ├── config
    │   ├── __init__.py
    │   ├── defaults.py
    │   └── paths_catalog.py
    ├── csrc
    │   ├── ROIAlign.h
    │   ├── ROIPool.h
    │   ├── SigmoidFocalLoss.h
    │   ├── cpu
    │   │   ├── ROIAlign_cpu.cpp
    │   │   ├── nms_cpu.cpp
    │   │   └── vision.h
    │   ├── cuda
    │   │   ├── ROIAlign_cuda.cu
    │   │   ├── ROIPool_cuda.cu
    │   │   ├── SigmoidFocalLoss_cuda.cu
    │   │   ├── deform_conv_cuda_kernel.cu
    │   │   ├── nms.cu
    │   │   └── vision.h
    │   ├── deform_conv_cuda.h
    │   ├── nms.h
    │   └── vision.cpp
    ├── data
    │   ├── README.md
    │   ├── __init__.py
    │   ├── build.py
    │   ├── collate_batch.py
    │   ├── datasets
    │   │   ├── __init__.py
    │   │   ├── coco.py
    │   │   ├── concat_dataset.py
    │   │   ├── evaluation
    │   │   │   ├── __init__.py
    │   │   │   ├── coco
    │   │   │   │   ├── __init__.py
    │   │   │   │   └── coco_eval.py
    │   │   │   └── voc
    │   │   │   │   ├── __init__.py
    │   │   │   │   └── voc_eval.py
    │   │   ├── list_dataset.py
    │   │   └── voc.py
    │   ├── samplers
    │   │   ├── __init__.py
    │   │   ├── distributed.py
    │   │   ├── grouped_batch_sampler.py
    │   │   └── iteration_based_batch_sampler.py
    │   └── transforms
    │   │   ├── __init__.py
    │   │   ├── build.py
    │   │   └── transforms.py
    ├── engine
    │   ├── __init__.py
    │   ├── inference.py
    │   └── trainer.py
    ├── layers
    │   ├── __init__.py
    │   ├── _utils.py
    │   ├── batch_norm.py
    │   ├── deform_conv.py
    │   ├── functions
    │   │   └── deform_conv.py
    │   ├── iou_loss.py
    │   ├── misc.py
    │   ├── nms.py
    │   ├── roi_align.py
    │   ├── roi_pool.py
    │   ├── scale.py
    │   ├── sigmoid_focal_loss.py
    │   └── smooth_l1_loss.py
    ├── modeling
    │   ├── __init__.py
    │   ├── backbone
    │   │   ├── __init__.py
    │   │   ├── backbone.py
    │   │   ├── bn.py
    │   │   ├── fbnet.py
    │   │   ├── fbnet_builder.py
    │   │   ├── fbnet_modeldef.py
    │   │   ├── fpn.py
    │   │   ├── functions.py
    │   │   ├── resnet.py
    │   │   ├── segmentation.py
    │   │   └── src
    │   │   │   ├── checks.h
    │   │   │   ├── inplace_abn.cpp
    │   │   │   ├── inplace_abn.h
    │   │   │   ├── inplace_abn_cpu.cpp
    │   │   │   ├── inplace_abn_cuda.cu
    │   │   │   ├── inplace_abn_cuda_half.cu
    │   │   │   └── utils
    │   │   │       ├── checks.h
    │   │   │       ├── common.h
    │   │   │       └── cuda.cuh
    │   ├── balanced_positive_negative_sampler.py
    │   ├── box_coder.py
    │   ├── detector
    │   │   ├── __init__.py
    │   │   ├── detectors.py
    │   │   └── generalized_rcnn.py
    │   ├── make_layers.py
    │   ├── matcher.py
    │   ├── poolers.py
    │   ├── registry.py
    │   ├── roi_heads
    │   │   ├── __init__.py
    │   │   ├── box_head
    │   │   │   ├── __init__.py
    │   │   │   ├── box_head.py
    │   │   │   ├── inference.py
    │   │   │   ├── loss.py
    │   │   │   ├── roi_box_feature_extractors.py
    │   │   │   └── roi_box_predictors.py
    │   │   ├── keypoint_head
    │   │   │   ├── __init__.py
    │   │   │   ├── inference.py
    │   │   │   ├── keypoint_head.py
    │   │   │   ├── loss.py
    │   │   │   ├── roi_keypoint_feature_extractors.py
    │   │   │   └── roi_keypoint_predictors.py
    │   │   ├── mask_head
    │   │   │   ├── __init__.py
    │   │   │   ├── inference.py
    │   │   │   ├── loss.py
    │   │   │   ├── mask_head.py
    │   │   │   ├── roi_mask_feature_extractors.py
    │   │   │   └── roi_mask_predictors.py
    │   │   └── roi_heads.py
    │   ├── rpn
    │   │   ├── __init__.py
    │   │   ├── anchor_generator.py
    │   │   ├── fcos-drop
    │   │   │   ├── __init__.py
    │   │   │   ├── fcos.py
    │   │   │   ├── inference.py
    │   │   │   └── loss.py
    │   │   ├── fcos
    │   │   │   ├── __init__.py
    │   │   │   ├── fcos.py
    │   │   │   ├── inference.py
    │   │   │   └── loss.py
    │   │   ├── inference.py
    │   │   ├── loss.py
    │   │   ├── retinanet
    │   │   │   ├── __init__.py
    │   │   │   ├── inference.py
    │   │   │   ├── loss.py
    │   │   │   └── retinanet.py
    │   │   ├── rpn.py
    │   │   └── utils.py
    │   └── utils.py
    ├── solver
    │   ├── __init__.py
    │   ├── build.py
    │   └── lr_scheduler.py
    ├── structures
    │   ├── __init__.py
    │   ├── bounding_box.py
    │   ├── boxlist_ops.py
    │   ├── image_list.py
    │   ├── keypoint.py
    │   └── segmentation_mask.py
    └── utils
    │   ├── README.md
    │   ├── __init__.py
    │   ├── c2_model_loading.py
    │   ├── checkpoint.py
    │   ├── collect_env.py
    │   ├── comm.py
    │   ├── cv2_util.py
    │   ├── env.py
    │   ├── imports.py
    │   ├── logger.py
    │   ├── metric_logger.py
    │   ├── miscellaneous.py
    │   ├── model_serialization.py
    │   ├── model_zoo.py
    │   ├── registry.py
    │   └── timer.py
├── model_zoo
    └── PLACE_WEIGHTS_HERE
├── my_env.txt
├── requirements.txt
├── scripts
    ├── test_isod.sh
    ├── test_soc.sh
    ├── train_come.sh
    ├── train_isod.sh
    ├── train_r101_isod.sh
    ├── train_soc.sh
    └── train_x101_isod.sh
├── setup.py
└── tools
    ├── cityscapes
        ├── convert_cityscapes_to_coco.py
        └── instances2dict_with_polygons.py
    ├── test_net.py
    └── train_net.py


/INSTALL.md:
--------------------------------------------------------------------------------
 1 | ## Installation
 2 | 
 3 | ### Requirements:
 4 | - PyTorch 1.1 or 1.0.1.
 5 | - torchvision 0.2.2.post3
 6 | - cocoapi
 7 | - yacs
 8 | - matplotlib
 9 | - GCC >= 4.9
10 | - OpenCV
11 | 
12 | 
13 | ### Option 1: Step-by-step installation
14 | 
15 | ```bash
16 | # first, make sure that your conda is setup properly with the right environment
17 | # for that, check that `which conda`, `which pip` and `which python` points to the
18 | # right path. From a clean conda env, this is what you need to do
19 | 
20 | conda create --name RDPNet
21 | conda activate RDPNet
22 | 
23 | # this installs the right pip and dependencies for the fresh python
24 | conda install ipython
25 | 
26 | # follow PyTorch installation in https://pytorch.org/get-started/locally/
27 | # we give the instructions for CUDA 9.0
28 | # You should install the consistent CUDA vesion which is same with your system's CUDA version!!!
29 | conda install -c pytorch pytorch==1.1 torchvision==0.2.2 cudatoolkit=9.0
30 | 
31 | export INSTALL_DIR=$PWD
32 | 
33 | # install pycocotools
34 | pip install pycocotools
35 | 
36 | # install RDPNet
37 | cd $INSTALL_DIR
38 | git clone https://github.com/yuhuan-wu/RDPNet.git
39 | cd RDPNet
40 | 
41 | 
42 | # RDPNet and coco api dependencies
43 | pip install -r requirements.txt
44 | 
45 | # the following will install the lib with
46 | # symbolic links, so that you can modify
47 | # the files if you want and won't need to
48 | # re-build it
49 | python setup.py build develop
50 | 
51 | cd apex
52 | pip install -v --no-cache-dir --global-option="--cpp_ext" --global-option="--cuda_ext" .
53 | 
54 | unset INSTALL_DIR
55 | 
56 | # or if you are on macOS
57 | # MACOSX_DEPLOYMENT_TARGET=10.9 CC=clang CXX=clang++ python setup.py build develop
58 | ```
59 | 
60 | ### Option 2: Docker Image (Requires CUDA, Linux only)
61 | *The following steps are for original maskrcnn-benchmark. Please change the repository name if needed.* 
62 | 
63 | Build image with defaults (`CUDA=9.0`, `CUDNN=7`, `FORCE_CUDA=1`):
64 | 
65 |     nvidia-docker build -t maskrcnn-benchmark docker/
66 | 
67 | Build image with other CUDA and CUDNN versions:
68 | 
69 |     nvidia-docker build -t maskrcnn-benchmark --build-arg CUDA=9.2 --build-arg CUDNN=7 docker/
70 | 
71 | Build image with FORCE_CUDA disabled:
72 | 
73 |     nvidia-docker build -t maskrcnn-benchmark --build-arg FORCE_CUDA=0 docker/
74 | 
75 | Build and run image with built-in jupyter notebook(note that the password is used to log in jupyter notebook):
76 | 
77 |     nvidia-docker build -t maskrcnn-benchmark-jupyter docker/docker-jupyter/
78 |     nvidia-docker run -td -p 8888:8888 -e PASSWORD=<password> -v <host-dir>:<container-dir> maskrcnn-benchmark-jupyter
79 | 


--------------------------------------------------------------------------------
/apex/.nojekyll:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/.nojekyll


--------------------------------------------------------------------------------
/apex/LICENSE:
--------------------------------------------------------------------------------
 1 | All rights reserved.
 2 | 
 3 | Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met:
 4 | 
 5 | 1. Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer.
 6 | 
 7 | 2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution.
 8 | 
 9 | 3. Neither the name of the copyright holder nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission.
10 | 
11 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.


--------------------------------------------------------------------------------
/apex/apex/RNN/README.md:
--------------------------------------------------------------------------------
1 | Under construction...
2 | 


--------------------------------------------------------------------------------
/apex/apex/RNN/__init__.py:
--------------------------------------------------------------------------------
1 | from .models import LSTM, GRU, ReLU, Tanh, mLSTM
2 | 
3 | __all__ = ['models']
4 | 


--------------------------------------------------------------------------------
/apex/apex/RNN/cells.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | import torch.nn as nn
 3 | import torch.nn.functional as F
 4 | 
 5 | from .RNNBackend import RNNCell
 6 | 
 7 | from torch.nn._functions.thnn import rnnFusedPointwise as fusedBackend
 8 | 
 9 | import math 
10 | 
11 | 
12 | class mLSTMRNNCell(RNNCell):
13 |     """
14 |     mLSTMRNNCell
15 |     """
16 | 
17 |     def __init__(self, input_size, hidden_size, bias = False, output_size = None):
18 |         gate_multiplier = 4
19 |         super(mLSTMRNNCell, self).__init__(gate_multiplier, input_size, hidden_size, mLSTMCell, n_hidden_states = 2, bias = bias, output_size = output_size)
20 | 
21 |         self.w_mih = nn.Parameter(torch.Tensor(self.output_size, self.input_size))
22 |         self.w_mhh = nn.Parameter(torch.Tensor(self.output_size, self.output_size))
23 | 
24 |         self.reset_parameters()
25 | 
26 |     def forward(self, input):
27 |         """
28 |         mLSTMRNNCell.forward()
29 |         """
30 |         #if not inited or bsz has changed this will create hidden states
31 |         self.init_hidden(input.size()[0])
32 | 
33 |         hidden_state = self.hidden[0] if self.n_hidden_states == 1 else self.hidden
34 | 
35 |         self.hidden = list(
36 |                            self.cell(input, hidden_state, self.w_ih, self.w_hh, self.w_mih, self.w_mhh,
37 |                            b_ih=self.b_ih, b_hh=self.b_hh)
38 |         )
39 |         
40 |         if self.output_size != self.hidden_size:
41 |             self.hidden[0] = F.linear(self.hidden[0], self.w_ho)
42 |         return tuple(self.hidden)
43 | 
44 | 
45 |     def new_like(self, new_input_size=None):
46 |         if new_input_size is None:
47 |             new_input_size = self.input_size
48 |         
49 |         return type(self)(
50 |             new_input_size,
51 |             self.hidden_size,
52 |             self.bias,
53 |             self.output_size)
54 | 
55 | def mLSTMCell(input, hidden, w_ih, w_hh, w_mih, w_mhh, b_ih=None, b_hh=None):
56 |     """
57 |     mLSTMCell
58 |     """
59 | 
60 |     if input.is_cuda:
61 |         igates = F.linear(input, w_ih)
62 |         m = F.linear(input, w_mih) * F.linear(hidden[0], w_mhh)
63 |         hgates = F.linear(m, w_hh)
64 | 
65 |         state = fusedBackend.LSTMFused.apply
66 |         return state(igates, hgates, hidden[1], b_ih, b_hh)
67 | 
68 |     hx, cx = hidden
69 |     
70 |     m = F.linear(input, w_mih) * F.linear(hidden[0], w_mhh)
71 |     gates = F.linear(input, w_ih, b_ih) + F.linear(m, w_hh, b_hh)
72 | 
73 |     ingate, forgetgate, cellgate, outgate = gates.chunk(4, 1)
74 | 
75 |     ingate = F.sigmoid(ingate)
76 |     forgetgate = F.sigmoid(forgetgate)
77 |     cellgate = F.tanh(cellgate)
78 |     outgate = F.sigmoid(outgate)
79 |     
80 |     cy = (forgetgate * cx) + (ingate * cellgate)
81 |     hy = outgate * F.tanh(cy)
82 |     
83 |     return hy, cy
84 |                                                                             
85 | 


--------------------------------------------------------------------------------
/apex/apex/RNN/models.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | 
 3 | from torch.nn._functions.rnn import LSTMCell, RNNReLUCell, RNNTanhCell, GRUCell
 4 | 
 5 | from .RNNBackend import bidirectionalRNN, stackedRNN, RNNCell
 6 | from .cells import mLSTMRNNCell, mLSTMCell
 7 | 
 8 | def toRNNBackend(inputRNN, num_layers, bidirectional=False, dropout = 0):
 9 |     """
10 |     :class:`toRNNBackend`
11 |     """
12 | 
13 |     if bidirectional:
14 |         return bidirectionalRNN(inputRNN, num_layers, dropout = dropout)
15 |     else:
16 |         return stackedRNN(inputRNN, num_layers, dropout = dropout)
17 | 
18 | 
19 | def LSTM(input_size, hidden_size, num_layers, bias=True, batch_first=False, dropout=0, bidirectional=False, output_size = None):
20 |     """
21 |     :class:`LSTM`
22 |     """
23 |     inputRNN = RNNCell(4, input_size, hidden_size, LSTMCell, 2, bias, output_size)
24 |     return toRNNBackend(inputRNN, num_layers, bidirectional, dropout=dropout)
25 | 
26 | def GRU(input_size, hidden_size, num_layers, bias=True, batch_first=False, dropout=0, bidirectional=False, output_size = None):
27 |     """
28 |     :class:`GRU`
29 |     """
30 |     inputRNN = RNNCell(3, input_size, hidden_size, GRUCell, 1, bias, output_size)
31 |     return toRNNBackend(inputRNN, num_layers, bidirectional, dropout=dropout)
32 | 
33 | def ReLU(input_size, hidden_size, num_layers, bias=True, batch_first=False, dropout=0, bidirectional=False, output_size = None):
34 |     """
35 |     :class:`ReLU`
36 |     """
37 |     inputRNN = RNNCell(1, input_size, hidden_size, RNNReLUCell, 1, bias, output_size)
38 |     return toRNNBackend(inputRNN, num_layers, bidirectional, dropout=dropout)
39 | 
40 | def Tanh(input_size, hidden_size, num_layers, bias=True, batch_first=False, dropout=0, bidirectional=False, output_size = None):
41 |     """
42 |     :class:`Tanh`
43 |     """
44 |     inputRNN = RNNCell(1, input_size, hidden_size, RNNTanhCell, 1, bias, output_size)
45 |     return toRNNBackend(inputRNN, num_layers, bidirectional, dropout=dropout)
46 |         
47 | def mLSTM(input_size, hidden_size, num_layers, bias=True, batch_first=False, dropout=0, bidirectional=False, output_size = None):
48 |     """
49 |     :class:`mLSTM`
50 |     """
51 |     inputRNN = mLSTMRNNCell(input_size, hidden_size, bias=bias, output_size=output_size)
52 |     return toRNNBackend(inputRNN, num_layers, bidirectional, dropout=dropout)
53 | 
54 | 
55 | 


--------------------------------------------------------------------------------
/apex/apex/__init__.py:
--------------------------------------------------------------------------------
 1 | from . import parallel
 2 | from . import amp
 3 | from . import fp16_utils
 4 | 
 5 | # For optimizers and normalization there is no Python fallback.
 6 | # Absence of cuda backend is a hard error.
 7 | # I would like the errors from importing fused_adam_cuda or fused_layer_norm_cuda
 8 | # to be triggered lazily, because if someone has installed with --cpp_ext and --cuda_ext
 9 | # so they expect those backends to be available, but for some reason they actually aren't
10 | # available (for example because they built improperly in a way that isn't revealed until
11 | # load time) the error message is timely and visible.
12 | from . import optimizers
13 | from . import normalization
14 | 


--------------------------------------------------------------------------------
/apex/apex/amp/__init__.py:
--------------------------------------------------------------------------------
1 | from .amp import init, half_function, float_function, promote_function,\
2 |     register_half_function, register_float_function, register_promote_function
3 | from .handle import scale_loss, disable_casts
4 | from .frontend import initialize
5 | from ._amp_state import master_params, _amp_state
6 | 


--------------------------------------------------------------------------------
/apex/apex/amp/__version__.py:
--------------------------------------------------------------------------------
1 | VERSION = (0, 1, 0)
2 | __version__ = '.'.join(map(str, VERSION))
3 | 


--------------------------------------------------------------------------------
/apex/apex/amp/_amp_state.py:
--------------------------------------------------------------------------------
 1 | # This is a "header object" that allows different amp modules to communicate.
 2 | # I'm a C++ guy, not a python guy.  I decided this approach because it seemed most C++-like.  
 3 | # But apparently it's ok:
 4 | # http://effbot.org/pyfaq/how-do-i-share-global-variables-across-modules.htm
 5 | import os
 6 | import torch
 7 | 
 8 | TORCH_MAJOR = int(torch.__version__.split('.')[0])
 9 | TORCH_MINOR = int(torch.__version__.split('.')[1])
10 | 
11 | if TORCH_MAJOR == 0:
12 |     import collections.abc as container_abcs
13 | else:
14 |     from torch._six import container_abcs
15 | 
16 | 
17 | class AmpState(object):
18 |     def __init__(self):
19 |         self.hard_override=False
20 |         self.allow_incoming_model_not_fp32 = False
21 |         self.verbosity=1
22 | 
23 | 
24 | # Attribute stash.  Could also just stash things as global module attributes.
25 | _amp_state = AmpState()
26 | 
27 | 
28 | def warn_or_err(msg):
29 |     if _amp_state.hard_override:
30 |         print("Warning:  " + msg)
31 |     else:
32 |         raise RuntimeError(msg)
33 |         # I'm not sure if allowing hard_override is a good idea.
34 |         # + "  If you're sure you know what you're doing, supply " +
35 |         #                    "hard_override=True to amp.initialize.")
36 | 
37 | 
38 | distributed = False
39 | if 'WORLD_SIZE' in os.environ:
40 |     distributed = int(os.environ['WORLD_SIZE']) > 1
41 | 
42 | 
43 | def maybe_print(msg, rank0=False):
44 |     if _amp_state.verbosity > 0:
45 |         if rank0:
46 |             if distributed:
47 |                 if torch.distributed.get_rank() == 0:
48 |                     print(msg)
49 |             else:
50 |                 print(msg)
51 |         else:
52 |             print(msg)
53 | 
54 | 
55 | # def iter_params(param_groups):
56 | #     for group in param_groups:
57 | #         for p in group['params']:
58 | #             yield p
59 | 
60 | 
61 | def master_params(optimizer):
62 |     """
63 |     Generator expression that iterates over the params owned by ``optimizer``.
64 | 
65 |     Args:
66 |         optimizer: An optimizer previously returned from ``amp.initialize``.
67 |     """
68 |     for group in optimizer.param_groups:
69 |         for p in group['params']:
70 |             yield p
71 | 


--------------------------------------------------------------------------------
/apex/apex/amp/compat.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | 
 3 | # True for post-0.4, when Variables/Tensors merged.
 4 | def variable_is_tensor():
 5 |     v = torch.autograd.Variable()
 6 |     return isinstance(v, torch.Tensor)
 7 | 
 8 | def tensor_is_variable():
 9 |     x = torch.Tensor()
10 |     return type(x) == torch.autograd.Variable
11 | 
12 | # False for post-0.4
13 | def tensor_is_float_tensor():
14 |     x = torch.Tensor()
15 |     return type(x) == torch.FloatTensor
16 | 
17 | # Akin to `torch.is_tensor`, but returns True for Variable
18 | # objects in pre-0.4.
19 | def is_tensor_like(x):
20 |     return torch.is_tensor(x) or isinstance(x, torch.autograd.Variable)
21 | 
22 | # Wraps `torch.is_floating_point` if present, otherwise checks
23 | # the suffix of `x.type()`.
24 | def is_floating_point(x):
25 |     if hasattr(torch, 'is_floating_point'):
26 |         return torch.is_floating_point(x)
27 |     try:
28 |         torch_type = x.type()
29 |         return torch_type.endswith('FloatTensor') or \
30 |             torch_type.endswith('HalfTensor') or \
31 |             torch_type.endswith('DoubleTensor')
32 |     except AttributeError:
33 |         return False
34 | 
35 | def scalar_python_val(x):
36 |     if hasattr(x, 'item'):
37 |         return x.item()
38 |     else:
39 |         if isinstance(x, torch.autograd.Variable):
40 |             return x.data[0]
41 |         else:
42 |             return x[0]
43 | 


--------------------------------------------------------------------------------
/apex/apex/amp/lists/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/apex/amp/lists/__init__.py


--------------------------------------------------------------------------------
/apex/apex/amp/lists/__pycache__/__init__.cpython-35.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/apex/amp/lists/__pycache__/__init__.cpython-35.pyc


--------------------------------------------------------------------------------
/apex/apex/amp/lists/__pycache__/__init__.cpython-36.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/apex/amp/lists/__pycache__/__init__.cpython-36.pyc


--------------------------------------------------------------------------------
/apex/apex/amp/lists/__pycache__/functional_overrides.cpython-35.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/apex/amp/lists/__pycache__/functional_overrides.cpython-35.pyc


--------------------------------------------------------------------------------
/apex/apex/amp/lists/__pycache__/functional_overrides.cpython-36.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/apex/amp/lists/__pycache__/functional_overrides.cpython-36.pyc


--------------------------------------------------------------------------------
/apex/apex/amp/lists/__pycache__/tensor_overrides.cpython-35.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/apex/amp/lists/__pycache__/tensor_overrides.cpython-35.pyc


--------------------------------------------------------------------------------
/apex/apex/amp/lists/__pycache__/tensor_overrides.cpython-36.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/apex/amp/lists/__pycache__/tensor_overrides.cpython-36.pyc


--------------------------------------------------------------------------------
/apex/apex/amp/lists/__pycache__/torch_overrides.cpython-35.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/apex/amp/lists/__pycache__/torch_overrides.cpython-35.pyc


--------------------------------------------------------------------------------
/apex/apex/amp/lists/__pycache__/torch_overrides.cpython-36.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/apex/amp/lists/__pycache__/torch_overrides.cpython-36.pyc


--------------------------------------------------------------------------------
/apex/apex/amp/lists/functional_overrides.py:
--------------------------------------------------------------------------------
 1 | 
 2 | # TODO: think about the following two. They do weird things.
 3 | # - torch.nn.utils.clip_grad (but it should always be fp32 anyway)
 4 | # - torch.nn.utils.weight_norm
 5 | 
 6 | # Notes:
 7 | # F.instance_norm uses batch_norm internally. Which correctly handles
 8 | #   fp16 in/out with fp32 weights. So we shouldn't do anything for
 9 | #   either of these.
10 | # F.normalize calls `input.norm()` internally, so it's redundant, but
11 | #   kept here in case impl. changes.
12 | # F.cosine_similarity is same: calls `x.norm()` internally.
13 | 
14 | import torch.nn.functional
15 | 
16 | MODULE = torch.nn.functional
17 | 
18 | FP16_FUNCS = [
19 |     'conv1d',
20 |     'conv2d',
21 |     'conv3d',
22 |     'conv_transpose1d',
23 |     'conv_transpose2d',
24 |     'conv_transpose3d',
25 |     'conv_tbc', # Undocumented / maybe new?
26 |     'linear',
27 | ]
28 | 
29 | FP32_FUNCS = [
30 | 
31 |     # Interpolation/Upsampling
32 |     'interpolate',
33 | 
34 |     # Pointwise
35 |     'softplus',
36 |     'softmin',
37 |     'log_softmax',
38 |     'softmax',
39 | 
40 |     # Normalization
41 |     'layer_norm',
42 |     'group_norm',
43 |     'local_response_norm',
44 |     'normalize',
45 |     'cosine_similarity',
46 | 
47 |     # Loss functions
48 |     # TODO: which of these can be fp16?
49 |     'poisson_nll_loss',
50 |     'cosine_embedding_loss',
51 |     'cross_entropy',
52 |     'hinge_embedding_loss',
53 |     'kl_div',
54 |     'l1_loss',
55 |     'mse_loss',
56 |     'margin_ranking_loss',
57 |     'multilabel_margin_loss',
58 |     'multilabel_soft_margin_loss',
59 |     'multi_margin_loss',
60 |     'nll_loss',
61 |     'binary_cross_entropy_with_logits',
62 |     'smooth_l1_loss',
63 |     'soft_margin_loss',
64 |     'triplet_margin_loss'
65 | ]
66 | 
67 | BANNED_FUNCS = [
68 |     ('binary_cross_entropy',
69 |      ("\namp does not work out-of-the-box with `F.binary_cross_entropy` or `torch.nn.BCELoss.` "
70 |       "It requires that the output of the previous function be already a FloatTensor. \n\n"
71 |       "Most models have a Sigmoid right before BCELoss. In that case, you can use\n"
72 |       "    torch.nn.BCEWithLogitsLoss\nto combine Sigmoid+BCELoss into a single layer "
73 |       "that is compatible with amp.\nAnother option is to add\n"
74 |       "    amp.register_float_function(torch, 'sigmoid')\nbefore calling `amp.init()`.\n"
75 |       "If you _really_ know what you are doing, you can disable this warning by passing "
76 |       "allow_banned=True to `amp.init()`."))
77 | ]
78 | 


--------------------------------------------------------------------------------
/apex/apex/amp/lists/tensor_overrides.py:
--------------------------------------------------------------------------------
 1 | from .. import compat
 2 | from . import torch_overrides
 3 | 
 4 | import importlib
 5 | 
 6 | import torch
 7 | 
 8 | if compat.variable_is_tensor() and not compat.tensor_is_variable():
 9 |     MODULE = torch.Tensor
10 | else:
11 |     MODULE = torch.autograd.Variable
12 | 
13 | 
14 | FP16_FUNCS = [
15 |     '__matmul__',
16 | ]
17 | 
18 | FP32_FUNCS = [
19 |     '__ipow__',
20 |     '__pow__',
21 |     '__rpow__',
22 | 
23 |     # Cast to fp32 before transfer to CPU
24 |     'cpu',
25 | ]
26 | 
27 | CASTS = [
28 |     '__add__',
29 |     '__div__',
30 |     '__eq__',
31 |     '__ge__',
32 |     '__gt__',
33 |     '__iadd__',
34 |     '__idiv__',
35 |     '__imul__',
36 |     '__isub__',
37 |     '__itruediv__',
38 |     '__le__',
39 |     '__lt__',
40 |     '__mul__',
41 |     '__ne__',
42 |     '__radd__',
43 |     '__rdiv__',
44 |     '__rmul__',
45 |     '__rsub__',
46 |     '__rtruediv__',
47 |     '__sub__',
48 |     '__truediv__',
49 | ]
50 | 
51 | # None of these, but here to make code cleaner.
52 | SEQUENCE_CASTS = []
53 | 
54 | # We need to grab all the methods from torch_overrides and add them to
55 | # the Tensor lists as well, as almost all methods are duplicated
56 | # between `torch` and `torch.Tensor` (and check with `hasattr`,
57 | # because a few random ones aren't defined on Tensor)
58 | _self_mod = importlib.import_module(__name__)
59 | for attrname in ['FP16_FUNCS', 'FP32_FUNCS', 'CASTS', 'SEQUENCE_CASTS']:
60 |     lst = getattr(_self_mod, attrname)
61 |     for fn in getattr(torch_overrides, attrname):
62 |         if hasattr(MODULE, fn):
63 |             lst.append(fn)
64 | 


--------------------------------------------------------------------------------
/apex/apex/amp/lists/torch_overrides.py:
--------------------------------------------------------------------------------
  1 | import torch
  2 | 
  3 | from .. import utils
  4 | 
  5 | MODULE = torch
  6 | 
  7 | FP16_FUNCS = [
  8 |     # Low level functions wrapped by torch.nn layers.
  9 |     # The wrapper layers contain the weights which are then passed in as a parameter
 10 |     # to these functions.
 11 |     'conv1d',
 12 |     'conv2d',
 13 |     'conv3d',
 14 |     'conv_transpose1d',
 15 |     'conv_transpose2d',
 16 |     'conv_transpose3d',
 17 |     'conv_tbc',
 18 |     'prelu',
 19 | 
 20 |     # BLAS
 21 |     'addmm',
 22 |     'addmv',
 23 |     'addr',
 24 |     'matmul',
 25 |     'mm',
 26 |     'mv',
 27 | ]
 28 | 
 29 | FP32_FUNCS = [
 30 |     # Pointwise
 31 |     'acos',
 32 |     'asin',
 33 |     'cosh',
 34 |     'erfinv',
 35 |     'exp',
 36 |     'expm1',
 37 |     'log',
 38 |     'log10',
 39 |     'log2',
 40 |     'reciprocal',
 41 |     'rsqrt',
 42 |     'sinh',
 43 |     'tan',
 44 | 
 45 |     # Other math
 46 |     'pow',
 47 | 
 48 |     # Reduction
 49 |     'cumprod',
 50 |     'cumsum',
 51 |     'dist',
 52 |     'mean',
 53 |     'norm',
 54 |     'prod',
 55 |     'std',
 56 |     'sum',
 57 |     'var',
 58 | 
 59 |     # Misc
 60 |     'renorm'
 61 | ]
 62 | 
 63 | # Before CUDA 9.1, batched matmul was missing fast FP16 kernels. We
 64 | # check the CUDA version -- if at least 9.1, then put the bmm
 65 | # functions on the fp16 list. Otherwise, put them on the fp32 list.
 66 | _bmms = ['addbmm',
 67 |          'baddbmm',
 68 |          'bmm']
 69 | if utils.get_cuda_version() >= (9, 1, 0):
 70 |     FP16_FUNCS.extend(_bmms)
 71 | else:
 72 |     FP32_FUNCS.extend(_bmms)
 73 | 
 74 | # Multi-tensor fns that may need type promotion
 75 | CASTS = [
 76 |     # Multi-tensor math
 77 |     'addcdiv',
 78 |     'addcmul',
 79 |     'atan2',
 80 |     'cross',
 81 |     'bilinear',
 82 | 
 83 |     # Element-wise _or_ tensor-wise math
 84 |     'add',
 85 |     'div',
 86 |     'mul',
 87 | 
 88 |     # Comparison
 89 |     'eq',
 90 |     'equal',
 91 |     'ge',
 92 |     'gt',
 93 |     'le',
 94 |     'lt',
 95 |     'ne'
 96 | ]
 97 | 
 98 | # Functions that take sequence arguments. We need to inspect the whole
 99 | # sequence and cast to the widest type.
100 | SEQUENCE_CASTS = [
101 |     'cat',
102 |     'stack'
103 | ]
104 | 


--------------------------------------------------------------------------------
/apex/apex/amp/rnn_compat.py:
--------------------------------------------------------------------------------
 1 | from . import utils, wrap
 2 | 
 3 | import torch
 4 | _VF = torch._C._VariableFunctions
 5 | RNN_NAMES = ['rnn_relu', 'rnn_tanh', 'gru', 'lstm']
 6 | 
 7 | def _gen_VF_wrapper(name):
 8 |     def wrapper(*args, **kwargs):
 9 |         return getattr(_VF, name)(*args, **kwargs)
10 |     return wrapper
11 | 
12 | # Some python magic to generate an object that has the rnn cell functions
13 | # defined on it, all of which call into corresponding _VF version.
14 | # Intended to patch torch.nn.modules.rnn._VF (aka, the ref named "_VF"
15 | # imported at module scope within torch.nn.modules.rnn).  This should
16 | # not affect third-party importers of _VF.py.
17 | class VariableFunctionsShim(object):
18 |     def __init__(self):
19 |         for name in RNN_NAMES:
20 |             for suffix in ['', '_cell']:
21 |                fn_name = name + suffix
22 |                setattr(self, fn_name, _gen_VF_wrapper(fn_name))
23 | 
24 | def has_old_rnns():
25 |     try:
26 |         torch.nn.backends.thnn.backend.LSTMCell
27 |         return True
28 |     except:
29 |         return False
30 | 
31 | def whitelist_rnn_cells(handle, verbose):
32 |     # Different module + function names in old/new RNN cases
33 |     if has_old_rnns():
34 |         fn_names = ['RNNReLUCell', 'RNNTanhCell', 'LSTMCell', 'GRUCell']
35 |         mod = torch.nn.backends.thnn.backend
36 |     else:
37 |         fn_names = [x + '_cell' for x in RNN_NAMES]
38 |         mod = torch.nn.modules.rnn._VF
39 |         assert isinstance(mod, VariableFunctionsShim)
40 | 
41 |     # Insert casts on cell functions
42 |     for fn in fn_names:
43 |         wrap.cached_cast(mod, fn, utils.maybe_half, handle,
44 |                          try_caching=True, verbose=verbose)
45 | 
46 |     if has_old_rnns():
47 |         # Special handling of `backward` for fused gru / lstm:
48 |         # The `backward` method calls Tensor.sum() (blacklist) internally,
49 |         # and then the resulting grad_input has the wrong type.
50 |         # TODO: where else is this a problem?
51 |         for rnn_type in ['GRUFused', 'LSTMFused']:
52 |             mod = getattr(torch.nn._functions.thnn.rnnFusedPointwise, rnn_type)
53 |             wrap.disable_casts(mod, 'backward', handle)
54 | 


--------------------------------------------------------------------------------
/apex/apex/fp16_utils/README.md:
--------------------------------------------------------------------------------
 1 | fp16_optimizer.py contains `FP16_Optimizer`, a Python class designed to wrap an existing Pytorch optimizer and automatically enable master parameters and loss scaling in a manner transparent to the user.  To use `FP16_Optimizer`, only two lines of one's Python model need to change.
 2 | 
 3 | #### [FP16_Optimizer API documentation](https://nvidia.github.io/apex/fp16_utils.html#automatic-management-of-master-params-loss-scaling)
 4 | 
 5 | #### [Simple examples with FP16_Optimizer](https://github.com/NVIDIA/apex/tree/master/examples/FP16_Optimizer_simple)
 6 | 
 7 | #### [Imagenet with FP16_Optimizer](https://github.com/NVIDIA/apex/tree/master/examples/imagenet)
 8 | 
 9 | #### [word_language_model with FP16_Optimizer](https://github.com/NVIDIA/apex/tree/master/examples/word_language_model)
10 | 
11 | 
12 | fp16_util.py contains a number of utilities to manually manage master parameters and loss scaling, if the user chooses.  
13 | 
14 | #### [Manual management documentation](https://nvidia.github.io/apex/fp16_utils.html#manual-master-parameter-management)
15 | 
16 | The [Imagenet with FP16_Optimizer](https://github.com/NVIDIA/apex/tree/master/examples/imagenet) and [word_language_model with FP16_Optimizer](https://github.com/NVIDIA/apex/tree/master/examples/word_language_model) directories also contain `main.py` files that demonstrate manual management of master parameters and static loss scaling.  These examples illustrate what sort of operations `FP16_Optimizer` is performing automatically.
17 | 


--------------------------------------------------------------------------------
/apex/apex/fp16_utils/__init__.py:
--------------------------------------------------------------------------------
 1 | from .fp16util import (
 2 |     BN_convert_float,
 3 |     network_to_half,
 4 |     prep_param_lists,
 5 |     model_grads_to_master_grads,
 6 |     master_params_to_model_params,
 7 |     tofp16,
 8 |     to_python_float,
 9 |     clip_grad_norm,
10 |     convert_module,
11 |     convert_network,
12 |     FP16Model,
13 | )
14 | 
15 | from .fp16_optimizer import FP16_Optimizer
16 | from .loss_scaler import LossScaler, DynamicLossScaler
17 | 


--------------------------------------------------------------------------------
/apex/apex/multi_tensor_apply/__init__.py:
--------------------------------------------------------------------------------
1 | from .multi_tensor_apply import MultiTensorApply
2 | 
3 | multi_tensor_applier = MultiTensorApply(2048*32)
4 | 
5 | 


--------------------------------------------------------------------------------
/apex/apex/multi_tensor_apply/multi_tensor_apply.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | 
 3 | class MultiTensorApply(object):
 4 |     available = False
 5 |     warned = False
 6 | 
 7 |     def __init__(self, chunk_size):
 8 |         try:
 9 |             import amp_C
10 |             MultiTensorApply.available = True
11 |             self.chunk_size = chunk_size
12 |         except ImportError as err:
13 |             MultiTensorApply.available = False
14 |             MultiTensorApply.import_err = err
15 | 
16 |     def check_avail(self):
17 |         if MultiTensorApply.available == False:
18 |             raise RuntimeError(
19 |                 "Attempted to call MultiTensorApply method, but MultiTensorApply "
20 |                 "is not available, possibly because Apex was installed without "
21 |                 "--cpp_ext --cuda_ext.  Original import error message:",
22 |                 MultiTensorApply.import_err)
23 | 
24 |     def __call__(self, op, noop_flag_buffer, tensor_lists, *args):
25 |         self.check_avail()
26 | 
27 |         return op(self.chunk_size,
28 |                   noop_flag_buffer,
29 |                   tensor_lists,
30 |                   *args)
31 | 


--------------------------------------------------------------------------------
/apex/apex/normalization/__init__.py:
--------------------------------------------------------------------------------
1 | from .fused_layer_norm import FusedLayerNorm
2 | 


--------------------------------------------------------------------------------
/apex/apex/optimizers/__init__.py:
--------------------------------------------------------------------------------
1 | from .fused_adam import FusedAdam
2 | from .fp16_optimizer import FP16_Optimizer
3 | 


--------------------------------------------------------------------------------
/apex/apex/parallel/README.md:
--------------------------------------------------------------------------------
 1 | ## Distributed Data Parallel
 2 | 
 3 | distributed.py contains the source code for `apex.parallel.DistributedDataParallel`, a module wrapper that enables multi-process multi-GPU data parallel training optimized for NVIDIA's NCCL communication library.
 4 | 
 5 | `apex.parallel.DistributedDataParallel` achieves high performance by overlapping communication with
 6 | computation in the backward pass and bucketing smaller transfers to reduce the total number of
 7 | transfers required.
 8 | 
 9 | multiproc.py contains the source code for `apex.parallel.multiproc`, a launch utility that places one process on each of the node's available GPUs.
10 | 
11 | #### [API Documentation](https://nvidia.github.io/apex/parallel.html)
12 | 
13 | #### [Example/Walkthrough](https://github.com/NVIDIA/apex/tree/master/examples/distributed)
14 | 
15 | #### [Imagenet example with Mixed Precision](https://github.com/NVIDIA/apex/tree/master/examples/imagenet)
16 | 
17 | #### [Simple example with FP16_Optimizer](https://github.com/NVIDIA/apex/tree/master/examples/FP16_Optimizer_simple/distributed_apex)
18 | 
19 | ### Synchronized Batch Normalization
20 | 
21 | `apex.parallel.SyncBatchNorm` has similar APIs as with `torch.nn.BatchNorm*N*d`.
22 | It reduces stats on the first (channel) dimension of the Tensor and accepts
23 | arbitrary spatial dimensions.
24 | 
25 | #### Installation
26 | 
27 | Apex provides two sync BN implementation:
28 | 
29 | 1. There is the Python-only implementation, which is the default implementation
30 | when install with `python setup.py install`.
31 | It uses PyTorch primitive operations and distributed communication package from
32 | `torch.distributed`.
33 | 
34 |    - _Python-only implementation requires input tensor to be of same data type as
35 | layer_
36 | 
37 | 2. We also provide implementation with kernels through CUDA/C++ extension with
38 | improved performance. We are experimenting with Welford and Kahan for reduction
39 | hoping to get better accuracy.
40 |    To use the kernel implementation, user need to install Apex with CUDA extension
41 | enabled `python setup.py install --cuda_ext`.
42 | 
43 |    - _Custom kernel implementation supports fp16 input with fp32 layer as cudnn.
44 | This is required to run imagenet example in fp16._
45 | 
46 |    - _Currently kernel implementation only supports GPU._
47 | 
48 | #### HowTo
49 | 
50 | 1. User could use `apex.parallel.SyncBatchNorm` by building their module with
51 | the layer explicitly.
52 | 
53 | ```
54 | import apex
55 | input_t = torch.randn(3, 5, 20).cuda()
56 | sbn = apex.parallel.SyncBatchNorm(5).cuda()
57 | output_t = sbn(input)
58 | ```
59 | 
60 | 2. User could also take a constructed `torch.nn.Model` and replace all its `torch.nn.BatchNorm*N*d` modules with `apex.parallel.SyncBatchNorm` through utility function `apex.parallel.convert_syncbn_model`.
61 | 
62 | ```
63 | # model is an instance of torch.nn.Module
64 | import apex
65 | sync_bn_model = apex.parallel.convert_syncbn_model(model)
66 | ```
67 | 


--------------------------------------------------------------------------------
/apex/apex/parallel/multiproc.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | import sys
 3 | import subprocess
 4 | 
 5 | def docstring_hack():
 6 |     """
 7 |     Multiproc file which will launch a set of processes locally for multi-gpu
 8 |     usage: python -m apex.parallel.multiproc main.py ...
 9 |     """
10 |     pass
11 | 
12 | argslist = list(sys.argv)[1:]
13 | world_size = torch.cuda.device_count()
14 | 
15 | if '--world-size' in argslist:
16 |     world_size = int(argslist[argslist.index('--world-size')+1])
17 | else:
18 |     argslist.append('--world-size')
19 |     argslist.append(str(world_size))
20 | 
21 | workers = []
22 | 
23 | for i in range(world_size):
24 |     if '--rank' in argslist:
25 |         argslist[argslist.index('--rank')+1] = str(i)
26 |     else:
27 |         argslist.append('--rank')
28 |         argslist.append(str(i))
29 |     stdout = None if i == 0 else open("GPU_"+str(i)+".log", "w")
30 |     print(argslist)
31 |     p = subprocess.Popen([str(sys.executable)]+argslist, stdout=stdout)
32 |     workers.append(p)
33 | 
34 | for p in workers:
35 |     p.wait()
36 | 


--------------------------------------------------------------------------------
/apex/apex/reparameterization/README.md:
--------------------------------------------------------------------------------
1 | Under construction...
2 | 


--------------------------------------------------------------------------------
/apex/csrc/amp_C_frontend.cpp:
--------------------------------------------------------------------------------
 1 | #include <torch/extension.h>
 2 | 
 3 | void multi_tensor_scale_cuda(
 4 |   int chunk_size,
 5 |   at::Tensor noop_flag,
 6 |   std::vector<std::vector<at::Tensor>> tensor_lists,
 7 |   float scale);
 8 | 
 9 | void multi_tensor_axpby_cuda(
10 |   int chunk_size,
11 |   at::Tensor noop_flag,
12 |   std::vector<std::vector<at::Tensor>> tensor_lists,
13 |   float a,
14 |   float b,
15 |   int arg_to_check);
16 | 
17 | at::Tensor multi_tensor_l2norm_cuda(
18 |   int chunk_size,
19 |   at::Tensor noop_flag,
20 |   std::vector<std::vector<at::Tensor>> tensor_lists);
21 | 
22 | PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
23 |   m.def("multi_tensor_scale", &multi_tensor_scale_cuda,
24 |         "Fused overflow check + scale for a list of contiguous tensors");
25 |   m.def("multi_tensor_axpby", &multi_tensor_axpby_cuda,
26 |         "out = a*x + b*y for a list of contiguous tensors");
27 |   m.def("multi_tensor_l2norm", &multi_tensor_l2norm_cuda,
28 |         "Computes L2 norm for a list of contiguous tensors");
29 | }
30 | 


--------------------------------------------------------------------------------
/apex/csrc/flatten_unflatten.cpp:
--------------------------------------------------------------------------------
 1 | #include <torch/extension.h>
 2 | #include <torch/csrc/utils/tensor_flatten.h>
 3 | // https://github.com/pytorch/pytorch/blob/master/torch/csrc/utils/tensor_flatten.h
 4 | 
 5 | at::Tensor flatten(std::vector<at::Tensor> tensors)
 6 | {
 7 |   return torch::utils::flatten_dense_tensors(tensors);
 8 | }
 9 | 
10 | std::vector<at::Tensor> unflatten(at::Tensor flat, std::vector<at::Tensor> tensors)
11 | {
12 |   return torch::utils::unflatten_dense_tensors(flat, tensors);
13 | }
14 | 
15 | PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
16 |   m.def("flatten", &flatten, "Flatten dense tensors");
17 |   m.def("unflatten", &unflatten, "Unflatten dense tensors");
18 | }
19 | 


--------------------------------------------------------------------------------
/apex/csrc/fused_adam_cuda.cpp:
--------------------------------------------------------------------------------
 1 | #include <torch/extension.h>
 2 | 
 3 | // CUDA forward declaration
 4 | void fused_adam_cuda(at::Tensor & p, at::Tensor & p_copy, at::Tensor & m, at::Tensor & v, at::Tensor & g, float lr, float beta1, float beta2, float eps, float grad_scale, int step, int mode, int bias_correction, float decay);
 5 | 
 6 | #define CHECK_CUDA(x) AT_ASSERTM(x.type().is_cuda(), #x " must be a CUDA tensor")
 7 | #define CHECK_CONTIGUOUS(x) AT_ASSERTM(x.is_contiguous(), #x " must be contiguous")
 8 | #define CHECK_INPUT(x) CHECK_CUDA(x); CHECK_CONTIGUOUS(x)
 9 | 
10 | // C++ interface
11 | void adam(at::Tensor & p, at::Tensor & p_copy, at::Tensor & m, at::Tensor & v, at::Tensor & g, float lr, float beta1, float beta2, float eps, float grad_scale, int step, int mode, int bias_correction, float decay) {
12 |         CHECK_INPUT(p)
13 |         if (p_copy.numel() > 0) CHECK_INPUT(p_copy);
14 |         CHECK_INPUT(m);
15 |         CHECK_INPUT(v);
16 |         CHECK_INPUT(g);
17 |         int64_t num_elem = p.numel();
18 |         AT_ASSERTM(m.numel() == num_elem, "number of elements in m and p tensors should be equal");
19 |         AT_ASSERTM(v.numel() == num_elem, "number of elements in v and p tensors should be equal");
20 |         AT_ASSERTM(g.numel() == num_elem, "number of elements in g and p tensors should be equal");
21 |         AT_ASSERTM(p_copy.numel() == num_elem || p_copy.numel() == 0, "number of elements in p_copy and p tensors should be equal, or p_copy should be empty");
22 | 
23 |         fused_adam_cuda(p, p_copy, m, v, g, lr, beta1, beta2, eps, grad_scale, step, mode, bias_correction, decay);
24 | }
25 | 
26 | PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
27 |         m.def("adam", &adam, "Adam optimized CUDA implementation.");
28 | }
29 | 


--------------------------------------------------------------------------------
/apex/csrc/multi_tensor_l2norm_kernel.cu:
--------------------------------------------------------------------------------
  1 | #include <ATen/ATen.h>
  2 | #include <ATen/AccumulateType.h>
  3 | #include <ATen/cuda/CUDAContext.h>
  4 | #include <ATen/cuda/Exceptions.h>
  5 | // Another possibility:
  6 | // #include <torch/all.h>
  7 | 
  8 | #include <assert.h>
  9 | 
 10 | #include "type_shim.h"
 11 | #include "multi_tensor_apply.cuh"
 12 | 
 13 | #define BLOCK_SIZE 512
 14 | #define ILP 4
 15 | 
 16 | template<typename x_t>
 17 | struct L2NormFunctor
 18 | {
 19 |    __device__ __forceinline__ void operator()(
 20 |     int chunk_size,
 21 |     volatile int* noop_gmem,
 22 |     TensorListMetadata<1>& tl,
 23 |     float* output)
 24 |   {
 25 |     // I'd like this kernel to propagate infs/nans.
 26 |     // if(*noop_gmem == 1)
 27 |     //   return;
 28 | 
 29 |     int tensor_loc = tl.block_to_tensor[blockIdx.x];
 30 |     int chunk_idx = tl.block_to_chunk[blockIdx.x];
 31 |     int n = tl.sizes[tensor_loc];
 32 | 
 33 |     x_t* x = (x_t*)tl.addresses[0][tensor_loc];
 34 |     x += chunk_idx*chunk_size;
 35 | 
 36 |     n -= chunk_idx*chunk_size;
 37 | 
 38 |     __shared__ float vals[512];
 39 | 
 40 |     // Non-divergent exit condition for __syncthreads, not necessary here
 41 |     float val = 0;
 42 |     for(int i = threadIdx.x; i < n && i < chunk_size; i += blockDim.x)
 43 |     {
 44 |       float next = static_cast<float>(x[i]);
 45 |       val += next*next;
 46 |     }
 47 | 
 48 |     float final = reduce_block_into_lanes(vals, val);
 49 | 
 50 |     if(threadIdx.x == 0)
 51 |     {
 52 |       if(!isfinite(final))
 53 |         *noop_gmem = 1; // Blindly fire off a write.  These will race but that's ok.
 54 |       output[blockIdx.x] += final;
 55 |     }
 56 |   }
 57 | };
 58 | 
 59 | __global__ void cleanup(float* x, float* ret)
 60 | {
 61 |   __shared__ float vals[512];
 62 | 
 63 |   float val = 0;
 64 |   if(threadIdx.x < 320)
 65 |     val = x[threadIdx.x];
 66 | 
 67 |   float final = reduce_block_into_lanes(vals, val);
 68 | 
 69 |   if(threadIdx.x == 0)
 70 |     *ret = sqrt(final);
 71 | }
 72 | 
 73 | at::Tensor multi_tensor_l2norm_cuda(
 74 |   int chunk_size,
 75 |   at::Tensor noop_flag,
 76 |   std::vector<std::vector<at::Tensor>> tensor_lists)
 77 | {
 78 |   auto output = at::zeros({320}, tensor_lists[0][0].options().dtype(at::kFloat));
 79 | 
 80 |   DISPATCH_FLOAT_AND_HALF(tensor_lists[0][0].scalar_type(), 0, "multi_tensor_l2norm_cuda",
 81 |     multi_tensor_apply<1>(
 82 |       BLOCK_SIZE,
 83 |       chunk_size,
 84 |       noop_flag,
 85 |       tensor_lists,
 86 |       L2NormFunctor<scalar_t_0>(),
 87 |       output.data<float>());)
 88 | 
 89 |   AT_CUDA_CHECK(cudaGetLastError());
 90 | 
 91 |   // AT_CUDA_CHECK(cudaDeviceSynchronize());
 92 | 
 93 |   // This involves one more small kernel launches, but will be negligible end to end.
 94 |   // I could get rid of these by hacking the functor + multi tensor harness with persistence
 95 |   // logic, but keeping it simple for now
 96 |   auto ret = at::empty({1}, output.options());
 97 |   auto stream = at::cuda::getCurrentCUDAStream();
 98 |   cleanup<<<1, 512, 0, stream>>>(output.data<float>(), ret.data<float>());
 99 |   return ret;
100 | }
101 | 


--------------------------------------------------------------------------------
/apex/docs/Makefile:
--------------------------------------------------------------------------------
 1 | # Minimal makefile for Sphinx documentation
 2 | #
 3 | 
 4 | # You can set these variables from the command line.
 5 | SPHINXOPTS    =
 6 | SPHINXBUILD   = sphinx-build
 7 | SPHINXPROJ    = NVIDIAAPEX
 8 | SOURCEDIR     = source
 9 | BUILDDIR      = build
10 | 
11 | # Put it first so that "make" without argument is like "make help".
12 | help:
13 | 	@$(SPHINXBUILD) -M help "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O)
14 | 
15 | gh-pages:
16 | 	git checkout gh-pages
17 | 	rm -rf build
18 | 	rm -rf source
19 | 	git checkout master -- .
20 | 	make html
21 | 	rm -rf ../_modules ../_sources ../_static
22 | 	mv -fv build/html/* ../
23 | 	rm -rf build
24 | 	git add -A
25 | 	git commit -m "Generated gh-pages for `git log master -1 --pretty=short --abbrev-commit`" && git push origin gh-pages ; git checkout master
26 | 
27 | .PHONY: help Makefile
28 | 
29 | # Catch-all target: route all unknown targets to Sphinx using the new
30 | # "make mode" option.  $(O) is meant as a shortcut for $(SPHINXOPTS).
31 | %: Makefile
32 | 	@$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O)
33 | 


--------------------------------------------------------------------------------
/apex/docs/source/_static/css/pytorch_theme.css:
--------------------------------------------------------------------------------
  1 | body {
  2 |     font-family: "Lato","proxima-nova","Helvetica Neue",Arial,sans-serif;
  3 | }
  4 | 
  5 | /* Default header fonts are ugly */
  6 | h1, h2, .rst-content .toctree-wrapper p.caption, h3, h4, h5, h6, legend, p.caption {
  7 |     font-family: "Lato","proxima-nova","Helvetica Neue",Arial,sans-serif;
  8 | }
  9 | 
 10 | /* Use white for docs background */
 11 | .wy-side-nav-search {
 12 |     background-color: #fff;
 13 | }
 14 | 
 15 | .wy-nav-content-wrap, .wy-menu li.current > a  {
 16 |     background-color: #fff;
 17 | }
 18 | 
 19 | @media screen and (min-width: 1400px) {
 20 |     .wy-nav-content-wrap {
 21 |         background-color: rgba(0, 0, 0, 0.0470588);
 22 |     }
 23 | 
 24 |     .wy-nav-content {
 25 |         background-color: #fff;
 26 |     }
 27 | }
 28 | 
 29 | /* Fixes for mobile */
 30 | .wy-nav-top {
 31 |     background-color: #fff;
 32 |     background-image: url('../img/apex.jpg');
 33 |     background-repeat: no-repeat;
 34 |     background-position: center;
 35 |     padding: 0;
 36 |     margin: 0.4045em 0.809em;
 37 |     color: #333;
 38 | }
 39 | 
 40 | .wy-nav-top > a {
 41 |     display: none;
 42 | }
 43 | 
 44 | @media screen and (max-width: 768px) {
 45 |     .wy-side-nav-search>a img.logo {
 46 |         height: 60px;
 47 |     }
 48 | }
 49 | 
 50 | /* This is needed to ensure that logo above search scales properly */
 51 | .wy-side-nav-search a {
 52 |     display: block;
 53 | }
 54 | 
 55 | /* This ensures that multiple constructors will remain in separate lines. */
 56 | .rst-content dl:not(.docutils) dt {
 57 |     display: table;
 58 | }
 59 | 
 60 | /* Use our red for literals (it's very similar to the original color) */
 61 | .rst-content tt.literal, .rst-content tt.literal, .rst-content code.literal {
 62 |     color: #F05732;
 63 | }
 64 | 
 65 | .rst-content tt.xref, a .rst-content tt, .rst-content tt.xref,
 66 | .rst-content code.xref, a .rst-content tt, a .rst-content code {
 67 |     color: #404040;
 68 | }
 69 | 
 70 | /* Change link colors (except for the menu) */
 71 | 
 72 | a {
 73 |     color: #F05732;
 74 | }
 75 | 
 76 | a:hover {
 77 |     color: #F05732;
 78 | }
 79 | 
 80 | 
 81 | a:visited {
 82 |     color: #D44D2C;
 83 | }
 84 | 
 85 | .wy-menu a {
 86 |     color: #b3b3b3;
 87 | }
 88 | 
 89 | .wy-menu a:hover {
 90 |     color: #b3b3b3;
 91 | }
 92 | 
 93 | /* Default footer text is quite big */
 94 | footer {
 95 |     font-size: 80%;
 96 | }
 97 | 
 98 | footer .rst-footer-buttons {
 99 |     font-size: 125%; /* revert footer settings - 1/80% = 125% */
100 | }
101 | 
102 | footer p {
103 |     font-size: 100%;
104 | }
105 | 
106 | /* For hidden headers that appear in TOC tree */
107 | /* see http://stackoverflow.com/a/32363545/3343043 */
108 | .rst-content .hidden-section {
109 |     display: none;
110 | }
111 | 
112 | nav .hidden-section {
113 |     display: inherit;
114 | }
115 | 
116 | .wy-side-nav-search>div.version {
117 |     color: #000;
118 | }
119 | 


--------------------------------------------------------------------------------
/apex/docs/source/_static/img/nv-pytorch2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/docs/source/_static/img/nv-pytorch2.png


--------------------------------------------------------------------------------
/apex/docs/source/_templates/layout.html:
--------------------------------------------------------------------------------
 1 | {% extends "!layout.html" %}
 2 |   {% block sidebartitle %} {{ super() }}
 3 | 
 4 |   <style>
 5 |     /* Sidebar header (and topbar for mobile) */
 6 |     .wy-side-nav-search, .wy-nav-top {
 7 |       background: #76b900;
 8 |     }
 9 | 
10 |     .wy-side-nav-search a:link, .wy-nav-top a:link {
11 |       color: #fff;
12 |     }
13 |     .wy-side-nav-search a:visited, .wy-nav-top a:visited {
14 |       color: #fff;
15 |     }
16 |     .wy-side-nav-search a:hover, .wy-nav-top a:hover {
17 |       color: #fff;
18 |     }
19 | 
20 |     .wy-menu-vertical a:link, .wy-menu-vertical a:visited {
21 |       color: #d9d9d9
22 |     }
23 | 
24 |     .wy-menu-vertical a:active {
25 |       background-color: #76b900
26 |     }
27 | 
28 |     .wy-side-nav-search>div.version {
29 |       color: rgba(0, 0, 0, 0.3)
30 |     }
31 |   </style>
32 |   {% endblock %}
33 | 
34 |   {% block footer %} {{ super() }}
35 | 
36 |   <style>
37 |   a:link, a:visited {
38 |     color: #76b900;
39 |   }
40 | 
41 |   a:hover {
42 |     color: #8c0;
43 |   }
44 | 
45 |   .rst-content dl:not(.docutils) dt {
46 |     background: rgba(118, 185, 0, 0.1);
47 |     color: rgba(59,93,0,1);
48 |     border-top: solid 3px rgba(59,93,0,1);
49 |   }
50 |   </style>
51 |   {% endblock %}
52 | 


--------------------------------------------------------------------------------
/apex/docs/source/fp16_utils.rst:
--------------------------------------------------------------------------------
 1 | .. role:: hidden
 2 |     :class: hidden-section
 3 | 
 4 | apex.fp16_utils
 5 | ===================================
 6 | 
 7 | This submodule contains utilities designed to streamline the mixed precision training recipe 
 8 | presented by NVIDIA `on Parallel Forall`_ and in GTC 2018 Sessions 
 9 | `Training Neural Networks with Mixed Precision: Theory and Practice`_ and 
10 | `Training Neural Networks with Mixed Precision: Real Examples`_.
11 | For Pytorch users, Real Examples in particular is recommended.
12 | 
13 | Full runnable Python scripts demonstrating ``apex.fp16_utils`` 
14 | can be found on the Github page:
15 | 
16 | | `Simple FP16_Optimizer demos`_
17 | |
18 | | `Distributed Mixed Precision Training with imagenet`_
19 | |
20 | | `Mixed Precision Training with word_language_model`_
21 | |
22 | |
23 | 
24 | .. _`on Parallel Forall`:
25 |     https://devblogs.nvidia.com/mixed-precision-training-deep-neural-networks/
26 | .. _`Training Neural Networks with Mixed Precision: Theory and Practice`:
27 |     http://on-demand.gputechconf.com/gtc/2018/video/S8923/
28 | .. _`Training Neural Networks with Mixed Precision: Real Examples`:
29 |     http://on-demand.gputechconf.com/gtc/2018/video/S81012/
30 | .. _`Simple FP16_Optimizer demos`:
31 |     https://github.com/NVIDIA/apex/tree/master/examples/FP16_Optimizer_simple
32 | .. _`Distributed Mixed Precision Training with imagenet`:
33 |     https://github.com/NVIDIA/apex/tree/master/examples/imagenet
34 | .. _`Mixed Precision Training with word_language_model`:
35 |     https://github.com/NVIDIA/apex/tree/master/examples/word_language_model
36 | 
37 | .. automodule:: apex.fp16_utils
38 | .. currentmodule:: apex.fp16_utils
39 | 
40 | Automatic management of master params + loss scaling
41 | ----------------------------------------------------
42 | 
43 | .. autoclass:: FP16_Optimizer
44 |     :members:
45 | 
46 | .. autoclass:: LossScaler
47 |     :members:
48 | 
49 | .. autoclass:: DynamicLossScaler
50 |     :members:
51 | 
52 | Manual master parameter management
53 | ----------------------------------
54 | 
55 | .. autofunction:: prep_param_lists
56 | 
57 | .. autofunction:: master_params_to_model_params
58 | 
59 | .. autofunction:: model_grads_to_master_grads
60 | 


--------------------------------------------------------------------------------
/apex/docs/source/index.rst:
--------------------------------------------------------------------------------
 1 | .. PyTorch documentation master file, created by
 2 |    sphinx-quickstart on Fri Dec 23 13:31:47 2016.
 3 |    You can adapt this file completely to your liking, but it should at least
 4 |    contain the root `toctree` directive.
 5 | 
 6 | :github_url: https://github.com/nvidia/apex
 7 | 
 8 | Apex (A PyTorch Extension)
 9 | ===================================
10 | 
11 | This site contains the API documentation for Apex (https://github.com/nvidia/apex),
12 | a Pytorch extension with NVIDIA-maintained utilities to streamline mixed precision and distributed training.  Some of the code here will be included in upstream Pytorch eventually. The intention of Apex is to make up-to-date utilities available to users as quickly as possible.
13 | 
14 | Installation instructions can be found here:  https://github.com/NVIDIA/apex#quick-start.
15 | 
16 | .. toctree::
17 |    :maxdepth: 1
18 |    :caption: AMP:  Automatic Mixed Precision
19 | 
20 |    amp
21 | 
22 | .. toctree::
23 |    :maxdepth: 1
24 |    :caption: Distributed Training
25 | 
26 |    parallel
27 | 
28 | .. toctree::
29 |    :maxdepth: 1
30 |    :caption: Fused Optimizers
31 | 
32 |    optimizers
33 | 
34 | .. toctree::
35 |    :maxdepth: 1
36 |    :caption: Fused Layer Norm
37 | 
38 |    layernorm
39 | 
40 | ..   .. toctree::
41 |      :maxdepth: 1
42 |      :caption: Deprecated mixed precision API
43 |      fp16_util
44 | 
45 | ..   reparameterization
46 | ..   RNN
47 |    
48 | Indices and tables
49 | ==================
50 | 
51 | * :ref:`genindex`
52 | * :ref:`modindex`
53 | 


--------------------------------------------------------------------------------
/apex/docs/source/layernorm.rst:
--------------------------------------------------------------------------------
 1 | .. role:: hidden
 2 |     :class: hidden-section
 3 | 
 4 | apex.normalization.fused_layer_norm
 5 | ===================================
 6 | 
 7 | .. automodule:: apex.normalization
 8 | .. currentmodule:: apex.normalization
 9 | 
10 | .. FusedAdam
11 |    ----------
12 | 
13 | .. autoclass:: FusedLayerNorm
14 |     :members:
15 | 


--------------------------------------------------------------------------------
/apex/docs/source/optimizers.rst:
--------------------------------------------------------------------------------
 1 | .. role:: hidden
 2 |     :class: hidden-section
 3 | 
 4 | apex.optimizers
 5 | ===================================
 6 | 
 7 | .. automodule:: apex.optimizers
 8 | .. currentmodule:: apex.optimizers
 9 | 
10 | .. FusedAdam
11 |    ----------
12 | 
13 | .. autoclass:: FusedAdam
14 |     :members:
15 | 


--------------------------------------------------------------------------------
/apex/docs/source/parallel.rst:
--------------------------------------------------------------------------------
 1 | .. role:: hidden
 2 |     :class: hidden-section
 3 | 
 4 | apex.parallel
 5 | ===================================
 6 | 
 7 | .. automodule:: apex.parallel
 8 | .. currentmodule:: apex.parallel
 9 | 
10 | .. DistributedDataParallel
11 |    ----------
12 | 
13 | .. autoclass:: DistributedDataParallel
14 |     :members:
15 | 
16 | .. autoclass:: Reducer
17 |     :members:
18 | 
19 | .. autoclass:: SyncBatchNorm
20 |     :members:
21 | 
22 | Utility functions
23 | ----------------------------------
24 | 
25 | .. autofunction:: convert_syncbn_model
26 | 


--------------------------------------------------------------------------------
/apex/examples/README.md:
--------------------------------------------------------------------------------
1 | This directory contains examples illustrating Apex mixed precision and distributed tools.
2 | 
3 | **Note for users of the pre-unification API**:
4 | `deprecated_api` contains examples illustrating the old (pre-unified) APIs.  These APIs will be removed soon, and users are strongly encouraged to switch.  The separate mixed precision tools called `Amp` and `FP16_Optimizer` in the old API are exposed via different flags/optimization levels in the new API.
5 | 


--------------------------------------------------------------------------------
/apex/examples/dcgan/README.md:
--------------------------------------------------------------------------------
1 | Under construction...
2 | 


--------------------------------------------------------------------------------
/apex/examples/docker/Dockerfile:
--------------------------------------------------------------------------------
 1 | # Base image must at least have pytorch and CUDA installed.
 2 | ARG BASE_IMAGE=nvcr.io/nvidia/pytorch:19.03-py3
 3 | FROM $BASE_IMAGE
 4 | ARG BASE_IMAGE
 5 | RUN echo "Installing Apex on top of ${BASE_IMAGE}"
 6 | # make sure we don't overwrite some existing directory called "apex"
 7 | WORKDIR /tmp/unique_for_apex
 8 | # uninstall Apex if present, twice to make absolutely sure :)
 9 | RUN pip uninstall -y apex || :
10 | RUN pip uninstall -y apex || :
11 | # SHA is something the user can touch to force recreation of this Docker layer,
12 | # and therefore force cloning of the latest version of Apex
13 | RUN SHA=ToUcHMe git clone https://github.com/NVIDIA/apex.git
14 | WORKDIR /tmp/unique_for_apex/apex
15 | RUN pip install -v --no-cache-dir --global-option="--cpp_ext" --global-option="--cuda_ext" .
16 | WORKDIR /workspace
17 | 


--------------------------------------------------------------------------------
/apex/examples/docker/README.md:
--------------------------------------------------------------------------------
 1 | ## Option 1:  Create a new container with Apex
 2 | 
 3 | **Dockerfile** installs the latest Apex on top of an existing image.  Run
 4 | ```
 5 | docker build -t new_image_with_apex .
 6 | ```
 7 | By default, **Dockerfile** uses NVIDIA's Pytorch container as the base image,
 8 | which requires an NVIDIA GPU Cloud (NGC) account.  If you don't have an NGC account, you can sign up for free by following the instructions [here](https://docs.nvidia.com/ngc/ngc-getting-started-guide/index.html#generating-api-key).
 9 | 
10 | Alternatively, you can supply your own base image via the `BASE_IMAGE` build-arg.
11 | `BASE_IMAGE` must have Pytorch and Cuda installed.  For example, any
12 | `-devel` image for Pytorch 1.0 and later from the
13 | [official Pytorch Dockerhub](https://hub.docker.com/r/pytorch/pytorch) may be used:
14 | ```
15 | docker build --build-arg BASE_IMAGE=pytorch/pytorch:nightly-devel-cuda10.0-cudnn7 -t new_image_with_apex .
16 | ```
17 | 
18 | If you want to rebuild your image, and force the latest Apex to be cloned and installed, make any small change to the `SHA` variable in **Dockerfile**.
19 | 
20 | **Warning:**
21 | Currently, the non-`-devel` images on Pytorch Dockerhub do not contain the Cuda compiler `nvcc`.  Therefore,
22 | images whose name does not contain `-devel` are not eligible candidates for `BASE_IMAGE`.
23 | 
24 | ### Running your Apex container
25 | 
26 | Like any Cuda-enabled Pytorch container, a container with Apex should be run via [nvidia-docker](https://github.com/NVIDIA/nvidia-docker), for example:
27 | ```
28 | docker run --runtime=nvidia -it --rm --ipc=host new_image_with_apex
29 | ```
30 | 
31 | ## Option 2:  Install Apex in a running container
32 | 
33 | Instead of building a new container, it is also a viable option to `git clone https://github.com/NVIDIA/apex.git` on bare metal, mount the Apex repo into your container at launch by running, for example,
34 | ```
35 | docker run --runtime=nvidia -it --rm --ipc=host -v /bare/metal/apex:/apex/in/container <base image>
36 | ```
37 | then go to /apex/in/container within the running container and
38 | ```
39 | pip install -v --no-cache-dir --global-option="--cpp_ext" --global-option="--cuda_ext" .
40 | ```
41 | 


--------------------------------------------------------------------------------
/apex/examples/simple/distributed/README.md:
--------------------------------------------------------------------------------
 1 | **distributed_data_parallel.py** and **run.sh** show an example using Amp with
 2 | [apex.parallel.DistributedDataParallel](https://nvidia.github.io/apex/parallel.html) or
 3 | [torch.nn.parallel.DistributedDataParallel](https://pytorch.org/docs/stable/nn.html#distributeddataparallel)
 4 | and the Pytorch multiprocess launcher script,
 5 | [torch.distributed.launch](https://pytorch.org/docs/master/distributed.html#launch-utility).
 6 | The use of `Amp` with DistributedDataParallel does not need to change from ordinary 
 7 | single-process use.  The only gotcha is that wrapping your model with `DistributedDataParallel` must
 8 | come after the call to `amp.initialize`.  Test via
 9 | ```bash
10 | bash run.sh
11 | ```
12 | 
13 | **This is intended purely as an instructional example, not a performance showcase.**
14 | 


--------------------------------------------------------------------------------
/apex/examples/simple/distributed/distributed_data_parallel.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | import argparse
 3 | import os
 4 | from apex import amp
 5 | # FOR DISTRIBUTED: (can also use torch.nn.parallel.DistributedDataParallel instead)
 6 | from apex.parallel import DistributedDataParallel
 7 | 
 8 | parser = argparse.ArgumentParser()
 9 | # FOR DISTRIBUTED:  Parse for the local_rank argument, which will be supplied
10 | # automatically by torch.distributed.launch.
11 | parser.add_argument("--local_rank", default=0, type=int)
12 | args = parser.parse_args()
13 | 
14 | # FOR DISTRIBUTED:  If we are running under torch.distributed.launch,
15 | # the 'WORLD_SIZE' environment variable will also be set automatically.
16 | args.distributed = False
17 | if 'WORLD_SIZE' in os.environ:
18 |     args.distributed = int(os.environ['WORLD_SIZE']) > 1
19 | 
20 | if args.distributed:
21 |     # FOR DISTRIBUTED:  Set the device according to local_rank.
22 |     torch.cuda.set_device(args.local_rank)
23 | 
24 |     # FOR DISTRIBUTED:  Initialize the backend.  torch.distributed.launch will provide
25 |     # environment variables, and requires that you use init_method=`env://`.
26 |     torch.distributed.init_process_group(backend='nccl',
27 |                                          init_method='env://')
28 | 
29 | torch.backends.cudnn.benchmark = True
30 | 
31 | N, D_in, D_out = 64, 1024, 16
32 | 
33 | # Each process receives its own batch of "fake input data" and "fake target data."
34 | # The "training loop" in each process just uses this fake batch over and over.
35 | # https://github.com/NVIDIA/apex/tree/master/examples/imagenet provides a more realistic
36 | # example of distributed data sampling for both training and validation.
37 | x = torch.randn(N, D_in, device='cuda')
38 | y = torch.randn(N, D_out, device='cuda')
39 | 
40 | model = torch.nn.Linear(D_in, D_out).cuda()
41 | optimizer = torch.optim.SGD(model.parameters(), lr=1e-3)
42 | 
43 | model, optimizer = amp.initialize(model, optimizer, opt_level="O1")
44 | 
45 | if args.distributed:
46 |     # FOR DISTRIBUTED:  After amp.initialize, wrap the model with
47 |     # apex.parallel.DistributedDataParallel.
48 |     model = DistributedDataParallel(model)
49 |     # torch.nn.parallel.DistributedDataParallel is also fine, with some added args:
50 |     # model = torch.nn.parallel.DistributedDataParallel(model,
51 |     #                                                   device_ids=[args.local_rank],
52 |     #                                                   output_device=args.local_rank)
53 | 
54 | loss_fn = torch.nn.MSELoss()
55 | 
56 | for t in range(500):
57 |     optimizer.zero_grad()
58 |     y_pred = model(x)
59 |     loss = loss_fn(y_pred, y)
60 |     with amp.scale_loss(loss, optimizer) as scaled_loss:
61 |         scaled_loss.backward()
62 |     optimizer.step()
63 | 
64 | if args.local_rank == 0:
65 |     print("final loss = ", loss)
66 | 


--------------------------------------------------------------------------------
/apex/examples/simple/distributed/run.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | python -m torch.distributed.launch --nproc_per_node=2 distributed_data_parallel.py
3 | 


--------------------------------------------------------------------------------
/apex/tests/L0/run_amp/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/tests/L0/run_amp/__init__.py


--------------------------------------------------------------------------------
/apex/tests/L0/run_amp/test_multi_tensor_l2norm.py:
--------------------------------------------------------------------------------
 1 | import unittest
 2 | 
 3 | import functools as ft
 4 | import itertools as it
 5 | 
 6 | from apex import amp
 7 | import torch
 8 | from torch import nn
 9 | import torch.nn.functional as F
10 | 
11 | from utils import common_init, HALF, FLOAT,\
12 |     ALWAYS_HALF, ALWAYS_FLOAT, MATCH_INPUT
13 | 
14 | try:
15 |   import amp_C
16 |   from amp_C import multi_tensor_l2norm
17 |   from apex.multi_tensor_apply import MultiTensorApply
18 |   disabled = False
19 | except ImportError as err:
20 |   print("amp_C fused kernels unavailable, disabling TestMultiTensorApply.  ImportError was ", err)
21 |   disabled = True
22 | 
23 | 
24 | class TestMultiTensorL2Norm(unittest.TestCase):
25 | 
26 |     def setUp(self):
27 |         common_init(self)
28 |         self.val = 4.0
29 |         self.overflow_buf = torch.cuda.IntTensor(1).zero_()
30 | 
31 |     def tearDown(self):
32 |         pass
33 | 
34 |     # The tensor creation here is written for convenience, not speed.
35 |     def l2norm(self, sizea, sizeb, applier, repeat_tensors, in_type):
36 |         self.overflow_buf.zero_()
37 |         a = torch.cuda.FloatTensor(sizea).fill_(self.val)
38 |         b = torch.cuda.FloatTensor(sizeb).fill_(self.val)
39 | 
40 |         in_list = []
41 |         for i in range(repeat_tensors):
42 |             in_list += [a.clone().to(in_type), b.clone().to(in_type)]
43 | 
44 | 
45 |         norm = applier(multi_tensor_l2norm, self.overflow_buf, [in_list])
46 | 
47 |         reference = torch.cuda.FloatTensor((sizea + sizeb)*repeat_tensors).fill_(self.val).norm()
48 | 
49 |         self.assertTrue(torch.allclose(norm, reference))
50 |         self.assertTrue(self.overflow_buf.item() == 0)
51 | 
52 |     @unittest.skipIf(disabled, "amp_C is unavailable")
53 |     def test_fuzz(self):
54 |         input_size_pairs = (
55 |             (7777*77, 555*555),
56 |             (777, 555),
57 |             (555, 2048*32+1),
58 |             (2048*32+1, 555),
59 |             (555, 2048*32),
60 |             (2048*32, 555),
61 |             (33333, 555),
62 |             (555, 33333))
63 |         appliers = (
64 |             MultiTensorApply(2048*32), 
65 |             MultiTensorApply(333),
66 |             MultiTensorApply(33333))
67 |         repeat_tensors = (
68 |             1,
69 |             55)
70 | 
71 |         for sizea, sizeb in input_size_pairs:
72 |           for applier in appliers:
73 |             for repeat in repeat_tensors:
74 |               for in_type in (torch.float32, torch.float16):
75 |                 self.l2norm(sizea, sizeb, applier, repeat, in_type, )
76 | 
77 | 
78 | 
79 | if __name__ == '__main__':
80 |     unittest.main()
81 | 


--------------------------------------------------------------------------------
/apex/tests/L0/run_amp/test_promotion.py:
--------------------------------------------------------------------------------
 1 | import unittest
 2 | 
 3 | import itertools as it
 4 | 
 5 | from apex import amp
 6 | import torch
 7 | from torch import nn
 8 | import torch.nn.functional as F
 9 | 
10 | from utils import common_init, HALF, FLOAT, DTYPES
11 | 
12 | class TestPromotion(unittest.TestCase):
13 |     def setUp(self):
14 |         self.handle = amp.init(enabled=True)
15 |         common_init(self)
16 | 
17 |     def tearDown(self):
18 |         self.handle._deactivate()
19 | 
20 |     def run_binary_promote_test(self, fns, input_shape, x_inplace=False):
21 |         type_pairs = it.product(DTYPES, DTYPES)
22 |         for fn, (xtype, ytype) in it.product(fns, type_pairs):
23 |             x = torch.randn(input_shape, dtype=xtype).requires_grad_()
24 |             x_leaf = x
25 |             if x_inplace:
26 |                 # We need a non-leaf to call in place on
27 |                 x = x.clone()
28 |             y = torch.randn(input_shape, dtype=ytype)
29 |             out = fn(x, y)
30 |             if x_inplace:
31 |                 # In place: always match xtype
32 |                 self.assertEqual(out.type(), x.type())
33 |             else:
34 |                 # Out of place: match widest type
35 |                 if xtype == torch.float or ytype == torch.float:
36 |                     self.assertEqual(out.type(), FLOAT)
37 |                 else:
38 |                     self.assertEqual(out.type(), HALF)
39 |             out.float().sum().backward()
40 |             self.assertEqual(x_leaf.grad.dtype, xtype)
41 | 
42 |     def test_atan2_matches_widest(self):
43 |         fns = [lambda x, y : torch.atan2(x, y),
44 |                lambda x, y : x.atan2(y)]
45 |         self.run_binary_promote_test(fns, (self.b,))
46 | 
47 |     def test_mul_matches_widest(self):
48 |         fns = [lambda x, y : torch.mul(x, y),
49 |                lambda x, y: x.mul(y)]
50 |         self.run_binary_promote_test(fns, (self.b,))
51 | 
52 |     def test_cat_matches_widest(self):
53 |         shape = self.b
54 |         ys = [torch.randn(shape, dtype=torch.half) for _ in range(5)]
55 |         x_float = torch.randn(shape)
56 |         out = torch.cat(ys + [x_float])
57 |         self.assertEqual(out.type(), FLOAT)
58 |         x_half = torch.randn(shape, dtype=torch.half)
59 |         out = torch.cat(ys + [x_half])
60 |         self.assertEqual(out.type(), HALF)
61 | 
62 |     def test_inplace_exp_is_error_for_half(self):
63 |         xs = torch.randn(self.b)
64 |         xs.exp_()
65 |         self.assertEqual(xs.type(), FLOAT)
66 |         xs = torch.randn(self.b, dtype=torch.half)
67 |         with self.assertRaises(NotImplementedError):
68 |             xs.exp_()
69 | 
70 |     def test_inplace_add_matches_self(self):
71 |         fn = lambda x, y: x.add_(y)
72 |         self.run_binary_promote_test([fn], (self.b,), x_inplace=True)
73 | 
74 | if __name__ == '__main__':
75 |     unittest.main()
76 | 


--------------------------------------------------------------------------------
/apex/tests/L0/run_amp/utils.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | 
 3 | HALF = 'torch.cuda.HalfTensor'
 4 | FLOAT = 'torch.cuda.FloatTensor'
 5 | 
 6 | DTYPES = [torch.half, torch.float]
 7 | 
 8 | ALWAYS_HALF = {torch.float: HALF,
 9 |                torch.half: HALF}
10 | ALWAYS_FLOAT = {torch.float: FLOAT,
11 |                 torch.half: FLOAT}
12 | MATCH_INPUT = {torch.float: FLOAT,
13 |                torch.half: HALF}
14 | 
15 | def common_init(test_case):
16 |     test_case.h = 64
17 |     test_case.b = 16
18 |     test_case.c = 16
19 |     test_case.k = 3
20 |     test_case.t = 10
21 |     torch.set_default_tensor_type(torch.cuda.FloatTensor)
22 | 


--------------------------------------------------------------------------------
/apex/tests/L0/run_fp16util/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/tests/L0/run_fp16util/__init__.py


--------------------------------------------------------------------------------
/apex/tests/L0/run_fp16util/test_fp16util.py:
--------------------------------------------------------------------------------
 1 | import unittest
 2 | 
 3 | import torch
 4 | import torch.nn as nn
 5 | 
 6 | from apex.fp16_utils import FP16Model
 7 | 
 8 | 
 9 | class DummyBlock(nn.Module):
10 |     def __init__(self):
11 |         super(DummyBlock, self).__init__()
12 | 
13 |         self.conv = nn.Conv2d(10, 10, 2)
14 |         self.bn = nn.BatchNorm2d(10, affine=True)
15 | 
16 |     def forward(self, x):
17 |         return self.conv(self.bn(x))
18 | 
19 | 
20 | class DummyNet(nn.Module):
21 |     def __init__(self):
22 |         super(DummyNet, self).__init__()
23 | 
24 |         self.conv1 = nn.Conv2d(3, 10, 2)
25 |         self.bn1 = nn.BatchNorm2d(10, affine=False)
26 |         self.db1 = DummyBlock()
27 |         self.db2 = DummyBlock()
28 | 
29 |     def forward(self, x):
30 |         out = x
31 |         out = self.conv1(out)
32 |         out = self.bn1(out)
33 |         out = self.db1(out)
34 |         out = self.db2(out)
35 |         return out
36 | 
37 | 
38 | class DummyNetWrapper(nn.Module):
39 |     def __init__(self):
40 |         super(DummyNetWrapper, self).__init__()
41 | 
42 |         self.bn = nn.BatchNorm2d(3, affine=True)
43 |         self.dn = DummyNet()
44 | 
45 |     def forward(self, x):
46 |         return self.dn(self.bn(x))
47 | 
48 | 
49 | class TestFP16Model(unittest.TestCase):
50 |     def setUp(self):
51 |         self.N = 64
52 |         self.C_in = 3
53 |         self.H_in = 16
54 |         self.W_in = 32
55 |         self.in_tensor = torch.randn((self.N, self.C_in, self.H_in, self.W_in)).cuda()
56 |         self.orig_model = DummyNetWrapper().cuda()
57 |         self.fp16_model = FP16Model(self.orig_model)
58 | 
59 |     def test_params_and_buffers(self):
60 |         exempted_modules = [
61 |             self.fp16_model.network.bn,
62 |             self.fp16_model.network.dn.db1.bn,
63 |             self.fp16_model.network.dn.db2.bn,
64 |         ]
65 |         for m in self.fp16_model.modules():
66 |             expected_dtype = torch.float if (m in exempted_modules) else torch.half
67 |             for p in m.parameters(recurse=False):
68 |                 assert p.dtype == expected_dtype
69 |             for b in m.buffers(recurse=False):
70 |                 assert b.dtype in (expected_dtype, torch.int64)
71 | 
72 |     def test_output_is_half(self):
73 |         out_tensor = self.fp16_model(self.in_tensor)
74 |         assert out_tensor.dtype == torch.half
75 | 
76 | 


--------------------------------------------------------------------------------
/apex/tests/L0/run_fused_layer_norm/test_fused_layer_norm.py:
--------------------------------------------------------------------------------
 1 | import unittest
 2 | import os
 3 | import random
 4 | 
 5 | import torch
 6 | import apex
 7 | 
 8 |         
 9 | class TestFusedLayerNorm(unittest.TestCase):
10 |     def setUp(self):
11 |         self.module = apex.normalization.FusedLayerNorm(normalized_shape=[32, 64], elementwise_affine=False)
12 |         self.input_ = torch.randn(16, 32, 64)
13 |         torch.cuda.manual_seed(42)
14 |         
15 |     def forward_cpu(self, input_):
16 |         self.module.cpu()
17 |         return self.module(input_.cpu())
18 |     
19 |     def forward_cuda(self, input_):
20 |         self.module.cuda()
21 |         return self.module(input_.cuda())
22 |     
23 |     def test_forward_cuda(self):
24 |         out_ = self.forward_cuda(self.input_)
25 |         assert out_.is_cuda == True
26 |         
27 |     def test_forward_cpu(self):
28 |         out_ = self.forward_cpu(self.input_)
29 |         assert out_.is_cuda == False
30 |         
31 |     def test_same_output(self):
32 |         out_cpu = self.forward_cpu(self.input_)
33 |         out_cuda = self.forward_cuda(self.input_)
34 |         torch.testing.assert_allclose(out_cpu, out_cuda.cpu())
35 |         
36 |         
37 | class TestFusedLayerNormElemWise(TestFusedLayerNorm):
38 |     def setUp(self):
39 |         self.module = apex.normalization.FusedLayerNorm(normalized_shape=[32, 64], elementwise_affine=True)
40 |         self.input_ = torch.randn(16, 32, 64)
41 |         torch.cuda.manual_seed(42)


--------------------------------------------------------------------------------
/apex/tests/L0/run_mixed_adam/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/apex/tests/L0/run_mixed_adam/__init__.py


--------------------------------------------------------------------------------
/apex/tests/L0/run_test.py:
--------------------------------------------------------------------------------
 1 | import unittest
 2 | import sys
 3 | 
 4 | test_dirs = ["run_amp", "run_fp16util", "run_mixed_adam", "run_fused_layer_norm"]
 5 | 
 6 | runner = unittest.TextTestRunner(verbosity=2)
 7 | 
 8 | errcode = 0
 9 | 
10 | for test_dir in test_dirs:
11 |     suite = unittest.TestLoader().discover(test_dir)
12 | 
13 |     print("\nExecuting tests from " + test_dir)
14 | 
15 |     result = runner.run(suite)
16 | 
17 |     if not result.wasSuccessful():
18 |         errcode = 1
19 | 
20 | sys.exit(errcode)
21 | 


--------------------------------------------------------------------------------
/apex/tests/L1/common/compare.py:
--------------------------------------------------------------------------------
 1 | import argparse
 2 | import torch
 3 | 
 4 | parser = argparse.ArgumentParser(description='Compare')
 5 | parser.add_argument('--opt-level', type=str)
 6 | parser.add_argument('--keep-batchnorm-fp32', type=str, default=None)
 7 | parser.add_argument('--loss-scale', type=str, default=None)
 8 | parser.add_argument('--fused-adam', action='store_true')
 9 | parser.add_argument('--use_baseline', action='store_true')
10 | args = parser.parse_args()
11 | 
12 | base_file = str(args.opt_level) + "_" +\
13 |             str(args.loss_scale) + "_" +\
14 |             str(args.keep_batchnorm_fp32) + "_" +\
15 |             str(args.fused_adam)
16 | 
17 | file_e = "True_" + base_file
18 | file_p = "False_" + base_file
19 | if args.use_baseline:
20 |     file_b = "baselines/True_" + base_file
21 | 
22 | dict_e = torch.load(file_e)
23 | dict_p = torch.load(file_p)
24 | if args.use_baseline:
25 |     dict_b = torch.load(file_b)
26 | 
27 | torch.set_printoptions(precision=10)
28 | 
29 | print(file_e)
30 | print(file_p)
31 | if args.use_baseline:
32 |     print(file_b)
33 | 
34 | # ugly duplication here...
35 | if not args.use_baseline:
36 |     for n, (i_e, i_p) in enumerate(zip(dict_e["Iteration"], dict_p["Iteration"])):
37 |         assert i_e == i_p, "i_e = {}, i_p = {}".format(i_e, i_p)
38 | 
39 |         loss_e = dict_e["Loss"][n]
40 |         loss_p = dict_p["Loss"][n]
41 |         assert loss_e == loss_p, "Iteration {}, loss_e = {}, loss_p = {}".format(i_e, loss_e, loss_p)
42 |         print("{:4} {:15.10f} {:15.10f} {:15.10f} {:15.10f}".format(
43 |               i_e,
44 |               loss_e,
45 |               loss_p,
46 |               dict_e["Speed"][n],
47 |               dict_p["Speed"][n]))
48 | else:
49 |     for n, (i_e, i_p) in enumerate(zip(dict_e["Iteration"], dict_p["Iteration"])):
50 |         assert i_e == i_p, "i_e = {}, i_p = {}".format(i_e, i_p)
51 | 
52 |         loss_e = dict_e["Loss"][n]
53 |         loss_p = dict_p["Loss"][n]
54 |         loss_b = dict_b["Loss"][n]
55 |         assert loss_e == loss_p, "Iteration {}, loss_e = {}, loss_p = {}".format(i_e, loss_e, loss_p)
56 |         assert loss_e == loss_b, "Iteration {}, loss_e = {}, loss_b = {}".format(i_e, loss_e, loss_b)
57 |         print("{:4} {:15.10f} {:15.10f} {:15.10f} {:15.10f} {:15.10f} {:15.10f}".format(
58 |               i_e,
59 |               loss_b,
60 |               loss_e,
61 |               loss_p,
62 |               dict_b["Speed"][n],
63 |               dict_e["Speed"][n],
64 |               dict_p["Speed"][n]))
65 | 


--------------------------------------------------------------------------------
/apex/tests/L1/cross_product/run.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | 
3 | DATADIR="/home/mcarilli/Desktop/pt18data/apex_stale/examples/imagenet/bare_metal_train_val/"
4 | # DATADIR="/opt/home/apex/examples/imagenet/"
5 | cp ../common/* .
6 | bash run_test.sh single_gpu $1 $DATADIR yes
7 | 


--------------------------------------------------------------------------------
/apex/tests/L1/cross_product_distributed/run.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | 
3 | cp ../common/* .
4 | bash run_test.sh distributed $1
5 | 


--------------------------------------------------------------------------------
/apex/tests/distributed/DDP/ddp_race_condition_test.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | import torch.distributed as dist
 3 | from torch.nn import Parameter
 4 | from torch.nn import Module
 5 | from apex.parallel import DistributedDataParallel as DDP
 6 | import argparse
 7 | import os
 8 | 
 9 | 
10 | parser = argparse.ArgumentParser(description='allreduce hook example')
11 | parser.add_argument("--local_rank", default=0, type=int)
12 | args = parser.parse_args()
13 | 
14 | args.distributed = False
15 | if 'WORLD_SIZE' in os.environ:
16 |     args.distributed = int(os.environ['WORLD_SIZE']) > 1
17 | 
18 | if args.distributed:
19 |     args.gpu = args.local_rank % torch.cuda.device_count()
20 |     torch.cuda.set_device(args.gpu)
21 |     torch.distributed.init_process_group(backend='nccl',
22 |                                          init_method='env://')
23 |     args.world_size = torch.distributed.get_world_size()
24 | 
25 | torch.set_printoptions(precision=10)
26 | torch.manual_seed(args.local_rank)
27 | 
28 | class Model(Module):
29 |     def __init__(self):
30 |         super(Model, self).__init__()
31 |         self.a = Parameter(torch.cuda.FloatTensor(4096*4096).fill_(1.0))
32 |         self.b = Parameter(torch.cuda.FloatTensor(4096*4096).fill_(2.0))
33 |     def forward(self, input):
34 |         return (input*self.a)*self.b
35 | 
36 | model = Model()
37 | # model = DDP(model, message_size=1, gradient_predivide_factor=8.0)
38 | model = DDP(model, delay_allreduce=True)
39 | # model = DDP(model, message_size=1, allreduce_trigger_params=[model.b])
40 | 
41 | x = torch.cuda.FloatTensor(4096*4096)
42 | 
43 | passed = True
44 | torch.cuda.cudart().cudaProfilerStart()
45 | for i in range(10):
46 |     x.fill_(i + args.local_rank) # fill x with new values every iteration for sanity
47 |     model.zero_grad()
48 |     out = model(x)
49 |     loss = out.sum()
50 |     # torch.cuda.nvtx.range_push("backward")
51 |     loss.backward()
52 |     # torch.cuda.nvtx.range_pop()
53 |     
54 |     # torch.cuda.nvtx.range_push("synchronize() + info")
55 |     # torch.cuda.synchronize()
56 |     print("i = {}".format(i))
57 |     def info(name, param, val):
58 |         expected = val*4096*4096*(2.*i+1)/2.
59 |         actual = param.grad.data.sum().item()
60 |         print(name+": grad.data_ptr() = {}, expected sum {}, got {}".format(
61 |               param.grad.data_ptr(), expected, actual))
62 |         return (expected == actual)
63 |     if not info("model.a", model.module.a, 2.):  passed = False
64 |     if not info("model.b", model.module.b, 1.):  passed = False
65 |     # torch.cuda.nvtx.range_pop()
66 | torch.cuda.cudart().cudaProfilerStop()
67 | 
68 | print("passed = ", passed)
69 | 


--------------------------------------------------------------------------------
/apex/tests/distributed/DDP/run_race_test.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | 
3 | CUDA_VISIBLE_DEVICES=0,1 python -m torch.distributed.launch --nproc_per_node=2 ddp_race_condition_test.py
4 | 


--------------------------------------------------------------------------------
/apex/tests/distributed/amp_master_params/amp_master_params.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | import argparse
 3 | import os
 4 | from apex import amp
 5 | # FOR DISTRIBUTED: (can also use torch.nn.parallel.DistributedDataParallel instead)
 6 | from apex.parallel import DistributedDataParallel
 7 | 
 8 | parser = argparse.ArgumentParser()
 9 | # FOR DISTRIBUTED:  Parse for the local_rank argument, which will be supplied
10 | # automatically by torch.distributed.launch.
11 | parser.add_argument("--local_rank", default=0, type=int)
12 | args = parser.parse_args()
13 | 
14 | # FOR DISTRIBUTED:  If we are running under torch.distributed.launch,
15 | # the 'WORLD_SIZE' environment variable will also be set automatically.
16 | args.distributed = False
17 | if 'WORLD_SIZE' in os.environ:
18 |     args.distributed = int(os.environ['WORLD_SIZE']) > 1
19 | 
20 | if args.distributed:
21 |     # FOR DISTRIBUTED:  Set the device according to local_rank.
22 |     torch.cuda.set_device(args.local_rank)
23 | 
24 |     # FOR DISTRIBUTED:  Initialize the backend.  torch.distributed.launch will provide
25 |     # environment variables, and requires that you use init_method=`env://`.
26 |     torch.distributed.init_process_group(backend='nccl',
27 |                                          init_method='env://')
28 | 
29 |     torch.manual_seed(torch.distributed.get_rank())
30 | 
31 | torch.backends.cudnn.benchmark = True
32 | 
33 | N, D_in, D_out = 64, 1024, 16
34 | 
35 | # Each process receives its own batch of "fake input data" and "fake target data."
36 | # The "training loop" in each process just uses this fake batch over and over.
37 | # https://github.com/NVIDIA/apex/tree/master/examples/imagenet provides a more realistic
38 | # example of distributed data sampling for both training and validation.
39 | x = torch.randn(N, D_in, device='cuda')
40 | y = torch.randn(N, D_out, device='cuda')
41 | 
42 | model = torch.nn.Linear(D_in, D_out).cuda()
43 | optimizer = torch.optim.SGD(model.parameters(), lr=1e-3)
44 | 
45 | model, optimizer = amp.initialize(model, optimizer, opt_level="O2")
46 | 
47 | if args.distributed:
48 |     # FOR DISTRIBUTED:  After amp.initialize, wrap the model with
49 |     # apex.parallel.DistributedDataParallel.
50 |     model = DistributedDataParallel(model)
51 |     # torch.nn.parallel.DistributedDataParallel is also fine, with some added args:
52 |     # model = torch.nn.parallel.DistributedDataParallel(model,
53 |     #                                                   device_ids=[args.local_rank],
54 |     #                                                   output_device=args.local_rank)
55 | 
56 | loss_fn = torch.nn.MSELoss()
57 | 
58 | for t in range(500):
59 |     optimizer.zero_grad()
60 |     y_pred = model(x)
61 |     loss = loss_fn(y_pred, y)
62 |     with amp.scale_loss(loss, optimizer) as scaled_loss:
63 |         scaled_loss.backward()
64 |     optimizer.step()
65 | 
66 | if args.local_rank == 0:
67 |     print("final loss = ", loss)
68 | 
69 | torch.save(list(model.parameters()), "rank{}model.pth".format(torch.distributed.get_rank()))
70 | torch.save(list(amp.master_params(optimizer)), "rank{}master.pth".format(torch.distributed.get_rank()))
71 | 


--------------------------------------------------------------------------------
/apex/tests/distributed/amp_master_params/compare.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | 
 3 | model_params_rank0 = torch.load("rank0model.pth",
 4 |                            map_location = lambda storage, loc: storage.cuda(0))
 5 | model_params_rank1 = torch.load("rank1model.pth",
 6 |                                  map_location = lambda storage, loc: storage.cuda(0))
 7 | master_params_rank0 = torch.load("rank0master.pth",
 8 |                                  map_location = lambda storage, loc: storage.cuda(0))
 9 | master_params_rank1 = torch.load("rank1master.pth",
10 |                                  map_location = lambda storage, loc: storage.cuda(0))
11 | 
12 | for model_rank0, model_rank1, master_rank0, master_rank1 in zip(
13 |         model_params_rank0,
14 |         model_params_rank1,
15 |         master_params_rank0,
16 |         master_params_rank1):
17 |     assert torch.allclose(model_rank0, model_rank1), "Model param mismatch"
18 |     assert torch.allclose(master_rank0, master_rank1), "Master param mismatch"
19 |     # Some debugging/investigation assistance code:
20 |     # maxval, maxind = torch.max(((torch.abs(model_rank0).float())/torch.abs(master_rank0)).view(-1), 0)
21 |     # offending_val_half = model_rank0.view(-1)[maxind.item()]
22 |     # offending_val_float = master_rank0.view(-1)[maxind.item()]
23 |     # print(maxval.item(), maxind.item(), offending_val_half.item(), offending_val_float.item(),
24 |     #       offending_val_float.half().item())
25 |     # rtol needs to be > 2^-11 because of denormals...
26 |     assert torch.allclose(model_rank0, master_rank0.half(), rtol=.005), "Model-master mismatch"
27 | 
28 | print("OK:  Model and master params match across ranks.")
29 | 


--------------------------------------------------------------------------------
/apex/tests/distributed/amp_master_params/run.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | python -m torch.distributed.launch --nproc_per_node=2 amp_master_params.py
3 | 
4 | python compare.py
5 | 


--------------------------------------------------------------------------------
/apex/tests/distributed/synced_batchnorm/unit_test.sh:
--------------------------------------------------------------------------------
1 | python single_gpu_unit_test.py
2 | python -m torch.distributed.launch --nproc_per_node=2 two_gpu_unit_test.py
3 | python -m torch.distributed.launch --nproc_per_node=2 two_gpu_unit_test.py --fp64
4 | #beware, you need a system with at least 4 gpus to test group_size<world_size
5 | python -m torch.distributed.launch --nproc_per_node=4 test_groups.py --group_size=2
6 | 


--------------------------------------------------------------------------------
/apex/tests/docker_extension_builds/run.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | 
 3 | print_banner() {
 4 |   printf "\n\n\n\e[30m\e[42m$1\e[0m\n\n\n\n"
 5 | }
 6 | 
 7 | print_green() {
 8 |   printf "\e[30m\e[42m$1\e[0m\n"
 9 | }
10 | 
11 | print_red() {
12 |   printf "\e[30m\e[41m$1\e[0m\n"
13 | }
14 | 
15 | images=(
16 | "gitlab-master.nvidia.com:5005/dl/dgx/pytorch:19.03-py3-devel"
17 | "gitlab-master.nvidia.com:5005/dl/dgx/pytorch:master-py3-devel"
18 | "pytorch/pytorch:nightly-devel-cuda10.0-cudnn7"
19 | "pytorch/pytorch:1.1.0-cuda10.0-cudnn7.5-devel"
20 | "pytorch/pytorch:1.0.1-cuda10.0-cudnn7-devel"
21 | "pytorch/pytorch:1.0-cuda10.0-cudnn7-devel"
22 | "pytorch/pytorch:nightly-devel-cuda9.2-cudnn7"
23 | )
24 | 
25 | branch="master"
26 | 
27 | # Associative array for exit codes
28 | declare -A exit_codes
29 | for image in images
30 | do
31 |   exit_codes[$image]="None"
32 | done
33 | 
34 | for image in "${images[@]}"
35 | do
36 |   print_banner "$image"
37 |   set -x
38 |   docker pull $image
39 |   # Trying python setup.py install instead of pip install to ensure direct access to error codes.
40 |   # Maybe pip install would be ok too but this works.
41 |   docker run --runtime=nvidia --rm $image /bin/bash -c "yes | pip uninstall apex; yes | pip uninstall apex; git clone https://github.com/NVIDIA/apex.git; cd apex; git checkout $branch; set -e;  python setup.py install --cuda_ext --cpp_ext"
42 |   exit_code=$?
43 |   set +x
44 |   if [ $exit_code != 0 ]
45 |   then
46 |     print_red "Exit code: $exit_code"
47 |   else
48 |     print_green "Exit code: $exit_code"
49 |   fi
50 |   exit_codes[$image]=$exit_code
51 | done
52 | 
53 | success=0
54 | for image in "${images[@]}"
55 | do
56 |   exit_code=${exit_codes[$image]}
57 |   if [ $exit_code != 0 ]
58 |   then
59 |     print_red "$image : $exit_code"
60 |     success=1
61 |   else
62 |     print_green "$image : $exit_code"
63 |   fi
64 | done
65 | 
66 | if [ $success != 0 ]
67 | then
68 |   print_red "Overall status:  failure"
69 | else
70 |   print_green "Overall status:  success"
71 | fi
72 | 
73 | exit $success
74 | 


--------------------------------------------------------------------------------
/configs/rdpnet/r101-isod.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-101"
 4 |   FCOS_ON: True
 5 |   RPN_ONLY: False
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-101-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   FPN:
11 |     ONLY_P6: False
12 |     ATT_DENSE: True
13 |     DENSE: True
14 |   FCOS:
15 |     CENTER_WEIGHT: 1.0
16 |   RETINANET:
17 |     USE_C5: False # FCOS uses P5 instead of C5
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |   ROI_MASK_HEAD:
21 |     POOLER_SCALES: (0.125, 0.0625, 0.03125, 0.015625, 0.0078125)
22 |     FEATURE_EXTRACTOR: "InstanceSaliencyMaskDecoder"
23 |     PREDICTOR: MaskDecoderPredictor
24 |     CONV_LAYERS:  (128, 128, 128, 128)
25 |     POOLER_RESOLUTION: (32, 16, 8, 4, 4)
26 |     POOLER_SAMPLING_RATIO: 2
27 |     RESOLUTION: 32
28 |     SHARE_BOX_FEATURE_EXTRACTOR: False
29 |   MASK_ON: True
30 |   SEG_ON: False
31 |   SEG_ON_ADD_CHANEL: False
32 | DATASETS:
33 |   TRAIN: ("isod_train_cocostyle",)
34 |   TEST: ("isod_test_cocostyle",)
35 | INPUT:
36 |   MIN_SIZE_TRAIN: (320,)
37 |   MAX_SIZE_TRAIN: 480
38 |   MIN_SIZE_TEST: 320
39 |   MAX_SIZE_TEST: 480
40 | DATALOADER:
41 |   SIZE_DIVISIBILITY: 32
42 | SOLVER:
43 |   WEIGHT_DECAY: 0.0001
44 |   BASE_LR: 0.0025
45 |   STEPS: (6000, )
46 |   MAX_ITER: 9000
47 |   IMS_PER_BATCH: 4
48 |   WARMUP_METHOD: "constant"
49 |   CHECKPOINT_PERIOD: 1000
50 | TEST:
51 |   IMS_PER_BATCH: 1
52 | 


--------------------------------------------------------------------------------
/configs/rdpnet/r50-come.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   FCOS_ON: True
 5 |   RPN_ONLY: False
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-50-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   FPN:
11 |     ONLY_P6: False
12 |     ATT_DENSE: True
13 |     DENSE: True
14 |   FCOS:
15 |     CENTER_WEIGHT: 1.0
16 |   RETINANET:
17 |     USE_C5: False # FCOS uses P5 instead of C5
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |   ROI_MASK_HEAD:
21 |     POOLER_SCALES: (0.125, 0.0625, 0.03125, 0.015625, 0.0078125)
22 |     FEATURE_EXTRACTOR: "InstanceSaliencyMaskDecoder"
23 |     PREDICTOR: MaskDecoderPredictor
24 |     CONV_LAYERS:  (128, 128, 128, 128)
25 |     POOLER_RESOLUTION: (32, 16, 8, 4, 4)
26 |     POOLER_SAMPLING_RATIO: 2
27 |     RESOLUTION: 32
28 |     SHARE_BOX_FEATURE_EXTRACTOR: False
29 |   MASK_ON: True
30 |   SEG_ON: False
31 |   SEG_ON_ADD_CHANEL: False
32 | DATASETS:
33 |   TRAIN: ("come_train_cocostyle",)
34 |   TEST: ("come_test_e_cocostyle",)
35 | INPUT:
36 |   MIN_SIZE_TRAIN: (320, )
37 |   MAX_SIZE_TRAIN: 480
38 |   MIN_SIZE_TEST: 320
39 |   MAX_SIZE_TEST: 480
40 | SOLVER:
41 |   BASE_LR: 0.005
42 |   WEIGHT_DECAY: 0.0001
43 |   STEPS: (20000, )
44 |   MAX_ITER: 30000
45 |   IMS_PER_BATCH: 8
46 |   WARMUP_METHOD: "constant"
47 |   CHECKPOINT_PERIOD: 10000
48 | DATALOADER:
49 |   SIZE_DIVISIBILITY: 32
50 | TEST:
51 |   IMS_PER_BATCH: 1
52 | 


--------------------------------------------------------------------------------
/configs/rdpnet/r50-isod-te.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: model_zoo/r50_isod.pth
 4 |   FCOS_ON: True
 5 |   RPN_ONLY: False
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-50-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   FPN:
11 |     ONLY_P6: False
12 |     ATT_DENSE: True
13 |     DENSE: True
14 |   FCOS:
15 |     CENTER_WEIGHT: 1.0
16 |   RETINANET:
17 |     USE_C5: False # FCOS uses P5 instead of C5
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |   ROI_MASK_HEAD:
21 |     POOLER_SCALES: (0.125, 0.0625, 0.03125, 0.015625, 0.0078125)
22 |     FEATURE_EXTRACTOR: "InstanceSaliencyMaskDecoder"
23 |     PREDICTOR: MaskDecoderPredictor
24 |     CONV_LAYERS:  (128, 128, 128, 128)
25 |     POOLER_RESOLUTION: (32, 16, 8, 4, 4)
26 |     POOLER_SAMPLING_RATIO: 2
27 |     RESOLUTION: 32
28 |     SHARE_BOX_FEATURE_EXTRACTOR: False
29 |   MASK_ON: True
30 |   SEG_ON: False
31 |   SEG_ON_ADD_CHANEL: False
32 | DATASETS:
33 |   TRAIN: ("isod_train_cocostyle",)
34 |   TEST: ("isod_test_cocostyle",)
35 | INPUT:
36 |   MIN_SIZE_TRAIN: (320, )
37 |   MAX_SIZE_TRAIN: 480
38 |   MIN_SIZE_TEST: 320
39 |   MAX_SIZE_TEST: 480
40 | SOLVER:
41 |   BASE_LR: 0.0025
42 |   WEIGHT_DECAY: 0.0001
43 |   STEPS: (6000, )
44 |   MAX_ITER: 9000
45 |   IMS_PER_BATCH: 4
46 |   WARMUP_METHOD: "constant"
47 |   CHECKPOINT_PERIOD: 4500
48 | DATALOADER:
49 |   SIZE_DIVISIBILITY: 32
50 | TEST:
51 |   IMS_PER_BATCH: 1
52 | 


--------------------------------------------------------------------------------
/configs/rdpnet/r50-isod.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   FCOS_ON: True
 5 |   RPN_ONLY: False
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-50-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   FPN:
11 |     ONLY_P6: False
12 |     ATT_DENSE: True
13 |     DENSE: True
14 |   FCOS:
15 |     CENTER_WEIGHT: 1.0
16 |   RETINANET:
17 |     USE_C5: False # FCOS uses P5 instead of C5
18 |   ROI_HEADS:
19 |     USE_FPN: True
20 |   ROI_MASK_HEAD:
21 |     POOLER_SCALES: (0.125, 0.0625, 0.03125, 0.015625, 0.0078125)
22 |     FEATURE_EXTRACTOR: "InstanceSaliencyMaskDecoder"
23 |     PREDICTOR: MaskDecoderPredictor
24 |     CONV_LAYERS:  (128, 128, 128, 128)
25 |     POOLER_RESOLUTION: (32, 16, 8, 4, 4)
26 |     POOLER_SAMPLING_RATIO: 2
27 |     RESOLUTION: 32
28 |     SHARE_BOX_FEATURE_EXTRACTOR: False
29 |   MASK_ON: True
30 |   SEG_ON: False
31 |   SEG_ON_ADD_CHANEL: False
32 | DATASETS:
33 |   TRAIN: ("isod_train_cocostyle",)
34 |   TEST: ("isod_test_cocostyle",)
35 | INPUT:
36 |   MIN_SIZE_TRAIN: (320, )
37 |   MAX_SIZE_TRAIN: 480
38 |   MIN_SIZE_TEST: 320
39 |   MAX_SIZE_TEST: 480
40 | SOLVER:
41 |   BASE_LR: 0.0025
42 |   WEIGHT_DECAY: 0.0001
43 |   STEPS: (6000, )
44 |   MAX_ITER: 9000
45 |   IMS_PER_BATCH: 4
46 |   WARMUP_METHOD: "constant"
47 |   CHECKPOINT_PERIOD: 4500
48 | DATALOADER:
49 |   SIZE_DIVISIBILITY: 32
50 | TEST:
51 |   IMS_PER_BATCH: 1
52 | 


--------------------------------------------------------------------------------
/configs/rdpnet/r50-soc-te.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: model_zoo/r50_soc.pth
 4 |   FCOS_ON: True
 5 |   RPN_ONLY: False
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-50-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   FPN:
11 |     ONLY_P6: False
12 |     ATT_DENSE: True
13 |     DENSE: True
14 |   FCOS:
15 |     CENTER_WEIGHT: 1.0
16 |     NMS_TH: 0.8
17 |   RETINANET:
18 |     USE_C5: False # FCOS uses P5 instead of C5
19 |   ROI_HEADS:
20 |     USE_FPN: True
21 |   ROI_MASK_HEAD:
22 |     POOLER_SCALES: (0.125, 0.0625, 0.03125, 0.015625, 0.0078125)
23 |     FEATURE_EXTRACTOR: "InstanceSaliencyMaskDecoder"
24 |     PREDICTOR: MaskDecoderPredictor
25 |     CONV_LAYERS:  (128, 128, 128, 128)
26 |     POOLER_RESOLUTION: (32, 16, 8, 4, 4)
27 |     POOLER_SAMPLING_RATIO: 2
28 |     RESOLUTION: 32
29 |     SHARE_BOX_FEATURE_EXTRACTOR: False
30 |   MASK_ON: True
31 |   SEG_ON: False
32 |   SEG_ON_ADD_CHANEL: False
33 | DATASETS:
34 |   TRAIN: ("soc_train_cocostyle", "soc_val_cocostyle")
35 |   TEST: ("soc_test_cocostyle",)
36 | INPUT:
37 |   MIN_SIZE_TRAIN: (320, )
38 |   MAX_SIZE_TRAIN: 480
39 |   MIN_SIZE_TEST: 320
40 |   MAX_SIZE_TEST: 480
41 | SOLVER:
42 |   WEIGHT_DECAY: 0.0001
43 |   BASE_LR: 0.0025
44 |   STEPS: (24000, )
45 |   MAX_ITER: 36000
46 |   IMS_PER_BATCH: 4
47 |   WARMUP_METHOD: "constant"
48 |   CHECKPOINT_PERIOD: 6000
49 | DATALOADER:
50 |   SIZE_DIVISIBILITY: 32
51 | TEST:
52 |   IMS_PER_BATCH: 1
53 | 


--------------------------------------------------------------------------------
/configs/rdpnet/r50-soc.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/MSRA/R-50"
 4 |   FCOS_ON: True
 5 |   RPN_ONLY: False
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-50-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |   FPN:
11 |     ONLY_P6: False
12 |     ATT_DENSE: True
13 |     DENSE: True
14 |   FCOS:
15 |     CENTER_WEIGHT: 1.0
16 |     NMS_TH: 0.8
17 |   RETINANET:
18 |     USE_C5: False # FCOS uses P5 instead of C5
19 |   ROI_HEADS:
20 |     USE_FPN: True
21 |   ROI_MASK_HEAD:
22 |     POOLER_SCALES: (0.125, 0.0625, 0.03125, 0.015625, 0.0078125)
23 |     FEATURE_EXTRACTOR: "InstanceSaliencyMaskDecoder"
24 |     PREDICTOR: MaskDecoderPredictor
25 |     CONV_LAYERS:  (128, 128, 128, 128)
26 |     POOLER_RESOLUTION: (32, 16, 8, 4, 4)
27 |     POOLER_SAMPLING_RATIO: 2
28 |     RESOLUTION: 32
29 |     SHARE_BOX_FEATURE_EXTRACTOR: False
30 |   MASK_ON: True
31 |   SEG_ON: False
32 |   SEG_ON_ADD_CHANEL: False
33 | DATASETS:
34 |   TRAIN: ("soc_train_cocostyle", "soc_val_cocostyle")
35 |   TEST: ("soc_test_cocostyle",)
36 | INPUT:
37 |   MIN_SIZE_TRAIN: (320, )
38 |   MAX_SIZE_TRAIN: 480
39 |   MIN_SIZE_TEST: 320
40 |   MAX_SIZE_TEST: 480
41 | SOLVER:
42 |   WEIGHT_DECAY: 0.0001
43 |   BASE_LR: 0.0025
44 |   STEPS: (24000, )
45 |   MAX_ITER: 36000
46 |   IMS_PER_BATCH: 4
47 |   WARMUP_METHOD: "constant"
48 |   CHECKPOINT_PERIOD: 6000
49 | DATALOADER:
50 |   SIZE_DIVISIBILITY: 32
51 | TEST:
52 |   IMS_PER_BATCH: 1
53 | 


--------------------------------------------------------------------------------
/configs/rdpnet/x101-isod.yaml:
--------------------------------------------------------------------------------
 1 | MODEL:
 2 |   META_ARCHITECTURE: "GeneralizedRCNN"
 3 |   WEIGHT: "catalog://ImageNetPretrained/FAIR/20171220/X-101-32x8d"
 4 |   FCOS_ON: True
 5 |   RPN_ONLY: False
 6 |   BACKBONE:
 7 |     CONV_BODY: "R-101-FPN-RETINANET"
 8 |   RESNETS:
 9 |     BACKBONE_OUT_CHANNELS: 256
10 |     STRIDE_IN_1X1: False
11 |     NUM_GROUPS: 32
12 |     WIDTH_PER_GROUP: 8
13 |   FPN:
14 |     ONLY_P6: False
15 |     ATT_DENSE: True
16 |     DENSE: True
17 |   FCOS:
18 |     CENTER_WEIGHT: 1.0
19 |   RETINANET:
20 |     USE_C5: False # FCOS uses P5 instead of C5
21 |   ROI_HEADS:
22 |     USE_FPN: True
23 |   ROI_MASK_HEAD:
24 |     POOLER_SCALES: (0.125, 0.0625, 0.03125, 0.015625, 0.0078125)
25 |     FEATURE_EXTRACTOR: "InstanceSaliencyMaskDecoder"
26 |     PREDICTOR: MaskDecoderPredictor
27 |     CONV_LAYERS:  (128, 128, 128, 128)
28 |     POOLER_RESOLUTION: (32, 16, 8, 4, 4) #(14,) #
29 |     POOLER_SAMPLING_RATIO: 2
30 |     RESOLUTION: 32
31 |     SHARE_BOX_FEATURE_EXTRACTOR: False
32 |   MASK_ON: True
33 |   SEG_ON: False
34 |   SEG_ON_ADD_CHANEL: False
35 | DATASETS:
36 |   TRAIN: ("isod_train_cocostyle",)
37 |   TEST: ("isod_test_cocostyle",)
38 | INPUT:
39 |   MIN_SIZE_TRAIN: (320,)
40 |   MAX_SIZE_TRAIN: 480
41 |   MIN_SIZE_TEST: 320
42 |   MAX_SIZE_TEST: 480
43 | DATALOADER:
44 |   SIZE_DIVISIBILITY: 32
45 | SOLVER:
46 |   WEIGHT_DECAY: 0.0001
47 |   BASE_LR: 0.0025
48 |   STEPS: (6000, )
49 |   MAX_ITER: 9000
50 |   IMS_PER_BATCH: 4
51 |   WARMUP_METHOD: "constant"
52 |   CHECKPOINT_PERIOD: 1000
53 | TEST:
54 |   IMS_PER_BATCH: 1
55 | 


--------------------------------------------------------------------------------
/datasets/PLACE_DATA_HERE:
--------------------------------------------------------------------------------
1 | Place isod/ and soc/ data folders here.
2 | 


--------------------------------------------------------------------------------
/demo/examples/test_10.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/demo/examples/test_10.jpg


--------------------------------------------------------------------------------
/demo/examples/test_14.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/demo/examples/test_14.jpg


--------------------------------------------------------------------------------
/demo/examples/test_20.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/demo/examples/test_20.jpg


--------------------------------------------------------------------------------
/demo/examples/test_23.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/demo/examples/test_23.jpg


--------------------------------------------------------------------------------
/demo/examples/test_24.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/demo/examples/test_24.jpg


--------------------------------------------------------------------------------
/demo/examples/test_25.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/demo/examples/test_25.jpg


--------------------------------------------------------------------------------
/demo/examples/test_3.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/demo/examples/test_3.jpg


--------------------------------------------------------------------------------
/demo/examples/test_5.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/demo/examples/test_5.jpg


--------------------------------------------------------------------------------
/demo/examples/test_53.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/demo/examples/test_53.jpg


--------------------------------------------------------------------------------
/demo/examples/test_6.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/demo/examples/test_6.jpg


--------------------------------------------------------------------------------
/demo/examples/test_9.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/demo/examples/test_9.jpg


--------------------------------------------------------------------------------
/demo/model_zoo:
--------------------------------------------------------------------------------
1 | ../model_zoo


--------------------------------------------------------------------------------
/docker/Dockerfile:
--------------------------------------------------------------------------------
 1 | ARG CUDA="9.0"
 2 | ARG CUDNN="7"
 3 | 
 4 | FROM nvidia/cuda:${CUDA}-cudnn${CUDNN}-devel-ubuntu16.04
 5 | 
 6 | RUN echo 'debconf debconf/frontend select Noninteractive' | debconf-set-selections
 7 | 
 8 | # install basics
 9 | RUN apt-get update -y \
10 |  && apt-get install -y apt-utils git curl ca-certificates bzip2 cmake tree htop bmon iotop g++ \
11 |  && apt-get install -y libglib2.0-0 libsm6 libxext6 libxrender-dev
12 | 
13 | # Install Miniconda
14 | RUN curl -so /miniconda.sh https://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh \
15 |  && chmod +x /miniconda.sh \
16 |  && /miniconda.sh -b -p /miniconda \
17 |  && rm /miniconda.sh
18 | 
19 | ENV PATH=/miniconda/bin:$PATH
20 | 
21 | # Create a Python 3.6 environment
22 | RUN /miniconda/bin/conda install -y conda-build \
23 |  && /miniconda/bin/conda create -y --name py36 python=3.6.7 \
24 |  && /miniconda/bin/conda clean -ya
25 | 
26 | ENV CONDA_DEFAULT_ENV=py36
27 | ENV CONDA_PREFIX=/miniconda/envs/$CONDA_DEFAULT_ENV
28 | ENV PATH=$CONDA_PREFIX/bin:$PATH
29 | ENV CONDA_AUTO_UPDATE_CONDA=false
30 | 
31 | RUN conda install -y ipython
32 | RUN pip install ninja yacs cython matplotlib opencv-python tqdm
33 | 
34 | # Install PyTorch 1.0 Nightly
35 | ARG CUDA
36 | RUN conda install pytorch-nightly cudatoolkit=${CUDA} -c pytorch \
37 |  && conda clean -ya
38 | 
39 | # Install TorchVision master
40 | RUN git clone https://github.com/pytorch/vision.git \
41 |  && cd vision \
42 |  && python setup.py install
43 | 
44 | # install pycocotools
45 | RUN git clone https://github.com/cocodataset/cocoapi.git \
46 |  && cd cocoapi/PythonAPI \
47 |  && python setup.py build_ext install
48 | 
49 | # install PyTorch Detection
50 | ARG FORCE_CUDA="1"
51 | ENV FORCE_CUDA=${FORCE_CUDA}
52 | RUN git clone https://github.com/facebookresearch/maskrcnn-benchmark.git \
53 |  && cd maskrcnn-benchmark \
54 |  && python setup.py build develop
55 | 
56 | WORKDIR /maskrcnn-benchmark
57 | 


--------------------------------------------------------------------------------
/docker/docker-jupyter/Dockerfile:
--------------------------------------------------------------------------------
 1 | ARG CUDA="9.0"
 2 | ARG CUDNN="7"
 3 | 
 4 | FROM nvidia/cuda:${CUDA}-cudnn${CUDNN}-devel-ubuntu16.04
 5 | 
 6 | RUN echo 'debconf debconf/frontend select Noninteractive' | debconf-set-selections
 7 | 
 8 | # install basics
 9 | RUN apt-get update -y \
10 |  && apt-get install -y apt-utils git curl ca-certificates bzip2 cmake tree htop bmon iotop g++
11 | 
12 | # Install Miniconda
13 | RUN curl -so /miniconda.sh https://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh \
14 |  && chmod +x /miniconda.sh \
15 |  && /miniconda.sh -b -p /miniconda \
16 |  && rm /miniconda.sh
17 | 
18 | ENV PATH=/miniconda/bin:$PATH
19 | 
20 | # Create a Python 3.6 environment
21 | RUN /miniconda/bin/conda install -y conda-build \
22 |  && /miniconda/bin/conda create -y --name py36 python=3.6.7 \
23 |  && /miniconda/bin/conda clean -ya
24 | 
25 | ENV CONDA_DEFAULT_ENV=py36
26 | ENV CONDA_PREFIX=/miniconda/envs/$CONDA_DEFAULT_ENV
27 | ENV PATH=$CONDA_PREFIX/bin:$PATH
28 | ENV CONDA_AUTO_UPDATE_CONDA=false
29 | 
30 | RUN conda install -y ipython
31 | RUN pip install ninja yacs cython matplotlib jupyter
32 | 
33 | # Install PyTorch 1.0 Nightly and OpenCV
34 | RUN conda install -y pytorch-nightly -c pytorch \
35 |  && conda install -y opencv -c menpo \
36 |  && conda clean -ya
37 | 
38 | WORKDIR /root
39 | 
40 | USER root
41 | 
42 | RUN mkdir /notebooks
43 | 
44 | WORKDIR /notebooks
45 | 
46 | # Install TorchVision master
47 | RUN git clone https://github.com/pytorch/vision.git \
48 |  && cd vision \
49 |  && python setup.py install
50 | 
51 | # install pycocotools
52 | RUN git clone https://github.com/cocodataset/cocoapi.git \
53 |  && cd cocoapi/PythonAPI \
54 |  && python setup.py build_ext install
55 | 
56 | # install PyTorch Detection
57 | RUN git clone https://github.com/facebookresearch/maskrcnn-benchmark.git \
58 |  && cd maskrcnn-benchmark \
59 |  && python setup.py build develop
60 | 
61 | RUN jupyter notebook --generate-config
62 | 
63 | ENV CONFIG_PATH="/root/.jupyter/jupyter_notebook_config.py"
64 | 
65 | COPY "jupyter_notebook_config.py" ${CONFIG_PATH}
66 | 
67 | ENTRYPOINT ["sh", "-c", "jupyter notebook --allow-root -y --no-browser --ip=0.0.0.0 --config=${CONFIG_PATH}"]
68 | 


--------------------------------------------------------------------------------
/docker/docker-jupyter/jupyter_notebook_config.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | from IPython.lib import passwd
 3 | 
 4 | #c = c  # pylint:disable=undefined-variable
 5 | c = get_config()
 6 | c.NotebookApp.ip = '0.0.0.0'
 7 | c.NotebookApp.port = int(os.getenv('PORT', 8888))
 8 | c.NotebookApp.open_browser = False
 9 | 
10 | # sets a password if PASSWORD is set in the environment
11 | if 'PASSWORD' in os.environ:
12 |   password = os.environ['PASSWORD']
13 |   if password:
14 |     c.NotebookApp.password = passwd(password)
15 |   else:
16 |     c.NotebookApp.password = ''
17 |     c.NotebookApp.token = ''
18 |   del os.environ['PASSWORD']
19 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/_C.cpython-36m-x86_64-linux-gnu.so:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/maskrcnn_benchmark/_C.cpython-36m-x86_64-linux-gnu.so


--------------------------------------------------------------------------------
/maskrcnn_benchmark/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/config/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .defaults import _C as cfg
3 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/csrc/ROIAlign.h:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #pragma once
 3 | 
 4 | #include "cpu/vision.h"
 5 | 
 6 | #ifdef WITH_CUDA
 7 | #include "cuda/vision.h"
 8 | #endif
 9 | 
10 | // Interface for Python
11 | at::Tensor ROIAlign_forward(const at::Tensor& input,
12 |                             const at::Tensor& rois,
13 |                             const float spatial_scale,
14 |                             const int pooled_height,
15 |                             const int pooled_width,
16 |                             const int sampling_ratio) {
17 |   if (input.type().is_cuda()) {
18 | #ifdef WITH_CUDA
19 |     return ROIAlign_forward_cuda(input, rois, spatial_scale, pooled_height, pooled_width, sampling_ratio);
20 | #else
21 |     AT_ERROR("Not compiled with GPU support");
22 | #endif
23 |   }
24 |   return ROIAlign_forward_cpu(input, rois, spatial_scale, pooled_height, pooled_width, sampling_ratio);
25 | }
26 | 
27 | at::Tensor ROIAlign_backward(const at::Tensor& grad,
28 |                              const at::Tensor& rois,
29 |                              const float spatial_scale,
30 |                              const int pooled_height,
31 |                              const int pooled_width,
32 |                              const int batch_size,
33 |                              const int channels,
34 |                              const int height,
35 |                              const int width,
36 |                              const int sampling_ratio) {
37 |   if (grad.type().is_cuda()) {
38 | #ifdef WITH_CUDA
39 |     return ROIAlign_backward_cuda(grad, rois, spatial_scale, pooled_height, pooled_width, batch_size, channels, height, width, sampling_ratio);
40 | #else
41 |     AT_ERROR("Not compiled with GPU support");
42 | #endif
43 |   }
44 |   AT_ERROR("Not implemented on the CPU");
45 | }
46 | 
47 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/csrc/ROIPool.h:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #pragma once
 3 | 
 4 | #include "cpu/vision.h"
 5 | 
 6 | #ifdef WITH_CUDA
 7 | #include "cuda/vision.h"
 8 | #endif
 9 | 
10 | 
11 | std::tuple<at::Tensor, at::Tensor> ROIPool_forward(const at::Tensor& input,
12 |                                 const at::Tensor& rois,
13 |                                 const float spatial_scale,
14 |                                 const int pooled_height,
15 |                                 const int pooled_width) {
16 |   if (input.type().is_cuda()) {
17 | #ifdef WITH_CUDA
18 |     return ROIPool_forward_cuda(input, rois, spatial_scale, pooled_height, pooled_width);
19 | #else
20 |     AT_ERROR("Not compiled with GPU support");
21 | #endif
22 |   }
23 |   AT_ERROR("Not implemented on the CPU");
24 | }
25 | 
26 | at::Tensor ROIPool_backward(const at::Tensor& grad,
27 |                                  const at::Tensor& input,
28 |                                  const at::Tensor& rois,
29 |                                  const at::Tensor& argmax,
30 |                                  const float spatial_scale,
31 |                                  const int pooled_height,
32 |                                  const int pooled_width,
33 |                                  const int batch_size,
34 |                                  const int channels,
35 |                                  const int height,
36 |                                  const int width) {
37 |   if (grad.type().is_cuda()) {
38 | #ifdef WITH_CUDA
39 |     return ROIPool_backward_cuda(grad, input, rois, argmax, spatial_scale, pooled_height, pooled_width, batch_size, channels, height, width);
40 | #else
41 |     AT_ERROR("Not compiled with GPU support");
42 | #endif
43 |   }
44 |   AT_ERROR("Not implemented on the CPU");
45 | }
46 | 
47 | 
48 | 
49 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/csrc/SigmoidFocalLoss.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include "cpu/vision.h"
 4 | 
 5 | #ifdef WITH_CUDA
 6 | #include "cuda/vision.h"
 7 | #endif
 8 | 
 9 | // Interface for Python
10 | at::Tensor SigmoidFocalLoss_forward(
11 | 		const at::Tensor& logits,
12 |                 const at::Tensor& targets,
13 | 		const int num_classes, 
14 | 		const float gamma, 
15 | 		const float alpha) {
16 |   if (logits.type().is_cuda()) {
17 | #ifdef WITH_CUDA
18 |     return SigmoidFocalLoss_forward_cuda(logits, targets, num_classes, gamma, alpha);
19 | #else
20 |     AT_ERROR("Not compiled with GPU support");
21 | #endif
22 |   }
23 |   AT_ERROR("Not implemented on the CPU");
24 | }
25 | 
26 | at::Tensor SigmoidFocalLoss_backward(
27 | 			     const at::Tensor& logits,
28 |                              const at::Tensor& targets,
29 | 			     const at::Tensor& d_losses,
30 | 			     const int num_classes,
31 | 			     const float gamma,
32 | 			     const float alpha) {
33 |   if (logits.type().is_cuda()) {
34 | #ifdef WITH_CUDA
35 |     return SigmoidFocalLoss_backward_cuda(logits, targets, d_losses, num_classes, gamma, alpha);
36 | #else
37 |     AT_ERROR("Not compiled with GPU support");
38 | #endif
39 |   }
40 |   AT_ERROR("Not implemented on the CPU");
41 | }
42 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/csrc/cpu/nms_cpu.cpp:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #include "cpu/vision.h"
 3 | 
 4 | 
 5 | template <typename scalar_t>
 6 | at::Tensor nms_cpu_kernel(const at::Tensor& dets,
 7 |                           const at::Tensor& scores,
 8 |                           const float threshold) {
 9 |   AT_ASSERTM(!dets.type().is_cuda(), "dets must be a CPU tensor");
10 |   AT_ASSERTM(!scores.type().is_cuda(), "scores must be a CPU tensor");
11 |   AT_ASSERTM(dets.type() == scores.type(), "dets should have the same type as scores");
12 | 
13 |   if (dets.numel() == 0) {
14 |     return at::empty({0}, dets.options().dtype(at::kLong).device(at::kCPU));
15 |   }
16 | 
17 |   auto x1_t = dets.select(1, 0).contiguous();
18 |   auto y1_t = dets.select(1, 1).contiguous();
19 |   auto x2_t = dets.select(1, 2).contiguous();
20 |   auto y2_t = dets.select(1, 3).contiguous();
21 | 
22 |   at::Tensor areas_t = (x2_t - x1_t + 1) * (y2_t - y1_t + 1);
23 | 
24 |   auto order_t = std::get<1>(scores.sort(0, /* descending=*/true));
25 | 
26 |   auto ndets = dets.size(0);
27 |   at::Tensor suppressed_t = at::zeros({ndets}, dets.options().dtype(at::kByte).device(at::kCPU));
28 | 
29 |   auto suppressed = suppressed_t.data<uint8_t>();
30 |   auto order = order_t.data<int64_t>();
31 |   auto x1 = x1_t.data<scalar_t>();
32 |   auto y1 = y1_t.data<scalar_t>();
33 |   auto x2 = x2_t.data<scalar_t>();
34 |   auto y2 = y2_t.data<scalar_t>();
35 |   auto areas = areas_t.data<scalar_t>();
36 | 
37 |   for (int64_t _i = 0; _i < ndets; _i++) {
38 |     auto i = order[_i];
39 |     if (suppressed[i] == 1)
40 |       continue;
41 |     auto ix1 = x1[i];
42 |     auto iy1 = y1[i];
43 |     auto ix2 = x2[i];
44 |     auto iy2 = y2[i];
45 |     auto iarea = areas[i];
46 | 
47 |     for (int64_t _j = _i + 1; _j < ndets; _j++) {
48 |       auto j = order[_j];
49 |       if (suppressed[j] == 1)
50 |         continue;
51 |       auto xx1 = std::max(ix1, x1[j]);
52 |       auto yy1 = std::max(iy1, y1[j]);
53 |       auto xx2 = std::min(ix2, x2[j]);
54 |       auto yy2 = std::min(iy2, y2[j]);
55 | 
56 |       auto w = std::max(static_cast<scalar_t>(0), xx2 - xx1 + 1);
57 |       auto h = std::max(static_cast<scalar_t>(0), yy2 - yy1 + 1);
58 |       auto inter = w * h;
59 |       auto ovr = inter / (iarea + areas[j] - inter);
60 |       if (ovr >= threshold)
61 |         suppressed[j] = 1;
62 |    }
63 |   }
64 |   return at::nonzero(suppressed_t == 0).squeeze(1);
65 | }
66 | 
67 | at::Tensor nms_cpu(const at::Tensor& dets,
68 |                const at::Tensor& scores,
69 |                const float threshold) {
70 |   at::Tensor result;
71 |   AT_DISPATCH_FLOATING_TYPES(dets.type(), "nms", [&] {
72 |     result = nms_cpu_kernel<scalar_t>(dets, scores, threshold);
73 |   });
74 |   return result;
75 | }
76 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/csrc/cpu/vision.h:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #pragma once
 3 | #include <torch/extension.h>
 4 | 
 5 | 
 6 | at::Tensor ROIAlign_forward_cpu(const at::Tensor& input,
 7 |                                 const at::Tensor& rois,
 8 |                                 const float spatial_scale,
 9 |                                 const int pooled_height,
10 |                                 const int pooled_width,
11 |                                 const int sampling_ratio);
12 | 
13 | 
14 | at::Tensor nms_cpu(const at::Tensor& dets,
15 |                    const at::Tensor& scores,
16 |                    const float threshold);
17 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/csrc/nms.h:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #pragma once
 3 | #include "cpu/vision.h"
 4 | 
 5 | #ifdef WITH_CUDA
 6 | #include "cuda/vision.h"
 7 | #endif
 8 | 
 9 | 
10 | at::Tensor nms(const at::Tensor& dets,
11 |                const at::Tensor& scores,
12 |                const float threshold) {
13 | 
14 |   if (dets.type().is_cuda()) {
15 | #ifdef WITH_CUDA
16 |     // TODO raise error if not compiled with CUDA
17 |     if (dets.numel() == 0)
18 |       return at::empty({0}, dets.options().dtype(at::kLong).device(at::kCPU));
19 |     auto b = at::cat({dets, scores.unsqueeze(1)}, 1);
20 |     return nms_cuda(b, threshold);
21 | #else
22 |     AT_ERROR("Not compiled with GPU support");
23 | #endif
24 |   }
25 | 
26 |   at::Tensor result = nms_cpu(dets, scores, threshold);
27 |   return result;
28 | }
29 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/csrc/vision.cpp:
--------------------------------------------------------------------------------
 1 | // Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #include "nms.h"
 3 | #include "ROIAlign.h"
 4 | #include "ROIPool.h"
 5 | #include "SigmoidFocalLoss.h"
 6 | #include "deform_conv_cuda.h"
 7 | 
 8 | PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
 9 |   m.def("nms", &nms, "non-maximum suppression");
10 |   m.def("roi_align_forward", &ROIAlign_forward, "ROIAlign_forward");
11 |   m.def("roi_align_backward", &ROIAlign_backward, "ROIAlign_backward");
12 |   m.def("roi_pool_forward", &ROIPool_forward, "ROIPool_forward");
13 |   m.def("roi_pool_backward", &ROIPool_backward, "ROIPool_backward");
14 |   m.def("sigmoid_focalloss_forward", &SigmoidFocalLoss_forward, "SigmoidFocalLoss_forward");
15 |   m.def("sigmoid_focalloss_backward", &SigmoidFocalLoss_backward, "SigmoidFocalLoss_backward");
16 |   m.def("deform_conv_forward_cuda", &deform_conv_forward_cuda,
17 |         "deform forward (CUDA)");
18 |   m.def("deform_conv_backward_input_cuda", &deform_conv_backward_input_cuda,
19 |         "deform_conv_backward_input (CUDA)");
20 |   m.def("deform_conv_backward_parameters_cuda",
21 |         &deform_conv_backward_parameters_cuda,
22 |         "deform_conv_backward_parameters (CUDA)");
23 |   m.def("modulated_deform_conv_cuda_forward",
24 |         &modulated_deform_conv_cuda_forward,
25 |         "modulated deform conv forward (CUDA)");
26 |   m.def("modulated_deform_conv_cuda_backward",
27 |         &modulated_deform_conv_cuda_backward,
28 |         "modulated deform conv backward (CUDA)");
29 | }
30 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/README.md:
--------------------------------------------------------------------------------
 1 | # Setting Up Datasets
 2 | This file describes how to perform training on other datasets.
 3 | 
 4 | Only Pascal VOC dataset can be loaded from its original format and be outputted to Pascal style results currently.
 5 | 
 6 | We expect the annotations from other datasets be converted to COCO json format, and
 7 | the output will be in COCO-style. (i.e. AP, AP50, AP75, APs, APm, APl for bbox and segm)
 8 | 
 9 | ## Creating Symlinks for PASCAL VOC
10 | 
11 | We assume that your symlinked `datasets/voc/VOC<year>` directory has the following structure:
12 | 
13 | ```
14 | VOC<year>
15 | |_ JPEGImages
16 | |  |_ <im-1-name>.jpg
17 | |  |_ ...
18 | |  |_ <im-N-name>.jpg
19 | |_ Annotations
20 | |  |_ pascal_train<year>.json (optional)
21 | |  |_ pascal_val<year>.json (optional)
22 | |  |_ pascal_test<year>.json (optional)
23 | |  |_ <im-1-name>.xml
24 | |  |_ ...
25 | |  |_ <im-N-name>.xml
26 | |_ VOCdevkit<year>
27 | ```
28 | 
29 | Create symlinks for `voc/VOC<year>`:
30 | 
31 | ```
32 | cd ~/github/maskrcnn-benchmark
33 | mkdir -p datasets/voc/VOC<year>
34 | ln -s /path/to/VOC<year> /datasets/voc/VOC<year>
35 | ```
36 | Example configuration files for PASCAL VOC could be found [here](https://github.com/facebookresearch/maskrcnn-benchmark/blob/master/configs/pascal_voc/).
37 | 
38 | ### PASCAL VOC Annotations in COCO Format
39 | To output COCO-style evaluation result, PASCAL VOC annotations in COCO json format is required and could be downloaded from [here](https://storage.googleapis.com/coco-dataset/external/PASCAL_VOC.zip)
40 | via http://cocodataset.org/#external.
41 | 
42 | ## Creating Symlinks for Cityscapes:
43 | 
44 | We assume that your symlinked `datasets/cityscapes` directory has the following structure:
45 | 
46 | ```
47 | cityscapes
48 | |_ images
49 | |  |_ <im-1-name>.jpg
50 | |  |_ ...
51 | |  |_ <im-N-name>.jpg
52 | |_ annotations
53 | |  |_ instanceonly_gtFile_train.json
54 | |  |_ ...
55 | |_ raw
56 |    |_ gtFine
57 |    |_ ...
58 |    |_ README.md
59 | ```
60 | 
61 | Create symlinks for `cityscapes`:
62 | 
63 | ```
64 | cd ~/github/maskrcnn-benchmark
65 | mkdir -p datasets/cityscapes
66 | ln -s /path/to/cityscapes datasets/data/cityscapes
67 | ```
68 | 
69 | ### Steps to convert Cityscapes Annotations to COCO Format
70 | 1. Download gtFine_trainvaltest.zip from https://www.cityscapes-dataset.com/downloads/ (login required)
71 | 2. Extract it to /path/to/gtFine_trainvaltest
72 | ```
73 | cityscapes
74 | |_ gtFine_trainvaltest.zip
75 | |_ gtFine_trainvaltest
76 |    |_ gtFine
77 | ```
78 | 3. Run the below commands to convert the annotations
79 | 
80 | ```
81 | cd ~/github
82 | git clone https://github.com/mcordts/cityscapesScripts.git
83 | cd cityscapesScripts
84 | cp ~/github/maskrcnn-benchmark/tools/cityscapes/instances2dict_with_polygons.py cityscapesscripts/evaluation
85 | python setup.py install
86 | cd ~/github/maskrcnn-benchmark
87 | python tools/cityscapes/convert_cityscapes_to_coco.py --datadir /path/to/cityscapes --outdir /path/to/cityscapes/annotations
88 | ```
89 | 
90 | Example configuration files for Cityscapes could be found [here](https://github.com/facebookresearch/maskrcnn-benchmark/blob/master/configs/cityscapes/).
91 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .build import make_data_loader
3 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/collate_batch.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from maskrcnn_benchmark.structures.image_list import to_image_list
 3 | 
 4 | 
 5 | class BatchCollator(object):
 6 |     """
 7 |     From a list of samples from the dataset,
 8 |     returns the batched images and targets.
 9 |     This should be passed to the DataLoader
10 |     """
11 | 
12 |     def __init__(self, size_divisible=0):
13 |         self.size_divisible = size_divisible
14 | 
15 |     def __call__(self, batch):
16 |         transposed_batch = list(zip(*batch))
17 |         images = to_image_list(transposed_batch[0], self.size_divisible)
18 |         targets = transposed_batch[1]
19 |         img_ids = transposed_batch[2]
20 |         return images, targets, img_ids
21 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/datasets/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .coco import COCODataset
3 | from .voc import PascalVOCDataset
4 | from .concat_dataset import ConcatDataset
5 | 
6 | __all__ = ["COCODataset", "ConcatDataset", "PascalVOCDataset"]
7 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/datasets/concat_dataset.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import bisect
 3 | 
 4 | from torch.utils.data.dataset import ConcatDataset as _ConcatDataset
 5 | 
 6 | 
 7 | class ConcatDataset(_ConcatDataset):
 8 |     """
 9 |     Same as torch.utils.data.dataset.ConcatDataset, but exposes an extra
10 |     method for querying the sizes of the image
11 |     """
12 | 
13 |     def get_idxs(self, idx):
14 |         dataset_idx = bisect.bisect_right(self.cumulative_sizes, idx)
15 |         if dataset_idx == 0:
16 |             sample_idx = idx
17 |         else:
18 |             sample_idx = idx - self.cumulative_sizes[dataset_idx - 1]
19 |         return dataset_idx, sample_idx
20 | 
21 |     def get_img_info(self, idx):
22 |         dataset_idx, sample_idx = self.get_idxs(idx)
23 |         return self.datasets[dataset_idx].get_img_info(sample_idx)
24 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/datasets/evaluation/__init__.py:
--------------------------------------------------------------------------------
 1 | from maskrcnn_benchmark.data import datasets
 2 | 
 3 | from .coco import coco_evaluation
 4 | from .voc import voc_evaluation
 5 | 
 6 | 
 7 | def evaluate(dataset, predictions, output_folder, **kwargs):
 8 |     """evaluate dataset using different methods based on dataset type.
 9 |     Args:
10 |         dataset: Dataset object
11 |         predictions(list[BoxList]): each item in the list represents the
12 |             prediction results for one image.
13 |         output_folder: output folder, to save evaluation files or results.
14 |         **kwargs: other args.
15 |     Returns:
16 |         evaluation result
17 |     """
18 |     args = dict(
19 |         dataset=dataset, predictions=predictions, output_folder=output_folder, **kwargs
20 |     )
21 |     if isinstance(dataset, datasets.COCODataset):
22 |         return coco_evaluation(**args)
23 |     elif isinstance(dataset, datasets.PascalVOCDataset):
24 |         return voc_evaluation(**args)
25 |     else:
26 |         dataset_name = dataset.__class__.__name__
27 |         raise NotImplementedError("Unsupported dataset type {}.".format(dataset_name))
28 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/datasets/evaluation/coco/__init__.py:
--------------------------------------------------------------------------------
 1 | from .coco_eval import do_coco_evaluation
 2 | 
 3 | 
 4 | def coco_evaluation(
 5 |     dataset,
 6 |     predictions,
 7 |     output_folder,
 8 |     box_only,
 9 |     iou_types,
10 |     expected_results,
11 |     expected_results_sigma_tol,
12 | ):
13 |     return do_coco_evaluation(
14 |         dataset=dataset,
15 |         predictions=predictions,
16 |         box_only=box_only,
17 |         output_folder=output_folder,
18 |         iou_types=iou_types,
19 |         expected_results=expected_results,
20 |         expected_results_sigma_tol=expected_results_sigma_tol,
21 |     )
22 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/datasets/evaluation/voc/__init__.py:
--------------------------------------------------------------------------------
 1 | import logging
 2 | 
 3 | from .voc_eval import do_voc_evaluation
 4 | 
 5 | 
 6 | def voc_evaluation(dataset, predictions, output_folder, box_only, **_):
 7 |     logger = logging.getLogger("maskrcnn_benchmark.inference")
 8 |     if box_only:
 9 |         logger.warning("voc evaluation doesn't support box_only, ignored.")
10 |     logger.info("performing voc evaluation, ignored iou_types.")
11 |     return do_voc_evaluation(
12 |         dataset=dataset,
13 |         predictions=predictions,
14 |         output_folder=output_folder,
15 |         logger=logger,
16 |     )
17 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/datasets/list_dataset.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | """
 3 | Simple dataset class that wraps a list of path names
 4 | """
 5 | 
 6 | from PIL import Image
 7 | 
 8 | from maskrcnn_benchmark.structures.bounding_box import BoxList
 9 | 
10 | 
11 | class ListDataset(object):
12 |     def __init__(self, image_lists, transforms=None):
13 |         self.image_lists = image_lists
14 |         self.transforms = transforms
15 | 
16 |     def __getitem__(self, item):
17 |         img = Image.open(self.image_lists[item]).convert("RGB")
18 | 
19 |         # dummy target
20 |         w, h = img.size
21 |         target = BoxList([[0, 0, w, h]], img.size, mode="xyxy")
22 | 
23 |         if self.transforms is not None:
24 |             img, target = self.transforms(img, target)
25 | 
26 |         return img, target
27 | 
28 |     def __len__(self):
29 |         return len(self.image_lists)
30 | 
31 |     def get_img_info(self, item):
32 |         """
33 |         Return the image dimensions for the image, without
34 |         loading and pre-processing it
35 |         """
36 |         pass
37 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/samplers/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .distributed import DistributedSampler
3 | from .grouped_batch_sampler import GroupedBatchSampler
4 | from .iteration_based_batch_sampler import IterationBasedBatchSampler
5 | 
6 | __all__ = ["DistributedSampler", "GroupedBatchSampler", "IterationBasedBatchSampler"]
7 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/samplers/distributed.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | # Code is copy-pasted exactly as in torch.utils.data.distributed.
 3 | # FIXME remove this once c10d fixes the bug it has
 4 | import math
 5 | import torch
 6 | import torch.distributed as dist
 7 | from torch.utils.data.sampler import Sampler
 8 | 
 9 | 
10 | class DistributedSampler(Sampler):
11 |     """Sampler that restricts data loading to a subset of the dataset.
12 |     It is especially useful in conjunction with
13 |     :class:`torch.nn.parallel.DistributedDataParallel`. In such case, each
14 |     process can pass a DistributedSampler instance as a DataLoader sampler,
15 |     and load a subset of the original dataset that is exclusive to it.
16 |     .. note::
17 |         Dataset is assumed to be of constant size.
18 |     Arguments:
19 |         dataset: Dataset used for sampling.
20 |         num_replicas (optional): Number of processes participating in
21 |             distributed training.
22 |         rank (optional): Rank of the current process within num_replicas.
23 |     """
24 | 
25 |     def __init__(self, dataset, num_replicas=None, rank=None, shuffle=True):
26 |         if num_replicas is None:
27 |             if not dist.is_available():
28 |                 raise RuntimeError("Requires distributed package to be available")
29 |             num_replicas = dist.get_world_size()
30 |         if rank is None:
31 |             if not dist.is_available():
32 |                 raise RuntimeError("Requires distributed package to be available")
33 |             rank = dist.get_rank()
34 |         self.dataset = dataset
35 |         self.num_replicas = num_replicas
36 |         self.rank = rank
37 |         self.epoch = 0
38 |         self.num_samples = int(math.ceil(len(self.dataset) * 1.0 / self.num_replicas))
39 |         self.total_size = self.num_samples * self.num_replicas
40 |         self.shuffle = shuffle
41 | 
42 |     def __iter__(self):
43 |         if self.shuffle:
44 |             # deterministically shuffle based on epoch
45 |             g = torch.Generator()
46 |             g.manual_seed(self.epoch)
47 |             indices = torch.randperm(len(self.dataset), generator=g).tolist()
48 |         else:
49 |             indices = torch.arange(len(self.dataset)).tolist()
50 | 
51 |         # add extra samples to make it evenly divisible
52 |         indices += indices[: (self.total_size - len(indices))]
53 |         assert len(indices) == self.total_size
54 | 
55 |         # subsample
56 |         offset = self.num_samples * self.rank
57 |         indices = indices[offset : offset + self.num_samples]
58 |         assert len(indices) == self.num_samples
59 | 
60 |         return iter(indices)
61 | 
62 |     def __len__(self):
63 |         return self.num_samples
64 | 
65 |     def set_epoch(self, epoch):
66 |         self.epoch = epoch
67 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/samplers/iteration_based_batch_sampler.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from torch.utils.data.sampler import BatchSampler
 3 | 
 4 | 
 5 | class IterationBasedBatchSampler(BatchSampler):
 6 |     """
 7 |     Wraps a BatchSampler, resampling from it until
 8 |     a specified number of iterations have been sampled
 9 |     """
10 | 
11 |     def __init__(self, batch_sampler, num_iterations, start_iter=0):
12 |         self.batch_sampler = batch_sampler
13 |         self.num_iterations = num_iterations
14 |         self.start_iter = start_iter
15 | 
16 |     def __iter__(self):
17 |         iteration = self.start_iter
18 |         while iteration <= self.num_iterations:
19 |             # if the underlying sampler has a set_epoch method, like
20 |             # DistributedSampler, used for making each process see
21 |             # a different split of the dataset, then set it
22 |             if hasattr(self.batch_sampler.sampler, "set_epoch"):
23 |                 self.batch_sampler.sampler.set_epoch(iteration)
24 |             for batch in self.batch_sampler:
25 |                 iteration += 1
26 |                 if iteration > self.num_iterations:
27 |                     break
28 |                 yield batch
29 | 
30 |     def __len__(self):
31 |         return self.num_iterations
32 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/transforms/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .transforms import Compose
3 | from .transforms import Resize
4 | from .transforms import RandomHorizontalFlip
5 | from .transforms import ToTensor
6 | from .transforms import Normalize
7 | 
8 | from .build import build_transforms
9 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/transforms/build.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from . import transforms as T
 3 | 
 4 | 
 5 | def build_transforms(cfg, is_train=True):
 6 |     if is_train:
 7 |         if cfg.INPUT.MIN_SIZE_RANGE_TRAIN[0] == -1:
 8 |             min_size = cfg.INPUT.MIN_SIZE_TRAIN
 9 |         else:
10 |             assert len(cfg.INPUT.MIN_SIZE_RANGE_TRAIN) == 2, \
11 |                 "MIN_SIZE_RANGE_TRAIN must have two elements (lower bound, upper bound)"
12 |             min_size = range(
13 |                 cfg.INPUT.MIN_SIZE_RANGE_TRAIN[0],
14 |                 cfg.INPUT.MIN_SIZE_RANGE_TRAIN[1] + 1
15 |             )
16 |         max_size = cfg.INPUT.MAX_SIZE_TRAIN
17 |         flip_prob = 0.5  # cfg.INPUT.FLIP_PROB_TRAIN
18 |     else:
19 |         min_size = cfg.INPUT.MIN_SIZE_TEST
20 |         max_size = cfg.INPUT.MAX_SIZE_TEST
21 |         flip_prob = 0
22 | 
23 |     to_bgr255 = cfg.INPUT.TO_BGR255
24 |     normalize_transform = T.Normalize(
25 |         mean=cfg.INPUT.PIXEL_MEAN, std=cfg.INPUT.PIXEL_STD, to_bgr255=to_bgr255
26 |     )
27 | 
28 |     transform = T.Compose(
29 |         [
30 |             T.Resize(min_size, max_size),
31 |             T.RandomHorizontalFlip(flip_prob),
32 |             T.ToTensor(),
33 |             normalize_transform,
34 |         ]
35 |     )
36 |     return transform
37 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/data/transforms/transforms.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import random
 3 | 
 4 | import torch
 5 | import torchvision
 6 | from torchvision.transforms import functional as F
 7 | 
 8 | 
 9 | class Compose(object):
10 |     def __init__(self, transforms):
11 |         self.transforms = transforms
12 | 
13 |     def __call__(self, image, target):
14 |         for t in self.transforms:
15 |             image, target = t(image, target)
16 |         return image, target
17 | 
18 |     def __repr__(self):
19 |         format_string = self.__class__.__name__ + "("
20 |         for t in self.transforms:
21 |             format_string += "\n"
22 |             format_string += "    {0}".format(t)
23 |         format_string += "\n)"
24 |         return format_string
25 | 
26 | 
27 | class Resize(object):
28 |     def __init__(self, min_size, max_size):
29 |         if not isinstance(min_size, (list, tuple)):
30 |             min_size = (min_size,)
31 |         self.min_size = min_size
32 |         self.max_size = max_size
33 | 
34 |     # modified from torchvision to add support for max size
35 |     def get_size(self, image_size):
36 |         w, h = image_size
37 |         size = random.choice(self.min_size)
38 |         max_size = self.max_size
39 |         if max_size is not None:
40 |             min_original_size = float(min((w, h)))
41 |             max_original_size = float(max((w, h)))
42 |             if max_original_size / min_original_size * size > max_size:
43 |                 size = int(round(max_size * min_original_size / max_original_size))
44 | 
45 |         if (w <= h and w == size) or (h <= w and h == size):
46 |             return (h, w)
47 | 
48 |         if w < h:
49 |             ow = size
50 |             oh = int(size * h / w)
51 |         else:
52 |             oh = size
53 |             ow = int(size * w / h)
54 | 
55 |         return (oh, ow)
56 | 
57 |     def __call__(self, image, target):
58 |         size = self.get_size(image.size)
59 |         image = F.resize(image, size)
60 |         target = target.resize(image.size)
61 |         return image, target
62 | 
63 | 
64 | class RandomHorizontalFlip(object):
65 |     def __init__(self, prob=0.5):
66 |         self.prob = prob
67 | 
68 |     def __call__(self, image, target):
69 |         if random.random() < self.prob:
70 |             image = F.hflip(image)
71 |             target = target.transpose(0)
72 |         return image, target
73 | 
74 | 
75 | class ToTensor(object):
76 |     def __call__(self, image, target):
77 |         return F.to_tensor(image), target
78 | 
79 | 
80 | class Normalize(object):
81 |     def __init__(self, mean, std, to_bgr255=True):
82 |         self.mean = mean
83 |         self.std = std
84 |         self.to_bgr255 = to_bgr255
85 | 
86 |     def __call__(self, image, target):
87 |         if self.to_bgr255:
88 |             image = image[[2, 1, 0]] * 255
89 |         image = F.normalize(image, mean=self.mean, std=self.std)
90 |         return image, target
91 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/engine/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/layers/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | from .batch_norm import FrozenBatchNorm2d
 5 | from .misc import Conv2d
 6 | from .misc import ConvTranspose2d
 7 | from .misc import BatchNorm2d
 8 | from .misc import interpolate
 9 | from .nms import nms
10 | from .roi_align import ROIAlign
11 | from .roi_align import roi_align
12 | from .roi_pool import ROIPool
13 | from .roi_pool import roi_pool
14 | from .smooth_l1_loss import smooth_l1_loss
15 | from .sigmoid_focal_loss import SigmoidFocalLoss
16 | from .iou_loss import IOULoss
17 | from .scale import Scale
18 | from .deform_conv import ModulatedDeformConvPack
19 | from .deform_conv import DeformConvPack
20 | 
21 | __all__ = ["nms", "roi_align", "ROIAlign", "roi_pool", "ROIPool",
22 |            "smooth_l1_loss", "Conv2d", "ConvTranspose2d", "interpolate",
23 |            "BatchNorm2d", "FrozenBatchNorm2d", "SigmoidFocalLoss", "IOULoss",
24 |            "Scale", "ModulatedDeformConvPack", "DeformConvPack"]
25 | 
26 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/layers/_utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import glob
 3 | import os.path
 4 | 
 5 | import torch
 6 | 
 7 | try:
 8 |     from torch.utils.cpp_extension import load as load_ext
 9 |     from torch.utils.cpp_extension import CUDA_HOME
10 | except ImportError:
11 |     raise ImportError("The cpp layer extensions requires PyTorch 0.4 or higher")
12 | 
13 | 
14 | def _load_C_extensions():
15 |     this_dir = os.path.dirname(os.path.abspath(__file__))
16 |     this_dir = os.path.dirname(this_dir)
17 |     this_dir = os.path.join(this_dir, "csrc")
18 | 
19 |     main_file = glob.glob(os.path.join(this_dir, "*.cpp"))
20 |     source_cpu = glob.glob(os.path.join(this_dir, "cpu", "*.cpp"))
21 |     source_cuda = glob.glob(os.path.join(this_dir, "cuda", "*.cu"))
22 | 
23 |     source = main_file + source_cpu
24 | 
25 |     extra_cflags = []
26 |     if torch.cuda.is_available() and CUDA_HOME is not None:
27 |         source.extend(source_cuda)
28 |         extra_cflags = ["-DWITH_CUDA"]
29 |     source = [os.path.join(this_dir, s) for s in source]
30 |     extra_include_paths = [this_dir]
31 |     return load_ext(
32 |         "torchvision",
33 |         source,
34 |         extra_cflags=extra_cflags,
35 |         extra_include_paths=extra_include_paths,
36 |     )
37 | 
38 | 
39 | _C = _load_C_extensions()
40 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/layers/batch_norm.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | from torch import nn
 4 | 
 5 | 
 6 | class FrozenBatchNorm2d(nn.Module):
 7 |     """
 8 |     BatchNorm2d where the batch statistics and the affine parameters
 9 |     are fixed
10 |     """
11 | 
12 |     def __init__(self, n):
13 |         super(FrozenBatchNorm2d, self).__init__()
14 |         self.register_buffer("weight", torch.ones(n))
15 |         self.register_buffer("bias", torch.zeros(n))
16 |         self.register_buffer("running_mean", torch.zeros(n))
17 |         self.register_buffer("running_var", torch.ones(n))
18 | 
19 |     def forward(self, x):
20 |         scale = self.weight * self.running_var.rsqrt()
21 |         bias = self.bias - self.running_mean * scale
22 |         scale = scale.reshape(1, -1, 1, 1)
23 |         bias = bias.reshape(1, -1, 1, 1)
24 |         return x * scale + bias
25 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/layers/iou_loss.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from torch import nn
 3 | 
 4 | 
 5 | class IOULoss(nn.Module):
 6 |     def forward(self, pred, target, weight=None):
 7 |         pred_left = pred[:, 0]
 8 |         pred_top = pred[:, 1]
 9 |         pred_right = pred[:, 2]
10 |         pred_bottom = pred[:, 3]
11 | 
12 |         target_left = target[:, 0]
13 |         target_top = target[:, 1]
14 |         target_right = target[:, 2]
15 |         target_bottom = target[:, 3]
16 | 
17 |         target_aera = (target_left + target_right) * \
18 |                       (target_top + target_bottom)
19 |         pred_aera = (pred_left + pred_right) * \
20 |                     (pred_top + pred_bottom)
21 | 
22 |         w_intersect = torch.min(pred_left, target_left) + \
23 |                       torch.min(pred_right, target_right)
24 |         h_intersect = torch.min(pred_bottom, target_bottom) + \
25 |                       torch.min(pred_top, target_top)
26 | 
27 |         area_intersect = w_intersect * h_intersect
28 |         area_union = target_aera + pred_aera - area_intersect
29 | 
30 |         losses = -torch.log((area_intersect + 1.0) / (area_union + 1.0))
31 | 
32 |         if weight is not None and weight.sum() > 0:
33 |             return (losses * weight).sum() / weight.sum()
34 |         else:
35 |             assert losses.numel() != 0
36 |             return losses.mean()
37 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/layers/nms.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | # from ._utils import _C
3 | from maskrcnn_benchmark import _C
4 | 
5 | nms = _C.nms
6 | # nms.__doc__ = """
7 | # This function performs Non-maximum suppresion"""
8 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/layers/roi_align.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | from torch import nn
 4 | from torch.autograd import Function
 5 | from torch.autograd.function import once_differentiable
 6 | from torch.nn.modules.utils import _pair
 7 | 
 8 | from maskrcnn_benchmark import _C
 9 | 
10 | 
11 | class _ROIAlign(Function):
12 |     @staticmethod
13 |     def forward(ctx, input, roi, output_size, spatial_scale, sampling_ratio):
14 |         ctx.save_for_backward(roi)
15 |         ctx.output_size = _pair(output_size)
16 |         ctx.spatial_scale = spatial_scale
17 |         ctx.sampling_ratio = sampling_ratio
18 |         ctx.input_shape = input.size()
19 |         output = _C.roi_align_forward(
20 |             input, roi, spatial_scale, output_size[0], output_size[1], sampling_ratio
21 |         )
22 |         return output
23 | 
24 |     @staticmethod
25 |     @once_differentiable
26 |     def backward(ctx, grad_output):
27 |         rois, = ctx.saved_tensors
28 |         output_size = ctx.output_size
29 |         spatial_scale = ctx.spatial_scale
30 |         sampling_ratio = ctx.sampling_ratio
31 |         bs, ch, h, w = ctx.input_shape
32 |         grad_input = _C.roi_align_backward(
33 |             grad_output,
34 |             rois,
35 |             spatial_scale,
36 |             output_size[0],
37 |             output_size[1],
38 |             bs,
39 |             ch,
40 |             h,
41 |             w,
42 |             sampling_ratio,
43 |         )
44 |         return grad_input, None, None, None, None
45 | 
46 | 
47 | roi_align = _ROIAlign.apply
48 | 
49 | 
50 | class ROIAlign(nn.Module):
51 |     def __init__(self, output_size, spatial_scale, sampling_ratio):
52 |         super(ROIAlign, self).__init__()
53 |         self.output_size = output_size
54 |         self.spatial_scale = spatial_scale
55 |         self.sampling_ratio = sampling_ratio
56 | 
57 |     def forward(self, input, rois):
58 |         return roi_align(
59 |             input, rois, self.output_size, self.spatial_scale, self.sampling_ratio
60 |         )
61 | 
62 |     def __repr__(self):
63 |         tmpstr = self.__class__.__name__ + "("
64 |         tmpstr += "output_size=" + str(self.output_size)
65 |         tmpstr += ", spatial_scale=" + str(self.spatial_scale)
66 |         tmpstr += ", sampling_ratio=" + str(self.sampling_ratio)
67 |         tmpstr += ")"
68 |         return tmpstr
69 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/layers/roi_pool.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | from torch import nn
 4 | from torch.autograd import Function
 5 | from torch.autograd.function import once_differentiable
 6 | from torch.nn.modules.utils import _pair
 7 | 
 8 | from maskrcnn_benchmark import _C
 9 | 
10 | 
11 | class _ROIPool(Function):
12 |     @staticmethod
13 |     def forward(ctx, input, roi, output_size, spatial_scale):
14 |         ctx.output_size = _pair(output_size)
15 |         ctx.spatial_scale = spatial_scale
16 |         ctx.input_shape = input.size()
17 |         output, argmax = _C.roi_pool_forward(
18 |             input, roi, spatial_scale, output_size[0], output_size[1]
19 |         )
20 |         ctx.save_for_backward(input, roi, argmax)
21 |         return output
22 | 
23 |     @staticmethod
24 |     @once_differentiable
25 |     def backward(ctx, grad_output):
26 |         input, rois, argmax = ctx.saved_tensors
27 |         output_size = ctx.output_size
28 |         spatial_scale = ctx.spatial_scale
29 |         bs, ch, h, w = ctx.input_shape
30 |         grad_input = _C.roi_pool_backward(
31 |             grad_output,
32 |             input,
33 |             rois,
34 |             argmax,
35 |             spatial_scale,
36 |             output_size[0],
37 |             output_size[1],
38 |             bs,
39 |             ch,
40 |             h,
41 |             w,
42 |         )
43 |         return grad_input, None, None, None
44 | 
45 | 
46 | roi_pool = _ROIPool.apply
47 | 
48 | 
49 | class ROIPool(nn.Module):
50 |     def __init__(self, output_size, spatial_scale):
51 |         super(ROIPool, self).__init__()
52 |         self.output_size = output_size
53 |         self.spatial_scale = spatial_scale
54 | 
55 |     def forward(self, input, rois):
56 |         return roi_pool(input, rois, self.output_size, self.spatial_scale)
57 | 
58 |     def __repr__(self):
59 |         tmpstr = self.__class__.__name__ + "("
60 |         tmpstr += "output_size=" + str(self.output_size)
61 |         tmpstr += ", spatial_scale=" + str(self.spatial_scale)
62 |         tmpstr += ")"
63 |         return tmpstr
64 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/layers/scale.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from torch import nn
 3 | 
 4 | 
 5 | class Scale(nn.Module):
 6 |     def __init__(self, init_value=1.0):
 7 |         super(Scale, self).__init__()
 8 |         self.scale = nn.Parameter(torch.FloatTensor([init_value]))
 9 | 
10 |     def forward(self, input):
11 |         return input * self.scale
12 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/layers/sigmoid_focal_loss.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from torch import nn
 3 | from torch.autograd import Function
 4 | from torch.autograd.function import once_differentiable
 5 | 
 6 | from maskrcnn_benchmark import _C
 7 | 
 8 | # TODO: Use JIT to replace CUDA implementation in the future.
 9 | class _SigmoidFocalLoss(Function):
10 |     @staticmethod
11 |     def forward(ctx, logits, targets, gamma, alpha):
12 |         ctx.save_for_backward(logits, targets)
13 |         num_classes = logits.shape[1]
14 |         ctx.num_classes = num_classes
15 |         ctx.gamma = gamma
16 |         ctx.alpha = alpha
17 | 
18 |         losses = _C.sigmoid_focalloss_forward(
19 |             logits, targets, num_classes, gamma, alpha
20 |         )
21 |         return losses
22 | 
23 |     @staticmethod
24 |     @once_differentiable
25 |     def backward(ctx, d_loss):
26 |         logits, targets = ctx.saved_tensors
27 |         num_classes = ctx.num_classes
28 |         gamma = ctx.gamma
29 |         alpha = ctx.alpha
30 |         d_loss = d_loss.contiguous()
31 |         d_logits = _C.sigmoid_focalloss_backward(
32 |             logits, targets, d_loss, num_classes, gamma, alpha
33 |         )
34 |         return d_logits, None, None, None, None
35 | 
36 | 
37 | sigmoid_focal_loss_cuda = _SigmoidFocalLoss.apply
38 | 
39 | 
40 | def sigmoid_focal_loss_cpu(logits, targets, gamma, alpha):
41 |     num_classes = logits.shape[1]
42 |     gamma = gamma[0]
43 |     alpha = alpha[0]
44 |     dtype = targets.dtype
45 |     device = targets.device
46 |     class_range = torch.arange(1, num_classes+1, dtype=dtype, device=device).unsqueeze(0)
47 | 
48 |     t = targets.unsqueeze(1)
49 |     p = torch.sigmoid(logits)
50 |     term1 = (1 - p) ** gamma * torch.log(p)
51 |     term2 = p ** gamma * torch.log(1 - p)
52 |     return -(t == class_range).float() * term1 * alpha - ((t != class_range) * (t >= 0)).float() * term2 * (1 - alpha)
53 | 
54 | 
55 | class SigmoidFocalLoss(nn.Module):
56 |     def __init__(self, gamma, alpha):
57 |         super(SigmoidFocalLoss, self).__init__()
58 |         self.gamma = gamma
59 |         self.alpha = alpha
60 | 
61 |     def forward(self, logits, targets):
62 |         device = logits.device
63 |         if logits.is_cuda:
64 |             loss_func = sigmoid_focal_loss_cuda
65 |         else:
66 |             loss_func = sigmoid_focal_loss_cpu
67 | 
68 |         loss = loss_func(logits, targets, self.gamma, self.alpha)
69 |         return loss.sum()
70 | 
71 |     def __repr__(self):
72 |         tmpstr = self.__class__.__name__ + "("
73 |         tmpstr += "gamma=" + str(self.gamma)
74 |         tmpstr += ", alpha=" + str(self.alpha)
75 |         tmpstr += ")"
76 |         return tmpstr
77 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/layers/smooth_l1_loss.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | 
 5 | # TODO maybe push this to nn?
 6 | def smooth_l1_loss(input, target, beta=1. / 9, size_average=True, weight=None):
 7 |     """
 8 |     very similar to the smooth_l1_loss from pytorch, but with
 9 |     the extra beta parameter
10 |     """
11 |     input = torch.log(input)
12 |     target = torch.log(target)
13 |     n = torch.abs(input - target)
14 |     cond = n < beta
15 |     loss = torch.where(cond, 0.5 * n ** 2 / beta, n - 0.5 * beta)
16 |     if weight is not None and weight.sum() > 0:
17 |         return (loss * weight).sum() / weight.sum()
18 |     if size_average:
19 |         return loss.mean()
20 |     return loss.sum()
21 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/maskrcnn_benchmark/modeling/__init__.py


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/backbone/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .backbone import build_backbone
3 | from . import fbnet
4 | from . import segmentation
5 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/backbone/backbone.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from collections import OrderedDict
 3 | 
 4 | from torch import nn
 5 | 
 6 | from maskrcnn_benchmark.modeling import registry
 7 | from maskrcnn_benchmark.modeling.make_layers import conv_with_kaiming_uniform
 8 | from . import fpn as fpn_module
 9 | from . import resnet
10 | 
11 | 
12 | @registry.BACKBONES.register("R-50-C4")
13 | @registry.BACKBONES.register("R-50-C5")
14 | @registry.BACKBONES.register("R-101-C4")
15 | @registry.BACKBONES.register("R-101-C5")
16 | def build_resnet_backbone(cfg):
17 |     body = resnet.ResNet(cfg)
18 |     model = nn.Sequential(OrderedDict([("body", body)]))
19 |     model.out_channels = cfg.MODEL.RESNETS.BACKBONE_OUT_CHANNELS
20 |     return model
21 | 
22 | 
23 | @registry.BACKBONES.register("R-50-FPN")
24 | @registry.BACKBONES.register("R-101-FPN")
25 | @registry.BACKBONES.register("R-152-FPN")
26 | def build_resnet_fpn_backbone(cfg):
27 |     body = resnet.ResNet(cfg)
28 |     in_channels_stage2 = cfg.MODEL.RESNETS.RES2_OUT_CHANNELS
29 |     out_channels = cfg.MODEL.RESNETS.BACKBONE_OUT_CHANNELS
30 |     fpn = fpn_module.FPN(
31 |         in_channels_list=[
32 |             in_channels_stage2,
33 |             in_channels_stage2 * 2,
34 |             in_channels_stage2 * 4,
35 |             in_channels_stage2 * 8,
36 |         ],
37 |         out_channels=out_channels,
38 |         conv_block=conv_with_kaiming_uniform(
39 |             cfg.MODEL.FPN.USE_GN, cfg.MODEL.FPN.USE_RELU
40 |         ),
41 |         top_blocks=fpn_module.LastLevelMaxPool(),
42 |     )
43 |     model = nn.Sequential(OrderedDict([("body", body), ("fpn", fpn)]))
44 |     model.out_channels = out_channels
45 |     return model
46 | 
47 | 
48 | @registry.BACKBONES.register("R-50-FPN-RETINANET")
49 | @registry.BACKBONES.register("R-101-FPN-RETINANET")
50 | def build_resnet_fpn_p3p7_backbone(cfg):
51 |     body = resnet.ResNet(cfg)
52 |     in_channels_stage2 = cfg.MODEL.RESNETS.RES2_OUT_CHANNELS
53 |     out_channels = cfg.MODEL.RESNETS.BACKBONE_OUT_CHANNELS
54 |     only_p6 = cfg.MODEL.FPN.ONLY_P6
55 |     in_channels_p6p7 = in_channels_stage2 * 8 if cfg.MODEL.RETINANET.USE_C5 \
56 |         else out_channels
57 |     if cfg.MODEL.FPN.USE_P6P7:
58 |         top_blocks = fpn_module.LastLevelP6(in_channels_p6p7, out_channels) if only_p6 \
59 |             else fpn_module.LastLevelP6P7(in_channels_p6p7, out_channels)
60 |     else:
61 |         top_blocks = None
62 |     fpn = fpn_module.FPN(
63 |         in_channels_list=[
64 |             0,
65 |             in_channels_stage2 * 2,
66 |             in_channels_stage2 * 4,
67 |             in_channels_stage2 * 8,
68 |         ],
69 |         out_channels=out_channels,
70 |         conv_block=conv_with_kaiming_uniform(
71 |             cfg.MODEL.FPN.USE_GN, cfg.MODEL.FPN.USE_RELU
72 |         ),
73 |         top_blocks=top_blocks,
74 |         dense=cfg.MODEL.FPN.DENSE,
75 |         att_dense=cfg.MODEL.FPN.ATT_DENSE
76 |     )
77 |     model = nn.Sequential(OrderedDict([("body", body), ("fpn", fpn)]))
78 |     model.out_channels = out_channels
79 |     return model
80 | 
81 | 
82 | def build_backbone(cfg):
83 |     assert cfg.MODEL.BACKBONE.CONV_BODY in registry.BACKBONES, \
84 |         "cfg.MODEL.BACKBONE.CONV_BODY: {} are not registered in registry".format(
85 |             cfg.MODEL.BACKBONE.CONV_BODY
86 |         )
87 |     return registry.BACKBONES[cfg.MODEL.BACKBONE.CONV_BODY](cfg)
88 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/backbone/src/checks.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include <ATen/ATen.h>
 4 | 
 5 | // Define AT_CHECK for old version of ATen where the same function was called AT_ASSERT
 6 | #ifndef AT_CHECK
 7 | #define AT_CHECK AT_ASSERT
 8 | #endif
 9 | 
10 | #define CHECK_CUDA(x) AT_CHECK((x).type().is_cuda(), #x " must be a CUDA tensor")
11 | #define CHECK_CPU(x) AT_CHECK(!(x).type().is_cuda(), #x " must be a CPU tensor")
12 | #define CHECK_CONTIGUOUS(x) AT_CHECK((x).is_contiguous(), #x " must be contiguous")
13 | 
14 | #define CHECK_CUDA_INPUT(x) CHECK_CUDA(x); CHECK_CONTIGUOUS(x)
15 | #define CHECK_CPU_INPUT(x) CHECK_CPU(x); CHECK_CONTIGUOUS(x)


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/backbone/src/inplace_abn.cpp:
--------------------------------------------------------------------------------
 1 | #include <torch/extension.h>
 2 | 
 3 | #include <vector>
 4 | 
 5 | #include "inplace_abn.h"
 6 | 
 7 | std::vector<at::Tensor> mean_var(at::Tensor x) {
 8 |   if (x.is_cuda()) {
 9 |     if (x.type().scalarType() == at::ScalarType::Half) {
10 |       return mean_var_cuda_h(x);
11 |     } else {
12 |       return mean_var_cuda(x);
13 |     }
14 |   } else {
15 |     return mean_var_cpu(x);
16 |   }
17 | }
18 | 
19 | at::Tensor forward(at::Tensor x, at::Tensor mean, at::Tensor var, at::Tensor weight, at::Tensor bias,
20 |                    bool affine, float eps) {
21 |   if (x.is_cuda()) {
22 |     if (x.type().scalarType() == at::ScalarType::Half) {
23 |       return forward_cuda_h(x, mean, var, weight, bias, affine, eps);
24 |     } else {
25 |       return forward_cuda(x, mean, var, weight, bias, affine, eps);
26 |     }
27 |   } else {
28 |     return forward_cpu(x, mean, var, weight, bias, affine, eps);
29 |   }
30 | }
31 | 
32 | std::vector<at::Tensor> edz_eydz(at::Tensor z, at::Tensor dz, at::Tensor weight, at::Tensor bias,
33 |                                  bool affine, float eps) {
34 |   if (z.is_cuda()) {
35 |     if (z.type().scalarType() == at::ScalarType::Half) {
36 |       return edz_eydz_cuda_h(z, dz, weight, bias, affine, eps);
37 |     } else {
38 |       return edz_eydz_cuda(z, dz, weight, bias, affine, eps);
39 | 	}
40 |   } else {
41 |     return edz_eydz_cpu(z, dz, weight, bias, affine, eps);
42 |   }
43 | }
44 | 
45 | at::Tensor backward(at::Tensor z, at::Tensor dz, at::Tensor var, at::Tensor weight, at::Tensor bias,
46 |                                  at::Tensor edz, at::Tensor eydz, bool affine, float eps) {
47 |   if (z.is_cuda()) {
48 |     if (z.type().scalarType() == at::ScalarType::Half) {
49 |       return backward_cuda_h(z, dz, var, weight, bias, edz, eydz, affine, eps);
50 | 	} else {
51 |       return backward_cuda(z, dz, var, weight, bias, edz, eydz, affine, eps);
52 |     }
53 |   } else {
54 |     return backward_cpu(z, dz, var, weight, bias, edz, eydz, affine, eps);
55 |   }
56 | }
57 | 
58 | void leaky_relu_forward(at::Tensor z, float slope) {
59 |   at::leaky_relu_(z, slope);
60 | }
61 | 
62 | void leaky_relu_backward(at::Tensor z, at::Tensor dz, float slope) {
63 |   if (z.is_cuda()) {
64 |     if (z.type().scalarType() == at::ScalarType::Half) {
65 |       return leaky_relu_backward_cuda_h(z, dz, slope);
66 | 	} else {
67 |       return leaky_relu_backward_cuda(z, dz, slope);
68 |     }
69 |   } else {
70 |     return leaky_relu_backward_cpu(z, dz, slope);
71 |   }
72 | }
73 | 
74 | void elu_forward(at::Tensor z) {
75 |   at::elu_(z);
76 | }
77 | 
78 | void elu_backward(at::Tensor z, at::Tensor dz) {
79 |   if (z.is_cuda()) {
80 |     return elu_backward_cuda(z, dz);
81 |   } else {
82 |     return elu_backward_cpu(z, dz);
83 |   }
84 | }
85 | 
86 | PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
87 |   m.def("mean_var", &mean_var, "Mean and variance computation");
88 |   m.def("forward", &forward, "In-place forward computation");
89 |   m.def("edz_eydz", &edz_eydz, "First part of backward computation");
90 |   m.def("backward", &backward, "Second part of backward computation");
91 |   m.def("leaky_relu_forward", &leaky_relu_forward, "Leaky relu forward computation");
92 |   m.def("leaky_relu_backward", &leaky_relu_backward, "Leaky relu backward computation and inversion");
93 |   m.def("elu_forward", &elu_forward, "Elu forward computation");
94 |   m.def("elu_backward", &elu_backward, "Elu backward computation and inversion");
95 | }
96 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/backbone/src/utils/checks.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include <ATen/ATen.h>
 4 | 
 5 | // Define AT_CHECK for old version of ATen where the same function was called AT_ASSERT
 6 | #ifndef AT_CHECK
 7 | #define AT_CHECK AT_ASSERT
 8 | #endif
 9 | 
10 | #define CHECK_CUDA(x) AT_CHECK((x).type().is_cuda(), #x " must be a CUDA tensor")
11 | #define CHECK_CPU(x) AT_CHECK(!(x).type().is_cuda(), #x " must be a CPU tensor")
12 | #define CHECK_CONTIGUOUS(x) AT_CHECK((x).is_contiguous(), #x " must be contiguous")
13 | 
14 | #define CHECK_CUDA_INPUT(x) CHECK_CUDA(x); CHECK_CONTIGUOUS(x)
15 | #define CHECK_CPU_INPUT(x) CHECK_CPU(x); CHECK_CONTIGUOUS(x)


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/backbone/src/utils/common.h:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | #include <ATen/ATen.h>
 4 | 
 5 | /*
 6 |  * Functions to share code between CPU and GPU
 7 |  */
 8 | 
 9 | #ifdef __CUDACC__
10 | // CUDA versions
11 | 
12 | #define HOST_DEVICE __host__ __device__
13 | #define INLINE_HOST_DEVICE __host__ __device__ inline
14 | #define FLOOR(x) floor(x)
15 | 
16 | #if __CUDA_ARCH__ >= 600
17 | // Recent compute capabilities have block-level atomicAdd for all data types, so we use that
18 | #define ACCUM(x,y) atomicAdd_block(&(x),(y))
19 | #else
20 | // Older architectures don't have block-level atomicAdd, nor atomicAdd for doubles, so we defer to atomicAdd for float
21 | // and use the known atomicCAS-based implementation for double
22 | template<typename data_t>
23 | __device__ inline data_t atomic_add(data_t *address, data_t val) {
24 |   return atomicAdd(address, val);
25 | }
26 | 
27 | template<>
28 | __device__ inline double atomic_add(double *address, double val) {
29 |   unsigned long long int* address_as_ull = (unsigned long long int*)address;
30 |   unsigned long long int old = *address_as_ull, assumed;
31 |   do {
32 |     assumed = old;
33 |     old = atomicCAS(address_as_ull, assumed, __double_as_longlong(val + __longlong_as_double(assumed)));
34 |   } while (assumed != old);
35 |   return __longlong_as_double(old);
36 | }
37 | 
38 | #define ACCUM(x,y) atomic_add(&(x),(y))
39 | #endif // #if __CUDA_ARCH__ >= 600
40 | 
41 | #else
42 | // CPU versions
43 | 
44 | #define HOST_DEVICE
45 | #define INLINE_HOST_DEVICE inline
46 | #define FLOOR(x) std::floor(x)
47 | #define ACCUM(x,y) (x) += (y)
48 | 
49 | #endif // #ifdef __CUDACC__


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/backbone/src/utils/cuda.cuh:
--------------------------------------------------------------------------------
 1 | #pragma once
 2 | 
 3 | /*
 4 |  * General settings and functions
 5 |  */
 6 | const int WARP_SIZE = 32;
 7 | const int MAX_BLOCK_SIZE = 1024;
 8 | 
 9 | static int getNumThreads(int nElem) {
10 |   int threadSizes[6] = {32, 64, 128, 256, 512, MAX_BLOCK_SIZE};
11 |   for (int i = 0; i < 6; ++i) {
12 |     if (nElem <= threadSizes[i]) {
13 |       return threadSizes[i];
14 |     }
15 |   }
16 |   return MAX_BLOCK_SIZE;
17 | }
18 | 
19 | /*
20 |  * Reduction utilities
21 |  */
22 | template <typename T>
23 | __device__ __forceinline__ T WARP_SHFL_XOR(T value, int laneMask, int width = warpSize,
24 |                                            unsigned int mask = 0xffffffff) {
25 | #if CUDART_VERSION >= 9000
26 |   return __shfl_xor_sync(mask, value, laneMask, width);
27 | #else
28 |   return __shfl_xor(value, laneMask, width);
29 | #endif
30 | }
31 | 
32 | __device__ __forceinline__ int getMSB(int val) { return 31 - __clz(val); }
33 | 
34 | template<typename T>
35 | struct Pair {
36 |   T v1, v2;
37 |   __device__ Pair() {}
38 |   __device__ Pair(T _v1, T _v2) : v1(_v1), v2(_v2) {}
39 |   __device__ Pair(T v) : v1(v), v2(v) {}
40 |   __device__ Pair(int v) : v1(v), v2(v) {}
41 |   __device__ Pair &operator+=(const Pair<T> &a) {
42 |     v1 += a.v1;
43 |     v2 += a.v2;
44 |     return *this;
45 |   }
46 | };
47 | 
48 | template<typename T>
49 | static __device__ __forceinline__ T warpSum(T val) {
50 | #if __CUDA_ARCH__ >= 300
51 |   for (int i = 0; i < getMSB(WARP_SIZE); ++i) {
52 |     val += WARP_SHFL_XOR(val, 1 << i, WARP_SIZE);
53 |   }
54 | #else
55 |   __shared__ T values[MAX_BLOCK_SIZE];
56 |   values[threadIdx.x] = val;
57 |   __threadfence_block();
58 |   const int base = (threadIdx.x / WARP_SIZE) * WARP_SIZE;
59 |   for (int i = 1; i < WARP_SIZE; i++) {
60 |     val += values[base + ((i + threadIdx.x) % WARP_SIZE)];
61 |   }
62 | #endif
63 |   return val;
64 | }
65 | 
66 | template<typename T>
67 | static __device__ __forceinline__ Pair<T> warpSum(Pair<T> value) {
68 |   value.v1 = warpSum(value.v1);
69 |   value.v2 = warpSum(value.v2);
70 |   return value;
71 | }


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/balanced_positive_negative_sampler.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | 
 5 | class BalancedPositiveNegativeSampler(object):
 6 |     """
 7 |     This class samples batches, ensuring that they contain a fixed proportion of positives
 8 |     """
 9 | 
10 |     def __init__(self, batch_size_per_image, positive_fraction):
11 |         """
12 |         Arguments:
13 |             batch_size_per_image (int): number of elements to be selected per image
14 |             positive_fraction (float): percentace of positive elements per batch
15 |         """
16 |         self.batch_size_per_image = batch_size_per_image
17 |         self.positive_fraction = positive_fraction
18 | 
19 |     def __call__(self, matched_idxs):
20 |         """
21 |         Arguments:
22 |             matched idxs: list of tensors containing -1, 0 or positive values.
23 |                 Each tensor corresponds to a specific image.
24 |                 -1 values are ignored, 0 are considered as negatives and > 0 as
25 |                 positives.
26 | 
27 |         Returns:
28 |             pos_idx (list[tensor])
29 |             neg_idx (list[tensor])
30 | 
31 |         Returns two lists of binary masks for each image.
32 |         The first list contains the positive elements that were selected,
33 |         and the second list the negative example.
34 |         """
35 |         pos_idx = []
36 |         neg_idx = []
37 |         for matched_idxs_per_image in matched_idxs:
38 |             positive = torch.nonzero(matched_idxs_per_image >= 1).squeeze(1)
39 |             negative = torch.nonzero(matched_idxs_per_image == 0).squeeze(1)
40 | 
41 |             num_pos = int(self.batch_size_per_image * self.positive_fraction)
42 |             # protect against not enough positive examples
43 |             num_pos = min(positive.numel(), num_pos)
44 |             num_neg = self.batch_size_per_image - num_pos
45 |             # protect against not enough negative examples
46 |             num_neg = min(negative.numel(), num_neg)
47 | 
48 |             # randomly select positive and negative examples
49 |             perm1 = torch.randperm(positive.numel(), device=positive.device)[:num_pos]
50 |             perm2 = torch.randperm(negative.numel(), device=negative.device)[:num_neg]
51 | 
52 |             pos_idx_per_image = positive[perm1]
53 |             neg_idx_per_image = negative[perm2]
54 | 
55 |             # create binary mask from indices
56 |             pos_idx_per_image_mask = torch.zeros_like(
57 |                 matched_idxs_per_image, dtype=torch.uint8
58 |             )
59 |             neg_idx_per_image_mask = torch.zeros_like(
60 |                 matched_idxs_per_image, dtype=torch.uint8
61 |             )
62 |             pos_idx_per_image_mask[pos_idx_per_image] = 1
63 |             neg_idx_per_image_mask[neg_idx_per_image] = 1
64 | 
65 |             pos_idx.append(pos_idx_per_image_mask)
66 |             neg_idx.append(neg_idx_per_image_mask)
67 | 
68 |         return pos_idx, neg_idx
69 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/detector/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .detectors import build_detection_model
3 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/detector/detectors.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from .generalized_rcnn import GeneralizedRCNN
 3 | 
 4 | 
 5 | _DETECTION_META_ARCHITECTURES = {"GeneralizedRCNN": GeneralizedRCNN}
 6 | 
 7 | 
 8 | def build_detection_model(cfg):
 9 |     meta_arch = _DETECTION_META_ARCHITECTURES[cfg.MODEL.META_ARCHITECTURE]
10 |     return meta_arch(cfg)
11 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/detector/generalized_rcnn.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | """
 3 | Implements the Generalized R-CNN framework
 4 | """
 5 | 
 6 | import torch
 7 | from torch import nn
 8 | import time
 9 | from maskrcnn_benchmark.structures.image_list import to_image_list
10 | 
11 | from ..backbone import build_backbone
12 | from ..rpn.rpn import build_rpn
13 | from ..roi_heads.roi_heads import build_roi_heads
14 | from ..backbone.segmentation import SegHead
15 | import os
16 | import numpy as np
17 | 
18 | 
19 | class GeneralizedRCNN(nn.Module):
20 |     """
21 |     Main class for Generalized R-CNN. Currently supports boxes and masks.
22 |     It consists of three main parts:
23 |     - backbone
24 |     - rpn
25 |     - heads: takes the features + the proposals from the RPN and computes
26 |         detections / masks from it.
27 |     """
28 | 
29 |     def __init__(self, cfg):
30 |         super(GeneralizedRCNN, self).__init__()
31 | 
32 |         self.backbone = build_backbone(cfg)
33 |         self.rpn = build_rpn(cfg, self.backbone.out_channels)
34 |         if cfg.MODEL.SEG_ON:
35 |             self.seg_heads = SegHead(cfg, self.backbone.out_channels)
36 |             #self.fpn_enhance = FPN_ENHANCE(self.backbone.out_channels)
37 |         else:
38 |             self.seg_heads = None
39 |         self.roi_heads = build_roi_heads(cfg, self.backbone.out_channels)
40 |         self.proposals_logger = open('proposal_log.txt', 'w') if os.path.exists('proposal_log.txt') else open('proposal_log.txt', 'a')
41 |         print(sum([p.numel() for p in self.parameters()]))
42 | 
43 |     def forward(self, images, targets=None):
44 |         """
45 |         Arguments:
46 |             images (list[Tensor] or ImageList): images to be processed
47 |             targets (list[BoxList]): ground-truth boxes present in the image (optional)
48 | 
49 |         Returns:
50 |             result (list[BoxList] or dict[Tensor]): the output from the model.
51 |                 During training, it returns a dict[Tensor] which contains the losses.
52 |                 During testing, it returns list[BoxList] contains additional fields
53 |                 like `scores`, `labels` and `mask` (for Mask R-CNN models).
54 | 
55 |         """
56 |         if self.training and targets is None:
57 |             raise ValueError("In training mode, targets should be passed")
58 |         images = to_image_list(images)
59 |         features = self.backbone(images.tensors)
60 |         if self.seg_heads is not None:
61 |             top_features = features[0]#.detach()  # DONE: do not use detach()! WYH
62 |             masks, seg_losses = self.seg_heads(top_features, targets)
63 |             torch.cuda.synchronize()
64 |             t3 = time.time() - start - t1 - t2
65 |         else:
66 |             masks = None; seg_losses = None
67 | 
68 |         proposals, proposal_losses = self.rpn(images,  features, targets, masks=masks)
69 | 
70 |         if self.roi_heads:
71 |             x, result, detector_losses = self.roi_heads(features, proposals, masks=masks, targets=targets)
72 |         else:
73 |             x = features
74 |             result = proposals
75 |             detector_losses = {}
76 |         if self.training:
77 |             losses = {}
78 |             losses.update(detector_losses)
79 |             losses.update(proposal_losses)
80 |             if seg_losses is not None:
81 |                 losses.update(seg_losses)
82 |             return losses
83 |         return result
84 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/registry.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | from maskrcnn_benchmark.utils.registry import Registry
 4 | 
 5 | BACKBONES = Registry()
 6 | RPN_HEADS = Registry()
 7 | ROI_BOX_FEATURE_EXTRACTORS = Registry()
 8 | ROI_BOX_PREDICTOR = Registry()
 9 | ROI_KEYPOINT_FEATURE_EXTRACTORS = Registry()
10 | ROI_KEYPOINT_PREDICTOR = Registry()
11 | ROI_MASK_FEATURE_EXTRACTORS = Registry()
12 | ROI_MASK_PREDICTOR = Registry()
13 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/roi_heads/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/maskrcnn_benchmark/modeling/roi_heads/__init__.py


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/roi_heads/box_head/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/maskrcnn_benchmark/modeling/roi_heads/box_head/__init__.py


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/roi_heads/box_head/box_head.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | from torch import nn
 4 | 
 5 | from .roi_box_feature_extractors import make_roi_box_feature_extractor
 6 | from .roi_box_predictors import make_roi_box_predictor
 7 | from .inference import make_roi_box_post_processor
 8 | from .loss import make_roi_box_loss_evaluator
 9 | 
10 | 
11 | class ROIBoxHead(torch.nn.Module):
12 |     """
13 |     Generic Box Head class.
14 |     """
15 | 
16 |     def __init__(self, cfg, in_channels):
17 |         super(ROIBoxHead, self).__init__()
18 |         self.feature_extractor = make_roi_box_feature_extractor(cfg, in_channels)
19 |         self.predictor = make_roi_box_predictor(
20 |             cfg, self.feature_extractor.out_channels)
21 |         self.post_processor = make_roi_box_post_processor(cfg)
22 |         self.loss_evaluator = make_roi_box_loss_evaluator(cfg)
23 | 
24 |     def forward(self, features, proposals, targets=None):
25 |         """
26 |         Arguments:
27 |             features (list[Tensor]): feature-maps from possibly several levels
28 |             proposals (list[BoxList]): proposal boxes
29 |             targets (list[BoxList], optional): the ground-truth targets.
30 | 
31 |         Returns:
32 |             x (Tensor): the result of the feature extractor
33 |             proposals (list[BoxList]): during training, the subsampled proposals
34 |                 are returned. During testing, the predicted boxlists are returned
35 |             losses (dict[Tensor]): During training, returns the losses for the
36 |                 head. During testing, returns an empty dict.
37 |         """
38 | 
39 |         if self.training:
40 |             # Faster R-CNN subsamples during training the proposals with a fixed
41 |             # positive / negative ratio
42 |             with torch.no_grad():
43 |                 proposals = self.loss_evaluator.subsample(proposals, targets)
44 | 
45 |         # extract features that will be fed to the final classifier. The
46 |         # feature_extractor generally corresponds to the pooler + heads
47 |         x = self.feature_extractor(features, proposals)
48 |         # final classifier that converts the features into predictions
49 |         class_logits, box_regression = self.predictor(x)
50 | 
51 |         if not self.training:
52 |             result = self.post_processor((class_logits, box_regression), proposals)
53 |             return x, result, {}
54 | 
55 |         loss_classifier, loss_box_reg = self.loss_evaluator(
56 |             [class_logits], [box_regression]
57 |         )
58 |         return (
59 |             x,
60 |             proposals,
61 |             dict(loss_classifier=loss_classifier, loss_box_reg=loss_box_reg),
62 |         )
63 | 
64 | 
65 | def build_roi_box_head(cfg, in_channels):
66 |     """
67 |     Constructs a new box head.
68 |     By default, uses ROIBoxHead, but if it turns out not to be enough, just register a new class
69 |     and make it a parameter in the config
70 |     """
71 |     return ROIBoxHead(cfg, in_channels)
72 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/roi_heads/box_head/roi_box_predictors.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from maskrcnn_benchmark.modeling import registry
 3 | from torch import nn
 4 | 
 5 | 
 6 | @registry.ROI_BOX_PREDICTOR.register("FastRCNNPredictor")
 7 | class FastRCNNPredictor(nn.Module):
 8 |     def __init__(self, config, in_channels):
 9 |         super(FastRCNNPredictor, self).__init__()
10 |         assert in_channels is not None
11 | 
12 |         num_inputs = in_channels
13 | 
14 |         num_classes = config.MODEL.ROI_BOX_HEAD.NUM_CLASSES
15 |         self.avgpool = nn.AdaptiveAvgPool2d(1)
16 |         self.cls_score = nn.Linear(num_inputs, num_classes)
17 |         num_bbox_reg_classes = 2 if config.MODEL.CLS_AGNOSTIC_BBOX_REG else num_classes
18 |         self.bbox_pred = nn.Linear(num_inputs, num_bbox_reg_classes * 4)
19 | 
20 |         nn.init.normal_(self.cls_score.weight, mean=0, std=0.01)
21 |         nn.init.constant_(self.cls_score.bias, 0)
22 | 
23 |         nn.init.normal_(self.bbox_pred.weight, mean=0, std=0.001)
24 |         nn.init.constant_(self.bbox_pred.bias, 0)
25 | 
26 |     def forward(self, x):
27 |         x = self.avgpool(x)
28 |         x = x.view(x.size(0), -1)
29 |         cls_logit = self.cls_score(x)
30 |         bbox_pred = self.bbox_pred(x)
31 |         return cls_logit, bbox_pred
32 | 
33 | 
34 | @registry.ROI_BOX_PREDICTOR.register("FPNPredictor")
35 | class FPNPredictor(nn.Module):
36 |     def __init__(self, cfg, in_channels):
37 |         super(FPNPredictor, self).__init__()
38 |         num_classes = cfg.MODEL.ROI_BOX_HEAD.NUM_CLASSES
39 |         representation_size = in_channels
40 | 
41 |         self.cls_score = nn.Linear(representation_size, num_classes)
42 |         num_bbox_reg_classes = 2 if cfg.MODEL.CLS_AGNOSTIC_BBOX_REG else num_classes
43 |         self.bbox_pred = nn.Linear(representation_size, num_bbox_reg_classes * 4)
44 | 
45 |         nn.init.normal_(self.cls_score.weight, std=0.01)
46 |         nn.init.normal_(self.bbox_pred.weight, std=0.001)
47 |         for l in [self.cls_score, self.bbox_pred]:
48 |             nn.init.constant_(l.bias, 0)
49 | 
50 |     def forward(self, x):
51 |         if x.ndimension() == 4:
52 |             assert list(x.shape[2:]) == [1, 1]
53 |             x = x.view(x.size(0), -1)
54 |         scores = self.cls_score(x)
55 |         bbox_deltas = self.bbox_pred(x)
56 | 
57 |         return scores, bbox_deltas
58 | 
59 | 
60 | def make_roi_box_predictor(cfg, in_channels):
61 |     func = registry.ROI_BOX_PREDICTOR[cfg.MODEL.ROI_BOX_HEAD.PREDICTOR]
62 |     return func(cfg, in_channels)
63 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/roi_heads/keypoint_head/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/maskrcnn_benchmark/modeling/roi_heads/keypoint_head/__init__.py


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/roi_heads/keypoint_head/keypoint_head.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | 
 3 | from .roi_keypoint_feature_extractors import make_roi_keypoint_feature_extractor
 4 | from .roi_keypoint_predictors import make_roi_keypoint_predictor
 5 | from .inference import make_roi_keypoint_post_processor
 6 | from .loss import make_roi_keypoint_loss_evaluator
 7 | 
 8 | 
 9 | class ROIKeypointHead(torch.nn.Module):
10 |     def __init__(self, cfg, in_channels):
11 |         super(ROIKeypointHead, self).__init__()
12 |         self.cfg = cfg.clone()
13 |         self.feature_extractor = make_roi_keypoint_feature_extractor(cfg, in_channels)
14 |         self.predictor = make_roi_keypoint_predictor(
15 |             cfg, self.feature_extractor.out_channels)
16 |         self.post_processor = make_roi_keypoint_post_processor(cfg)
17 |         self.loss_evaluator = make_roi_keypoint_loss_evaluator(cfg)
18 | 
19 |     def forward(self, features, proposals, targets=None):
20 |         """
21 |         Arguments:
22 |             features (list[Tensor]): feature-maps from possibly several levels
23 |             proposals (list[BoxList]): proposal boxes
24 |             targets (list[BoxList], optional): the ground-truth targets.
25 | 
26 |         Returns:
27 |             x (Tensor): the result of the feature extractor
28 |             proposals (list[BoxList]): during training, the original proposals
29 |                 are returned. During testing, the predicted boxlists are returned
30 |                 with the `mask` field set
31 |             losses (dict[Tensor]): During training, returns the losses for the
32 |                 head. During testing, returns an empty dict.
33 |         """
34 |         if self.training:
35 |             with torch.no_grad():
36 |                 proposals = self.loss_evaluator.subsample(proposals, targets)
37 | 
38 |         x = self.feature_extractor(features, proposals)
39 |         kp_logits = self.predictor(x)
40 | 
41 |         if not self.training:
42 |             result = self.post_processor(kp_logits, proposals)
43 |             return x, result, {}
44 | 
45 |         loss_kp = self.loss_evaluator(proposals, kp_logits)
46 | 
47 |         return x, proposals, dict(loss_kp=loss_kp)
48 | 
49 | 
50 | def build_roi_keypoint_head(cfg, in_channels):
51 |     return ROIKeypointHead(cfg, in_channels)
52 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/roi_heads/keypoint_head/roi_keypoint_feature_extractors.py:
--------------------------------------------------------------------------------
 1 | from torch import nn
 2 | from torch.nn import functional as F
 3 | 
 4 | from maskrcnn_benchmark.modeling import registry
 5 | from maskrcnn_benchmark.modeling.poolers import Pooler
 6 | 
 7 | from maskrcnn_benchmark.layers import Conv2d
 8 | 
 9 | 
10 | @registry.ROI_KEYPOINT_FEATURE_EXTRACTORS.register("KeypointRCNNFeatureExtractor")
11 | class KeypointRCNNFeatureExtractor(nn.Module):
12 |     def __init__(self, cfg, in_channels):
13 |         super(KeypointRCNNFeatureExtractor, self).__init__()
14 | 
15 |         resolution = cfg.MODEL.ROI_KEYPOINT_HEAD.POOLER_RESOLUTION
16 |         scales = cfg.MODEL.ROI_KEYPOINT_HEAD.POOLER_SCALES
17 |         sampling_ratio = cfg.MODEL.ROI_KEYPOINT_HEAD.POOLER_SAMPLING_RATIO
18 |         pooler = Pooler(
19 |             output_size=(resolution, resolution),
20 |             scales=scales,
21 |             sampling_ratio=sampling_ratio,
22 |         )
23 |         self.pooler = pooler
24 | 
25 |         input_features = in_channels
26 |         layers = cfg.MODEL.ROI_KEYPOINT_HEAD.CONV_LAYERS
27 |         next_feature = input_features
28 |         self.blocks = []
29 |         for layer_idx, layer_features in enumerate(layers, 1):
30 |             layer_name = "conv_fcn{}".format(layer_idx)
31 |             module = Conv2d(next_feature, layer_features, 3, stride=1, padding=1)
32 |             nn.init.kaiming_normal_(module.weight, mode="fan_out", nonlinearity="relu")
33 |             nn.init.constant_(module.bias, 0)
34 |             self.add_module(layer_name, module)
35 |             next_feature = layer_features
36 |             self.blocks.append(layer_name)
37 |         self.out_channels = layer_features
38 | 
39 |     def forward(self, x, proposals):
40 |         x = self.pooler(x, proposals)
41 |         for layer_name in self.blocks:
42 |             x = F.relu(getattr(self, layer_name)(x))
43 |         return x
44 | 
45 | 
46 | def make_roi_keypoint_feature_extractor(cfg, in_channels):
47 |     func = registry.ROI_KEYPOINT_FEATURE_EXTRACTORS[
48 |         cfg.MODEL.ROI_KEYPOINT_HEAD.FEATURE_EXTRACTOR
49 |     ]
50 |     return func(cfg, in_channels)
51 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/roi_heads/keypoint_head/roi_keypoint_predictors.py:
--------------------------------------------------------------------------------
 1 | from torch import nn
 2 | 
 3 | from maskrcnn_benchmark import layers
 4 | from maskrcnn_benchmark.modeling import registry
 5 | 
 6 | 
 7 | @registry.ROI_KEYPOINT_PREDICTOR.register("KeypointRCNNPredictor")
 8 | class KeypointRCNNPredictor(nn.Module):
 9 |     def __init__(self, cfg, in_channels):
10 |         super(KeypointRCNNPredictor, self).__init__()
11 |         input_features = in_channels
12 |         num_keypoints = cfg.MODEL.ROI_KEYPOINT_HEAD.NUM_CLASSES
13 |         deconv_kernel = 4
14 |         self.kps_score_lowres = layers.ConvTranspose2d(
15 |             input_features,
16 |             num_keypoints,
17 |             deconv_kernel,
18 |             stride=2,
19 |             padding=deconv_kernel // 2 - 1,
20 |         )
21 |         nn.init.kaiming_normal_(
22 |             self.kps_score_lowres.weight, mode="fan_out", nonlinearity="relu"
23 |         )
24 |         nn.init.constant_(self.kps_score_lowres.bias, 0)
25 |         self.up_scale = 2
26 |         self.out_channels = num_keypoints
27 | 
28 |     def forward(self, x):
29 |         x = self.kps_score_lowres(x)
30 |         x = layers.interpolate(
31 |             x, scale_factor=self.up_scale, mode="bilinear", align_corners=False
32 |         )
33 |         return x
34 | 
35 | 
36 | def make_roi_keypoint_predictor(cfg, in_channels):
37 |     func = registry.ROI_KEYPOINT_PREDICTOR[cfg.MODEL.ROI_KEYPOINT_HEAD.PREDICTOR]
38 |     return func(cfg, in_channels)
39 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/roi_heads/mask_head/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/maskrcnn_benchmark/modeling/roi_heads/mask_head/__init__.py


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/roi_heads/mask_head/roi_mask_predictors.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | from torch import nn
 4 | from torch.nn import functional as F
 5 | 
 6 | from maskrcnn_benchmark.layers import Conv2d
 7 | from maskrcnn_benchmark.layers import ConvTranspose2d
 8 | from maskrcnn_benchmark.modeling import registry
 9 | from maskrcnn_benchmark.modeling.poolers import Pooler
10 | 
11 | 
12 | @registry.ROI_MASK_PREDICTOR.register("MaskRCNNC4Predictor")
13 | class MaskRCNNC4Predictor(nn.Module):
14 |     def __init__(self, cfg, in_channels):
15 |         super(MaskRCNNC4Predictor, self).__init__()
16 |         num_classes = cfg.MODEL.ROI_BOX_HEAD.NUM_CLASSES
17 |         dim_reduced = cfg.MODEL.ROI_MASK_HEAD.CONV_LAYERS[-1]
18 |         num_inputs = in_channels
19 |         self.conv5_mask = ConvTranspose2d(num_inputs, dim_reduced, 2, 2, 0)
20 |         self.mask_fcn_logits = Conv2d(dim_reduced, num_classes, 1, 1, 0)
21 | 
22 |         for name, param in self.named_parameters():
23 |             if "bias" in name:
24 |                 nn.init.constant_(param, 0)
25 |             elif "weight" in name:
26 |                 # Caffe2 implementation uses MSRAFill, which in fact
27 |                 # corresponds to kaiming_normal_ in PyTorch
28 |                 nn.init.kaiming_normal_(param, mode="fan_out", nonlinearity="relu")
29 | 
30 |     def forward(self, x):
31 |         x = F.relu_(self.conv5_mask(x))
32 |         return self.mask_fcn_logits(x)
33 | 
34 | 
35 | @registry.ROI_MASK_PREDICTOR.register("MaskDecoderPredictor")
36 | class MaskDecoderPredictor(nn.Module):
37 |     def __init__(self, cfg, in_channels):
38 |         super(MaskDecoderPredictor, self).__init__()
39 |         num_classes = cfg.MODEL.ROI_BOX_HEAD.NUM_CLASSES
40 |         dim_reduced = cfg.MODEL.ROI_MASK_HEAD.CONV_LAYERS[-1]
41 |         num_inputs = in_channels
42 | 
43 |         self.mask_fcn_logits = Conv2d(dim_reduced, num_classes, 1, 1, 0)
44 | 
45 |         for name, param in self.named_parameters():
46 |             if "bias" in name:
47 |                 nn.init.constant_(param, 0)
48 |             elif "weight" in name:
49 |                 # Caffe2 implementation uses MSRAFill, which in fact
50 |                 # corresponds to kaiming_normal_ in PyTorch
51 |                 nn.init.kaiming_normal_(param, mode="fan_out", nonlinearity="relu")
52 | 
53 |     def forward(self, x):
54 |         return self.mask_fcn_logits(x)
55 | 
56 | 
57 | 
58 | @registry.ROI_MASK_PREDICTOR.register("MaskRCNNConv1x1Predictor")
59 | class MaskRCNNConv1x1Predictor(nn.Module):
60 |     def __init__(self, cfg, in_channels):
61 |         super(MaskRCNNConv1x1Predictor, self).__init__()
62 |         num_classes = cfg.MODEL.ROI_BOX_HEAD.NUM_CLASSES
63 |         num_inputs = in_channels
64 | 
65 |         self.mask_fcn_logits = Conv2d(num_inputs, num_classes, 1, 1, 0)
66 | 
67 |         for name, param in self.named_parameters():
68 |             if "bias" in name:
69 |                 nn.init.constant_(param, 0)
70 |             elif "weight" in name:
71 |                 # Caffe2 implementation uses MSRAFill, which in fact
72 |                 # corresponds to kaiming_normal_ in PyTorch
73 |                 nn.init.kaiming_normal_(param, mode="fan_out", nonlinearity="relu")
74 | 
75 |     def forward(self, x):
76 |         return self.mask_fcn_logits(x)
77 | 
78 | 
79 | def make_roi_mask_predictor(cfg, in_channels):
80 |     func = registry.ROI_MASK_PREDICTOR[cfg.MODEL.ROI_MASK_HEAD.PREDICTOR]
81 |     return func(cfg, in_channels)
82 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/rpn/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | # from .rpn import build_rpn
3 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/rpn/fcos-drop/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/maskrcnn_benchmark/modeling/rpn/fcos-drop/__init__.py


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/rpn/fcos/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/maskrcnn_benchmark/modeling/rpn/fcos/__init__.py


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/rpn/retinanet/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/maskrcnn_benchmark/modeling/rpn/retinanet/__init__.py


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/rpn/utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | """
 3 | Utility functions minipulating the prediction layers
 4 | """
 5 | 
 6 | from ..utils import cat
 7 | 
 8 | import torch
 9 | 
10 | def permute_and_flatten(layer, N, A, C, H, W):
11 |     layer = layer.view(N, -1, C, H, W)
12 |     layer = layer.permute(0, 3, 4, 1, 2)
13 |     layer = layer.reshape(N, -1, C)
14 |     return layer
15 | 
16 | 
17 | def concat_box_prediction_layers(box_cls, box_regression):
18 |     box_cls_flattened = []
19 |     box_regression_flattened = []
20 |     # for each feature level, permute the outputs to make them be in the
21 |     # same format as the labels. Note that the labels are computed for
22 |     # all feature levels concatenated, so we keep the same representation
23 |     # for the objectness and the box_regression
24 |     for box_cls_per_level, box_regression_per_level in zip(
25 |         box_cls, box_regression
26 |     ):
27 |         N, AxC, H, W = box_cls_per_level.shape
28 |         Ax4 = box_regression_per_level.shape[1]
29 |         A = Ax4 // 4
30 |         C = AxC // A
31 |         box_cls_per_level = permute_and_flatten(
32 |             box_cls_per_level, N, A, C, H, W
33 |         )
34 |         box_cls_flattened.append(box_cls_per_level)
35 | 
36 |         box_regression_per_level = permute_and_flatten(
37 |             box_regression_per_level, N, A, 4, H, W
38 |         )
39 |         box_regression_flattened.append(box_regression_per_level)
40 |     # concatenate on the first dimension (representing the feature levels), to
41 |     # take into account the way the labels were generated (with all feature maps
42 |     # being concatenated as well)
43 |     box_cls = cat(box_cls_flattened, dim=1).reshape(-1, C)
44 |     box_regression = cat(box_regression_flattened, dim=1).reshape(-1, 4)
45 |     return box_cls, box_regression
46 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/modeling/utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | """
 3 | Miscellaneous utility functions
 4 | """
 5 | 
 6 | import torch
 7 | 
 8 | 
 9 | def cat(tensors, dim=0):
10 |     """
11 |     Efficient version of torch.cat that avoids a copy if there is only a single element in a list
12 |     """
13 |     assert isinstance(tensors, (list, tuple))
14 |     if len(tensors) == 1:
15 |         return tensors[0]
16 |     return torch.cat(tensors, dim)
17 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/solver/__init__.py:
--------------------------------------------------------------------------------
1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
2 | from .build import make_optimizer
3 | from .build import make_lr_scheduler
4 | from .lr_scheduler import WarmupMultiStepLR
5 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/solver/build.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | from .lr_scheduler import WarmupMultiStepLR
 5 | 
 6 | 
 7 | def make_optimizer(cfg, model):
 8 |     params = []
 9 |     for key, value in model.named_parameters():
10 |         if not value.requires_grad:
11 |             continue
12 |         lr = cfg.SOLVER.BASE_LR
13 |         weight_decay = cfg.SOLVER.WEIGHT_DECAY
14 |         if "bias" in key:
15 |             lr = cfg.SOLVER.BASE_LR * cfg.SOLVER.BIAS_LR_FACTOR
16 |             weight_decay = cfg.SOLVER.WEIGHT_DECAY_BIAS
17 |         params += [{"params": [value], "lr": lr, "weight_decay": weight_decay}]
18 | 
19 |     optimizer = torch.optim.SGD(params, lr, momentum=cfg.SOLVER.MOMENTUM)
20 |     return optimizer
21 | 
22 | 
23 | def make_lr_scheduler(cfg, optimizer):
24 |     return WarmupMultiStepLR(
25 |         optimizer,
26 |         cfg.SOLVER.STEPS,
27 |         cfg.SOLVER.GAMMA,
28 |         warmup_factor=cfg.SOLVER.WARMUP_FACTOR,
29 |         warmup_iters=cfg.SOLVER.WARMUP_ITERS,
30 |         warmup_method=cfg.SOLVER.WARMUP_METHOD,
31 |     )
32 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/solver/lr_scheduler.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from bisect import bisect_right
 3 | 
 4 | import torch
 5 | 
 6 | 
 7 | # FIXME ideally this would be achieved with a CombinedLRScheduler,
 8 | # separating MultiStepLR with WarmupLR
 9 | # but the current LRScheduler design doesn't allow it
10 | class WarmupMultiStepLR(torch.optim.lr_scheduler._LRScheduler):
11 |     def __init__(
12 |         self,
13 |         optimizer,
14 |         milestones,
15 |         gamma=0.1,
16 |         warmup_factor=1.0 / 3,
17 |         warmup_iters=500,
18 |         warmup_method="linear",
19 |         last_epoch=-1,
20 |     ):
21 |         if not list(milestones) == sorted(milestones):
22 |             raise ValueError(
23 |                 "Milestones should be a list of" " increasing integers. Got {}",
24 |                 milestones,
25 |             )
26 | 
27 |         if warmup_method not in ("constant", "linear"):
28 |             raise ValueError(
29 |                 "Only 'constant' or 'linear' warmup_method accepted"
30 |                 "got {}".format(warmup_method)
31 |             )
32 |         self.milestones = milestones
33 |         self.gamma = gamma
34 |         self.warmup_factor = warmup_factor
35 |         self.warmup_iters = warmup_iters
36 |         self.warmup_method = warmup_method
37 |         super(WarmupMultiStepLR, self).__init__(optimizer, last_epoch)
38 | 
39 |     def get_lr(self):
40 |         warmup_factor = 1
41 |         if self.last_epoch < self.warmup_iters:
42 |             if self.warmup_method == "constant":
43 |                 warmup_factor = self.warmup_factor
44 |             elif self.warmup_method == "linear":
45 |                 alpha = float(self.last_epoch) / self.warmup_iters
46 |                 warmup_factor = self.warmup_factor * (1 - alpha) + alpha
47 |         return [
48 |             base_lr
49 |             * warmup_factor
50 |             * self.gamma ** bisect_right(self.milestones, self.last_epoch)
51 |             for base_lr in self.base_lrs
52 |         ]
53 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/structures/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/maskrcnn_benchmark/structures/__init__.py


--------------------------------------------------------------------------------
/maskrcnn_benchmark/structures/image_list.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from __future__ import division
 3 | 
 4 | import torch
 5 | 
 6 | 
 7 | class ImageList(object):
 8 |     """
 9 |     Structure that holds a list of images (of possibly
10 |     varying sizes) as a single tensor.
11 |     This works by padding the images to the same size,
12 |     and storing in a field the original sizes of each image
13 |     """
14 | 
15 |     def __init__(self, tensors, image_sizes):
16 |         """
17 |         Arguments:
18 |             tensors (tensor)
19 |             image_sizes (list[tuple[int, int]])
20 |         """
21 |         self.tensors = tensors
22 |         self.image_sizes = image_sizes
23 | 
24 |     def to(self, *args, **kwargs):
25 |         cast_tensor = self.tensors.to(*args, **kwargs)
26 |         return ImageList(cast_tensor, self.image_sizes)
27 | 
28 | 
29 | def to_image_list(tensors, size_divisible=0):
30 |     """
31 |     tensors can be an ImageList, a torch.Tensor or
32 |     an iterable of Tensors. It can't be a numpy array.
33 |     When tensors is an iterable of Tensors, it pads
34 |     the Tensors with zeros so that they have the same
35 |     shape
36 |     """
37 |     if isinstance(tensors, torch.Tensor) and size_divisible > 0:
38 |         tensors = [tensors]
39 | 
40 |     if isinstance(tensors, ImageList):
41 |         return tensors
42 |     elif isinstance(tensors, torch.Tensor):
43 |         # single tensor shape can be inferred
44 |         if tensors.dim() == 3:
45 |             tensors = tensors[None]
46 |         assert tensors.dim() == 4
47 |         image_sizes = [tensor.shape[-2:] for tensor in tensors]
48 |         return ImageList(tensors, image_sizes)
49 |     elif isinstance(tensors, (tuple, list)):
50 |         max_size = tuple(max(s) for s in zip(*[img.shape for img in tensors]))
51 | 
52 |         # TODO Ideally, just remove this and let me model handle arbitrary
53 |         # input sizs
54 |         if size_divisible > 0:
55 |             import math
56 | 
57 |             stride = size_divisible
58 |             max_size = list(max_size)
59 |             max_size[1] = int(math.ceil(max_size[1] / stride) * stride)
60 |             max_size[2] = int(math.ceil(max_size[2] / stride) * stride)
61 |             max_size = tuple(max_size)
62 | 
63 |         batch_shape = (len(tensors),) + max_size
64 |         batched_imgs = tensors[0].new(*batch_shape).zero_()
65 |         for img, pad_img in zip(tensors, batched_imgs):
66 |             pad_img[: img.shape[0], : img.shape[1], : img.shape[2]].copy_(img)
67 | 
68 |         image_sizes = [im.shape[-2:] for im in tensors]
69 | 
70 |         return ImageList(batched_imgs, image_sizes)
71 |     else:
72 |         raise TypeError("Unsupported type for to_image_list: {}".format(type(tensors)))
73 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/utils/README.md:
--------------------------------------------------------------------------------
1 | # Utility functions
2 | 
3 | This folder contain utility functions that are not used in the
4 | core library, but are useful for building models or training
5 | code using the config system.
6 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/utils/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/yuhuan-wu/RDPNet/3fa96438977143b5a2009e97353ab851630226a2/maskrcnn_benchmark/utils/__init__.py


--------------------------------------------------------------------------------
/maskrcnn_benchmark/utils/collect_env.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import PIL
 3 | 
 4 | from torch.utils.collect_env import get_pretty_env_info
 5 | 
 6 | 
 7 | def get_pil_version():
 8 |     return "\n        Pillow ({})".format(PIL.__version__)
 9 | 
10 | 
11 | def collect_env_info():
12 |     env_str = get_pretty_env_info()
13 |     env_str += get_pil_version()
14 |     return env_str
15 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/utils/cv2_util.py:
--------------------------------------------------------------------------------
 1 | """
 2 | Module for cv2 utility functions and maintaining version compatibility
 3 | between 3.x and 4.x
 4 | """
 5 | import cv2
 6 | 
 7 | 
 8 | def findContours(*args, **kwargs):
 9 |     """
10 |     Wraps cv2.findContours to maintain compatiblity between versions
11 |     3 and 4
12 | 
13 |     Returns:
14 |         contours, hierarchy
15 |     """
16 |     if cv2.__version__.startswith('4'):
17 |         contours, hierarchy = cv2.findContours(*args, **kwargs)
18 |     elif cv2.__version__.startswith('3'):
19 |         _, contours, hierarchy = cv2.findContours(*args, **kwargs)
20 |     else:
21 |         raise AssertionError(
22 |             'cv2 must be either version 3 or 4 to call this method')
23 | 
24 |     return contours, hierarchy
25 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/utils/env.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import os
 3 | 
 4 | from maskrcnn_benchmark.utils.imports import import_file
 5 | 
 6 | 
 7 | def setup_environment():
 8 |     """Perform environment setup work. The default setup is a no-op, but this
 9 |     function allows the user to specify a Python source file that performs
10 |     custom setup work that may be necessary to their computing environment.
11 |     """
12 |     custom_module_path = os.environ.get("TORCH_DETECTRON_ENV_MODULE")
13 |     if custom_module_path:
14 |         setup_custom_environment(custom_module_path)
15 |     else:
16 |         # The default setup is a no-op
17 |         pass
18 | 
19 | 
20 | def setup_custom_environment(custom_module_path):
21 |     """Load custom environment setup from a Python source file and run the setup
22 |     function.
23 |     """
24 |     module = import_file("maskrcnn_benchmark.utils.env.custom_module", custom_module_path)
25 |     assert hasattr(module, "setup_environment") and callable(
26 |         module.setup_environment
27 |     ), (
28 |         "Custom environment module defined in {} does not have the "
29 |         "required callable attribute 'setup_environment'."
30 |     ).format(
31 |         custom_module_path
32 |     )
33 |     module.setup_environment()
34 | 
35 | 
36 | # Force environment setup when this module is imported
37 | setup_environment()
38 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/utils/imports.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import torch
 3 | 
 4 | if torch._six.PY3:
 5 |     import importlib
 6 |     import importlib.util
 7 |     import sys
 8 | 
 9 | 
10 |     # from https://stackoverflow.com/questions/67631/how-to-import-a-module-given-the-full-path?utm_medium=organic&utm_source=google_rich_qa&utm_campaign=google_rich_qa
11 |     def import_file(module_name, file_path, make_importable=False):
12 |         spec = importlib.util.spec_from_file_location(module_name, file_path)
13 |         module = importlib.util.module_from_spec(spec)
14 |         spec.loader.exec_module(module)
15 |         if make_importable:
16 |             sys.modules[module_name] = module
17 |         return module
18 | else:
19 |     import imp
20 | 
21 |     def import_file(module_name, file_path, make_importable=None):
22 |         module = imp.load_source(module_name, file_path)
23 |         return module
24 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/utils/logger.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import logging
 3 | import os
 4 | import sys
 5 | 
 6 | 
 7 | def setup_logger(name, save_dir, distributed_rank, filename="log.txt"):
 8 |     logger = logging.getLogger(name)
 9 |     logger.setLevel(logging.DEBUG)
10 |     # don't log results for the non-master process
11 |     if distributed_rank > 0:
12 |         return logger
13 |     ch = logging.StreamHandler(stream=sys.stdout)
14 |     ch.setLevel(logging.DEBUG)
15 |     formatter = logging.Formatter("%(asctime)s %(name)s %(levelname)s: %(message)s")
16 |     ch.setFormatter(formatter)
17 |     logger.addHandler(ch)
18 | 
19 |     if save_dir:
20 |         fh = logging.FileHandler(os.path.join(save_dir, filename))
21 |         fh.setLevel(logging.DEBUG)
22 |         fh.setFormatter(formatter)
23 |         logger.addHandler(fh)
24 | 
25 |     return logger
26 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/utils/metric_logger.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | from collections import defaultdict
 3 | from collections import deque
 4 | 
 5 | import torch
 6 | 
 7 | 
 8 | class SmoothedValue(object):
 9 |     """Track a series of values and provide access to smoothed values over a
10 |     window or the global series average.
11 |     """
12 | 
13 |     def __init__(self, window_size=20):
14 |         self.deque = deque(maxlen=window_size)
15 |         self.series = []
16 |         self.total = 0.0
17 |         self.count = 0
18 | 
19 |     def update(self, value):
20 |         self.deque.append(value)
21 |         self.series.append(value)
22 |         self.count += 1
23 |         self.total += value
24 | 
25 |     @property
26 |     def median(self):
27 |         d = torch.tensor(list(self.deque))
28 |         return d.median().item()
29 | 
30 |     @property
31 |     def avg(self):
32 |         d = torch.tensor(list(self.deque))
33 |         return d.mean().item()
34 | 
35 |     @property
36 |     def global_avg(self):
37 |         return self.total / self.count
38 | 
39 | 
40 | class MetricLogger(object):
41 |     def __init__(self, delimiter="\t"):
42 |         self.meters = defaultdict(SmoothedValue)
43 |         self.delimiter = delimiter
44 | 
45 |     def update(self, **kwargs):
46 |         for k, v in kwargs.items():
47 |             if isinstance(v, torch.Tensor):
48 |                 v = v.item()
49 |             assert isinstance(v, (float, int))
50 |             self.meters[k].update(v)
51 | 
52 |     def __getattr__(self, attr):
53 |         if attr in self.meters:
54 |             return self.meters[attr]
55 |         if attr in self.__dict__:
56 |             return self.__dict__[attr]
57 |         raise AttributeError("'{}' object has no attribute '{}'".format(
58 |                     type(self).__name__, attr))
59 | 
60 |     def __str__(self):
61 |         loss_str = []
62 |         for name, meter in self.meters.items():
63 |             loss_str.append(
64 |                 "{}: {:.4f} ({:.4f})".format(name, meter.median, meter.global_avg)
65 |             )
66 |         return self.delimiter.join(loss_str)
67 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/utils/miscellaneous.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import errno
 3 | import os
 4 | 
 5 | 
 6 | def mkdir(path):
 7 |     try:
 8 |         os.makedirs(path)
 9 |     except OSError as e:
10 |         if e.errno != errno.EEXIST:
11 |             raise
12 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/utils/model_zoo.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | import os
 3 | import sys
 4 | 
 5 | try:
 6 |     from torch.utils.model_zoo import _download_url_to_file
 7 |     from torch.utils.model_zoo import urlparse
 8 |     from torch.utils.model_zoo import HASH_REGEX
 9 | except ImportError:
10 |     from torch.hub import _download_url_to_file
11 |     from torch.hub import urlparse
12 |     from torch.hub import HASH_REGEX
13 | 
14 | from maskrcnn_benchmark.utils.comm import is_main_process
15 | from maskrcnn_benchmark.utils.comm import synchronize
16 | 
17 | 
18 | # very similar to https://github.com/pytorch/pytorch/blob/master/torch/utils/model_zoo.py
19 | # but with a few improvements and modifications
20 | def cache_url(url, model_dir=None, progress=True):
21 |     r"""Loads the Torch serialized object at the given URL.
22 |     If the object is already present in `model_dir`, it's deserialized and
23 |     returned. The filename part of the URL should follow the naming convention
24 |     ``filename-<sha256>.ext`` where ``<sha256>`` is the first eight or more
25 |     digits of the SHA256 hash of the contents of the file. The hash is used to
26 |     ensure unique names and to verify the contents of the file.
27 |     The default value of `model_dir` is ``$TORCH_HOME/models`` where
28 |     ``$TORCH_HOME`` defaults to ``~/.torch``. The default directory can be
29 |     overridden with the ``$TORCH_MODEL_ZOO`` environment variable.
30 |     Args:
31 |         url (string): URL of the object to download
32 |         model_dir (string, optional): directory in which to save the object
33 |         progress (bool, optional): whether or not to display a progress bar to stderr
34 |     Example:
35 |         >>> cached_file = maskrcnn_benchmark.utils.model_zoo.cache_url('https://s3.amazonaws.com/pytorch/models/resnet18-5c106cde.pth')
36 |     """
37 |     if model_dir is None:
38 |         torch_home = os.path.expanduser(os.getenv('TORCH_HOME', '~/.torch'))
39 |         model_dir = os.getenv('TORCH_MODEL_ZOO', os.path.join(torch_home, 'models'))
40 |     if not os.path.exists(model_dir):
41 |         os.makedirs(model_dir)
42 |     parts = urlparse(url)
43 |     filename = os.path.basename(parts.path)
44 |     if filename == "model_final.pkl":
45 |         # workaround as pre-trained Caffe2 models from Detectron have all the same filename
46 |         # so make the full path the filename by replacing / with _
47 |         filename = parts.path.replace("/", "_")
48 |     cached_file = os.path.join(model_dir, filename)
49 |     if not os.path.exists(cached_file) and is_main_process():
50 |         sys.stderr.write('Downloading: "{}" to {}\n'.format(url, cached_file))
51 |         hash_prefix = HASH_REGEX.search(filename)
52 |         if hash_prefix is not None:
53 |             hash_prefix = hash_prefix.group(1)
54 |             # workaround: Caffe2 models don't have a hash, but follow the R-50 convention,
55 |             # which matches the hash PyTorch uses. So we skip the hash matching
56 |             # if the hash_prefix is less than 6 characters
57 |             if len(hash_prefix) < 6:
58 |                 hash_prefix = None
59 |         _download_url_to_file(url, cached_file, hash_prefix, progress=progress)
60 |     synchronize()
61 |     return cached_file
62 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/utils/registry.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | 
 4 | def _register_generic(module_dict, module_name, module):
 5 |     assert module_name not in module_dict
 6 |     module_dict[module_name] = module
 7 | 
 8 | 
 9 | class Registry(dict):
10 |     '''
11 |     A helper class for managing registering modules, it extends a dictionary
12 |     and provides a register functions.
13 | 
14 |     Eg. creeting a registry:
15 |         some_registry = Registry({"default": default_module})
16 | 
17 |     There're two ways of registering new modules:
18 |     1): normal way is just calling register function:
19 |         def foo():
20 |             ...
21 |         some_registry.register("foo_module", foo)
22 |     2): used as decorator when declaring the module:
23 |         @some_registry.register("foo_module")
24 |         @some_registry.register("foo_modeul_nickname")
25 |         def foo():
26 |             ...
27 | 
28 |     Access of module is just like using a dictionary, eg:
29 |         f = some_registry["foo_modeul"]
30 |     '''
31 |     def __init__(self, *args, **kwargs):
32 |         super(Registry, self).__init__(*args, **kwargs)
33 | 
34 |     def register(self, module_name, module=None):
35 |         # used as function call
36 |         if module is not None:
37 |             _register_generic(self, module_name, module)
38 |             return
39 | 
40 |         # used as decorator
41 |         def register_fn(fn):
42 |             _register_generic(self, module_name, fn)
43 |             return fn
44 | 
45 |         return register_fn
46 | 


--------------------------------------------------------------------------------
/maskrcnn_benchmark/utils/timer.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | 
 3 | 
 4 | import time
 5 | import datetime
 6 | 
 7 | 
 8 | class Timer(object):
 9 |     def __init__(self):
10 |         self.reset()
11 | 
12 |     @property
13 |     def average_time(self):
14 |         return self.total_time / self.calls if self.calls > 0 else 0.0
15 | 
16 |     def tic(self):
17 |         # using time.time instead of time.clock because time time.clock
18 |         # does not normalize for multithreading
19 |         self.start_time = time.time()
20 | 
21 |     def toc(self, average=True):
22 |         self.add(time.time() - self.start_time)
23 |         if average:
24 |             return self.average_time
25 |         else:
26 |             return self.diff
27 | 
28 |     def add(self, time_diff):
29 |         self.diff = time_diff
30 |         self.total_time += self.diff
31 |         self.calls += 1
32 | 
33 |     def reset(self):
34 |         self.total_time = 0.0
35 |         self.calls = 0
36 |         self.start_time = 0.0
37 |         self.diff = 0.0
38 | 
39 |     def avg_time_str(self):
40 |         time_str = str(datetime.timedelta(seconds=self.average_time))
41 |         return time_str
42 | 
43 | 
44 | def get_time_str(time_diff):
45 |     time_str = str(datetime.timedelta(seconds=time_diff))
46 |     return time_str
47 | 


--------------------------------------------------------------------------------
/model_zoo/PLACE_WEIGHTS_HERE:
--------------------------------------------------------------------------------
1 | Please put released pretrained weights here.


--------------------------------------------------------------------------------
/my_env.txt:
--------------------------------------------------------------------------------
 1 | 
 2 | ### If you cannot successfully run the code, ###
 3 | ### Please check the version of the follwing packages ###
 4 | 
 5 | ### printed from "pip freeze" ###
 6 | apex==0.1
 7 | backcall==0.2.0
 8 | cycler==0.10.0
 9 | Cython==0.29.22
10 | decorator==4.4.2
11 | ipython==7.16.1
12 | ipython-genutils==0.2.0
13 | jedi==0.18.0
14 | kiwisolver==1.3.1
15 | # Editable install with no version control (maskrcnn-benchmark==0.1)
16 | -e /mnt/4Tvolume/wyh/InstanceSaliency/RDPNet-release
17 | matplotlib==3.3.4
18 | ninja==1.10.0.post2
19 | numpy==1.19.5
20 | opencv-python==3.4.3.18
21 | parso==0.8.1
22 | pexpect==4.8.0
23 | pickleshare==0.7.5
24 | Pillow==8.1.0
25 | pkg-resources==0.0.0
26 | prompt-toolkit==3.0.16
27 | ptyprocess==0.7.0
28 | pycocotools==2.0.2
29 | Pygments==2.8.0
30 | pyparsing==2.4.7
31 | python-dateutil==2.8.1
32 | PyYAML==5.4.1
33 | scipy==1.5.4
34 | six==1.15.0
35 | torch @ https://download.pytorch.org/whl/cu90/torch-1.0.1-cp36-cp36m-linux_x86_64.whl
36 | torchvision==0.2.2.post3
37 | tqdm==4.57.0
38 | traitlets==4.3.3
39 | wcwidth==0.2.5
40 | yacs==0.1.8
41 | 
42 | 


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
1 | ninja
2 | yacs
3 | cython
4 | matplotlib
5 | tqdm
6 | opencv-python==3.4.3.18
7 | torch
8 | scipy
9 | 


--------------------------------------------------------------------------------
/scripts/test_isod.sh:
--------------------------------------------------------------------------------
 1 | 
 2 | cd ../
 3 | SAVE_ROOT=testing_dir/
 4 | SAVE_DIR=isod_r50/
 5 | LOOP_IDX=$1
 6 | SAVE_PATH=$SAVE_ROOT/$SAVE_DIR/$LOOP_IDX
 7 | CONFIG_NAME=configs/rdpnet/r50-isod-te.yaml
 8 | 
 9 | # rsync codes to SAVE_PATH
10 | mkdir $SAVE_ROOT
11 | mkdir $SAVE_ROOT/$SAVE_DIR
12 | mkdir $SAVE_ROOT/$SAVE_DIR/$LOOP_IDX
13 | 
14 | rsync -auv maskrcnn_benchmark $SAVE_PATH
15 | rsync -auv scripts/$0 $SAVE_PATH
16 | rsync -auv $CONFIG_NAME $SAVE_PATH
17 | 
18 | python tools/test_net.py \
19 |     --config-file $CONFIG_NAME \
20 |     DATALOADER.NUM_WORKERS 2 \
21 |     OUTPUT_DIR $SAVE_PATH
22 | cd scripts
23 | 


--------------------------------------------------------------------------------
/scripts/test_soc.sh:
--------------------------------------------------------------------------------
 1 | 
 2 | cd ../
 3 | SAVE_ROOT=testing_dir/
 4 | SAVE_DIR=soc_r50/
 5 | LOOP_IDX=$1
 6 | SAVE_PATH=$SAVE_ROOT/$SAVE_DIR/$LOOP_IDX
 7 | CONFIG_NAME=configs/rdpnet/r50-soc-te.yaml
 8 | 
 9 | # rsync codes to SAVE_PATH
10 | mkdir $SAVE_ROOT
11 | mkdir $SAVE_ROOT/$SAVE_DIR
12 | mkdir $SAVE_ROOT/$SAVE_DIR/$LOOP_IDX
13 | 
14 | rsync -auv maskrcnn_benchmark $SAVE_PATH
15 | rsync -auv scripts/$0 $SAVE_PATH
16 | rsync -auv $CONFIG_NAME $SAVE_PATH
17 | 
18 | python tools/test_net.py \
19 |     --config-file $CONFIG_NAME \
20 |     DATALOADER.NUM_WORKERS 2 \
21 |     OUTPUT_DIR $SAVE_PATH
22 | cd scripts
23 | 


--------------------------------------------------------------------------------
/scripts/train_come.sh:
--------------------------------------------------------------------------------
 1 | 
 2 | cd ../
 3 | SAVE_ROOT=training_dir/
 4 | SAVE_DIR=come_r50/
 5 | SAVE_PATH=$SAVE_ROOT/$SAVE_DIR
 6 | CONFIG_NAME=configs/rdpnet/r50-come.yaml
 7 | 
 8 | # rsync codes to SAVE_PATH
 9 | mkdir $SAVE_ROOT
10 | mkdir $SAVE_ROOT/$SAVE_DIR
11 | 
12 | rsync -auv maskrcnn_benchmark $SAVE_PATH
13 | rsync -auv scripts/$0 $SAVE_PATH
14 | rsync -auv $CONFIG_NAME $SAVE_PATH
15 | 
16 | python -m torch.distributed.launch \
17 |     --nproc_per_node=1 \
18 |     --master_port=$((RANDOM + 10000)) \
19 |     tools/train_net.py \
20 |     --config-file $CONFIG_NAME \
21 |     DATALOADER.NUM_WORKERS 2 \
22 |     OUTPUT_DIR $SAVE_PATH
23 | cd scripts
24 | 


--------------------------------------------------------------------------------
/scripts/train_isod.sh:
--------------------------------------------------------------------------------
 1 | 
 2 | cd ../
 3 | SAVE_ROOT=training_dir/
 4 | SAVE_DIR=isod_r50/
 5 | SAVE_PATH=$SAVE_ROOT/$SAVE_DIR
 6 | CONFIG_NAME=configs/rdpnet/r50-isod.yaml
 7 | 
 8 | # rsync codes to SAVE_PATH
 9 | mkdir $SAVE_ROOT
10 | mkdir $SAVE_ROOT/$SAVE_DIR
11 | 
12 | rsync -auv maskrcnn_benchmark $SAVE_PATH
13 | rsync -auv scripts/$0 $SAVE_PATH
14 | rsync -auv $CONFIG_NAME $SAVE_PATH
15 | 
16 | python -m torch.distributed.launch \
17 |     --nproc_per_node=1 \
18 |     --master_port=$((RANDOM + 10000)) \
19 |     tools/train_net.py \
20 |     --config-file $CONFIG_NAME \
21 |     DATALOADER.NUM_WORKERS 2 \
22 |     OUTPUT_DIR $SAVE_PATH
23 | cd scripts
24 | 


--------------------------------------------------------------------------------
/scripts/train_r101_isod.sh:
--------------------------------------------------------------------------------
 1 | 
 2 | cd ../
 3 | SAVE_ROOT=training_dir/
 4 | SAVE_DIR=isod_resnet101/
 5 | SAVE_PATH=$SAVE_ROOT/$SAVE_DIR
 6 | CONFIG_NAME=configs/rdpnet/r101-isod.yaml
 7 | 
 8 | # rsync codes to SAVE_PATH
 9 | mkdir $SAVE_ROOT
10 | mkdir $SAVE_ROOT/$SAVE_DIR
11 | 
12 | rsync -auv maskrcnn_benchmark $SAVE_PATH
13 | rsync -auv scripts/$0 $SAVE_PATH
14 | rsync -auv $CONFIG_NAME $SAVE_PATH
15 | 
16 | python -m torch.distributed.launch \
17 |     --nproc_per_node=1 \
18 |     --master_port=$((RANDOM + 10000)) \
19 |     tools/train_net.py \
20 |     --config-file $CONFIG_NAME \
21 |     DATALOADER.NUM_WORKERS 2 \
22 |     OUTPUT_DIR $SAVE_PATH
23 | cd scripts
24 | 


--------------------------------------------------------------------------------
/scripts/train_soc.sh:
--------------------------------------------------------------------------------
 1 | 
 2 | cd ../
 3 | SAVE_ROOT=training_dir/
 4 | SAVE_DIR=soc_r50/
 5 | SAVE_PATH=$SAVE_ROOT/$SAVE_DIR
 6 | CONFIG_NAME=configs/rdpnet/r50-soc.yaml
 7 | 
 8 | # rsync codes to SAVE_PATH
 9 | mkdir $SAVE_ROOT
10 | mkdir $SAVE_ROOT/$SAVE_DIR
11 | 
12 | rsync -auv maskrcnn_benchmark $SAVE_PATH
13 | rsync -auv scripts/train_mask.sh $SAVE_PATH
14 | rsync -auv $CONFIG_NAME $SAVE_PATH
15 | 
16 | python -m torch.distributed.launch \
17 |     --nproc_per_node=1 \
18 |     --master_port=$((RANDOM + 10000)) \
19 |     tools/train_net.py \
20 |     --config-file $CONFIG_NAME \
21 |     DATALOADER.NUM_WORKERS 2 \
22 |     OUTPUT_DIR $SAVE_PATH
23 | cd scripts
24 | 


--------------------------------------------------------------------------------
/scripts/train_x101_isod.sh:
--------------------------------------------------------------------------------
 1 | 
 2 | cd ../
 3 | SAVE_ROOT=training_dir/
 4 | SAVE_DIR=isod_resxnet101/
 5 | SAVE_PATH=$SAVE_ROOT/$SAVE_DIR
 6 | CONFIG_NAME=configs/rdpnet/x101-isod.yaml
 7 | 
 8 | # rsync codes to SAVE_PATH
 9 | mkdir $SAVE_ROOT
10 | mkdir $SAVE_ROOT/$SAVE_DIR
11 | 
12 | rsync -auv maskrcnn_benchmark $SAVE_PATH
13 | rsync -auv scripts/$0 $SAVE_PATH
14 | rsync -auv $CONFIG_NAME $SAVE_PATH
15 | 
16 | python -m torch.distributed.launch \
17 |     --nproc_per_node=1 \
18 |     --master_port=$((RANDOM + 10000)) \
19 |     tools/train_net.py \
20 |     --config-file $CONFIG_NAME \
21 |     DATALOADER.NUM_WORKERS 2 \
22 |     OUTPUT_DIR $SAVE_PATH
23 | cd scripts
24 | 


--------------------------------------------------------------------------------
/setup.py:
--------------------------------------------------------------------------------
 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
 2 | #!/usr/bin/env python
 3 | 
 4 | import glob
 5 | import os
 6 | 
 7 | import torch
 8 | from setuptools import find_packages
 9 | from setuptools import setup
10 | from torch.utils.cpp_extension import CUDA_HOME
11 | from torch.utils.cpp_extension import CppExtension
12 | from torch.utils.cpp_extension import CUDAExtension
13 | 
14 | requirements = ["torch", "torchvision"]
15 | 
16 | 
17 | def get_extensions():
18 |     this_dir = os.path.dirname(os.path.abspath(__file__))
19 |     extensions_dir = os.path.join(this_dir, "maskrcnn_benchmark", "csrc")
20 | 
21 |     main_file = glob.glob(os.path.join(extensions_dir, "*.cpp"))
22 |     source_cpu = glob.glob(os.path.join(extensions_dir, "cpu", "*.cpp"))
23 |     source_cuda = glob.glob(os.path.join(extensions_dir, "cuda", "*.cu"))
24 | 
25 |     sources = main_file + source_cpu
26 |     extension = CppExtension
27 | 
28 |     extra_compile_args = {"cxx": []}
29 |     define_macros = []
30 | 
31 |     if (torch.cuda.is_available() and CUDA_HOME is not None) or os.getenv("FORCE_CUDA", "0") == "1":
32 |         extension = CUDAExtension
33 |         sources += source_cuda
34 |         define_macros += [("WITH_CUDA", None)]
35 |         extra_compile_args["nvcc"] = [
36 |             "-DCUDA_HAS_FP16=1",
37 |             "-D__CUDA_NO_HALF_OPERATORS__",
38 |             "-D__CUDA_NO_HALF_CONVERSIONS__",
39 |             "-D__CUDA_NO_HALF2_OPERATORS__",
40 |         ]
41 | 
42 |     sources = [os.path.join(extensions_dir, s) for s in sources]
43 | 
44 |     include_dirs = [extensions_dir]
45 | 
46 |     ext_modules = [
47 |         extension(
48 |             "maskrcnn_benchmark._C",
49 |             sources,
50 |             include_dirs=include_dirs,
51 |             define_macros=define_macros,
52 |             extra_compile_args=extra_compile_args,
53 |         )
54 |     ]
55 | 
56 |     return ext_modules
57 | 
58 | 
59 | setup(
60 |     name="maskrcnn_benchmark",
61 |     version="0.1",
62 |     author="fmassa",
63 |     url="https://github.com/facebookresearch/maskrcnn-benchmark",
64 |     description="object detection in pytorch",
65 |     packages=find_packages(exclude=("configs", "tests",)),
66 |     # install_requires=requirements,
67 |     ext_modules=get_extensions(),
68 |     cmdclass={"build_ext": torch.utils.cpp_extension.BuildExtension},
69 | )
70 | 


--------------------------------------------------------------------------------
/tools/cityscapes/instances2dict_with_polygons.py:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/python
 2 | #
 3 | # Convert instances from png files to a dictionary
 4 | # This files is created according to https://github.com/facebookresearch/Detectron/issues/111
 5 | 
 6 | from __future__ import print_function, absolute_import, division
 7 | import os, sys
 8 | 
 9 | sys.path.append( os.path.normpath( os.path.join( os.path.dirname( __file__ ) , '..' , 'helpers' ) ) )
10 | from csHelpers import *
11 | 
12 | # Cityscapes imports
13 | from cityscapesscripts.evaluation.instance import *
14 | from cityscapesscripts.helpers.csHelpers import *
15 | import cv2
16 | from maskrcnn_benchmark.utils import cv2_util
17 | 
18 | 
19 | def instances2dict_with_polygons(imageFileList, verbose=False):
20 |     imgCount     = 0
21 |     instanceDict = {}
22 | 
23 |     if not isinstance(imageFileList, list):
24 |         imageFileList = [imageFileList]
25 | 
26 |     if verbose:
27 |         print("Processing {} images...".format(len(imageFileList)))
28 | 
29 |     for imageFileName in imageFileList:
30 |         # Load image
31 |         img = Image.open(imageFileName)
32 | 
33 |         # Image as numpy array
34 |         imgNp = np.array(img)
35 | 
36 |         # Initialize label categories
37 |         instances = {}
38 |         for label in labels:
39 |             instances[label.name] = []
40 | 
41 |         # Loop through all instance ids in instance image
42 |         for instanceId in np.unique(imgNp):
43 |             if instanceId < 1000:
44 |                 continue
45 |             instanceObj = Instance(imgNp, instanceId)
46 |             instanceObj_dict = instanceObj.toDict()
47 | 
48 |             #instances[id2label[instanceObj.labelID].name].append(instanceObj.toDict())
49 |             if id2label[instanceObj.labelID].hasInstances:
50 |                 mask = (imgNp == instanceId).astype(np.uint8)
51 |                 contour, hier = cv2_util.findContours(
52 |                     mask.copy(), cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_NONE)
53 | 
54 |                 polygons = [c.reshape(-1).tolist() for c in contour]
55 |                 instanceObj_dict['contours'] = polygons
56 | 
57 |             instances[id2label[instanceObj.labelID].name].append(instanceObj_dict)
58 | 
59 |         imgKey = os.path.abspath(imageFileName)
60 |         instanceDict[imgKey] = instances
61 |         imgCount += 1
62 | 
63 |         if verbose:
64 |             print("\rImages Processed: {}".format(imgCount), end=' ')
65 |             sys.stdout.flush()
66 | 
67 |     if verbose:
68 |         print("")
69 | 
70 |     return instanceDict
71 | 
72 | def main(argv):
73 |     fileList = []
74 |     if (len(argv) > 2):
75 |         for arg in argv:
76 |             if ("png" in arg):
77 |                 fileList.append(arg)
78 |     instances2dict_with_polygons(fileList, True)
79 | 
80 | if __name__ == "__main__":
81 |     main(sys.argv[1:])
82 | 


--------------------------------------------------------------------------------