├── projects ├── __init__.py └── mmdet3d_plugin │ ├── ops │ ├── voxel_pool │ │ ├── __init__.py │ │ └── voxel_pool.py │ ├── point_ops │ │ ├── __init__.py │ │ ├── point_ops.py │ │ └── src │ │ │ ├── point_ops.cpp │ │ │ └── point_ops_cuda.cu │ └── smooth_sampler │ │ └── __init__.py │ ├── core │ ├── bbox │ │ ├── coders │ │ │ └── __init__.py │ │ ├── assigners │ │ │ └── __init__.py │ │ ├── iou_calculators │ │ │ └── __init__.py │ │ └── match_costs │ │ │ ├── __init__.py │ │ │ └── match_cost.py │ └── hook │ │ ├── __init__.py │ │ ├── utils.py │ │ ├── sequentialcontrol.py │ │ └── syncbncontrol.py │ ├── models │ ├── dense_heads │ │ ├── render_utils │ │ │ ├── fields │ │ │ │ └── __init__.py │ │ │ ├── models │ │ │ │ ├── __init__.py │ │ │ │ ├── volsdf.py │ │ │ │ └── neus.py │ │ │ └── renderers.py │ │ └── __init__.py │ ├── detectors │ │ └── __init__.py │ ├── voxel_encoders │ │ └── __init__.py │ ├── necks │ │ └── __init__.py │ ├── __init__,py │ ├── pts_encoder │ │ └── __init__.py │ ├── backbones │ │ └── __init__.py │ └── utils │ │ └── __init__.py │ ├── datasets │ ├── __init__.py │ └── pipelines │ │ └── __init__.py │ └── __init__.py ├── requirements ├── build.txt ├── optional.txt ├── readthedocs.txt ├── mminstall.txt ├── docs.txt ├── tests.txt └── runtime.txt ├── mmdet3d ├── ops │ ├── knn │ │ ├── __init__.py │ │ └── src │ │ │ └── knn.cpp │ ├── ball_query │ │ ├── __init__.py │ │ ├── ball_query.py │ │ └── src │ │ │ └── ball_query.cpp │ ├── gather_points │ │ ├── __init__.py │ │ └── gather_points.py │ ├── iou3d │ │ └── __init__.py │ ├── interpolate │ │ ├── __init__.py │ │ └── three_nn.py │ ├── group_points │ │ └── __init__.py │ ├── paconv │ │ ├── __init__.py │ │ └── src │ │ │ └── assign_score_withk.cpp │ ├── voxel │ │ ├── __init__.py │ │ └── src │ │ │ └── voxelization.cpp │ ├── furthest_point_sample │ │ ├── __init__.py │ │ └── utils.py │ ├── roiaware_pool3d │ │ └── __init__.py │ ├── pointnet_modules │ │ ├── __init__.py │ │ └── builder.py │ └── spconv │ │ ├── include │ │ ├── tensorview │ │ │ └── helper_launch.h │ │ ├── spconv │ │ │ ├── mp_helper.h │ │ │ ├── reordering.h │ │ │ └── maxpool.h │ │ ├── utility │ │ │ └── timer.h │ │ └── pybind11_utils.h │ │ └── __init__.py ├── models │ ├── utils │ │ ├── __init__.py │ │ ├── clip_sigmoid.py │ │ └── mlp.py │ ├── decode_heads │ │ └── __init__.py │ ├── model_utils │ │ └── __init__.py │ ├── segmentors │ │ └── __init__.py │ ├── roi_heads │ │ ├── mask_heads │ │ │ └── __init__.py │ │ ├── roi_extractors │ │ │ ├── __init__.py │ │ │ └── single_roiaware_extractor.py │ │ ├── __init__.py │ │ └── bbox_heads │ │ │ └── __init__.py │ ├── necks │ │ └── __init__.py │ ├── middle_encoders │ │ └── __init__.py │ ├── voxel_encoders │ │ └── __init__.py │ ├── fusion_layers │ │ └── __init__.py │ ├── losses │ │ └── __init__.py │ ├── detectors │ │ ├── two_stage.py │ │ ├── ssd3dnet.py │ │ ├── fcos_mono3d.py │ │ └── __init__.py │ ├── backbones │ │ ├── __init__.py │ │ └── base_pointnet.py │ ├── dense_heads │ │ └── __init__.py │ └── __init__.py ├── core │ ├── evaluation │ │ ├── kitti_utils │ │ │ └── __init__.py │ │ └── __init__.py │ ├── bbox │ │ ├── assigners │ │ │ └── __init__.py │ │ ├── iou_calculators │ │ │ └── __init__.py │ │ ├── coders │ │ │ └── __init__.py │ │ ├── samplers │ │ │ └── __init__.py │ │ ├── structures │ │ │ └── __init__.py │ │ └── __init__.py │ ├── utils │ │ └── __init__.py │ ├── voxel │ │ ├── __init__.py │ │ └── builder.py │ ├── visualizer │ │ └── __init__.py │ ├── __init__.py │ ├── anchor │ │ └── __init__.py │ ├── post_processing │ │ └── __init__.py │ └── points │ │ └── __init__.py 
├── utils │ ├── __init__.py │ ├── collect_env.py │ └── logger.py ├── version.py ├── apis │ ├── __init__.py │ └── train.py ├── datasets │ ├── pipelines │ │ └── __init__.py │ └── builder.py └── __init__.py ├── tools ├── data_converter │ ├── __init__.py │ └── lyft_data_fixer.py ├── dist_train.sh ├── dist_test.sh ├── create_data.sh ├── slurm_test.sh ├── slurm_train.sh ├── misc │ ├── print_config.py │ └── visualize_results.py └── model_converters │ └── publish_model.py ├── assets └── architecture.png ├── requirements.txt ├── configs ├── nuimages │ ├── mask_rcnn_r101_fpn_1x_nuim.py │ ├── cascade_mask_rcnn_r101_fpn_1x_nuim.py │ ├── htc_r50_fpn_coco-20e_20e_nuim.py │ ├── htc_r50_fpn_coco-20e_1x_nuim.py │ ├── cascade_mask_rcnn_r50_fpn_coco-20e_1x_nuim.py │ ├── mask_rcnn_r50_fpn_1x_nuim.py │ ├── cascade_mask_rcnn_r50_fpn_coco-20e_20e_nuim.py │ ├── mask_rcnn_x101_32x4d_fpn_1x_nuim.py │ ├── cascade_mask_rcnn_x101_32x4d_fpn_1x_nuim.py │ ├── mask_rcnn_r50_fpn_coco-2x_1x_nuim.py │ ├── htc_x101_64x4d_fpn_dconv_c3-c5_coco-20e_16x1_20e_nuim.py │ ├── mask_rcnn_r50_fpn_coco-2x_1x_nus-2d.py │ ├── htc_r50_fpn_1x_nuim.py │ ├── mask_rcnn_r50_caffe_fpn_1x_nuim.py │ ├── mask_rcnn_r50_caffe_fpn_coco-3x_1x_nuim.py │ └── mask_rcnn_r50_caffe_fpn_coco-3x_20e_nuim.py ├── fp16 │ ├── hv_second_secfpn_fp16_6x8_80e_kitti-3d-car.py │ ├── hv_second_secfpn_fp16_6x8_80e_kitti-3d-3class.py │ ├── hv_pointpillars_fpn_sbn-all_fp16_2x8_2x_nus-3d.py │ ├── hv_pointpillars_secfpn_sbn-all_fp16_2x8_2x_nus-3d.py │ └── hv_pointpillars_regnet-400mf_fpn_sbn-all_fp16_2x8_2x_nus-3d.py ├── centerpoint │ ├── centerpoint_01voxel_second_secfpn_circlenms_4x8_cyclic_20e_nus.py │ ├── centerpoint_02pillar_second_secfpn_circlenms_4x8_cyclic_20e_nus.py │ ├── centerpoint_0075voxel_second_secfpn_circlenms_4x8_cyclic_20e_nus.py │ ├── centerpoint_01voxel_second_secfpn_dcn_4x8_cyclic_20e_nus.py │ ├── centerpoint_02pillar_second_secfpn_dcn_4x8_cyclic_20e_nus.py │ ├── centerpoint_0075voxel_second_secfpn_dcn_4x8_cyclic_20e_nus.py │ ├── centerpoint_01voxel_second_secfpn_dcn_circlenms_4x8_cyclic_20e_nus.py │ ├── centerpoint_0075voxel_second_secfpn_dcn_circlenms_4x8_cyclic_20e_nus.py │ ├── centerpoint_02pillar_second_secfpn_dcn_circlenms_4x8_cyclic_20e_nus.py │ ├── centerpoint_0075voxel_second_secfpn_dcn_4x8_cyclic_flip-tta_20e_nus.py │ ├── centerpoint_0075voxel_second_secfpn_dcn_4x8_cyclic_tta_20e_nus.py │ └── centerpoint_0075voxel_second_secfpn_dcn_circlenms_4x8_cyclic_flip-tta_20e_nus.py ├── _base_ │ ├── models │ │ ├── paconv_cuda_ssg.py │ │ ├── hv_pointpillars_fpn_lyft.py │ │ ├── hv_pointpillars_fpn_range100_lyft.py │ │ ├── pointnet2_msg.py │ │ ├── pointnet2_ssg.py │ │ └── paconv_ssg.py │ ├── schedules │ │ ├── mmdet_schedule_1x.py │ │ ├── seg_cosine_200e.py │ │ ├── seg_cosine_50e.py │ │ ├── seg_cosine_150e.py │ │ ├── schedule_3x.py │ │ ├── schedule_2x.py │ │ ├── cosine.py │ │ ├── cyclic_20e.py │ │ └── cyclic_40e.py │ ├── default_runtime.py │ └── datasets │ │ ├── coco_instance.py │ │ └── nuim_instance.py ├── pointpillars │ ├── hv_pointpillars_fpn_sbn-all_4x8_2x_nus-3d.py │ ├── hv_pointpillars_fpn_sbn-all_2x8_2x_lyft-3d.py │ ├── hv_pointpillars_fpn_sbn-all_range100_2x8_2x_lyft-3d.py │ ├── hv_pointpillars_secfpn_sbn_2x16_2x_waymoD5-3d-3class.py │ ├── hv_pointpillars_secfpn_sbn_2x16_2x_waymo-3d-3class.py │ ├── hv_pointpillars_secfpn_sbn_2x16_2x_waymoD5-3d-car.py │ ├── hv_pointpillars_secfpn_sbn_2x16_2x_waymo-3d-car.py │ ├── hv_pointpillars_secfpn_sbn-all_4x8_2x_nus-3d.py │ ├── hv_pointpillars_secfpn_sbn-all_2x8_2x_lyft-3d.py │ └── 
hv_pointpillars_secfpn_sbn-all_range100_2x8_2x_lyft-3d.py ├── second │ ├── hv_second_secfpn_6x8_80e_kitti-3d-3class.py │ ├── hv_second_secfpn_6x8_80e_kitti-3d-car.py │ └── metafile.yml ├── votenet │ ├── votenet_iouloss_8x8_scannet-3d-18class.py │ ├── votenet_16x8_sunrgbd-3d-10class.py │ ├── votenet_8x8_scannet-3d-18class.py │ └── metafile.yml ├── fcos3d │ ├── fcos3d_r101_caffe_fpn_gn-head_dcn_2x8_1x_nus-mono3d_finetune.py │ └── metafile.yml ├── dynamic_voxelization │ ├── dv_second_secfpn_6x8_80e_kitti-3d-car.py │ ├── dv_pointpillars_secfpn_6x8_160e_kitti-3d-car.py │ └── dv_second_secfpn_2x8_cosine_80e_kitti-3d-3class.py ├── free_anchor │ ├── hv_pointpillars_regnet-400mf_fpn_sbn-all_free-anchor_4x8_2x_nus-3d.py │ ├── hv_pointpillars_regnet-1.6gf_fpn_sbn-all_free-anchor_4x8_2x_nus-3d.py │ ├── hv_pointpillars_regnet-3.2gf_fpn_sbn-all_free-anchor_4x8_2x_nus-3d.py │ └── hv_pointpillars_fpn_sbn-all_free-anchor_4x8_2x_nus-3d.py ├── ssn │ ├── hv_ssn_regnet-400mf_secfpn_sbn-all_2x16_2x_nus-3d.py │ └── hv_ssn_regnet-400mf_secfpn_sbn-all_1x16_2x_lyft-3d.py ├── pointnet2 │ ├── pointnet2_ssg_16x2_cosine_50e_s3dis_seg-3d-13class.py │ ├── pointnet2_msg_16x2_cosine_80e_s3dis_seg-3d-13class.py │ ├── pointnet2_ssg_16x2_cosine_200e_scannet_seg-3d-20class.py │ └── pointnet2_msg_16x2_cosine_250e_scannet_seg-3d-20class.py ├── regnet │ ├── hv_pointpillars_regnet-1.6gf_fpn_sbn-all_4x8_2x_nus-3d.py │ ├── hv_pointpillars_regnet-400mf_fpn_sbn-all_4x8_2x_nus-3d.py │ ├── hv_pointpillars_regnet-400mf_fpn_sbn-all_2x8_2x_lyft-3d.py │ ├── hv_pointpillars_regnet-400mf_fpn_sbn-all_range100_2x8_2x_lyft-3d.py │ ├── hv_pointpillars_regnet-400mf_secfpn_sbn-all_4x8_2x_nus-3d.py │ ├── hv_pointpillars_regnet-400mf_secfpn_sbn-all_2x8_2x_lyft-3d.py │ └── hv_pointpillars_regnet-400mf_secfpn_sbn-all_range100_2x8_2x_lyft-3d.py ├── 3dssd │ └── metafile.yml ├── h3dnet │ ├── metafile.yml │ └── README.md ├── imvoxelnet │ ├── metafile.yml │ └── README.md ├── paconv │ └── metafile.yml ├── mvxnet │ ├── metafile.yml │ └── README.md ├── parta2 │ ├── metafile.yml │ └── README.md └── imvotenet │ ├── metafile.yml │ └── README.md └── extra_tools ├── dist_test_ssl.sh ├── create_data.sh └── dist_train_ssl.sh /projects/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /requirements/build.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /requirements/optional.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /requirements/readthedocs.txt: -------------------------------------------------------------------------------- 1 | mmcv 2 | torch 3 | torchvision 4 | -------------------------------------------------------------------------------- /mmdet3d/ops/knn/__init__.py: -------------------------------------------------------------------------------- 1 | from .knn import knn 2 | 3 | __all__ = ['knn'] 4 | -------------------------------------------------------------------------------- /tools/data_converter/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | -------------------------------------------------------------------------------- /assets/architecture.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hustvl/MIM4D/HEAD/assets/architecture.png -------------------------------------------------------------------------------- /mmdet3d/ops/ball_query/__init__.py: -------------------------------------------------------------------------------- 1 | from .ball_query import ball_query 2 | 3 | __all__ = ['ball_query'] 4 | -------------------------------------------------------------------------------- /requirements/mminstall.txt: -------------------------------------------------------------------------------- 1 | mmcv-full>=1.3.8,<=1.4.0 2 | mmdet>=2.14.0,<=3.0.0 3 | mmsegmentation>=0.14.1,<=1.0.0 4 | -------------------------------------------------------------------------------- /mmdet3d/ops/gather_points/__init__.py: -------------------------------------------------------------------------------- 1 | from .gather_points import gather_points 2 | 3 | __all__ = ['gather_points'] 4 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/ops/voxel_pool/__init__.py: -------------------------------------------------------------------------------- 1 | from .voxel_pool import voxel_pool 2 | 3 | __all__ = ["voxel_pool"] 4 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/core/bbox/coders/__init__.py: -------------------------------------------------------------------------------- 1 | from .nms_free_coder import NMSFreeCoder 2 | 3 | __all__ = ["NMSFreeCoder"] 4 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/ops/point_ops/__init__.py: -------------------------------------------------------------------------------- 1 | from .point_ops import group_inner_inds 2 | 3 | __all__ = ["group_inner_inds"] 4 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/ops/smooth_sampler/__init__.py: -------------------------------------------------------------------------------- 1 | from .smooth_sampler import SmoothSampler 2 | 3 | __all__ = ['SmoothSampler'] -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/models/dense_heads/render_utils/fields/__init__.py: -------------------------------------------------------------------------------- 1 | from .sdf_field import SDFField 2 | 3 | __all__ = ['SDFField'] 4 | -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | -r requirements/build.txt 2 | -r requirements/optional.txt 3 | -r requirements/tests.txt 4 | -r requirements/runtime.txt 5 | 6 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/core/bbox/assigners/__init__.py: -------------------------------------------------------------------------------- 1 | from .hungarian_assigner_3d import HungarianAssigner3D 2 | 3 | __all__ = ["HungarianAssigner3D"] 4 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | from .nuscenes_dataset import NuScenesSweepDataset 2 | 3 | __all__ = [ 4 | 
"NuScenesSweepDataset", 5 | ] 6 | -------------------------------------------------------------------------------- /mmdet3d/ops/iou3d/__init__.py: -------------------------------------------------------------------------------- 1 | from .iou3d_utils import boxes_iou_bev, nms_gpu, nms_normal_gpu 2 | 3 | __all__ = ['boxes_iou_bev', 'nms_gpu', 'nms_normal_gpu'] 4 | -------------------------------------------------------------------------------- /configs/nuimages/mask_rcnn_r101_fpn_1x_nuim.py: -------------------------------------------------------------------------------- 1 | _base_ = './mask_rcnn_r50_fpn_1x_nuim.py' 2 | model = dict(pretrained='torchvision://resnet101', backbone=dict(depth=101)) 3 | -------------------------------------------------------------------------------- /configs/fp16/hv_second_secfpn_fp16_6x8_80e_kitti-3d-car.py: -------------------------------------------------------------------------------- 1 | _base_ = '../second/hv_second_secfpn_6x8_80e_kitti-3d-car.py' 2 | # fp16 settings 3 | fp16 = dict(loss_scale=512.) 4 | -------------------------------------------------------------------------------- /mmdet3d/ops/interpolate/__init__.py: -------------------------------------------------------------------------------- 1 | from .three_interpolate import three_interpolate 2 | from .three_nn import three_nn 3 | 4 | __all__ = ['three_nn', 'three_interpolate'] 5 | -------------------------------------------------------------------------------- /configs/fp16/hv_second_secfpn_fp16_6x8_80e_kitti-3d-3class.py: -------------------------------------------------------------------------------- 1 | _base_ = '../second/hv_second_secfpn_6x8_80e_kitti-3d-3class.py' 2 | # fp16 settings 3 | fp16 = dict(loss_scale=512.) 4 | -------------------------------------------------------------------------------- /mmdet3d/ops/group_points/__init__.py: -------------------------------------------------------------------------------- 1 | from .group_points import GroupAll, QueryAndGroup, grouping_operation 2 | 3 | __all__ = ['QueryAndGroup', 'GroupAll', 'grouping_operation'] 4 | -------------------------------------------------------------------------------- /mmdet3d/ops/paconv/__init__.py: -------------------------------------------------------------------------------- 1 | from .assign_score import assign_score_withk 2 | from .paconv import PAConv, PAConvCUDA 3 | 4 | __all__ = ['assign_score_withk', 'PAConv', 'PAConvCUDA'] 5 | -------------------------------------------------------------------------------- /configs/nuimages/cascade_mask_rcnn_r101_fpn_1x_nuim.py: -------------------------------------------------------------------------------- 1 | _base_ = './cascade_mask_rcnn_r50_fpn_1x_nuim.py' 2 | model = dict(pretrained='torchvision://resnet101', backbone=dict(depth=101)) 3 | -------------------------------------------------------------------------------- /configs/nuimages/htc_r50_fpn_coco-20e_20e_nuim.py: -------------------------------------------------------------------------------- 1 | _base_ = './htc_r50_fpn_coco-20e_1x_nuim.py' 2 | # learning policy 3 | lr_config = dict(step=[16, 19]) 4 | runner = dict(max_epochs=20) 5 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/models/dense_heads/render_utils/models/__init__.py: -------------------------------------------------------------------------------- 1 | from .neus import NeuSModel 2 | from .volsdf import VolSDFModel 3 | 4 | __all__ = ['NeuSModel', 'VolSDFModel'] 5 | 
-------------------------------------------------------------------------------- /mmdet3d/models/utils/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .clip_sigmoid import clip_sigmoid 3 | from .mlp import MLP 4 | 5 | __all__ = ['clip_sigmoid', 'MLP'] 6 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/models/detectors/__init__.py: -------------------------------------------------------------------------------- 1 | from .uvtr import UVTR 2 | from .uvtr_ssl_hop import UVTRSSL 3 | from .uvtr_dn import UVTRDN 4 | 5 | __all__ = ["UVTR", "UVTRSSL","UVTRDN"] 6 | -------------------------------------------------------------------------------- /mmdet3d/core/evaluation/kitti_utils/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .eval import kitti_eval, kitti_eval_coco_style 3 | 4 | __all__ = ['kitti_eval', 'kitti_eval_coco_style'] 5 | -------------------------------------------------------------------------------- /configs/centerpoint/centerpoint_01voxel_second_secfpn_circlenms_4x8_cyclic_20e_nus.py: -------------------------------------------------------------------------------- 1 | _base_ = ['./centerpoint_01voxel_second_secfpn_4x8_cyclic_20e_nus.py'] 2 | 3 | model = dict(test_cfg=dict(pts=dict(nms_type='circle'))) 4 | -------------------------------------------------------------------------------- /configs/centerpoint/centerpoint_02pillar_second_secfpn_circlenms_4x8_cyclic_20e_nus.py: -------------------------------------------------------------------------------- 1 | _base_ = ['./centerpoint_02pillar_second_secfpn_4x8_cyclic_20e_nus.py'] 2 | 3 | model = dict(test_cfg=dict(pts=dict(nms_type='circle'))) 4 | -------------------------------------------------------------------------------- /mmdet3d/models/decode_heads/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .paconv_head import PAConvHead 3 | from .pointnet2_head import PointNet2Head 4 | 5 | __all__ = ['PointNet2Head', 'PAConvHead'] 6 | -------------------------------------------------------------------------------- /mmdet3d/models/model_utils/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .transformer import GroupFree3DMHA 3 | from .vote_module import VoteModule 4 | 5 | __all__ = ['VoteModule', 'GroupFree3DMHA'] 6 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/core/bbox/iou_calculators/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from .iou3d_calculator import PairedBboxOverlaps3D 3 | 4 | __all__ = [ 5 | 'PairedBboxOverlaps3D' 6 | ] 7 | -------------------------------------------------------------------------------- /configs/centerpoint/centerpoint_0075voxel_second_secfpn_circlenms_4x8_cyclic_20e_nus.py: -------------------------------------------------------------------------------- 1 | _base_ = ['./centerpoint_0075voxel_second_secfpn_4x8_cyclic_20e_nus.py'] 2 | 3 | model = dict(test_cfg=dict(pts=dict(nms_type='circle'))) 4 | -------------------------------------------------------------------------------- /configs/nuimages/htc_r50_fpn_coco-20e_1x_nuim.py: -------------------------------------------------------------------------------- 1 | _base_ = './htc_r50_fpn_1x_nuim.py' 2 | 3 | load_from = 'http://download.openmmlab.com/mmdetection/v2.0/htc/htc_r50_fpn_20e_coco/htc_r50_fpn_20e_coco_20200319-fe28c577.pth' # noqa 4 | -------------------------------------------------------------------------------- /mmdet3d/core/bbox/assigners/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from mmdet.core.bbox import AssignResult, BaseAssigner, MaxIoUAssigner 3 | 4 | __all__ = ['BaseAssigner', 'MaxIoUAssigner', 'AssignResult'] 5 | -------------------------------------------------------------------------------- /mmdet3d/models/segmentors/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .base import Base3DSegmentor 3 | from .encoder_decoder import EncoderDecoder3D 4 | 5 | __all__ = ['Base3DSegmentor', 'EncoderDecoder3D'] 6 | -------------------------------------------------------------------------------- /mmdet3d/ops/voxel/__init__.py: -------------------------------------------------------------------------------- 1 | from .scatter_points import DynamicScatter, dynamic_scatter 2 | from .voxelize import Voxelization, voxelization 3 | 4 | __all__ = ['Voxelization', 'voxelization', 'dynamic_scatter', 'DynamicScatter'] 5 | -------------------------------------------------------------------------------- /mmdet3d/core/utils/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .gaussian import draw_heatmap_gaussian, gaussian_2d, gaussian_radius 3 | 4 | __all__ = ['gaussian_2d', 'gaussian_radius', 'draw_heatmap_gaussian'] 5 | -------------------------------------------------------------------------------- /mmdet3d/core/voxel/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from .builder import build_voxel_generator 3 | from .voxel_generator import VoxelGenerator 4 | 5 | __all__ = ['build_voxel_generator', 'VoxelGenerator'] 6 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/core/bbox/match_costs/__init__.py: -------------------------------------------------------------------------------- 1 | from mmdet.core.bbox.match_costs import build_match_cost 2 | from .match_cost import BBox3DL1Cost, BBox3DIoUCost 3 | 4 | __all__ = ['build_match_cost', 'BBox3DL1Cost', 'BBox3DIoUCost'] -------------------------------------------------------------------------------- /configs/_base_/models/paconv_cuda_ssg.py: -------------------------------------------------------------------------------- 1 | _base_ = './paconv_ssg.py' 2 | 3 | model = dict( 4 | backbone=dict( 5 | sa_cfg=dict( 6 | type='PAConvCUDASAModule', 7 | scorenet_cfg=dict(mlp_channels=[8, 16, 16])))) 8 | -------------------------------------------------------------------------------- /configs/pointpillars/hv_pointpillars_fpn_sbn-all_4x8_2x_nus-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_pointpillars_fpn_nus.py', 3 | '../_base_/datasets/nus-3d.py', '../_base_/schedules/schedule_2x.py', 4 | '../_base_/default_runtime.py' 5 | ] 6 | -------------------------------------------------------------------------------- /configs/second/hv_second_secfpn_6x8_80e_kitti-3d-3class.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_second_secfpn_kitti.py', 3 | '../_base_/datasets/kitti-3d-3class.py', 4 | '../_base_/schedules/cyclic_40e.py', '../_base_/default_runtime.py' 5 | ] 6 | -------------------------------------------------------------------------------- /configs/pointpillars/hv_pointpillars_fpn_sbn-all_2x8_2x_lyft-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_pointpillars_fpn_lyft.py', 3 | '../_base_/datasets/lyft-3d.py', '../_base_/schedules/schedule_2x.py', 4 | '../_base_/default_runtime.py' 5 | ] 6 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/models/voxel_encoders/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | # from .dyn_voxel_encoder import CustomDynamicSimpleVFE, GridSample 3 | # 4 | # __all__ = [ 5 | # 'CustomDynamicSimpleVFE', 'GridSample' 6 | # ] 7 | -------------------------------------------------------------------------------- /requirements/docs.txt: -------------------------------------------------------------------------------- 1 | docutils==0.16.0 2 | m2r 3 | myst-parser 4 | opencv-python 5 | -e git+https://github.com/open-mmlab/pytorch_sphinx_theme.git#egg=pytorch_sphinx_theme 6 | sphinx==4.0.2 7 | sphinx-copybutton 8 | sphinx_markdown_tables 9 | torch 10 | -------------------------------------------------------------------------------- /mmdet3d/models/roi_heads/mask_heads/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from .pointwise_semantic_head import PointwiseSemanticHead 3 | from .primitive_head import PrimitiveHead 4 | 5 | __all__ = ['PointwiseSemanticHead', 'PrimitiveHead'] 6 | -------------------------------------------------------------------------------- /mmdet3d/models/necks/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from mmdet.models.necks.fpn import FPN 3 | from .imvoxel_neck import OutdoorImVoxelNeck 4 | from .second_fpn import SECONDFPN 5 | 6 | __all__ = ['FPN', 'SECONDFPN', 'OutdoorImVoxelNeck'] 7 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/models/necks/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .second3d_fpn import SECOND3DFPN 3 | from .fpn import CustomFPN, DummyFPN 4 | from .cp_fpn import CPFPN 5 | __all__ = ['SECOND3DFPN', 'CustomFPN', 'DummyFPN',"CPFPN"] 6 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/models/dense_heads/__init__.py: -------------------------------------------------------------------------------- 1 | from .uvtr_head import UVTRHead 2 | from .render_head_hop import RenderHead 3 | from .uvtr_dn_head import UVTRDNHead 4 | 5 | 6 | __all__ = [ 7 | "UVTRHead", 8 | "RenderHead", 9 | "UVTRDNHead", 10 | ] 11 | -------------------------------------------------------------------------------- /requirements/tests.txt: -------------------------------------------------------------------------------- 1 | asynctest 2 | codecov 3 | flake8 4 | interrogate 5 | isort 6 | # Note: used for kwarray.group_items, this may be ported to mmcv in the future. 7 | kwarray 8 | pytest 9 | pytest-cov 10 | pytest-runner 11 | ubelt 12 | xdoctest >= 0.10.0 13 | yapf 14 | -------------------------------------------------------------------------------- /configs/pointpillars/hv_pointpillars_fpn_sbn-all_range100_2x8_2x_lyft-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_pointpillars_fpn_range100_lyft.py', 3 | '../_base_/datasets/range100_lyft-3d.py', 4 | '../_base_/schedules/schedule_2x.py', '../_base_/default_runtime.py' 5 | ] 6 | -------------------------------------------------------------------------------- /mmdet3d/core/visualizer/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .show_result import (show_multi_modality_result, show_result, 3 | show_seg_result) 4 | 5 | __all__ = ['show_result', 'show_seg_result', 'show_multi_modality_result'] 6 | -------------------------------------------------------------------------------- /configs/fp16/hv_pointpillars_fpn_sbn-all_fp16_2x8_2x_nus-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = '../pointpillars/hv_pointpillars_fpn_sbn-all_4x8_2x_nus-3d.py' 2 | data = dict(samples_per_gpu=2, workers_per_gpu=2) 3 | # fp16 settings, the loss scale is specifically tuned to avoid Nan 4 | fp16 = dict(loss_scale=32.) 
5 | -------------------------------------------------------------------------------- /configs/pointpillars/hv_pointpillars_secfpn_sbn_2x16_2x_waymoD5-3d-3class.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_pointpillars_secfpn_waymo.py', 3 | '../_base_/datasets/waymoD5-3d-3class.py', 4 | '../_base_/schedules/schedule_2x.py', 5 | '../_base_/default_runtime.py', 6 | ] 7 | -------------------------------------------------------------------------------- /configs/fp16/hv_pointpillars_secfpn_sbn-all_fp16_2x8_2x_nus-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = '../pointpillars/hv_pointpillars_secfpn_sbn-all_4x8_2x_nus-3d.py' 2 | data = dict(samples_per_gpu=2, workers_per_gpu=2) 3 | # fp16 settings, the loss scale is specifically tuned to avoid Nan 4 | fp16 = dict(loss_scale=32.) 5 | -------------------------------------------------------------------------------- /mmdet3d/models/middle_encoders/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .pillar_scatter import PointPillarsScatter 3 | from .sparse_encoder import SparseEncoder 4 | from .sparse_unet import SparseUNet 5 | 6 | __all__ = ['PointPillarsScatter', 'SparseEncoder', 'SparseUNet'] 7 | -------------------------------------------------------------------------------- /tools/dist_train.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | 3 | CONFIG=$1 4 | GPUS=$2 5 | PORT=${PORT:-29500} 6 | 7 | PYTHONPATH="$(dirname $0)/..":$PYTHONPATH \ 8 | python -m torch.distributed.launch --nproc_per_node=$GPUS --master_port=$PORT \ 9 | $(dirname "$0")/train.py $CONFIG --launcher pytorch ${@:3} 10 | -------------------------------------------------------------------------------- /configs/fp16/hv_pointpillars_regnet-400mf_fpn_sbn-all_fp16_2x8_2x_nus-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = '../regnet/hv_pointpillars_regnet-400mf_fpn_sbn-all_4x8_2x_nus-3d.py' 2 | data = dict(samples_per_gpu=2, workers_per_gpu=2) 3 | # fp16 settings, the loss scale is specifically tuned to avoid Nan 4 | fp16 = dict(loss_scale=32.) 5 | -------------------------------------------------------------------------------- /mmdet3d/models/roi_heads/roi_extractors/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from mmdet.models.roi_heads.roi_extractors import SingleRoIExtractor 3 | from .single_roiaware_extractor import Single3DRoIAwareExtractor 4 | 5 | __all__ = ['SingleRoIExtractor', 'Single3DRoIAwareExtractor'] 6 | -------------------------------------------------------------------------------- /configs/votenet/votenet_iouloss_8x8_scannet-3d-18class.py: -------------------------------------------------------------------------------- 1 | _base_ = ['./votenet_8x8_scannet-3d-18class.py'] 2 | 3 | # model settings, add iou loss 4 | model = dict( 5 | bbox_head=dict( 6 | iou_loss=dict( 7 | type='AxisAlignedIoULoss', reduction='sum', loss_weight=10.0 / 8 | 3.0))) 9 | -------------------------------------------------------------------------------- /requirements/runtime.txt: -------------------------------------------------------------------------------- 1 | lyft_dataset_sdk 2 | networkx>=2.2,<2.3 3 | # we may unlock the version of numba in the future 4 | # numba==0.48.0 5 | numpy<1.20.0 6 | nuscenes-devkit 7 | plyfile 8 | scikit-image 9 | # by default we also use tensorboard to log results 10 | tensorboard 11 | trimesh>=2.35.39,<2.35.40 12 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/models/__init__,py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .backbones import * # noqa: F401,F403 3 | from .dense_heads import * # noqa: F401,F403 4 | from .detectors import * # noqa: F401,F403 5 | from .necks import * # noqa: F401,F403 6 | from .voxel_encoders import * # noqa: F401,F403 -------------------------------------------------------------------------------- /configs/nuimages/cascade_mask_rcnn_r50_fpn_coco-20e_1x_nuim.py: -------------------------------------------------------------------------------- 1 | _base_ = './cascade_mask_rcnn_r50_fpn_1x_nuim.py' 2 | 3 | load_from = 'http://download.openmmlab.com/mmdetection/v2.0/cascade_rcnn/cascade_mask_rcnn_r50_fpn_20e_coco/cascade_mask_rcnn_r50_fpn_20e_coco_bbox_mAP-0.419__segm_mAP-0.365_20200504_174711-4af8e66e.pth' # noqa 4 | -------------------------------------------------------------------------------- /tools/dist_test.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | 3 | CONFIG=$1 4 | CHECKPOINT=$2 5 | GPUS=$3 6 | PORT=${PORT:-29500} 7 | 8 | PYTHONPATH="$(dirname $0)/..":$PYTHONPATH \ 9 | python -m torch.distributed.launch --nproc_per_node=$GPUS --master_port=$PORT \ 10 | $(dirname "$0")/test.py $CONFIG $CHECKPOINT --launcher pytorch ${@:4} 11 | -------------------------------------------------------------------------------- /mmdet3d/ops/furthest_point_sample/__init__.py: -------------------------------------------------------------------------------- 1 | from .furthest_point_sample import (furthest_point_sample, 2 | furthest_point_sample_with_dist) 3 | from .points_sampler import Points_Sampler 4 | 5 | __all__ = [ 6 | 'furthest_point_sample', 'furthest_point_sample_with_dist', 7 | 'Points_Sampler' 8 | ] 9 | -------------------------------------------------------------------------------- /mmdet3d/utils/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved.
2 | from mmcv.utils import Registry, build_from_cfg, print_log 3 | 4 | from .collect_env import collect_env 5 | from .logger import get_root_logger 6 | 7 | __all__ = [ 8 | 'Registry', 'build_from_cfg', 'get_root_logger', 'collect_env', 'print_log' 9 | ] 10 | -------------------------------------------------------------------------------- /mmdet3d/ops/roiaware_pool3d/__init__.py: -------------------------------------------------------------------------------- 1 | from .points_in_boxes import (points_in_boxes_batch, points_in_boxes_cpu, 2 | points_in_boxes_gpu) 3 | from .roiaware_pool3d import RoIAwarePool3d 4 | 5 | __all__ = [ 6 | 'RoIAwarePool3d', 'points_in_boxes_gpu', 'points_in_boxes_cpu', 7 | 'points_in_boxes_batch' 8 | ] 9 | -------------------------------------------------------------------------------- /configs/nuimages/mask_rcnn_r50_fpn_1x_nuim.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/mask_rcnn_r50_fpn.py', 3 | '../_base_/datasets/nuim_instance.py', 4 | '../_base_/schedules/mmdet_schedule_1x.py', '../_base_/default_runtime.py' 5 | ] 6 | model = dict( 7 | roi_head=dict( 8 | bbox_head=dict(num_classes=10), mask_head=dict(num_classes=10))) 9 | -------------------------------------------------------------------------------- /configs/fcos3d/fcos3d_r101_caffe_fpn_gn-head_dcn_2x8_1x_nus-mono3d_finetune.py: -------------------------------------------------------------------------------- 1 | _base_ = './fcos3d_r101_caffe_fpn_gn-head_dcn_2x8_1x_nus-mono3d.py' 2 | # model settings 3 | model = dict( 4 | train_cfg=dict( 5 | code_weight=[1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.05, 0.05])) 6 | # optimizer 7 | optimizer = dict(lr=0.001) 8 | load_from = 'work_dirs/fcos3d_nus/latest.pth' 9 | -------------------------------------------------------------------------------- /configs/pointpillars/hv_pointpillars_secfpn_sbn_2x16_2x_waymo-3d-3class.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_pointpillars_secfpn_waymo.py', 3 | '../_base_/datasets/waymoD5-3d-3class.py', 4 | '../_base_/schedules/schedule_2x.py', 5 | '../_base_/default_runtime.py', 6 | ] 7 | 8 | # data settings 9 | data = dict(train=dict(dataset=dict(load_interval=1))) 10 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/core/hook/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .ema import MEGVIIEMAHook 3 | from .utils import is_parallel 4 | from .sequentialcontrol import SequentialControlHook 5 | from .syncbncontrol import SyncbnControlHook 6 | 7 | __all__ = ['MEGVIIEMAHook', 'is_parallel', 'SequentialControlHook', 8 | 'SyncbnControlHook'] 9 | -------------------------------------------------------------------------------- /mmdet3d/core/evaluation/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from .indoor_eval import indoor_eval 3 | from .kitti_utils import kitti_eval, kitti_eval_coco_style 4 | from .lyft_eval import lyft_eval 5 | from .seg_eval import seg_eval 6 | 7 | __all__ = [ 8 | 'kitti_eval_coco_style', 'kitti_eval', 'indoor_eval', 'lyft_eval', 9 | 'seg_eval' 10 | ] 11 | -------------------------------------------------------------------------------- /configs/_base_/schedules/mmdet_schedule_1x.py: -------------------------------------------------------------------------------- 1 | # optimizer 2 | optimizer = dict(type='SGD', lr=0.02, momentum=0.9, weight_decay=0.0001) 3 | optimizer_config = dict(grad_clip=None) 4 | # learning policy 5 | lr_config = dict( 6 | policy='step', 7 | warmup='linear', 8 | warmup_iters=500, 9 | warmup_ratio=0.001, 10 | step=[8, 11]) 11 | runner = dict(type='EpochBasedRunner', max_epochs=12) 12 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/core/hook/utils.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from torch import nn 3 | 4 | __all__ = ['is_parallel'] 5 | 6 | 7 | def is_parallel(model): 8 | """check if model is in parallel mode.""" 9 | parallel_type = ( 10 | nn.parallel.DataParallel, 11 | nn.parallel.DistributedDataParallel, 12 | ) 13 | return isinstance(model, parallel_type) 14 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/models/pts_encoder/__init__.py: -------------------------------------------------------------------------------- 1 | # from .sparse_encoder_hd import SparseEncoderHD 2 | # from .mask_sparse_encoder_hd import MaskSparseEncoderHD 3 | # from .minkunet import MinkUNet 4 | # from .sparse_unet import SpUNetBase 5 | # 6 | # __all__ = [ 7 | # "SparseEncoderHD", 8 | # "MaskSparseEncoderHD", 9 | # "MinkUNet", 10 | # "SparseEncoderHDV2", 11 | # "SpUNetBase", 12 | # ] 13 | -------------------------------------------------------------------------------- /configs/_base_/schedules/seg_cosine_200e.py: -------------------------------------------------------------------------------- 1 | # optimizer 2 | # This schedule is mainly used on ScanNet dataset in segmentation task 3 | optimizer = dict(type='Adam', lr=0.001, weight_decay=0.01) 4 | optimizer_config = dict(grad_clip=None) 5 | lr_config = dict(policy='CosineAnnealing', warmup=None, min_lr=1e-5) 6 | momentum_config = None 7 | 8 | # runtime settings 9 | runner = dict(type='EpochBasedRunner', max_epochs=200) 10 | -------------------------------------------------------------------------------- /configs/_base_/schedules/seg_cosine_50e.py: -------------------------------------------------------------------------------- 1 | # optimizer 2 | # This schedule is mainly used on S3DIS dataset in segmentation task 3 | optimizer = dict(type='Adam', lr=0.001, weight_decay=0.001) 4 | optimizer_config = dict(grad_clip=None) 5 | lr_config = dict(policy='CosineAnnealing', warmup=None, min_lr=1e-5) 6 | momentum_config = None 7 | 8 | # runtime settings 9 | runner = dict(type='EpochBasedRunner', max_epochs=50) 10 | -------------------------------------------------------------------------------- /configs/nuimages/cascade_mask_rcnn_r50_fpn_coco-20e_20e_nuim.py: -------------------------------------------------------------------------------- 1 | _base_ = './cascade_mask_rcnn_r50_fpn_1x_nuim.py' 2 | 3 | # learning policy 4 | lr_config = dict(step=[16, 19]) 5 | runner = dict(max_epochs=20) 6 | 7 | 
load_from = 'http://download.openmmlab.com/mmdetection/v2.0/cascade_rcnn/cascade_mask_rcnn_r50_fpn_20e_coco/cascade_mask_rcnn_r50_fpn_20e_coco_bbox_mAP-0.419__segm_mAP-0.365_20200504_174711-4af8e66e.pth' # noqa 8 | -------------------------------------------------------------------------------- /mmdet3d/models/voxel_encoders/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .pillar_encoder import PillarFeatureNet 3 | from .voxel_encoder import DynamicSimpleVFE, DynamicVFE, HardSimpleVFE, HardVFE 4 | # from projects.mmdet3d_plugin.models.voxel_encoders import CustomDynamicSimpleVFE 5 | 6 | __all__ = [ 7 | 'PillarFeatureNet', 'HardVFE', 'DynamicVFE', 'HardSimpleVFE', 8 | 'DynamicSimpleVFE' 9 | ] 10 | -------------------------------------------------------------------------------- /configs/_base_/schedules/seg_cosine_150e.py: -------------------------------------------------------------------------------- 1 | # optimizer 2 | # This schedule is mainly used on S3DIS dataset in segmentation task 3 | optimizer = dict(type='SGD', lr=0.2, weight_decay=0.0001, momentum=0.9) 4 | optimizer_config = dict(grad_clip=None) 5 | lr_config = dict(policy='CosineAnnealing', warmup=None, min_lr=0.002) 6 | momentum_config = None 7 | 8 | # runtime settings 9 | runner = dict(type='EpochBasedRunner', max_epochs=150) 10 | -------------------------------------------------------------------------------- /mmdet3d/models/fusion_layers/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .coord_transform import (apply_3d_transformation, bbox_2d_transform, 3 | coord_2d_transform) 4 | from .point_fusion import PointFusion 5 | from .vote_fusion import VoteFusion 6 | 7 | __all__ = [ 8 | 'PointFusion', 'VoteFusion', 'apply_3d_transformation', 9 | 'bbox_2d_transform', 'coord_2d_transform' 10 | ] 11 | -------------------------------------------------------------------------------- /mmdet3d/core/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from .anchor import * # noqa: F401, F403 3 | from .bbox import * # noqa: F401, F403 4 | from .evaluation import * # noqa: F401, F403 5 | from .points import * # noqa: F401, F403 6 | from .post_processing import * # noqa: F401, F403 7 | from .utils import * # noqa: F401, F403 8 | from .visualizer import * # noqa: F401, F403 9 | from .voxel import * # noqa: F401, F403 10 | -------------------------------------------------------------------------------- /configs/_base_/schedules/schedule_3x.py: -------------------------------------------------------------------------------- 1 | # optimizer 2 | # This schedule is mainly used by models on indoor dataset, 3 | # e.g., VoteNet on SUNRGBD and ScanNet 4 | lr = 0.008 # max learning rate 5 | optimizer = dict(type='AdamW', lr=lr, weight_decay=0.01) 6 | optimizer_config = dict(grad_clip=dict(max_norm=10, norm_type=2)) 7 | lr_config = dict(policy='step', warmup=None, step=[24, 32]) 8 | # runtime settings 9 | runner = dict(type='EpochBasedRunner', max_epochs=36) 10 | -------------------------------------------------------------------------------- /configs/nuimages/mask_rcnn_x101_32x4d_fpn_1x_nuim.py: -------------------------------------------------------------------------------- 1 | _base_ = './mask_rcnn_r50_fpn_1x_nuim.py' 2 | model = dict( 3 | pretrained='open-mmlab://resnext101_32x4d', 4 | backbone=dict( 5 | type='ResNeXt', 6 | depth=101, 7 | groups=32, 8 | base_width=4, 9 | num_stages=4, 10 | out_indices=(0, 1, 2, 3), 11 | frozen_stages=1, 12 | norm_cfg=dict(type='BN', requires_grad=True), 13 | style='pytorch')) 14 | -------------------------------------------------------------------------------- /configs/nuimages/cascade_mask_rcnn_x101_32x4d_fpn_1x_nuim.py: -------------------------------------------------------------------------------- 1 | _base_ = './cascade_mask_rcnn_r50_fpn_1x_nuim.py' 2 | model = dict( 3 | pretrained='open-mmlab://resnext101_32x4d', 4 | backbone=dict( 5 | type='ResNeXt', 6 | depth=101, 7 | groups=32, 8 | base_width=4, 9 | num_stages=4, 10 | out_indices=(0, 1, 2, 3), 11 | frozen_stages=1, 12 | norm_cfg=dict(type='BN', requires_grad=True), 13 | style='pytorch')) 14 | -------------------------------------------------------------------------------- /mmdet3d/core/anchor/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from mmdet.core.anchor import build_prior_generator 3 | from .anchor_3d_generator import (AlignedAnchor3DRangeGenerator, 4 | AlignedAnchor3DRangeGeneratorPerCls, 5 | Anchor3DRangeGenerator) 6 | 7 | __all__ = [ 8 | 'AlignedAnchor3DRangeGenerator', 'Anchor3DRangeGenerator', 9 | 'build_prior_generator', 'AlignedAnchor3DRangeGeneratorPerCls' 10 | ] 11 | -------------------------------------------------------------------------------- /extra_tools/dist_test_ssl.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | 3 | 4 | while true 5 | do 6 | PORT=$(( ((RANDOM<<15)|RANDOM) % 49152 + 10000 )) 7 | status="$(nc -z 127.0.0.1 $PORT < /dev/null &>/dev/null; echo $?)" 8 | if [ "${status}" != "0" ]; then 9 | break; 10 | fi 11 | done 12 | echo $PORT 13 | 14 | CONFIG=projects/configs/MIM4D/uvtr_convnext_s_vs0.075_finetune.py 15 | CHECKPOINT=ckpts/uvtrs_mim4d_vs0.075/uvtrs_mim4d_vs0.075_finetune.pth 16 | 17 | 18 | python3 $(dirname "$0")/test.py $CONFIG $CHECKPOINT --eval bbox -------------------------------------------------------------------------------- /configs/_base_/schedules/schedule_2x.py: -------------------------------------------------------------------------------- 1 | # optimizer 2 | # This schedule is mainly used by models on nuScenes dataset 3 | optimizer = dict(type='AdamW', lr=0.001, weight_decay=0.01) 4 | # max_norm=10 is better for SECOND 5 | optimizer_config = dict(grad_clip=dict(max_norm=35, norm_type=2)) 6 | lr_config = dict( 7 | policy='step', 8 | warmup='linear', 9 | warmup_iters=1000, 10 | warmup_ratio=1.0 / 1000, 11 | step=[20, 23]) 12 | momentum_config = None 13 | # runtime settings 14 | runner = dict(type='EpochBasedRunner', max_epochs=24) 15 | -------------------------------------------------------------------------------- /configs/nuimages/mask_rcnn_r50_fpn_coco-2x_1x_nuim.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/mask_rcnn_r50_fpn.py', 3 | '../_base_/datasets/nuim_instance.py', 4 | '../_base_/schedules/mmdet_schedule_1x.py', '../_base_/default_runtime.py' 5 | ] 6 | model = dict( 7 | roi_head=dict( 8 | bbox_head=dict(num_classes=10), mask_head=dict(num_classes=10))) 9 | load_from = 'https://download.openmmlab.com/mmdetection/v2.0/mask_rcnn/mask_rcnn_r50_fpn_2x_coco/mask_rcnn_r50_fpn_2x_coco_bbox_mAP-0.392__segm_mAP-0.354_20200505_003907-3e542a40.pth' # noqa 10 | -------------------------------------------------------------------------------- /mmdet3d/models/utils/clip_sigmoid.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | import torch 3 | 4 | 5 | def clip_sigmoid(x, eps=1e-4): 6 | """Sigmoid function for input feature. 7 | 8 | Args: 9 | x (torch.Tensor): Input feature map with the shape of [B, N, H, W]. 10 | eps (float): Lower bound of the range to be clamped to. Defaults 11 | to 1e-4. 12 | 13 | Returns: 14 | torch.Tensor: Feature map after sigmoid. 15 | """ 16 | y = torch.clamp(x.sigmoid_(), min=eps, max=1 - eps) 17 | return y 18 | -------------------------------------------------------------------------------- /mmdet3d/core/bbox/iou_calculators/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved.
2 | from .iou3d_calculator import (AxisAlignedBboxOverlaps3D, BboxOverlaps3D, 3 | BboxOverlapsNearest3D, 4 | axis_aligned_bbox_overlaps_3d, bbox_overlaps_3d, 5 | bbox_overlaps_nearest_3d) 6 | 7 | __all__ = [ 8 | 'BboxOverlapsNearest3D', 'BboxOverlaps3D', 'bbox_overlaps_nearest_3d', 9 | 'bbox_overlaps_3d', 'AxisAlignedBboxOverlaps3D', 10 | 'axis_aligned_bbox_overlaps_3d' 11 | ] 12 | -------------------------------------------------------------------------------- /configs/centerpoint/centerpoint_01voxel_second_secfpn_dcn_4x8_cyclic_20e_nus.py: -------------------------------------------------------------------------------- 1 | _base_ = ['./centerpoint_01voxel_second_secfpn_4x8_cyclic_20e_nus.py'] 2 | 3 | model = dict( 4 | pts_bbox_head=dict( 5 | separate_head=dict( 6 | type='DCNSeparateHead', 7 | dcn_config=dict( 8 | type='DCN', 9 | in_channels=64, 10 | out_channels=64, 11 | kernel_size=3, 12 | padding=1, 13 | groups=4), 14 | init_bias=-2.19, 15 | final_kernel=3))) 16 | -------------------------------------------------------------------------------- /configs/centerpoint/centerpoint_02pillar_second_secfpn_dcn_4x8_cyclic_20e_nus.py: -------------------------------------------------------------------------------- 1 | _base_ = ['./centerpoint_02pillar_second_secfpn_4x8_cyclic_20e_nus.py'] 2 | 3 | model = dict( 4 | pts_bbox_head=dict( 5 | separate_head=dict( 6 | type='DCNSeparateHead', 7 | dcn_config=dict( 8 | type='DCN', 9 | in_channels=64, 10 | out_channels=64, 11 | kernel_size=3, 12 | padding=1, 13 | groups=4), 14 | init_bias=-2.19, 15 | final_kernel=3))) 16 | -------------------------------------------------------------------------------- /mmdet3d/core/voxel/builder.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | import mmcv 3 | 4 | from . 
import voxel_generator 5 | 6 | 7 | def build_voxel_generator(cfg, **kwargs): 8 | """Builder of voxel generator.""" 9 | if isinstance(cfg, voxel_generator.VoxelGenerator): 10 | return cfg 11 | elif isinstance(cfg, dict): 12 | return mmcv.runner.obj_from_dict( 13 | cfg, voxel_generator, default_args=kwargs) 14 | else: 15 | raise TypeError('Invalid type {} for building a sampler'.format( 16 | type(cfg))) 17 | -------------------------------------------------------------------------------- /configs/centerpoint/centerpoint_0075voxel_second_secfpn_dcn_4x8_cyclic_20e_nus.py: -------------------------------------------------------------------------------- 1 | _base_ = ['./centerpoint_0075voxel_second_secfpn_4x8_cyclic_20e_nus.py'] 2 | 3 | model = dict( 4 | pts_bbox_head=dict( 5 | separate_head=dict( 6 | type='DCNSeparateHead', 7 | dcn_config=dict( 8 | type='DCN', 9 | in_channels=64, 10 | out_channels=64, 11 | kernel_size=3, 12 | padding=1, 13 | groups=4), 14 | init_bias=-2.19, 15 | final_kernel=3))) 16 | -------------------------------------------------------------------------------- /configs/_base_/default_runtime.py: -------------------------------------------------------------------------------- 1 | checkpoint_config = dict(interval=1) 2 | # yapf:disable push 3 | # By default we use textlogger hook and tensorboard 4 | # For more loggers see 5 | # https://mmcv.readthedocs.io/en/latest/api.html#mmcv.runner.LoggerHook 6 | log_config = dict( 7 | interval=50, 8 | hooks=[ 9 | dict(type='TextLoggerHook'), 10 | dict(type='TensorboardLoggerHook') 11 | ]) 12 | # yapf:enable 13 | dist_params = dict(backend='nccl') 14 | log_level = 'INFO' 15 | work_dir = None 16 | load_from = None 17 | resume_from = None 18 | workflow = [('train', 1)] 19 | -------------------------------------------------------------------------------- /mmdet3d/models/losses/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from mmdet.models.losses import FocalLoss, SmoothL1Loss, binary_cross_entropy 3 | from .axis_aligned_iou_loss import AxisAlignedIoULoss, axis_aligned_iou_loss 4 | from .chamfer_distance import ChamferDistance, chamfer_distance 5 | from .paconv_regularization_loss import PAConvRegularizationLoss 6 | 7 | __all__ = [ 8 | 'FocalLoss', 'SmoothL1Loss', 'binary_cross_entropy', 'ChamferDistance', 9 | 'chamfer_distance', 'axis_aligned_iou_loss', 'AxisAlignedIoULoss', 10 | 'PAConvRegularizationLoss' 11 | ] 12 | -------------------------------------------------------------------------------- /mmdet3d/ops/pointnet_modules/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from .builder import build_sa_module 3 | from .paconv_sa_module import (PAConvCUDASAModule, PAConvCUDASAModuleMSG, 4 | PAConvSAModule, PAConvSAModuleMSG) 5 | from .point_fp_module import PointFPModule 6 | from .point_sa_module import PointSAModule, PointSAModuleMSG 7 | 8 | __all__ = [ 9 | 'build_sa_module', 'PointSAModuleMSG', 'PointSAModule', 'PointFPModule', 10 | 'PAConvSAModule', 'PAConvSAModuleMSG', 'PAConvCUDASAModule', 11 | 'PAConvCUDASAModuleMSG' 12 | ] 13 | -------------------------------------------------------------------------------- /mmdet3d/ops/voxel/src/voxelization.cpp: -------------------------------------------------------------------------------- 1 | #include 2 | #include "voxelization.h" 3 | 4 | namespace voxelization { 5 | 6 | PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) { 7 | m.def("hard_voxelize", &hard_voxelize, "hard voxelize"); 8 | m.def("dynamic_voxelize", &dynamic_voxelize, "dynamic voxelization"); 9 | m.def("dynamic_point_to_voxel_forward", &dynamic_point_to_voxel_forward, "dynamic point to voxel forward"); 10 | m.def("dynamic_point_to_voxel_backward", &dynamic_point_to_voxel_backward, "dynamic point to voxel backward"); 11 | } 12 | 13 | } // namespace voxelization 14 | -------------------------------------------------------------------------------- /mmdet3d/version.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Open-MMLab. All rights reserved. 2 | 3 | __version__ = '0.17.3' 4 | short_version = __version__ 5 | 6 | 7 | def parse_version_info(version_str): 8 | version_info = [] 9 | for x in version_str.split('.'): 10 | if x.isdigit(): 11 | version_info.append(int(x)) 12 | elif x.find('rc') != -1: 13 | patch_version = x.split('rc') 14 | version_info.append(int(patch_version[0])) 15 | version_info.append(f'rc{patch_version[1]}') 16 | return tuple(version_info) 17 | 18 | 19 | version_info = parse_version_info(__version__) 20 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/models/backbones/__init__.py: -------------------------------------------------------------------------------- 1 | from .second_3d import SECOND3D 2 | from .mask_convnext import MaskConvNeXt 3 | from .mask_resnet import MaskResNet 4 | from .temporal_backbone import TemporalDecoder, BiTemporalPredictor, BiTemporalPredictor_longshort 5 | from .bevformerencoder import BEVFormerEncoder, BEVFormerLayer 6 | from .temporal_cross_attention import TemporalCrossAttention 7 | # from .pool_3d import Pool3D 8 | 9 | __all__ = ["SECOND3D", "MaskConvNeXt", "MaskResNet","TemporalDecoder","BiTemporalPredictor","BEVFormerEncoder","BEVFormerLayer","TemporalCrossAttention", "BiTemporalPredictor_longshort"] 10 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/ops/point_ops/point_ops.py: -------------------------------------------------------------------------------- 1 | import torch 2 | from . 
import point_ops_ext 3 | 4 | 5 | def group_inner_inds(points, inverse_inds, K): 6 | """ 7 | Args: 8 | points: (N, C) 9 | inverse_inds: (N, ) 10 | Return: 11 | group_points: (valid_voxel_num, K, C) 12 | """ 13 | valid_voxel_num = inverse_inds.max().item() + 1 14 | group_inds = torch.full((valid_voxel_num, K), -1, dtype=torch.long, device=points.device) 15 | point_ops_ext.group_inner_inds_wrapper(inverse_inds.contiguous(), group_inds) 16 | group_points = points[group_inds] 17 | return group_points -------------------------------------------------------------------------------- /mmdet3d/models/detectors/two_stage.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from mmdet.models import DETECTORS, TwoStageDetector 3 | from .base import Base3DDetector 4 | 5 | 6 | @DETECTORS.register_module() 7 | class TwoStage3DDetector(Base3DDetector, TwoStageDetector): 8 | """Base class of two-stage 3D detector. 9 | 10 | It inherits original ``:class:TwoStageDetector`` and 11 | ``:class:Base3DDetector``. This class could serve as a base class for all 12 | two-stage 3D detectors. 13 | """ 14 | 15 | def __init__(self, **kwargs): 16 | super(TwoStage3DDetector, self).__init__(**kwargs) 17 | -------------------------------------------------------------------------------- /configs/centerpoint/centerpoint_01voxel_second_secfpn_dcn_circlenms_4x8_cyclic_20e_nus.py: -------------------------------------------------------------------------------- 1 | _base_ = ['./centerpoint_01voxel_second_secfpn_4x8_cyclic_20e_nus.py'] 2 | 3 | model = dict( 4 | pts_bbox_head=dict( 5 | separate_head=dict( 6 | type='DCNSeparateHead', 7 | dcn_config=dict( 8 | type='DCN', 9 | in_channels=64, 10 | out_channels=64, 11 | kernel_size=3, 12 | padding=1, 13 | groups=4), 14 | init_bias=-2.19, 15 | final_kernel=3)), 16 | test_cfg=dict(pts=dict(nms_type='circle'))) 17 | -------------------------------------------------------------------------------- /mmdet3d/core/bbox/coders/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from mmdet.core.bbox import build_bbox_coder 3 | from .anchor_free_bbox_coder import AnchorFreeBBoxCoder 4 | from .centerpoint_bbox_coders import CenterPointBBoxCoder 5 | from .delta_xyzwhlr_bbox_coder import DeltaXYZWLHRBBoxCoder 6 | from .groupfree3d_bbox_coder import GroupFree3DBBoxCoder 7 | from .partial_bin_based_bbox_coder import PartialBinBasedBBoxCoder 8 | 9 | __all__ = [ 10 | 'build_bbox_coder', 'DeltaXYZWLHRBBoxCoder', 'PartialBinBasedBBoxCoder', 11 | 'CenterPointBBoxCoder', 'AnchorFreeBBoxCoder', 'GroupFree3DBBoxCoder' 12 | ] 13 | -------------------------------------------------------------------------------- /configs/centerpoint/centerpoint_0075voxel_second_secfpn_dcn_circlenms_4x8_cyclic_20e_nus.py: -------------------------------------------------------------------------------- 1 | _base_ = ['./centerpoint_0075voxel_second_secfpn_4x8_cyclic_20e_nus.py'] 2 | 3 | model = dict( 4 | pts_bbox_head=dict( 5 | separate_head=dict( 6 | type='DCNSeparateHead', 7 | dcn_config=dict( 8 | type='DCN', 9 | in_channels=64, 10 | out_channels=64, 11 | kernel_size=3, 12 | padding=1, 13 | groups=4), 14 | init_bias=-2.19, 15 | final_kernel=3)), 16 | test_cfg=dict(pts=dict(nms_type='circle'))) 17 | -------------------------------------------------------------------------------- /configs/centerpoint/centerpoint_02pillar_second_secfpn_dcn_circlenms_4x8_cyclic_20e_nus.py: -------------------------------------------------------------------------------- 1 | _base_ = ['./centerpoint_02pillar_second_secfpn_4x8_cyclic_20e_nus.py'] 2 | 3 | model = dict( 4 | pts_bbox_head=dict( 5 | separate_head=dict( 6 | type='DCNSeparateHead', 7 | dcn_config=dict( 8 | type='DCN', 9 | in_channels=64, 10 | out_channels=64, 11 | kernel_size=3, 12 | padding=1, 13 | groups=4), 14 | init_bias=-2.19, 15 | final_kernel=3)), 16 | test_cfg=dict(pts=dict(nms_type='circle'))) 17 | -------------------------------------------------------------------------------- /mmdet3d/models/roi_heads/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from .base_3droi_head import Base3DRoIHead 3 | from .bbox_heads import PartA2BboxHead 4 | from .h3d_roi_head import H3DRoIHead 5 | from .mask_heads import PointwiseSemanticHead, PrimitiveHead 6 | from .part_aggregation_roi_head import PartAggregationROIHead 7 | from .roi_extractors import Single3DRoIAwareExtractor, SingleRoIExtractor 8 | 9 | __all__ = [ 10 | 'Base3DRoIHead', 'PartAggregationROIHead', 'PointwiseSemanticHead', 11 | 'Single3DRoIAwareExtractor', 'PartA2BboxHead', 'SingleRoIExtractor', 12 | 'H3DRoIHead', 'PrimitiveHead' 13 | ] 14 | -------------------------------------------------------------------------------- /configs/_base_/schedules/cosine.py: -------------------------------------------------------------------------------- 1 | # This schedule is mainly used by models with dynamic voxelization 2 | # optimizer 3 | lr = 0.003 # max learning rate 4 | optimizer = dict( 5 | type='AdamW', 6 | lr=lr, 7 | betas=(0.95, 0.99), # the momentum is change during training 8 | weight_decay=0.001) 9 | optimizer_config = dict(grad_clip=dict(max_norm=10, norm_type=2)) 10 | 11 | lr_config = dict( 12 | policy='CosineAnnealing', 13 | warmup='linear', 14 | warmup_iters=1000, 15 | warmup_ratio=1.0 / 10, 16 | min_lr_ratio=1e-5) 17 | 18 | momentum_config = None 19 | 20 | runner = dict(type='EpochBasedRunner', max_epochs=40) 21 | -------------------------------------------------------------------------------- /configs/dynamic_voxelization/dv_second_secfpn_6x8_80e_kitti-3d-car.py: -------------------------------------------------------------------------------- 1 | _base_ = '../second/hv_second_secfpn_6x8_80e_kitti-3d-car.py' 2 | 3 | point_cloud_range = [0, -40, -3, 70.4, 40, 1] 4 | voxel_size = [0.05, 0.05, 0.1] 5 | 6 | model = dict( 7 | type='DynamicVoxelNet', 8 | voxel_layer=dict( 9 | _delete_=True, 10 | max_num_points=-1, 11 | point_cloud_range=point_cloud_range, 12 | voxel_size=voxel_size, 13 | max_voxels=(-1, -1)), 14 | voxel_encoder=dict( 15 | _delete_=True, 16 | type='DynamicSimpleVFE', 17 | voxel_size=voxel_size, 18 | point_cloud_range=point_cloud_range)) 19 | -------------------------------------------------------------------------------- /mmdet3d/apis/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .inference import (convert_SyncBN, inference_detector, 3 | inference_mono_3d_detector, 4 | inference_multi_modality_detector, inference_segmentor, 5 | init_model, show_result_meshlab) 6 | from .test import single_gpu_test 7 | from .train import train_model 8 | 9 | __all__ = [ 10 | 'inference_detector', 'init_model', 'single_gpu_test', 11 | 'inference_mono_3d_detector', 'show_result_meshlab', 'convert_SyncBN', 12 | 'train_model', 'inference_multi_modality_detector', 'inference_segmentor' 13 | ] 14 | -------------------------------------------------------------------------------- /mmdet3d/core/post_processing/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from mmdet.core.post_processing import (merge_aug_bboxes, merge_aug_masks, 3 | merge_aug_proposals, merge_aug_scores, 4 | multiclass_nms) 5 | from .box3d_nms import aligned_3d_nms, box3d_multiclass_nms, circle_nms 6 | from .merge_augs import merge_aug_bboxes_3d 7 | 8 | __all__ = [ 9 | 'multiclass_nms', 'merge_aug_proposals', 'merge_aug_bboxes', 10 | 'merge_aug_scores', 'merge_aug_masks', 'box3d_multiclass_nms', 11 | 'aligned_3d_nms', 'merge_aug_bboxes_3d', 'circle_nms' 12 | ] 13 | -------------------------------------------------------------------------------- /mmdet3d/models/roi_heads/bbox_heads/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from mmdet.models.roi_heads.bbox_heads import (BBoxHead, ConvFCBBoxHead, 3 | DoubleConvFCBBoxHead, 4 | Shared2FCBBoxHead, 5 | Shared4Conv1FCBBoxHead) 6 | from .h3d_bbox_head import H3DBboxHead 7 | from .parta2_bbox_head import PartA2BboxHead 8 | 9 | __all__ = [ 10 | 'BBoxHead', 'ConvFCBBoxHead', 'Shared2FCBBoxHead', 11 | 'Shared4Conv1FCBBoxHead', 'DoubleConvFCBBoxHead', 'PartA2BboxHead', 12 | 'H3DBboxHead' 13 | ] 14 | -------------------------------------------------------------------------------- /tools/create_data.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | 3 | set -x 4 | export PYTHONPATH=`pwd`:$PYTHONPATH 5 | 6 | PARTITION=$1 7 | JOB_NAME=$2 8 | CONFIG=$3 9 | WORK_DIR=$4 10 | GPUS=${GPUS:-1} 11 | GPUS_PER_NODE=${GPUS_PER_NODE:-1} 12 | SRUN_ARGS=${SRUN_ARGS:-""} 13 | JOB_NAME=create_data 14 | 15 | srun -p ${PARTITION} \ 16 | --job-name=${JOB_NAME} \ 17 | --gres=gpu:${GPUS_PER_NODE} \ 18 | --ntasks=${GPUS} \ 19 | --ntasks-per-node=${GPUS_PER_NODE} \ 20 | --kill-on-bad-exit=1 \ 21 | ${SRUN_ARGS} \ 22 | python -u tools/create_data.py kitti \ 23 | --root-path ./data/kitti \ 24 | --out-dir ./data/kitti \ 25 | --extra-tag kitti 26 | -------------------------------------------------------------------------------- /tools/slurm_test.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | 3 | set -x 4 | 5 | PARTITION=$1 6 | JOB_NAME=$2 7 | CONFIG=$3 8 | CHECKPOINT=$4 9 | GPUS=${GPUS:-8} 10 | GPUS_PER_NODE=${GPUS_PER_NODE:-8} 11 | CPUS_PER_TASK=${CPUS_PER_TASK:-5} 12 | PY_ARGS=${@:5} 13 | SRUN_ARGS=${SRUN_ARGS:-""} 14 | 15 | PYTHONPATH="$(dirname $0)/..":$PYTHONPATH \ 16 | srun -p ${PARTITION} \ 17 | --job-name=${JOB_NAME} \ 18 | --gres=gpu:${GPUS_PER_NODE} \ 19 | --ntasks=${GPUS} \ 20 | --ntasks-per-node=${GPUS_PER_NODE} \ 21 | --cpus-per-task=${CPUS_PER_TASK} \ 22 | --kill-on-bad-exit=1 \ 23 | ${SRUN_ARGS} \ 24 | python -u tools/test.py ${CONFIG} ${CHECKPOINT} --launcher="slurm" ${PY_ARGS} 25 | -------------------------------------------------------------------------------- /extra_tools/create_data.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | 3 | set -x 4 | export PYTHONPATH=`pwd`:$PYTHONPATH 5 | 6 | PARTITION=$1 7 | JOB_NAME=$2 8 | CONFIG=$3 9 | WORK_DIR=$4 10 | GPUS=${GPUS:-1} 11 | GPUS_PER_NODE=${GPUS_PER_NODE:-1} 12 | SRUN_ARGS=${SRUN_ARGS:-""} 13 | JOB_NAME=create_data 14 | 15 | srun -p ${PARTITION} \ 16 | --job-name=${JOB_NAME} \ 17 | --gres=gpu:${GPUS_PER_NODE} \ 18 | --ntasks=${GPUS} \ 19 | --ntasks-per-node=${GPUS_PER_NODE} \ 20 | --kill-on-bad-exit=1 \ 21 | ${SRUN_ARGS} \ 22 | python3 -u tools/create_data.py kitti \ 23 | --root-path ./data/kitti \ 24 | 
--out-dir ./data/kitti \ 25 | --extra-tag kitti 26 | -------------------------------------------------------------------------------- /mmdet3d/ops/spconv/include/tensorview/helper_launch.h: -------------------------------------------------------------------------------- 1 | #pragma once 2 | // from pytorch.aten 3 | #include "tensorview.h" 4 | namespace tv 5 | { 6 | namespace launch 7 | { 8 | 9 | template 10 | inline int DivUp(const T1 a, const T2 b) { return (a + b - 1) / b; } 11 | 12 | // Use 1024 threads per block, which requires cuda sm_2x or above 13 | constexpr int CUDA_NUM_THREADS = 1024; 14 | // CUDA: number of blocks for threads. 15 | inline int getBlocks(const int N) 16 | { 17 | TV_ASSERT_RT_ERR(N > 0, "CUDA kernel launch blocks must be positive, but got N=", N); 18 | return DivUp(N, CUDA_NUM_THREADS); 19 | } 20 | } // namespace launch 21 | } // namespace tv 22 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/__init__.py: -------------------------------------------------------------------------------- 1 | from .core.bbox.assigners.hungarian_assigner_3d import HungarianAssigner3D 2 | from .core.bbox.coders.nms_free_coder import NMSFreeCoder 3 | from .core.bbox.match_costs import BBox3DL1Cost 4 | from .datasets import NuScenesSweepDataset 5 | from .datasets.pipelines import ( 6 | PhotoMetricDistortionMultiViewImage, 7 | PadMultiViewImage, 8 | NormalizeMultiviewImage, 9 | RandomResizeCropFlipMultiViewImage, 10 | ) 11 | from .models.backbones import MaskResNet 12 | from .models.detectors import UVTR 13 | from .models.dense_heads import UVTRHead 14 | # from .models.pts_encoder import SparseEncoderHD 15 | from .models.necks import SECOND3DFPN 16 | -------------------------------------------------------------------------------- /tools/slurm_train.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | 3 | set -x 4 | 5 | PARTITION=$1 6 | JOB_NAME=$2 7 | CONFIG=$3 8 | WORK_DIR=$4 9 | GPUS=${GPUS:-8} 10 | GPUS_PER_NODE=${GPUS_PER_NODE:-8} 11 | CPUS_PER_TASK=${CPUS_PER_TASK:-5} 12 | SRUN_ARGS=${SRUN_ARGS:-""} 13 | PY_ARGS=${@:5} 14 | 15 | PYTHONPATH="$(dirname $0)/..":$PYTHONPATH \ 16 | srun -p ${PARTITION} \ 17 | --job-name=${JOB_NAME} \ 18 | --gres=gpu:${GPUS_PER_NODE} \ 19 | --ntasks=${GPUS} \ 20 | --ntasks-per-node=${GPUS_PER_NODE} \ 21 | --cpus-per-task=${CPUS_PER_TASK} \ 22 | --kill-on-bad-exit=1 \ 23 | ${SRUN_ARGS} \ 24 | python -u tools/train.py ${CONFIG} --work-dir=${WORK_DIR} --launcher="slurm" ${PY_ARGS} 25 | -------------------------------------------------------------------------------- /mmdet3d/utils/collect_env.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from mmcv.utils import collect_env as collect_base_env 3 | from mmcv.utils import get_git_hash 4 | 5 | import mmdet 6 | import mmdet3d 7 | import mmseg 8 | 9 | 10 | def collect_env(): 11 | """Collect the information of the running environments.""" 12 | env_info = collect_base_env() 13 | env_info['MMDetection'] = mmdet.__version__ 14 | env_info['MMSegmentation'] = mmseg.__version__ 15 | env_info['MMDetection3D'] = mmdet3d.__version__ + '+' + get_git_hash()[:7] 16 | 17 | return env_info 18 | 19 | 20 | if __name__ == '__main__': 21 | for name, val in collect_env().items(): 22 | print(f'{name}: {val}') 23 | -------------------------------------------------------------------------------- /configs/dynamic_voxelization/dv_pointpillars_secfpn_6x8_160e_kitti-3d-car.py: -------------------------------------------------------------------------------- 1 | _base_ = '../pointpillars/hv_pointpillars_secfpn_6x8_160e_kitti-3d-car.py' 2 | 3 | voxel_size = [0.16, 0.16, 4] 4 | point_cloud_range = [0, -39.68, -3, 69.12, 39.68, 1] 5 | 6 | model = dict( 7 | type='DynamicVoxelNet', 8 | voxel_layer=dict( 9 | max_num_points=-1, 10 | point_cloud_range=point_cloud_range, 11 | voxel_size=voxel_size, 12 | max_voxels=(-1, -1)), 13 | voxel_encoder=dict( 14 | type='DynamicPillarFeatureNet', 15 | in_channels=4, 16 | feat_channels=[64], 17 | with_distance=False, 18 | voxel_size=voxel_size, 19 | point_cloud_range=point_cloud_range)) 20 | -------------------------------------------------------------------------------- /mmdet3d/core/bbox/samplers/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from mmdet.core.bbox.samplers import (BaseSampler, CombinedSampler, 3 | InstanceBalancedPosSampler, 4 | IoUBalancedNegSampler, OHEMSampler, 5 | PseudoSampler, RandomSampler, 6 | SamplingResult) 7 | from .iou_neg_piecewise_sampler import IoUNegPiecewiseSampler 8 | 9 | __all__ = [ 10 | 'BaseSampler', 'PseudoSampler', 'RandomSampler', 11 | 'InstanceBalancedPosSampler', 'IoUBalancedNegSampler', 'CombinedSampler', 12 | 'OHEMSampler', 'SamplingResult', 'IoUNegPiecewiseSampler' 13 | ] 14 | -------------------------------------------------------------------------------- /mmdet3d/models/backbones/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from mmdet.models.backbones import SSDVGG, HRNet, ResNet, ResNetV1d, ResNeXt 3 | from .multi_backbone import MultiBackbone 4 | from .nostem_regnet import NoStemRegNet 5 | from .pointnet2_sa_msg import PointNet2SAMSG 6 | from .pointnet2_sa_ssg import PointNet2SASSG 7 | from .second import SECOND 8 | # from projects_unipad.mmdet3d_plugin.models.backbones import MaskConvNeXt 9 | 10 | __all__ = [ 11 | "ResNet", 12 | "ResNetV1d", 13 | "ResNeXt", 14 | "SSDVGG", 15 | "HRNet", 16 | "NoStemRegNet", 17 | "SECOND", 18 | "PointNet2SASSG", 19 | "PointNet2SAMSG", 20 | "MultiBackbone", 21 | # "MaskConvNeXt", 22 | ] 23 | -------------------------------------------------------------------------------- /configs/free_anchor/hv_pointpillars_regnet-400mf_fpn_sbn-all_free-anchor_4x8_2x_nus-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = './hv_pointpillars_fpn_sbn-all_free-anchor_4x8_2x_nus-3d.py' 2 | 3 | model = dict( 4 | pts_backbone=dict( 5 | _delete_=True, 6 | type='NoStemRegNet', 7 | arch='regnetx_400mf', 8 | init_cfg=dict( 9 | type='Pretrained', checkpoint='open-mmlab://regnetx_400mf'), 10 | out_indices=(1, 2, 3), 11 | frozen_stages=-1, 12 | strides=(1, 2, 2, 2), 13 | base_channels=64, 14 | stem_channels=64, 15 | norm_cfg=dict(type='naiveSyncBN2d', eps=1e-3, momentum=0.01), 16 | norm_eval=False, 17 | style='pytorch'), 18 | pts_neck=dict(in_channels=[64, 160, 384])) 19 | -------------------------------------------------------------------------------- /configs/free_anchor/hv_pointpillars_regnet-1.6gf_fpn_sbn-all_free-anchor_4x8_2x_nus-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = './hv_pointpillars_fpn_sbn-all_free-anchor_4x8_2x_nus-3d.py' 2 | 3 | model = dict( 4 | pts_backbone=dict( 5 | _delete_=True, 6 | type='NoStemRegNet', 7 | arch='regnetx_1.6gf', 8 | init_cfg=dict( 9 | type='Pretrained', checkpoint='open-mmlab://regnetx_1.6gf'), 10 | out_indices=(1, 2, 3), 11 | frozen_stages=-1, 12 | strides=(1, 2, 2, 2), 13 | base_channels=64, 14 | stem_channels=64, 15 | norm_cfg=dict(type='naiveSyncBN2d', eps=1e-3, momentum=0.01), 16 | norm_eval=False, 17 | style='pytorch'), 18 | pts_neck=dict(in_channels=[168, 408, 912])) 19 | -------------------------------------------------------------------------------- /configs/free_anchor/hv_pointpillars_regnet-3.2gf_fpn_sbn-all_free-anchor_4x8_2x_nus-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = './hv_pointpillars_fpn_sbn-all_free-anchor_4x8_2x_nus-3d.py' 2 | 3 | model = dict( 4 | pts_backbone=dict( 5 | _delete_=True, 6 | type='NoStemRegNet', 7 | arch='regnetx_3.2gf', 8 | init_cfg=dict( 9 | type='Pretrained', checkpoint='open-mmlab://regnetx_3.2gf'), 10 | out_indices=(1, 2, 3), 11 | frozen_stages=-1, 12 | strides=(1, 2, 2, 2), 13 | base_channels=64, 14 | stem_channels=64, 15 | norm_cfg=dict(type='naiveSyncBN2d', eps=1e-3, momentum=0.01), 16 | norm_eval=False, 17 | style='pytorch'), 18 | pts_neck=dict(in_channels=[192, 432, 1008])) 19 | -------------------------------------------------------------------------------- /tools/misc/print_config.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | import argparse 3 | from mmcv import Config, DictAction 4 | 5 | 6 | def parse_args(): 7 | parser = argparse.ArgumentParser(description='Print the whole config') 8 | parser.add_argument('config', help='config file path') 9 | parser.add_argument( 10 | '--options', nargs='+', action=DictAction, help='arguments in dict') 11 | args = parser.parse_args() 12 | 13 | return args 14 | 15 | 16 | def main(): 17 | args = parse_args() 18 | 19 | cfg = Config.fromfile(args.config) 20 | if args.options is not None: 21 | cfg.merge_from_dict(args.options) 22 | print(f'Config:\n{cfg.pretty_text}') 23 | 24 | 25 | if __name__ == '__main__': 26 | main() 27 | -------------------------------------------------------------------------------- /configs/dynamic_voxelization/dv_second_secfpn_2x8_cosine_80e_kitti-3d-3class.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_second_secfpn_kitti.py', 3 | '../_base_/datasets/kitti-3d-3class.py', '../_base_/schedules/cosine.py', 4 | '../_base_/default_runtime.py' 5 | ] 6 | 7 | point_cloud_range = [0, -40, -3, 70.4, 40, 1] 8 | voxel_size = [0.05, 0.05, 0.1] 9 | 10 | model = dict( 11 | type='DynamicVoxelNet', 12 | voxel_layer=dict( 13 | _delete_=True, 14 | max_num_points=-1, 15 | point_cloud_range=point_cloud_range, 16 | voxel_size=voxel_size, 17 | max_voxels=(-1, -1)), 18 | voxel_encoder=dict( 19 | _delete_=True, 20 | type='DynamicSimpleVFE', 21 | voxel_size=voxel_size, 22 | point_cloud_range=point_cloud_range)) 23 | -------------------------------------------------------------------------------- /configs/ssn/hv_ssn_regnet-400mf_secfpn_sbn-all_2x16_2x_nus-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = './hv_ssn_secfpn_sbn-all_2x16_2x_nus-3d.py' 2 | # model settings 3 | model = dict( 4 | type='MVXFasterRCNN', 5 | pts_backbone=dict( 6 | _delete_=True, 7 | type='NoStemRegNet', 8 | arch=dict(w0=24, wa=24.48, wm=2.54, group_w=16, depth=22, bot_mul=1.0), 9 | init_cfg=dict( 10 | type='Pretrained', checkpoint='open-mmlab://regnetx_400mf'), 11 | out_indices=(1, 2, 3), 12 | frozen_stages=-1, 13 | strides=(1, 2, 2, 2), 14 | base_channels=64, 15 | stem_channels=64, 16 | norm_cfg=dict(type='naiveSyncBN2d', eps=1e-3, momentum=0.01), 17 | norm_eval=False, 18 | style='pytorch'), 19 | pts_neck=dict(in_channels=[64, 160, 384])) 20 | -------------------------------------------------------------------------------- /mmdet3d/models/detectors/ssd3dnet.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from mmdet.models import DETECTORS 3 | from .votenet import VoteNet 4 | 5 | 6 | @DETECTORS.register_module() 7 | class SSD3DNet(VoteNet): 8 | """3DSSDNet model. 
9 | 10 | https://arxiv.org/abs/2002.10187.pdf 11 | """ 12 | 13 | def __init__(self, 14 | backbone, 15 | bbox_head=None, 16 | train_cfg=None, 17 | test_cfg=None, 18 | init_cfg=None, 19 | pretrained=None): 20 | super(SSD3DNet, self).__init__( 21 | backbone=backbone, 22 | bbox_head=bbox_head, 23 | train_cfg=train_cfg, 24 | test_cfg=test_cfg, 25 | init_cfg=init_cfg, 26 | pretrained=pretrained) 27 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/models/utils/__init__.py: -------------------------------------------------------------------------------- 1 | from .uni3d_detr import Uni3DDETR, UniTransformerDecoder, UniCrossAtten 2 | from .uni3d_viewtrans import Uni3DViewTrans 3 | from .uni3d_voxelpool import Uni3DVoxelPool 4 | from .uni3d_crossattn import Uni3DCrossAttn 5 | from .uni3d_voxelpooldepth import Uni3DVoxelPoolDepth 6 | from .uni3d_viewtransego import Uni3DViewTransEgo 7 | from .uni3d_detr_v2 import Uni3DTransformer, UniTransformerDecoderV2, UniCrossAttenV2 8 | 9 | __all__ = [ 10 | "Uni3DDETR", 11 | "UniTransformerDecoder", 12 | "UniCrossAtten", 13 | "Uni3DViewTrans", 14 | "Uni3DVoxelPool", 15 | "Uni3DCrossAttn", 16 | "Uni3DVoxelPoolDepth", 17 | "Uni3DTransformer", 18 | "UniTransformerDecoderV2", 19 | "UniCrossAttenV2", 20 | "UniTransformerDecoderV3", 21 | "Uni3DViewTransEgo", 22 | ] 23 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/datasets/pipelines/__init__.py: -------------------------------------------------------------------------------- 1 | from .transform_3d import ( 2 | PadMultiViewImage, NormalizeMultiviewImage, 3 | PhotoMetricDistortionMultiViewImage, 4 | RandomResizeCropFlipMultiViewImage, 5 | UnifiedRotScaleTransFlip, 6 | NormalizeIntensity) 7 | from .loading_3d import (LoadMultiViewMultiSweepImageFromFiles) 8 | from .dbsampler import UnifiedDataBaseSampler 9 | from .formatting import CollectUnified3D 10 | from .test_time_aug import MultiRotScaleFlipAug3D 11 | 12 | __all__ = [ 13 | 'PadMultiViewImage', 'NormalizeMultiviewImage', 14 | 'PhotoMetricDistortionMultiViewImage', 15 | 'RandomResizeCropFlipMultiViewImage', 16 | 'LoadMultiViewMultiSweepImageFromFiles', 17 | 'UnifiedRotScaleTransFlip', 'UnifiedDataBaseSampler', 18 | 'MultiRotScaleFlipAug3D', 'NormalizeIntensity' 19 | ] -------------------------------------------------------------------------------- /configs/pointnet2/pointnet2_ssg_16x2_cosine_50e_s3dis_seg-3d-13class.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/datasets/s3dis_seg-3d-13class.py', 3 | '../_base_/models/pointnet2_ssg.py', 4 | '../_base_/schedules/seg_cosine_50e.py', '../_base_/default_runtime.py' 5 | ] 6 | 7 | # data settings 8 | data = dict(samples_per_gpu=16) 9 | evaluation = dict(interval=2) 10 | 11 | # model settings 12 | model = dict( 13 | backbone=dict(in_channels=9), # [xyz, rgb, normalized_xyz] 14 | decode_head=dict( 15 | num_classes=13, ignore_index=13, 16 | loss_decode=dict(class_weight=None)), # S3DIS doesn't use class_weight 17 | test_cfg=dict( 18 | num_points=4096, 19 | block_size=1.0, 20 | sample_rate=0.5, 21 | use_normalized_coord=True, 22 | batch_size=24)) 23 | 24 | # runtime settings 25 | checkpoint_config = dict(interval=2) 26 | -------------------------------------------------------------------------------- /mmdet3d/core/bbox/structures/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) 
OpenMMLab. All rights reserved. 2 | from .base_box3d import BaseInstance3DBoxes 3 | from .box_3d_mode import Box3DMode 4 | from .cam_box3d import CameraInstance3DBoxes 5 | from .coord_3d_mode import Coord3DMode 6 | from .depth_box3d import DepthInstance3DBoxes 7 | from .lidar_box3d import LiDARInstance3DBoxes 8 | from .utils import (get_box_type, get_proj_mat_by_coord_type, limit_period, 9 | mono_cam_box2vis, points_cam2img, rotation_3d_in_axis, 10 | xywhr2xyxyr) 11 | 12 | __all__ = [ 13 | 'Box3DMode', 'BaseInstance3DBoxes', 'LiDARInstance3DBoxes', 14 | 'CameraInstance3DBoxes', 'DepthInstance3DBoxes', 'xywhr2xyxyr', 15 | 'get_box_type', 'rotation_3d_in_axis', 'limit_period', 'points_cam2img', 16 | 'Coord3DMode', 'mono_cam_box2vis', 'get_proj_mat_by_coord_type' 17 | ] 18 | -------------------------------------------------------------------------------- /configs/ssn/hv_ssn_regnet-400mf_secfpn_sbn-all_1x16_2x_lyft-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = './hv_ssn_secfpn_sbn-all_2x16_2x_lyft-3d.py' 2 | # model settings 3 | model = dict( 4 | type='MVXFasterRCNN', 5 | pts_backbone=dict( 6 | _delete_=True, 7 | type='NoStemRegNet', 8 | arch=dict(w0=24, wa=24.48, wm=2.54, group_w=16, depth=22, bot_mul=1.0), 9 | init_cfg=dict( 10 | type='Pretrained', checkpoint='open-mmlab://regnetx_400mf'), 11 | out_indices=(1, 2, 3), 12 | frozen_stages=-1, 13 | strides=(1, 2, 2, 2), 14 | base_channels=64, 15 | stem_channels=64, 16 | norm_cfg=dict(type='naiveSyncBN2d', eps=1e-3, momentum=0.01), 17 | norm_eval=False, 18 | style='pytorch'), 19 | pts_neck=dict(in_channels=[64, 160, 384])) 20 | # dataset settings 21 | data = dict(samples_per_gpu=1, workers_per_gpu=2) 22 | -------------------------------------------------------------------------------- /extra_tools/dist_train_ssl.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | 3 | while true 4 | do 5 | PORT=$(( ((RANDOM<<15)|RANDOM) % 49152 + 10000 )) 6 | status="$(nc -z 127.0.0.1 $PORT < /dev/null &>/dev/null; echo $?)" 7 | if [ "${status}" != "0" ]; then 8 | break; 9 | fi 10 | done 11 | echo $PORT 12 | 13 | GPUS=8 14 | 15 | CONFIG=projects/configs/MIM4D/uvtr_convnext_s_vs0.1_pretrain.py 16 | 17 | 18 | PYTHONPATH="$(dirname $0)/..":$PYTHONPATH \ 19 | python3 -m torch.distributed.launch --nproc_per_node=$GPUS --master_port=$PORT \ 20 | $(dirname "$0")/train.py $CONFIG --launcher pytorch --no-validate 21 | 22 | 23 | CONFIG=projects/configs/MIM4D/uvtr_convnext_s_vs0.1_finetune.py 24 | 25 | PYTHONPATH="$(dirname $0)/..":$PYTHONPATH \ 26 | python3 -m torch.distributed.launch --nproc_per_node=$GPUS --master_port=$PORT \ 27 | $(dirname "$0")/train.py $CONFIG --launcher pytorch 28 | 29 | -------------------------------------------------------------------------------- /configs/regnet/hv_pointpillars_regnet-1.6gf_fpn_sbn-all_4x8_2x_nus-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_pointpillars_fpn_nus.py', 3 | '../_base_/datasets/nus-3d.py', 4 | '../_base_/schedules/schedule_2x.py', 5 | '../_base_/default_runtime.py', 6 | ] 7 | # model settings 8 | model = dict( 9 | type='MVXFasterRCNN', 10 | pts_backbone=dict( 11 | _delete_=True, 12 | type='NoStemRegNet', 13 | arch='regnetx_1.6gf', 14 | init_cfg=dict( 15 | type='Pretrained', checkpoint='open-mmlab://regnetx_1.6gf'), 16 | out_indices=(1, 2, 3), 17 | frozen_stages=-1, 18 | strides=(1, 2, 2, 2), 19 | base_channels=64, 20 | 
stem_channels=64, 21 | norm_cfg=dict(type='naiveSyncBN2d', eps=1e-3, momentum=0.01), 22 | norm_eval=False, 23 | style='pytorch'), 24 | pts_neck=dict(in_channels=[168, 408, 912])) 25 | -------------------------------------------------------------------------------- /configs/_base_/schedules/cyclic_20e.py: -------------------------------------------------------------------------------- 1 | # For nuScenes dataset, we usually evaluate the model at the end of training. 2 | # Since the models are trained by 24 epochs by default, we set evaluation 3 | # interval to be 20. Please change the interval accordingly if you do not 4 | # use a default schedule. 5 | # optimizer 6 | # This schedule is mainly used by models on nuScenes dataset 7 | optimizer = dict(type='AdamW', lr=1e-4, weight_decay=0.01) 8 | # max_norm=10 is better for SECOND 9 | optimizer_config = dict(grad_clip=dict(max_norm=35, norm_type=2)) 10 | lr_config = dict( 11 | policy='cyclic', 12 | target_ratio=(10, 1e-4), 13 | cyclic_times=1, 14 | step_ratio_up=0.4, 15 | ) 16 | momentum_config = dict( 17 | policy='cyclic', 18 | target_ratio=(0.85 / 0.95, 1), 19 | cyclic_times=1, 20 | step_ratio_up=0.4, 21 | ) 22 | 23 | # runtime settings 24 | runner = dict(type='EpochBasedRunner', max_epochs=20) 25 | -------------------------------------------------------------------------------- /mmdet3d/models/dense_heads/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .anchor3d_head import Anchor3DHead 3 | from .anchor_free_mono3d_head import AnchorFreeMono3DHead 4 | from .base_conv_bbox_head import BaseConvBboxHead 5 | from .base_mono3d_dense_head import BaseMono3DDenseHead 6 | from .centerpoint_head import CenterHead 7 | from .fcos_mono3d_head import FCOSMono3DHead 8 | from .free_anchor3d_head import FreeAnchor3DHead 9 | from .groupfree3d_head import GroupFree3DHead 10 | from .parta2_rpn_head import PartA2RPNHead 11 | from .shape_aware_head import ShapeAwareHead 12 | from .ssd_3d_head import SSD3DHead 13 | from .vote_head import VoteHead 14 | 15 | __all__ = [ 16 | 'Anchor3DHead', 'FreeAnchor3DHead', 'PartA2RPNHead', 'VoteHead', 17 | 'SSD3DHead', 'BaseConvBboxHead', 'CenterHead', 'ShapeAwareHead', 18 | 'BaseMono3DDenseHead', 'AnchorFreeMono3DHead', 'FCOSMono3DHead', 19 | 'GroupFree3DHead' 20 | ] 21 | -------------------------------------------------------------------------------- /configs/regnet/hv_pointpillars_regnet-400mf_fpn_sbn-all_4x8_2x_nus-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_pointpillars_fpn_nus.py', 3 | '../_base_/datasets/nus-3d.py', 4 | '../_base_/schedules/schedule_2x.py', 5 | '../_base_/default_runtime.py', 6 | ] 7 | # model settings 8 | model = dict( 9 | type='MVXFasterRCNN', 10 | pts_backbone=dict( 11 | _delete_=True, 12 | type='NoStemRegNet', 13 | arch=dict(w0=24, wa=24.48, wm=2.54, group_w=16, depth=22, bot_mul=1.0), 14 | init_cfg=dict( 15 | type='Pretrained', checkpoint='open-mmlab://regnetx_400mf'), 16 | out_indices=(1, 2, 3), 17 | frozen_stages=-1, 18 | strides=(1, 2, 2, 2), 19 | base_channels=64, 20 | stem_channels=64, 21 | norm_cfg=dict(type='naiveSyncBN2d', eps=1e-3, momentum=0.01), 22 | norm_eval=False, 23 | style='pytorch'), 24 | pts_neck=dict(in_channels=[64, 160, 384])) 25 | -------------------------------------------------------------------------------- /configs/regnet/hv_pointpillars_regnet-400mf_fpn_sbn-all_2x8_2x_lyft-3d.py: 
-------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_pointpillars_fpn_lyft.py', 3 | '../_base_/datasets/lyft-3d.py', 4 | '../_base_/schedules/schedule_2x.py', 5 | '../_base_/default_runtime.py', 6 | ] 7 | # model settings 8 | model = dict( 9 | type='MVXFasterRCNN', 10 | pts_backbone=dict( 11 | _delete_=True, 12 | type='NoStemRegNet', 13 | arch=dict(w0=24, wa=24.48, wm=2.54, group_w=16, depth=22, bot_mul=1.0), 14 | init_cfg=dict( 15 | type='Pretrained', checkpoint='open-mmlab://regnetx_400mf'), 16 | out_indices=(1, 2, 3), 17 | frozen_stages=-1, 18 | strides=(1, 2, 2, 2), 19 | base_channels=64, 20 | stem_channels=64, 21 | norm_cfg=dict(type='naiveSyncBN2d', eps=1e-3, momentum=0.01), 22 | norm_eval=False, 23 | style='pytorch'), 24 | pts_neck=dict(in_channels=[64, 160, 384])) 25 | -------------------------------------------------------------------------------- /configs/votenet/votenet_16x8_sunrgbd-3d-10class.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/datasets/sunrgbd-3d-10class.py', '../_base_/models/votenet.py', 3 | '../_base_/schedules/schedule_3x.py', '../_base_/default_runtime.py' 4 | ] 5 | # model settings 6 | model = dict( 7 | bbox_head=dict( 8 | num_classes=10, 9 | bbox_coder=dict( 10 | type='PartialBinBasedBBoxCoder', 11 | num_sizes=10, 12 | num_dir_bins=12, 13 | with_rot=True, 14 | mean_sizes=[ 15 | [2.114256, 1.620300, 0.927272], [0.791118, 1.279516, 0.718182], 16 | [0.923508, 1.867419, 0.845495], [0.591958, 0.552978, 0.827272], 17 | [0.699104, 0.454178, 0.75625], [0.69519, 1.346299, 0.736364], 18 | [0.528526, 1.002642, 1.172878], [0.500618, 0.632163, 0.683424], 19 | [0.404671, 1.071108, 1.688889], [0.76584, 1.398258, 0.472728] 20 | ]), 21 | )) 22 | -------------------------------------------------------------------------------- /mmdet3d/models/detectors/fcos_mono3d.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from mmdet.models.builder import DETECTORS 3 | from .single_stage_mono3d import SingleStageMono3DDetector 4 | 5 | 6 | @DETECTORS.register_module() 7 | class FCOSMono3D(SingleStageMono3DDetector): 8 | r"""`FCOS3D `_ for monocular 3D object detection. 9 | 10 | Currently please refer to our entry on the 11 | `leaderboard `_. 12 | """ # noqa: E501 13 | 14 | def __init__(self, 15 | backbone, 16 | neck, 17 | bbox_head, 18 | train_cfg=None, 19 | test_cfg=None, 20 | pretrained=None): 21 | super(FCOSMono3D, self).__init__(backbone, neck, bbox_head, train_cfg, 22 | test_cfg, pretrained) 23 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/core/hook/sequentialcontrol.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from mmcv.runner.hooks import HOOKS, Hook 3 | from mmdet3d.core.hook.utils import is_parallel 4 | 5 | __all__ = ['SequentialControlHook'] 6 | 7 | 8 | @HOOKS.register_module() 9 | class SequentialControlHook(Hook): 10 | """ """ 11 | 12 | def __init__(self, temporal_start_epoch=1): 13 | super().__init__() 14 | self.temporal_start_epoch=temporal_start_epoch 15 | 16 | def set_temporal_flag(self, runner, flag): 17 | if is_parallel(runner.model.module): 18 | runner.model.module.module.with_prev=flag 19 | else: 20 | runner.model.module.with_prev = flag 21 | 22 | def before_run(self, runner): 23 | self.set_temporal_flag(runner, False) 24 | 25 | def before_train_epoch(self, runner): 26 | if runner.epoch > self.temporal_start_epoch: 27 | self.set_temporal_flag(runner, True) -------------------------------------------------------------------------------- /configs/regnet/hv_pointpillars_regnet-400mf_fpn_sbn-all_range100_2x8_2x_lyft-3d.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_pointpillars_fpn_range100_lyft.py', 3 | '../_base_/datasets/range100_lyft-3d.py', 4 | '../_base_/schedules/schedule_2x.py', 5 | '../_base_/default_runtime.py', 6 | ] 7 | # model settings 8 | model = dict( 9 | type='MVXFasterRCNN', 10 | pts_backbone=dict( 11 | _delete_=True, 12 | type='NoStemRegNet', 13 | arch=dict(w0=24, wa=24.48, wm=2.54, group_w=16, depth=22, bot_mul=1.0), 14 | init_cfg=dict( 15 | type='Pretrained', checkpoint='open-mmlab://regnetx_400mf'), 16 | out_indices=(1, 2, 3), 17 | frozen_stages=-1, 18 | strides=(1, 2, 2, 2), 19 | base_channels=64, 20 | stem_channels=64, 21 | norm_cfg=dict(type='naiveSyncBN2d', eps=1e-3, momentum=0.01), 22 | norm_eval=False, 23 | style='pytorch'), 24 | pts_neck=dict(in_channels=[64, 160, 384])) 25 | -------------------------------------------------------------------------------- /configs/pointnet2/pointnet2_msg_16x2_cosine_80e_s3dis_seg-3d-13class.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/datasets/s3dis_seg-3d-13class.py', 3 | '../_base_/models/pointnet2_msg.py', 4 | '../_base_/schedules/seg_cosine_50e.py', '../_base_/default_runtime.py' 5 | ] 6 | 7 | # data settings 8 | data = dict(samples_per_gpu=16) 9 | evaluation = dict(interval=2) 10 | 11 | # model settings 12 | model = dict( 13 | backbone=dict(in_channels=9), # [xyz, rgb, normalized_xyz] 14 | decode_head=dict( 15 | num_classes=13, ignore_index=13, 16 | loss_decode=dict(class_weight=None)), # S3DIS doesn't use class_weight 17 | test_cfg=dict( 18 | num_points=4096, 19 | block_size=1.0, 20 | sample_rate=0.5, 21 | use_normalized_coord=True, 22 | batch_size=24)) 23 | 24 | # runtime settings 25 | checkpoint_config = dict(interval=2) 26 | # PointNet2-MSG needs longer training time than PointNet2-SSG 27 | runner = dict(type='EpochBasedRunner', max_epochs=80) 28 | -------------------------------------------------------------------------------- /configs/nuimages/htc_x101_64x4d_fpn_dconv_c3-c5_coco-20e_16x1_20e_nuim.py: -------------------------------------------------------------------------------- 1 | _base_ = './htc_r50_fpn_1x_nuim.py' 2 | model = dict( 3 | pretrained='open-mmlab://resnext101_64x4d', 4 | backbone=dict( 5 | type='ResNeXt', 6 | depth=101, 7 | groups=64, 8 | base_width=4, 9 | num_stages=4, 10 | out_indices=(0, 1, 2, 3), 11 | frozen_stages=1, 12 | norm_cfg=dict(type='BN', requires_grad=True), 13 | norm_eval=True, 14 | style='pytorch', 15 | dcn=dict(type='DCN', 
deform_groups=1, fallback_on_stride=False), 16 | stage_with_dcn=(False, True, True, True))) 17 | 18 | data = dict(samples_per_gpu=1, workers_per_gpu=1) 19 | # learning policy 20 | lr_config = dict(step=[16, 19]) 21 | runner = dict(max_epochs=20) 22 | 23 | load_from = 'http://download.openmmlab.com/mmdetection/v2.0/htc/htc_x101_64x4d_fpn_dconv_c3-c5_mstrain_400_1400_16x1_20e_coco/htc_x101_64x4d_fpn_dconv_c3-c5_mstrain_400_1400_16x1_20e_coco_20200312-946fd751.pth' # noqa 24 | -------------------------------------------------------------------------------- /configs/3dssd/metafile.yml: -------------------------------------------------------------------------------- 1 | Collections: 2 | - Name: 3DSSD 3 | Metadata: 4 | Training Data: KITTI 5 | Training Techniques: 6 | - AdamW 7 | Training Resources: 4x TITAN X 8 | Architecture: 9 | - PointNet++ 10 | Paper: 11 | URL: https://arxiv.org/abs/2002.10187 12 | Title: '3DSSD: Point-based 3D Single Stage Object Detector' 13 | README: configs/3dssd/README.md 14 | Code: 15 | URL: https://github.com/open-mmlab/mmdetection3d/blob/master/mmdet3d/models/detectors/ssd3dnet.py#L7 16 | Version: v0.6.0 17 | 18 | Models: 19 | - Name: 3dssd_4x4_kitti-3d-car 20 | In Collection: 3DSSD 21 | Config: configs/3dssd/3dssd_4x4_kitti-3d-car.py 22 | Metadata: 23 | Training Memory (GB): 4.7 24 | Results: 25 | - Task: 3D Object Detection 26 | Dataset: KITTI 27 | Metrics: 28 | mAP: 78.69 29 | Weights: https://download.openmmlab.com/mmdetection3d/v0.1.0_models/3dssd/3dssd_kitti-3d-car_20210602_124438-b4276f56.pth 30 | -------------------------------------------------------------------------------- /mmdet3d/models/detectors/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .base import Base3DDetector 3 | from .centerpoint import CenterPoint 4 | from .dynamic_voxelnet import DynamicVoxelNet 5 | from .fcos_mono3d import FCOSMono3D 6 | from .groupfree3dnet import GroupFree3DNet 7 | from .h3dnet import H3DNet 8 | from .imvotenet import ImVoteNet 9 | from .imvoxelnet import ImVoxelNet 10 | from .mvx_faster_rcnn import DynamicMVXFasterRCNN, MVXFasterRCNN 11 | from .mvx_two_stage import MVXTwoStageDetector 12 | from .parta2 import PartA2 13 | from .single_stage_mono3d import SingleStageMono3DDetector 14 | from .ssd3dnet import SSD3DNet 15 | from .votenet import VoteNet 16 | from .voxelnet import VoxelNet 17 | 18 | __all__ = [ 19 | 'Base3DDetector', 'VoxelNet', 'DynamicVoxelNet', 'MVXTwoStageDetector', 20 | 'DynamicMVXFasterRCNN', 'MVXFasterRCNN', 'PartA2', 'VoteNet', 'H3DNet', 21 | 'CenterPoint', 'SSD3DNet', 'ImVoteNet', 'SingleStageMono3DDetector', 22 | 'FCOSMono3D', 'ImVoxelNet', 'GroupFree3DNet' 23 | ] 24 | -------------------------------------------------------------------------------- /mmdet3d/core/points/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .base_points import BasePoints 3 | from .cam_points import CameraPoints 4 | from .depth_points import DepthPoints 5 | from .lidar_points import LiDARPoints 6 | 7 | __all__ = ['BasePoints', 'CameraPoints', 'DepthPoints', 'LiDARPoints'] 8 | 9 | 10 | def get_points_type(points_type): 11 | """Get the class of points according to coordinate type. 12 | 13 | Args: 14 | points_type (str): The type of points coordinate. 15 | The valid value are "CAMERA", "LIDAR", or "DEPTH". 16 | 17 | Returns: 18 | class: Points type. 
19 | """ 20 | if points_type == 'CAMERA': 21 | points_cls = CameraPoints 22 | elif points_type == 'LIDAR': 23 | points_cls = LiDARPoints 24 | elif points_type == 'DEPTH': 25 | points_cls = DepthPoints 26 | else: 27 | raise ValueError('Only "points_type" of "CAMERA", "LIDAR", or "DEPTH"' 28 | f' are supported, got {points_type}') 29 | 30 | return points_cls 31 | -------------------------------------------------------------------------------- /configs/_base_/models/hv_pointpillars_fpn_lyft.py: -------------------------------------------------------------------------------- 1 | _base_ = './hv_pointpillars_fpn_nus.py' 2 | 3 | # model settings (based on nuScenes model settings) 4 | # Voxel size for voxel encoder 5 | # Usually voxel size is changed consistently with the point cloud range 6 | # If point cloud range is modified, do remember to change all related 7 | # keys in the config. 8 | model = dict( 9 | pts_voxel_layer=dict( 10 | max_num_points=20, 11 | point_cloud_range=[-80, -80, -5, 80, 80, 3], 12 | max_voxels=(60000, 60000)), 13 | pts_voxel_encoder=dict( 14 | feat_channels=[64], point_cloud_range=[-80, -80, -5, 80, 80, 3]), 15 | pts_middle_encoder=dict(output_shape=[640, 640]), 16 | pts_bbox_head=dict( 17 | num_classes=9, 18 | anchor_generator=dict( 19 | ranges=[[-80, -80, -1.8, 80, 80, -1.8]], custom_values=[]), 20 | bbox_coder=dict(type='DeltaXYZWLHRBBoxCoder', code_size=7)), 21 | # model training settings (based on nuScenes model settings) 22 | train_cfg=dict(pts=dict(code_weight=[1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]))) 23 | -------------------------------------------------------------------------------- /configs/_base_/models/hv_pointpillars_fpn_range100_lyft.py: -------------------------------------------------------------------------------- 1 | _base_ = './hv_pointpillars_fpn_nus.py' 2 | 3 | # model settings (based on nuScenes model settings) 4 | # Voxel size for voxel encoder 5 | # Usually voxel size is changed consistently with the point cloud range 6 | # If point cloud range is modified, do remember to change all related 7 | # keys in the config. 
8 | model = dict( 9 | pts_voxel_layer=dict( 10 | max_num_points=20, 11 | point_cloud_range=[-100, -100, -5, 100, 100, 3], 12 | max_voxels=(60000, 60000)), 13 | pts_voxel_encoder=dict( 14 | feat_channels=[64], point_cloud_range=[-100, -100, -5, 100, 100, 3]), 15 | pts_middle_encoder=dict(output_shape=[800, 800]), 16 | pts_bbox_head=dict( 17 | num_classes=9, 18 | anchor_generator=dict( 19 | ranges=[[-100, -100, -1.8, 100, 100, -1.8]], custom_values=[]), 20 | bbox_coder=dict(type='DeltaXYZWLHRBBoxCoder', code_size=7)), 21 | # model training settings (based on nuScenes model settings) 22 | train_cfg=dict(pts=dict(code_weight=[1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]))) 23 | -------------------------------------------------------------------------------- /configs/h3dnet/metafile.yml: -------------------------------------------------------------------------------- 1 | Collections: 2 | - Name: H3DNet 3 | Metadata: 4 | Training Data: ScanNet 5 | Training Techniques: 6 | - AdamW 7 | Training Resources: 8x GeForce GTX 1080 Ti 8 | Architecture: 9 | Paper: 10 | URL: https://arxiv.org/abs/2006.05682 11 | Title: 'H3DNet: 3D Object Detection Using Hybrid Geometric Primitives' 12 | README: configs/h3dnet/README.md 13 | Code: 14 | URL: https://github.com/open-mmlab/mmdetection3d/blob/master/mmdet3d/models/detectors/h3dnet.py#L10 15 | Version: v0.6.0 16 | 17 | Models: 18 | - Name: h3dnet_3x8_scannet-3d-18class 19 | In Collection: H3DNet 20 | Config: configs/h3dnet/h3dnet_3x8_scannet-3d-18class.py 21 | Metadata: 22 | Training Memory (GB): 7.9 23 | Results: 24 | - Task: 3D Object Detection 25 | Dataset: ScanNet 26 | Metrics: 27 | AP@0.25: 66.43 28 | AP@0.5: 48.01 29 | Weights: https://download.openmmlab.com/mmdetection3d/v0.1.0_models/h3dnet/h3dnet_scannet-3d-18class/h3dnet_scannet-3d-18class_20200830_000136-02e36246.pth 30 | -------------------------------------------------------------------------------- /configs/imvoxelnet/metafile.yml: -------------------------------------------------------------------------------- 1 | Collections: 2 | - Name: ImVoxelNet 3 | Metadata: 4 | Training Data: KITTI 5 | Training Techniques: 6 | - AdamW 7 | Training Resources: 8x Tesla P40 8 | Architecture: 9 | - Anchor3DHead 10 | Paper: 11 | URL: https://arxiv.org/abs/2106.01178 12 | Title: 'ImVoxelNet: Image to Voxels Projection for Monocular and Multi-View General-Purpose 3D Object Detection' 13 | README: configs/imvoxelnet/README.md 14 | Code: 15 | URL: https://github.com/open-mmlab/mmdetection3d/blob/master/mmdet3d/models/detectors/imvoxelnet.py#L11 16 | Version: v0.15.0 17 | 18 | Models: 19 | - Name: imvoxelnet_kitti-3d-car 20 | In Collection: ImVoxelNet 21 | Config: configs/imvoxelnet/imvoxelnet_kitti-3d-car.py 22 | Metadata: 23 | Training Memory (GB): 15.0 24 | Results: 25 | - Task: 3D Object Detection 26 | Dataset: KITTI 27 | Metrics: 28 | mAP: 17.4 29 | Weights: https://download.openmmlab.com/mmdetection3d/v0.1.0_models/imvoxelnet/imvoxelnet_kitti-3d-car_20210610_152323-b9abba85.pth 30 | -------------------------------------------------------------------------------- /mmdet3d/apis/train.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from mmdet.apis import train_detector 3 | from mmseg.apis import train_segmentor 4 | 5 | 6 | def train_model(model, 7 | dataset, 8 | cfg, 9 | distributed=False, 10 | validate=False, 11 | timestamp=None, 12 | meta=None): 13 | """A function wrapper for launching model training according to cfg. 
14 | 15 | Because we need different eval_hook in runner. Should be deprecated in the 16 | future. 17 | """ 18 | if cfg.model.type in ['EncoderDecoder3D']: 19 | train_segmentor( 20 | model, 21 | dataset, 22 | cfg, 23 | distributed=distributed, 24 | validate=validate, 25 | timestamp=timestamp, 26 | meta=meta) 27 | else: 28 | train_detector( 29 | model, 30 | dataset, 31 | cfg, 32 | distributed=distributed, 33 | validate=validate, 34 | timestamp=timestamp, 35 | meta=meta) 36 | -------------------------------------------------------------------------------- /configs/second/hv_second_secfpn_6x8_80e_kitti-3d-car.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_second_secfpn_kitti.py', 3 | '../_base_/datasets/kitti-3d-car.py', '../_base_/schedules/cyclic_40e.py', 4 | '../_base_/default_runtime.py' 5 | ] 6 | point_cloud_range = [0, -40, -3, 70.4, 40, 1] 7 | model = dict( 8 | bbox_head=dict( 9 | type='Anchor3DHead', 10 | num_classes=1, 11 | anchor_generator=dict( 12 | _delete_=True, 13 | type='Anchor3DRangeGenerator', 14 | ranges=[[0, -40.0, -1.78, 70.4, 40.0, -1.78]], 15 | sizes=[[1.6, 3.9, 1.56]], 16 | rotations=[0, 1.57], 17 | reshape_out=True)), 18 | # model training and testing settings 19 | train_cfg=dict( 20 | _delete_=True, 21 | assigner=dict( 22 | type='MaxIoUAssigner', 23 | iou_calculator=dict(type='BboxOverlapsNearest3D'), 24 | pos_iou_thr=0.6, 25 | neg_iou_thr=0.45, 26 | min_pos_iou=0.45, 27 | ignore_iof_thr=-1), 28 | allowed_border=0, 29 | pos_weight=-1, 30 | debug=False)) 31 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/core/bbox/match_costs/match_cost.py: -------------------------------------------------------------------------------- 1 | import torch 2 | from mmdet.core.bbox.match_costs.builder import MATCH_COST 3 | from mmdet3d.core.bbox.iou_calculators import BboxOverlaps3D 4 | 5 | 6 | @MATCH_COST.register_module() 7 | class BBox3DL1Cost(object): 8 | """BBox3DL1Cost. 9 | Args: 10 | weight (int | float, optional): loss_weight 11 | """ 12 | 13 | def __init__(self, weight=1.): 14 | self.weight = weight 15 | 16 | def __call__(self, bbox_pred, gt_bboxes): 17 | bbox_cost = torch.cdist(bbox_pred, gt_bboxes, p=1) 18 | return bbox_cost * self.weight 19 | 20 | 21 | @MATCH_COST.register_module() 22 | class BBox3DIoUCost(object): 23 | """BBox3DIoUCost.
24 | Args: 25 | weight (int | float, optional): loss_weight 26 | """ 27 | 28 | def __init__(self, weight=1., coordinate='lidar'): 29 | self.weight = weight 30 | self.iou_calculator = BboxOverlaps3D(coordinate=coordinate) 31 | 32 | def __call__(self, bbox_pred, gt_bboxes): 33 | iou_cost = -self.iou_calculator(bbox_pred, gt_bboxes) 34 | return iou_cost * self.weight 35 | -------------------------------------------------------------------------------- /configs/paconv/metafile.yml: -------------------------------------------------------------------------------- 1 | Collections: 2 | - Name: PAConv 3 | Metadata: 4 | Training Techniques: 5 | - SGD 6 | Training Resources: 8x Titan XP GPUs 7 | Architecture: 8 | - PAConv 9 | Paper: 10 | URL: https://arxiv.org/abs/2103.14635 11 | Title: 'PAConv: Position Adaptive Convolution with Dynamic Kernel Assembling on Point Clouds' 12 | README: configs/paconv/README.md 13 | Code: 14 | URL: https://github.com/open-mmlab/mmdetection3d/blob/master/mmdet3d/ops/paconv/paconv.py#L106 15 | Version: v0.16.0 16 | 17 | Models: 18 | - Name: paconv_ssg_8x8_cosine_150e_s3dis_seg-3d-13class.py 19 | In Collection: PAConv 20 | Config: configs/paconv/paconv_ssg_8x8_cosine_150e_s3dis_seg-3d-13class.py 21 | Metadata: 22 | Training Data: S3DIS 23 | Training Memory (GB): 5.8 24 | Results: 25 | - Task: 3D Semantic Segmentation 26 | Dataset: S3DIS 27 | Metrics: 28 | mIoU: 66.65 29 | Weights: https://download.openmmlab.com/mmdetection3d/v0.1.0_models/paconv/paconv_ssg_8x8_cosine_150e_s3dis_seg-3d-13class/paconv_ssg_8x8_cosine_150e_s3dis_seg-3d-13class_20210729_200615-2147b2d1.pth 30 | -------------------------------------------------------------------------------- /mmdet3d/ops/furthest_point_sample/utils.py: -------------------------------------------------------------------------------- 1 | import torch 2 | 3 | 4 | def calc_square_dist(point_feat_a, point_feat_b, norm=True): 5 | """Calculating square distance between a and b. 6 | 7 | Args: 8 | point_feat_a (Tensor): (B, N, C) Feature vector of each point. 9 | point_feat_b (Tensor): (B, M, C) Feature vector of each point. 10 | norm (Bool): Whether to normalize the distance. 11 | Default: True. 12 | 13 | Returns: 14 | Tensor: (B, N, M) Distance between each pair points. 15 | """ 16 | length_a = point_feat_a.shape[1] 17 | length_b = point_feat_b.shape[1] 18 | num_channel = point_feat_a.shape[-1] 19 | # [bs, n, 1] 20 | a_square = torch.sum(point_feat_a.unsqueeze(dim=2).pow(2), dim=-1) 21 | # [bs, 1, m] 22 | b_square = torch.sum(point_feat_b.unsqueeze(dim=1).pow(2), dim=-1) 23 | a_square = a_square.repeat((1, 1, length_b)) # [bs, n, m] 24 | b_square = b_square.repeat((1, length_a, 1)) # [bs, n, m] 25 | 26 | coor = torch.matmul(point_feat_a, point_feat_b.transpose(1, 2)) 27 | 28 | dist = a_square + b_square - 2 * coor 29 | if norm: 30 | dist = torch.sqrt(dist) / num_channel 31 | return dist 32 | -------------------------------------------------------------------------------- /mmdet3d/utils/logger.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | import logging 3 | from mmcv.utils import get_logger 4 | 5 | 6 | def get_root_logger(log_file=None, log_level=logging.INFO, name='mmdet3d'): 7 | """Get root logger and add a keyword filter to it. 8 | 9 | The logger will be initialized if it has not been initialized. By default a 10 | StreamHandler will be added. If `log_file` is specified, a FileHandler will 11 | also be added. 
The name of the root logger is the top-level package name, 12 | e.g., "mmdet3d". 13 | 14 | Args: 15 | log_file (str, optional): File path of log. Defaults to None. 16 | log_level (int, optional): The level of logger. 17 | Defaults to logging.INFO. 18 | name (str, optional): The name of the root logger, also used as a 19 | filter keyword. Defaults to 'mmdet3d'. 20 | 21 | Returns: 22 | :obj:`logging.Logger`: The obtained logger 23 | """ 24 | logger = get_logger(name=name, log_file=log_file, log_level=log_level) 25 | 26 | # add a logging filter 27 | logging_filter = logging.Filter(name) 28 | logging_filter.filter = lambda record: record.find(name) != -1 29 | 30 | return logger 31 | -------------------------------------------------------------------------------- /configs/mvxnet/metafile.yml: -------------------------------------------------------------------------------- 1 | Collections: 2 | - Name: MVX-Net 3 | Metadata: 4 | Training Data: KITTI 5 | Training Techniques: 6 | - AdamW 7 | Training Resources: 8x V100 GPUs 8 | Architecture: 9 | - Feature Pyramid Network 10 | - Dynamic Voxelization 11 | Paper: 12 | URL: https://arxiv.org/abs/1904.01649 13 | Title: 'MVX-Net: Multimodal VoxelNet for 3D Object Detection' 14 | README: configs/mvxnet/README.md 15 | Code: 16 | URL: https://github.com/open-mmlab/mmdetection3d/blob/master/mmdet3d/models/detectors/mvx_two_stage.py#L20 17 | Version: v0.5.0 18 | 19 | Models: 20 | - Name: dv_mvx-fpn_second_secfpn_adamw_2x8_80e_kitti-3d-3class 21 | In Collection: MVX-Net 22 | Config: configs/mvxnet/dv_mvx-fpn_second_secfpn_adamw_2x8_80e_kitti-3d-3class.py 23 | Metadata: 24 | Training Memory (GB): 6.7 25 | Results: 26 | - Task: 3D Object Detection 27 | Dataset: KITTI 28 | Metrics: 29 | mAP: 63.0 30 | Weights: https://download.openmmlab.com/mmdetection3d/v0.1.0_models/mvxnet/dv_mvx-fpn_second_secfpn_adamw_2x8_80e_kitti-3d-3class/dv_mvx-fpn_second_secfpn_adamw_2x8_80e_kitti-3d-3class_20200621_003904-10140f2d.pth 31 | -------------------------------------------------------------------------------- /tools/model_converters/publish_model.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | import argparse 3 | import subprocess 4 | import torch 5 | 6 | 7 | def parse_args(): 8 | parser = argparse.ArgumentParser( 9 | description='Process a checkpoint to be published') 10 | parser.add_argument('in_file', help='input checkpoint filename') 11 | parser.add_argument('out_file', help='output checkpoint filename') 12 | args = parser.parse_args() 13 | return args 14 | 15 | 16 | def process_checkpoint(in_file, out_file): 17 | checkpoint = torch.load(in_file, map_location='cpu') 18 | # remove optimizer for smaller file size 19 | if 'optimizer' in checkpoint: 20 | del checkpoint['optimizer'] 21 | # if it is necessary to remove some sensitive data in checkpoint['meta'], 22 | # add the code here. 
23 | torch.save(checkpoint, out_file) 24 | sha = subprocess.check_output(['sha256sum', out_file]).decode() 25 | final_file = out_file.rstrip('.pth') + '-{}.pth'.format(sha[:8]) 26 | subprocess.Popen(['mv', out_file, final_file]) 27 | 28 | 29 | def main(): 30 | args = parse_args() 31 | process_checkpoint(args.in_file, args.out_file) 32 | 33 | 34 | if __name__ == '__main__': 35 | main() 36 | -------------------------------------------------------------------------------- /mmdet3d/ops/paconv/src/assign_score_withk.cpp: -------------------------------------------------------------------------------- 1 | // Modified from https://github.com/CVMI-Lab/PAConv/tree/main/scene_seg/lib/paconv_lib/src/gpu 2 | 3 | #include 4 | #include 5 | 6 | void assign_score_withk_forward_wrapper( 7 | int B, int N0, int N1, int M, 8 | int K, int O, int aggregate, 9 | const at::Tensor& points, 10 | const at::Tensor& centers, 11 | const at::Tensor& scores, 12 | const at::Tensor& knn_idx, 13 | at::Tensor& output 14 | ); 15 | 16 | void assign_score_withk_backward_wrapper( 17 | int B, int N0, int N1, int M, 18 | int K, int O, int aggregate, 19 | const at::Tensor& grad_out, 20 | const at::Tensor& points, 21 | const at::Tensor& centers, 22 | const at::Tensor& scores, 23 | const at::Tensor& knn_idx, 24 | at::Tensor& grad_points, 25 | at::Tensor& grad_centers, 26 | at::Tensor& grad_scores 27 | ); 28 | 29 | PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) { 30 | m.def("assign_score_withk_forward_wrapper", 31 | &assign_score_withk_forward_wrapper, 32 | "Assign score kernel forward (GPU), save memory version"); 33 | m.def("assign_score_withk_backward_wrapper", 34 | &assign_score_withk_backward_wrapper, 35 | "Assign score kernel backward (GPU), save memory version"); 36 | } 37 | -------------------------------------------------------------------------------- /configs/pointpillars/hv_pointpillars_secfpn_sbn_2x16_2x_waymoD5-3d-car.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_pointpillars_secfpn_waymo.py', 3 | '../_base_/datasets/waymoD5-3d-car.py', 4 | '../_base_/schedules/schedule_2x.py', 5 | '../_base_/default_runtime.py', 6 | ] 7 | 8 | # model settings 9 | model = dict( 10 | type='MVXFasterRCNN', 11 | pts_bbox_head=dict( 12 | type='Anchor3DHead', 13 | num_classes=1, 14 | anchor_generator=dict( 15 | type='AlignedAnchor3DRangeGenerator', 16 | ranges=[[-74.88, -74.88, -0.0345, 74.88, 74.88, -0.0345]], 17 | sizes=[[2.08, 4.73, 1.77]], 18 | rotations=[0, 1.57], 19 | reshape_out=True)), 20 | # model training and testing settings 21 | train_cfg=dict( 22 | _delete_=True, 23 | pts=dict( 24 | assigner=dict( 25 | type='MaxIoUAssigner', 26 | iou_calculator=dict(type='BboxOverlapsNearest3D'), 27 | pos_iou_thr=0.55, 28 | neg_iou_thr=0.4, 29 | min_pos_iou=0.4, 30 | ignore_iof_thr=-1), 31 | allowed_border=0, 32 | code_weight=[1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], 33 | pos_weight=-1, 34 | debug=False))) 35 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/core/hook/syncbncontrol.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 
2 | from mmcv.runner.hooks import HOOKS, Hook 3 | from mmdet3d.core.hook.utils import is_parallel 4 | from torch.nn import SyncBatchNorm 5 | 6 | __all__ = ['SyncbnControlHook'] 7 | 8 | 9 | @HOOKS.register_module() 10 | class SyncbnControlHook(Hook): 11 | """Switch the model's BN layers to SyncBN at a given epoch.""" 12 | 13 | def __init__(self, syncbn_start_epoch=1): 14 | super().__init__() 15 | self.is_syncbn = False 16 | self.syncbn_start_epoch = syncbn_start_epoch 17 | 18 | def cvt_syncbn(self, runner): 19 | if is_parallel(runner.model.module): 20 | runner.model.module.module = \ 21 | SyncBatchNorm.convert_sync_batchnorm(runner.model.module.module, 22 | process_group=None) 23 | else: 24 | runner.model.module = \ 25 | SyncBatchNorm.convert_sync_batchnorm(runner.model.module, 26 | process_group=None) 27 | 28 | def before_train_epoch(self, runner): 29 | if runner.epoch >= self.syncbn_start_epoch and not self.is_syncbn: 30 | print('start using SyncBN') 31 | self.cvt_syncbn(runner) 32 | self.is_syncbn = True 33 | 34 | -------------------------------------------------------------------------------- /configs/mvxnet/README.md: -------------------------------------------------------------------------------- 1 | # MVX-Net: Multimodal VoxelNet for 3D Object Detection 2 | 3 | ## Introduction 4 | 5 | 6 | 7 | We implement MVX-Net and provide its results and models on the KITTI dataset. 8 | 9 | ``` 10 | @inproceedings{sindagi2019mvx, 11 | title={MVX-Net: Multimodal voxelnet for 3D object detection}, 12 | author={Sindagi, Vishwanath A and Zhou, Yin and Tuzel, Oncel}, 13 | booktitle={2019 International Conference on Robotics and Automation (ICRA)}, 14 | pages={7276--7282}, 15 | year={2019}, 16 | organization={IEEE} 17 | } 18 | 19 | ``` 20 | 21 | ## Results 22 | 23 | ### KITTI 24 | 25 | | Backbone |Class| Lr schd | Mem (GB) | Inf time (fps) | mAP | Download | 26 | | :---------: | :-----: | :------: | :------------: | :----: |:----: | :------: | 27 | | [SECFPN](./dv_mvx-fpn_second_secfpn_adamw_2x8_80e_kitti-3d-3class.py)|3 Class|cosine 80e|6.7||63.0|[model](https://download.openmmlab.com/mmdetection3d/v0.1.0_models/mvxnet/dv_mvx-fpn_second_secfpn_adamw_2x8_80e_kitti-3d-3class/dv_mvx-fpn_second_secfpn_adamw_2x8_80e_kitti-3d-3class_20200621_003904-10140f2d.pth) | [log](https://download.openmmlab.com/mmdetection3d/v0.1.0_models/mvxnet/dv_mvx-fpn_second_secfpn_adamw_2x8_80e_kitti-3d-3class/dv_mvx-fpn_second_secfpn_adamw_2x8_80e_kitti-3d-3class_20200621_003904.log.json)| 28 | -------------------------------------------------------------------------------- /configs/imvoxelnet/README.md: -------------------------------------------------------------------------------- 1 | # ImVoxelNet: Image to Voxels Projection for Monocular and Multi-View General-Purpose 3D Object Detection 2 | 3 | ## Introduction 4 | 5 | 6 | 7 | We implement a monocular 3D detector ImVoxelNet and provide its results and checkpoints on the KITTI dataset. 8 | Results for SUN RGB-D, ScanNet and nuScenes are currently available in the ImVoxelNet authors' 9 | [repo](https://github.com/saic-vul/imvoxelnet) (based on mmdetection3d).
10 | 11 | ``` 12 | @article{rukhovich2021imvoxelnet, 13 | title={ImVoxelNet: Image to Voxels Projection for Monocular and Multi-View General-Purpose 3D Object Detection}, 14 | author={Danila Rukhovich, Anna Vorontsova, Anton Konushin}, 15 | journal={arXiv preprint arXiv:2106.01178}, 16 | year={2021} 17 | } 18 | ``` 19 | 20 | ## Results 21 | 22 | ### KITTI 23 | 24 | | Backbone |Class| Lr schd | Mem (GB) | Inf time (fps) | mAP | Download | 25 | | :---------: | :-----: |:-----: | :------: | :------------: | :----: |:----: | 26 | | [ResNet-50](./imvoxelnet_kitti-3d-car.py) | Car | 3x | | |17.4|[model](https://download.openmmlab.com/mmdetection3d/v0.1.0_models/imvoxelnet/imvoxelnet_kitti-3d-car_20210610_152323-b9abba85.pth) | [log](https://download.openmmlab.com/mmdetection3d/v0.1.0_models/imvoxelnet/imvoxelnet_kitti-3d-car_20210610_152323.log.json)| 27 | -------------------------------------------------------------------------------- /mmdet3d/models/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) OpenMMLab. All rights reserved. 2 | from .backbones import * # noqa: F401,F403 3 | from .builder import (FUSION_LAYERS, MIDDLE_ENCODERS, VOXEL_ENCODERS, 4 | build_backbone, build_detector, build_fusion_layer, 5 | build_head, build_loss, build_middle_encoder, 6 | build_model, build_neck, build_roi_extractor, 7 | build_shared_head, build_voxel_encoder) 8 | from .decode_heads import * # noqa: F401,F403 9 | from .dense_heads import * # noqa: F401,F403 10 | from .detectors import * # noqa: F401,F403 11 | from .fusion_layers import * # noqa: F401,F403 12 | from .losses import * # noqa: F401,F403 13 | from .middle_encoders import * # noqa: F401,F403 14 | from .model_utils import * # noqa: F401,F403 15 | from .necks import * # noqa: F401,F403 16 | from .roi_heads import * # noqa: F401,F403 17 | from .segmentors import * # noqa: F401,F403 18 | from .voxel_encoders import * # noqa: F401,F403 19 | 20 | __all__ = [ 21 | 'VOXEL_ENCODERS', 'MIDDLE_ENCODERS', 'FUSION_LAYERS', 'build_backbone', 22 | 'build_neck', 'build_roi_extractor', 'build_shared_head', 'build_head', 23 | 'build_loss', 'build_detector', 'build_fusion_layer', 'build_model', 24 | 'build_middle_encoder', 'build_voxel_encoder' 25 | ] 26 | -------------------------------------------------------------------------------- /configs/_base_/models/pointnet2_msg.py: -------------------------------------------------------------------------------- 1 | _base_ = './pointnet2_ssg.py' 2 | 3 | # model settings 4 | model = dict( 5 | backbone=dict( 6 | _delete_=True, 7 | type='PointNet2SAMSG', 8 | in_channels=6, # [xyz, rgb], should be modified with dataset 9 | num_points=(1024, 256, 64, 16), 10 | radii=((0.05, 0.1), (0.1, 0.2), (0.2, 0.4), (0.4, 0.8)), 11 | num_samples=((16, 32), (16, 32), (16, 32), (16, 32)), 12 | sa_channels=(((16, 16, 32), (32, 32, 64)), ((64, 64, 128), (64, 96, 13 | 128)), 14 | ((128, 196, 256), (128, 196, 256)), ((256, 256, 512), 15 | (256, 384, 512))), 16 | aggregation_channels=(None, None, None, None), 17 | fps_mods=(('D-FPS'), ('D-FPS'), ('D-FPS'), ('D-FPS')), 18 | fps_sample_range_lists=((-1), (-1), (-1), (-1)), 19 | dilated_group=(False, False, False, False), 20 | out_indices=(0, 1, 2, 3), 21 | sa_cfg=dict( 22 | type='PointSAModuleMSG', 23 | pool_mod='max', 24 | use_xyz=True, 25 | normalize_xyz=False)), 26 | decode_head=dict( 27 | fp_channels=((1536, 256, 256), (512, 256, 256), (352, 256, 128), 28 | (128, 128, 128, 128)))) 29 | 
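A note on the `_base_`/`_delete_` pattern used in `pointnet2_msg.py` above: the MSG config inherits everything from `pointnet2_ssg.py`, and because the backbone dict carries `_delete_=True`, the SSG backbone keys are dropped wholesale rather than merged, while the `decode_head` override is merged key by key. A minimal sketch of how one might inspect the merged result, assuming an mmcv 1.x environment and paths relative to the repository root (the expected values are read off the configs, not from an actual run):

```python
from mmcv import Config

# Load the derived config; mmcv recursively merges every file listed in `_base_`.
cfg = Config.fromfile('configs/_base_/models/pointnet2_msg.py')

# `_delete_=True` replaced the SSG backbone wholesale, so the MSG type survives.
print(cfg.model.backbone.type)     # expected: 'PointNet2SAMSG'

# Keys that are not overridden (e.g. the decode head type) still come from the SSG base.
print(cfg.model.decode_head.type)  # expected: 'PointNet2Head'
```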
-------------------------------------------------------------------------------- /configs/pointnet2/pointnet2_ssg_16x2_cosine_200e_scannet_seg-3d-20class.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/datasets/scannet_seg-3d-20class.py', 3 | '../_base_/models/pointnet2_ssg.py', 4 | '../_base_/schedules/seg_cosine_200e.py', '../_base_/default_runtime.py' 5 | ] 6 | 7 | # data settings 8 | data = dict(samples_per_gpu=16) 9 | evaluation = dict(interval=5) 10 | 11 | # model settings 12 | model = dict( 13 | decode_head=dict( 14 | num_classes=20, 15 | ignore_index=20, 16 | # `class_weight` is generated in data pre-processing, saved in 17 | # `data/scannet/seg_info/train_label_weight.npy` 18 | # you can copy paste the values here, or input the file path as 19 | # `class_weight=data/scannet/seg_info/train_label_weight.npy` 20 | loss_decode=dict(class_weight=[ 21 | 2.389689, 2.7215734, 4.5944676, 4.8543367, 4.096086, 4.907941, 22 | 4.690836, 4.512031, 4.623311, 4.9242644, 5.358117, 5.360071, 23 | 5.019636, 4.967126, 5.3502126, 5.4023647, 5.4027233, 5.4169416, 24 | 5.3954206, 4.6971426 25 | ])), 26 | test_cfg=dict( 27 | num_points=8192, 28 | block_size=1.5, 29 | sample_rate=0.5, 30 | use_normalized_coord=False, 31 | batch_size=24)) 32 | 33 | # runtime settings 34 | checkpoint_config = dict(interval=5) 35 | -------------------------------------------------------------------------------- /configs/pointpillars/hv_pointpillars_secfpn_sbn_2x16_2x_waymo-3d-car.py: -------------------------------------------------------------------------------- 1 | _base_ = [ 2 | '../_base_/models/hv_pointpillars_secfpn_waymo.py', 3 | '../_base_/datasets/waymoD5-3d-car.py', 4 | '../_base_/schedules/schedule_2x.py', 5 | '../_base_/default_runtime.py', 6 | ] 7 | 8 | # data settings 9 | data = dict(train=dict(dataset=dict(load_interval=1))) 10 | 11 | # model settings 12 | model = dict( 13 | type='MVXFasterRCNN', 14 | pts_bbox_head=dict( 15 | type='Anchor3DHead', 16 | num_classes=1, 17 | anchor_generator=dict( 18 | type='AlignedAnchor3DRangeGenerator', 19 | ranges=[[-74.88, -74.88, -0.0345, 74.88, 74.88, -0.0345]], 20 | sizes=[[2.08, 4.73, 1.77]], 21 | rotations=[0, 1.57], 22 | reshape_out=True)), 23 | # model training and testing settings 24 | train_cfg=dict( 25 | _delete_=True, 26 | pts=dict( 27 | assigner=dict( 28 | type='MaxIoUAssigner', 29 | iou_calculator=dict(type='BboxOverlapsNearest3D'), 30 | pos_iou_thr=0.55, 31 | neg_iou_thr=0.4, 32 | min_pos_iou=0.4, 33 | ignore_iof_thr=-1), 34 | allowed_border=0, 35 | code_weight=[1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], 36 | pos_weight=-1, 37 | debug=False))) 38 | -------------------------------------------------------------------------------- /projects/mmdet3d_plugin/ops/point_ops/src/point_ops.cpp: -------------------------------------------------------------------------------- 1 | #include 2 | #include 3 | 4 | #define CHECK_CUDA(x) do { \ 5 | if (!x.type().is_cuda()) { \ 6 | fprintf(stderr, "%s must be CUDA tensor at %s:%d\n", #x, __FILE__, __LINE__); \ 7 | exit(-1); \ 8 | } \ 9 | } while (0) 10 | #define CHECK_CONTIGUOUS(x) do { \ 11 | if (!x.is_contiguous()) { \ 12 | fprintf(stderr, "%s must be contiguous tensor at %s:%d\n", #x, __FILE__, __LINE__); \ 13 | exit(-1); \ 14 | } \ 15 | } while (0) 16 | #define CHECK_INPUT(x) CHECK_CUDA(x);CHECK_CONTIGUOUS(x) 17 | 18 | void group_inner_inds_launcher(int N, int M, int K, const long *inverse_inds, long *group_inds); 19 | 20 | int group_inner_inds_wrapper(at::Tensor 
inverse_inds_tensor, at::Tensor group_inds_tensor) { 21 | CHECK_INPUT(inverse_inds_tensor); 22 | CHECK_INPUT(group_inds_tensor); 23 | 24 | int N = inverse_inds_tensor.size(0); 25 | int M = group_inds_tensor.size(0); 26 | int K = group_inds_tensor.size(1); 27 | 28 | const long *inverse_inds = inverse_inds_tensor.data_ptr(); 29 | long *group_inds = group_inds_tensor.data_ptr(); 30 | 31 | group_inner_inds_launcher(N, M, K, inverse_inds, group_inds); 32 | return 1; 33 | } 34 | 35 | PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) { 36 | m.def("group_inner_inds_wrapper", &group_inner_inds_wrapper, "group_inner_inds_wrapper"); 37 | } -------------------------------------------------------------------------------- /mmdet3d/ops/spconv/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright 2019 Yan Yan 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | 15 | from .conv import (SparseConv2d, SparseConv3d, SparseConvTranspose2d, 16 | SparseConvTranspose3d, SparseInverseConv2d, 17 | SparseInverseConv3d, SubMConv2d, SubMConv3d) 18 | from .modules import SparseModule, SparseSequential 19 | from .pool import SparseMaxPool2d, SparseMaxPool3d 20 | from .structure import SparseConvTensor, scatter_nd 21 | 22 | __all__ = [ 23 | 'SparseConv2d', 24 | 'SparseConv3d', 25 | 'SubMConv2d', 26 | 'SubMConv3d', 27 | 'SparseConvTranspose2d', 28 | 'SparseConvTranspose3d', 29 | 'SparseInverseConv2d', 30 | 'SparseInverseConv3d', 31 | 'SparseModule', 32 | 'SparseSequential', 33 | 'SparseMaxPool2d', 34 | 'SparseMaxPool3d', 35 | 'SparseConvTensor', 36 | 'scatter_nd', 37 | ] 38 | -------------------------------------------------------------------------------- /configs/_base_/models/pointnet2_ssg.py: -------------------------------------------------------------------------------- 1 | # model settings 2 | model = dict( 3 | type='EncoderDecoder3D', 4 | backbone=dict( 5 | type='PointNet2SASSG', 6 | in_channels=6, # [xyz, rgb], should be modified with dataset 7 | num_points=(1024, 256, 64, 16), 8 | radius=(0.1, 0.2, 0.4, 0.8), 9 | num_samples=(32, 32, 32, 32), 10 | sa_channels=((32, 32, 64), (64, 64, 128), (128, 128, 256), (256, 256, 11 | 512)), 12 | fp_channels=(), 13 | norm_cfg=dict(type='BN2d'), 14 | sa_cfg=dict( 15 | type='PointSAModule', 16 | pool_mod='max', 17 | use_xyz=True, 18 | normalize_xyz=False)), 19 | decode_head=dict( 20 | type='PointNet2Head', 21 | fp_channels=((768, 256, 256), (384, 256, 256), (320, 256, 128), 22 | (128, 128, 128, 128)), 23 | channels=128, 24 | dropout_ratio=0.5, 25 | conv_cfg=dict(type='Conv1d'), 26 | norm_cfg=dict(type='BN1d'), 27 | act_cfg=dict(type='ReLU'), 28 | loss_decode=dict( 29 | type='CrossEntropyLoss', 30 | use_sigmoid=False, 31 | class_weight=None, # should be modified with dataset 32 | loss_weight=1.0)), 33 | # model training and testing settings 34 | train_cfg=dict(), 35 | test_cfg=dict(mode='slide')) 36 | -------------------------------------------------------------------------------- 
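Before the next file, a short usage note for the exports listed in `mmdet3d/ops/spconv/__init__.py` above: voxel features plus integer `(batch_idx, z, y, x)` coordinates are wrapped in a `SparseConvTensor`, which then flows through sparse layers such as `SubMConv3d` inside a `SparseSequential`. The sketch below is illustrative only; it assumes a CUDA build (the bundled kernels are GPU-only), made-up shapes, and that the bundled module follows the spconv 1.x API it is derived from:

```python
import torch
from mmdet3d.ops.spconv import SparseConvTensor, SparseSequential, SubMConv3d

# 100 active voxels with 16-dim features in a (41, 1600, 1408) grid, batch size 1.
features = torch.randn(100, 16).cuda()
indices = torch.randint(0, 41, (100, 4), dtype=torch.int32).cuda()
indices[:, 0] = 0  # column 0 is the batch index

x = SparseConvTensor(features, indices, spatial_shape=[41, 1600, 1408], batch_size=1)

# Submanifold conv keeps the sparsity pattern; plain BN/ReLU act on the feature matrix.
net = SparseSequential(
    SubMConv3d(16, 32, 3, padding=1, indice_key='subm1'),
    torch.nn.BatchNorm1d(32),
    torch.nn.ReLU(),
).cuda()

out = net(x)
print(out.features.shape)  # expected: torch.Size([100, 32])
dense = out.dense()        # dense (N, C, D, H, W) tensor if a regular layout is needed
```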
/mmdet3d/ops/spconv/include/spconv/mp_helper.h: -------------------------------------------------------------------------------- 1 | #ifndef MP_HELPER_H_ 2 | #define MP_HELPER_H_ 3 | #include <type_traits> 4 | #include <utility> 5 | 6 | namespace spconv { 7 | template <class... T> 8 | struct mp_list {}; 9 | 10 | template <class T, T... I> 11 | using mp_list_c = mp_list<std::integral_constant<T, I>...>; 12 | 13 | namespace detail { 14 | 15 | template <class... T, class F> 16 | constexpr F mp_for_each_impl(mp_list<T...>, F &&f) { 17 | return std::initializer_list<int>{(f(T()), 0)...}, std::forward<F>(f); 18 | } 19 | 20 | template <class F> 21 | constexpr F mp_for_each_impl(mp_list<>, F &&f) { 22 | return std::forward<F>(f); 23 | } 24 | 25 | } // namespace detail 26 | 27 | namespace detail { 28 | 29 | template <class A, template <class...> class B> 30 | struct mp_rename_impl { 31 | // An error "no type named 'type'" here means that the first argument to 32 | // mp_rename is not a list 33 | }; 34 | 35 | template