├── .gitignore
├── LICENSE
├── README.md
├── config
├── EfficientNet-Lite
│ ├── nanodet-EfficientNet-Lite0_320.yml
│ ├── nanodet-EfficientNet-Lite1_416.yml
│ └── nanodet-EfficientNet-Lite2_512.yml
├── RepVGG
│ └── nanodet-RepVGG-A0_416.yml
├── Transformer
│ └── nanodet-t.yml
├── nanodet-g-mod.yml
├── nanodet-m-416.yml
├── nanodet-m-640-mod.yml
├── nanodet-m.yml
└── nanodet_custom_xml_dataset.yml
├── demo
├── demo-inference-with-pytorch.ipynb
└── demo.py
├── demo_android_ncnn
├── .gitignore
├── Android_demo.jpg
├── LICENSE
├── README.md
├── app
│ ├── .gitignore
│ ├── build.gradle
│ ├── proguard-rules.pro
│ └── src
│ │ ├── androidTest
│ │ └── java
│ │ │ └── com
│ │ │ └── rangi
│ │ │ └── nanodet
│ │ │ └── ExampleInstrumentedTest.java
│ │ ├── main
│ │ ├── AndroidManifest.xml
│ │ ├── cpp
│ │ │ ├── CMakeLists.txt
│ │ │ ├── NanoDet.cpp
│ │ │ ├── NanoDet.h
│ │ │ ├── YoloV4.cpp
│ │ │ ├── YoloV4.h
│ │ │ ├── YoloV5.cpp
│ │ │ ├── YoloV5.h
│ │ │ └── jni_interface.cpp
│ │ ├── java
│ │ │ └── com
│ │ │ │ └── rangi
│ │ │ │ └── nanodet
│ │ │ │ ├── AppCrashHandler.java
│ │ │ │ ├── Box.java
│ │ │ │ ├── MainActivity.java
│ │ │ │ ├── NanoDet.java
│ │ │ │ ├── NcnnApp.java
│ │ │ │ ├── WelcomeActivity.java
│ │ │ │ ├── YOLOv4.java
│ │ │ │ └── YOLOv5.java
│ │ └── res
│ │ │ ├── drawable-v24
│ │ │ └── ic_launcher_foreground.xml
│ │ │ ├── drawable-xxhdpi
│ │ │ ├── cpu.png
│ │ │ ├── gpu.png
│ │ │ └── ncnn_icon.png
│ │ │ ├── drawable
│ │ │ ├── cpu_gpu_bg.xml
│ │ │ └── ic_launcher_background.xml
│ │ │ ├── layout
│ │ │ ├── activity_main.xml
│ │ │ └── activity_welcome.xml
│ │ │ ├── mipmap-anydpi-v26
│ │ │ ├── ic_launcher.xml
│ │ │ └── ic_launcher_round.xml
│ │ │ ├── mipmap-hdpi
│ │ │ ├── ic_launcher.png
│ │ │ └── ic_launcher_round.png
│ │ │ ├── mipmap-mdpi
│ │ │ ├── ic_launcher.png
│ │ │ └── ic_launcher_round.png
│ │ │ ├── mipmap-xhdpi
│ │ │ ├── ic_launcher.png
│ │ │ └── ic_launcher_round.png
│ │ │ ├── mipmap-xxhdpi
│ │ │ ├── ic_launcher.png
│ │ │ └── ic_launcher_round.png
│ │ │ ├── mipmap-xxxhdpi
│ │ │ ├── ic_launcher.png
│ │ │ └── ic_launcher_round.png
│ │ │ └── values
│ │ │ ├── colors.xml
│ │ │ ├── strings.xml
│ │ │ └── styles.xml
│ │ └── test
│ │ └── java
│ │ └── com
│ │ └── rangi
│ │ └── nanodet
│ │ └── ExampleUnitTest.java
├── build.gradle
├── gradle.properties
├── gradle
│ └── wrapper
│ │ ├── gradle-wrapper.jar
│ │ └── gradle-wrapper.properties
├── gradlew
├── gradlew.bat
└── settings.gradle
├── demo_libtorch
├── CMakeLists.txt
├── README.md
├── main.cpp
├── nanodet_libtorch.cpp
└── nanodet_libtorch.h
├── demo_mnn
├── CMakeLists.txt
├── README.md
├── imgs
│ ├── 000252.jpg
│ └── 000258.jpg
├── main.cpp
├── nanodet_mnn.cpp
├── nanodet_mnn.hpp
├── python
│ └── demo_mnn.py
└── results
│ ├── 000252.jpg
│ └── 000258.jpg
├── demo_ncnn
├── CMakeLists.txt
├── README.md
├── benchmark.jpg
├── main.cpp
├── nanodet.cpp
├── nanodet.h
└── python
│ └── demo_ncnn.py
├── demo_openvino
├── CMakeLists.txt
├── README.md
├── main.cpp
├── nanodet_openvino.cpp
└── nanodet_openvino.h
├── docs
├── config_file_detail.md
└── imgs
│ ├── Android_demo.jpg
│ ├── Model_arch.png
│ └── Title.jpg
├── nanodet
├── data
│ ├── collate.py
│ ├── dataset
│ │ ├── __init__.py
│ │ ├── base.py
│ │ ├── coco.py
│ │ └── xml_dataset.py
│ └── transform
│ │ ├── __init__.py
│ │ ├── color.py
│ │ ├── mosaic.py
│ │ ├── pipeline.py
│ │ └── warp.py
├── evaluator
│ ├── __init__.py
│ └── coco_detection.py
├── model
│ ├── arch
│ │ ├── __init__.py
│ │ └── one_stage_detector.py
│ ├── backbone
│ │ ├── __init__.py
│ │ ├── custom_csp.py
│ │ ├── efficientnet_lite.py
│ │ ├── ghostnet.py
│ │ ├── mobilenetv2.py
│ │ ├── repvgg.py
│ │ ├── resnet.py
│ │ └── shufflenetv2.py
│ ├── fpn
│ │ ├── __init__.py
│ │ ├── fpn.py
│ │ ├── pan.py
│ │ └── tan.py
│ ├── head
│ │ ├── __init__.py
│ │ ├── assigner
│ │ │ ├── assign_result.py
│ │ │ ├── atss_assigner.py
│ │ │ └── base_assigner.py
│ │ ├── gfl_head.py
│ │ └── nanodet_head.py
│ ├── loss
│ │ ├── gfocal_loss.py
│ │ ├── iou_loss.py
│ │ └── utils.py
│ └── module
│ │ ├── activation.py
│ │ ├── conv.py
│ │ ├── init_weights.py
│ │ ├── nms.py
│ │ ├── norm.py
│ │ ├── scale.py
│ │ └── transformer.py
├── trainer
│ ├── __init__.py
│ ├── dist_trainer.py
│ ├── task.py
│ └── trainer.py
└── util
│ ├── __init__.py
│ ├── box_transform.py
│ ├── check_point.py
│ ├── config.py
│ ├── data_parallel.py
│ ├── distributed_data_parallel.py
│ ├── flops_counter.py
│ ├── logger.py
│ ├── misc.py
│ ├── path.py
│ ├── rank_filter.py
│ ├── scatter_gather.py
│ ├── util_mixins.py
│ ├── visualization.py
│ └── yacs.py
├── requirements.txt
├── setup.py
└── tools
├── convert_old_checkpoint.py
├── deprecated
├── test.py
└── train.py
├── export_onnx.py
├── export_torchscript.py
├── flops.py
├── inference.py
├── show_dataset.py
├── test.py
└── train.py
/.gitignore:
--------------------------------------------------------------------------------
1 | # Byte-compiled / optimized / DLL files
2 | __pycache__/
3 | *.py[cod]
4 | *$py.class
5 |
6 | # C extensions
7 | *.so
8 |
9 | # Distribution / packaging
10 | .Python
11 | build/
12 | develop-eggs/
13 | dist/
14 | downloads/
15 | eggs/
16 | .eggs/
17 | lib/
18 | lib64/
19 | parts/
20 | sdist/
21 | var/
22 | wheels/
23 | *.egg-info/
24 | .installed.cfg
25 | *.egg
26 | MANIFEST
27 | workspace/
28 | # PyInstaller
29 | # Usually these files are written by a python script from a template
30 | # before PyInstaller builds the exe, so as to inject date/other infos into it.
31 | *.manifest
32 | *.spec
33 |
34 | # Installer logs
35 | pip-log.txt
36 | pip-delete-this-directory.txt
37 |
38 | # Unit test / coverage reports
39 | htmlcov/
40 | .tox/
41 | .coverage
42 | .coverage.*
43 | .cache
44 | nosetests.xml
45 | coverage.xml
46 | *.cover
47 | .hypothesis/
48 | .pytest_cache/
49 |
50 | # Translations
51 | *.mo
52 | *.pot
53 |
54 | # Django stuff:
55 | *.log
56 | local_settings.py
57 | db.sqlite3
58 |
59 | # Flask stuff:
60 | instance/
61 | .webassets-cache
62 |
63 | # Scrapy stuff:
64 | .scrapy
65 |
66 | # Sphinx documentation
67 | docs/_build/
68 |
69 | # PyBuilder
70 | target/
71 |
72 | # Jupyter Notebook
73 | .ipynb_checkpoints
74 |
75 | # pyenv
76 | .python-version
77 |
78 | # celery beat schedule file
79 | celerybeat-schedule
80 |
81 | # SageMath parsed files
82 | *.sage.py
83 |
84 | # Environments
85 | .env
86 | .venv
87 | env/
88 | venv/
89 | ENV/
90 | env.bak/
91 | venv.bak/
92 |
93 | # Spyder project settings
94 | .spyderproject
95 | .spyproject
96 |
97 | # Rope project settings
98 | .ropeproject
99 |
100 | # mkdocs documentation
101 | /site
102 |
103 | # mypy
104 | .mypy_cache/
105 |
106 | .vscode
107 | .idea
108 | .DS_Store
109 |
110 | # custom
111 | *.pkl
112 | *.pkl.json
113 | *.log.json
114 | work_dirs/
115 |
116 | # Pytorch
117 | *.pth
118 | *.py~
119 | *.sh~
120 |
--------------------------------------------------------------------------------
/config/EfficientNet-Lite/nanodet-EfficientNet-Lite0_320.yml:
--------------------------------------------------------------------------------
1 | # nanodet-EfficientNet-Lite0_320
2 | # COCO mAP(0.5:0.95) = 0.247
3 | # AP_50 = 0.404
4 | # AP_75 = 0.250
5 | # AP_small = 0.079
6 | # AP_m = 0.243
7 | # AP_l = 0.406
8 | save_dir: workspace/efficient0_320
9 | model:
10 | arch:
11 | name: OneStageDetector
12 | backbone:
13 | name: EfficientNetLite
14 | model_name: efficientnet_lite0
15 | out_stages: [2,4,6]
16 | activation: ReLU6
17 | fpn:
18 | name: PAN
19 | in_channels: [40, 112, 320]
20 | out_channels: 96
21 | start_level: 0
22 | num_outs: 3
23 | head:
24 | name: NanoDetHead
25 | num_classes: 80
26 | input_channel: 96
27 | feat_channels: 96
28 | activation: ReLU6
29 | stacked_convs: 2
30 | share_cls_reg: True
31 | octave_base_scale: 5
32 | scales_per_octave: 1
33 | strides: [8, 16, 32]
34 | reg_max: 7
35 | norm_cfg:
36 | type: BN
37 | loss:
38 | loss_qfl:
39 | name: QualityFocalLoss
40 | use_sigmoid: True
41 | beta: 2.0
42 | loss_weight: 1.0
43 | loss_dfl:
44 | name: DistributionFocalLoss
45 | loss_weight: 0.25
46 | loss_bbox:
47 | name: GIoULoss
48 | loss_weight: 2.0
49 | data:
50 | train:
51 | name: coco
52 | img_path: /coco/train2017
53 | ann_path: /coco/annotations/instances_train2017.json
54 | input_size: [320,320] #[w,h]
55 | keep_ratio: True
56 | pipeline:
57 | perspective: 0.0
58 | scale: [0.6, 1.4]
59 | stretch: [[1, 1], [1, 1]]
60 | rotation: 0
61 | shear: 0
62 | translate: 0.2
63 | flip: 0.5
64 | brightness: 0.2
65 | contrast: [0.6, 1.4]
66 | saturation: [0.5, 1.2]
67 | normalize: [[127.0, 127.0, 127.0], [128.0, 128.0, 128.0]]
68 | val:
69 | name: coco
70 | img_path: /coco/val2017
71 | ann_path: /coco/annotations/instances_val2017.json
72 | input_size: [320,320] #[w,h]
73 | keep_ratio: True
74 | pipeline:
75 | normalize: [[127.0, 127.0, 127.0], [128.0, 128.0, 128.0]]
76 | device:
77 | gpu_ids: [0]
78 | workers_per_gpu: 12
79 | batchsize_per_gpu: 150
80 | schedule:
81 | # resume:
82 | # load_model: YOUR_MODEL_PATH
83 | optimizer:
84 | name: SGD
85 | lr: 0.15
86 | momentum: 0.9
87 | weight_decay: 0.0001
88 | warmup:
89 | name: linear
90 | steps: 500
91 | ratio: 0.01
92 | total_epochs: 190
93 | lr_schedule:
94 | name: MultiStepLR
95 | milestones: [140,170,180,185]
96 | gamma: 0.1
97 | val_intervals: 1
98 | evaluator:
99 | name: CocoDetectionEvaluator
100 | save_key: mAP
101 |
102 | log:
103 | interval: 10
104 |
105 | class_names: ['person', 'bicycle', 'car', 'motorcycle', 'airplane', 'bus',
106 | 'train', 'truck', 'boat', 'traffic_light', 'fire_hydrant',
107 | 'stop_sign', 'parking_meter', 'bench', 'bird', 'cat', 'dog',
108 | 'horse', 'sheep', 'cow', 'elephant', 'bear', 'zebra', 'giraffe',
109 | 'backpack', 'umbrella', 'handbag', 'tie', 'suitcase', 'frisbee',
110 | 'skis', 'snowboard', 'sports_ball', 'kite', 'baseball_bat',
111 | 'baseball_glove', 'skateboard', 'surfboard', 'tennis_racket',
112 | 'bottle', 'wine_glass', 'cup', 'fork', 'knife', 'spoon', 'bowl',
113 | 'banana', 'apple', 'sandwich', 'orange', 'broccoli', 'carrot',
114 | 'hot_dog', 'pizza', 'donut', 'cake', 'chair', 'couch',
115 | 'potted_plant', 'bed', 'dining_table', 'toilet', 'tv', 'laptop',
116 | 'mouse', 'remote', 'keyboard', 'cell_phone', 'microwave',
117 | 'oven', 'toaster', 'sink', 'refrigerator', 'book', 'clock',
118 | 'vase', 'scissors', 'teddy_bear', 'hair_drier', 'toothbrush']
119 |
--------------------------------------------------------------------------------
/config/EfficientNet-Lite/nanodet-EfficientNet-Lite1_416.yml:
--------------------------------------------------------------------------------
1 | # nanodet-EfficientNet-Lite1_416
2 | # COCO mAP(0.5:0.95) = 0.303
3 | # AP_50 = 0.471
4 | # AP_75 = 0.313
5 | # AP_small = 0.122
6 | # AP_m = 0.321
7 | # AP_l = 0.432
8 | save_dir: workspace/efficient1_416_SGD
9 | model:
10 | arch:
11 | name: OneStageDetector
12 | backbone:
13 | name: EfficientNetLite
14 | model_name: efficientnet_lite1
15 | out_stages: [2,4,6]
16 | activation: ReLU6
17 | pretrain: True
18 | fpn:
19 | name: PAN
20 | in_channels: [40, 112, 320]
21 | out_channels: 128
22 | start_level: 0
23 | num_outs: 3
24 | head:
25 | name: NanoDetHead
26 | num_classes: 80
27 | input_channel: 128
28 | feat_channels: 128
29 | stacked_convs: 3
30 | activation: ReLU6
31 | share_cls_reg: True
32 | octave_base_scale: 8
33 | scales_per_octave: 1
34 | strides: [8, 16, 32]
35 | reg_max: 10
36 | norm_cfg:
37 | type: BN
38 | loss:
39 | loss_qfl:
40 | name: QualityFocalLoss
41 | use_sigmoid: True
42 | beta: 2.0
43 | loss_weight: 1.0
44 | loss_dfl:
45 | name: DistributionFocalLoss
46 | loss_weight: 0.25
47 | loss_bbox:
48 | name: GIoULoss
49 | loss_weight: 2.0
50 | data:
51 | train:
52 | name: coco
53 | img_path: /coco/train2017
54 | ann_path: /coco/annotations/instances_train2017.json
55 | input_size: [416,416] #[w,h]
56 | keep_ratio: True
57 | pipeline:
58 | perspective: 0.0
59 | scale: [0.5, 1.5]
60 | stretch: [[1, 1], [1, 1]]
61 | rotation: 0
62 | shear: 0
63 | translate: 0.2
64 | flip: 0.5
65 | brightness: 0.2
66 | contrast: [0.6, 1.4]
67 | saturation: [0.5, 1.2]
68 | normalize: [[127.0, 127.0, 127.0], [128.0, 128.0, 128.0]]
69 | val:
70 | name: coco
71 | img_path: /coco/val2017
72 | ann_path: /coco/annotations/instances_val2017.json
73 | input_size: [416,416] #[w,h]
74 | keep_ratio: True
75 | pipeline:
76 | normalize: [[127.0, 127.0, 127.0], [128.0, 128.0, 128.0]]
77 | device:
78 | gpu_ids: [0]
79 | workers_per_gpu: 12
80 | batchsize_per_gpu: 100
81 | schedule:
82 | # resume:
83 | # load_model: YOUR_MODEL_PATH
84 | optimizer:
85 | name: SGD
86 | lr: 0.07
87 | momentum: 0.9
88 | weight_decay: 0.0001
89 | warmup:
90 | name: linear
91 | steps: 500
92 | ratio: 0.01
93 | total_epochs: 170
94 | lr_schedule:
95 | name: MultiStepLR
96 | milestones: [130,150,160,165]
97 | gamma: 0.1
98 | val_intervals: 5
99 | evaluator:
100 | name: CocoDetectionEvaluator
101 | save_key: mAP
102 |
103 | log:
104 | interval: 10
105 |
106 | class_names: ['person', 'bicycle', 'car', 'motorcycle', 'airplane', 'bus',
107 | 'train', 'truck', 'boat', 'traffic_light', 'fire_hydrant',
108 | 'stop_sign', 'parking_meter', 'bench', 'bird', 'cat', 'dog',
109 | 'horse', 'sheep', 'cow', 'elephant', 'bear', 'zebra', 'giraffe',
110 | 'backpack', 'umbrella', 'handbag', 'tie', 'suitcase', 'frisbee',
111 | 'skis', 'snowboard', 'sports_ball', 'kite', 'baseball_bat',
112 | 'baseball_glove', 'skateboard', 'surfboard', 'tennis_racket',
113 | 'bottle', 'wine_glass', 'cup', 'fork', 'knife', 'spoon', 'bowl',
114 | 'banana', 'apple', 'sandwich', 'orange', 'broccoli', 'carrot',
115 | 'hot_dog', 'pizza', 'donut', 'cake', 'chair', 'couch',
116 | 'potted_plant', 'bed', 'dining_table', 'toilet', 'tv', 'laptop',
117 | 'mouse', 'remote', 'keyboard', 'cell_phone', 'microwave',
118 | 'oven', 'toaster', 'sink', 'refrigerator', 'book', 'clock',
119 | 'vase', 'scissors', 'teddy_bear', 'hair_drier', 'toothbrush']
120 |
--------------------------------------------------------------------------------
/config/EfficientNet-Lite/nanodet-EfficientNet-Lite2_512.yml:
--------------------------------------------------------------------------------
1 | # nanodet-EfficientNet-Lite2_512
2 | # COCO mAP(0.5:0.95) = 0.326
3 | # AP_50 = 0.501
4 | # AP_75 = 0.344
5 | # AP_small = 0.152
6 | # AP_m = 0.342
7 | # AP_l = 0.481
8 | save_dir: workspace/efficientlite2_512
9 | model:
10 | arch:
11 | name: OneStageDetector
12 | backbone:
13 | name: EfficientNetLite
14 | model_name: efficientnet_lite2
15 | out_stages: [2,4,6]
16 | activation: ReLU6
17 | pretrain: True
18 | fpn:
19 | name: PAN
20 | in_channels: [48, 120, 352]
21 | out_channels: 128
22 | start_level: 0
23 | num_outs: 3
24 | head:
25 | name: NanoDetHead
26 | num_classes: 80
27 | input_channel: 128
28 | feat_channels: 128
29 | stacked_convs: 4
30 | activation: ReLU6
31 | share_cls_reg: True
32 | octave_base_scale: 5
33 | scales_per_octave: 1
34 | strides: [8, 16, 32]
35 | reg_max: 10
36 | norm_cfg:
37 | type: BN
38 | loss:
39 | loss_qfl:
40 | name: QualityFocalLoss
41 | use_sigmoid: True
42 | beta: 2.0
43 | loss_weight: 1.0
44 | loss_dfl:
45 | name: DistributionFocalLoss
46 | loss_weight: 0.25
47 | loss_bbox:
48 | name: GIoULoss
49 | loss_weight: 2.0
50 | data:
51 | train:
52 | name: coco
53 | img_path: /coco/train2017
54 | ann_path: /coco/annotations/instances_train2017.json
55 | input_size: [512,512] #[w,h]
56 | keep_ratio: True
57 | pipeline:
58 | perspective: 0.0
59 | scale: [0.5, 1.5]
60 | stretch: [[1, 1], [1, 1]]
61 | rotation: 0
62 | shear: 0
63 | translate: 0.2
64 | flip: 0.5
65 | brightness: 0.2
66 | contrast: [0.6, 1.4]
67 | saturation: [0.5, 1.2]
68 | normalize: [[127.0, 127.0, 127.0], [128.0, 128.0, 128.0]]
69 | val:
70 | name: coco
71 | img_path: /coco/val2017
72 | ann_path: /coco/annotations/instances_val2017.json
73 | input_size: [512,512] #[w,h]
74 | keep_ratio: True
75 | pipeline:
76 | normalize: [[127.0, 127.0, 127.0], [128.0, 128.0, 128.0]]
77 | device:
78 | gpu_ids: [0]
79 | workers_per_gpu: 12
80 | batchsize_per_gpu: 60
81 | schedule:
82 | # resume:
83 | # load_model: YOUR_MODEL_PATH
84 | optimizer:
85 | name: SGD
86 | lr: 0.06
87 | momentum: 0.9
88 | weight_decay: 0.0001
89 | warmup:
90 | name: linear
91 | steps: 300
92 | ratio: 0.1
93 | total_epochs: 135
94 | lr_schedule:
95 | name: MultiStepLR
96 | milestones: [90,110,120,130]
97 | gamma: 0.1
98 | val_intervals: 5
99 | evaluator:
100 | name: CocoDetectionEvaluator
101 | save_key: mAP
102 |
103 | log:
104 | interval: 10
105 |
106 | class_names: ['person', 'bicycle', 'car', 'motorcycle', 'airplane', 'bus',
107 | 'train', 'truck', 'boat', 'traffic_light', 'fire_hydrant',
108 | 'stop_sign', 'parking_meter', 'bench', 'bird', 'cat', 'dog',
109 | 'horse', 'sheep', 'cow', 'elephant', 'bear', 'zebra', 'giraffe',
110 | 'backpack', 'umbrella', 'handbag', 'tie', 'suitcase', 'frisbee',
111 | 'skis', 'snowboard', 'sports_ball', 'kite', 'baseball_bat',
112 | 'baseball_glove', 'skateboard', 'surfboard', 'tennis_racket',
113 | 'bottle', 'wine_glass', 'cup', 'fork', 'knife', 'spoon', 'bowl',
114 | 'banana', 'apple', 'sandwich', 'orange', 'broccoli', 'carrot',
115 | 'hot_dog', 'pizza', 'donut', 'cake', 'chair', 'couch',
116 | 'potted_plant', 'bed', 'dining_table', 'toilet', 'tv', 'laptop',
117 | 'mouse', 'remote', 'keyboard', 'cell_phone', 'microwave',
118 | 'oven', 'toaster', 'sink', 'refrigerator', 'book', 'clock',
119 | 'vase', 'scissors', 'teddy_bear', 'hair_drier', 'toothbrush']
120 |
--------------------------------------------------------------------------------
/config/RepVGG/nanodet-RepVGG-A0_416.yml:
--------------------------------------------------------------------------------
1 | # nanodet-RepVGG-A0_416
2 | save_dir: workspace/RepVGG-A0-416
3 | model:
4 | arch:
5 | name: OneStageDetector
6 | backbone:
7 | name: RepVGG
8 | arch: A0
9 | out_stages: [2,3,4]
10 | activation: ReLU
11 | last_channel: 512
12 | deploy: False
13 | fpn:
14 | name: PAN
15 | in_channels: [96, 192, 512]
16 | out_channels: 128
17 | start_level: 0
18 | num_outs: 3
19 | head:
20 | name: NanoDetHead
21 | num_classes: 80
22 | conv_type: Conv
23 | input_channel: 128
24 | feat_channels: 128
25 | stacked_convs: 2
26 | activation: ReLU
27 | share_cls_reg: True
28 | octave_base_scale: 8
29 | scales_per_octave: 1
30 | strides: [8, 16, 32]
31 | reg_max: 10
32 | norm_cfg:
33 | type: BN
34 | loss:
35 | loss_qfl:
36 | name: QualityFocalLoss
37 | use_sigmoid: True
38 | beta: 2.0
39 | loss_weight: 1.0
40 | loss_dfl:
41 | name: DistributionFocalLoss
42 | loss_weight: 0.25
43 | loss_bbox:
44 | name: GIoULoss
45 | loss_weight: 2.0
46 | data:
47 | train:
48 | name: coco
49 | img_path: /coco/train2017
50 | ann_path: /coco/annotations/instances_train2017.json
51 | input_size: [416,416] #[w,h]
52 | keep_ratio: True
53 | pipeline:
54 | perspective: 0.0
55 | scale: [0.5, 1.5]
56 | stretch: [[1, 1], [1, 1]]
57 | rotation: 0
58 | shear: 0
59 | translate: 0.2
60 | flip: 0.5
61 | brightness: 0.2
62 | contrast: [0.6, 1.4]
63 | saturation: [0.5, 1.2]
64 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
65 | val:
66 | name: coco
67 | img_path: /coco/val2017
68 | ann_path: /coco/annotations/instances_val2017.json
69 | input_size: [416,416] #[w,h]
70 | keep_ratio: True
71 | pipeline:
72 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
73 | device:
74 | gpu_ids: [0]
75 | workers_per_gpu: 1
76 | batchsize_per_gpu: 100
77 | schedule:
78 | # resume:
79 | # load_model: YOUR_MODEL_PATH
80 | optimizer:
81 | name: SGD
82 | lr: 0.07
83 | momentum: 0.9
84 | weight_decay: 0.0001
85 | warmup:
86 | name: linear
87 | steps: 500
88 | ratio: 0.01
89 | total_epochs: 170
90 | lr_schedule:
91 | name: MultiStepLR
92 | milestones: [130,150,160,165]
93 | gamma: 0.1
94 | val_intervals: 5
95 | evaluator:
96 | name: CocoDetectionEvaluator
97 | save_key: mAP
98 |
99 | log:
100 | interval: 10
101 |
102 | class_names: ['person', 'bicycle', 'car', 'motorcycle', 'airplane', 'bus',
103 | 'train', 'truck', 'boat', 'traffic_light', 'fire_hydrant',
104 | 'stop_sign', 'parking_meter', 'bench', 'bird', 'cat', 'dog',
105 | 'horse', 'sheep', 'cow', 'elephant', 'bear', 'zebra', 'giraffe',
106 | 'backpack', 'umbrella', 'handbag', 'tie', 'suitcase', 'frisbee',
107 | 'skis', 'snowboard', 'sports_ball', 'kite', 'baseball_bat',
108 | 'baseball_glove', 'skateboard', 'surfboard', 'tennis_racket',
109 | 'bottle', 'wine_glass', 'cup', 'fork', 'knife', 'spoon', 'bowl',
110 | 'banana', 'apple', 'sandwich', 'orange', 'broccoli', 'carrot',
111 | 'hot_dog', 'pizza', 'donut', 'cake', 'chair', 'couch',
112 | 'potted_plant', 'bed', 'dining_table', 'toilet', 'tv', 'laptop',
113 | 'mouse', 'remote', 'keyboard', 'cell_phone', 'microwave',
114 | 'oven', 'toaster', 'sink', 'refrigerator', 'book', 'clock',
115 | 'vase', 'scissors', 'teddy_bear', 'hair_drier', 'toothbrush']
116 |
--------------------------------------------------------------------------------
/config/Transformer/nanodet-t.yml:
--------------------------------------------------------------------------------
1 | # NanoDet-m with transformer attention
2 | # COCO mAP(0.5:0.95) = 0.217
3 | # AP_50 = 0.363
4 | # AP_75 = 0.218
5 | # AP_small = 0.069
6 | # AP_m = 0.214
7 | # AP_l = 0.364
8 |
9 | save_dir: workspace/nanodet_t
10 | model:
11 | arch:
12 | name: OneStageDetector
13 | backbone:
14 | name: ShuffleNetV2
15 | model_size: 1.0x
16 | out_stages: [2,3,4]
17 | activation: LeakyReLU
18 | fpn:
19 | name: TAN # transformer attention network
20 | in_channels: [116, 232, 464]
21 | out_channels: 128
22 | feature_hw: [20,20] # size for position embedding
23 | num_heads: 8
24 | num_encoders: 1
25 | mlp_ratio: 4
26 | dropout_ratio: 0.1
27 | activation: LeakyReLU
28 | head:
29 | name: NanoDetHead
30 | num_classes: 80
31 | input_channel: 128
32 | feat_channels: 128
33 | stacked_convs: 2
34 | share_cls_reg: True
35 | octave_base_scale: 5
36 | scales_per_octave: 1
37 | strides: [8, 16, 32]
38 | reg_max: 7
39 | norm_cfg:
40 | type: BN
41 | loss:
42 | loss_qfl:
43 | name: QualityFocalLoss
44 | use_sigmoid: True
45 | beta: 2.0
46 | loss_weight: 1.0
47 | loss_dfl:
48 | name: DistributionFocalLoss
49 | loss_weight: 0.25
50 | loss_bbox:
51 | name: GIoULoss
52 | loss_weight: 2.0
53 | data:
54 | train:
55 | name: coco
56 | img_path: coco/train2017
57 | ann_path: coco/annotations/instances_train2017.json
58 | input_size: [320,320] #[w,h]
59 | keep_ratio: True
60 | pipeline:
61 | perspective: 0.0
62 | scale: [0.6, 1.4]
63 | stretch: [[1, 1], [1, 1]]
64 | rotation: 0
65 | shear: 0
66 | translate: 0.2
67 | flip: 0.5
68 | brightness: 0.2
69 | contrast: [0.8, 1.2]
70 | saturation: [0.8, 1.2]
71 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
72 | val:
73 | name: coco
74 | img_path: coco/val2017
75 | ann_path: coco/annotations/instances_val2017.json
76 | input_size: [320,320] #[w,h]
77 | keep_ratio: True
78 | pipeline:
79 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
80 | device:
81 | gpu_ids: [0]
82 | workers_per_gpu: 8
83 | batchsize_per_gpu: 160
84 | schedule:
85 | resume:
86 | # load_model: YOUR_MODEL_PATH
87 | optimizer:
88 | name: SGD
89 | lr: 0.14
90 | momentum: 0.9
91 | weight_decay: 0.0001
92 | warmup:
93 | name: linear
94 | steps: 500
95 | ratio: 0.01
96 | total_epochs: 190
97 | lr_schedule:
98 | name: MultiStepLR
99 | milestones: [140,170,180,185]
100 | gamma: 0.1
101 | val_intervals: 10
102 | evaluator:
103 | name: CocoDetectionEvaluator
104 | save_key: mAP
105 |
106 | log:
107 | interval: 10
108 |
109 | class_names: ['person', 'bicycle', 'car', 'motorcycle', 'airplane', 'bus',
110 | 'train', 'truck', 'boat', 'traffic_light', 'fire_hydrant',
111 | 'stop_sign', 'parking_meter', 'bench', 'bird', 'cat', 'dog',
112 | 'horse', 'sheep', 'cow', 'elephant', 'bear', 'zebra', 'giraffe',
113 | 'backpack', 'umbrella', 'handbag', 'tie', 'suitcase', 'frisbee',
114 | 'skis', 'snowboard', 'sports_ball', 'kite', 'baseball_bat',
115 | 'baseball_glove', 'skateboard', 'surfboard', 'tennis_racket',
116 | 'bottle', 'wine_glass', 'cup', 'fork', 'knife', 'spoon', 'bowl',
117 | 'banana', 'apple', 'sandwich', 'orange', 'broccoli', 'carrot',
118 | 'hot_dog', 'pizza', 'donut', 'cake', 'chair', 'couch',
119 | 'potted_plant', 'bed', 'dining_table', 'toilet', 'tv', 'laptop',
120 | 'mouse', 'remote', 'keyboard', 'cell_phone', 'microwave',
121 | 'oven', 'toaster', 'sink', 'refrigerator', 'book', 'clock',
122 | 'vase', 'scissors', 'teddy_bear', 'hair_drier', 'toothbrush']
123 |
--------------------------------------------------------------------------------
/config/nanodet-g-mod.yml:
--------------------------------------------------------------------------------
1 | # nanodet-g-mod: NanoDet-g-416 adapted to a custom 18-class dataset
2 | # NanoDet-g-416 is designed for edge NPU, GPU or TPU with high parallel computing power but low memory bandwidth
3 | # Base model: COCO mAP(0.5:0.95) = 22.9
4 | # Base model: Flops = 4.2B, Params = 3.8M
5 | # COCO pre-trained weight link: https://drive.google.com/file/d/10uW7oqZKw231l_tr4C1bJWkbCXgBf7av/view?usp=sharing
6 | save_dir: workspace/rmcv1
7 | model:
8 | arch:
9 | name: OneStageDetector
10 | backbone:
11 | name: CustomCspNet
12 | net_cfg: [[ 'Conv', 3, 32, 3, 2], # 1/2
13 | [ 'MaxPool', 3, 2 ], # 1/4
14 | [ 'CspBlock', 32, 1, 3, 1 ], # 1/4
15 | [ 'CspBlock', 64, 2, 3, 2 ], # 1/8
16 | [ 'CspBlock', 128, 2, 3, 2 ], # 1/16
17 | [ 'CspBlock', 256, 3, 3, 2 ]] # 1/32
18 | out_stages: [3,4,5]
19 | activation: LeakyReLU
20 | fpn:
21 | name: PAN
22 | in_channels: [128, 256, 512]
23 | out_channels: 128
24 | start_level: 0
25 | num_outs: 3
26 | head:
27 | name: NanoDetHead
28 | num_classes: 18
29 | conv_type: Conv
30 | activation: LeakyReLU
31 | input_channel: 128
32 | feat_channels: 128
33 | stacked_convs: 1
34 | share_cls_reg: True
35 | octave_base_scale: 8
36 | scales_per_octave: 1
37 | strides: [8, 16, 32]
38 | reg_max: 10
39 | norm_cfg:
40 | type: BN
41 | loss:
42 | loss_qfl:
43 | name: QualityFocalLoss
44 | use_sigmoid: True
45 | beta: 2.0
46 | loss_weight: 1.0
47 | loss_dfl:
48 | name: DistributionFocalLoss
49 | loss_weight: 0.25
50 | loss_bbox:
51 | name: GIoULoss
52 | loss_weight: 2.0
53 | data:
54 | train:
55 | name: coco
56 | img_path: ../rmcv_yolo/images
57 | ann_path: ../rmcv_yolo/annotations/train.json
58 | input_size: [416,416] #[w,h]
59 | keep_ratio: True
60 | load_mosaic: True
61 | mixup: True
62 | pipeline:
63 | perspective: 0.0002
64 | scale: [0.5, 1.5]
65 | stretch: [[1, 1], [1, 1]]
66 | rotation: 5
67 | shear: 3
68 | gamma: [0.5,1.7]
69 | translate: 0.1
70 | flip: 0.5
71 | hsv_h: 0.0138
72 | hsv_s: 0.464
73 | hsv_v: 0.464
74 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
75 | val:
76 | name: coco
77 | img_path: ../rmcv_yolo/images
78 | ann_path: ../rmcv_yolo/annotations/val.json
79 | input_size: [416,416] #[w,h]
80 | keep_ratio: True
81 | pipeline:
82 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
83 | device:
84 | gpu_ids: [0]
85 | workers_per_gpu: 4
86 | batchsize_per_gpu: 128
87 | schedule:
88 | # resume:
89 | load_model: model_0.01.ckpt
90 | optimizer:
91 | name: SGD
92 | lr: 0.003
93 | momentum: 0.843
94 | weight_decay: 0.00036
95 | warmup:
96 | name: linear
97 | steps: 500
98 | ratio: 0.01
99 | total_epochs: 50
100 | lr_schedule:
101 | name: MultiStepLR
102 | milestones: [30,45]
103 | gamma: 0.1
104 | val_intervals: 1
105 | evaluator:
106 | name: CocoDetectionEvaluator
107 | save_key: mAP
108 |
109 | log:
110 | interval: 10
111 |
112 | class_names: ['R1', 'B1', 'R2', 'B2', 'R3', 'B3', 'R4', 'B4','R5', 'B5', 'R7', 'B7', 'R10', 'B10', 'R11', 'B11', 'RE', 'BE']
113 |
114 |
--------------------------------------------------------------------------------
/config/nanodet-m-416.yml:
--------------------------------------------------------------------------------
1 | #nanodet-m-416
2 | # COCO mAP(0.5:0.95) = 0.235
3 | # AP_50 = 0.384
4 | # AP_75 = 0.242
5 | # AP_small = 0.082
6 | # AP_m = 0.240
7 | # AP_l = 0.375
8 | save_dir: workspace/nanodet_m_416
9 | model:
10 | arch:
11 | name: OneStageDetector
12 | backbone:
13 | name: ShuffleNetV2
14 | model_size: 1.0x
15 | out_stages: [2,3,4]
16 | activation: LeakyReLU
17 | fpn:
18 | name: PAN
19 | in_channels: [116, 232, 464]
20 | out_channels: 96
21 | start_level: 0
22 | num_outs: 3
23 | head:
24 | name: NanoDetHead
25 | num_classes: 80
26 | input_channel: 96
27 | feat_channels: 96
28 | stacked_convs: 2
29 | share_cls_reg: True
30 | octave_base_scale: 5
31 | scales_per_octave: 1
32 | strides: [8, 16, 32]
33 | reg_max: 7
34 | norm_cfg:
35 | type: BN
36 | loss:
37 | loss_qfl:
38 | name: QualityFocalLoss
39 | use_sigmoid: True
40 | beta: 2.0
41 | loss_weight: 1.0
42 | loss_dfl:
43 | name: DistributionFocalLoss
44 | loss_weight: 0.25
45 | loss_bbox:
46 | name: GIoULoss
47 | loss_weight: 2.0
48 | data:
49 | train:
50 | name: coco
51 | img_path: coco/train2017
52 | ann_path: coco/annotations/instances_train2017.json
53 | input_size: [416,416] #[w,h]
54 | keep_ratio: True
55 | pipeline:
56 | perspective: 0.0
57 | scale: [0.5, 1.4]
58 | stretch: [[1, 1], [1, 1]]
59 | rotation: 0
60 | shear: 0
61 | translate: 0.2
62 | flip: 0.5
63 | brightness: 0.2
64 | contrast: [0.6, 1.4]
65 | saturation: [0.5, 1.2]
66 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
67 | val:
68 | name: coco
69 | img_path: coco/val2017
70 | ann_path: coco/annotations/instances_val2017.json
71 | input_size: [416,416] #[w,h]
72 | keep_ratio: True
73 | pipeline:
74 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
75 | device:
76 | gpu_ids: [0]
77 | workers_per_gpu: 8
78 | batchsize_per_gpu: 192
79 | schedule:
80 | # resume:
81 | # load_model: YOUR_MODEL_PATH
82 | optimizer:
83 | name: SGD
84 | lr: 0.14
85 | momentum: 0.9
86 | weight_decay: 0.0001
87 | warmup:
88 | name: linear
89 | steps: 300
90 | ratio: 0.1
91 | total_epochs: 280
92 | lr_schedule:
93 | name: MultiStepLR
94 | milestones: [240,260,275]
95 | gamma: 0.1
96 | val_intervals: 10
97 | evaluator:
98 | name: CocoDetectionEvaluator
99 | save_key: mAP
100 |
101 | log:
102 | interval: 10
103 |
104 | class_names: ['person', 'bicycle', 'car', 'motorcycle', 'airplane', 'bus',
105 | 'train', 'truck', 'boat', 'traffic_light', 'fire_hydrant',
106 | 'stop_sign', 'parking_meter', 'bench', 'bird', 'cat', 'dog',
107 | 'horse', 'sheep', 'cow', 'elephant', 'bear', 'zebra', 'giraffe',
108 | 'backpack', 'umbrella', 'handbag', 'tie', 'suitcase', 'frisbee',
109 | 'skis', 'snowboard', 'sports_ball', 'kite', 'baseball_bat',
110 | 'baseball_glove', 'skateboard', 'surfboard', 'tennis_racket',
111 | 'bottle', 'wine_glass', 'cup', 'fork', 'knife', 'spoon', 'bowl',
112 | 'banana', 'apple', 'sandwich', 'orange', 'broccoli', 'carrot',
113 | 'hot_dog', 'pizza', 'donut', 'cake', 'chair', 'couch',
114 | 'potted_plant', 'bed', 'dining_table', 'toilet', 'tv', 'laptop',
115 | 'mouse', 'remote', 'keyboard', 'cell_phone', 'microwave',
116 | 'oven', 'toaster', 'sink', 'refrigerator', 'book', 'clock',
117 | 'vase', 'scissors', 'teddy_bear', 'hair_drier', 'toothbrush']
118 |
--------------------------------------------------------------------------------
/config/nanodet-m-640-mod.yml:
--------------------------------------------------------------------------------
1 | #nanodet-m-640-mod (based on nanodet-m-416; the COCO metrics below are those of the base 416 config)
2 | # COCO mAP(0.5:0.95) = 0.235
3 | # AP_50 = 0.384
4 | # AP_75 = 0.242
5 | # AP_small = 0.082
6 | # AP_m = 0.240
7 | # AP_l = 0.375
8 | save_dir: workspace/rmcv_m
9 | model:
10 | arch:
11 | name: OneStageDetector
12 | backbone:
13 | name: ShuffleNetV2
14 | model_size: 1.0x
15 | out_stages: [2,3,4]
16 | activation: LeakyReLU
17 | fpn:
18 | name: PAN
19 | in_channels: [116, 232, 464]
20 | out_channels: 96
21 | start_level: 0
22 | num_outs: 3
23 | head:
24 | name: NanoDetHead
25 | num_classes: 18
26 | input_channel: 96
27 | feat_channels: 96
28 | stacked_convs: 2
29 | share_cls_reg: True
30 | octave_base_scale: 5
31 | scales_per_octave: 1
32 | strides: [8, 16, 32]
33 | reg_max: 7
34 | norm_cfg:
35 | type: BN
36 | loss:
37 | loss_qfl:
38 | name: QualityFocalLoss
39 | use_sigmoid: True
40 | beta: 2.0
41 | loss_weight: 1.0
42 | loss_dfl:
43 | name: DistributionFocalLoss
44 | loss_weight: 0.25
45 | loss_bbox:
46 | name: GIoULoss
47 | loss_weight: 2.0
48 | data:
49 | train:
50 | name: coco
51 | img_path: ../rmcv_yolo/images
52 | ann_path: ../rmcv_yolo/annotations/train.json
53 | input_size: [640,640] #[w,h]
54 | keep_ratio: True
55 | mixup: True
56 | load_mosaic: False
57 | pipeline:
58 | perspective: 0.0002
59 | scale: [0.5, 1.4]
60 | stretch: [[1, 1], [1, 1]]
61 | rotation: 5
62 | shear: 3
63 | translate: 0.1
64 | flip: 0.5
65 | hsv_h: 0.0138
66 | hsv_s: 0.464
67 | hsv_v: 0.464
68 | val:
69 | name: coco
70 | img_path: ../rmcv_yolo/images
71 | ann_path: ../rmcv_yolo/annotations/val.json
72 | input_size: [640,640] #[w,h]
73 | keep_ratio: True
74 | pipeline:
75 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
76 | device:
77 | gpu_ids: [0]
78 | workers_per_gpu: 8
79 | batchsize_per_gpu: 32
80 | schedule:
81 | resume:
82 | # load_model: nanodet_m.ckpt
83 | optimizer:
84 | name: SGD
85 | lr: 0.01
86 | momentum: 0.9
87 | weight_decay: 0.0001
88 | warmup:
89 | name: linear
90 | steps: 300
91 | ratio: 0.01
92 | total_epochs: 100
93 | lr_schedule:
94 | name: MultiStepLR
95 | milestones: [30,60,90]
96 | gamma: 0.1
97 | val_intervals: 2
98 | evaluator:
99 | name: CocoDetectionEvaluator
100 | save_key: mAP
101 |
102 | log:
103 | interval: 10
104 |
105 | class_names: ['R1', 'B1', 'R2', 'B2', 'R3', 'B3', 'R4', 'B4','R5', 'B5', 'R7', 'B7', 'R10', 'B10', 'R11', 'B11', 'RE', 'BE']
106 |
--------------------------------------------------------------------------------
/config/nanodet-m.yml:
--------------------------------------------------------------------------------
1 | #Config File example
2 | save_dir: workspace/nanodet_m
3 | model:
4 | arch:
5 | name: OneStageDetector
6 | backbone:
7 | name: ShuffleNetV2
8 | model_size: 1.0x
9 | out_stages: [2,3,4]
10 | activation: LeakyReLU
11 | fpn:
12 | name: PAN
13 | in_channels: [116, 232, 464]
14 | out_channels: 96
15 | start_level: 0
16 | num_outs: 3
17 | head:
18 | name: NanoDetHead
19 | num_classes: 80
20 | input_channel: 96
21 | feat_channels: 96
22 | stacked_convs: 2
23 | share_cls_reg: True
24 | octave_base_scale: 5
25 | scales_per_octave: 1
26 | strides: [8, 16, 32]
27 | reg_max: 7
28 | norm_cfg:
29 | type: BN
30 | loss:
31 | loss_qfl:
32 | name: QualityFocalLoss
33 | use_sigmoid: True
34 | beta: 2.0
35 | loss_weight: 1.0
36 | loss_dfl:
37 | name: DistributionFocalLoss
38 | loss_weight: 0.25
39 | loss_bbox:
40 | name: GIoULoss
41 | loss_weight: 2.0
42 | data:
43 | train:
44 | name: coco
45 | img_path: coco/train2017
46 | ann_path: coco/annotations/instances_train2017.json
47 | input_size: [320,320] #[w,h]
48 | keep_ratio: True
49 | pipeline:
50 | perspective: 0.0
51 | scale: [0.6, 1.4]
52 | stretch: [[1, 1], [1, 1]]
53 | rotation: 0
54 | shear: 0
55 | translate: 0.2
56 | flip: 0.5
57 | brightness: 0.2
58 | contrast: [0.8, 1.2]
59 | saturation: [0.8, 1.2]
60 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
61 | val:
62 | name: coco
63 | img_path: coco/val2017
64 | ann_path: coco/annotations/instances_val2017.json
65 | input_size: [320,320] #[w,h]
66 | keep_ratio: True
67 | pipeline:
68 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
69 | device:
70 | gpu_ids: [0]
71 | workers_per_gpu: 12
72 | batchsize_per_gpu: 160
73 | schedule:
74 | # resume:
75 | # load_model: YOUR_MODEL_PATH
76 | optimizer:
77 | name: SGD
78 | lr: 0.14
79 | momentum: 0.9
80 | weight_decay: 0.0001
81 | warmup:
82 | name: linear
83 | steps: 300
84 | ratio: 0.1
85 | total_epochs: 190
86 | lr_schedule:
87 | name: MultiStepLR
88 | milestones: [130,160,175,185]
89 | gamma: 0.1
90 | val_intervals: 10
91 | evaluator:
92 | name: CocoDetectionEvaluator
93 | save_key: mAP
94 |
95 | log:
96 | interval: 10
97 |
98 | class_names: ['person', 'bicycle', 'car', 'motorcycle', 'airplane', 'bus',
99 | 'train', 'truck', 'boat', 'traffic_light', 'fire_hydrant',
100 | 'stop_sign', 'parking_meter', 'bench', 'bird', 'cat', 'dog',
101 | 'horse', 'sheep', 'cow', 'elephant', 'bear', 'zebra', 'giraffe',
102 | 'backpack', 'umbrella', 'handbag', 'tie', 'suitcase', 'frisbee',
103 | 'skis', 'snowboard', 'sports_ball', 'kite', 'baseball_bat',
104 | 'baseball_glove', 'skateboard', 'surfboard', 'tennis_racket',
105 | 'bottle', 'wine_glass', 'cup', 'fork', 'knife', 'spoon', 'bowl',
106 | 'banana', 'apple', 'sandwich', 'orange', 'broccoli', 'carrot',
107 | 'hot_dog', 'pizza', 'donut', 'cake', 'chair', 'couch',
108 | 'potted_plant', 'bed', 'dining_table', 'toilet', 'tv', 'laptop',
109 | 'mouse', 'remote', 'keyboard', 'cell_phone', 'microwave',
110 | 'oven', 'toaster', 'sink', 'refrigerator', 'book', 'clock',
111 | 'vase', 'scissors', 'teddy_bear', 'hair_drier', 'toothbrush']
112 |
--------------------------------------------------------------------------------
/config/nanodet_custom_xml_dataset.yml:
--------------------------------------------------------------------------------
1 | #Config File example
2 | save_dir: workspace/nanodet_m
3 | model:
4 | arch:
5 | name: OneStageDetector
6 | backbone:
7 | name: ShuffleNetV2
8 | model_size: 1.0x
9 | out_stages: [2,3,4]
10 | activation: LeakyReLU
11 | fpn:
12 | name: PAN
13 | in_channels: [116, 232, 464]
14 | out_channels: 96
15 | start_level: 0
16 | num_outs: 3
17 | head:
18 | name: NanoDetHead
19 | num_classes: 80 #Please fill in the number of categories (do not include the background category)
20 | input_channel: 96
21 | feat_channels: 96
22 | stacked_convs: 2
23 | share_cls_reg: True
24 | octave_base_scale: 5
25 | scales_per_octave: 1
26 | strides: [8, 16, 32]
27 | reg_max: 7
28 | norm_cfg:
29 | type: BN
30 | loss:
31 | loss_qfl:
32 | name: QualityFocalLoss
33 | use_sigmoid: True
34 | beta: 2.0
35 | loss_weight: 1.0
36 | loss_dfl:
37 | name: DistributionFocalLoss
38 | loss_weight: 0.25
39 | loss_bbox:
40 | name: GIoULoss
41 | loss_weight: 2.0
42 |
43 | class_names: &class_names ['NAME1', 'NAME2', 'NAME3', 'NAME4', '...'] #Please fill in the category names (do not include the background category)
44 | data:
45 | train:
46 | name: xml_dataset
47 | class_names: *class_names
48 | img_path: TRAIN_IMAGE_FOLDER #Please fill in train image path
49 | ann_path: TRAIN_XML_FOLDER #Please fill in train xml path
50 | input_size: [320,320] #[w,h]
51 | keep_ratio: True
52 | pipeline:
53 | perspective: 0.0
54 | scale: [0.6, 1.4]
55 | stretch: [[1, 1], [1, 1]]
56 | rotation: 0
57 | shear: 0
58 | translate: 0.2
59 | flip: 0.5
60 | brightness: 0.2
61 | contrast: [0.8, 1.2]
62 | saturation: [0.8, 1.2]
63 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
64 | val:
65 | name: xml_dataset
66 | class_names: *class_names
67 | img_path: VAL_IMAGE_FOLDER #Please fill in val image path
68 | ann_path: VAL_XML_FOLDER #Please fill in val xml path
69 | input_size: [320,320] #[w,h]
70 | keep_ratio: True
71 | pipeline:
72 | normalize: [[103.53, 116.28, 123.675], [57.375, 57.12, 58.395]]
73 | device:
74 | gpu_ids: [0]
75 | workers_per_gpu: 12
76 | batchsize_per_gpu: 160
77 | schedule:
78 | # resume:
79 | # load_model: YOUR_MODEL_PATH
80 | optimizer:
81 | name: SGD
82 | lr: 0.14
83 | momentum: 0.9
84 | weight_decay: 0.0001
85 | warmup:
86 | name: linear
87 | steps: 300
88 | ratio: 0.1
89 | total_epochs: 190
90 | lr_schedule:
91 | name: MultiStepLR
92 | milestones: [130,160,175,185]
93 | gamma: 0.1
94 | val_intervals: 10
95 | evaluator:
96 | name: CocoDetectionEvaluator
97 | save_key: mAP
98 |
99 | log:
100 | interval: 10
101 |
--------------------------------------------------------------------------------
/demo_android_ncnn/.gitignore:
--------------------------------------------------------------------------------
1 | *.iml
2 | .gradle
3 | /local.properties
4 | /.idea
5 | /.idea/caches
6 | /.idea/libraries
7 | /.idea/modules.xml
8 | /.idea/workspace.xml
9 | /.idea/navEditor.xml
10 | /.idea/assetWizardSettings.xml
11 | .DS_Store
12 | /build
13 | /captures
14 | .externalNativeBuild
15 | .cxx
16 |
--------------------------------------------------------------------------------
/demo_android_ncnn/Android_demo.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/Android_demo.jpg
--------------------------------------------------------------------------------
/demo_android_ncnn/README.md:
--------------------------------------------------------------------------------
1 | # NanoDet NCNN Android Demo
2 |
3 | This repo is an Android object detection demo of NanoDet using
4 | [Tencent's NCNN framework](https://github.com/Tencent/ncnn).
5 |
6 | # Tutorial
7 |
8 | ## Step1.
9 | Download ncnn-android-vulkan.zip from ncnn repo or build ncnn-android from source.
10 |
11 | - [ncnn-android-vulkan.zip download link](https://github.com/Tencent/ncnn/releases)
12 |
13 | ## Step2.
14 | Unzip ncnn-android-vulkan.zip into demo_android_ncnn/app/src/main/cpp, or change the ncnn_DIR path in demo_android_ncnn/app/src/main/cpp/CMakeLists.txt to point at your own ncnn location.
15 |
16 | ## Step3.
17 | Copy the NanoDet ncnn model files (nanodet_m.param and nanodet_m.bin) from the models folder into demo_android_ncnn/app/src/main/assets.
18 |
19 | * [NanoDet ncnn model download link](https://github.com/RangiLyu/nanodet/releases/download/v0.0.1/nanodet_ncnn_model.zip)
20 |
21 | If you want to run yolov4-tiny and yolov5s, download them and also put them in demo_android_ncnn/app/src/main/assets.
22 |
23 | * [Yolov4 and v5 ncnn model download link](https://drive.google.com/file/d/1Qk_1fDvOcFmNppDnaMFW-xFpMgLDyeAs/view?usp=sharing)
24 |
25 | ## Step4.
26 | Open the demo_android_ncnn folder in Android Studio and build it.
27 |
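For reference, the demo's native code loads the assets copied in Step 3 through ncnn's AAssetManager overloads. A minimal sketch (it mirrors what the NanoDet constructor in this demo does; the helper name `create_nanodet` is made up for illustration and this is not the exact NanoDet.cpp code):

```cpp
#include <android/asset_manager_jni.h>
#include "net.h"  // ncnn

// Load nanodet_m.param / nanodet_m.bin from app/src/main/assets.
static ncnn::Net *create_nanodet(AAssetManager *mgr, bool useGPU) {
    auto *net = new ncnn::Net();
    // opt must be configured before load_param / load_model
    net->opt.use_vulkan_compute = useGPU && ncnn::get_gpu_count() > 0;
    net->opt.use_fp16_arithmetic = true;
    net->load_param(mgr, "nanodet_m.param");
    net->load_model(mgr, "nanodet_m.bin");
    return net;
}
```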
28 | # Screenshot
29 | ![](Android_demo.jpg)
30 |
31 |
32 | # Reference
33 |
34 | * [ncnn](https://github.com/tencent/ncnn)
35 | * [YOLOv5_NCNN](https://github.com/WZTENG/YOLOv5_NCNN)
36 |
37 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/.gitignore:
--------------------------------------------------------------------------------
1 | /build
2 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/build.gradle:
--------------------------------------------------------------------------------
1 | apply plugin: 'com.android.application'
2 |
3 | android {
4 | compileSdkVersion 29
5 | buildToolsVersion "29.0.3"
6 | defaultConfig {
7 | applicationId "com.rangi.nanodet"
8 | minSdkVersion 26
9 | targetSdkVersion 29
10 | versionCode 1
11 | versionName "1.0"
12 | testInstrumentationRunner "androidx.test.runner.AndroidJUnitRunner"
13 | externalNativeBuild {
14 | cmake {
15 | cppFlags ""
16 | arguments '-DANDROID_PLATFORM=android-24', '-DANDROID_STL=c++_shared'
17 | }
18 | }
19 |
20 | ndk {
21 | moduleName "NcnnJniLog"
22 | ldLibs "log", "z", "m"
23 | abiFilters "armeabi-v7a", "arm64-v8a"
24 | }
25 |
26 | multiDexEnabled true
27 | }
28 | buildTypes {
29 | release {
30 | minifyEnabled false
31 | proguardFiles getDefaultProguardFile('proguard-android-optimize.txt'), 'proguard-rules.pro'
32 | }
33 | }
34 | externalNativeBuild {
35 | cmake {
36 | path "src/main/cpp/CMakeLists.txt"
37 | version "3.10.2"
38 | }
39 | }
40 | sourceSets {
41 | main {
42 | jniLibs.srcDirs = ['libs']
43 | }
44 | }
45 |
46 | repositories {
47 | flatDir {
48 | dirs 'libs'
49 | }
50 | }
51 | }
52 |
53 | dependencies {
54 | implementation fileTree(dir: 'libs', include: ['*.jar'])
55 | implementation 'androidx.appcompat:appcompat:1.1.0'
56 | implementation 'androidx.constraintlayout:constraintlayout:1.1.3'
57 | testImplementation 'junit:junit:4.12'
58 | androidTestImplementation 'androidx.test.ext:junit:1.1.1'
59 | androidTestImplementation 'androidx.test.espresso:espresso-core:3.2.0'
60 |
61 | // Use the most recent version of CameraX, currently that is alpha05
62 | def camerax_version = "1.0.0-alpha05"
63 | //noinspection GradleDependency
64 | implementation "androidx.camera:camera-core:${camerax_version}"
65 | //noinspection GradleDependency
66 | implementation "androidx.camera:camera-camera2:${camerax_version}"
67 |
68 | implementation 'com.android.support:multidex:1.0.3'
69 | // crash
70 | implementation 'com.zxy.android:recovery:1.0.0'
71 | // photoview
72 | implementation 'com.github.chrisbanes:PhotoView:2.3.0'
73 | // implementation 'com.bm.photoview:library:1.4.1'
74 |
75 | }
76 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/proguard-rules.pro:
--------------------------------------------------------------------------------
1 | # Add project specific ProGuard rules here.
2 | # You can control the set of applied configuration files using the
3 | # proguardFiles setting in build.gradle.
4 | #
5 | # For more details, see
6 | # http://developer.android.com/guide/developing/tools/proguard.html
7 |
8 | # If your project uses WebView with JS, uncomment the following
9 | # and specify the fully qualified class name to the JavaScript interface
10 | # class:
11 | #-keepclassmembers class fqcn.of.javascript.interface.for.webview {
12 | # public *;
13 | #}
14 |
15 | # Uncomment this to preserve the line number information for
16 | # debugging stack traces.
17 | #-keepattributes SourceFile,LineNumberTable
18 |
19 | # If you keep the line number information, uncomment this to
20 | # hide the original source file name.
21 | #-renamesourcefileattribute SourceFile
22 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/androidTest/java/com/rangi/nanodet/ExampleInstrumentedTest.java:
--------------------------------------------------------------------------------
1 | package com.rangi.nanodet;
2 |
3 | import android.content.Context;
4 |
5 | import androidx.test.platform.app.InstrumentationRegistry;
6 | import androidx.test.ext.junit.runners.AndroidJUnit4;
7 |
8 | import org.junit.Test;
9 | import org.junit.runner.RunWith;
10 |
11 | import static org.junit.Assert.*;
12 |
13 | /**
14 | * Instrumented test, which will execute on an Android device.
15 | *
16 | * @see Testing documentation
17 | */
18 | @RunWith(AndroidJUnit4.class)
19 | public class ExampleInstrumentedTest {
20 | @Test
21 | public void useAppContext() {
22 | // Context of the app under test.
23 | Context appContext = InstrumentationRegistry.getInstrumentation().getTargetContext();
24 |
25 | assertEquals("gd.hq.yolov5", appContext.getPackageName());
26 | }
27 | }
28 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/AndroidManifest.xml:
--------------------------------------------------------------------------------
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/cpp/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | cmake_minimum_required(VERSION 3.10)
2 |
3 | set(ncnn_DIR ${CMAKE_SOURCE_DIR}/ncnn-20201218-android-vulkan/${ANDROID_ABI}/lib/cmake/ncnn)
4 | find_package(ncnn REQUIRED)
5 |
6 | add_library(yolov5 SHARED
7 | jni_interface.cpp
8 | YoloV5.cpp
9 | YoloV4.cpp
10 | NanoDet.cpp
11 | )
12 |
13 | target_link_libraries(yolov5 ncnn jnigraphics)
14 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/cpp/NanoDet.h:
--------------------------------------------------------------------------------
1 | //
2 | // Created by RangiLyu
3 | // 2020 / 10 / 2
4 | //
5 |
6 | #ifndef NANODET_H
7 | #define NANODET_H
8 |
9 | #include "net.h"
10 | #include "YoloV5.h"
11 |
12 | typedef struct HeadInfo
13 | {
14 | std::string cls_layer;
15 | std::string dis_layer;
16 | int stride;
17 | } HeadInfo;
18 |
19 |
20 | class NanoDet{
21 | public:
22 | NanoDet(AAssetManager *mgr, const char *param, const char *bin, bool useGPU);
23 |
24 | ~NanoDet();
25 |
26 | std::vector<BoxInfo> detect(JNIEnv *env, jobject image, float score_threshold, float nms_threshold);
27 | std::vector<std::string> labels{"person", "bicycle", "car", "motorcycle", "airplane", "bus", "train", "truck", "boat", "traffic light",
28 | "fire hydrant", "stop sign", "parking meter", "bench", "bird", "cat", "dog", "horse", "sheep", "cow",
29 | "elephant", "bear", "zebra", "giraffe", "backpack", "umbrella", "handbag", "tie", "suitcase", "frisbee",
30 | "skis", "snowboard", "sports ball", "kite", "baseball bat", "baseball glove", "skateboard", "surfboard",
31 | "tennis racket", "bottle", "wine glass", "cup", "fork", "knife", "spoon", "bowl", "banana", "apple",
32 | "sandwich", "orange", "broccoli", "carrot", "hot dog", "pizza", "donut", "cake", "chair", "couch",
33 | "potted plant", "bed", "dining table", "toilet", "tv", "laptop", "mouse", "remote", "keyboard", "cell phone",
34 | "microwave", "oven", "toaster", "sink", "refrigerator", "book", "clock", "vase", "scissors", "teddy bear",
35 | "hair drier", "toothbrush"};
36 | private:
37 | void preprocess(JNIEnv *env, jobject image, ncnn::Mat& in);
38 | void decode_infer(ncnn::Mat& cls_pred, ncnn::Mat& dis_pred, int stride, float threshold, std::vector<std::vector<BoxInfo>>& results, float width_ratio, float height_ratio);
39 | BoxInfo disPred2Bbox(const float*& dfl_det, int label, float score, int x, int y, int stride, float width_ratio, float height_ratio);
40 |
41 | static void nms(std::vector& result, float nms_threshold);
42 |
43 | ncnn::Net *Net;
44 | int input_size = 320;
45 | int num_class = 80;
46 | int reg_max = 7;
47 | std::vector<HeadInfo> heads_info{
48 | // cls_pred|dis_pred|stride
49 | {"cls_pred_stride_8", "dis_pred_stride_8", 8},
50 | {"cls_pred_stride_16", "dis_pred_stride_16", 16},
51 | {"cls_pred_stride_32", "dis_pred_stride_32", 32},
52 | };
53 |
54 | public:
55 | static NanoDet *detector;
56 | static bool hasGPU;
57 | };
58 |
59 |
60 | #endif //NANODET_H
61 |
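A note on the decoding declared above: for every feature-map cell, the head outputs per-class scores (cls_pred_stride_*) and, for each of the four box sides, a discrete distribution over reg_max + 1 = 8 bins (dis_pred_stride_*). disPred2Bbox turns each distribution into a distance by taking its softmax expectation and scaling by the stride, then grows the box outward from the cell center. A rough, self-contained sketch of that step (the shipped NanoDet.cpp is the authoritative version; the helper names below are made up for illustration, and the exact cell-center convention follows NanoDet.cpp):

#include <cmath>
#include <vector>

// Softmax expectation of the bin index, scaled back to input-image pixels.
static float decode_distance(const float *logits, int reg_max, int stride) {
    std::vector<float> p(reg_max + 1);
    float sum = 0.f;
    for (int j = 0; j <= reg_max; j++) { p[j] = std::exp(logits[j]); sum += p[j]; }
    float dis = 0.f;
    for (int j = 0; j <= reg_max; j++) dis += j * p[j] / sum;
    return dis * stride;
}

// (x, y) is the cell index on the stride-s feature map; dfl_det points at the
// 4 * (reg_max + 1) regression values for that cell. Output is x1, y1, x2, y2.
static void decode_box(const float *dfl_det, int x, int y, int stride, int reg_max, float box[4]) {
    float cx = (x + 0.5f) * stride, cy = (y + 0.5f) * stride;
    box[0] = cx - decode_distance(dfl_det + 0 * (reg_max + 1), reg_max, stride);  // left
    box[1] = cy - decode_distance(dfl_det + 1 * (reg_max + 1), reg_max, stride);  // top
    box[2] = cx + decode_distance(dfl_det + 2 * (reg_max + 1), reg_max, stride);  // right
    box[3] = cy + decode_distance(dfl_det + 3 * (reg_max + 1), reg_max, stride);  // bottom
}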
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/cpp/YoloV4.cpp:
--------------------------------------------------------------------------------
1 | #include "YoloV4.h"
2 |
3 | bool YoloV4::hasGPU = true;
4 | YoloV4 *YoloV4::detector = nullptr;
5 |
6 | YoloV4::YoloV4(AAssetManager *mgr, const char *param, const char *bin, bool useGPU) {
7 | Net = new ncnn::Net();
8 | // opt must be set before loading the model
9 | hasGPU = ncnn::get_gpu_count() > 0;
10 | Net->opt.use_vulkan_compute = hasGPU && useGPU; // gpu
11 | Net->opt.use_fp16_arithmetic = true; // use fp16 arithmetic to speed up inference
12 | Net->load_param(mgr, param);
13 | Net->load_model(mgr, bin);
14 | }
15 |
16 | YoloV4::~YoloV4() {
17 | delete Net;
18 | }
19 |
20 | std::vector<BoxInfo> YoloV4::detect(JNIEnv *env, jobject image, float threshold, float nms_threshold) {
21 | AndroidBitmapInfo img_size;
22 | AndroidBitmap_getInfo(env, image, &img_size);
23 | ncnn::Mat in_net = ncnn::Mat::from_android_bitmap_resize(env, image, ncnn::Mat::PIXEL_RGBA2RGB, input_size,
24 | input_size);
25 | float norm[3] = {1 / 255.f, 1 / 255.f, 1 / 255.f};
26 | float mean[3] = {0, 0, 0};
27 | in_net.substract_mean_normalize(mean, norm);
28 | auto ex = Net->create_extractor();
29 | ex.set_light_mode(true);
30 | ex.set_num_threads(4);
31 | hasGPU = ncnn::get_gpu_count() > 0;
32 | ex.set_vulkan_compute(hasGPU);
33 | ex.input(0, in_net);
34 | std::vector<BoxInfo> result;
35 | ncnn::Mat blob;
36 | ex.extract("output", blob);
37 | auto boxes = decode_infer(blob, {(int) img_size.width, (int) img_size.height}, input_size, num_class, threshold);
38 | result.insert(result.begin(), boxes.begin(), boxes.end());
39 | // nms(result,nms_threshold);
40 | return result;
41 | }
42 |
43 | inline float fast_exp(float x) { // Schraudolph-style approximation: builds the IEEE-754 bit pattern of e^x directly
44 | union {
45 | uint32_t i;
46 | float f;
47 | } v{};
48 | v.i = (1 << 23) * (1.4426950409 * x + 126.93490512f);
49 | return v.f;
50 | }
51 |
52 | inline float sigmoid(float x) {
53 | return 1.0f / (1.0f + fast_exp(-x));
54 | }
55 |
56 | std::vector<BoxInfo>
57 | YoloV4::decode_infer(ncnn::Mat &data, const yolocv::YoloSize &frame_size, int net_size, int num_classes, float threshold) {
58 | std::vector<BoxInfo> result;
59 | for (int i = 0; i < data.h; i++) {
60 | BoxInfo box;
61 | const float *values = data.row(i);
62 | box.label = values[0] - 1;
63 | box.score = values[1];
64 | box.x1 = values[2] * (float) frame_size.width;
65 | box.y1 = values[3] * (float) frame_size.height;
66 | box.x2 = values[4] * (float) frame_size.width;
67 | box.y2 = values[5] * (float) frame_size.height;
68 | result.push_back(box);
69 | }
70 | return result;
71 | }
72 |
73 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/cpp/YoloV4.h:
--------------------------------------------------------------------------------
1 | #ifndef YOLOV4_H
2 | #define YOLOV4_H
3 |
4 | #include "net.h"
5 | #include "YoloV5.h"
6 |
7 |
8 | class YoloV4 {
9 | public:
10 | YoloV4(AAssetManager *mgr, const char *param, const char *bin, bool useGPU);
11 |
12 | ~YoloV4();
13 |
14 | std::vector<BoxInfo> detect(JNIEnv *env, jobject image, float threshold, float nms_threshold);
15 | std::vector<std::string> labels{"person", "bicycle", "car", "motorcycle", "airplane", "bus", "train", "truck", "boat", "traffic light",
16 | "fire hydrant", "stop sign", "parking meter", "bench", "bird", "cat", "dog", "horse", "sheep", "cow",
17 | "elephant", "bear", "zebra", "giraffe", "backpack", "umbrella", "handbag", "tie", "suitcase", "frisbee",
18 | "skis", "snowboard", "sports ball", "kite", "baseball bat", "baseball glove", "skateboard", "surfboard",
19 | "tennis racket", "bottle", "wine glass", "cup", "fork", "knife", "spoon", "bowl", "banana", "apple",
20 | "sandwich", "orange", "broccoli", "carrot", "hot dog", "pizza", "donut", "cake", "chair", "couch",
21 | "potted plant", "bed", "dining table", "toilet", "tv", "laptop", "mouse", "remote", "keyboard", "cell phone",
22 | "microwave", "oven", "toaster", "sink", "refrigerator", "book", "clock", "vase", "scissors", "teddy bear",
23 | "hair drier", "toothbrush"};
24 | private:
25 | static std::vector<BoxInfo>
26 | decode_infer(ncnn::Mat &data, const yolocv::YoloSize &frame_size, int net_size, int num_classes, float threshold);
27 |
28 | // static void nms(std::vector<BoxInfo> &result, float nms_threshold);
29 | ncnn::Net *Net;
30 | int input_size = 640 / 2;
31 | int num_class = 80;
32 | public:
33 | static YoloV4 *detector;
34 | static bool hasGPU;
35 | };
36 |
37 |
38 | #endif //YOLOV4_H
39 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/cpp/YoloV5.h:
--------------------------------------------------------------------------------
1 | //
2 | // Created by 邓昊晴 on 14/6/2020.
3 | //
4 |
5 | #ifndef YOLOV5_H
6 | #define YOLOV5_H
7 |
8 | #include "net.h"
9 |
10 | namespace yolocv {
11 | typedef struct {
12 | int width;
13 | int height;
14 | } YoloSize;
15 | }
16 |
17 | typedef struct {
18 | std::string name;
19 | int stride;
20 | std::vector<yolocv::YoloSize> anchors;
21 | } YoloLayerData;
22 |
23 | typedef struct BoxInfo {
24 | float x1;
25 | float y1;
26 | float x2;
27 | float y2;
28 | float score;
29 | int label;
30 | } BoxInfo;
31 |
32 | class YoloV5 {
33 | public:
34 | YoloV5(AAssetManager *mgr, const char *param, const char *bin, bool useGPU);
35 |
36 | ~YoloV5();
37 |
38 | std::vector<BoxInfo> detect(JNIEnv *env, jobject image, float threshold, float nms_threshold);
39 | std::vector<std::string> labels{"person", "bicycle", "car", "motorcycle", "airplane", "bus", "train", "truck", "boat", "traffic light",
40 | "fire hydrant", "stop sign", "parking meter", "bench", "bird", "cat", "dog", "horse", "sheep", "cow",
41 | "elephant", "bear", "zebra", "giraffe", "backpack", "umbrella", "handbag", "tie", "suitcase", "frisbee",
42 | "skis", "snowboard", "sports ball", "kite", "baseball bat", "baseball glove", "skateboard", "surfboard",
43 | "tennis racket", "bottle", "wine glass", "cup", "fork", "knife", "spoon", "bowl", "banana", "apple",
44 | "sandwich", "orange", "broccoli", "carrot", "hot dog", "pizza", "donut", "cake", "chair", "couch",
45 | "potted plant", "bed", "dining table", "toilet", "tv", "laptop", "mouse", "remote", "keyboard", "cell phone",
46 | "microwave", "oven", "toaster", "sink", "refrigerator", "book", "clock", "vase", "scissors", "teddy bear",
47 | "hair drier", "toothbrush"};
48 | private:
49 | static std::vector<BoxInfo>
50 | decode_infer(ncnn::Mat &data, int stride, const yolocv::YoloSize &frame_size, int net_size, int num_classes,
51 | const std::vector<yolocv::YoloSize> &anchors, float threshold);
52 |
53 | static void nms(std::vector<BoxInfo> &result, float nms_threshold);
54 |
55 | ncnn::Net *Net;
56 | int input_size = 640;
57 | int num_class = 80;
58 | std::vector<YoloLayerData> layers{
59 | {"394", 32, {{116, 90}, {156, 198}, {373, 326}}},
60 | {"375", 16, {{30, 61}, {62, 45}, {59, 119}}},
61 | {"output", 8, {{10, 13}, {16, 30}, {33, 23}}},
62 | };
63 |
64 | public:
65 | static YoloV5 *detector;
66 | static bool hasGPU;
67 | };
68 |
69 |
70 | #endif //YOLOV5_H
71 |
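The nms declared above is implemented in YoloV5.cpp, which is not included in this listing. It is the standard greedy IoU suppression over the BoxInfo struct defined in this header; a rough sketch, with the helper names made up for illustration:

#include <algorithm>
#include <vector>

// Intersection-over-union of two BoxInfo rectangles.
static float iou(const BoxInfo &a, const BoxInfo &b) {
    float ix1 = std::max(a.x1, b.x1), iy1 = std::max(a.y1, b.y1);
    float ix2 = std::min(a.x2, b.x2), iy2 = std::min(a.y2, b.y2);
    float inter = std::max(0.f, ix2 - ix1) * std::max(0.f, iy2 - iy1);
    float union_area = (a.x2 - a.x1) * (a.y2 - a.y1) + (b.x2 - b.x1) * (b.y2 - b.y1) - inter;
    return inter / (union_area + 1e-6f);
}

// Keep the highest-scoring boxes, dropping any box that overlaps a kept one
// by more than nms_threshold.
static void nms_sketch(std::vector<BoxInfo> &boxes, float nms_threshold) {
    std::sort(boxes.begin(), boxes.end(),
              [](const BoxInfo &a, const BoxInfo &b) { return a.score > b.score; });
    std::vector<BoxInfo> kept;
    for (const auto &cand : boxes) {
        bool suppressed = false;
        for (const auto &k : kept)
            if (iou(cand, k) > nms_threshold) { suppressed = true; break; }
        if (!suppressed) kept.push_back(cand);
    }
    boxes.swap(kept);
}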
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/cpp/jni_interface.cpp:
--------------------------------------------------------------------------------
1 | #include <jni.h>
2 | #include <string>
3 | #include <vector>
4 | #include <android/asset_manager_jni.h>
5 | #include <android/log.h>
6 | #include "YoloV5.h"
7 | #include "YoloV4.h"
8 | #include "NanoDet.h"
9 |
10 |
11 | JNIEXPORT jint JNI_OnLoad(JavaVM *vm, void *reserved) {
12 | ncnn::create_gpu_instance();
13 | if (ncnn::get_gpu_count() > 0) {
14 | YoloV5::hasGPU = true;
15 | YoloV4::hasGPU = true;
16 | NanoDet::hasGPU = true;
17 | }
18 | return JNI_VERSION_1_6;
19 | }
20 |
21 | JNIEXPORT void JNI_OnUnload(JavaVM *vm, void *reserved) {
22 | ncnn::destroy_gpu_instance();
23 | }
24 |
25 |
26 | /*********************************************************************************************
27 | NanoDet
28 | ********************************************************************************************/
29 |
30 | extern "C" JNIEXPORT void JNICALL
31 | Java_com_rangi_nanodet_NanoDet_init(JNIEnv *env, jclass, jobject assetManager, jboolean useGPU) {
32 | if (NanoDet::detector == nullptr) {
33 | AAssetManager *mgr = AAssetManager_fromJava(env, assetManager);
34 | NanoDet::detector = new NanoDet(mgr, "nanodet_m.param", "nanodet_m.bin", useGPU);
35 | }
36 | }
37 |
38 | extern "C" JNIEXPORT jobjectArray JNICALL
39 | Java_com_rangi_nanodet_NanoDet_detect(JNIEnv *env, jclass, jobject image, jdouble threshold, jdouble nms_threshold) {
40 | auto result = NanoDet::detector->detect(env, image, threshold, nms_threshold);
41 |
42 | auto box_cls = env->FindClass("com/rangi/nanodet/Box");
43 | auto cid = env->GetMethodID(box_cls, "<init>", "(FFFFIF)V");
44 | jobjectArray ret = env->NewObjectArray(result.size(), box_cls, nullptr);
45 | int i = 0;
46 | for (auto &box:result) {
47 | env->PushLocalFrame(1);
48 | jobject obj = env->NewObject(box_cls, cid, box.x1, box.y1, box.x2, box.y2, box.label, box.score);
49 | obj = env->PopLocalFrame(obj);
50 | env->SetObjectArrayElement(ret, i++, obj);
51 | }
52 | return ret;
53 | }
54 |
55 | /*********************************************************************************************
56 | Yolov5
57 | ********************************************************************************************/
58 | extern "C" JNIEXPORT void JNICALL
59 | Java_com_rangi_nanodet_YOLOv5_init(JNIEnv *env, jclass, jobject assetManager, jboolean useGPU) {
60 | if (YoloV5::detector == nullptr) {
61 | AAssetManager *mgr = AAssetManager_fromJava(env, assetManager);
62 | YoloV5::detector = new YoloV5(mgr, "yolov5.param", "yolov5.bin", useGPU);
63 | }
64 | }
65 |
66 | extern "C" JNIEXPORT jobjectArray JNICALL
67 | Java_com_rangi_nanodet_YOLOv5_detect(JNIEnv *env, jclass, jobject image, jdouble threshold, jdouble nms_threshold) {
68 | auto result = YoloV5::detector->detect(env, image, threshold, nms_threshold);
69 |
70 | auto box_cls = env->FindClass("com/rangi/nanodet/Box");
71 | auto cid = env->GetMethodID(box_cls, "<init>", "(FFFFIF)V");
72 | jobjectArray ret = env->NewObjectArray(result.size(), box_cls, nullptr);
73 | int i = 0;
74 | for (auto &box:result) {
75 | env->PushLocalFrame(1);
76 | jobject obj = env->NewObject(box_cls, cid, box.x1, box.y1, box.x2, box.y2, box.label, box.score);
77 | obj = env->PopLocalFrame(obj);
78 | env->SetObjectArrayElement(ret, i++, obj);
79 | }
80 | return ret;
81 | }
82 |
83 | /*********************************************************************************************
84 | YOLOv4-tiny
85 | ********************************************************************************************/
86 | extern "C" JNIEXPORT void JNICALL
87 | Java_com_rangi_nanodet_YOLOv4_init(JNIEnv *env, jclass, jobject assetManager, jboolean useGPU) {
88 | if (YoloV4::detector == nullptr) {
89 | AAssetManager *mgr = AAssetManager_fromJava(env, assetManager);
90 | YoloV4::detector = new YoloV4(mgr, "yolov4-tiny-opt.param", "yolov4-tiny-opt.bin", useGPU);
91 | }
92 | }
93 |
94 | extern "C" JNIEXPORT jobjectArray JNICALL
95 | Java_com_rangi_nanodet_YOLOv4_detect(JNIEnv *env, jclass, jobject image, jdouble threshold, jdouble nms_threshold) {
96 | auto result = YoloV4::detector->detect(env, image, threshold, nms_threshold);
97 |
98 | auto box_cls = env->FindClass("com/rangi/nanodet/Box");
99 | auto cid = env->GetMethodID(box_cls, "<init>", "(FFFFIF)V");
100 | jobjectArray ret = env->NewObjectArray(result.size(), box_cls, nullptr);
101 | int i = 0;
102 | for (auto &box:result) {
103 | env->PushLocalFrame(1);
104 | jobject obj = env->NewObject(box_cls, cid, box.x1, box.y1, box.x2, box.y2, box.label, box.score);
105 | obj = env->PopLocalFrame(obj);
106 | env->SetObjectArrayElement(ret, i++, obj);
107 | }
108 | return ret;
109 | }
110 |
111 |
112 |
113 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/java/com/rangi/nanodet/AppCrashHandler.java:
--------------------------------------------------------------------------------
1 | package com.rangi.nanodet;
2 |
3 | import androidx.annotation.NonNull;
4 |
5 | class AppCrashHandler implements Thread.UncaughtExceptionHandler {
6 |
7 | private Thread.UncaughtExceptionHandler uncaughtExceptionHandler = Thread.getDefaultUncaughtExceptionHandler();
8 |
9 | @Override
10 | public void uncaughtException(@NonNull Thread t, @NonNull Throwable e) {
11 | uncaughtExceptionHandler.uncaughtException(t, e);
12 | }
13 |
14 | public static void register() {
15 | Thread.setDefaultUncaughtExceptionHandler(new AppCrashHandler());
16 | }
17 |
18 | }
19 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/java/com/rangi/nanodet/Box.java:
--------------------------------------------------------------------------------
1 | package com.rangi.nanodet;
2 |
3 | import android.graphics.Color;
4 | import android.graphics.RectF;
5 |
6 | import java.util.Random;
7 |
8 | public class Box {
9 | public float x0,y0,x1,y1;
10 | private int label;
11 | private float score;
12 | private static String[] labels={"person", "bicycle", "car", "motorcycle", "airplane", "bus", "train", "truck", "boat", "traffic light",
13 | "fire hydrant", "stop sign", "parking meter", "bench", "bird", "cat", "dog", "horse", "sheep", "cow",
14 | "elephant", "bear", "zebra", "giraffe", "backpack", "umbrella", "handbag", "tie", "suitcase", "frisbee",
15 | "skis", "snowboard", "sports ball", "kite", "baseball bat", "baseball glove", "skateboard", "surfboard",
16 | "tennis racket", "bottle", "wine glass", "cup", "fork", "knife", "spoon", "bowl", "banana", "apple",
17 | "sandwich", "orange", "broccoli", "carrot", "hot dog", "pizza", "donut", "cake", "chair", "couch",
18 | "potted plant", "bed", "dining table", "toilet", "tv", "laptop", "mouse", "remote", "keyboard", "cell phone",
19 | "microwave", "oven", "toaster", "sink", "refrigerator", "book", "clock", "vase", "scissors", "teddy bear",
20 | "hair drier", "toothbrush"};
21 | public Box(float x0,float y0, float x1, float y1, int label, float score){
22 | this.x0 = x0;
23 | this.y0 = y0;
24 | this.x1 = x1;
25 | this.y1 = y1;
26 | this.label = label;
27 | this.score = score;
28 | }
29 |
30 | public RectF getRect(){
31 | return new RectF(x0,y0,x1,y1);
32 | }
33 |
34 | public String getLabel(){
35 | return labels[label];
36 | }
37 |
38 | public float getScore(){
39 | return score;
40 | }
41 |
42 | public int getColor(){
43 | Random random = new Random(label);
44 | return Color.argb(255,random.nextInt(256),random.nextInt(256),random.nextInt(256));
45 | }
46 | }
47 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/java/com/rangi/nanodet/NanoDet.java:
--------------------------------------------------------------------------------
1 | package com.rangi.nanodet;
2 |
3 | import android.content.res.AssetManager;
4 | import android.graphics.Bitmap;
5 |
6 | public class NanoDet {
7 | static {
8 | System.loadLibrary("yolov5");
9 | }
10 |
11 | public static native void init(AssetManager manager, boolean useGPU);
12 | public static native Box[] detect(Bitmap bitmap, double threshold, double nms_threshold);
13 | }
14 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/java/com/rangi/nanodet/NcnnApp.java:
--------------------------------------------------------------------------------
1 | package com.rangi.nanodet;
2 |
3 | import android.app.Application;
4 | import android.content.Context;
5 | import android.util.Log;
6 |
7 | import androidx.multidex.MultiDex;
8 |
9 | import com.zxy.recovery.callback.RecoveryCallback;
10 | import com.zxy.recovery.core.Recovery;
11 |
12 |
13 | public class NcnnApp extends Application {
14 |
15 | @Override
16 | public void onCreate() {
17 | super.onCreate();
18 |
19 | // crash recovery screen
20 | initRecovery();
21 | }
22 |
23 | @Override
24 | protected void attachBaseContext(Context base) {
25 | super.attachBaseContext(base);
26 | MultiDex.install(base);
27 | }
28 |
29 | private void initRecovery() {
30 | Recovery.getInstance()
31 | .debug(BuildConfig.DEBUG)
32 | .recoverInBackground(true)
33 | .recoverStack(true)
34 | .mainPage(MainActivity.class)
35 | .recoverEnabled(true)
36 | .callback(new MyCrashCallback())
37 | .silent(false, Recovery.SilentMode.RECOVER_ACTIVITY_STACK)
38 | // .skip(TestActivity.class)
39 | .init(this);
40 | AppCrashHandler.register();
41 | }
42 |
43 | static final class MyCrashCallback implements RecoveryCallback {
44 | @Override
45 | public void stackTrace(String exceptionMessage) {
46 | Log.e("wzt", "exceptionMessage:" + exceptionMessage);
47 | }
48 |
49 | @Override
50 | public void cause(String cause) {
51 | Log.e("wzt", "cause:" + cause);
52 | }
53 |
54 | @Override
55 | public void exception(String exceptionType, String throwClassName, String throwMethodName, int throwLineNumber) {
56 | Log.e("wzt", "exceptionClassName:" + exceptionType);
57 | Log.e("wzt", "throwClassName:" + throwClassName);
58 | Log.e("wzt", "throwMethodName:" + throwMethodName);
59 | Log.e("wzt", "throwLineNumber:" + throwLineNumber);
60 | }
61 |
62 | @Override
63 | public void throwable(Throwable throwable) {
64 |
65 | }
66 | }
67 |
68 | }
69 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/java/com/rangi/nanodet/WelcomeActivity.java:
--------------------------------------------------------------------------------
1 | package com.rangi.nanodet;
2 |
3 | import androidx.appcompat.app.AlertDialog;
4 | import androidx.appcompat.app.AppCompatActivity;
5 |
6 | import android.content.Intent;
7 | import android.os.Bundle;
8 | import android.view.View;
9 | import android.widget.Button;
10 | import android.widget.CompoundButton;
11 | import android.widget.ToggleButton;
12 |
13 |
14 | public class WelcomeActivity extends AppCompatActivity {
15 |
16 | private ToggleButton tbUseGpu;
17 | private Button nanodet;
18 | private Button yolov5s;
19 | private Button yolov4tiny;
20 |
21 | private boolean useGPU = false;
22 |
23 | @Override
24 | protected void onCreate(Bundle savedInstanceState) {
25 | super.onCreate(savedInstanceState);
26 | setContentView(R.layout.activity_welcome);
27 |
28 | tbUseGpu = findViewById(R.id.tb_use_gpu);
29 | tbUseGpu.setOnCheckedChangeListener(new CompoundButton.OnCheckedChangeListener() {
30 | @Override
31 | public void onCheckedChanged(CompoundButton buttonView, boolean isChecked) {
32 | useGPU = isChecked;
33 | MainActivity.USE_GPU = useGPU;
34 | if (useGPU) {
35 | AlertDialog.Builder builder = new AlertDialog.Builder(WelcomeActivity.this);
36 | builder.setTitle("Warning");
37 | builder.setMessage("It may not work well in GPU mode, or errors may occur.");
38 | builder.setCancelable(true);
39 | builder.setPositiveButton("OK", null);
40 | AlertDialog dialog = builder.create();
41 | dialog.show();
42 | }
43 | }
44 | });
45 |
46 | nanodet = findViewById(R.id.btn_start_detect0);
47 | nanodet.setOnClickListener(new View.OnClickListener() {
48 | @Override
49 | public void onClick(View v) {
50 | MainActivity.USE_MODEL = MainActivity.NANODET;
51 | Intent intent = new Intent(WelcomeActivity.this, MainActivity.class);
52 | WelcomeActivity.this.startActivity(intent);
53 | }
54 | });
55 |
56 | yolov5s = findViewById(R.id.btn_start_detect1);
57 | yolov5s.setOnClickListener(new View.OnClickListener() {
58 | @Override
59 | public void onClick(View v) {
60 | MainActivity.USE_MODEL = MainActivity.YOLOV5S;
61 | Intent intent = new Intent(WelcomeActivity.this, MainActivity.class);
62 | WelcomeActivity.this.startActivity(intent);
63 | }
64 | });
65 |
66 | yolov4tiny = findViewById(R.id.btn_start_detect2);
67 | yolov4tiny.setOnClickListener(new View.OnClickListener() {
68 | @Override
69 | public void onClick(View v) {
70 | MainActivity.USE_MODEL = MainActivity.YOLOV4_TINY;
71 | Intent intent = new Intent(WelcomeActivity.this, MainActivity.class);
72 | WelcomeActivity.this.startActivity(intent);
73 | }
74 | });
75 |
76 | }
77 |
78 | }
79 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/java/com/rangi/nanodet/YOLOv4.java:
--------------------------------------------------------------------------------
1 | package com.rangi.nanodet;
2 |
3 | import android.content.res.AssetManager;
4 | import android.graphics.Bitmap;
5 |
6 | public class YOLOv4 {
7 | static {
8 | System.loadLibrary("yolov5"); // the native code is bundled in yolov5.so
9 | }
10 |
11 | public static native void init(AssetManager manager, boolean useGPU);
12 | public static native Box[] detect(Bitmap bitmap, double threshold, double nms_threshold);
13 | }
14 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/java/com/rangi/nanodet/YOLOv5.java:
--------------------------------------------------------------------------------
1 | package com.rangi.nanodet;
2 |
3 | import android.content.res.AssetManager;
4 | import android.graphics.Bitmap;
5 |
6 | public class YOLOv5 {
7 | static {
8 | System.loadLibrary("yolov5");
9 | }
10 |
11 | public static native void init(AssetManager manager, boolean useGPU);
12 | public static native Box[] detect(Bitmap bitmap, double threshold, double nms_threshold);
13 | }
14 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/drawable-v24/ic_launcher_foreground.xml:
--------------------------------------------------------------------------------
1 |
7 |
12 |
13 |
19 |
22 |
25 |
26 |
27 |
28 |
34 |
35 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/drawable-xxhdpi/cpu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/drawable-xxhdpi/cpu.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/drawable-xxhdpi/gpu.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/drawable-xxhdpi/gpu.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/drawable-xxhdpi/ncnn_icon.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/drawable-xxhdpi/ncnn_icon.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/drawable/cpu_gpu_bg.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 |
6 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/layout/activity_main.xml:
--------------------------------------------------------------------------------
1 |
2 |
8 |
9 |
17 |
18 |
28 |
29 |
38 |
39 |
49 |
50 |
63 |
64 |
74 |
75 |
88 |
89 |
98 |
99 |
109 |
110 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/layout/activity_welcome.xml:
--------------------------------------------------------------------------------
1 |
2 |
8 |
9 |
10 |
11 |
12 |
13 |
14 |
15 |
16 |
17 |
18 |
30 |
31 |
38 |
39 |
47 |
48 |
55 |
56 |
63 |
64 |
71 |
72 |
73 |
74 |
75 |
76 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/mipmap-anydpi-v26/ic_launcher.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/mipmap-anydpi-v26/ic_launcher_round.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/mipmap-hdpi/ic_launcher.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/mipmap-hdpi/ic_launcher.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/mipmap-hdpi/ic_launcher_round.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/mipmap-hdpi/ic_launcher_round.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/mipmap-mdpi/ic_launcher.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/mipmap-mdpi/ic_launcher.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/mipmap-mdpi/ic_launcher_round.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/mipmap-mdpi/ic_launcher_round.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/mipmap-xhdpi/ic_launcher.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/mipmap-xhdpi/ic_launcher.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/mipmap-xhdpi/ic_launcher_round.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/mipmap-xhdpi/ic_launcher_round.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/mipmap-xxhdpi/ic_launcher.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/mipmap-xxhdpi/ic_launcher.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/mipmap-xxxhdpi/ic_launcher.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/mipmap-xxxhdpi/ic_launcher.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.png
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/values/colors.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 | #123F70
4 | #122F49
5 | #D81B60
6 |
7 | #DDDDDD
8 |
9 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/values/strings.xml:
--------------------------------------------------------------------------------
1 |
2 | NanoDet
3 |
4 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/main/res/values/styles.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
10 |
16 |
17 |
18 |
--------------------------------------------------------------------------------
/demo_android_ncnn/app/src/test/java/com/rangi/nanodet/ExampleUnitTest.java:
--------------------------------------------------------------------------------
1 | package com.rangi.nanodet;
2 |
3 | import org.junit.Test;
4 |
5 | import static org.junit.Assert.*;
6 |
7 | /**
8 | * Example local unit test, which will execute on the development machine (host).
9 | *
10 | * @see Testing documentation
11 | */
12 | public class ExampleUnitTest {
13 | @Test
14 | public void addition_isCorrect() {
15 | assertEquals(4, 2 + 2);
16 | }
17 | }
--------------------------------------------------------------------------------
/demo_android_ncnn/build.gradle:
--------------------------------------------------------------------------------
1 | // Top-level build file where you can add configuration options common to all sub-projects/modules.
2 |
3 | buildscript {
4 | repositories {
5 | google()
6 | jcenter()
7 |
8 | }
9 | dependencies {
10 | classpath 'com.android.tools.build:gradle:4.0.0'
11 |
12 | // NOTE: Do not place your application dependencies here; they belong
13 | // in the individual module build.gradle files
14 | }
15 | }
16 |
17 | allprojects {
18 | repositories {
19 | google()
20 | jcenter()
21 | maven { url "https://jitpack.io" }
22 | }
23 | }
24 |
25 | task clean(type: Delete) {
26 | delete rootProject.buildDir
27 | }
28 |
--------------------------------------------------------------------------------
/demo_android_ncnn/gradle.properties:
--------------------------------------------------------------------------------
1 | # Project-wide Gradle settings.
2 | # IDE (e.g. Android Studio) users:
3 | # Gradle settings configured through the IDE *will override*
4 | # any settings specified in this file.
5 | # For more details on how to configure your build environment visit
6 | # http://www.gradle.org/docs/current/userguide/build_environment.html
7 | # Specifies the JVM arguments used for the daemon process.
8 | # The setting is particularly useful for tweaking memory settings.
9 | org.gradle.jvmargs=-Xmx1536m
10 | # When configured, Gradle will run in incubating parallel mode.
11 | # This option should only be used with decoupled projects. More details, visit
12 | # http://www.gradle.org/docs/current/userguide/multi_project_builds.html#sec:decoupled_projects
13 | # org.gradle.parallel=true
14 | # AndroidX package structure to make it clearer which packages are bundled with the
15 | # Android operating system, and which are packaged with your app's APK
16 | # https://developer.android.com/topic/libraries/support-library/androidx-rn
17 | android.useAndroidX=true
18 | # Automatically convert third-party libraries to use AndroidX
19 | android.enableJetifier=true
20 |
21 |
--------------------------------------------------------------------------------
/demo_android_ncnn/gradle/wrapper/gradle-wrapper.jar:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_android_ncnn/gradle/wrapper/gradle-wrapper.jar
--------------------------------------------------------------------------------
/demo_android_ncnn/gradle/wrapper/gradle-wrapper.properties:
--------------------------------------------------------------------------------
1 | #Mon Jun 15 13:17:33 HKT 2020
2 | distributionBase=GRADLE_USER_HOME
3 | distributionPath=wrapper/dists
4 | zipStoreBase=GRADLE_USER_HOME
5 | zipStorePath=wrapper/dists
6 | distributionUrl=https\://services.gradle.org/distributions/gradle-6.1.1-all.zip
7 |
--------------------------------------------------------------------------------
/demo_android_ncnn/gradlew.bat:
--------------------------------------------------------------------------------
1 | @if "%DEBUG%" == "" @echo off
2 | @rem ##########################################################################
3 | @rem
4 | @rem Gradle startup script for Windows
5 | @rem
6 | @rem ##########################################################################
7 |
8 | @rem Set local scope for the variables with windows NT shell
9 | if "%OS%"=="Windows_NT" setlocal
10 |
11 | set DIRNAME=%~dp0
12 | if "%DIRNAME%" == "" set DIRNAME=.
13 | set APP_BASE_NAME=%~n0
14 | set APP_HOME=%DIRNAME%
15 |
16 | @rem Add default JVM options here. You can also use JAVA_OPTS and GRADLE_OPTS to pass JVM options to this script.
17 | set DEFAULT_JVM_OPTS=
18 |
19 | @rem Find java.exe
20 | if defined JAVA_HOME goto findJavaFromJavaHome
21 |
22 | set JAVA_EXE=java.exe
23 | %JAVA_EXE% -version >NUL 2>&1
24 | if "%ERRORLEVEL%" == "0" goto init
25 |
26 | echo.
27 | echo ERROR: JAVA_HOME is not set and no 'java' command could be found in your PATH.
28 | echo.
29 | echo Please set the JAVA_HOME variable in your environment to match the
30 | echo location of your Java installation.
31 |
32 | goto fail
33 |
34 | :findJavaFromJavaHome
35 | set JAVA_HOME=%JAVA_HOME:"=%
36 | set JAVA_EXE=%JAVA_HOME%/bin/java.exe
37 |
38 | if exist "%JAVA_EXE%" goto init
39 |
40 | echo.
41 | echo ERROR: JAVA_HOME is set to an invalid directory: %JAVA_HOME%
42 | echo.
43 | echo Please set the JAVA_HOME variable in your environment to match the
44 | echo location of your Java installation.
45 |
46 | goto fail
47 |
48 | :init
49 | @rem Get command-line arguments, handling Windows variants
50 |
51 | if not "%OS%" == "Windows_NT" goto win9xME_args
52 |
53 | :win9xME_args
54 | @rem Slurp the command line arguments.
55 | set CMD_LINE_ARGS=
56 | set _SKIP=2
57 |
58 | :win9xME_args_slurp
59 | if "x%~1" == "x" goto execute
60 |
61 | set CMD_LINE_ARGS=%*
62 |
63 | :execute
64 | @rem Setup the command line
65 |
66 | set CLASSPATH=%APP_HOME%\gradle\wrapper\gradle-wrapper.jar
67 |
68 | @rem Execute Gradle
69 | "%JAVA_EXE%" %DEFAULT_JVM_OPTS% %JAVA_OPTS% %GRADLE_OPTS% "-Dorg.gradle.appname=%APP_BASE_NAME%" -classpath "%CLASSPATH%" org.gradle.wrapper.GradleWrapperMain %CMD_LINE_ARGS%
70 |
71 | :end
72 | @rem End local scope for the variables with windows NT shell
73 | if "%ERRORLEVEL%"=="0" goto mainEnd
74 |
75 | :fail
76 | rem Set variable GRADLE_EXIT_CONSOLE if you need the _script_ return code instead of
77 | rem the _cmd.exe /c_ return code!
78 | if not "" == "%GRADLE_EXIT_CONSOLE%" exit 1
79 | exit /b 1
80 |
81 | :mainEnd
82 | if "%OS%"=="Windows_NT" endlocal
83 |
84 | :omega
85 |
--------------------------------------------------------------------------------
/demo_android_ncnn/settings.gradle:
--------------------------------------------------------------------------------
1 | include ':app'
2 | rootProject.name='NanoDet'
3 |
--------------------------------------------------------------------------------
/demo_libtorch/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | cmake_minimum_required(VERSION 3.4.1)
2 | set(CMAKE_CXX_STANDARD 14)
3 |
4 | project(nanodet_demo)
5 |
6 | find_package(OpenCV REQUIRED)
7 | find_package(Torch REQUIRED)
8 | set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${TORCH_CXX_FLAGS}")
9 |
10 | include_directories(
11 | ${OpenCV_INCLUDE_DIRS}
12 | ${CMAKE_CURRENT_SOURCE_DIR}
13 | ${CMAKE_CURRENT_BINARY_DIR}
14 | )
15 |
16 | add_executable(nanodet_demo main.cpp nanodet_libtorch.cpp)
17 |
18 | target_link_libraries(
19 | nanodet_demo
20 | ${TORCH_LIBRARIES}
21 | ${OpenCV_LIBS}
22 | )
23 |
24 | if (MSVC)
25 | file(GLOB TORCH_DLLS "${TORCH_INSTALL_PREFIX}/lib/*.dll")
26 | add_custom_command(TARGET nanodet_demo
27 | POST_BUILD
28 | COMMAND ${CMAKE_COMMAND} -E copy_if_different
29 | ${TORCH_DLLS}
30 | $<TARGET_FILE_DIR:nanodet_demo>)
31 | endif (MSVC)
--------------------------------------------------------------------------------
/demo_libtorch/README.md:
--------------------------------------------------------------------------------
1 | # NanoDet TorchScript / LibTorch Demo
2 |
3 | This folder provides NanoDet inference code using LibTorch.
4 |
5 | ## Install dependencies
6 |
7 | This project needs OpenCV and CMake to work.
8 |
9 | Install CMake and OpenCV using a package manager of your choice. For example, the following command installs both on Ubuntu:
10 |
11 | ```bash
12 | sudo apt install cmake libopencv-dev
13 | ```
14 |
15 | Also, you'll need to download LibTorch. Refer to [this page](https://pytorch.org/cppdocs/installing.html) for more info.
16 |
17 | ## Convert model
18 |
19 | Export TorchScript model using `tools/export_torchscript.py`:
20 |
21 | ```shell
22 | python ./tools/export_torchscript.py --cfg_path ${CONFIG_PATH} --model_path ${PYTORCH_MODEL_PATH} --input_shape ${MO}
23 | ```
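After exporting, it can help to sanity-check the TorchScript file from Python before wiring it into the C++ demo. A minimal sketch, assuming a 320x320 input and a file named `nanodet.torchscript.pth` (both are placeholders; adjust them to match what you exported):

```python
import torch

# Hypothetical file name and input size; use whatever export_torchscript.py produced.
model = torch.jit.load("nanodet.torchscript.pth")
model.eval()

dummy = torch.randn(1, 3, 320, 320)  # NCHW, same shape as the export's dummy input
with torch.no_grad():
    out = model(dummy)
print(type(out))  # inspect the output structure before consuming it from C++
```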
24 | ## Build
25 |
26 | ### Linux
27 | ```shell
28 | mkdir build
29 | cd build
30 | cmake -DCMAKE_PREFIX_PATH=/absolute/path/to/libtorch ..
31 | make
32 | ```
--------------------------------------------------------------------------------
/demo_libtorch/nanodet_libtorch.h:
--------------------------------------------------------------------------------
1 | #include <opencv2/core/core.hpp>
2 | #include <torch/script.h>
3 |
4 |
5 | typedef struct BoxInfo
6 | {
7 | float x1;
8 | float y1;
9 | float x2;
10 | float y2;
11 | float score;
12 | int label;
13 | } BoxInfo;
14 |
15 | class NanoDet
16 | {
17 | public:
18 | NanoDet(const char* model_path);
19 | ~NanoDet();
20 | torch::jit::script::Module Net;
21 | std::vector<BoxInfo> detect(cv::Mat image, float score_threshold, float nms_threshold);
22 |
23 | private:
24 | torch::Tensor preprocess(cv::Mat& image);
25 | void decode_infer(torch::Tensor& cls_pred, torch::Tensor& dis_pred, int stage_idx, float threshold, std::vector<std::vector<BoxInfo>>& results);
26 | BoxInfo disPred2Bbox(const float*& dfl_det, int label, float score, int x, int y, int stride);
27 | static void nms(std::vector<BoxInfo>& result, float nms_threshold);
28 | std::vector<int> strides_{ 8, 16, 32 };
29 | int input_size_ = 320;
30 | int num_class_ = 80;
31 | int reg_max_ = 7;
32 |
33 | };
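For reference, the `disPred2Bbox` and `reg_max_` members above implement NanoDet's distribution-style box decoding: each side of the box is predicted as a distribution over `reg_max + 1` bins, and the decoded distance is its expectation scaled by the stride. A minimal NumPy sketch of that idea (not the repo's C++ code):

```python
import numpy as np

def dis_pred_to_bbox(dfl_det, cx, cy, stride, reg_max=7):
    # Decode one cell's 4 * (reg_max + 1) distance logits into an (x1, y1, x2, y2) box.
    # cx, cy are the cell center coordinates in input-image pixels.
    distances = []
    for side in range(4):  # left, top, right, bottom
        logits = np.asarray(dfl_det[side * (reg_max + 1):(side + 1) * (reg_max + 1)])
        prob = np.exp(logits - logits.max())
        prob /= prob.sum()                                    # softmax over the bins
        distances.append(float((prob * np.arange(reg_max + 1)).sum()) * stride)
    l, t, r, b = distances
    return cx - l, cy - t, cx + r, cy + b
```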
--------------------------------------------------------------------------------
/demo_mnn/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | cmake_minimum_required(VERSION 3.9)
2 | project(nanodet-mnn)
3 |
4 | set(CMAKE_CXX_STANDARD 17)
5 |
6 | # find_package(OpenCV REQUIRED PATHS "/work/dependence/opencv/opencv-3.4.3/build")
7 | find_package(OpenCV REQUIRED)
8 | include_directories(
9 | mnn/include
10 | .
11 | )
12 |
13 | link_directories(mnn/lib)
14 |
15 | add_executable(nanodet-mnn main.cpp nanodet_mnn.cpp)
16 | target_link_libraries(nanodet-mnn MNN ${OpenCV_LIBS})
17 |
--------------------------------------------------------------------------------
/demo_mnn/README.md:
--------------------------------------------------------------------------------
1 | # NanoDet MNN Demo
2 |
3 | This folder provides NanoDet inference code using
4 | [Alibaba's MNN framework](https://github.com/alibaba/MNN). Most of the implementation in
5 | this folder is the same as *demo_ncnn*.
6 |
7 | ## Install MNN
8 |
9 | ### Python library
10 |
11 | Just run:
12 |
13 | ``` shell
14 | pip install MNN
15 | ```
16 |
17 | ### C++ library
18 |
19 | Please follow the [official document](https://www.yuque.com/mnn/en/build_linux) to build MNN engine.
20 |
21 | ## Convert model
22 |
23 | 1. Export ONNX model
24 |
25 | ```shell
26 | python ./tools/export_onnx.py
27 | ```
28 |
29 | 2. Use *onnx-simplifier* to simplify it
30 |
31 | ``` shell
32 | python -m onnxsim ./output.onnx sim.onnx
33 | ```
34 |
35 | 3. Convert to MNN
36 |
37 | ``` shell
38 | python -m MNN.tools.mnnconvert -f ONNX --modelFile sim.onnx --MNNModel nanodet-320.mnn
39 | ```
40 |
41 | Note that the input size does not have to be 320; it can be any integer multiple of the strides,
42 | since NanoDet is anchor-free. Adapt the shape of `dummy_input` in *./tools/export_onnx.py* to get ONNX and MNN models
43 | with different input sizes. A quick size check is sketched below.
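For instance, a quick compatibility check for a candidate input size (the heads run at strides 8/16/32, so the input must be a multiple of 32) might look like:

```python
def check_input_size(size, strides=(8, 16, 32)):
    # The detection heads downsample by these strides, so the input
    # must divide evenly by the largest one.
    assert size % max(strides) == 0, f"{size} is not a multiple of {max(strides)}"
    return size

check_input_size(320)  # ok
check_input_size(416)  # ok
```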
44 |
45 | Converted models are available on [Baidu Disk](https://pan.baidu.com/s/1DE4_yo0xez6Wd95xv7NnDQ) (extraction code: *5mfa*) and
46 | [Google Drive](https://drive.google.com/drive/folders/1dEdAXkof_lCusYBNrgbGzdLFZbDPMiFn?usp=sharing).
47 |
48 | ## Build
49 |
50 | The Python script *demo_mnn.py* runs directly and independently of the main NanoDet repo.
51 | `NanoDetONNX` and `NanoDetTorch` are two classes used to check that MNN inference results
52 | match the ONNX and PyTorch models. They can be removed with no side effects.
53 |
54 | For the C++ code, replace `libMNN.so` under *./mnn/lib* with the one you just compiled, modify the OpenCV path in the CMake file,
55 | and run:
56 |
57 | ``` shell
58 | mkdir build && cd build
59 | cmake ..
60 | make
61 | ```
62 |
63 | Note that a flag in `main.cpp` controls whether to show the detection result or save it into a folder.
64 |
65 | ``` c++
66 | #define __SAVE_RESULT__ // if defined, save drawn results to ../results; otherwise show them in a window
67 | ```
68 |
69 | ## Run
70 |
71 | ### Python
72 |
73 | `demo_mnn.py` provides an inference class `NanoDetMNN` that combines preprocessing, post-processing, and visualization.
74 | It can also be used from the command line as follows:
75 |
76 | ```shell
77 | demo_mnn.py [-h] [--model_path MODEL_PATH] [--cfg_path CFG_PATH]
78 | [--img_fold IMG_FOLD] [--result_fold RESULT_FOLD]
79 | [--input_shape INPUT_SHAPE INPUT_SHAPE]
80 | [--backend {MNN,ONNX,torch}]
81 | ```
82 |
83 | For example:
84 |
85 | ``` shell
86 | # run MNN 320 model
87 | python ./demo_mnn.py --model_path ../model/nanodet-320.mnn --img_fold ../imgs --result_fold ../results
88 | # run MNN 160 model
89 | python ./demo_mnn.py --model_path ../model/nanodet-160.mnn --input_shape 160 160 --backend MNN
90 | # run onnx model
91 | python ./demo_mnn.py --model_path ../model/sim.onnx --backend ONNX
92 | # run Pytorch model
93 | python ./demo_mnn.py --model_path ../model/nanodet_m.pth ../../config/nanodet-m.yml --backend torch
94 | ```
95 |
96 | ### C++
97 |
98 | The C++ inference interface is the same as the NCNN demo. To detect images in a folder, run:
99 |
100 | ``` shell
101 | ./nanodet-mnn "1" "../imgs/*.jpg"
102 | ```
103 |
104 | For a speed benchmark, run:
105 |
106 | ``` shell
107 | ./nanodet-mnn "3" "0"
108 | ```
109 |
110 | ## Reference
111 |
112 | [Ultra-Light-Fast-Generic-Face-Detector-1MB](https://github.com/Linzaer/Ultra-Light-Fast-Generic-Face-Detector-1MB/tree/master/MNN)
113 |
114 | [ONNX Simplifier](https://github.com/daquexian/onnx-simplifier)
115 |
116 | [NanoDet NCNN](https://github.com/RangiLyu/nanodet/tree/main/demo_ncnn)
117 |
118 | [MNN](https://github.com/alibaba/MNN)
119 |
120 | ## Example results
121 |
122 | 
123 | 
124 |
--------------------------------------------------------------------------------
/demo_mnn/imgs/000252.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_mnn/imgs/000252.jpg
--------------------------------------------------------------------------------
/demo_mnn/imgs/000258.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_mnn/imgs/000258.jpg
--------------------------------------------------------------------------------
/demo_mnn/nanodet_mnn.hpp:
--------------------------------------------------------------------------------
1 | #ifndef __NanoDet_H__
2 | #define __NanoDet_H__
3 |
4 | #pragma once
5 |
6 | #include "Interpreter.hpp"
7 |
8 | #include "MNNDefine.h"
9 | #include "Tensor.hpp"
10 | #include "ImageProcess.hpp"
11 | #include <opencv2/opencv.hpp>
12 | #include <algorithm>
13 | #include <chrono>
14 | #include <iostream>
15 | #include <memory>
16 | #include <string>
17 | #include <vector>
18 |
19 |
20 | typedef struct HeadInfo_
21 | {
22 | std::string cls_layer;
23 | std::string dis_layer;
24 | int stride;
25 | } HeadInfo;
26 |
27 | typedef struct BoxInfo_
28 | {
29 | float x1;
30 | float y1;
31 | float x2;
32 | float y2;
33 | float score;
34 | int label;
35 | } BoxInfo;
36 |
37 | class NanoDet {
38 | public:
39 | NanoDet(const std::string &mnn_path,
40 | int input_width, int input_length, int num_thread_ = 4, float score_threshold_ = 0.5, float nms_threshold_ = 0.3);
41 |
42 | ~NanoDet();
43 |
44 | int detect(cv::Mat &img, std::vector<BoxInfo> &result_list);
45 | std::string get_label_str(int label);
46 |
47 | private:
48 | void decode_infer(MNN::Tensor *cls_pred, MNN::Tensor *dis_pred, int stride, float threshold, std::vector<std::vector<BoxInfo>> &results);
49 | BoxInfo disPred2Bbox(const float *&dfl_det, int label, float score, int x, int y, int stride);
50 | void nms(std::vector<BoxInfo> &input_boxes, float NMS_THRESH);
51 |
52 | private:
53 |
54 | std::shared_ptr<MNN::Interpreter> NanoDet_interpreter;
55 | MNN::Session *NanoDet_session = nullptr;
56 | MNN::Tensor *input_tensor = nullptr;
57 |
58 | int num_thread;
59 | int image_w;
60 | int image_h;
61 |
62 | int in_w = 320;
63 | int in_h = 320;
64 |
65 | float score_threshold;
66 | float nms_threshold;
67 |
68 | const float mean_vals[3] = { 103.53f, 116.28f, 123.675f };
69 | const float norm_vals[3] = { 0.017429f, 0.017507f, 0.017125f };
70 |
71 | const int num_class = 80;
72 | const int reg_max = 7;
73 |
74 | std::vector<HeadInfo> heads_info{
75 | // cls_pred|dis_pred|stride
76 | {"cls_pred_stride_8", "dis_pred_stride_8", 8},
77 | {"cls_pred_stride_16", "dis_pred_stride_16", 16},
78 | {"cls_pred_stride_32", "dis_pred_stride_32", 32},
79 | };
80 |
81 | std::vector<std::string>
82 | labels{"person", "bicycle", "car", "motorcycle", "airplane", "bus", "train", "truck", "boat", "traffic light",
83 | "fire hydrant", "stop sign", "parking meter", "bench", "bird", "cat", "dog", "horse", "sheep", "cow",
84 | "elephant", "bear", "zebra", "giraffe", "backpack", "umbrella", "handbag", "tie", "suitcase", "frisbee",
85 | "skis", "snowboard", "sports ball", "kite", "baseball bat", "baseball glove", "skateboard", "surfboard",
86 | "tennis racket", "bottle", "wine glass", "cup", "fork", "knife", "spoon", "bowl", "banana", "apple",
87 | "sandwich", "orange", "broccoli", "carrot", "hot dog", "pizza", "donut", "cake", "chair", "couch",
88 | "potted plant", "bed", "dining table", "toilet", "tv", "laptop", "mouse", "remote", "keyboard", "cell phone",
89 | "microwave", "oven", "toaster", "sink", "refrigerator", "book", "clock", "vase", "scissors", "teddy bear",
90 | "hair drier", "toothbrush"};
91 | };
92 |
93 | template <typename _Tp>
94 | int activation_function_softmax(const _Tp *src, _Tp *dst, int length);
95 |
96 | inline float fast_exp(float x);
97 | inline float sigmoid(float x);
98 |
99 | #endif // __NanoDet_H__
100 |
--------------------------------------------------------------------------------
/demo_mnn/results/000252.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_mnn/results/000252.jpg
--------------------------------------------------------------------------------
/demo_mnn/results/000258.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_mnn/results/000258.jpg
--------------------------------------------------------------------------------
/demo_ncnn/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | cmake_minimum_required(VERSION 3.4.1)
2 | set(CMAKE_CXX_STANDARD 17)
3 |
4 | project(nanodet_demo)
5 |
6 | find_package(OpenMP REQUIRED)
7 | if(OPENMP_FOUND)
8 | message("OPENMP FOUND")
9 | set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${OpenMP_C_FLAGS}")
10 | set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${OpenMP_CXX_FLAGS}")
11 | set(CMAKE_EXE_LINKER_FLAGS "${CMAKE_EXE_LINKER_FLAGS} ${OpenMP_EXE_LINKER_FLAGS}")
12 | endif()
13 |
14 | find_package(OpenCV REQUIRED)
15 |
16 | find_package(ncnn REQUIRED)
17 | if(NOT TARGET ncnn)
18 | message(WARNING "ncnn NOT FOUND! Please set ncnn_DIR environment variable")
19 | else()
20 | message("ncnn FOUND ")
21 | endif()
22 |
23 | include_directories(
24 | ${OpenCV_INCLUDE_DIRS}
25 | ${CMAKE_CURRENT_SOURCE_DIR}
26 | ${CMAKE_CURRENT_BINARY_DIR}
27 | )
28 |
29 |
30 | add_executable(nanodet_demo main.cpp nanodet.cpp)
31 |
32 | target_link_libraries(
33 | nanodet_demo
34 | ncnn
35 | ${OpenCV_LIBS}
36 | )
--------------------------------------------------------------------------------
/demo_ncnn/README.md:
--------------------------------------------------------------------------------
1 | # NanoDet NCNN Demo
2 |
3 | This project provides NanoDet image inference, webcam inference and benchmark using
4 | [Tencent's NCNN framework](https://github.com/Tencent/ncnn).
5 |
6 | # How to build
7 |
8 | ## Windows
9 | ### Step1.
10 | Download and Install Visual Studio from https://visualstudio.microsoft.com/vs/community/
11 |
12 | ### Step2.
13 | Download and install OpenCV from https://github.com/opencv/opencv/releases
14 |
15 | ### Step3(Optional).
16 | Download and install Vulkan SDK from https://vulkan.lunarg.com/sdk/home
17 |
18 | ### Step4.
19 | Clone NCNN repository
20 |
21 | ``` shell script
22 | git clone --recursive https://github.com/Tencent/ncnn.git
23 | ```
24 | Build NCNN following this tutorial: [Build for Windows x64 using VS2017](https://github.com/Tencent/ncnn/wiki/how-to-build#build-for-windows-x64-using-visual-studio-community-2017)
25 |
26 | ### Step5.
27 |
28 | Add `ncnn_DIR` = `YOUR_NCNN_PATH/build/install/lib/cmake/ncnn` to system environment variables.
29 |
30 | Build project: Open x64 Native Tools Command Prompt for VS 2019 or 2017
31 |
32 | ``` cmd
33 | cd <this-folder>
34 | mkdir -p build
35 | cd build
36 | cmake ..
37 | msbuild nanodet_demo.vcxproj /p:configuration=release /p:platform=x64
38 | ```
39 |
40 | ## Linux
41 |
42 | ### Step1.
43 | Build and install OpenCV from https://github.com/opencv/opencv
44 |
45 | ### Step2(Optional).
46 | Download Vulkan SDK from https://vulkan.lunarg.com/sdk/home
47 |
48 | ### Step3.
49 | Clone NCNN repository
50 |
51 | ``` shell script
52 | git clone --recursive https://github.com/Tencent/ncnn.git
53 | ```
54 |
55 | Build NCNN following this tutorial: [Build for Linux / NVIDIA Jetson / Raspberry Pi](https://github.com/Tencent/ncnn/wiki/how-to-build#build-for-linux)
56 |
57 | ### Step4.
58 |
59 | Set environment variables. Run:
60 |
61 | ``` shell script
62 | export ncnn_DIR=YOUR_NCNN_PATH/build/install/lib/cmake/ncnn
63 | ```
64 |
65 | Build project
66 |
67 | ``` shell script
68 | cd <this-folder>
69 | mkdir build
70 | cd build
71 | cmake ..
72 | make
73 | ```
74 |
75 | # Run demo
76 |
77 | Download NanoDet ncnn model.
78 | * [NanoDet ncnn model download link](https://github.com/RangiLyu/nanodet/releases/download/v0.0.1/nanodet_ncnn_model.zip)
79 |
80 | Copy nanodet_m.param and nanodet_m.bin to demo program folder.
81 |
82 | ## Webcam
83 |
84 | ```shell script
85 | nanodet_demo 0 0
86 | ```
87 |
88 | ## Inference images
89 |
90 | ```shell script
91 | nanodet_demo 1 IMAGE_FOLDER/*.jpg
92 | ```
93 |
94 | ## Inference video
95 |
96 | ```shell script
97 | nanodet_demo 2 VIDEO_PATH
98 | ```
99 |
100 | ## Benchmark
101 |
102 | ```shell script
103 | nanodet_demo 3 0
104 | ```
105 | 
106 | ****
107 |
108 | Notice:
109 |
110 | If the benchmark runs slowly, try limiting the number of OpenMP threads.
111 |
112 | Linux:
113 |
114 | ```shell script
115 | export OMP_THREAD_LIMIT=4
116 | ```
117 |
--------------------------------------------------------------------------------
/demo_ncnn/benchmark.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/demo_ncnn/benchmark.jpg
--------------------------------------------------------------------------------
/demo_ncnn/nanodet.h:
--------------------------------------------------------------------------------
1 | //
2 | // Create by RangiLyu
3 | // 2020 / 10 / 2
4 | //
5 |
6 | #ifndef NANODET_H
7 | #define NANODET_H
8 |
9 | #include <opencv2/core/core.hpp>
10 | #include <net.h>
11 |
12 | typedef struct HeadInfo
13 | {
14 | std::string cls_layer;
15 | std::string dis_layer;
16 | int stride;
17 | };
18 |
19 | typedef struct BoxInfo
20 | {
21 | float x1;
22 | float y1;
23 | float x2;
24 | float y2;
25 | float score;
26 | int label;
27 | } BoxInfo;
28 |
29 | class NanoDet
30 | {
31 | public:
32 | NanoDet(const char* param, const char* bin, bool useGPU);
33 |
34 | ~NanoDet();
35 |
36 | static NanoDet* detector;
37 | ncnn::Net* Net;
38 | static bool hasGPU;
39 |
40 | std::vector<HeadInfo> heads_info{
41 | // cls_pred|dis_pred|stride
42 | {"cls_pred_stride_8", "dis_pred_stride_8", 8},
43 | {"cls_pred_stride_16", "dis_pred_stride_16", 16},
44 | {"cls_pred_stride_32", "dis_pred_stride_32", 32},
45 | };
46 |
47 | std::vector<BoxInfo> detect(cv::Mat image, float score_threshold, float nms_threshold);
48 |
49 | std::vector<std::string> labels{ "person", "bicycle", "car", "motorcycle", "airplane", "bus", "train", "truck", "boat", "traffic light",
50 | "fire hydrant", "stop sign", "parking meter", "bench", "bird", "cat", "dog", "horse", "sheep", "cow",
51 | "elephant", "bear", "zebra", "giraffe", "backpack", "umbrella", "handbag", "tie", "suitcase", "frisbee",
52 | "skis", "snowboard", "sports ball", "kite", "baseball bat", "baseball glove", "skateboard", "surfboard",
53 | "tennis racket", "bottle", "wine glass", "cup", "fork", "knife", "spoon", "bowl", "banana", "apple",
54 | "sandwich", "orange", "broccoli", "carrot", "hot dog", "pizza", "donut", "cake", "chair", "couch",
55 | "potted plant", "bed", "dining table", "toilet", "tv", "laptop", "mouse", "remote", "keyboard", "cell phone",
56 | "microwave", "oven", "toaster", "sink", "refrigerator", "book", "clock", "vase", "scissors", "teddy bear",
57 | "hair drier", "toothbrush" };
58 | private:
59 | void preprocess(cv::Mat& image, ncnn::Mat& in);
60 | void decode_infer(ncnn::Mat& cls_pred, ncnn::Mat& dis_pred, int stride, float threshold, std::vector<std::vector<BoxInfo>>& results);
61 | BoxInfo disPred2Bbox(const float*& dfl_det, int label, float score, int x, int y, int stride);
62 | static void nms(std::vector<BoxInfo>& result, float nms_threshold);
63 | int input_size[2] = {320, 320};
64 | int num_class = 80;
65 | int reg_max = 7;
66 |
67 | };
68 |
69 |
70 | #endif //NANODET_H
71 |
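The `nms` declared in this header is a standard greedy IoU suppression over score-sorted boxes. A small Python sketch of the same idea (not the repo's C++ code), operating on `(x1, y1, x2, y2, score)` tuples:

```python
def iou(a, b):
    # Intersection-over-union of two (x1, y1, x2, y2, ...) boxes.
    ix1, iy1 = max(a[0], b[0]), max(a[1], b[1])
    ix2, iy2 = min(a[2], b[2]), min(a[3], b[3])
    inter = max(0.0, ix2 - ix1) * max(0.0, iy2 - iy1)
    area_a = (a[2] - a[0]) * (a[3] - a[1])
    area_b = (b[2] - b[0]) * (b[3] - b[1])
    return inter / (area_a + area_b - inter + 1e-9)

def nms(boxes, iou_threshold):
    # boxes: list of (x1, y1, x2, y2, score); returns the kept boxes.
    kept = []
    for box in sorted(boxes, key=lambda b: b[4], reverse=True):
        if all(iou(box, k) <= iou_threshold for k in kept):
            kept.append(box)
    return kept
```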
--------------------------------------------------------------------------------
/demo_openvino/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | cmake_minimum_required(VERSION 3.4.1)
2 | set(CMAKE_CXX_STANDARD 14)
3 |
4 | project(nanodet_demo)
5 |
6 | find_package(OpenCV REQUIRED)
7 | find_package(InferenceEngine REQUIRED)
8 | find_package(ngraph REQUIRED)
9 |
10 | include_directories(
11 | ${OpenCV_INCLUDE_DIRS}
12 | ${CMAKE_CURRENT_SOURCE_DIR}
13 | ${CMAKE_CURRENT_BINARY_DIR}
14 | )
15 |
16 | add_executable(nanodet_demo main.cpp nanodet_openvino.cpp)
17 |
18 | target_link_libraries(
19 | nanodet_demo
20 | ${InferenceEngine_LIBRARIES}
21 | ${NGRAPH_LIBRARIES}
22 | ${OpenCV_LIBS}
23 | )
--------------------------------------------------------------------------------
/demo_openvino/README.md:
--------------------------------------------------------------------------------
1 | # NanoDet OpenVINO Demo
2 |
3 | This folder provides NanoDet inference code using
4 | [Intel's OpenVINO Toolkit](https://software.intel.com/content/www/us/en/develop/tools/openvino-toolkit.html). Most of the implementation in this folder is the same as *demo_ncnn*.
5 |
6 | ## Install OpenVINO Toolkit
7 |
8 | Go to [OpenVINO HomePage](https://software.intel.com/content/www/us/en/develop/tools/openvino-toolkit.html)
9 |
10 | Download a suitable version and install.
11 |
12 | Follow the official Get Started Guides: https://docs.openvinotoolkit.org/latest/get_started_guides.html
13 |
14 | ## Set the Environment Variables
15 |
16 | ### Windows:
17 |
18 | Run this command in cmd (every time before using OpenVINO):
19 | ```cmd
20 | <INSTALL_DIR>\openvino_2021\bin\setupvars.bat
21 | ```
22 |
23 |
24 | Or set the system environment variables once for all:
25 |
26 | Name |Value
27 | :--------------------:|:--------:
28 | INTEL_OPENVINO_DIR | <INSTALL_DIR>\openvino_2021
29 | INTEL_CVSDK_DIR | %INTEL_OPENVINO_DIR%
30 | InferenceEngine_DIR | %INTEL_OPENVINO_DIR%\deployment_tools\inference_engine\share
31 | HDDL_INSTALL_DIR | %INTEL_OPENVINO_DIR%\deployment_tools\inference_engine\external\hddl
32 | ngraph_DIR | %INTEL_OPENVINO_DIR%\deployment_tools\ngraph\cmake
33 |
34 | And add this to ```Path```
35 | ```
36 | %INTEL_OPENVINO_DIR%\deployment_tools\inference_engine\bin\intel64\Debug;%INTEL_OPENVINO_DIR%\deployment_tools\inference_engine\bin\intel64\Release;%HDDL_INSTALL_DIR%\bin;%INTEL_OPENVINO_DIR%\deployment_tools\inference_engine\external\tbb\bin;%INTEL_OPENVINO_DIR%\deployment_tools\ngraph\lib
37 | ```
38 |
39 | ### Linux
40 |
41 | Run this command in your shell (every time before using OpenVINO):
42 |
43 | ```shell
44 | source /opt/intel/openvino_2021/bin/setupvars.sh
45 | ```
46 |
47 | Or edit .bashrc
48 |
49 | ```shell
50 | vi ~/.bashrc
51 | ```
52 |
53 | Add this line to the end of the file
54 |
55 | ```shell
56 | source /opt/intel/openvino_2021/bin/setupvars.sh
57 | ```
58 |
59 | ## Convert model
60 |
61 | 1. Export ONNX model
62 |
63 | ```shell
64 | python ./tools/export_onnx.py --cfg_path ${CONFIG_PATH} --model_path ${PYTORCH_MODEL_PATH}
65 | ```
66 |
67 | 2. Use *onnx-simplifier* to simplify it
68 |
69 | ``` shell
70 | python -m onnxsim ${INPUT_ONNX_MODEL} ${OUTPUT_ONNX_MODEL}
71 | ```
72 |
73 | 3. Convert to OpenVINO
74 |
75 | ``` shell
76 | cd <INSTALL_DIR>/openvino_2021/deployment_tools/model_optimizer
77 | ```
78 |
79 | Install requirements for convert tool
80 |
81 | ```shell
82 | sudo ./install_prerequisites/install_prerequisites_onnx.sh
83 | ```
84 |
85 | Then convert the model. Notice: `mean_values` and `scale_values` should match the normalization settings in your training YAML config file; a helper sketch follows the command.
86 | ```shell
87 | python3 mo_onnx.py --input_model <ONNX_MODEL> --mean_values [103.53,116.28,123.675] --scale_values [57.375,57.12,58.395]
88 | ```
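If you prefer not to copy the values by hand, a small helper can read them from the training config. This is only a sketch and assumes the config stores normalization as `data.train.pipeline.normalize: [[mean], [std]]`, as the stock nanodet-m config does; adjust the keys if yours differs:

```python
import yaml

def mo_normalize_flags(cfg_path):
    # Assumed config layout: data.train.pipeline.normalize = [[mean...], [std...]]
    with open(cfg_path) as f:
        cfg = yaml.safe_load(f)
    mean, std = cfg["data"]["train"]["pipeline"]["normalize"]
    fmt = lambda vals: "[" + ",".join(str(v) for v in vals) + "]"
    return f"--mean_values {fmt(mean)} --scale_values {fmt(std)}"

print(mo_normalize_flags("config/nanodet-m.yml"))
```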
89 |
90 | ## Build
91 |
92 | ### Windows
93 |
94 | ```cmd
95 | <INSTALL_DIR>\openvino_2021\bin\setupvars.bat
96 | mkdir -p build
97 | cd build
98 | cmake ..
99 | msbuild nanodet_demo.vcxproj /p:configuration=release /p:platform=x64
100 | ```
101 |
102 | ### Linux
103 | ```shell
104 | source /opt/intel/openvino_2021/bin/setupvars.sh
105 | mkdir build
106 | cd build
107 | cmake ..
108 | make
109 | ```
110 |
111 |
112 | ## Run demo
113 |
114 | First, move the NanoDet OpenVINO model files to the demo folder. Then run these commands:
115 |
116 | ### Webcam
117 |
118 | ```shell
119 | nanodet_demo 0 0
120 | ```
121 |
122 | ### Inference images
123 |
124 | ```shell
125 | nanodet_demo 1 IMAGE_FOLDER/*.jpg
126 | ```
127 |
128 | ### Inference video
129 |
130 | ```shell
131 | nanodet_demo 2 VIDEO_PATH
132 | ```
133 |
134 | ### Benchmark
135 |
136 | ```shell
137 | nanodet_demo 3 0
138 | ```
139 |
--------------------------------------------------------------------------------
/demo_openvino/nanodet_openvino.h:
--------------------------------------------------------------------------------
1 | //
2 | // Create by RangiLyu
3 | // 2021 / 1 / 12
4 | //
5 |
6 | #ifndef _NANODET_OPENVINO_H_
7 | #define _NANODET_OPENVINO_H_
8 |
9 | #include <string>
10 | #include <opencv2/core.hpp>
11 | #include <inference_engine.hpp>
12 |
13 |
14 | typedef struct HeadInfo
15 | {
16 | std::string cls_layer;
17 | std::string dis_layer;
18 | int stride;
19 | } HeadInfo;
20 |
21 | typedef struct BoxInfo
22 | {
23 | float x1;
24 | float y1;
25 | float x2;
26 | float y2;
27 | float score;
28 | int label;
29 | } BoxInfo;
30 |
31 | class NanoDet
32 | {
33 | public:
34 | NanoDet(const char* param);
35 |
36 | ~NanoDet();
37 |
38 | InferenceEngine::ExecutableNetwork network_;
39 | InferenceEngine::InferRequest infer_request_;
40 | // static bool hasGPU;
41 |
42 | std::vector<HeadInfo> heads_info_{
43 | // cls_pred|dis_pred|stride
44 | {"cls_pred_stride_8", "dis_pred_stride_8", 8},
45 | {"cls_pred_stride_16", "dis_pred_stride_16", 16},
46 | {"cls_pred_stride_32", "dis_pred_stride_32", 32},
47 | };
48 |
49 | std::vector<BoxInfo> detect(cv::Mat image, float score_threshold, float nms_threshold);
50 |
51 | private:
52 | void preprocess(cv::Mat& image, InferenceEngine::Blob::Ptr& blob);
53 | void decode_infer(const float*& cls_pred, const float*& dis_pred, int stride, float threshold, std::vector<std::vector<BoxInfo>>& results);
54 | BoxInfo disPred2Bbox(const float*& dfl_det, int label, float score, int x, int y, int stride);
55 | static void nms(std::vector<BoxInfo>& result, float nms_threshold);
56 | std::string input_name_;
57 | int input_size_ = 320;
58 | int num_class_ = 80;
59 | int reg_max_ = 7;
60 |
61 | };
62 |
63 |
64 | #endif //_NANODET_OPENVINO_H_
--------------------------------------------------------------------------------
/docs/imgs/Android_demo.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/docs/imgs/Android_demo.jpg
--------------------------------------------------------------------------------
/docs/imgs/Model_arch.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/docs/imgs/Model_arch.png
--------------------------------------------------------------------------------
/docs/imgs/Title.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cxnaive/nanodet-TensorRT/56ef43cef8a71202cab7536798b479382742c8b9/docs/imgs/Title.jpg
--------------------------------------------------------------------------------
/nanodet/data/collate.py:
--------------------------------------------------------------------------------
1 | import torch
2 | import torch.nn.functional as F
3 |
4 | import re
5 | from torch._six import container_abcs, string_classes, int_classes
6 |
7 |
8 | np_str_obj_array_pattern = re.compile(r'[SaUO]')
9 |
10 |
11 | default_collate_err_msg_format = (
12 | "default_collate: batch must contain tensors, numpy arrays, numbers, "
13 | "dicts or lists; found {}")
14 |
15 |
16 | def collate_function(batch):
17 | r"""Puts each data field into a tensor with outer dimension batch size"""
18 |
19 | elem = batch[0]
20 | elem_type = type(elem)
21 | if isinstance(elem, torch.Tensor):
22 | out = None
23 | # TODO: support pytorch < 1.3
24 | # if torch.utils.data.get_worker_info() is not None:
25 | # # If we're in a background process, concatenate directly into a
26 | # # shared memory tensor to avoid an extra copy
27 | # numel = sum([x.numel() for x in batch])
28 | # storage = elem.storage()._new_shared(numel)
29 | # out = elem.new(storage)
30 | return torch.stack(batch, 0, out=out)
31 | elif elem_type.__module__ == 'numpy' and elem_type.__name__ != 'str_' \
32 | and elem_type.__name__ != 'string_':
33 | elem = batch[0]
34 | if elem_type.__name__ == 'ndarray':
35 | # array of string classes and object
36 | if np_str_obj_array_pattern.search(elem.dtype.str) is not None:
37 | raise TypeError(default_collate_err_msg_format.format(elem.dtype))
38 |
39 | # return collate_function([torch.as_tensor(b) for b in batch])
40 | return batch
41 | elif elem.shape == (): # scalars
42 | # return torch.as_tensor(batch)
43 | return batch
44 | elif isinstance(elem, float):
45 | return torch.tensor(batch, dtype=torch.float64)
46 | elif isinstance(elem, int_classes):
47 | return torch.tensor(batch)
48 | elif isinstance(elem, string_classes):
49 | return batch
50 | elif isinstance(elem, container_abcs.Mapping):
51 | return {key: collate_function([d[key] for d in batch]) for key in elem}
52 | elif isinstance(elem, tuple) and hasattr(elem, '_fields'): # namedtuple
53 | return elem_type(*(collate_function(samples) for samples in zip(*batch)))
54 | elif isinstance(elem, container_abcs.Sequence):
55 | transposed = zip(*batch)
56 | return [collate_function(samples) for samples in transposed]
57 |
58 | raise TypeError(default_collate_err_msg_format.format(elem_type))
59 |
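A minimal usage sketch (not part of the file above): collate_function is meant to be passed to a PyTorch DataLoader as collate_fn. The toy dataset below is hypothetical, and the sketch assumes a PyTorch version that still ships torch._six, as imported at the top of this file.

import torch
from torch.utils.data import DataLoader, Dataset

from nanodet.data.collate import collate_function


class ToyDataset(Dataset):
    # Hypothetical stand-in: each sample is a dict, like the meta dicts produced by the data pipeline.
    def __len__(self):
        return 4

    def __getitem__(self, idx):
        return {'img': torch.rand(3, 32, 32), 'img_info': {'id': idx}}


loader = DataLoader(ToyDataset(), batch_size=2, collate_fn=collate_function)
batch = next(iter(loader))
print(batch['img'].shape)   # torch.Size([2, 3, 32, 32]) -- tensors are stacked
print(batch['img_info'])    # {'id': tensor([0, 1])}     -- nested dicts are collated recursively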
--------------------------------------------------------------------------------
/nanodet/data/dataset/__init__.py:
--------------------------------------------------------------------------------
1 | import copy
2 | from .coco import CocoDataset
3 | from .xml_dataset import XMLDataset
4 |
5 |
6 | def build_dataset(cfg, mode):
7 | dataset_cfg = copy.deepcopy(cfg)
8 | name = dataset_cfg.pop('name')
9 | if name == 'coco':
10 | return CocoDataset(mode=mode, **dataset_cfg)
11 | if name == 'xml_dataset':
12 | return XMLDataset(mode=mode, **dataset_cfg)
13 | else:
14 | raise NotImplementedError('Unknown dataset type!')
15 |
--------------------------------------------------------------------------------
/nanodet/data/transform/__init__.py:
--------------------------------------------------------------------------------
1 |
2 | from .pipeline import Pipeline
--------------------------------------------------------------------------------
/nanodet/data/transform/color.py:
--------------------------------------------------------------------------------
1 | import numpy as np
2 | import cv2
3 | import random
4 |
5 |
6 | # def random_brightness(img, delta):
7 | # img += random.uniform(-delta, delta)
8 | # return img
9 |
10 | #Gamma trans
11 | def gamma_trans(img, gamma):  # apply gamma correction
12 |     gamma_table = [np.power(x / 255.0, gamma) * 255.0 for x in range(256)]  # build the mapping table
13 |     gamma_table = np.round(np.array(gamma_table)).astype(np.uint8)  # round to integer pixel values
14 |     return cv2.LUT(img, gamma_table)  # remap the image through the lookup table; an adaptive variant could derive gamma from image brightness
15 | 
16 | def random_gamma(img, gamma_low, gamma_up):
17 |     gamma = random.uniform(gamma_low, gamma_up)
18 | return gamma_trans(img,gamma)
19 |
20 |
21 | def augment_hsv(img, hgain=0.5, sgain=0.5, vgain=0.5):
22 | r = np.random.uniform(-1, 1, 3) * [hgain, sgain, vgain] + 1 # random gains
23 | hue, sat, val = cv2.split(cv2.cvtColor(img, cv2.COLOR_BGR2HSV))
24 | dtype = img.dtype # uint8
25 |
26 | x = np.arange(0, 256, dtype=np.int16)
27 | lut_hue = ((x * r[0]) % 180).astype(dtype)
28 | lut_sat = np.clip(x * r[1], 0, 255).astype(dtype)
29 | lut_val = np.clip(x * r[2], 0, 255).astype(dtype)
30 |
31 | img_hsv = cv2.merge((cv2.LUT(hue, lut_hue), cv2.LUT(sat, lut_sat), cv2.LUT(val, lut_val))).astype(dtype)
32 | cv2.cvtColor(img_hsv, cv2.COLOR_HSV2BGR, dst=img) # no return needed
33 |
34 | def normalize(meta, mean, std):
35 | img = meta['img'].astype(np.float32)
36 | mean = np.array(mean, dtype=np.float64).reshape(1, -1)
37 | stdinv = 1 / np.array(std, dtype=np.float64).reshape(1, -1)
38 | cv2.subtract(img, mean, img)
39 | cv2.multiply(img, stdinv, img)
40 | meta['img'] = img
41 | return meta
42 |
43 |
44 | def _normalize(img, mean, std):
45 | img = img.astype(np.float32)
46 | mean = np.array(mean, dtype=np.float32).reshape(1, 1, 3)
47 | std = np.array(std, dtype=np.float32).reshape(1, 1, 3)
48 | img = (img - mean) / std
49 | return img
50 |
51 |
52 | def color_aug_and_norm(meta, kwargs):
53 | img = meta['img'] #.astype(np.float32) / 255
54 | if 'gamma' in kwargs and random.randint(0, 1):
55 | img = random_gamma(img, *kwargs['gamma'])
56 | #print(kwargs)
57 | if 'hsv_h' in kwargs and 'hsv_s' in kwargs and 'hsv_v' in kwargs:
58 | hgain=kwargs['hsv_h']
59 | sgain=kwargs['hsv_s']
60 | vgain=kwargs['hsv_v']
61 | augment_hsv(img,hgain,sgain,vgain)
62 | # if 'brightness' in kwargs and random.randint(0, 1):
63 | # hsv_img = random_brightness(hsv_img, kwargs['brightness'])
64 |
65 | # if 'saturation' in kwargs and random.randint(0, 1):
66 | # hsv_img = random_saturation(hsv_img, *kwargs['saturation'])
67 |
68 | # if 'contrast' in kwargs and random.randint(0, 1):
69 | # img = random_contrast(img, *kwargs['contrast'])
70 | # cv2.imshow('trans', img)
71 | # cv2.waitKey(0)
72 | # img = _normalize(img, *kwargs['normalize'])
73 | meta['img'] = img.astype(np.float32) / 255.0
74 | return meta
75 |
76 |
77 |
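A minimal sketch of calling the color stage directly (not part of the file above). The dict keys are the ones color_aug_and_norm actually reads; the numeric values are only illustrative.

import numpy as np

from nanodet.data.transform.color import color_aug_and_norm

meta = {'img': (np.random.rand(320, 320, 3) * 255).astype(np.uint8)}
kwargs = {'gamma': [0.6, 1.4], 'hsv_h': 0.014, 'hsv_s': 0.68, 'hsv_v': 0.36}
meta = color_aug_and_norm(meta, kwargs)
# The image comes back as float32 scaled to [0, 1].
print(meta['img'].dtype, float(meta['img'].min()), float(meta['img'].max()))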
--------------------------------------------------------------------------------
/nanodet/data/transform/mosaic.py:
--------------------------------------------------------------------------------
1 | import numpy as np
2 |
3 |
4 | def merge_box(box1, box2):
5 | xl = max(box1[0],box2[0])
6 | xr = min(box1[2],box2[2])
7 | yl = max(box1[1],box2[1])
8 | yr = min(box1[3],box2[3])
9 | if xl >= xr or yl >= yr:
10 | return None
11 | else:
12 | area_before = (box1[2] - box1[0]) * (box1[3] - box1[1])
13 | area_after = (xr - xl) * (yr - yl)
14 |
15 | #eliminate incomplete boxes
16 | if area_after / area_before < 0.2 or (xr - xl) / (box1[2] - box1[0]) < 0.4 or (yr - yl) / (box1[3] - box1[1]) < 0.4:
17 | return None
18 | return [xl,yl,xr,yr]
19 |
20 |
21 | def merge_bboxes(bboxes, labels, cutx, cuty, im_w, im_h):
22 | merge_bbox = []
23 | merge_label = []
24 | for i in range(len(bboxes)):
25 | for j in range(len(bboxes[i])):
26 | # print(labels[i][j], bboxes[i][j])
27 | if i == 0:
28 | box_now = merge_box(bboxes[i][j], [0, 0, cutx, cuty])
29 | if i == 1:
30 | box_now = merge_box(bboxes[i][j], [0, cuty, cutx, im_h])
31 | if i == 2:
32 | box_now = merge_box(bboxes[i][j], [cutx, cuty, im_w, im_h])
33 | if i == 3:
34 | box_now = merge_box(bboxes[i][j], [cutx, 0, im_w, cuty])
35 |
36 | if box_now == None:
37 | continue
38 |
39 | merge_bbox.append(box_now)
40 | merge_label.append(labels[i][j])
41 | # print(merge_bbox)
42 | if len(merge_bbox) == 0:
43 | return [], []
44 | else:
45 | return merge_label, merge_bbox
46 |
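A small worked example of the clipping rule in merge_box (values chosen for illustration):

from nanodet.data.transform.mosaic import merge_box

# Box fully inside the quadrant [0, 0, 100, 100]: kept as-is.
print(merge_box([10, 10, 50, 50], [0, 0, 100, 100]))   # [10, 10, 50, 50]

# After clipping to [40, 0, 100, 100] only 25% of the original width survives (< 40%), so the box is dropped.
print(merge_box([10, 10, 50, 50], [40, 0, 100, 100]))  # None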
--------------------------------------------------------------------------------
/nanodet/data/transform/pipeline.py:
--------------------------------------------------------------------------------
1 | from .warp import warp_and_resize
2 | from .color import color_aug_and_norm
3 | import functools
4 |
5 |
6 | class Pipeline:
7 | def __init__(self,
8 | cfg,
9 | keep_ratio):
10 | self.warp = functools.partial(warp_and_resize,
11 | warp_kwargs=cfg,
12 | keep_ratio=keep_ratio)
13 | self.color = functools.partial(color_aug_and_norm,
14 | kwargs=cfg)
15 |
16 | def __call__(self, meta, dst_shape):
17 | meta = self.warp(meta=meta, dst_shape=dst_shape)
18 | meta = self.color(meta=meta)
19 | return meta
20 |
--------------------------------------------------------------------------------
/nanodet/evaluator/__init__.py:
--------------------------------------------------------------------------------
1 | from .coco_detection import CocoDetectionEvaluator
2 |
3 |
4 | def build_evaluator(cfg, dataset):
5 | if cfg.evaluator.name == 'CocoDetectionEvaluator':
6 | return CocoDetectionEvaluator(dataset)
7 | else:
8 | raise NotImplementedError
9 |
--------------------------------------------------------------------------------
/nanodet/evaluator/coco_detection.py:
--------------------------------------------------------------------------------
1 | import pycocotools.coco as coco
2 | from pycocotools.cocoeval import COCOeval
3 | import json
4 | import os
5 | import copy
6 |
7 |
8 | def xyxy2xywh(bbox):
9 | """
10 | change bbox to coco format
11 | :param bbox: [x1, y1, x2, y2]
12 | :return: [x, y, w, h]
13 | """
14 | return [
15 | bbox[0],
16 | bbox[1],
17 | bbox[2] - bbox[0],
18 | bbox[3] - bbox[1],
19 | ]
20 |
21 |
22 | class CocoDetectionEvaluator:
23 | def __init__(self, dataset):
24 | assert hasattr(dataset, 'coco_api')
25 | self.coco_api = dataset.coco_api
26 | self.cat_ids = dataset.cat_ids
27 | self.metric_names = ['mAP', 'AP_50', 'AP_75', 'AP_small', 'AP_m', 'AP_l']
28 |
29 | def results2json(self, results):
30 | """
31 | results: {image_id: {label: [bboxes...] } }
32 | :return coco json format: {image_id:
33 | category_id:
34 | bbox:
35 | score: }
36 | """
37 | json_results = []
38 | for image_id, dets in results.items():
39 | for label, bboxes in dets.items():
40 | category_id = self.cat_ids[label]
41 | for bbox in bboxes:
42 | score = float(bbox[4])
43 | detection = dict(
44 | image_id=int(image_id),
45 | category_id=int(category_id),
46 | bbox=xyxy2xywh(bbox),
47 | score=score)
48 | json_results.append(detection)
49 | return json_results
50 |
51 | def evaluate(self, results, save_dir, rank=-1):
52 | results_json = self.results2json(results)
53 | json_path = os.path.join(save_dir, 'results{}.json'.format(rank))
54 | json.dump(results_json, open(json_path, 'w'))
55 | coco_dets = self.coco_api.loadRes(json_path)
56 | coco_eval = COCOeval(copy.deepcopy(self.coco_api), copy.deepcopy(coco_dets), "bbox")
57 | coco_eval.evaluate()
58 | coco_eval.accumulate()
59 | coco_eval.summarize()
60 | aps = coco_eval.stats[:6]
61 | eval_results = {}
62 | for k, v in zip(self.metric_names, aps):
63 | eval_results[k] = v
64 | return eval_results
65 |
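A quick worked check of the corner-to-size conversion above (COCO stores boxes as [x, y, width, height]):

from nanodet.evaluator.coco_detection import xyxy2xywh

# A 40x60 box whose top-left corner is at (10, 20).
print(xyxy2xywh([10, 20, 50, 80]))  # [10, 20, 40, 60]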
--------------------------------------------------------------------------------
/nanodet/model/arch/__init__.py:
--------------------------------------------------------------------------------
1 | import warnings
2 |
3 | from .one_stage_detector import OneStageDetector
4 |
5 |
6 | def build_model(model_cfg):
7 | if model_cfg.arch.name == 'GFL':
8 | warnings.warn("Model architecture name is changed to 'OneStageDetector'. "
9 | "The name 'GFL' is deprecated, please change the model->arch->name "
10 | "in your YAML config file to OneStageDetector. ")
11 | model = OneStageDetector(model_cfg.arch.backbone, model_cfg.arch.fpn, model_cfg.arch.head)
12 | elif model_cfg.arch.name == 'OneStageDetector':
13 | model = OneStageDetector(model_cfg.arch.backbone, model_cfg.arch.fpn, model_cfg.arch.head)
14 | else:
15 | raise NotImplementedError
16 | return model
17 |
--------------------------------------------------------------------------------
/nanodet/model/arch/one_stage_detector.py:
--------------------------------------------------------------------------------
1 | import time
2 | import torch
3 | import torch.nn as nn
4 | from ..backbone import build_backbone
5 | from ..fpn import build_fpn
6 | from ..head import build_head
7 |
8 |
9 | class OneStageDetector(nn.Module):
10 | def __init__(self,
11 | backbone_cfg,
12 | fpn_cfg=None,
13 | head_cfg=None,):
14 | super(OneStageDetector, self).__init__()
15 | self.backbone = build_backbone(backbone_cfg)
16 | if fpn_cfg is not None:
17 | self.fpn = build_fpn(fpn_cfg)
18 | if head_cfg is not None:
19 | self.head = build_head(head_cfg)
20 |
21 | def forward(self, x):
22 | x = self.backbone(x)
23 | if hasattr(self, 'fpn'):
24 | x = self.fpn(x)
25 | if hasattr(self, 'head'):
26 | x = self.head(x)
27 | return x
28 |
29 | def inference(self, meta):
30 | with torch.no_grad():
31 | torch.cuda.synchronize()
32 | time1 = time.time()
33 | preds = self(meta['img'])
34 | torch.cuda.synchronize()
35 | time2 = time.time()
36 | print('forward time: {:.3f}s'.format((time2 - time1)), end=' | ')
37 | results = self.head.post_process(preds, meta)
38 | torch.cuda.synchronize()
39 | print('decode time: {:.3f}s'.format((time.time() - time2)), end=' | ')
40 | return results
41 |
42 | def forward_train(self, gt_meta):
43 | preds = self(gt_meta['img'])
44 | loss, loss_states = self.head.loss(preds, gt_meta)
45 |
46 | return preds, loss, loss_states
47 |
--------------------------------------------------------------------------------
/nanodet/model/backbone/__init__.py:
--------------------------------------------------------------------------------
1 | import copy
2 | from .resnet import ResNet
3 | from .ghostnet import GhostNet
4 | from .shufflenetv2 import ShuffleNetV2
5 | from .mobilenetv2 import MobileNetV2
6 | from .efficientnet_lite import EfficientNetLite
7 | from .custom_csp import CustomCspNet
8 | from .repvgg import RepVGG
9 |
10 |
11 | def build_backbone(cfg):
12 | backbone_cfg = copy.deepcopy(cfg)
13 | name = backbone_cfg.pop('name')
14 | if name == 'ResNet':
15 | return ResNet(**backbone_cfg)
16 | elif name == 'ShuffleNetV2':
17 | return ShuffleNetV2(**backbone_cfg)
18 | elif name == 'GhostNet':
19 | return GhostNet(**backbone_cfg)
20 | elif name == 'MobileNetV2':
21 | return MobileNetV2(**backbone_cfg)
22 | elif name == 'EfficientNetLite':
23 | return EfficientNetLite(**backbone_cfg)
24 | elif name == 'CustomCspNet':
25 | return CustomCspNet(**backbone_cfg)
26 | elif name == 'RepVGG':
27 | return RepVGG(**backbone_cfg)
28 | else:
29 | raise NotImplementedError
30 |
31 |
--------------------------------------------------------------------------------
/nanodet/model/backbone/custom_csp.py:
--------------------------------------------------------------------------------
1 | import torch
2 | import torch.nn as nn
3 | from ..module.conv import ConvModule
4 |
5 |
6 | class TinyResBlock(nn.Module):
7 | def __init__(self, in_channels, kernel_size, norm_cfg, activation, res_type='concat'):
8 | super(TinyResBlock, self).__init__()
9 | assert in_channels % 2 == 0
10 | assert res_type in ['concat', 'add']
11 | self.res_type = res_type
12 | self.in_conv = ConvModule(in_channels, in_channels//2, kernel_size, padding=(kernel_size-1)//2, norm_cfg=norm_cfg, activation=activation)
13 | self.mid_conv = ConvModule(in_channels//2, in_channels//2, kernel_size, padding=(kernel_size-1)//2, norm_cfg=norm_cfg, activation=activation)
14 | if res_type == 'add':
15 | self.out_conv = ConvModule(in_channels//2, in_channels, kernel_size, padding=(kernel_size-1)//2, norm_cfg=norm_cfg, activation=activation)
16 |
17 | def forward(self, x):
18 | x = self.in_conv(x)
19 | x1 = self.mid_conv(x)
20 | if self.res_type == 'add':
21 | return self.out_conv(x+x1)
22 | else:
23 | return torch.cat((x1, x), dim=1)
24 |
25 |
26 | class CspBlock(nn.Module):
27 | def __init__(self, in_channels, num_res, kernel_size=3, stride=0, norm_cfg=dict(type='BN', requires_grad=True), activation='LeakyReLU'):
28 | super(CspBlock, self).__init__()
29 | assert in_channels % 2 == 0
30 | self.in_conv = ConvModule(in_channels, in_channels, kernel_size, stride, padding=(kernel_size-1)//2, norm_cfg=norm_cfg, activation=activation)
31 | res_blocks = []
32 | for i in range(num_res):
33 | res_block = TinyResBlock(in_channels, kernel_size, norm_cfg, activation)
34 | res_blocks.append(res_block)
35 | self.res_blocks = nn.Sequential(*res_blocks)
36 | self.res_out_conv = ConvModule(in_channels, in_channels, kernel_size, padding=(kernel_size-1)//2, norm_cfg=norm_cfg, activation=activation)
37 |
38 | def forward(self, x):
39 | x = self.in_conv(x)
40 | x1 = self.res_blocks(x)
41 | x1 = self.res_out_conv(x1)
42 | out = torch.cat((x1, x), dim=1)
43 | return out
44 |
45 |
46 | class CustomCspNet(nn.Module):
47 | def __init__(self, net_cfg, out_stages, norm_cfg=dict(type='BN', requires_grad=True), activation='LeakyReLU'):
48 | super(CustomCspNet, self).__init__()
49 | self.out_stages = out_stages
50 | self.activation = activation
51 | self.stages = nn.ModuleList()
52 | for stage_cfg in net_cfg:
53 | if stage_cfg[0] == 'Conv':
54 | in_channels, out_channels, kernel_size, stride = stage_cfg[1:]
55 | stage = ConvModule(in_channels, out_channels, kernel_size, stride, padding=(kernel_size-1)//2, norm_cfg=norm_cfg, activation=activation)
56 | elif stage_cfg[0] == 'CspBlock':
57 | in_channels, num_res, kernel_size, stride = stage_cfg[1:]
58 | stage = CspBlock(in_channels, num_res, kernel_size, stride, norm_cfg, activation)
59 | elif stage_cfg[0] == 'MaxPool':
60 | kernel_size, stride = stage_cfg[1:]
61 | stage = nn.MaxPool2d(kernel_size, stride, padding=(kernel_size-1)//2)
62 | else:
63 | raise ModuleNotFoundError
64 | self.stages.append(stage)
65 | self._init_weight()
66 |
67 | def forward(self, x):
68 | output = []
69 | for i, stage in enumerate(self.stages):
70 | x = stage(x)
71 | if i in self.out_stages:
72 | output.append(x)
73 | return tuple(output)
74 |
75 | def _init_weight(self):
76 | for m in self.modules():
77 | if self.activation == 'LeakyReLU':
78 | nonlinearity = 'leaky_relu'
79 | else:
80 | nonlinearity = 'relu'
81 | if isinstance(m, nn.Conv2d):
82 | nn.init.kaiming_normal_(m.weight, mode='fan_out', nonlinearity=nonlinearity)
83 | elif isinstance(m, nn.BatchNorm2d):
84 | m.weight.data.fill_(1)
85 | m.bias.data.zero_()
86 |
87 |
88 |
--------------------------------------------------------------------------------
/nanodet/model/backbone/mobilenetv2.py:
--------------------------------------------------------------------------------
1 | from __future__ import absolute_import
2 | from __future__ import division
3 | from __future__ import print_function
4 |
5 | import torch
6 | import torch.nn as nn
7 | from ..module.activation import act_layers
8 |
9 |
10 | class ConvBNReLU(nn.Sequential):
11 | def __init__(self, in_planes, out_planes, kernel_size=3, stride=1, groups=1, act='ReLU'):
12 | padding = (kernel_size - 1) // 2
13 | super(ConvBNReLU, self).__init__(
14 | nn.Conv2d(in_planes, out_planes, kernel_size, stride, padding, groups=groups, bias=False),
15 | nn.BatchNorm2d(out_planes),
16 | act_layers(act)
17 | )
18 |
19 |
20 | class InvertedResidual(nn.Module):
21 | def __init__(self, inp, oup, stride, expand_ratio, act='ReLU'):
22 | super(InvertedResidual, self).__init__()
23 | self.stride = stride
24 | assert stride in [1, 2]
25 |
26 | hidden_dim = int(round(inp * expand_ratio))
27 | self.use_res_connect = self.stride == 1 and inp == oup
28 |
29 | layers = []
30 | if expand_ratio != 1:
31 | # pw
32 | layers.append(ConvBNReLU(inp, hidden_dim, kernel_size=1, act=act))
33 | layers.extend([
34 | # dw
35 | ConvBNReLU(hidden_dim, hidden_dim, stride=stride, groups=hidden_dim, act=act),
36 | # pw-linear
37 | nn.Conv2d(hidden_dim, oup, 1, 1, 0, bias=False),
38 | nn.BatchNorm2d(oup),
39 | ])
40 | self.conv = nn.Sequential(*layers)
41 |
42 | def forward(self, x):
43 | if self.use_res_connect:
44 | return x + self.conv(x)
45 | else:
46 | return self.conv(x)
47 |
48 |
49 | class MobileNetV2(nn.Module):
50 | def __init__(self, width_mult=1., out_stages=(1, 2, 4, 6), last_channel=1280, act='ReLU'):
51 | super(MobileNetV2, self).__init__()
52 | self.width_mult = width_mult
53 | self.out_stages = out_stages
54 | input_channel = 32
55 | self.last_channel = last_channel
56 | self.act = act
57 | self.interverted_residual_setting = [
58 | # t, c, n, s
59 | [1, 16, 1, 1],
60 | [6, 24, 2, 2],
61 | [6, 32, 3, 2],
62 | [6, 64, 4, 2],
63 | [6, 96, 3, 1],
64 | [6, 160, 3, 2],
65 | [6, 320, 1, 1],
66 | ]
67 |
68 | # building first layer
69 | self.input_channel = int(input_channel * width_mult)
70 | self.first_layer = ConvBNReLU(3, input_channel, stride=2, act=self.act)
71 | # building inverted residual blocks
72 | for i in range(7):
73 | name = 'stage{}'.format(i)
74 | setattr(self, name, self.build_mobilenet_stage(stage_num=i))
75 |
76 | def build_mobilenet_stage(self, stage_num):
77 | stage = []
78 | t, c, n, s = self.interverted_residual_setting[stage_num]
79 | output_channel = int(c * self.width_mult)
80 | for i in range(n):
81 | if i == 0:
82 | stage.append(InvertedResidual(self.input_channel, output_channel, s, expand_ratio=t, act=self.act))
83 | else:
84 | stage.append(InvertedResidual(self.input_channel, output_channel, 1, expand_ratio=t, act=self.act))
85 | self.input_channel = output_channel
86 | if stage_num == 6:
87 | last_layer = ConvBNReLU(self.input_channel, self.last_channel, kernel_size=1, act=self.act)
88 | stage.append(last_layer)
89 | stage = nn.Sequential(*stage)
90 | return stage
91 |
92 | def forward(self, x):
93 | x = self.first_layer(x)
94 | output = []
95 | for i in range(0, 7):
96 | stage = getattr(self, 'stage{}'.format(i))
97 | x = stage(x)
98 | if i in self.out_stages:
99 | output.append(x)
100 |
101 | return tuple(output)
102 |
103 | def init_weights(self):
104 | for m in self.modules():
105 | if isinstance(m, nn.Conv2d):
106 | nn.init.normal_(m.weight, std=0.001)
107 | if m.bias is not None:
108 | m.bias.data.zero_()
109 | elif isinstance(m, nn.BatchNorm2d):
110 | m.weight.data.fill_(1)
111 | m.bias.data.zero_()
112 |
113 |
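A minimal smoke test of the backbone above (not part of the file): with the defaults width_mult=1.0 and out_stages=(1, 2, 4, 6), a 224x224 input yields feature maps at strides 4, 8, 16 and 32.

import torch

from nanodet.model.backbone.mobilenetv2 import MobileNetV2

net = MobileNetV2(width_mult=1.0, out_stages=(1, 2, 4, 6))
net.eval()
with torch.no_grad():
    feats = net(torch.rand(1, 3, 224, 224))
for f in feats:
    print(f.shape)
# Expected: (1, 24, 56, 56), (1, 32, 28, 28), (1, 96, 14, 14), (1, 1280, 7, 7)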
--------------------------------------------------------------------------------
/nanodet/model/fpn/__init__.py:
--------------------------------------------------------------------------------
1 | import copy
2 | from .fpn import FPN
3 | from .pan import PAN
4 | from .tan import TAN
5 |
6 |
7 | def build_fpn(cfg):
8 | fpn_cfg = copy.deepcopy(cfg)
9 | name = fpn_cfg.pop('name')
10 | if name == 'FPN':
11 | return FPN(**fpn_cfg)
12 | elif name == 'PAN':
13 | return PAN(**fpn_cfg)
14 | elif name == 'TAN':
15 | return TAN(**fpn_cfg)
16 | else:
17 | raise NotImplementedError
18 |
--------------------------------------------------------------------------------
/nanodet/model/fpn/fpn.py:
--------------------------------------------------------------------------------
1 | # Modification 2020 RangiLyu
2 | # Copyright 2018-2019 Open-MMLab.
3 |
4 | # Licensed under the Apache License, Version 2.0 (the "License");
5 | # you may not use this file except in compliance with the License.
6 | # You may obtain a copy of the License at
7 |
8 | # http://www.apache.org/licenses/LICENSE-2.0
9 |
10 | # Unless required by applicable law or agreed to in writing, software
11 | # distributed under the License is distributed on an "AS IS" BASIS,
12 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 | # See the License for the specific language governing permissions and
14 | # limitations under the License.
15 |
16 | import torch.nn as nn
17 | import torch.nn.functional as F
18 | from ..module.conv import ConvModule
19 | from ..module.init_weights import xavier_init
20 |
21 |
22 | class FPN(nn.Module):
23 |
24 | def __init__(self,
25 | in_channels,
26 | out_channels,
27 | num_outs,
28 | start_level=0,
29 | end_level=-1,
30 | conv_cfg=None,
31 | norm_cfg=None,
32 | activation=None
33 | ):
34 | super(FPN, self).__init__()
35 | assert isinstance(in_channels, list)
36 | self.in_channels = in_channels
37 | self.out_channels = out_channels
38 | self.num_ins = len(in_channels)
39 | self.num_outs = num_outs
40 | self.fp16_enabled = False
41 |
42 | if end_level == -1:
43 | self.backbone_end_level = self.num_ins
44 | assert num_outs >= self.num_ins - start_level
45 | else:
46 | # if end_level < inputs, no extra level is allowed
47 | self.backbone_end_level = end_level
48 | assert end_level <= len(in_channels)
49 | assert num_outs == end_level - start_level
50 | self.start_level = start_level
51 | self.end_level = end_level
52 | self.lateral_convs = nn.ModuleList()
53 |
54 | for i in range(self.start_level, self.backbone_end_level):
55 | l_conv = ConvModule(
56 | in_channels[i],
57 | out_channels,
58 | 1,
59 | conv_cfg=conv_cfg,
60 | norm_cfg=norm_cfg,
61 | activation=activation,
62 | inplace=False)
63 |
64 | self.lateral_convs.append(l_conv)
65 | self.init_weights()
66 |
67 | # default init_weights for conv(msra) and norm in ConvModule
68 | def init_weights(self):
69 | for m in self.modules():
70 | if isinstance(m, nn.Conv2d):
71 | xavier_init(m, distribution='uniform')
72 |
73 | def forward(self, inputs):
74 | assert len(inputs) == len(self.in_channels)
75 |
76 | # build laterals
77 | laterals = [
78 | lateral_conv(inputs[i + self.start_level])
79 | for i, lateral_conv in enumerate(self.lateral_convs)
80 | ]
81 |
82 | # build top-down path
83 | used_backbone_levels = len(laterals)
84 | for i in range(used_backbone_levels - 1, 0, -1):
85 | prev_shape = laterals[i - 1].shape[2:]
86 | laterals[i - 1] += F.interpolate(
87 | laterals[i], scale_factor=2, mode='bilinear')
88 |
89 | # build outputs
90 | outs = [
91 | # self.fpn_convs[i](laterals[i]) for i in range(used_backbone_levels)
92 | laterals[i] for i in range(used_backbone_levels)
93 | ]
94 | return tuple(outs)
95 |
96 |
97 | # if __name__ == '__main__':
98 |
--------------------------------------------------------------------------------
/nanodet/model/fpn/pan.py:
--------------------------------------------------------------------------------
1 | import torch.nn as nn
2 | import torch.nn.functional as F
3 | from ..module.conv import ConvModule
4 | from .fpn import FPN
5 |
6 |
7 | class PAN(FPN):
8 | """Path Aggregation Network for Instance Segmentation.
9 |
10 |     This is an implementation of the `PAN in Path Aggregation Network
11 |     <https://arxiv.org/abs/1803.01534>`_.
12 |
13 | Args:
14 | in_channels (List[int]): Number of input channels per scale.
15 | out_channels (int): Number of output channels (used at each scale)
16 | num_outs (int): Number of output scales.
17 | start_level (int): Index of the start input backbone level used to
18 | build the feature pyramid. Default: 0.
19 | end_level (int): Index of the end input backbone level (exclusive) to
20 | build the feature pyramid. Default: -1, which means the last level.
21 | add_extra_convs (bool): Whether to add conv layers on top of the
22 | original feature maps. Default: False.
23 | extra_convs_on_inputs (bool): Whether to apply extra conv on
24 | the original feature from the backbone. Default: False.
25 | relu_before_extra_convs (bool): Whether to apply relu before the extra
26 | conv. Default: False.
27 | no_norm_on_lateral (bool): Whether to apply norm on lateral.
28 | Default: False.
29 | conv_cfg (dict): Config dict for convolution layer. Default: None.
30 | norm_cfg (dict): Config dict for normalization layer. Default: None.
31 | act_cfg (str): Config dict for activation layer in ConvModule.
32 | Default: None.
33 | """
34 |
35 | def __init__(self,
36 | in_channels,
37 | out_channels,
38 | num_outs,
39 | start_level=0,
40 | end_level=-1,
41 | conv_cfg=None,
42 | norm_cfg=None,
43 | activation=None):
44 | super(PAN,
45 | self).__init__(in_channels, out_channels, num_outs, start_level,
46 | end_level, conv_cfg, norm_cfg, activation)
47 | self.init_weights()
48 |
49 | def forward(self, inputs):
50 | """Forward function."""
51 | assert len(inputs) == len(self.in_channels)
52 |
53 | # build laterals
54 | laterals = [
55 | lateral_conv(inputs[i + self.start_level])
56 | for i, lateral_conv in enumerate(self.lateral_convs)
57 | ]
58 |
59 | # build top-down path
60 | used_backbone_levels = len(laterals)
61 | for i in range(used_backbone_levels - 1, 0, -1):
62 | laterals[i - 1] += F.interpolate(
63 | laterals[i], scale_factor=2, mode='bilinear')
64 |
65 | # build outputs
66 | # part 1: from original levels
67 | inter_outs = [
68 | laterals[i] for i in range(used_backbone_levels)
69 | ]
70 |
71 | # part 2: add bottom-up path
72 | for i in range(0, used_backbone_levels - 1):
73 | inter_outs[i + 1] += F.interpolate(inter_outs[i], scale_factor=0.5, mode='bilinear')
74 |
75 | outs = []
76 | outs.append(inter_outs[0])
77 | outs.extend([
78 | inter_outs[i] for i in range(1, used_backbone_levels)
79 | ])
80 | return tuple(outs)
81 |
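A small sketch of feeding PAN three backbone levels (not part of the file). The channel numbers follow the typical nanodet-m setup (ShuffleNetV2 1.0x stages at strides 8/16/32) and are assumptions, not taken from this file.

import torch

from nanodet.model.fpn.pan import PAN

pan = PAN(in_channels=[116, 232, 464], out_channels=96, num_outs=3)
feats = (torch.rand(1, 116, 40, 40),
         torch.rand(1, 232, 20, 20),
         torch.rand(1, 464, 10, 10))
outs = pan(feats)
# Each output level keeps its input resolution but has out_channels channels:
# (1, 96, 40, 40), (1, 96, 20, 20), (1, 96, 10, 10)
for o in outs:
    print(o.shape)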
--------------------------------------------------------------------------------
/nanodet/model/fpn/tan.py:
--------------------------------------------------------------------------------
1 | # Copyright 2021 RangiLyu.
2 | #
3 | # Licensed under the Apache License, Version 2.0 (the "License");
4 | # you may not use this file except in compliance with the License.
5 | # You may obtain a copy of the License at
6 | #
7 | # http://www.apache.org/licenses/LICENSE-2.0
8 | #
9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 |
15 | import torch
16 | import torch.nn as nn
17 | import torch.nn.functional as F
18 | from ..module.conv import ConvModule
19 | from ..module.transformer import TransformerBlock
20 | from ..module.init_weights import normal_init
21 |
22 |
23 | class TAN(nn.Module):
24 | """
25 | Transformer Attention Network.
26 |
27 | :param in_channels: Number of input channels per scale.
28 | :param out_channels: Number of output channel.
29 | :param feature_hw: Size of feature map input to transformer.
30 | :param num_heads: Number of attention heads.
31 | :param num_encoders: Number of transformer encoder layers.
32 | :param mlp_ratio: Hidden layer dimension expand ratio in MLP.
33 | :param dropout_ratio: Probability of an element to be zeroed.
34 | :param activation: Activation layer type.
35 | """
36 | def __init__(self,
37 | in_channels,
38 | out_channels,
39 | feature_hw,
40 | num_heads,
41 | num_encoders,
42 | mlp_ratio,
43 | dropout_ratio,
44 | activation='LeakyReLU'
45 | ):
46 | super(TAN, self).__init__()
47 | assert isinstance(in_channels, list)
48 | self.in_channels = in_channels
49 | self.out_channels = out_channels
50 | self.num_ins = len(in_channels)
51 | assert self.num_ins == 3
52 |
53 | self.lateral_convs = nn.ModuleList()
54 | for i in range(self.num_ins):
55 | l_conv = ConvModule(in_channels[i], out_channels, 1,
56 | norm_cfg=dict(type='BN'), activation=activation, inplace=False)
57 | self.lateral_convs.append(l_conv)
58 | self.transformer = TransformerBlock(out_channels*self.num_ins, out_channels, num_heads,
59 | num_encoders, mlp_ratio, dropout_ratio, activation=activation)
60 | self.pos_embed = nn.Parameter(torch.zeros(feature_hw[0] * feature_hw[1], 1, out_channels))
61 |
62 | self.init_weights()
63 |
64 | def init_weights(self):
65 | torch.nn.init.trunc_normal_(self.pos_embed, std=0.02)
66 | for m in self.modules():
67 | if isinstance(m, nn.Linear):
68 | torch.nn.init.trunc_normal_(m.weight, std=.02)
69 | if isinstance(m, nn.Linear) and m.bias is not None:
70 | nn.init.constant_(m.bias, 0)
71 | elif isinstance(m, nn.LayerNorm):
72 | nn.init.constant_(m.bias, 0)
73 | nn.init.constant_(m.weight, 1.0)
74 | elif isinstance(m, nn.Conv2d):
75 | normal_init(m, 0.01)
76 |
77 | def forward(self, inputs):
78 | assert len(inputs) == len(self.in_channels)
79 |
80 | # build laterals
81 | laterals = [
82 | lateral_conv(inputs[i])
83 | for i, lateral_conv in enumerate(self.lateral_convs)
84 | ]
85 |
86 | # transformer attention
87 | mid_shape = laterals[1].shape[2:]
88 | mid_lvl = torch.cat((F.interpolate(laterals[0], size=mid_shape, mode='bilinear'),
89 | laterals[1], F.interpolate(laterals[2], size=mid_shape, mode='bilinear')), dim=1)
90 | mid_lvl = self.transformer(mid_lvl, self.pos_embed)
91 |
92 | # outs = [
93 | # torch.cat((laterals[0], F.interpolate(mid_lvl, size=laterals[0].shape[2:], mode='bilinear')), dim=1),
94 | # torch.cat((laterals[1], mid_lvl), dim=1),
95 | # torch.cat((laterals[2], F.interpolate(mid_lvl, size=laterals[2].shape[2:], mode='bilinear')), dim=1)
96 | # ]
97 | # build outputs
98 | outs = [
99 | laterals[0]+F.interpolate(mid_lvl, size=laterals[0].shape[2:], mode='bilinear'),
100 | laterals[1]+mid_lvl,
101 | laterals[2]+F.interpolate(mid_lvl, size=laterals[2].shape[2:], mode='bilinear')
102 | ]
103 | return tuple(outs)
104 |
--------------------------------------------------------------------------------
/nanodet/model/head/__init__.py:
--------------------------------------------------------------------------------
1 | import copy
2 | from .gfl_head import GFLHead
3 | from .nanodet_head import NanoDetHead
4 |
5 |
6 | def build_head(cfg):
7 | head_cfg = copy.deepcopy(cfg)
8 | name = head_cfg.pop('name')
9 | if name == 'GFLHead':
10 | return GFLHead(**head_cfg)
11 | elif name == 'NanoDetHead':
12 | return NanoDetHead(**head_cfg)
13 | else:
14 | raise NotImplementedError
--------------------------------------------------------------------------------
/nanodet/model/head/assigner/base_assigner.py:
--------------------------------------------------------------------------------
1 | from abc import ABCMeta, abstractmethod
2 |
3 |
4 | class BaseAssigner(metaclass=ABCMeta):
5 |
6 | @abstractmethod
7 | def assign(self, bboxes, gt_bboxes, gt_bboxes_ignore=None, gt_labels=None):
8 | pass
--------------------------------------------------------------------------------
/nanodet/model/loss/utils.py:
--------------------------------------------------------------------------------
1 | import functools
2 |
3 | import torch.nn.functional as F
4 |
5 |
6 | def reduce_loss(loss, reduction):
7 | """Reduce loss as specified.
8 |
9 | Args:
10 | loss (Tensor): Elementwise loss tensor.
11 | reduction (str): Options are "none", "mean" and "sum".
12 |
13 | Return:
14 | Tensor: Reduced loss tensor.
15 | """
16 | reduction_enum = F._Reduction.get_enum(reduction)
17 | # none: 0, elementwise_mean:1, sum: 2
18 | if reduction_enum == 0:
19 | return loss
20 | elif reduction_enum == 1:
21 | return loss.mean()
22 | elif reduction_enum == 2:
23 | return loss.sum()
24 |
25 |
26 | def weight_reduce_loss(loss, weight=None, reduction='mean', avg_factor=None):
27 | """Apply element-wise weight and reduce loss.
28 |
29 | Args:
30 | loss (Tensor): Element-wise loss.
31 | weight (Tensor): Element-wise weights.
32 | reduction (str): Same as built-in losses of PyTorch.
33 |         avg_factor (float): Average factor when computing the mean of losses.
34 |
35 | Returns:
36 | Tensor: Processed loss values.
37 | """
38 | # if weight is specified, apply element-wise weight
39 | if weight is not None:
40 | loss = loss * weight
41 |
42 | # if avg_factor is not specified, just reduce the loss
43 | if avg_factor is None:
44 | loss = reduce_loss(loss, reduction)
45 | else:
46 | # if reduction is mean, then average the loss by avg_factor
47 | if reduction == 'mean':
48 | loss = loss.sum() / avg_factor
49 | # if reduction is 'none', then do nothing, otherwise raise an error
50 | elif reduction != 'none':
51 | raise ValueError('avg_factor can not be used with reduction="sum"')
52 | return loss
53 |
54 |
55 | def weighted_loss(loss_func):
56 | """Create a weighted version of a given loss function.
57 |
58 | To use this decorator, the loss function must have the signature like
59 | `loss_func(pred, target, **kwargs)`. The function only needs to compute
60 | element-wise loss without any reduction. This decorator will add weight
61 | and reduction arguments to the function. The decorated function will have
62 | the signature like `loss_func(pred, target, weight=None, reduction='mean',
63 | avg_factor=None, **kwargs)`.
64 |
65 | :Example:
66 |
67 | >>> import torch
68 | >>> @weighted_loss
69 | >>> def l1_loss(pred, target):
70 | >>> return (pred - target).abs()
71 |
72 | >>> pred = torch.Tensor([0, 2, 3])
73 | >>> target = torch.Tensor([1, 1, 1])
74 | >>> weight = torch.Tensor([1, 0, 1])
75 |
76 | >>> l1_loss(pred, target)
77 | tensor(1.3333)
78 | >>> l1_loss(pred, target, weight)
79 | tensor(1.)
80 | >>> l1_loss(pred, target, reduction='none')
81 | tensor([1., 1., 2.])
82 | >>> l1_loss(pred, target, weight, avg_factor=2)
83 | tensor(1.5000)
84 | """
85 |
86 | @functools.wraps(loss_func)
87 | def wrapper(pred,
88 | target,
89 | weight=None,
90 | reduction='mean',
91 | avg_factor=None,
92 | **kwargs):
93 | # get element-wise loss
94 | loss = loss_func(pred, target, **kwargs)
95 | loss = weight_reduce_loss(loss, weight, reduction, avg_factor)
96 | return loss
97 |
98 | return wrapper
99 |
--------------------------------------------------------------------------------
/nanodet/model/module/activation.py:
--------------------------------------------------------------------------------
1 | import torch.nn as nn
2 |
3 | activations = {'ReLU': nn.ReLU,
4 | 'LeakyReLU': nn.LeakyReLU,
5 | 'ReLU6': nn.ReLU6,
6 | 'SELU': nn.SELU,
7 | 'ELU': nn.ELU,
8 | 'GELU': nn.GELU,
9 | None: nn.Identity
10 | }
11 |
12 |
13 | def act_layers(name):
14 | assert name in activations.keys()
15 | if name == 'LeakyReLU':
16 | return nn.LeakyReLU(negative_slope=0.1, inplace=True)
17 | elif name == 'GELU':
18 | return nn.GELU()
19 | else:
20 | return activations[name](inplace=True)
21 |
--------------------------------------------------------------------------------
/nanodet/model/module/init_weights.py:
--------------------------------------------------------------------------------
1 | """
2 | from MMDetection
3 | """
4 | import torch.nn as nn
5 |
6 |
7 | def kaiming_init(module,
8 | a=0,
9 | mode='fan_out',
10 | nonlinearity='relu',
11 | bias=0,
12 | distribution='normal'):
13 | assert distribution in ['uniform', 'normal']
14 | if distribution == 'uniform':
15 | nn.init.kaiming_uniform_(
16 | module.weight, a=a, mode=mode, nonlinearity=nonlinearity)
17 | else:
18 | nn.init.kaiming_normal_(
19 | module.weight, a=a, mode=mode, nonlinearity=nonlinearity)
20 | if hasattr(module, 'bias') and module.bias is not None:
21 | nn.init.constant_(module.bias, bias)
22 |
23 |
24 | def xavier_init(module, gain=1, bias=0, distribution='normal'):
25 | assert distribution in ['uniform', 'normal']
26 | if distribution == 'uniform':
27 | nn.init.xavier_uniform_(module.weight, gain=gain)
28 | else:
29 | nn.init.xavier_normal_(module.weight, gain=gain)
30 | if hasattr(module, 'bias') and module.bias is not None:
31 | nn.init.constant_(module.bias, bias)
32 |
33 |
34 | def normal_init(module, mean=0, std=1, bias=0):
35 | nn.init.normal_(module.weight, mean, std)
36 | if hasattr(module, 'bias') and module.bias is not None:
37 | nn.init.constant_(module.bias, bias)
38 |
39 |
40 | def constant_init(module, val, bias=0):
41 | if hasattr(module, 'weight') and module.weight is not None:
42 | nn.init.constant_(module.weight, val)
43 | if hasattr(module, 'bias') and module.bias is not None:
44 | nn.init.constant_(module.bias, bias)
--------------------------------------------------------------------------------
/nanodet/model/module/norm.py:
--------------------------------------------------------------------------------
1 | import torch.nn as nn
2 |
3 | norm_cfg = {
4 | # format: layer_type: (abbreviation, module)
5 | 'BN': ('bn', nn.BatchNorm2d),
6 | 'SyncBN': ('bn', nn.SyncBatchNorm),
7 | 'GN': ('gn', nn.GroupNorm),
8 | # and potentially 'SN'
9 | }
10 |
11 |
12 | def build_norm_layer(cfg, num_features, postfix=''):
13 | """ Build normalization layer
14 |
15 | Args:
16 | cfg (dict): cfg should contain:
17 | type (str): identify norm layer type.
18 | layer args: args needed to instantiate a norm layer.
19 | requires_grad (bool): [optional] whether stop gradient updates
20 | num_features (int): number of channels from input.
21 | postfix (int, str): appended into norm abbreviation to
22 | create named layer.
23 |
24 | Returns:
25 | name (str): abbreviation + postfix
26 | layer (nn.Module): created norm layer
27 | """
28 | assert isinstance(cfg, dict) and 'type' in cfg
29 | cfg_ = cfg.copy()
30 |
31 | layer_type = cfg_.pop('type')
32 | if layer_type not in norm_cfg:
33 | raise KeyError('Unrecognized norm type {}'.format(layer_type))
34 | else:
35 | abbr, norm_layer = norm_cfg[layer_type]
36 | if norm_layer is None:
37 | raise NotImplementedError
38 |
39 | assert isinstance(postfix, (int, str))
40 | name = abbr + str(postfix)
41 |
42 | requires_grad = cfg_.pop('requires_grad', True)
43 | cfg_.setdefault('eps', 1e-5)
44 | if layer_type != 'GN':
45 | layer = norm_layer(num_features, **cfg_)
46 | if layer_type == 'SyncBN':
47 | layer._specify_ddp_gpu_num(1)
48 | else:
49 | assert 'num_groups' in cfg_
50 | layer = norm_layer(num_channels=num_features, **cfg_)
51 |
52 | for param in layer.parameters():
53 | param.requires_grad = requires_grad
54 |
55 | return name, layer
56 |
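Two quick calls to the builder above (the channel counts are arbitrary):

import torch.nn as nn

from nanodet.model.module.norm import build_norm_layer

name, bn = build_norm_layer(dict(type='BN', requires_grad=True), 96)
print(name, type(bn).__name__)             # bn BatchNorm2d

name, gn = build_norm_layer(dict(type='GN', num_groups=8), 96, postfix=1)
print(name, isinstance(gn, nn.GroupNorm))  # gn1 True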
--------------------------------------------------------------------------------
/nanodet/model/module/scale.py:
--------------------------------------------------------------------------------
1 | import torch
2 | import torch.nn as nn
3 |
4 |
5 | class Scale(nn.Module):
6 | """
7 | A learnable scale parameter
8 | """
9 |
10 | def __init__(self, scale=1.0):
11 | super(Scale, self).__init__()
12 | self.scale = nn.Parameter(torch.tensor(scale, dtype=torch.float))
13 |
14 | def forward(self, x):
15 | return x * self.scale
16 |
--------------------------------------------------------------------------------
/nanodet/model/module/transformer.py:
--------------------------------------------------------------------------------
1 | # Copyright 2021 RangiLyu.
2 | #
3 | # Licensed under the Apache License, Version 2.0 (the "License");
4 | # you may not use this file except in compliance with the License.
5 | # You may obtain a copy of the License at
6 | #
7 | # http://www.apache.org/licenses/LICENSE-2.0
8 | #
9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 |
15 | import torch
16 | import torch.nn as nn
17 | from nanodet.model.module.activation import act_layers
18 | from nanodet.model.module.conv import ConvModule
19 |
20 |
21 | class MLP(nn.Module):
22 | def __init__(self,
23 | in_dim,
24 | hidden_dim=None,
25 | out_dim=None,
26 | drop=0.,
27 | activation='GELU'
28 | ):
29 | super(MLP, self).__init__()
30 | out_dim = out_dim or in_dim
31 | hidden_dim = hidden_dim or in_dim
32 | self.fc1 = nn.Linear(in_dim, hidden_dim)
33 | self.act = act_layers(activation)
34 | self.fc2 = nn.Linear(hidden_dim, out_dim)
35 | self.drop = nn.Dropout(drop)
36 |
37 | def forward(self, x):
38 | x = self.fc1(x)
39 | x = self.act(x)
40 | x = self.drop(x)
41 | x = self.fc2(x)
42 | x = self.drop(x)
43 | return x
44 |
45 |
46 | class TransformerEncoder(nn.Module):
47 | """
48 | Encoder layer of transformer
49 | :param dim: feature dimension
50 | :param num_heads: number of attention heads
51 | :param mlp_ratio: hidden layer dimension expand ratio in MLP
52 | :param dropout_ratio: probability of an element to be zeroed
53 | :param activation: activation layer type
54 | :param kv_bias: add bias on key and values
55 | """
56 | def __init__(self,
57 | dim,
58 | num_heads,
59 | mlp_ratio,
60 | dropout_ratio=0.0,
61 | activation='GELU',
62 | kv_bias=False
63 | ):
64 | super(TransformerEncoder, self).__init__()
65 | self.norm1 = nn.LayerNorm(dim)
66 | self.attn = nn.MultiheadAttention(embed_dim=dim, num_heads=num_heads,
67 | dropout=dropout_ratio, add_bias_kv=kv_bias)
68 | self.norm2 = nn.LayerNorm(dim)
69 | self.mlp = MLP(in_dim=dim, hidden_dim=dim * mlp_ratio,
70 | drop=dropout_ratio, activation=activation)
71 |
72 | def forward(self, x):
73 | _x = self.norm1(x)
74 | x = x + self.attn(_x, _x, _x)[0]
75 | x = x + self.mlp(self.norm2(x))
76 | return x
77 |
78 |
79 | class TransformerBlock(nn.Module):
80 | """
81 | Block of transformer encoder layers. Used in vision task.
82 | :param in_channels: input channels
83 | :param out_channels: output channels
84 | :param num_heads: number of attention heads
85 | :param num_encoders: number of transformer encoder layers
86 | :param mlp_ratio: hidden layer dimension expand ratio in MLP
87 | :param dropout_ratio: probability of an element to be zeroed
88 | :param activation: activation layer type
89 | :param kv_bias: add bias on key and values
90 | """
91 | def __init__(self,
92 | in_channels,
93 | out_channels,
94 | num_heads,
95 | num_encoders=1,
96 | mlp_ratio=1,
97 | dropout_ratio=0.,
98 | kv_bias=False,
99 | activation='GELU'
100 | ):
101 | super(TransformerBlock, self).__init__()
102 | self.conv = nn.Identity() if in_channels == out_channels else \
103 | ConvModule(in_channels, out_channels, 1)
104 | self.linear = nn.Linear(out_channels, out_channels)
105 | encoders = [TransformerEncoder(out_channels, num_heads, mlp_ratio,
106 | dropout_ratio, activation, kv_bias)
107 | for _ in range(num_encoders)]
108 | self.encoders = nn.Sequential(*encoders)
109 |
110 | def forward(self, x, pos_embed):
111 | b, _, h, w = x.shape
112 | x = self.conv(x)
113 | x = x.flatten(2).permute(2, 0, 1)
114 | x = x + pos_embed
115 | x = self.encoders(x)
116 | x = x.permute(1, 2, 0).reshape(b, -1, h, w)
117 | return x
118 |
--------------------------------------------------------------------------------
/nanodet/trainer/__init__.py:
--------------------------------------------------------------------------------
1 | import torch
2 | from .trainer import Trainer
3 | from .dist_trainer import DistTrainer
4 |
5 |
6 | def build_trainer(rank, cfg, model, logger):
7 | if len(cfg.device.gpu_ids) > 1:
8 | trainer = DistTrainer(rank, cfg, model, logger)
9 | trainer.set_device(cfg.device.batchsize_per_gpu, rank, device=torch.device('cuda')) # TODO: device
10 | else:
11 | trainer = Trainer(rank, cfg, model, logger)
12 | trainer.set_device(cfg.device.batchsize_per_gpu, cfg.device.gpu_ids, device=torch.device('cuda'))
13 | return trainer
14 |
15 |
--------------------------------------------------------------------------------
/nanodet/trainer/dist_trainer.py:
--------------------------------------------------------------------------------
1 | import torch.distributed as dist
2 | from .trainer import Trainer
3 | from ..util import DDP
4 |
5 |
6 | def average_gradients(model):
7 | """ Gradient averaging. """
8 | size = float(dist.get_world_size())
9 | for param in model.parameters():
10 | if param.grad is not None:
11 | dist.all_reduce(param.grad.data, op=dist.ReduceOp.SUM)
12 | param.grad.data /= size
13 |
14 |
15 |
16 | class DistTrainer(Trainer):
17 | """
18 |     Distributed trainer for multi-GPU training (not finished yet).
19 | """
20 | def run_step(self, model, batch, mode='train'):
21 | output, loss, loss_stats = model.module.forward_train(batch)
22 | loss = loss.mean()
23 | if mode == 'train':
24 | self.optimizer.zero_grad()
25 | loss.backward()
26 | average_gradients(model)
27 | self.optimizer.step()
28 | return output, loss, loss_stats
29 |
30 | def set_device(self, batch_per_gpu, rank, device):
31 | """
32 | Set model device for Distributed-Data-Parallel
33 | :param batch_per_gpu: batch size of each gpu
34 | :param rank: distributed training process rank
35 | :param device: cuda
36 | """
37 | self.rank = rank
38 | self.model = DDP(batch_per_gpu, module=self.model.cuda(), device_ids=[rank], output_device=rank)
39 |
40 |
41 |
--------------------------------------------------------------------------------
/nanodet/util/__init__.py:
--------------------------------------------------------------------------------
1 | from .rank_filter import rank_filter
2 | from .path import mkdir
3 | from .logger import Logger, MovingAverage, AverageMeter
4 | from .data_parallel import DataParallel
5 | from .distributed_data_parallel import DDP
6 | from .check_point import load_model_weight, save_model, convert_old_model
7 | from .config import cfg, load_config
8 | from .box_transform import *
9 | from .util_mixins import NiceRepr
10 | from .visualization import Visualizer, overlay_bbox_cv
11 | from .flops_counter import get_model_complexity_info
12 | from .misc import multi_apply, images_to_levels, unmap
13 |
--------------------------------------------------------------------------------
/nanodet/util/box_transform.py:
--------------------------------------------------------------------------------
1 | import torch
2 |
3 |
4 | def distance2bbox(points, distance, max_shape=None):
5 | """Decode distance prediction to bounding box.
6 |
7 | Args:
8 | points (Tensor): Shape (n, 2), [x, y].
9 | distance (Tensor): Distance from the given point to 4
10 | boundaries (left, top, right, bottom).
11 | max_shape (tuple): Shape of the image.
12 |
13 | Returns:
14 | Tensor: Decoded bboxes.
15 | """
16 | x1 = points[:, 0] - distance[:, 0]
17 | y1 = points[:, 1] - distance[:, 1]
18 | x2 = points[:, 0] + distance[:, 2]
19 | y2 = points[:, 1] + distance[:, 3]
20 | if max_shape is not None:
21 | x1 = x1.clamp(min=0, max=max_shape[1])
22 | y1 = y1.clamp(min=0, max=max_shape[0])
23 | x2 = x2.clamp(min=0, max=max_shape[1])
24 | y2 = y2.clamp(min=0, max=max_shape[0])
25 | return torch.stack([x1, y1, x2, y2], -1)
26 |
27 |
28 | def bbox2distance(points, bbox, max_dis=None, eps=0.1):
29 |     """Encode a bounding box as distances from the given points to its four sides.
30 |
31 | Args:
32 | points (Tensor): Shape (n, 2), [x, y].
33 | bbox (Tensor): Shape (n, 4), "xyxy" format
34 | max_dis (float): Upper bound of the distance.
35 | eps (float): a small value to ensure target < max_dis, instead <=
36 |
37 | Returns:
38 | Tensor: Decoded distances.
39 | """
40 | left = points[:, 0] - bbox[:, 0]
41 | top = points[:, 1] - bbox[:, 1]
42 | right = bbox[:, 2] - points[:, 0]
43 | bottom = bbox[:, 3] - points[:, 1]
44 | if max_dis is not None:
45 | left = left.clamp(min=0, max=max_dis - eps)
46 | top = top.clamp(min=0, max=max_dis - eps)
47 | right = right.clamp(min=0, max=max_dis - eps)
48 | bottom = bottom.clamp(min=0, max=max_dis - eps)
49 | return torch.stack([left, top, right, bottom], -1)
--------------------------------------------------------------------------------
/nanodet/util/check_point.py:
--------------------------------------------------------------------------------
1 | import torch
2 | import pytorch_lightning as pl
3 | from collections import OrderedDict
4 | from .rank_filter import rank_filter
5 |
6 |
7 | def load_model_weight(model, checkpoint, logger):
8 | state_dict = checkpoint['state_dict']
9 | # strip prefix of state_dict
10 | if list(state_dict.keys())[0].startswith('module.'):
11 | state_dict = {k[7:]: v for k, v in checkpoint['state_dict'].items()}
12 | if list(state_dict.keys())[0].startswith('model.'):
13 | state_dict = {k[6:]: v for k, v in checkpoint['state_dict'].items()}
14 |
15 | model_state_dict = model.module.state_dict() if hasattr(model, 'module') else model.state_dict()
16 |
17 | # check loaded parameters and created model parameters
18 | for k in state_dict:
19 | if k in model_state_dict:
20 | if state_dict[k].shape != model_state_dict[k].shape:
21 | logger.log('Skip loading parameter {}, required shape{}, loaded shape{}.'.format(
22 | k, model_state_dict[k].shape, state_dict[k].shape))
23 | state_dict[k] = model_state_dict[k]
24 | else:
25 | logger.log('Drop parameter {}.'.format(k))
26 | for k in model_state_dict:
27 | if not (k in state_dict):
28 | logger.log('No param {}.'.format(k))
29 | state_dict[k] = model_state_dict[k]
30 | model.load_state_dict(state_dict, strict=False)
31 |
32 |
33 | @rank_filter
34 | def save_model(model, path, epoch, iter, optimizer=None):
35 | model_state_dict = model.module.state_dict() if hasattr(model, 'module') else model.state_dict()
36 | data = {'epoch': epoch,
37 | 'state_dict': model_state_dict,
38 | 'iter': iter}
39 | if optimizer is not None:
40 | data['optimizer'] = optimizer.state_dict()
41 |
42 | torch.save(data, path)
43 |
44 |
45 | def convert_old_model(old_model_dict):
46 | if 'pytorch-lightning_version' in old_model_dict:
47 | raise ValueError('This model is not old format. No need to convert!')
48 | version = pl.__version__
49 | epoch = old_model_dict['epoch']
50 | global_step = old_model_dict['iter']
51 | state_dict = old_model_dict['state_dict']
52 | new_state_dict = OrderedDict()
53 | for name, value in state_dict.items():
54 | new_state_dict['model.' + name] = value
55 |
56 | new_checkpoint = {'epoch': epoch,
57 | 'global_step': global_step,
58 | 'pytorch-lightning_version': version,
59 | 'state_dict': new_state_dict,
60 | 'lr_schedulers': []}
61 |
62 | if 'optimizer' in old_model_dict:
63 | optimizer_states = [old_model_dict['optimizer']]
64 | new_checkpoint['optimizer_states'] = optimizer_states
65 |
66 | return new_checkpoint
67 |
--------------------------------------------------------------------------------
/nanodet/util/config.py:
--------------------------------------------------------------------------------
1 | from .yacs import CfgNode
2 |
3 | cfg = CfgNode(new_allowed=True)
4 | cfg.save_dir = './'
5 | # common params for NETWORK
6 | cfg.model = CfgNode()
7 | cfg.model.arch = CfgNode(new_allowed=True)
8 | cfg.model.arch.backbone = CfgNode(new_allowed=True)
9 | cfg.model.arch.neck = CfgNode(new_allowed=True)
10 | cfg.model.arch.head = CfgNode(new_allowed=True)
11 |
12 | # DATASET related params
13 | cfg.data = CfgNode(new_allowed=True)
14 | cfg.data.train = CfgNode(new_allowed=True)
15 | cfg.data.val = CfgNode(new_allowed=True)
16 | cfg.device = CfgNode(new_allowed=True)
17 | # train
18 | cfg.schedule = CfgNode(new_allowed=True)
19 |
20 | # logger
21 | cfg.log = CfgNode()
22 | cfg.log.interval = 50
23 |
24 | # testing
25 | cfg.test = CfgNode()
26 | # size of images for each device
27 |
28 |
29 | def load_config(cfg, args_cfg):
30 | cfg.defrost()
31 | cfg.merge_from_file(args_cfg)
32 | cfg.freeze()
33 |
34 |
35 | if __name__ == '__main__':
36 | import sys
37 |
38 | with open(sys.argv[1], 'w') as f:
39 | print(cfg, file=f)
40 |
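A minimal sketch of loading one of the shipped YAML files into the global cfg node; the printed fields assume the usual layout of config/nanodet-m.yml.

from nanodet.util.config import cfg, load_config

load_config(cfg, 'config/nanodet-m.yml')
print(cfg.save_dir)
print(cfg.model.arch.backbone.name)  # e.g. ShuffleNetV2 in the stock nanodet-m config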
--------------------------------------------------------------------------------
/nanodet/util/distributed_data_parallel.py:
--------------------------------------------------------------------------------
1 | from torch.nn.parallel import DistributedDataParallel
2 | from .scatter_gather import scatter_kwargs
3 |
4 |
5 | class DDP(DistributedDataParallel):
6 |
7 | def __init__(self, batchsize, **kwargs):
8 | self.batchsize = batchsize
9 | super(DDP, self).__init__(**kwargs)
10 |
11 | def scatter(self, inputs, kwargs, device_ids):
12 | return scatter_kwargs(inputs, kwargs, device_ids, dim=self.dim, chunk_sizes=[self.batchsize])
--------------------------------------------------------------------------------
/nanodet/util/logger.py:
--------------------------------------------------------------------------------
1 | import os
2 | import logging
3 | import torch
4 | import numpy as np
5 | from termcolor import colored
6 | from .rank_filter import rank_filter
7 | from .path import mkdir
8 |
9 |
10 | class Logger:
11 | def __init__(self, local_rank, save_dir='./', use_tensorboard=True):
12 | mkdir(local_rank, save_dir)
13 | self.rank = local_rank
14 | fmt = colored('[%(name)s]', 'magenta', attrs=['bold']) + colored('[%(asctime)s]', 'blue') + \
15 | colored('%(levelname)s:', 'green') + colored('%(message)s', 'white')
16 | logging.basicConfig(level=logging.INFO,
17 | filename=os.path.join(save_dir, 'logs.txt'),
18 | filemode='w')
19 | self.log_dir = os.path.join(save_dir, 'logs')
20 | console = logging.StreamHandler()
21 | console.setLevel(logging.INFO)
22 | formatter = logging.Formatter(fmt, datefmt="%m-%d %H:%M:%S")
23 | console.setFormatter(formatter)
24 | logging.getLogger().addHandler(console)
25 | if use_tensorboard:
26 | try:
27 | from torch.utils.tensorboard import SummaryWriter
28 | except ImportError:
29 | raise ImportError(
30 | 'Please run "pip install future tensorboard" to install '
31 | 'the dependencies to use torch.utils.tensorboard '
32 | '(applicable to PyTorch 1.1 or higher)')
33 | if self.rank < 1:
34 | logging.info('Using Tensorboard, logs will be saved in {}'.format(self.log_dir))
35 | self.writer = SummaryWriter(log_dir=self.log_dir)
36 |
37 | def log(self, string):
38 | if self.rank < 1:
39 | logging.info(string)
40 |
41 | def scalar_summary(self, tag, phase, value, step):
42 | if self.rank < 1:
43 | self.writer.add_scalars(tag, {phase: value}, step)
44 |
45 |
46 | class MovingAverage(object):
47 | def __init__(self, val, window_size=50):
48 | self.window_size = window_size
49 | self.reset()
50 | self.push(val)
51 |
52 | def reset(self):
53 | self.queue = []
54 |
55 | def push(self, val):
56 | self.queue.append(val)
57 | if len(self.queue) > self.window_size:
58 | self.queue.pop(0)
59 |
60 | def avg(self):
61 | return np.mean(self.queue)
62 |
63 |
64 | class AverageMeter(object):
65 | """Computes and stores the average and current value"""
66 |
67 | def __init__(self, val):
68 | self.reset()
69 | self.update(val)
70 |
71 | def reset(self):
72 | self.val = 0
73 | self.avg = 0
74 | self.sum = 0
75 | self.count = 0
76 |
77 | def update(self, val, n=1):
78 | self.val = val
79 | self.sum += val * n
80 | self.count += n
81 | if self.count > 0:
82 | self.avg = self.sum / self.count
83 |
--------------------------------------------------------------------------------
/nanodet/util/misc.py:
--------------------------------------------------------------------------------
1 | # Modification 2020 RangiLyu
2 | # Copyright 2018-2019 Open-MMLab.
3 |
4 | # Licensed under the Apache License, Version 2.0 (the "License");
5 | # you may not use this file except in compliance with the License.
6 | # You may obtain a copy of the License at
7 |
8 | # http://www.apache.org/licenses/LICENSE-2.0
9 |
10 | # Unless required by applicable law or agreed to in writing, software
11 | # distributed under the License is distributed on an "AS IS" BASIS,
12 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 | # See the License for the specific language governing permissions and
14 | # limitations under the License.
15 |
16 | import torch
17 | from functools import partial
18 |
19 |
20 | def multi_apply(func, *args, **kwargs):
21 | pfunc = partial(func, **kwargs) if kwargs else func
22 | map_results = map(pfunc, *args)
23 | return tuple(map(list, zip(*map_results)))
24 |
25 |
26 | def images_to_levels(target, num_level_anchors):
27 | """Convert targets by image to targets by feature level.
28 |
29 | [target_img0, target_img1] -> [target_level0, target_level1, ...]
30 | """
31 | target = torch.stack(target, 0)
32 | level_targets = []
33 | start = 0
34 | for n in num_level_anchors:
35 | end = start + n
36 | level_targets.append(target[:, start:end].squeeze(0))
37 | start = end
38 | return level_targets
39 |
40 |
41 | def unmap(data, count, inds, fill=0):
42 | """ Unmap a subset of item (data) back to the original set of items (of
43 | size count) """
44 | if data.dim() == 1:
45 | ret = data.new_full((count, ), fill)
46 | ret[inds.type(torch.bool)] = data
47 | else:
48 | new_size = (count, ) + data.size()[1:]
49 | ret = data.new_full(new_size, fill)
50 | ret[inds.type(torch.bool), :] = data
51 | return ret
--------------------------------------------------------------------------------
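A quick sketch of the multi_apply pattern: the per-item tuples returned by the mapped function are transposed into per-field lists (the toy function here is hypothetical; the detection head uses the same trick to run one function per image or per feature level):

    from nanodet.util.misc import multi_apply

    def square_and_cube(x):
        return x ** 2, x ** 3

    squares, cubes = multi_apply(square_and_cube, [1, 2, 3])
    # squares == [1, 4, 9], cubes == [1, 8, 27]
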
/nanodet/util/path.py:
--------------------------------------------------------------------------------
1 | import os
2 | from .rank_filter import rank_filter
3 |
4 |
5 | @rank_filter
6 | def mkdir(path):
7 | if not os.path.exists(path):
8 | os.makedirs(path)
9 |
--------------------------------------------------------------------------------
/nanodet/util/rank_filter.py:
--------------------------------------------------------------------------------
1 |
2 | def rank_filter(func):
3 | def func_filter(local_rank=-1, *args, **kwargs):
4 | if local_rank < 1:
5 | return func(*args, **kwargs)
6 | else:
7 | pass
8 | return func_filter
9 |
--------------------------------------------------------------------------------
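Because mkdir is wrapped by rank_filter, its first positional argument is consumed as local_rank, which is why callers throughout the repo write mkdir(local_rank, path). A small illustration (the directory name is arbitrary):

    from nanodet.util import mkdir

    mkdir(0, './workspace/demo_run')   # rank 0 (or single process): directory is created
    mkdir(1, './workspace/demo_run')   # rank >= 1: the decorated call is a no-op
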
/nanodet/util/scatter_gather.py:
--------------------------------------------------------------------------------
1 | import torch
2 | from torch.autograd import Variable
3 | from torch.nn.parallel._functions import Scatter
4 |
5 |
6 | def list_scatter(input, target_gpus, chunk_sizes):
7 | ret = []
8 | for idx, size in enumerate(chunk_sizes):
9 | ret.append(input[:size])
10 | del input[:size]
11 | return tuple(ret)
12 |
13 | def scatter(inputs, target_gpus, dim=0, chunk_sizes=None):
14 | """
15 | Slices variables into approximately equal chunks and
16 | distributes them across given GPUs. Duplicates
17 | references to objects that are not variables. Does not
18 | support Tensors.
19 | """
20 | def scatter_map(obj):
21 | if isinstance(obj, Variable):
22 | return Scatter.apply(target_gpus, chunk_sizes, dim, obj)
23 | assert not torch.is_tensor(obj), "Tensors not supported in scatter."
24 | if isinstance(obj, list):
25 | return list_scatter(obj, target_gpus, chunk_sizes)
26 | if isinstance(obj, tuple):
27 | return list(zip(*map(scatter_map, obj)))
28 | if isinstance(obj, dict):
29 | return list(map(type(obj), zip(*map(scatter_map, obj.items()))))
30 | return [obj for targets in target_gpus]
31 |
32 | return scatter_map(inputs)
33 |
34 |
35 | def scatter_kwargs(inputs, kwargs, target_gpus, dim=0, chunk_sizes=None):
36 | r"""Scatter with support for kwargs dictionary"""
37 | inputs = scatter(inputs, target_gpus, dim, chunk_sizes) if inputs else []
38 | kwargs = scatter(kwargs, target_gpus, dim, chunk_sizes) if kwargs else []
39 | if len(inputs) < len(kwargs):
40 | inputs.extend([() for _ in range(len(kwargs) - len(inputs))])
41 | elif len(kwargs) < len(inputs):
42 | kwargs.extend([{} for _ in range(len(inputs) - len(kwargs))])
43 | inputs = tuple(inputs)
44 | kwargs = tuple(kwargs)
45 | return inputs, kwargs
--------------------------------------------------------------------------------
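This scatter mirrors torch.nn.parallel's version but lets the caller choose uneven chunk sizes; plain Python lists are sliced by list_scatter, while Variables go through Scatter.apply and therefore need real CUDA devices. A CPU-only sketch of the list path (the data is made up):

    from nanodet.util.scatter_gather import scatter

    batch_meta = ['img_0', 'img_1', 'img_2', 'img_3', 'img_4']
    chunks = scatter(batch_meta, target_gpus=[0, 1], chunk_sizes=[3, 2])
    # chunks == (['img_0', 'img_1', 'img_2'], ['img_3', 'img_4'])
    # note: list_scatter consumes the input list in place (del input[:size])
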
/nanodet/util/util_mixins.py:
--------------------------------------------------------------------------------
1 | """This module defines the :class:`NiceRepr` mixin class, which defines a
2 | ``__repr__`` and ``__str__`` method that only depend on a custom ``__nice__``
3 | method, which you must define. This means you only have to overload one
4 | function instead of two. Furthermore, if the object defines a ``__len__``
5 | method, then the ``__nice__`` method defaults to something sensible, otherwise
6 | it is treated as abstract and raises ``NotImplementedError``.
7 |
8 | To use simply have your object inherit from :class:`NiceRepr`
9 | (multi-inheritance should be ok).
10 |
11 | This code was copied from the ubelt library: https://github.com/Erotemic/ubelt
12 |
13 | Example:
14 | >>> # Objects that define __nice__ have a default __str__ and __repr__
15 | >>> class Student(NiceRepr):
16 | ... def __init__(self, name):
17 | ... self.name = name
18 | ... def __nice__(self):
19 | ... return self.name
20 | >>> s1 = Student('Alice')
21 | >>> s2 = Student('Bob')
22 | >>> print(f's1 = {s1}')
23 | >>> print(f's2 = {s2}')
24 | s1 = <Student(Alice)>
25 | s2 = <Student(Bob)>
26 |
27 | Example:
28 | >>> # Objects that define __len__ have a default __nice__
29 | >>> class Group(NiceRepr):
30 | ... def __init__(self, data):
31 | ... self.data = data
32 | ... def __len__(self):
33 | ... return len(self.data)
34 | >>> g = Group([1, 2, 3])
35 | >>> print(f'g = {g}')
36 | g = <Group(3)>
37 | """
38 | import warnings
39 |
40 |
41 | class NiceRepr(object):
42 | """Inherit from this class and define ``__nice__`` to "nicely" print your
43 | objects.
44 |
45 | Defines ``__str__`` and ``__repr__`` in terms of ``__nice__`` function
46 | Classes that inherit from :class:`NiceRepr` should redefine ``__nice__``.
47 | If the inheriting class has a ``__len__`` method, then the default
48 | ``__nice__`` method will return its length.
49 |
50 | Example:
51 | >>> class Foo(NiceRepr):
52 | ... def __nice__(self):
53 | ... return 'info'
54 | >>> foo = Foo()
55 | >>> assert str(foo) == '<Foo(info)>'
56 | >>> assert repr(foo).startswith('<Foo(info) at ')
57 |
58 | Example:
59 | >>> class Bar(NiceRepr):
60 | ... pass
61 | >>> bar = Bar()
62 | >>> import pytest
63 | >>> with pytest.warns(None) as record:
64 | >>> assert 'object at' in str(bar)
65 | >>> assert 'object at' in repr(bar)
66 |
67 | Example:
68 | >>> class Baz(NiceRepr):
69 | ... def __len__(self):
70 | ... return 5
71 | >>> baz = Baz()
72 | >>> assert str(baz) == '<Baz(5)>'
73 | """
74 |
75 | def __nice__(self):
76 | """str: a "nice" summary string describing this module"""
77 | if hasattr(self, '__len__'):
78 | # It is a common pattern for objects to use __len__ in __nice__
79 | # As a convenience we define a default __nice__ for these objects
80 | return str(len(self))
81 | else:
82 | # In all other cases force the subclass to overload __nice__
83 | raise NotImplementedError(
84 | f'Define the __nice__ method for {self.__class__!r}')
85 |
86 | def __repr__(self):
87 | """str: the string of the module"""
88 | try:
89 | nice = self.__nice__()
90 | classname = self.__class__.__name__
91 | return f'<{classname}({nice}) at {hex(id(self))}>'
92 | except NotImplementedError as ex:
93 | warnings.warn(str(ex), category=RuntimeWarning)
94 | return object.__repr__(self)
95 |
96 | def __str__(self):
97 | """str: the string of the module"""
98 | try:
99 | classname = self.__class__.__name__
100 | nice = self.__nice__()
101 | return f'<{classname}({nice})>'
102 | except NotImplementedError as ex:
103 | warnings.warn(str(ex), category=RuntimeWarning)
104 | return object.__repr__(self)
105 |
--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
1 | Cython
2 | termcolor
3 | numpy
4 | torch>=1.6
5 | torchvision
6 | tensorboard
7 | pycocotools
8 | matplotlib
9 | pyaml
10 | opencv-python
11 | tqdm
12 | pytorch-lightning>=1.2.5
13 | torchmetrics
--------------------------------------------------------------------------------
/setup.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python
2 | from setuptools import find_packages, setup
3 |
4 | __version__ = "0.3.0"
5 |
6 | if __name__ == '__main__':
7 | setup(
8 | name='nanodet',
9 | version=__version__,
10 | description='Deep Learning Object Detection Toolbox',
11 | url='https://github.com/RangiLyu/nanodet',
12 | author='RangiLyu',
13 | author_email='lyuchqi@gmail.com',
14 | keywords='deep learning',
15 | packages=find_packages(exclude=('config', 'tools', 'demo')),
16 | classifiers=[
17 | 'Development Status :: 4 - Beta',
18 | 'License :: OSI Approved :: Apache Software License',
19 | 'Operating System :: OS Independent',
20 | 'Programming Language :: Python :: 3.5',
21 | 'Programming Language :: Python :: 3.6',
22 | 'Programming Language :: Python :: 3.7',
23 | 'Programming Language :: Python :: 3.8',
24 | ],
25 | license='Apache License 2.0',
26 | zip_safe=False)
27 |
--------------------------------------------------------------------------------
/tools/convert_old_checkpoint.py:
--------------------------------------------------------------------------------
1 | # Copyright 2021 RangiLyu.
2 | #
3 | # Licensed under the Apache License, Version 2.0 (the "License");
4 | # you may not use this file except in compliance with the License.
5 | # You may obtain a copy of the License at
6 | #
7 | # http://www.apache.org/licenses/LICENSE-2.0
8 | #
9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 |
15 | import os
16 | import argparse
17 | import torch
18 |
19 | from nanodet.util import convert_old_model
20 |
21 |
22 | def parse_args():
23 | parser = argparse.ArgumentParser(
24 | formatter_class=argparse.ArgumentDefaultsHelpFormatter,
25 | description='Convert old .pth model checkpoint to pytorch-lightning .ckpt checkpoint.')
26 | parser.add_argument('--file_path',
27 | type=str,
28 | help='Path to .pth checkpoint.')
29 | parser.add_argument('--out_path',
30 | type=str,
31 | help='Path to .ckpt checkpoint.')
32 | return parser.parse_args()
33 |
34 |
35 | if __name__ == '__main__':
36 | args = parse_args()
37 | file_path = args.file_path
38 | out_path = args.out_path
39 | old_check_point = torch.load(file_path)
40 | new_check_point = convert_old_model(old_check_point)
41 | torch.save(new_check_point, out_path)
42 | print("Checkpoint saved to:", out_path)
43 |
--------------------------------------------------------------------------------
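A typical invocation (the workspace paths below are placeholders for wherever the old .pth checkpoint lives):

    python tools/convert_old_checkpoint.py \
        --file_path workspace/nanodet_m/model_best/model_best.pth \
        --out_path workspace/nanodet_m/model_best/nanodet_m.ckpt
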
/tools/deprecated/test.py:
--------------------------------------------------------------------------------
1 | import os
2 | import torch
3 | import json
4 | import datetime
5 | import argparse
6 | import warnings
7 |
8 | from nanodet.util import mkdir, Logger, cfg, load_config
9 | from nanodet.trainer import build_trainer
10 | from nanodet.data.collate import collate_function
11 | from nanodet.data.dataset import build_dataset
12 | from nanodet.model.arch import build_model
13 | from nanodet.evaluator import build_evaluator
14 |
15 |
16 | def parse_args():
17 | parser = argparse.ArgumentParser()
18 | parser.add_argument('--task', type=str, default='val', help='task to run, test or val')
19 | parser.add_argument('--config', type=str, help='model config file(.yml) path')
20 | parser.add_argument('--model', type=str, help='model weight file(.pth) path')
21 | parser.add_argument('--save_result', action='store_true', default=True, help='save val results to txt')
22 | args = parser.parse_args()
23 | return args
24 |
25 |
26 | def main(args):
27 | warnings.warn('Warning! Old testing code is deprecated and will be deleted '
28 | 'in the next version. Please use tools/test.py instead.')
29 | load_config(cfg, args.config)
30 | local_rank = -1
31 | torch.backends.cudnn.enabled = True
32 | torch.backends.cudnn.benchmark = True
33 | cfg.defrost()
34 | timestr = datetime.datetime.now().__format__('%Y%m%d%H%M%S')
35 | cfg.save_dir = os.path.join(cfg.save_dir, timestr)
36 | cfg.freeze()
37 | mkdir(local_rank, cfg.save_dir)
38 | logger = Logger(local_rank, cfg.save_dir)
39 |
40 | logger.log('Creating model...')
41 | model = build_model(cfg.model)
42 |
43 | logger.log('Setting up data...')
44 | val_dataset = build_dataset(cfg.data.val, args.task)
45 | val_dataloader = torch.utils.data.DataLoader(val_dataset, batch_size=1, shuffle=False, num_workers=1,
46 | pin_memory=True, collate_fn=collate_function, drop_last=True)
47 | trainer = build_trainer(local_rank, cfg, model, logger)
48 | cfg.schedule.update({'load_model': args.model})
49 | trainer.load_model(cfg)
50 | evaluator = build_evaluator(cfg, val_dataset)
51 | logger.log('Starting testing...')
52 | with torch.no_grad():
53 | results, val_loss_dict = trainer.run_epoch(0, val_dataloader, mode=args.task)
54 | if args.task == 'test':
55 | res_json = evaluator.results2json(results)
56 | json_path = os.path.join(cfg.save_dir, 'results{}.json'.format(timestr))
57 | json.dump(res_json, open(json_path, 'w'))
58 | elif args.task == 'val':
59 | eval_results = evaluator.evaluate(results, cfg.save_dir, rank=local_rank)
60 | if args.save_result:
61 | txt_path = os.path.join(cfg.save_dir, "eval_results{}.txt".format(timestr))
62 | with open(txt_path, "a") as f:
63 | for k, v in eval_results.items():
64 | f.write("{}: {}\n".format(k, v))
65 |
66 |
67 | if __name__ == '__main__':
68 | args = parse_args()
69 | main(args)
70 |
--------------------------------------------------------------------------------
/tools/deprecated/train.py:
--------------------------------------------------------------------------------
1 | import os
2 | import torch
3 | import logging
4 | import warnings
5 | import argparse
6 | import numpy as np
7 | import torch.distributed as dist
8 |
9 | from nanodet.util import mkdir, Logger, cfg, load_config
10 | from nanodet.trainer import build_trainer
11 | from nanodet.data.collate import collate_function
12 | from nanodet.data.dataset import build_dataset
13 | from nanodet.model.arch import build_model
14 | from nanodet.evaluator import build_evaluator
15 |
16 |
17 | def parse_args():
18 | parser = argparse.ArgumentParser()
19 | parser.add_argument('config', help='train config file path')
20 | parser.add_argument('--local_rank', default=-1, type=int,
21 | help='node rank for distributed training')
22 | parser.add_argument('--seed', type=int, default=None,
23 | help='random seed')
24 | args = parser.parse_args()
25 | return args
26 |
27 |
28 | def init_seeds(seed=0):
29 | """
30 | manually set a random seed for numpy, torch and cuda
31 | :param seed: random seed
32 | """
33 | torch.manual_seed(seed)
34 | np.random.seed(seed)
35 | torch.cuda.manual_seed(seed)
36 | torch.cuda.manual_seed_all(seed)
37 | if seed == 0:
38 | torch.backends.cudnn.deterministic = True
39 | torch.backends.cudnn.benchmark = False
40 |
41 |
42 | def main(args):
43 | warnings.warn('Warning! Old training code is deprecated and will be deleted '
44 | 'in the next version. Please use tools/train.py instead.')
45 | load_config(cfg, args.config)
46 | local_rank = int(args.local_rank)
47 | torch.backends.cudnn.enabled = True
48 | torch.backends.cudnn.benchmark = True
49 | mkdir(local_rank, cfg.save_dir)
50 | logger = Logger(local_rank, cfg.save_dir)
51 | if args.seed is not None:
52 | logger.log('Set random seed to {}'.format(args.seed))
53 | init_seeds(args.seed)
54 |
55 | logger.log('Creating model...')
56 | model = build_model(cfg.model)
57 |
58 | logger.log('Setting up data...')
59 | train_dataset = build_dataset(cfg.data.train, 'train')
60 | val_dataset = build_dataset(cfg.data.val, 'test')
61 |
62 | if len(cfg.device.gpu_ids) > 1:
63 | print('rank = ', local_rank)
64 | num_gpus = torch.cuda.device_count()
65 | torch.cuda.set_device(local_rank % num_gpus)
66 | dist.init_process_group(backend='nccl')
67 | train_sampler = torch.utils.data.distributed.DistributedSampler(train_dataset)
68 | train_dataloader = torch.utils.data.DataLoader(train_dataset, batch_size=cfg.device.batchsize_per_gpu,
69 | num_workers=cfg.device.workers_per_gpu, pin_memory=True,
70 | collate_fn=collate_function, sampler=train_sampler,
71 | drop_last=True)
72 | else:
73 | train_dataloader = torch.utils.data.DataLoader(train_dataset, batch_size=cfg.device.batchsize_per_gpu,
74 | shuffle=True, num_workers=cfg.device.workers_per_gpu,
75 | pin_memory=True, collate_fn=collate_function, drop_last=True)
76 |
77 | val_dataloader = torch.utils.data.DataLoader(val_dataset, batch_size=1, shuffle=False, num_workers=1,
78 | pin_memory=True, collate_fn=collate_function, drop_last=True)
79 |
80 | trainer = build_trainer(local_rank, cfg, model, logger)
81 |
82 | if 'load_model' in cfg.schedule:
83 | trainer.load_model(cfg)
84 | if 'resume' in cfg.schedule:
85 | trainer.resume(cfg)
86 |
87 | evaluator = build_evaluator(cfg, val_dataset)
88 |
89 | logger.log('Starting training...')
90 | trainer.run(train_dataloader, val_dataloader, evaluator)
91 |
92 |
93 | if __name__ == '__main__':
94 | args = parse_args()
95 | main(args)
96 |
--------------------------------------------------------------------------------
/tools/export_onnx.py:
--------------------------------------------------------------------------------
1 | import os
2 | import argparse
3 | import torch
4 | from nanodet.model.arch import build_model
5 | from nanodet.util import Logger, cfg, load_config, load_model_weight
6 |
7 |
8 | def generate_ouput_names(head_cfg):
9 | cls_names, dis_names = [], []
10 | for stride in head_cfg.strides:
11 | cls_names.append('cls_pred_stride_{}'.format(stride))
12 | dis_names.append('dis_pred_stride_{}'.format(stride))
13 | return cls_names + dis_names
14 |
15 |
16 | def main(config, model_path, output_path, input_shape=(320, 320)):
17 | logger = Logger(-1, config.save_dir, False)
18 | model = build_model(config.model)
19 | checkpoint = torch.load(model_path, map_location=lambda storage, loc: storage)
20 | load_model_weight(model, checkpoint, logger)
21 | if config.model.arch.backbone.name == 'RepVGG':
22 | deploy_config = config.model
23 | deploy_config.arch.backbone.update({'deploy': True})
24 | deploy_model = build_model(deploy_config)
25 | from nanodet.model.backbone.repvgg import repvgg_det_model_convert
26 | model = repvgg_det_model_convert(model, deploy_model)
27 | dummy_input = torch.autograd.Variable(torch.randn(1, 3, input_shape[0], input_shape[1]))
28 | output_names = None
29 | # if config.model.arch.head.name == 'NanoDetHead':
30 | # output_names = generate_ouput_names(config.model.arch.head)
31 | torch.onnx.export(model,
32 | dummy_input,
33 | output_path,
34 | verbose=True,
35 | keep_initializers_as_inputs=True,
36 | opset_version=11,
37 | output_names=output_names)
38 | logger.log('finished exporting onnx ')
39 |
40 |
41 | def parse_args():
42 | parser = argparse.ArgumentParser(
43 | formatter_class=argparse.ArgumentDefaultsHelpFormatter,
44 | description='Convert .pth model to onnx.')
45 | parser.add_argument('--cfg_path',
46 | type=str,
47 | help='Path to .yml config file.')
48 | parser.add_argument('--model_path',
49 | type=str,
50 | default=None,
51 | help='Path to .ckpt model.')
52 | parser.add_argument('--out_path',
53 | type=str,
54 | default='nanodet.onnx',
55 | help='Onnx model output path.')
56 | parser.add_argument('--input_shape',
57 | type=str,
58 | default=None,
59 | help='Model input shape.')
60 | return parser.parse_args()
61 |
62 |
63 | if __name__ == '__main__':
64 | args = parse_args()
65 | cfg_path = args.cfg_path
66 | model_path = args.model_path
67 | out_path = args.out_path
68 | input_shape = args.input_shape
69 | load_config(cfg, cfg_path)
70 | if input_shape is None:
71 | input_shape = cfg.data.train.input_size
72 | else:
73 | input_shape = tuple(map(int, input_shape.split(',')))
74 | assert len(input_shape) == 2
75 | if model_path is None:
76 | model_path = os.path.join(cfg.save_dir, "model_best/model_best.ckpt")
77 | main(cfg, model_path, out_path, input_shape)
78 | print("Model saved to:", out_path)
79 |
--------------------------------------------------------------------------------
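An example export command (the checkpoint path is a placeholder; omitting --model_path falls back to <save_dir>/model_best/model_best.ckpt, and omitting --input_shape uses the training input size from the config):

    python tools/export_onnx.py \
        --cfg_path config/nanodet-m.yml \
        --model_path workspace/nanodet_m/model_best/model_best.ckpt \
        --out_path nanodet.onnx \
        --input_shape 320,320
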
/tools/export_torchscript.py:
--------------------------------------------------------------------------------
1 | import os
2 | import argparse
3 | import torch
4 | from nanodet.model.arch import build_model
5 | from nanodet.util import Logger, cfg, load_config, load_model_weight
6 |
7 |
8 | def main(config, model_path: str, output_path: str, input_shape=(320, 320)):
9 | logger = Logger(local_rank=-1, save_dir=config.save_dir, use_tensorboard=False)
10 |
11 | # Create model and load weights
12 | model = build_model(config.model)
13 | checkpoint = torch.load(model_path, map_location=lambda storage, loc: storage)
14 | load_model_weight(model, checkpoint, logger)
15 |
16 | # Convert backbone weights for RepVGG models
17 | if config.model.arch.backbone.name == 'RepVGG':
18 | deploy_config = config.model
19 | deploy_config.arch.backbone.update({'deploy': True})
20 | deploy_model = build_model(deploy_config)
21 | from nanodet.model.backbone.repvgg import repvgg_det_model_convert
22 | model = repvgg_det_model_convert(model, deploy_model)
23 |
24 | # TorchScript: tracing the model with dummy inputs
25 | with torch.no_grad():
26 | dummy_input = torch.zeros(1, 3, input_shape[0], input_shape[1]) # Batch size = 1
27 | model.eval().cpu()
28 | model_traced = torch.jit.trace(model, example_inputs=dummy_input).eval()
29 | model_traced.save(output_path)
30 | print('Finished export to TorchScript')
31 |
32 |
33 | def parse_args():
34 | parser = argparse.ArgumentParser(
35 | formatter_class=argparse.ArgumentDefaultsHelpFormatter,
36 | description='Convert .pth model weights to TorchScript.')
37 | parser.add_argument('--cfg_path',
38 | type=str,
39 | help='Path to .yml config file.')
40 | parser.add_argument('--model_path',
41 | type=str,
42 | default=None,
43 | help='Path to .ckpt model.')
44 | parser.add_argument('--out_path',
45 | type=str,
46 | default='nanodet.torchscript.pth',
47 | help='TorchScript model output path.')
48 | parser.add_argument('--input_shape',
49 | type=str,
50 | default=None,
51 | help='Model input shape.')
52 | return parser.parse_args()
53 |
54 |
55 | if __name__ == '__main__':
56 | args = parse_args()
57 | cfg_path = args.cfg_path
58 | model_path = args.model_path
59 | out_path = args.out_path
60 | input_shape = args.input_shape
61 | load_config(cfg, cfg_path)
62 | if input_shape is None:
63 | input_shape = cfg.data.train.input_size
64 | else:
65 | input_shape = tuple(map(int, input_shape.split(',')))
66 | assert len(input_shape) == 2
67 | if model_path is None:
68 | model_path = os.path.join(cfg.save_dir, "model_best/model_best.ckpt")
69 | main(cfg, model_path, out_path, input_shape)
70 | print("Model saved to:", out_path)
71 |
--------------------------------------------------------------------------------
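A typical export, followed by a quick standalone check that the traced module loads without the nanodet codebase (paths and shape match the script defaults):

    python tools/export_torchscript.py --cfg_path config/nanodet-m.yml --out_path nanodet.torchscript.pth

then, in Python:

    import torch

    model = torch.jit.load('nanodet.torchscript.pth')
    preds = model(torch.zeros(1, 3, 320, 320))   # same shape as the tracing dummy input
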
/tools/flops.py:
--------------------------------------------------------------------------------
1 | import torch
2 | from nanodet.model.arch import build_model
3 | from nanodet.util import cfg, load_config, get_model_complexity_info
4 |
5 |
6 | def main(config, input_shape=(3, 320, 320)):
7 | model = build_model(config.model)
8 | flops, params = get_model_complexity_info(model, input_shape)
9 | split_line = '=' * 30
10 | print(f'{split_line}\nInput shape: {input_shape}\n'
11 | f'Flops: {flops}\nParams: {params}\n{split_line}')
12 |
13 |
14 | if __name__ == '__main__':
15 | cfg_path = r"config/nanodet-m.yml"
16 | load_config(cfg, cfg_path)
17 | main(config=cfg,
18 | input_shape=(3, 320, 320)
19 | )
20 |
--------------------------------------------------------------------------------
/tools/inference.py:
--------------------------------------------------------------------------------
1 | import os
2 | import cv2
3 | import time
4 | import torch
5 |
6 | from nanodet.model.arch import build_model
7 | from nanodet.util import load_model_weight
8 | from nanodet.data.transform import Pipeline
9 |
10 |
11 | class Predictor(object):
12 | def __init__(self, cfg, model_path, logger, device='cuda:0'):
13 | self.cfg = cfg
14 | self.device = device
15 | model = build_model(cfg.model)
16 | ckpt = torch.load(model_path, map_location=lambda storage, loc: storage)
17 | load_model_weight(model, ckpt, logger)
18 | if cfg.model.arch.backbone.name == 'RepVGG':
19 | deploy_config = cfg.model
20 | deploy_config.arch.backbone.update({'deploy': True})
21 | deploy_model = build_model(deploy_config)
22 | from nanodet.model.backbone.repvgg import repvgg_det_model_convert
23 | model = repvgg_det_model_convert(model, deploy_model)
24 | self.model = model.to(device).eval()
25 | self.pipeline = Pipeline(cfg.data.val.pipeline, cfg.data.val.keep_ratio)
26 |
27 | def inference(self, img):
28 | img_info = {}
29 | if isinstance(img, str):
30 | img_info['file_name'] = os.path.basename(img)
31 | img = cv2.imread(img)
32 | else:
33 | img_info['file_name'] = None
34 |
35 | height, width = img.shape[:2]
36 | img_info['height'] = height
37 | img_info['width'] = width
38 | meta = dict(img_info=img_info,
39 | raw_img=img,
40 | img=img)
41 | meta = self.pipeline(meta, self.cfg.data.val.input_size)
42 | meta['img'] = torch.from_numpy(meta['img'].transpose(2, 0, 1)).unsqueeze(0).to(self.device)
43 | with torch.no_grad():
44 | results = self.model.inference(meta)
45 | return meta, results
46 |
47 | def visualize(self, dets, meta, class_names, score_thres, wait=0):
48 | time1 = time.time()
49 | self.model.head.show_result(meta['raw_img'], dets, class_names, score_thres=score_thres, show=True)
50 | print('viz time: {:.3f}s'.format(time.time()-time1))
51 |
--------------------------------------------------------------------------------
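A rough sketch of driving Predictor directly (config, checkpoint and image paths are placeholders, and the exact structure of results follows the head's post-processing):

    import torch
    from nanodet.util import cfg, load_config, Logger
    from tools.inference import Predictor   # assumes the repo root is on sys.path; otherwise copy the class

    load_config(cfg, 'config/nanodet-m.yml')
    logger = Logger(-1, use_tensorboard=False)
    device = 'cuda:0' if torch.cuda.is_available() else 'cpu'

    predictor = Predictor(cfg, 'workspace/nanodet_m/model_best.ckpt', logger, device=device)
    meta, results = predictor.inference('demo.jpg')
    predictor.visualize(results, meta, cfg.class_names, score_thres=0.35)
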
/tools/show_dataset.py:
--------------------------------------------------------------------------------
1 | import os
2 | import torch
3 | import argparse
4 | import numpy as np
5 | import cv2
6 | import warnings
7 | import pytorch_lightning as pl
8 | from pytorch_lightning.callbacks import ProgressBar
9 |
10 | from nanodet.util import mkdir, Logger, cfg, load_config, convert_old_model
11 | from nanodet.data.collate import collate_function
12 | from nanodet.data.dataset import build_dataset
13 | from nanodet.trainer.task import TrainingTask
14 | from nanodet.evaluator import build_evaluator
15 |
16 | def parse_args():
17 | parser = argparse.ArgumentParser()
18 | parser.add_argument('config', help='train config file path')
19 | parser.add_argument('--local_rank', default=-1, type=int,
20 | help='node rank for distributed training')
21 | parser.add_argument('--seed', type=int, default=None,
22 | help='random seed')
23 | args = parser.parse_args()
24 | return args
25 |
26 |
27 | def main(args):
28 | load_config(cfg, args.config)
29 | if cfg.model.arch.head.num_classes != len(cfg.class_names):
30 | raise ValueError('cfg.model.arch.head.num_classes must equal len(cfg.class_names), but got {} and {}'.format(cfg.model.arch.head.num_classes, len(cfg.class_names)))
31 | local_rank = int(args.local_rank)
32 | torch.backends.cudnn.enabled = True
33 | torch.backends.cudnn.benchmark = True
34 | mkdir(local_rank, cfg.save_dir)
35 | logger = Logger(local_rank, cfg.save_dir)
36 |
37 | if args.seed is not None:
38 | logger.log('Set random seed to {}'.format(args.seed))
39 | pl.seed_everything(args.seed)
40 |
41 | logger.log('Setting up data...')
42 | # print(cfg.data.train)
43 | train_dataset = build_dataset(cfg.data.train, 'train')
44 | val_dataset = build_dataset(cfg.data.val, 'test')
45 |
46 | evaluator = build_evaluator(cfg, val_dataset)
47 |
48 | show_cnt = 0
49 | for meta in train_dataset:
50 | img = meta['img'].numpy().transpose(1,2,0).copy()
51 | #cv2.imshow('gray',np.ones(img.shape,dtype=np.float32) * 0.5)
52 | #print(meta['gt_bboxes'])
53 | #print(img.shape)
54 | for idx in range(len(meta['gt_bboxes'])):
55 | rect = meta['gt_bboxes'][idx]
56 | #print(rect[0])
57 | label = meta['gt_labels'][idx]
58 | #print(label)
59 | cv2.rectangle(img, (int(rect[0]),int(rect[1])),(int(rect[2]),int(rect[3])),(0, 255, 0), 1)
60 | cv2.putText(img,str(cfg.class_names[label]),(int(rect[0]),int(rect[1] + 1.5)),cv2.FONT_HERSHEY_SIMPLEX,0.7,(0,255,0),1)
61 | cv2.imshow('dataset_img',img)
62 | cv2.waitKey(0)
63 |
64 | show_cnt += 1
65 | if show_cnt > 50:
66 | break
67 |
68 |
69 | if __name__ == '__main__':
70 | args = parse_args()
71 | main(args)
--------------------------------------------------------------------------------
/tools/test.py:
--------------------------------------------------------------------------------
1 | # Copyright 2021 RangiLyu.
2 | #
3 | # Licensed under the Apache License, Version 2.0 (the "License");
4 | # you may not use this file except in compliance with the License.
5 | # You may obtain a copy of the License at
6 | #
7 | # http://www.apache.org/licenses/LICENSE-2.0
8 | #
9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 |
15 | import os
16 | import torch
17 | import json
18 | import datetime
19 | import argparse
20 | import warnings
21 | import pytorch_lightning as pl
22 |
23 | from nanodet.util import mkdir, Logger, cfg, load_config, convert_old_model
24 | from nanodet.data.collate import collate_function
25 | from nanodet.data.dataset import build_dataset
26 | from nanodet.trainer.task import TrainingTask
27 | from nanodet.evaluator import build_evaluator
28 |
29 |
30 | def parse_args():
31 | parser = argparse.ArgumentParser()
32 | parser.add_argument('--task', type=str, default='val', help='task to run, test or val')
33 | parser.add_argument('--config', type=str, help='model config file(.yml) path')
34 | parser.add_argument('--model', type=str, help='checkpoint file(.ckpt) path')
35 | args = parser.parse_args()
36 | return args
37 |
38 |
39 | def main(args):
40 | load_config(cfg, args.config)
41 | local_rank = -1
42 | torch.backends.cudnn.enabled = True
43 | torch.backends.cudnn.benchmark = True
44 | cfg.defrost()
45 | timestr = datetime.datetime.now().__format__('%Y%m%d%H%M%S')
46 | cfg.save_dir = os.path.join(cfg.save_dir, timestr)
47 | mkdir(local_rank, cfg.save_dir)
48 | logger = Logger(local_rank, cfg.save_dir)
49 |
50 | assert args.task in ['val', 'test']
51 | cfg.update({'test_mode': args.task})
52 |
53 | logger.log('Setting up data...')
54 | val_dataset = build_dataset(cfg.data.val, args.task)
55 | val_dataloader = torch.utils.data.DataLoader(val_dataset, batch_size=1, shuffle=False,
56 | num_workers=cfg.device.workers_per_gpu,
57 | pin_memory=True, collate_fn=collate_function, drop_last=True)
58 | evaluator = build_evaluator(cfg, val_dataset)
59 |
60 | logger.log('Creating model...')
61 | task = TrainingTask(cfg, evaluator)
62 |
63 | ckpt = torch.load(args.model)
64 | if 'pytorch-lightning_version' not in ckpt:
65 | warnings.warn('Warning! Old .pth checkpoint is deprecated. '
66 | 'Convert the checkpoint with tools/convert_old_checkpoint.py ')
67 | ckpt = convert_old_model(ckpt)
68 | task.load_state_dict(ckpt['state_dict'])
69 |
70 | trainer = pl.Trainer(default_root_dir=cfg.save_dir,
71 | gpus=cfg.device.gpu_ids,
72 | accelerator='ddp',
73 | log_every_n_steps=cfg.log.interval,
74 | num_sanity_val_steps=0,
75 | )
76 | logger.log('Starting testing...')
77 | trainer.test(task, val_dataloader)
78 |
79 |
80 | if __name__ == '__main__':
81 | args = parse_args()
82 | main(args)
83 |
--------------------------------------------------------------------------------
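Evaluation is typically launched with the new-style .ckpt weights (paths are placeholders; --task accepts val or test):

    python tools/test.py --task val --config config/nanodet-m.yml --model workspace/nanodet_m/model_best/model_best.ckpt
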
/tools/train.py:
--------------------------------------------------------------------------------
1 | # Copyright 2021 RangiLyu.
2 | #
3 | # Licensed under the Apache License, Version 2.0 (the "License");
4 | # you may not use this file except in compliance with the License.
5 | # You may obtain a copy of the License at
6 | #
7 | # http://www.apache.org/licenses/LICENSE-2.0
8 | #
9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 |
15 | import os
16 | import torch
17 | import argparse
18 | import numpy as np
19 | import warnings
20 | import pytorch_lightning as pl
21 | from pytorch_lightning.callbacks import ProgressBar
22 |
23 | from nanodet.util import mkdir, Logger, cfg, load_config, convert_old_model
24 | from nanodet.data.collate import collate_function
25 | from nanodet.data.dataset import build_dataset
26 | from nanodet.trainer.task import TrainingTask
27 | from nanodet.evaluator import build_evaluator
28 |
29 |
30 | def parse_args():
31 | parser = argparse.ArgumentParser()
32 | parser.add_argument('config', help='train config file path')
33 | parser.add_argument('--local_rank', default=-1, type=int,
34 | help='node rank for distributed training')
35 | parser.add_argument('--seed', type=int, default=None,
36 | help='random seed')
37 | args = parser.parse_args()
38 | return args
39 |
40 |
41 | def main(args):
42 | load_config(cfg, args.config)
43 | if cfg.model.arch.head.num_classes != len(cfg.class_names):
44 | raise ValueError('cfg.model.arch.head.num_classes must equal len(cfg.class_names), but got {} and {}'.format(cfg.model.arch.head.num_classes, len(cfg.class_names)))
45 | local_rank = int(args.local_rank)
46 | torch.backends.cudnn.enabled = True
47 | torch.backends.cudnn.benchmark = True
48 | mkdir(local_rank, cfg.save_dir)
49 | logger = Logger(local_rank, cfg.save_dir)
50 |
51 | if args.seed is not None:
52 | logger.log('Set random seed to {}'.format(args.seed))
53 | pl.seed_everything(args.seed)
54 |
55 | logger.log('Setting up data...')
56 | train_dataset = build_dataset(cfg.data.train, 'train')
57 | val_dataset = build_dataset(cfg.data.val, 'test')
58 |
59 | evaluator = build_evaluator(cfg, val_dataset)
60 |
61 | train_dataloader = torch.utils.data.DataLoader(train_dataset, batch_size=cfg.device.batchsize_per_gpu,
62 | shuffle=True, num_workers=cfg.device.workers_per_gpu,
63 | pin_memory=True, collate_fn=collate_function, drop_last=True)
64 | # TODO: batch eval
65 | val_dataloader = torch.utils.data.DataLoader(val_dataset, batch_size=1, shuffle=False,
66 | num_workers=cfg.device.workers_per_gpu,
67 | pin_memory=True, collate_fn=collate_function, drop_last=True)
68 |
69 | logger.log('Creating model...')
70 | task = TrainingTask(cfg, evaluator)
71 |
72 | if 'load_model' in cfg.schedule:
73 | ckpt = torch.load(cfg.schedule.load_model)
74 | if 'pytorch-lightning_version' not in ckpt:
75 | warnings.warn('Warning! Old .pth checkpoint is deprecated. '
76 | 'Convert the checkpoint with tools/convert_old_checkpoint.py ')
77 | ckpt = convert_old_model(ckpt)
78 | task.load_state_dict(ckpt['state_dict'])
79 |
80 | model_resume_path = os.path.join(cfg.save_dir, 'model_last.ckpt') if 'resume' in cfg.schedule else None
81 |
82 | trainer = pl.Trainer(default_root_dir=cfg.save_dir,
83 | max_epochs=cfg.schedule.total_epochs,
84 | gpus=cfg.device.gpu_ids,
85 | check_val_every_n_epoch=cfg.schedule.val_intervals,
86 | accelerator='ddp',
87 | log_every_n_steps=cfg.log.interval,
88 | num_sanity_val_steps=0,
89 | resume_from_checkpoint=model_resume_path,
90 | callbacks=[ProgressBar(refresh_rate=0)] # disable tqdm bar
91 | )
92 |
93 | trainer.fit(task, train_dataloader, val_dataloader)
94 |
95 |
96 | if __name__ == '__main__':
97 | args = parse_args()
98 | main(args)
99 |
--------------------------------------------------------------------------------
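The config file is a positional argument, so a typical single-machine run looks like this (seed optional; GPUs are taken from device.gpu_ids in the config):

    python tools/train.py config/nanodet-m.yml --seed 42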