13 | The visual feature pyramid has demonstrated its superiority in both effectiveness and efficiency across a wide range of applications. However, existing methods focus excessively on inter-layer feature interactions while ignoring intra-layer feature regulation, which has been empirically shown to be beneficial. Although some methods try to learn a compact intra-layer feature representation with the help of the attention mechanism or the vision transformer, they overlook corner regions, which are important for dense prediction tasks. To address this problem, we propose a Centralized Feature Pyramid (CFP) for object detection, built on a globally explicit centralized feature regulation. Specifically, we first propose a spatially explicit visual center scheme, where a lightweight MLP captures global long-range dependencies and a parallel learnable visual center mechanism captures the local corner regions of the input images. Based on this, we then propose a globally centralized regulation of the commonly used feature pyramid in a top-down fashion, where the explicit visual center information obtained from the deepest intra-layer feature is used to regulate the shallower features. Compared with existing feature pyramids, CFP not only captures global long-range dependencies but also efficiently obtains an all-round yet discriminative feature representation. Experimental results on the challenging MS-COCO dataset validate that our proposed CFP achieves consistent performance gains on the state-of-the-art YOLOv5 and YOLOX object detection baselines.
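For readers who prefer code, the sketch below illustrates the two parallel branches behind the explicit visual center at a conceptual level: a lightweight MLP over flattened spatial tokens for global long-range dependencies, and a learnable codebook of "visual centers" that re-weights local features. This is a simplified illustration only, not the implementation in this repository; the module names, codebook size, and gating/aggregation details are placeholders.

```
import torch
import torch.nn as nn

class ExplicitVisualCenterSketch(nn.Module):
    """Conceptual sketch: an MLP branch for global context plus a
    learnable visual-center (codebook) branch for local detail."""

    def __init__(self, channels, num_codes=64):
        super().__init__()
        # Global branch: a channel MLP applied to every spatial token.
        self.mlp = nn.Sequential(
            nn.LayerNorm(channels),
            nn.Linear(channels, channels * 2),
            nn.GELU(),
            nn.Linear(channels * 2, channels),
        )
        # Local branch: a learnable codebook acting as "visual centers".
        self.codebook = nn.Parameter(torch.randn(num_codes, channels))
        self.scale = nn.Parameter(torch.ones(num_codes))
        self.fc = nn.Linear(channels, channels)

    def forward(self, x):
        b, c, h, w = x.shape
        tokens = x.flatten(2).transpose(1, 2)              # (B, HW, C)

        # Global long-range dependencies via the lightweight MLP (residual).
        global_feat = self.mlp(tokens) + tokens

        # Soft-assign every token to the learnable visual centers.
        diff = tokens.unsqueeze(2) - self.codebook         # (B, HW, K, C)
        assign = torch.softmax(-self.scale * diff.pow(2).sum(-1), dim=2)
        centers = (assign.unsqueeze(-1) * diff).sum(1)     # (B, K, C)
        gate = torch.sigmoid(self.fc(centers.mean(1)))     # (B, C) channel gate
        local_feat = tokens * gate.unsqueeze(1)

        # Concatenate the two branches and fold back to a feature map.
        out = torch.cat([global_feat, local_feat], dim=2)  # (B, HW, 2C)
        return out.transpose(1, 2).reshape(b, 2 * c, h, w)
```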
14 |
15 | ## The overall architecture
16 | 
17 |
18 | ## Qualitative results
19 | 
20 |
21 | ## Quantitative results and trained weights
22 | We provide trained weights of CFP with YOLOX and YOLOv5 as baselines.
23 |
24 | | Model | Size | mAP (%) | Weights |
25 | | :--- | :---: | :---: | :---: |
26 | | CFP-s (YOLOX)| 640 | 41.10 | [weight](https://pan.baidu.com/disk/main#/index?category=all&path=%2FCFP-main%2Fweights) |
27 | | CFP-m (YOLOX)| 640 | 46.40 | [weight](https://pan.baidu.com/disk/main#/index?category=all&path=%2FCFP-main%2Fweights) |
28 | | CFP-l (YOLOX)| 640 | 49.40 | [weight](https://pan.baidu.com/disk/main#/index?category=all&path=%2FCFP-main%2Fweights) |
29 | | CFP-s (YOLOv5)| 640 | 36.00 | [weight](https://pan.baidu.com/disk/main#/index?category=all&path=%2FCFP-main%2Fweights) |
30 | | CFP-m (YOLOv5)| 640 | 43.20 | [weight](https://pan.baidu.com/disk/main#/index?category=all&path=%2FCFP-main%2Fweights) |
31 | | CFP-l (YOLOv5)| 640 | 46.60 | [weight](https://pan.baidu.com/disk/main#/index?category=all&path=%2FCFP-main%2Fweights) |
32 |
33 | ## Installation
34 | #### - Install CFP-main from source
35 | ```
36 | git clone git@github.com:QY1994-0919/CFP-main.git
37 | cd CFP-main
38 | pip3 install -v -e . # or python3 setup.py develop
39 | ```
40 |
41 | #### - Prepare COCO dataset
42 | ```
43 | cd CFP-main
44 | ln -s /path/to/your/COCO ./datasets/COCO
45 | ```
46 |
47 | ## Usage
48 | #### - To train the model, please run:
49 | ```
50 | python -m cfp.tools.train -f cfp-s -d 2 -b 16 --fp16 -o [--cache]
51 | python -m cfp.tools.train -f cfp-m -d 2 -b 16 --fp16 -o [--cache]
52 | python -m cfp.tools.train -f cfp-l -d 2 -b 16 --fp16 -o [--cache]
53 | ```
54 |
55 | #### - To test the model, please run:
56 | ```
57 | python -m cfp.tools.eval -n cfp-s -c cfp_s.pth -b 16 -d 2 --conf 0.001 [--fp16] [--fuse]
58 | python -m cfp.tools.eval -n cfp-m -c cfp_m.pth -b 16 -d 2 --conf 0.001 [--fp16] [--fuse]
59 | python -m cfp.tools.eval -n cfp-l -c cfp_l.pth -b 16 -d 2 --conf 0.001 [--fp16] [--fuse]
60 | ```
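
As a rough illustration, trained weights can also be loaded directly in Python. The sketch below assumes CFP keeps the YOLOX-style experiment API under the `cfp` package; `get_exp`, the experiment name, and the checkpoint key are assumptions and may need adjusting for this repository.

```
import torch
from cfp.exp import get_exp  # assumed to mirror yolox.exp.get_exp

exp = get_exp(exp_name="cfp-s")          # name used with "-n" in the eval command
model = exp.get_model().eval()
ckpt = torch.load("cfp_s.pth", map_location="cpu")
model.load_state_dict(ckpt["model"])     # YOLOX-style checkpoints store weights under "model"

with torch.no_grad():
    dummy = torch.randn(1, 3, 640, 640)  # 640 is the input size listed in the table above
    outputs = model(dummy)
```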
61 |
62 | ## Acknowledgement
63 | Thanks to the [YOLOv5](https://github.com/ultralytics/yolov5) and [YOLOX](https://arxiv.org/abs/2107.08430) teams for their wonderful open-source projects!
64 |
65 | ## Bibtex
66 | If you find this work useful for your research, please cite our paper:
67 | ```
68 | @article{quan2022centralized,
69 |   title={Centralized Feature Pyramid for Object Detection},
70 |   author={Quan, Yu and Zhang, Dong and Zhang, Liyan and Tang, Jinhui},
71 |   journal={arXiv preprint},
72 |   year={2022}}
73 | ```
74 |
--------------------------------------------------------------------------------
/cfp/core/launch.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- coding:utf-8 -*-
3 | # Code is based on
4 | # https://github.com/facebookresearch/detectron2/blob/master/detectron2/engine/launch.py
5 | # Copyright (c) Facebook, Inc. and its affiliates.
6 | # Copyright (c) Megvii, Inc. and its affiliates.
7 |
8 | import sys
9 | from datetime import timedelta
10 | from loguru import logger
11 |
12 | import torch
13 | import torch.distributed as dist
14 | import torch.multiprocessing as mp
15 |
16 | import cfp.utils.dist as comm
17 |
18 | __all__ = ["launch"]
19 |
20 |
21 | DEFAULT_TIMEOUT = timedelta(minutes=30)
22 |
23 |
24 | def _find_free_port():
25 | """
26 | Find an available port of current machine / node.
27 | """
28 | import socket
29 |
30 | sock = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
31 | # Binding to port 0 will cause the OS to find an available port for us
32 | sock.bind(("", 0))
33 | port = sock.getsockname()[1]
34 | sock.close()
35 | # NOTE: there is still a chance the port could be taken by other processes.
36 | return port
37 |
38 |
39 | def launch(
40 | main_func,
41 | num_gpus_per_machine,
42 | num_machines=1,
43 | machine_rank=0,
44 | backend="nccl",
45 | dist_url=None,
46 | args=(),
47 | timeout=DEFAULT_TIMEOUT,
48 | ):
49 | """
50 | Args:
51 | main_func: a function that will be called by `main_func(*args)`
52 | num_machines (int): the total number of machines
53 | machine_rank (int): the rank of this machine (one per machine)
54 | dist_url (str): url to connect to for distributed training, including protocol
55 | e.g. "tcp://127.0.0.1:8686".
56 | Can be set to auto to automatically select a free port on localhost
57 | args (tuple): arguments passed to main_func
58 | """
59 | world_size = num_machines * num_gpus_per_machine
60 | if world_size > 1:
61 | # https://github.com/pytorch/pytorch/pull/14391
62 | # TODO prctl in spawned processes
63 |
64 | if dist_url == "auto":
65 | assert (
66 | num_machines == 1
67 |             ), "dist_url=auto is not supported for multi-machine training."
68 | port = _find_free_port()
69 | dist_url = f"tcp://127.0.0.1:{port}"
70 |
71 | start_method = "spawn"
72 | cache = vars(args[1]).get("cache", False)
73 |
74 | # To use numpy memmap for caching image into RAM, we have to use fork method
75 | if cache:
76 | assert sys.platform != "win32", (
77 | "As Windows platform doesn't support fork method, "
78 | "do not add --cache in your training command."
79 | )
80 | start_method = "fork"
81 |
82 | mp.start_processes(
83 | _distributed_worker,
84 | nprocs=num_gpus_per_machine,
85 | args=(
86 | main_func,
87 | world_size,
88 | num_gpus_per_machine,
89 | machine_rank,
90 | backend,
91 | dist_url,
92 | args,
93 | ),
94 | daemon=False,
95 | start_method=start_method,
96 | )
97 | else:
98 | main_func(*args)
99 |
100 |
101 | def _distributed_worker(
102 | local_rank,
103 | main_func,
104 | world_size,
105 | num_gpus_per_machine,
106 | machine_rank,
107 | backend,
108 | dist_url,
109 | args,
110 | timeout=DEFAULT_TIMEOUT,
111 | ):
112 | assert (
113 | torch.cuda.is_available()
114 | ), "cuda is not available. Please check your installation."
115 | global_rank = machine_rank * num_gpus_per_machine + local_rank
116 | logger.info("Rank {} initialization finished.".format(global_rank))
117 | try:
118 | dist.init_process_group(
119 | backend=backend,
120 | init_method=dist_url,
121 | world_size=world_size,
122 | rank=global_rank,
123 | timeout=timeout,
124 | )
125 | except Exception:
126 | logger.error("Process group URL: {}".format(dist_url))
127 | raise
128 |
129 | # Setup the local process group (which contains ranks within the same machine)
130 | assert comm._LOCAL_PROCESS_GROUP is None
131 | num_machines = world_size // num_gpus_per_machine
132 | for i in range(num_machines):
133 | ranks_on_i = list(
134 | range(i * num_gpus_per_machine, (i + 1) * num_gpus_per_machine)
135 | )
136 | pg = dist.new_group(ranks_on_i)
137 | if i == machine_rank:
138 | comm._LOCAL_PROCESS_GROUP = pg
139 |
140 | # synchronize is needed here to prevent a possible timeout after calling init_process_group
141 | # See: https://github.com/facebookresearch/maskrcnn-benchmark/issues/172
142 | comm.synchronize()
143 |
144 | assert num_gpus_per_machine <= torch.cuda.device_count()
145 | torch.cuda.set_device(local_rank)
146 |
147 | main_func(*args)
148 |
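A minimal sketch of how `launch` above can be driven. The worker body is a placeholder; with one GPU on one machine, `world_size == 1`, so `launch` simply calls the worker in-process and no process group is created.

```
import argparse
from cfp.core.launch import launch  # module shown above

def main(exp_name, args):
    # Placeholder worker; a real entry point would build the trainer here.
    print(f"training {exp_name}, cache={args.cache}")

if __name__ == "__main__":
    cli = argparse.Namespace(cache=False)  # launch() reads args[1].cache when spawning workers
    launch(
        main,
        num_gpus_per_machine=1,
        num_machines=1,
        machine_rank=0,
        dist_url="auto",   # in the multi-process path this would resolve to a free local port
        args=("cfp-s", cli),
    )
```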
--------------------------------------------------------------------------------
/cfp/utils/boxes.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- coding:utf-8 -*-
3 | # Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
4 |
5 | import numpy as np
6 |
7 | import torch
8 | import torchvision
9 |
10 | __all__ = [
11 | "filter_box",
12 | "postprocess",
13 | "bboxes_iou",
14 | "matrix_iou",
15 | "adjust_box_anns",
16 | "xyxy2xywh",
17 | "xyxy2cxcywh",
18 | ]
19 |
20 |
21 | def filter_box(output, scale_range):
22 | """
23 | output: (N, 5+class) shape
24 | """
25 | min_scale, max_scale = scale_range
26 | w = output[:, 2] - output[:, 0]
27 | h = output[:, 3] - output[:, 1]
28 | keep = (w * h > min_scale * min_scale) & (w * h < max_scale * max_scale)
29 | return output[keep]
30 |
31 |
32 | def postprocess(prediction, num_classes, conf_thre=0.7, nms_thre=0.45, class_agnostic=False):
33 | box_corner = prediction.new(prediction.shape)
34 | box_corner[:, :, 0] = prediction[:, :, 0] - prediction[:, :, 2] / 2
35 | box_corner[:, :, 1] = prediction[:, :, 1] - prediction[:, :, 3] / 2
36 | box_corner[:, :, 2] = prediction[:, :, 0] + prediction[:, :, 2] / 2
37 | box_corner[:, :, 3] = prediction[:, :, 1] + prediction[:, :, 3] / 2
38 | prediction[:, :, :4] = box_corner[:, :, :4]
39 |
40 | output = [None for _ in range(len(prediction))]
41 | for i, image_pred in enumerate(prediction):
42 |
43 | # If none are remaining => process next image
44 | if not image_pred.size(0):
45 | continue
46 | # Get score and class with highest confidence
47 | class_conf, class_pred = torch.max(image_pred[:, 5: 5 + num_classes], 1, keepdim=True)
48 |
49 | conf_mask = (image_pred[:, 4] * class_conf.squeeze() >= conf_thre).squeeze()
50 | # Detections ordered as (x1, y1, x2, y2, obj_conf, class_conf, class_pred)
51 | detections = torch.cat((image_pred[:, :5], class_conf, class_pred.float()), 1)
52 | detections = detections[conf_mask]
53 | if not detections.size(0):
54 | continue
55 |
56 | if class_agnostic:
57 | nms_out_index = torchvision.ops.nms(
58 | detections[:, :4],
59 | detections[:, 4] * detections[:, 5],
60 | nms_thre,
61 | )
62 | else:
63 | nms_out_index = torchvision.ops.batched_nms(
64 | detections[:, :4],
65 | detections[:, 4] * detections[:, 5],
66 | detections[:, 6],
67 | nms_thre,
68 | )
69 |
70 | detections = detections[nms_out_index]
71 | if output[i] is None:
72 | output[i] = detections
73 | else:
74 | output[i] = torch.cat((output[i], detections))
75 |
76 | return output
77 |
78 |
79 | def bboxes_iou(bboxes_a, bboxes_b, xyxy=True):
80 | if bboxes_a.shape[1] != 4 or bboxes_b.shape[1] != 4:
81 | raise IndexError
82 |
83 | if xyxy:
84 | tl = torch.max(bboxes_a[:, None, :2], bboxes_b[:, :2])
85 | br = torch.min(bboxes_a[:, None, 2:], bboxes_b[:, 2:])
86 | area_a = torch.prod(bboxes_a[:, 2:] - bboxes_a[:, :2], 1)
87 | area_b = torch.prod(bboxes_b[:, 2:] - bboxes_b[:, :2], 1)
88 | else:
89 | tl = torch.max(
90 | (bboxes_a[:, None, :2] - bboxes_a[:, None, 2:] / 2),
91 | (bboxes_b[:, :2] - bboxes_b[:, 2:] / 2),
92 | )
93 | br = torch.min(
94 | (bboxes_a[:, None, :2] + bboxes_a[:, None, 2:] / 2),
95 | (bboxes_b[:, :2] + bboxes_b[:, 2:] / 2),
96 | )
97 |
98 | area_a = torch.prod(bboxes_a[:, 2:], 1)
99 | area_b = torch.prod(bboxes_b[:, 2:], 1)
100 | en = (tl < br).type(tl.type()).prod(dim=2)
101 | area_i = torch.prod(br - tl, 2) * en # * ((tl < br).all())
102 | return area_i / (area_a[:, None] + area_b - area_i)
103 |
104 |
105 | def matrix_iou(a, b):
106 | """
107 |     Return IoU of a and b, numpy version for data augmentation.
108 | """
109 | lt = np.maximum(a[:, np.newaxis, :2], b[:, :2])
110 | rb = np.minimum(a[:, np.newaxis, 2:], b[:, 2:])
111 |
112 | area_i = np.prod(rb - lt, axis=2) * (lt < rb).all(axis=2)
113 | area_a = np.prod(a[:, 2:] - a[:, :2], axis=1)
114 | area_b = np.prod(b[:, 2:] - b[:, :2], axis=1)
115 | return area_i / (area_a[:, np.newaxis] + area_b - area_i + 1e-12)
116 |
117 |
118 | def adjust_box_anns(bbox, scale_ratio, padw, padh, w_max, h_max):
119 | bbox[:, 0::2] = np.clip(bbox[:, 0::2] * scale_ratio + padw, 0, w_max)
120 | bbox[:, 1::2] = np.clip(bbox[:, 1::2] * scale_ratio + padh, 0, h_max)
121 | return bbox
122 |
123 |
124 | def xyxy2xywh(bboxes):
125 | bboxes[:, 2] = bboxes[:, 2] - bboxes[:, 0]
126 | bboxes[:, 3] = bboxes[:, 3] - bboxes[:, 1]
127 | return bboxes
128 |
129 |
130 | def xyxy2cxcywh(bboxes):
131 | bboxes[:, 2] = bboxes[:, 2] - bboxes[:, 0]
132 | bboxes[:, 3] = bboxes[:, 3] - bboxes[:, 1]
133 | bboxes[:, 0] = bboxes[:, 0] + bboxes[:, 2] * 0.5
134 | bboxes[:, 1] = bboxes[:, 1] + bboxes[:, 3] * 0.5
135 | return bboxes
136 |
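A small usage sketch of the box utilities above, on toy tensors rather than real detections:

```
import torch
from cfp.utils.boxes import bboxes_iou, xyxy2cxcywh

a = torch.tensor([[0., 0., 10., 10.], [5., 5., 15., 15.]])
b = torch.tensor([[0., 0., 10., 10.]])
print(bboxes_iou(a, b, xyxy=True))   # (2, 1) IoU matrix: 1.0 and ~0.143
print(xyxy2cxcywh(a.clone()))        # the conversion mutates its input, so clone to keep `a`
```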
--------------------------------------------------------------------------------
/exps/example/yolox_voc/yolox_voc_s.py:
--------------------------------------------------------------------------------
1 | # encoding: utf-8
2 | import os
3 |
4 | import torch
5 | import torch.distributed as dist
6 |
7 | from cfp.data import get_yolox_datadir
8 | from cfp.exp import Exp as MyExp
9 |
10 |
11 | class Exp(MyExp):
12 | def __init__(self):
13 | super(Exp, self).__init__()
14 | self.num_classes = 20
15 | self.depth = 0.33
16 | self.width = 0.50
17 | self.warmup_epochs = 1
18 |
19 | # ---------- transform config ------------ #
20 | self.mosaic_prob = 1.0
21 | self.mixup_prob = 1.0
22 | self.hsv_prob = 1.0
23 | self.flip_prob = 0.5
24 |
25 | self.exp_name = os.path.split(os.path.realpath(__file__))[1].split(".")[0]
26 |
27 | def get_data_loader(self, batch_size, is_distributed, no_aug=False, cache_img=False):
28 |         from cfp.data import (
29 | VOCDetection,
30 | TrainTransform,
31 | YoloBatchSampler,
32 | DataLoader,
33 | InfiniteSampler,
34 | MosaicDetection,
35 | worker_init_reset_seed,
36 | )
37 |         from cfp.utils import (
38 | wait_for_the_master,
39 | get_local_rank,
40 | )
41 | local_rank = get_local_rank()
42 |
43 | with wait_for_the_master(local_rank):
44 | dataset = VOCDetection(
45 |                 data_dir=os.path.join(get_yolox_datadir(), "VOCdevkit"),
46 |                 image_sets=[('2007', 'trainval'), ('2012', 'trainval')],
47 | img_size=self.input_size,
48 | preproc=TrainTransform(
49 | max_labels=50,
50 | flip_prob=self.flip_prob,
51 | hsv_prob=self.hsv_prob),
52 | cache=cache_img,
53 | )
54 |
55 | dataset = MosaicDetection(
56 | dataset,
57 | mosaic=not no_aug,
58 | img_size=self.input_size,
59 | preproc=TrainTransform(
60 | max_labels=120,
61 | flip_prob=self.flip_prob,
62 | hsv_prob=self.hsv_prob),
63 | degrees=self.degrees,
64 | translate=self.translate,
65 | mosaic_scale=self.mosaic_scale,
66 | mixup_scale=self.mixup_scale,
67 | shear=self.shear,
68 | enable_mixup=self.enable_mixup,
69 | mosaic_prob=self.mosaic_prob,
70 | mixup_prob=self.mixup_prob,
71 | )
72 |
73 | self.dataset = dataset
74 |
75 | if is_distributed:
76 | batch_size = batch_size // dist.get_world_size()
77 |
78 | sampler = InfiniteSampler(
79 | len(self.dataset), seed=self.seed if self.seed else 0
80 | )
81 |
82 | batch_sampler = YoloBatchSampler(
83 | sampler=sampler,
84 | batch_size=batch_size,
85 | drop_last=False,
86 | mosaic=not no_aug,
87 | )
88 |
89 | dataloader_kwargs = {"num_workers": self.data_num_workers, "pin_memory": True}
90 | dataloader_kwargs["batch_sampler"] = batch_sampler
91 |
92 | # Make sure each process has different random seed, especially for 'fork' method
93 | dataloader_kwargs["worker_init_fn"] = worker_init_reset_seed
94 |
95 | train_loader = DataLoader(self.dataset, **dataloader_kwargs)
96 |
97 | return train_loader
98 |
99 | def get_eval_loader(self, batch_size, is_distributed, testdev=False, legacy=False):
100 |         from cfp.data import VOCDetection, ValTransform
101 |
102 | valdataset = VOCDetection(
103 | data_dir=os.path.join(get_yolox_datadir(), "VOCdevkit"),
104 | image_sets=[('2007', 'test')],
105 | img_size=self.test_size,
106 | preproc=ValTransform(legacy=legacy),
107 | )
108 |
109 | if is_distributed:
110 | batch_size = batch_size // dist.get_world_size()
111 | sampler = torch.utils.data.distributed.DistributedSampler(
112 | valdataset, shuffle=False
113 | )
114 | else:
115 | sampler = torch.utils.data.SequentialSampler(valdataset)
116 |
117 | dataloader_kwargs = {
118 | "num_workers": self.data_num_workers,
119 | "pin_memory": True,
120 | "sampler": sampler,
121 | }
122 | dataloader_kwargs["batch_size"] = batch_size
123 | val_loader = torch.utils.data.DataLoader(valdataset, **dataloader_kwargs)
124 |
125 | return val_loader
126 |
127 | def get_evaluator(self, batch_size, is_distributed, testdev=False, legacy=False):
128 |         from cfp.evaluators import VOCEvaluator
129 |
130 | val_loader = self.get_eval_loader(batch_size, is_distributed, testdev, legacy)
131 | evaluator = VOCEvaluator(
132 | dataloader=val_loader,
133 | img_size=self.test_size,
134 | confthre=self.test_conf,
135 | nmsthre=self.nmsthre,
136 | num_classes=self.num_classes,
137 | )
138 | return evaluator
139 |
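A tiny sketch that loads the VOC `Exp` above from its file path (the same mechanism the `-f` flag of the training command relies on in YOLOX-style code) and inspects its basic settings without touching any dataset. The relative path assumes the snippet is run from the CFP-main repository root.

```
import importlib.util

spec = importlib.util.spec_from_file_location(
    "yolox_voc_s", "exps/example/yolox_voc/yolox_voc_s.py"
)
mod = importlib.util.module_from_spec(spec)
spec.loader.exec_module(mod)

exp = mod.Exp()
print(exp.num_classes, exp.depth, exp.width)  # 20 0.33 0.5
```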
--------------------------------------------------------------------------------
/demo/ncnn/android/gradlew:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env sh
2 |
3 | ##############################################################################
4 | ##
5 | ## Gradle start up script for UN*X
6 | ##
7 | ##############################################################################
8 |
9 | # Attempt to set APP_HOME
10 | # Resolve links: $0 may be a link
11 | PRG="$0"
12 | # Need this for relative symlinks.
13 | while [ -h "$PRG" ] ; do
14 | ls=`ls -ld "$PRG"`
15 | link=`expr "$ls" : '.*-> \(.*\)$'`
16 | if expr "$link" : '/.*' > /dev/null; then
17 | PRG="$link"
18 | else
19 | PRG=`dirname "$PRG"`"/$link"
20 | fi
21 | done
22 | SAVED="`pwd`"
23 | cd "`dirname \"$PRG\"`/" >/dev/null
24 | APP_HOME="`pwd -P`"
25 | cd "$SAVED" >/dev/null
26 |
27 | APP_NAME="Gradle"
28 | APP_BASE_NAME=`basename "$0"`
29 |
30 | # Add default JVM options here. You can also use JAVA_OPTS and GRADLE_OPTS to pass JVM options to this script.
31 | DEFAULT_JVM_OPTS=""
32 |
33 | # Use the maximum available, or set MAX_FD != -1 to use that value.
34 | MAX_FD="maximum"
35 |
36 | warn () {
37 | echo "$*"
38 | }
39 |
40 | die () {
41 | echo
42 | echo "$*"
43 | echo
44 | exit 1
45 | }
46 |
47 | # OS specific support (must be 'true' or 'false').
48 | cygwin=false
49 | msys=false
50 | darwin=false
51 | nonstop=false
52 | case "`uname`" in
53 | CYGWIN* )
54 | cygwin=true
55 | ;;
56 | Darwin* )
57 | darwin=true
58 | ;;
59 | MINGW* )
60 | msys=true
61 | ;;
62 | NONSTOP* )
63 | nonstop=true
64 | ;;
65 | esac
66 |
67 | CLASSPATH=$APP_HOME/gradle/wrapper/gradle-wrapper.jar
68 |
69 | # Determine the Java command to use to start the JVM.
70 | if [ -n "$JAVA_HOME" ] ; then
71 | if [ -x "$JAVA_HOME/jre/sh/java" ] ; then
72 | # IBM's JDK on AIX uses strange locations for the executables
73 | JAVACMD="$JAVA_HOME/jre/sh/java"
74 | else
75 | JAVACMD="$JAVA_HOME/bin/java"
76 | fi
77 | if [ ! -x "$JAVACMD" ] ; then
78 | die "ERROR: JAVA_HOME is set to an invalid directory: $JAVA_HOME
79 |
80 | Please set the JAVA_HOME variable in your environment to match the
81 | location of your Java installation."
82 | fi
83 | else
84 | JAVACMD="java"
85 | which java >/dev/null 2>&1 || die "ERROR: JAVA_HOME is not set and no 'java' command could be found in your PATH.
86 |
87 | Please set the JAVA_HOME variable in your environment to match the
88 | location of your Java installation."
89 | fi
90 |
91 | # Increase the maximum file descriptors if we can.
92 | if [ "$cygwin" = "false" -a "$darwin" = "false" -a "$nonstop" = "false" ] ; then
93 | MAX_FD_LIMIT=`ulimit -H -n`
94 | if [ $? -eq 0 ] ; then
95 | if [ "$MAX_FD" = "maximum" -o "$MAX_FD" = "max" ] ; then
96 | MAX_FD="$MAX_FD_LIMIT"
97 | fi
98 | ulimit -n $MAX_FD
99 | if [ $? -ne 0 ] ; then
100 | warn "Could not set maximum file descriptor limit: $MAX_FD"
101 | fi
102 | else
103 | warn "Could not query maximum file descriptor limit: $MAX_FD_LIMIT"
104 | fi
105 | fi
106 |
107 | # For Darwin, add options to specify how the application appears in the dock
108 | if $darwin; then
109 | GRADLE_OPTS="$GRADLE_OPTS \"-Xdock:name=$APP_NAME\" \"-Xdock:icon=$APP_HOME/media/gradle.icns\""
110 | fi
111 |
112 | # For Cygwin, switch paths to Windows format before running java
113 | if $cygwin ; then
114 | APP_HOME=`cygpath --path --mixed "$APP_HOME"`
115 | CLASSPATH=`cygpath --path --mixed "$CLASSPATH"`
116 | JAVACMD=`cygpath --unix "$JAVACMD"`
117 |
118 | # We build the pattern for arguments to be converted via cygpath
119 | ROOTDIRSRAW=`find -L / -maxdepth 1 -mindepth 1 -type d 2>/dev/null`
120 | SEP=""
121 | for dir in $ROOTDIRSRAW ; do
122 | ROOTDIRS="$ROOTDIRS$SEP$dir"
123 | SEP="|"
124 | done
125 | OURCYGPATTERN="(^($ROOTDIRS))"
126 | # Add a user-defined pattern to the cygpath arguments
127 | if [ "$GRADLE_CYGPATTERN" != "" ] ; then
128 | OURCYGPATTERN="$OURCYGPATTERN|($GRADLE_CYGPATTERN)"
129 | fi
130 | # Now convert the arguments - kludge to limit ourselves to /bin/sh
131 | i=0
132 | for arg in "$@" ; do
133 | CHECK=`echo "$arg"|egrep -c "$OURCYGPATTERN" -`
134 | CHECK2=`echo "$arg"|egrep -c "^-"` ### Determine if an option
135 |
136 | if [ $CHECK -ne 0 ] && [ $CHECK2 -eq 0 ] ; then ### Added a condition
137 | eval `echo args$i`=`cygpath --path --ignore --mixed "$arg"`
138 | else
139 | eval `echo args$i`="\"$arg\""
140 | fi
141 | i=$((i+1))
142 | done
143 | case $i in
144 | (0) set -- ;;
145 | (1) set -- "$args0" ;;
146 | (2) set -- "$args0" "$args1" ;;
147 | (3) set -- "$args0" "$args1" "$args2" ;;
148 | (4) set -- "$args0" "$args1" "$args2" "$args3" ;;
149 | (5) set -- "$args0" "$args1" "$args2" "$args3" "$args4" ;;
150 | (6) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" ;;
151 | (7) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" ;;
152 | (8) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" "$args7" ;;
153 | (9) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" "$args7" "$args8" ;;
154 | esac
155 | fi
156 |
157 | # Escape application args
158 | save () {
159 | for i do printf %s\\n "$i" | sed "s/'/'\\\\''/g;1s/^/'/;\$s/\$/' \\\\/" ; done
160 | echo " "
161 | }
162 | APP_ARGS=$(save "$@")
163 |
164 | # Collect all arguments for the java command, following the shell quoting and substitution rules
165 | eval set -- $DEFAULT_JVM_OPTS $JAVA_OPTS $GRADLE_OPTS "\"-Dorg.gradle.appname=$APP_BASE_NAME\"" -classpath "\"$CLASSPATH\"" org.gradle.wrapper.GradleWrapperMain "$APP_ARGS"
166 |
167 | # by default we should be in the correct project dir, but when run from Finder on Mac, the cwd is wrong
168 | if [ "$(uname)" = "Darwin" ] && [ "$HOME" = "$PWD" ]; then
169 | cd "$(dirname "$0")"
170 | fi
171 |
172 | exec "$JAVACMD" "$@"
173 |
--------------------------------------------------------------------------------
/demo/MegEngine/python/models/darknet.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- encoding: utf-8 -*-
3 | # Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
4 |
5 | import megengine.module as M
6 |
7 | from .network_blocks import BaseConv, CSPLayer, DWConv, Focus, ResLayer, SPPBottleneck
8 |
9 |
10 | class Darknet(M.Module):
11 | # number of blocks from dark2 to dark5.
12 | depth2blocks = {21: [1, 2, 2, 1], 53: [2, 8, 8, 4]}
13 |
14 | def __init__(
15 | self, depth, in_channels=3, stem_out_channels=32, out_features=("dark3", "dark4", "dark5"),
16 | ):
17 | """
18 | Args:
19 | depth (int): depth of darknet used in model, usually use [21, 53] for this param.
20 | in_channels (int): number of input channels, for example, use 3 for RGB image.
21 |             stem_out_channels (int): number of output channels of darknet stem.
22 | It decides channels of darknet layer2 to layer5.
23 | out_features (Tuple[str]): desired output layer name.
24 | """
25 | super().__init__()
26 | assert out_features, "please provide output features of Darknet"
27 | self.out_features = out_features
28 | self.stem = M.Sequential(
29 | BaseConv(in_channels, stem_out_channels, ksize=3, stride=1, act="lrelu"),
30 | *self.make_group_layer(stem_out_channels, num_blocks=1, stride=2),
31 | )
32 | in_channels = stem_out_channels * 2 # 64
33 |
34 | num_blocks = Darknet.depth2blocks[depth]
35 | # create darknet with `stem_out_channels` and `num_blocks` layers.
36 | # to make model structure more clear, we don't use `for` statement in python.
37 | self.dark2 = M.Sequential(*self.make_group_layer(in_channels, num_blocks[0], stride=2))
38 | in_channels *= 2 # 128
39 | self.dark3 = M.Sequential(*self.make_group_layer(in_channels, num_blocks[1], stride=2))
40 | in_channels *= 2 # 256
41 | self.dark4 = M.Sequential(*self.make_group_layer(in_channels, num_blocks[2], stride=2))
42 | in_channels *= 2 # 512
43 |
44 | self.dark5 = M.Sequential(
45 | *self.make_group_layer(in_channels, num_blocks[3], stride=2),
46 | *self.make_spp_block([in_channels, in_channels * 2], in_channels * 2),
47 | )
48 |
49 | def make_group_layer(self, in_channels: int, num_blocks: int, stride: int = 1):
50 | "starts with conv layer then has `num_blocks` `ResLayer`"
51 | return [
52 | BaseConv(in_channels, in_channels * 2, ksize=3, stride=stride, act="lrelu"),
53 | *[(ResLayer(in_channels * 2)) for _ in range(num_blocks)]
54 | ]
55 |
56 | def make_spp_block(self, filters_list, in_filters):
57 | m = M.Sequential(
58 | *[
59 | BaseConv(in_filters, filters_list[0], 1, stride=1, act="lrelu"),
60 | BaseConv(filters_list[0], filters_list[1], 3, stride=1, act="lrelu"),
61 | SPPBottleneck(
62 | in_channels=filters_list[1],
63 | out_channels=filters_list[0],
64 | activation="lrelu"
65 | ),
66 | BaseConv(filters_list[0], filters_list[1], 3, stride=1, act="lrelu"),
67 | BaseConv(filters_list[1], filters_list[0], 1, stride=1, act="lrelu"),
68 | ]
69 | )
70 | return m
71 |
72 | def forward(self, x):
73 | outputs = {}
74 | x = self.stem(x)
75 | outputs["stem"] = x
76 | x = self.dark2(x)
77 | outputs["dark2"] = x
78 | x = self.dark3(x)
79 | outputs["dark3"] = x
80 | x = self.dark4(x)
81 | outputs["dark4"] = x
82 | x = self.dark5(x)
83 | outputs["dark5"] = x
84 | return {k: v for k, v in outputs.items() if k in self.out_features}
85 |
86 |
87 | class CSPDarknet(M.Module):
88 |
89 | def __init__(
90 | self, dep_mul, wid_mul,
91 | out_features=("dark3", "dark4", "dark5"),
92 | depthwise=False, act="silu",
93 | ):
94 | super().__init__()
95 | assert out_features, "please provide output features of Darknet"
96 | self.out_features = out_features
97 | Conv = DWConv if depthwise else BaseConv
98 |
99 | base_channels = int(wid_mul * 64) # 64
100 | base_depth = max(round(dep_mul * 3), 1) # 3
101 |
102 | # stem
103 | self.stem = Focus(3, base_channels, ksize=3, act=act)
104 |
105 | # dark2
106 | self.dark2 = M.Sequential(
107 | Conv(base_channels, base_channels * 2, 3, 2, act=act),
108 | CSPLayer(
109 | base_channels * 2, base_channels * 2,
110 | n=base_depth, depthwise=depthwise, act=act
111 | ),
112 | )
113 |
114 | # dark3
115 | self.dark3 = M.Sequential(
116 | Conv(base_channels * 2, base_channels * 4, 3, 2, act=act),
117 | CSPLayer(
118 | base_channels * 4, base_channels * 4,
119 | n=base_depth * 3, depthwise=depthwise, act=act,
120 | ),
121 | )
122 |
123 | # dark4
124 | self.dark4 = M.Sequential(
125 | Conv(base_channels * 4, base_channels * 8, 3, 2, act=act),
126 | CSPLayer(
127 | base_channels * 8, base_channels * 8,
128 | n=base_depth * 3, depthwise=depthwise, act=act,
129 | ),
130 | )
131 |
132 | # dark5
133 | self.dark5 = M.Sequential(
134 | Conv(base_channels * 8, base_channels * 16, 3, 2, act=act),
135 | SPPBottleneck(base_channels * 16, base_channels * 16, activation=act),
136 | CSPLayer(
137 | base_channels * 16, base_channels * 16, n=base_depth,
138 | shortcut=False, depthwise=depthwise, act=act,
139 | ),
140 | )
141 |
142 | def forward(self, x):
143 | outputs = {}
144 | x = self.stem(x)
145 | outputs["stem"] = x
146 | x = self.dark2(x)
147 | outputs["dark2"] = x
148 | x = self.dark3(x)
149 | outputs["dark3"] = x
150 | x = self.dark4(x)
151 | outputs["dark4"] = x
152 | x = self.dark5(x)
153 | outputs["dark5"] = x
154 | return {k: v for k, v in outputs.items() if k in self.out_features}
155 |
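A quick shape check for the MegEngine `CSPDarknet` above, using a toy input. The relative import assumes the snippet is run from `demo/MegEngine/python`.

```
import numpy as np
import megengine as mge

from models.darknet import CSPDarknet

backbone = CSPDarknet(dep_mul=0.33, wid_mul=0.50)  # "s"-sized depth/width multipliers
x = mge.tensor(np.zeros((1, 3, 640, 640), dtype="float32"))
feats = backbone(x)
for name, feat in feats.items():
    print(name, feat.shape)  # dark3/dark4/dark5 at strides 8/16/32 of the input
```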
--------------------------------------------------------------------------------
/demo/OpenVINO/python/openvino_inference.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python3
2 | # -*- coding: utf-8 -*-
3 | # Copyright (C) 2018-2021 Intel Corporation
4 | # SPDX-License-Identifier: Apache-2.0
5 | # Copyright (c) Megvii, Inc. and its affiliates.
6 |
7 | import argparse
8 | import logging as log
9 | import os
10 | import sys
11 |
12 | import cv2
13 | import numpy as np
14 |
15 | from openvino.inference_engine import IECore
16 |
17 | from cfp.data.data_augment import preproc as preprocess
18 | from cfp.data.datasets import COCO_CLASSES
19 | from cfp.utils import mkdir, multiclass_nms, demo_postprocess, vis
20 |
21 |
22 | def parse_args() -> argparse.Namespace:
23 | """Parse and return command line arguments"""
24 | parser = argparse.ArgumentParser(add_help=False)
25 | args = parser.add_argument_group('Options')
26 | args.add_argument(
27 | '-h',
28 | '--help',
29 | action='help',
30 | help='Show this help message and exit.')
31 | args.add_argument(
32 | '-m',
33 | '--model',
34 | required=True,
35 | type=str,
36 | help='Required. Path to an .xml or .onnx file with a trained model.')
37 | args.add_argument(
38 | '-i',
39 | '--input',
40 | required=True,
41 | type=str,
42 | help='Required. Path to an image file.')
43 | args.add_argument(
44 | '-o',
45 | '--output_dir',
46 | type=str,
47 | default='demo_output',
48 | help='Path to your output dir.')
49 | args.add_argument(
50 | '-s',
51 | '--score_thr',
52 | type=float,
53 | default=0.3,
54 |         help="Score threshold to visualize the result.")
55 | args.add_argument(
56 | '-d',
57 | '--device',
58 | default='CPU',
59 | type=str,
60 | help='Optional. Specify the target device to infer on; CPU, GPU, \
61 | MYRIAD, HDDL or HETERO: is acceptable. The sample will look \
62 | for a suitable plugin for device specified. Default value \
63 | is CPU.')
64 | args.add_argument(
65 | '--labels',
66 | default=None,
67 | type=str,
68 |         help='Optional. Path to a labels mapping file.')
69 | args.add_argument(
70 | '-nt',
71 | '--number_top',
72 | default=10,
73 | type=int,
74 | help='Optional. Number of top results.')
75 | return parser.parse_args()
76 |
77 |
78 | def main():
79 | log.basicConfig(format='[ %(levelname)s ] %(message)s', level=log.INFO, stream=sys.stdout)
80 | args = parse_args()
81 |
82 | # ---------------------------Step 1. Initialize inference engine core--------------------------------------------------
83 | log.info('Creating Inference Engine')
84 | ie = IECore()
85 |
86 | # ---------------------------Step 2. Read a model in OpenVINO Intermediate Representation or ONNX format---------------
87 | log.info(f'Reading the network: {args.model}')
88 | # (.xml and .bin files) or (.onnx file)
89 | net = ie.read_network(model=args.model)
90 |
91 | if len(net.input_info) != 1:
92 | log.error('Sample supports only single input topologies')
93 | return -1
94 | if len(net.outputs) != 1:
95 | log.error('Sample supports only single output topologies')
96 | return -1
97 |
98 | # ---------------------------Step 3. Configure input & output----------------------------------------------------------
99 | log.info('Configuring input and output blobs')
100 | # Get names of input and output blobs
101 | input_blob = next(iter(net.input_info))
102 | out_blob = next(iter(net.outputs))
103 |
104 | # Set input and output precision manually
105 | net.input_info[input_blob].precision = 'FP32'
106 | net.outputs[out_blob].precision = 'FP16'
107 |
108 | # Get a number of classes recognized by a model
109 | num_of_classes = max(net.outputs[out_blob].shape)
110 |
111 | # ---------------------------Step 4. Loading model to the device-------------------------------------------------------
112 | log.info('Loading the model to the plugin')
113 | exec_net = ie.load_network(network=net, device_name=args.device)
114 |
115 | # ---------------------------Step 5. Create infer request--------------------------------------------------------------
116 | # load_network() method of the IECore class with a specified number of requests (default 1) returns an ExecutableNetwork
117 | # instance which stores infer requests. So you already created Infer requests in the previous step.
118 |
119 | # ---------------------------Step 6. Prepare input---------------------------------------------------------------------
120 | origin_img = cv2.imread(args.input)
121 | _, _, h, w = net.input_info[input_blob].input_data.shape
122 | image, ratio = preprocess(origin_img, (h, w))
123 |
124 | # ---------------------------Step 7. Do inference----------------------------------------------------------------------
125 | log.info('Starting inference in synchronous mode')
126 | res = exec_net.infer(inputs={input_blob: image})
127 |
128 | # ---------------------------Step 8. Process output--------------------------------------------------------------------
129 | res = res[out_blob]
130 |
131 | predictions = demo_postprocess(res, (h, w), p6=False)[0]
132 |
133 | boxes = predictions[:, :4]
134 | scores = predictions[:, 4, None] * predictions[:, 5:]
135 |
136 | boxes_xyxy = np.ones_like(boxes)
137 | boxes_xyxy[:, 0] = boxes[:, 0] - boxes[:, 2]/2.
138 | boxes_xyxy[:, 1] = boxes[:, 1] - boxes[:, 3]/2.
139 | boxes_xyxy[:, 2] = boxes[:, 0] + boxes[:, 2]/2.
140 | boxes_xyxy[:, 3] = boxes[:, 1] + boxes[:, 3]/2.
141 | boxes_xyxy /= ratio
142 | dets = multiclass_nms(boxes_xyxy, scores, nms_thr=0.45, score_thr=0.1)
143 |
144 | if dets is not None:
145 | final_boxes = dets[:, :4]
146 | final_scores, final_cls_inds = dets[:, 4], dets[:, 5]
147 | origin_img = vis(origin_img, final_boxes, final_scores, final_cls_inds,
148 | conf=args.score_thr, class_names=COCO_CLASSES)
149 |
150 | mkdir(args.output_dir)
151 | output_path = os.path.join(args.output_dir, os.path.basename(args.input))
152 | cv2.imwrite(output_path, origin_img)
153 |
154 |
155 | if __name__ == '__main__':
156 | sys.exit(main())
157 |
--------------------------------------------------------------------------------