├── .gitignore
├── LICENSE
├── README.md
├── app
    ├── README.md
    └── face_detection_openvino.py
├── config
    └── config.json
├── detection
    ├── __init__.py
    ├── age_gender_detection_ov.py
    ├── detection_base_ov.py
    └── face_detection_ov.py
├── files
    ├── README.md
    ├── intel-openvino.conf
    └── intel-openvino.sh
├── inference_services
    ├── README.md
    ├── facedetection
    │   ├── Dockerfile
    │   ├── README.md
    │   ├── detection
    │   │   ├── __init__.py
    │   │   ├── age_gender_detection_ov.py
    │   │   ├── detection_base_ov.py
    │   │   └── face_detection_ov.py
    │   ├── face_detection_service.py
    │   ├── inference_config.json
    │   ├── models
    │   │   ├── age-gender-recognition-retail-0013.bin
    │   │   ├── age-gender-recognition-retail-0013.xml
    │   │   ├── det1-0001.bin
    │   │   ├── det1-0001.mapping
    │   │   ├── det1-0001.xml
    │   │   ├── det2-0001.bin
    │   │   ├── det2-0001.mapping
    │   │   ├── det2-0001.xml
    │   │   ├── det3-0001.bin
    │   │   ├── det3-0001.mapping
    │   │   └── det3-0001.xml
    │   ├── requirements.txt
    │   └── utils
    │   │   ├── __init__.py
    │   │   └── image_utils.py
    └── flask_hello_world
    │   ├── Dockerfile
    │   ├── README.md
    │   ├── flask_app.py
    │   └── requirements.txt
├── models
    └── README.md
└── utils
    ├── __init__.py
    └── image_utils.py


/.gitignore:
--------------------------------------------------------------------------------
1 | venv/
2 | .idea/
3 | __pycache__/


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | # MIT License
 2 | #
 3 | # Copyright (c) 2019 Onur Dundar
 4 | #
 5 | # Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | # of this software and associated documentation files (the "Software"), to deal
 7 | # in the Software without restriction, including without limitation the rights
 8 | # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | # copies of the Software, and to permit persons to whom the Software is
10 | # furnished to do so, subject to the following conditions:
11 | #
12 | # The above copyright notice and this permission notice shall be included in all
13 | # copies or substantial portions of the Software.
14 | #
15 | # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | # SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | # Python AI Project with Intel(R) OpenVINO(TM) Inference Engine Python API
 2 | 
 3 | Here is a template project to reuse for production ready applications to use Deep Learning models focusing on Face, Age, Gender detection models.
 4 | 
 5 | At this stage, only OpenVINO has been integrated. 
 6 | 
 7 | # OpenVINO(TM) Toolkit Installation and Configuration for Ubuntu 18.04
 8 | 
 9 |  ``OpenVINO(TM) Version: 2019.2.242``
10 | 
11 | You can install OpenVINO(TM) by following the instructions published online documentation.
12 | 
13 | - https://docs.openvinotoolkit.org/
14 | 
15 | - https://docs.openvinotoolkit.org/latest/_docs_install_guides_installing_openvino_linux.html
16 | 
17 | Before running this Python application:
18 | 
19 | 1. Set Environment Variables on the current workspace:
20 | 
21 | ```bash
22 | source /opt/intel/openvino/bin/setupvars.sh
23 | ```
24 | 
25 | **OR**
26 | 
27 | 2. Set Environment Variables System Wide
28 | 
29 | Copy `files/intel-openvino.sh` & `files/intel-openvino.conf` file as shown below:
30 | 
31 | ```bash
32 | sudo cp files/intel-openvino.sh /etc/profile.d/
33 | sudo cp files/intel-openvino.conf /etc/ld.so.conf.d/ 
34 | sudo reboot
35 | ```
36 | 
37 | ## Clone This Repository
38 | 
39 | ```bash
40 | git clone https://github.com/odundar/face_detection.git
41 | ```
42 | 
43 | ## Quick Run for Face Detection Application
44 | If all setup completed successfully, you can use the default configurations to give a start for face detection application. 
45 | 
46 | ```bash
47 | python3 face_detection_openvino.py config/config.json
48 | ```
49 | 
50 | ## app/
51 | 
52 | `app` folder includes apps ready to run for face, age, gender detection applications.
53 | 
54 | ## services/
55 | 
56 | service modules stored here which are to be deployed in docker microservices
57 | 
58 | ## config/
59 | 
60 | `config` folder includes app and service default configurations to be used as template.  
61 | 
62 | ## detection/
63 | 
64 | `detection` folder contains the modules and classes to reuse for inference application development.
65 | 
66 | ```
67 | detection\
68 |     detection_base_ov.py\
69 |         InferenceConfig
70 |         InferenceBase
71 |     
72 |     age_gender_detection_ov.py\
73 |         AgeGenderDetectionTypes
74 |         AgeGenderDetection
75 |         AgeGenderConfig
76 |         MTCNNAgeGenderDetection
77 |         MTCNNAgeGenderConfig
78 |     
79 |     face_detection_ov.py\
80 |         FaceDetectionModelTypes
81 |         FaceDetectionConfig
82 |         OpenMZooFaceDetection
83 |         MTCNNFaceDetectionConfig
84 |         MtCNNFaceDetection
85 | ```
86 | 
87 | ## docker/
88 | 
89 | Includes instructions to deploy face, age-gender detection services as docker services.
90 | 
91 | ## files/
92 | 
93 | This folder includes system configuration files for OpenVINO(TM) Toolkit
94 | 
95 | ## models/
96 | 
97 | Folder includes instructions how to fetch models, convert and use them. 
98 |  
99 | 


--------------------------------------------------------------------------------
/app/README.md:
--------------------------------------------------------------------------------
 1 | # Run Application
 2 | 
 3 | This is a test application to run face-age-gender detections configured with the json file stored in config folder.
 4 | 
 5 | Before running this application make sure OpenVINO environment has been setup correctly and `detection`, `utils` modules are in same directory as `app` folder.
 6 | 
 7 | ```bash
 8 | python3 app/face_detection_openvino.py config/config.json
 9 | ```
10 | 
11 | If you run inside the `app` folder make sure `detection` and `utils` modules are included in `PYTHONPATH`
12 | 
13 | 
14 | 
15 | 


--------------------------------------------------------------------------------
/app/face_detection_openvino.py:
--------------------------------------------------------------------------------
  1 | # MIT License
  2 | #
  3 | # Copyright (c) 2019 Onur Dundar onur.dundar1@gmail.com
  4 | #
  5 | # Permission is hereby granted, free of charge, to any person obtaining a copy
  6 | # of this software and associated documentation files (the "Software"), to deal
  7 | # in the Software without restriction, including without limitation the rights
  8 | # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  9 | # copies of the Software, and to permit persons to whom the Software is
 10 | # furnished to do so, subject to the following conditions:
 11 | #
 12 | # The above copyright notice and this permission notice shall be included in all
 13 | # copies or substantial portions of the Software.
 14 | #
 15 | # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 16 | # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 17 | # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 18 | # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 19 | # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 20 | # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 21 | # SOFTWARE.
 22 | 
 23 | import sys
 24 | import cv2 as cv
 25 | import json
 26 | import logging
 27 | 
 28 | from detection.face_detection_ov import FaceDetectionConfig, OpenMZooFaceDetection, FaceDetectionModelTypes, MtCNNFaceDetection, MTCNNFaceDetectionConfig
 29 | from detection.age_gender_detection_ov import AgeGenderConfig, MTCNNAgeGenderDetection, AgeGenderDetectionTypes, MTCNNAgeGenderConfig, AgeGenderDetection
 30 | from utils.image_utils import ImageUtil
 31 | 
 32 | 
 33 | def prepare_configs():
 34 |     """
 35 |     Set Configurations for Face, Age Gender Models
 36 |     :return: face config, age_gender config
 37 |     """
 38 |     logging.log(logging.INFO, "Setting Configurations")
 39 |     if face_detection_model == FaceDetectionModelTypes.MTCNN:
 40 |         face_infer_cfg = MTCNNFaceDetectionConfig()
 41 |     else:
 42 |         face_infer_cfg = FaceDetectionConfig()
 43 | 
 44 |     face_infer_cfg.parse_json(config_file)
 45 | 
 46 |     age_gender_cfg = None
 47 | 
 48 |     if run_age_gender:
 49 |         if age_gender_model == AgeGenderDetectionTypes.MTCNN:
 50 |             age_gender_cfg = MTCNNAgeGenderConfig()
 51 |         else:
 52 |             age_gender_cfg = AgeGenderConfig()
 53 |         age_gender_cfg.parse_json(config_file)
 54 | 
 55 |     return face_infer_cfg, age_gender_cfg
 56 | 
 57 | 
 58 | def run_app():
 59 |     """
 60 |     Runs Face Detection Application
 61 |     """
 62 |     face_cfg, age_cfg = prepare_configs()
 63 | 
 64 |     '''Open Web Cam (change 0 to any video file if required)'''
 65 | 
 66 |     if input_type == "video" or input_type == "webcam":
 67 |         if input_type == "video":
 68 |             capture = cv.VideoCapture(input_path)
 69 |             has_frame, frame = capture.read()
 70 |         elif input_type == "webcam":
 71 |             capture = cv.VideoCapture(web_cam_index)
 72 |             has_frame, frame = capture.read()
 73 | 
 74 |         face_cfg.InputHeight = frame.shape[0]
 75 |         face_cfg.InputWidth = frame.shape[1]
 76 | 
 77 |         if face_detection_model == FaceDetectionModelTypes.MTCNN:
 78 |             face_infer = MtCNNFaceDetection(face_cfg)
 79 |         else:
 80 |             face_infer = OpenMZooFaceDetection(face_cfg)
 81 | 
 82 |         if run_age_gender:
 83 |             if age_gender_model == AgeGenderDetectionTypes.MTCNN:
 84 |                 age_gender_infer = MTCNNAgeGenderDetection(age_cfg)
 85 |             else:
 86 |                 age_gender_infer = AgeGenderDetection(age_cfg)
 87 | 
 88 |         video_inference(face_inference=face_infer, age_inference=age_gender_infer, source=capture)
 89 | 
 90 |     elif input_type == "image":
 91 |         frame = cv.imread(input_path)
 92 | 
 93 |         face_cfg.InputHeight = frame.shape[0]
 94 |         face_cfg.InputWidth = frame.shape[1]
 95 | 
 96 |         if face_detection_model == FaceDetectionModelTypes.MTCNN:
 97 |             face_infer = MtCNNFaceDetection(face_cfg)
 98 |         else:
 99 |             face_infer = OpenMZooFaceDetection(face_cfg)
100 | 
101 |         if run_age_gender:
102 |             if age_gender_model == AgeGenderDetectionTypes.MTCNN:
103 |                 age_gender_infer = MTCNNAgeGenderDetection(age_cfg)
104 |             else:
105 |                 age_gender_infer = AgeGenderDetection(age_cfg)
106 | 
107 |         image_inference(face_inference=face_infer, age_inference=age_gender_infer, source=frame)
108 |     else:
109 |         logging.log(logging.ERROR, "Invalid Input Type: {}".format(input_type))
110 |         exit(-1)
111 | 
112 |     return None
113 | 
114 | 
115 | def image_inference(face_inference=None, age_inference=None, source=None):
116 |     """
117 | 
118 |     :param face_inference:
119 |     :param age_inference:
120 |     :param source:
121 |     :return:
122 |     """
123 |     cv.namedWindow(cv_window_name, cv.WINDOW_NORMAL)
124 |     cv.resizeWindow(cv_window_name, 800, 600)
125 | 
126 |     frame_order = []
127 |     frame_id = 1
128 | 
129 |     face_inference.infer(source)
130 |     faces = face_inference.get_face_detection_data()
131 |     if face_inference.Config.ModelType == FaceDetectionModelTypes.MTCNN:
132 |         landmarks = face_inference.get_face_landmarks_data()
133 | 
134 |     if len(faces) > 0:
135 |         print("Detected {} Faces with {} Threshold".format(len(faces), face_inference.Config.FaceDetectionThreshold))
136 |         for idx, face in enumerate(faces):
137 |             ImageUtil.draw_rectangle(source, (face[0], face[1], face[2], face[3]))
138 |             if face_inference.Config.ModelType == FaceDetectionModelTypes.MTCNN:
139 |                 for coordinate in range(0, len(landmarks[idx]), 2):
140 |                     ImageUtil.draw_ellipse(source, [landmarks[idx][coordinate], landmarks[idx][coordinate + 1]])
141 | 
142 |             if run_age_gender:
143 |                 cropped_image = ImageUtil.crop_frame(source, (face[0], face[1], face[2], face[3]))
144 |                 if cropped_image.size > 0:
145 |                     age_inference.infer(cropped_image)
146 |                     age, gender = age_inference.get_age_gender_data()
147 |                     age_gender_text = '{} - {}'
148 |                     age_gender_text = age_gender_text.format(age, gender)
149 |                     ImageUtil.draw_text(source, age_gender_text,
150 |                                         (face[0], face[1], face[2], face[3]))
151 | 
152 |     cv.imshow(cv_window_name, source)
153 |     cv.waitKey(0)
154 | 
155 |     return None
156 | 
157 | 
158 | def video_inference(face_inference=None, age_inference=None, source=None):
159 |     """
160 | 
161 |     :param face_inference:
162 |     :param age_inference:
163 |     :param source:
164 |     :return:
165 |     """
166 |     face_request_order = list()
167 |     face_process_order = list()
168 | 
169 |     for i in range(face_inference.Config.RequestCount):
170 |         face_request_order.append(i)
171 | 
172 |     cv.namedWindow(cv_window_name, cv.WINDOW_NORMAL)
173 |     cv.resizeWindow(cv_window_name, 800, 600)
174 | 
175 |     frame_order = []
176 |     frame_id = 1
177 | 
178 |     has_frame, frame = source.read()
179 | 
180 |     while has_frame:
181 |         logging.log(logging.DEBUG, "Processing Frame {}".format(frame_id))
182 |         if len(face_request_order) > 0:
183 |             req_id = face_request_order[0]
184 |             face_request_order.pop(0)
185 |             face_inference.infer(frame, req_id)
186 |             face_process_order.append(req_id)
187 |             frame_order.append(frame)
188 | 
189 |         if len(face_process_order) > 0:
190 |             first = face_process_order[0]
191 |             if face_inference.request_ready(request_id=first):
192 |                 detected_faces = face_inference.get_face_detection_data(first)
193 |                 if face_inference.Config.ModelType == FaceDetectionModelTypes.MTCNN:
194 |                     face_landmarks = face_inference.get_face_landmarks_data(first)
195 |                 face_process_order.pop(0)
196 |                 face_request_order.append(first)
197 |                 show_frame = frame_order[0]
198 |                 frame_order.pop(0)
199 |                 if len(detected_faces) > 0:
200 |                     for idx, face in enumerate(detected_faces):
201 |                         ImageUtil.draw_rectangle(show_frame, (face[0], face[1], face[2], face[3]))
202 | 
203 |                         if face_inference.Config.ModelType == FaceDetectionModelTypes.MTCNN:
204 |                             for coordinate in range(0, len(face_landmarks[idx]), 2):
205 |                                 ImageUtil.draw_ellipse(show_frame, [face_landmarks[idx][coordinate],
206 |                                                                     face_landmarks[idx][coordinate + 1]])
207 | 
208 |                         if run_age_gender:
209 |                             cropped_image = ImageUtil.crop_frame(show_frame, (face[0], face[1], face[2], face[3]))
210 |                             if cropped_image.size > 0:
211 |                                 age_inference.infer(cropped_image)
212 |                                 age, gender = age_inference.get_age_gender_data()
213 |                                 age_gender_text = '{} - {}'
214 |                                 age_gender_text = age_gender_text.format(age, gender)
215 |                                 ImageUtil.draw_text(show_frame, age_gender_text, (face[0], face[1], face[2], face[3]))
216 | 
217 |                 cv.imshow(cv_window_name, show_frame)
218 |                 if cv.waitKey(1) & 0xFF == ord('q'):
219 |                     break
220 | 
221 |         if len(face_request_order) > 0:
222 |             has_frame, frame = source.read()
223 |             frame_id += 1
224 | 
225 |     face_inference.print_inference_performance_metrics()
226 |     if run_age_gender:
227 |         age_inference.print_inference_performance_metrics()
228 | 
229 |     return None
230 | 
231 | 
232 | """
233 | Global Parameters Used for Application Configuration
234 | """
235 | 
236 | cv_window_name = 'Face-Detection'
237 | run_age_gender = False
238 | input_type = "image"
239 | input_path = ''
240 | web_cam_index = 0
241 | face_detection_model = FaceDetectionModelTypes.OPENMODELZOO
242 | age_gender_model = AgeGenderDetectionTypes.OPENMODELZOO
243 | config_file = "~/Projects/face_detection/config/config.json"
244 | 
245 | 
246 | def parse_config_file(config_json='config.json'):
247 |     """
248 |     Parse Config File
249 |     :param config_json:
250 |     :return:
251 |     """
252 |     global config_file
253 |     config_file = config_json
254 | 
255 |     try:
256 |         with open(config_json) as json_file:
257 |             data = json.load(json_file)
258 | 
259 |             global cv_window_name
260 |             cv_window_name = data['output_window_name']
261 | 
262 |             global input_path
263 |             input_path = data["input_path"]
264 | 
265 |             global input_type
266 |             input_type = data["input_type"]
267 | 
268 |             global web_cam_index
269 |             web_cam_index = int(data["web_cam_index"])
270 | 
271 |             global run_age_gender
272 |             if data['run_age_gender'] == "True":
273 |                 run_age_gender = True
274 | 
275 |             global face_detection_model
276 |             if data['face_detection_model'] == FaceDetectionModelTypes.MTCNN:
277 |                 face_detection_model = FaceDetectionModelTypes.MTCNN
278 | 
279 |             global age_gender_model
280 |             if data['age_gender_detection_model'] == AgeGenderDetectionTypes.MTCNN:
281 |                 age_gender_model = AgeGenderDetectionTypes.MTCNN
282 | 
283 |             if data["log_level"] == "DEBUG":
284 |                 logging.basicConfig(level=logging.DEBUG)
285 |             elif data["log_level"] == "INFO":
286 |                 logging.basicConfig(level=logging.INFO)
287 |             elif data["log_level"] == "WARN":
288 |                 logging.basicConfig(level=logging.WARN)
289 |             else:
290 |                 logging.basicConfig(level=logging.ERROR)
291 | 
292 |             logging.log(logging.WARN, "Log Level Set to: {}".format(data["log_level"]))
293 | 
294 |     except FileNotFoundError:
295 |         print('{} FileNotFound'.format(config_json))
296 |         exit(-1)
297 | 
298 | 
299 | def print_help():
300 |     print('Usage: python3 face_detection_openvino.py <config_file.json>')
301 | 
302 | 
303 | # Application Entry Point
304 | if __name__ == "__main__":
305 | 
306 |     if len(sys.argv) is not 2:
307 |         print_help()
308 |         print('Using default config file: {}'.format(config_file))
309 |         parse_config_file(config_file)
310 |     else:
311 |         parse_config_file(sys.argv[1])
312 | 
313 |     # Run FD App
314 |     run_app()
315 | 


--------------------------------------------------------------------------------
/config/config.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "omz_facedetection" : {
 3 |     "model_path" : "~/openvino_models/Retail/object_detection/face/sqnet1.0modif-ssd/0004/dldt/",
 4 |     "model_name" : "face-detection-retail-0004",
 5 |     "target_device" : "CPU",
 6 |     "cpu_extension" : "True",
 7 |     "cpu_extension_path" : "~/inference_engine_samples_build/intel64/Release/lib/libcpu_extension.so",
 8 |     "face_detection_threshold" : 0.6,
 9 |     "async" : "False",
10 |     "request_count" : 1,
11 |     "dynamic_batch" : "False",
12 |     "batch_size" : 1,
13 |     "limit_cpu_threads" : "False",
14 |     "number_of_cpu_threads" : 4,
15 |     "bind_cpu_threads" : "True",
16 |     "cpu_stream" : "AUTO",
17 |     "gpu_stream" : "AUTO"
18 |   },
19 | 
20 |   "omz_age_gender" : {
21 |     "model_path" : "~/openvino_models/Retail/object_attributes/age_gender/dldt/FP32/",
22 |     "model_name" : "age-gender-recognition-retail-0013",
23 |     "target_device" : "CPU",
24 |     "cpu_extension" : "True",
25 |     "cpu_extension_path" : "~/inference_engine_samples_build/intel64/Release/lib/libcpu_extension.so",
26 |     "async" : "False",
27 |     "request_count" : 1,
28 |     "dynamic_batch" : "False",
29 |     "batch_size" : 1,
30 |     "limit_cpu_threads" : "False",
31 |     "number_of_cpu_threads" : 4,
32 |     "bind_cpu_threads" : "True",
33 |     "cpu_stream" : "AUTO",
34 |     "gpu_stream" : "AUTO"
35 |   },
36 | 
37 |   "mtcnn_facedetection" : {
38 |     "model_path" : "~/Projects/customer_tests/face_detection_mtcnn_opr/FP32/",
39 |     "p_model_file_name" : "det1-0001",
40 |     "r_model_file_name" : "det2-0001",
41 |     "o_model_file_name" : "det3-0001",
42 |     "target_device" : "CPU",
43 |     "cpu_extension" : "True",
44 |     "cpu_extension_path" : "~/inference_engine_samples_build/intel64/Release/lib/libcpu_extension.so",
45 | 
46 |     "p_network_threshold" : 0.6,
47 |     "r_network_threshold" : 0.7,
48 |     "o_network_threshold" : 0.8,
49 | 
50 |     "minimum_face_size" : 15.0,
51 |     "minimum_length" : 720,
52 |     "factor_count" : 0,
53 |     "factor" : 0.707,
54 |     "min_detection_size" : 12,
55 | 
56 |     "nms_thresholds" : [0.6, 0.6, 0.6],
57 |     "r_input_batch_size" : 256,
58 |     "o_input_batch_size" : 256,
59 | 
60 |     "limit_cpu_threads" : "False",
61 |     "number_of_cpu_threads" : 4,
62 |     "bind_cpu_threads" : "True",
63 |     "cpu_stream" : "AUTO",
64 |     "gpu_stream" : "AUTO"
65 |   },
66 | 
67 |   "mtcnn_age_gender" : {
68 |     "model_path" : "~/DeepLearning/Models/gender-age/",
69 |     "model_name" : "model-0000",
70 |     "target_device" : "CPU",
71 |     "cpu_extension" : "True",
72 |     "cpu_extension_path" : "~/inference_engine_samples_build/intel64/Release/lib/libcpu_extension.so",
73 |     "async" : "False",
74 |     "request_count" : 1,
75 |     "dynamic_batch" : "False",
76 |     "batch_size" : 1,
77 |     "limit_cpu_threads" : "False",
78 |     "number_of_cpu_threads" : 4,
79 |     "bind_cpu_threads" : "True",
80 |     "cpu_stream" : "AUTO",
81 |     "gpu_stream" : "AUTO"
82 |   },
83 | 
84 |   "face_detection_model" : "mtcnn_facedetection",
85 |   "age_gender_detection_model" : "mtcnn_age_gender",
86 |   "run_age_gender" : "True",
87 |   "show_output" : "True",
88 |   "output_window_name" : "Face-Detection",
89 | 
90 |   "input_type" : "webcam",
91 |   "input_path" : "~/Videos/facedetection.mp4",
92 |   "web_cam_index" : 0,
93 | 
94 |   "log_level" : "DEBUG"
95 | }


--------------------------------------------------------------------------------
/detection/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/odundar/face-detection-python/8ef8863d85c4ddd3c67512ff3e48fa4cf7c1d770/detection/__init__.py


--------------------------------------------------------------------------------
/detection/age_gender_detection_ov.py:
--------------------------------------------------------------------------------
  1 | # MIT License
  2 | #
  3 | # Copyright (c) 2019 Onur Dundar onur.dundar1@gmail.com
  4 | #
  5 | # Permission is hereby granted, free of charge, to any person obtaining a copy
  6 | # of this software and associated documentation files (the "Software"), to deal
  7 | # in the Software without restriction, including without limitation the rights
  8 | # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  9 | # copies of the Software, and to permit persons to whom the Software is
 10 | # furnished to do so, subject to the following conditions:
 11 | #
 12 | # The above copyright notice and this permission notice shall be included in all
 13 | # copies or substantial portions of the Software.
 14 | #
 15 | # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 16 | # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 17 | # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 18 | # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 19 | # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 20 | # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 21 | # SOFTWARE.
 22 | 
 23 | import json
 24 | import numpy as np
 25 | import logging
 26 | 
 27 | from .detection_base_ov import InferenceBase, InferenceConfig
 28 | 
 29 | 
 30 | class AgeGenderDetectionTypes:
 31 |     MTCNN = "mtcnn_age_gender"
 32 |     OPENMODELZOO = "omz_age_gender"
 33 | 
 34 | 
 35 | class AgeGenderConfig(InferenceConfig):
 36 |     ModelType = AgeGenderDetectionTypes.OPENMODELZOO
 37 | 
 38 |     def parse_json(self, json_file):
 39 |         try:
 40 |             logging.log(logging.INFO, "Loading JSON File {}".format(json_file))
 41 |             logging.log(logging.INFO, "Model Type {}".format(self.ModelType))
 42 | 
 43 |             with open(json_file) as json_file:
 44 |                 data = json.load(json_file)
 45 | 
 46 |                 self.ModelPath = data[self.ModelType]["model_path"]
 47 |                 self.ModelName = data[self.ModelType]["model_name"]
 48 | 
 49 |                 self.TargetDevice = data[self.ModelType]["target_device"]
 50 | 
 51 |                 if data[self.ModelType]["async"] == "True":
 52 |                     self.Async = True
 53 | 
 54 |                 self.RequestCount = int(data[self.ModelType]["request_count"])
 55 | 
 56 |                 self.BatchSize = int(data[self.ModelType]["batch_size"])
 57 | 
 58 |                 if data[self.ModelType]["cpu_extension"] == "True":
 59 |                     self.CpuExtension = True
 60 | 
 61 |                 self.CpuExtensionPath = data[self.ModelType]["cpu_extension_path"]
 62 | 
 63 |                 if data[self.ModelType]["dynamic_batch"] == "True":
 64 |                     self.DynamicBatch = True
 65 | 
 66 |                 if data[self.ModelType]["limit_cpu_threads"] == "True":
 67 |                     self.LimitCPUThreads = True
 68 | 
 69 |                 self.CPUThreadNum = int(data[self.ModelType]["number_of_cpu_threads"])
 70 | 
 71 |                 if data[self.ModelType]["bind_cpu_threads"] == "True":
 72 |                     self.LimitCPUThreads = True
 73 | 
 74 |                 self.CPUStream = data[self.ModelType]["cpu_stream"]
 75 | 
 76 |         except FileNotFoundError:
 77 |             logging.log(logging.ERROR, '{} FileNotFound'.format(json_file))
 78 |             exit(-1)
 79 | 
 80 |     def read_dict(self, data=None):
 81 |         """
 82 |         Used When JSON Already Parsed as Dict
 83 |         :return:
 84 |         """
 85 |         if data is None:
 86 |             data = dict()
 87 |         self.ModelPath = data[self.ModelType]["model_path"]
 88 |         self.ModelName = data[self.ModelType]["model_name"]
 89 | 
 90 |         self.TargetDevice = data[self.ModelType]["target_device"]
 91 | 
 92 |         if data[self.ModelType]["async"] == "True":
 93 |             self.Async = True
 94 | 
 95 |         self.RequestCount = int(data[self.ModelType]["request_count"])
 96 | 
 97 |         self.BatchSize = int(data[self.ModelType]["batch_size"])
 98 | 
 99 |         if data[self.ModelType]["cpu_extension"] == "True":
100 |             self.CpuExtension = True
101 | 
102 |         self.CpuExtensionPath = data[self.ModelType]["cpu_extension_path"]
103 | 
104 |         if data[self.ModelType]["dynamic_batch"] == "True":
105 |             self.DynamicBatch = True
106 | 
107 |         if data[self.ModelType]["limit_cpu_threads"] == "True":
108 |             self.LimitCPUThreads = True
109 | 
110 |         self.CPUThreadNum = int(data[self.ModelType]["number_of_cpu_threads"])
111 | 
112 |         if data[self.ModelType]["bind_cpu_threads"] == "True":
113 |             self.LimitCPUThreads = True
114 | 
115 |         self.CPUStream = data[self.ModelType]["cpu_stream"]
116 | 
117 | 
118 | class MTCNNAgeGenderConfig(AgeGenderConfig):
119 |     ModelType = AgeGenderDetectionTypes.MTCNN
120 | 
121 | 
122 | class MTCNNAgeGenderDetection(InferenceBase):
123 | 
124 |     Config = MTCNNAgeGenderConfig()
125 | 
126 |     def get_age_gender_data(self, request_id=0):
127 |         """
128 |         Parse Output Data for Age-Gender Detection Model
129 |         :param request_id:
130 |         :return:
131 |         """
132 |         detection = self.OpenVinoExecutable.requests[request_id].outputs[self.OutputLayer]
133 |         # Parse detection vector to get age and gender
134 |         gender_vector = detection[:, 0:2].flatten()
135 |         gender = int(np.argmax(gender_vector))
136 | 
137 |         gender_text = 'female'
138 |         if gender == 1:
139 |             gender_text = 'male'
140 | 
141 |         age_matrix = detection[:, 2:202].reshape((100, 2))
142 |         ages = np.argmax(age_matrix, axis=1)
143 |         age = int(sum(ages))
144 | 
145 |         return age, gender_text
146 | 
147 | 
148 | class AgeGenderDetection(InferenceBase):
149 | 
150 |     Config = AgeGenderConfig()
151 | 
152 |     def get_age_gender_data(self, request_id=0):
153 |         """
154 |         Parse Output Data for Age-Gender Detection Model
155 |         :param request_id:
156 |         :return:
157 |         """
158 |         age = int(self.OpenVinoExecutable.requests[request_id].outputs["age_conv3"][0][0][0][0] * 100)
159 |         genders = self.OpenVinoExecutable.requests[request_id].outputs["prob"]
160 |         # Parse detection vector to get age and gender
161 | 
162 |         gender_text = 'female'
163 |         if genders[0][0][0][0] < genders[0][1][0][0]:
164 |             gender_text = 'male'
165 | 
166 |         return age, gender_text


--------------------------------------------------------------------------------
/detection/detection_base_ov.py:
--------------------------------------------------------------------------------
  1 | # MIT License
  2 | #
  3 | # Copyright (c) 2019 Onur Dundar onur.dundar1@gmail.com
  4 | #
  5 | # Permission is hereby granted, free of charge, to any person obtaining a copy
  6 | # of this software and associated documentation files (the "Software"), to deal
  7 | # in the Software without restriction, including without limitation the rights
  8 | # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  9 | # copies of the Software, and to permit persons to whom the Software is
 10 | # furnished to do so, subject to the following conditions:
 11 | #
 12 | # The above copyright notice and this permission notice shall be included in all
 13 | # copies or substantial portions of the Software.
 14 | #
 15 | # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 16 | # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 17 | # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 18 | # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 19 | # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 20 | # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 21 | # SOFTWARE.
 22 | 
 23 | import time, logging, json
 24 | import cv2 as cv
 25 | import numpy as np
 26 | 
 27 | # Import OpenVINO
 28 | # Make sure environment variables set correctly for this to work
 29 | # Check on README.md file
 30 | from openvino.inference_engine import IENetwork, IECore, ExecutableNetwork
 31 | 
 32 | 
 33 | class InferenceConfig(object):
 34 |     """
 35 |     Inference Configuration Model
 36 |     """
 37 |     ModelType = ""
 38 |     ModelPath = str()
 39 |     ModelName = str()
 40 |     TargetDevice = str()
 41 |     Async = False
 42 |     RequestCount = 1
 43 |     DynamicBatch = False
 44 |     BatchSize = 1
 45 |     CpuExtension = False
 46 |     CpuExtensionPath = "/opt/intel/openvino/inference_engine/lib/intel64/libcpu_extension.so"
 47 |     LimitCPUThreads = False
 48 |     CPUThreadNum = 1
 49 |     BindCPUThreads = True
 50 |     CPUStream = "AUTO"
 51 | 
 52 |     def parse_json(self, json_file):
 53 |         """
 54 |         Parse JSON Parameters
 55 |         :param json_file:
 56 |         :return:
 57 |         """
 58 |         try:
 59 |             logging.log(logging.INFO, "Loading JSON File".format(json_file))
 60 |             with open(json_file) as json_file:
 61 |                 data = json.load(json_file)
 62 | 
 63 |                 self.ModelPath = data[self.ModelType]["model_path"]
 64 |                 self.ModelName = data[self.ModelType]["model_name"]
 65 |                 self.TargetDevice = data[self.ModelType]["target_device"]
 66 | 
 67 |                 if data[self.ModelType]["async"] == "True":
 68 |                     self.Async = True
 69 | 
 70 |                 self.RequestCount = int(data[self.ModelType]["request_count"])
 71 |                 self.BatchSize = int(data[self.ModelType]["batch_size"])
 72 | 
 73 |                 if data[self.ModelType]["cpu_extension"] == "True":
 74 |                     self.CpuExtension = True
 75 | 
 76 |                 self.CpuExtensionPath = data["cpu_extension_path"]
 77 | 
 78 |                 if data[self.ModelType]["dynamic_batch"] == "True":
 79 |                     self.DynamicBatch = True
 80 | 
 81 |                 if data[self.ModelType]["limit_cpu_threads"] == "True":
 82 |                     self.LimitCPUThreads = True
 83 | 
 84 |                 self.CPUThreadNum = int(data[self.ModelType]["cpu_thread_num"])
 85 | 
 86 |                 if data[self.ModelType]["bind_cpu_threads"] == "True":
 87 |                     self.LimitCPUThreads = True
 88 | 
 89 |                 self.CPUStream = data[self.ModelType]["cpu_stream"]
 90 | 
 91 |         except FileNotFoundError:
 92 |             logging.log(logging.ERROR,'{} FileNotFound'.format(json_file))
 93 |             exit(-1)
 94 | 
 95 |     def read_dict(self, data=None):
 96 |         """
 97 |         Used When JSON Already Parsed as Dict
 98 |         :return:
 99 |         """
100 |         if data is None:
101 |             data = dict()
102 |         self.ModelPath = data[self.ModelType]["model_path"]
103 |         self.ModelName = data[self.ModelType]["model_name"]
104 |         self.TargetDevice = data[self.ModelType]["target_device"]
105 | 
106 |         if data[self.ModelType]["async"] == "True":
107 |             self.Async = True
108 | 
109 |         self.RequestCount = int(data[self.ModelType]["request_count"])
110 |         self.BatchSize = int(data[self.ModelType]["batch_size"])
111 | 
112 |         if data[self.ModelType]["cpu_extension"] == "True":
113 |             self.CpuExtension = True
114 | 
115 |         self.CpuExtensionPath = data["cpu_extension_path"]
116 | 
117 |         if data[self.ModelType]["dynamic_batch"] == "True":
118 |             self.DynamicBatch = True
119 | 
120 |         if data[self.ModelType]["limit_cpu_threads"] == "True":
121 |             self.LimitCPUThreads = True
122 | 
123 |         self.CPUThreadNum = int(data[self.ModelType]["cpu_thread_num"])
124 | 
125 |         if data[self.ModelType]["bind_cpu_threads"] == "True":
126 |             self.LimitCPUThreads = True
127 | 
128 |         self.CPUStream = data[self.ModelType]["cpu_stream"]
129 | 
130 | 
131 | class InferenceBase(object):
132 |     """
133 |     Base Class to Load a Model with Inference Engine
134 |     """
135 | 
136 |     Config = InferenceConfig()
137 | 
138 |     '''Inference Engine Components'''
139 |     OpenVinoIE = IECore()
140 |     OpenVinoNetwork = IENetwork()
141 |     OpenVinoExecutable = ExecutableNetwork()
142 | 
143 |     '''Model Components'''
144 |     InputLayer = str()
145 |     InputLayers = list()
146 |     OutputLayer = str()
147 |     OutputLayers = list()
148 |     InputShape = None
149 |     OutputShape = None
150 | 
151 |     '''Performance Metrics Storage'''
152 |     ElapsedInferenceTime = 0.0
153 |     InferenceCount = 0.0
154 | 
155 |     def __init__(self, infer_config):
156 |         self.Config = infer_config
157 |         self.prepare_detector()
158 | 
159 |     def prepare_detector(self):
160 |         """
161 |         Load Model, Libraries According to Given Configuration.
162 |         :return:
163 |         """
164 |         if self.Config.ModelPath is None or self.Config.ModelName is None:
165 |             return None
166 | 
167 |         ''' Model File Paths '''
168 |         model_file = self.Config.ModelPath + self.Config.ModelName + '.xml'
169 |         model_weights = self.Config.ModelPath + self.Config.ModelName + '.bin'
170 | 
171 |         logging.log(logging.INFO, "Model File {}".format(model_file))
172 |         logging.log(logging.INFO, "Model Weights {}".format(model_weights))
173 | 
174 |         ''' Create IECore Object '''
175 |         self.OpenVinoIE = IECore()
176 | 
177 |         ''' If target device is CPU add extensions '''
178 |         if self.Config.CpuExtension and 'CPU' in self.Config.TargetDevice:
179 |             logging.log(logging.INFO, "Adding CPU Extensions, Path {}".format(self.Config.CpuExtensionPath))
180 |             self.OpenVinoIE.add_extension(self.Config.CpuExtensionPath, "CPU")
181 | 
182 |         ''' Try loading network '''
183 |         try:
184 |             self.OpenVinoNetwork = IENetwork(model=model_file, weights=model_weights)
185 |             logging.log(logging.INFO, "Loaded IENetwork")
186 |         except FileNotFoundError:
187 |             logging.log(logging.ERROR, FileNotFoundError.strerror + " " + FileNotFoundError.filename)
188 |             logging.log(logging.ERROR, "Exiting ....")
189 |             exit(-1)
190 | 
191 |         ''' Print supported/not-supported layers '''
192 |         if "CPU" in self.Config.TargetDevice:
193 |             supported_layers = self.OpenVinoIE.query_network(self.OpenVinoNetwork, "CPU")
194 |             not_supported_layers = [l for l in self.OpenVinoNetwork.layers.keys() if l not in supported_layers]
195 |             if len(not_supported_layers) != 0:
196 |                 logging.log(logging.WARN, "Following layers are not supported by the plugin for specified device {}:\n {}".format(self.Config.TargetDevice, ', '.join(not_supported_layers)))
197 |                 logging.log(logging.WARN, "Please try to specify cpu extensions library path in config.json file ")
198 | 
199 |         '''Input / Output Memory Allocations to feed input or get output values'''
200 |         self.InputLayer = next(iter(self.OpenVinoNetwork.inputs))
201 |         logging.log(logging.INFO, "Input Layer ".format(self.InputLayer))
202 | 
203 |         N, C, H, W = self.OpenVinoNetwork.inputs[self.InputLayer].shape
204 | 
205 |         if self.Config.BatchSize > N:
206 |             self.OpenVinoNetwork.batch_size = self.Config.BatchSize
207 |         else:
208 |             self.Config.BatchSize = self.OpenVinoNetwork.batch_size
209 | 
210 |         self.OutputLayer = next(iter(self.OpenVinoNetwork.outputs))
211 |         logging.log(logging.INFO, "Output Layer ".format(self.OutputLayer))
212 | 
213 |         self.InputLayers = list(self.OpenVinoNetwork.inputs)
214 |         logging.log(logging.INFO, "Input Layers ".format(self.InputLayers))
215 | 
216 |         self.OutputLayers = list(self.OpenVinoNetwork.outputs)
217 |         logging.log(logging.INFO, "Output Layers ".format(self.OutputLayers))
218 | 
219 |         self.InputShape = self.OpenVinoNetwork.inputs[self.InputLayer].shape
220 |         logging.log(logging.INFO, "Input Shape: {}".format(self.InputShape))
221 | 
222 |         self.OutputShape = self.OpenVinoNetwork.outputs[self.OutputLayer].shape
223 |         logging.log(logging.INFO, "Output Shape: {}".format(self.OutputShape))
224 | 
225 |         '''Set Configurations'''
226 | 
227 |         config = {}
228 | 
229 |         if self.Config.DynamicBatch:
230 |             config["DYN_BATCH_ENABLE"] = "YES"
231 |             logging.log(logging.INFO, "Enabling Dynamic Batch Mode")
232 | 
233 |         if self.Config.Async:
234 |             logging.log(logging.INFO, "Async Mode Enabled")
235 | 
236 |         self.OpenVinoExecutable = self.OpenVinoIE.load_network(network=self.OpenVinoNetwork,
237 |                                                                device_name=self.Config.TargetDevice,
238 |                                                                config=config,
239 |                                                                num_requests=self.Config.RequestCount)
240 | 
241 |         logging.log(logging.INFO, "Completed Loading Neural Network")
242 | 
243 |         return None
244 | 
245 |     def preprocess_input(self, input_data):
246 |         """
247 |         Pre-process Input According to Loaded Network
248 |         :param input_data:
249 |         :return:
250 |         """
251 | 
252 |         n, c, h, w = self.OpenVinoNetwork.inputs[self.InputLayer].shape
253 |         logging.log(logging.DEBUG, "Pre-processing Input to Shape {}".format(self.OpenVinoNetwork.inputs[self.InputLayer].shape))
254 | 
255 |         resized = cv.resize(input_data, (w, h))
256 |         color_converted = cv.cvtColor(resized, cv.COLOR_BGR2RGB)
257 |         transposed = np.transpose(color_converted, (2, 0, 1))
258 |         reshaped = np.expand_dims(transposed, axis=0)
259 | 
260 |         return reshaped
261 | 
262 |     def infer(self, input_data, request_id=0):
263 |         """
264 |         Used to send data to network and start forward propagation.
265 |         :param input_data:
266 |         :param request_id:
267 |         :return:
268 |         """
269 |         if self.Config.Async:
270 |             logging.log(logging.DEBUG, "Async Infer Request Id {}".format(request_id))
271 |             self.infer_async(input_data, request_id)
272 |         else:
273 |             logging.log(logging.DEBUG, "Infer Request Id {}".format(request_id))
274 |             self.infer_sync(input_data, request_id)
275 | 
276 |     def infer_async(self, input_data, request_id=0):
277 |         """
278 |         Start Async Infer for Given Request Id
279 |         :param input_data:
280 |         :param request_id:
281 |         :return:
282 |         """
283 |         self.InferenceCount += 1
284 |         processed_input = self.preprocess_input(input_data)
285 |         self.OpenVinoExecutable.requests[request_id].async_infer(inputs={self.InputLayer: processed_input})
286 | 
287 |     def infer_sync(self, input_data, request_id=0):
288 |         """
289 |         Start Sync Infer
290 |         :param input_data:
291 |         :param request_id:
292 |         :return:
293 |         """
294 |         self.InferenceCount += 1
295 |         processed_input = self.preprocess_input(input_data)
296 |         start = time.time()
297 |         self.OpenVinoExecutable.requests[request_id].infer(inputs={self.InputLayer: processed_input})
298 |         end = time.time()
299 |         self.ElapsedInferenceTime += (end - start)
300 | 
301 |     def request_ready(self, request_id):
302 |         """
303 |         Check if request is ready
304 |         :param request_id: id to check request
305 |         :return: bool
306 |         """
307 |         if self.Config.Async:
308 |             if self.OpenVinoExecutable.requests[request_id].wait(0) == 0:
309 |                 return True
310 |         else:
311 |             return True
312 | 
313 |         return False
314 | 
315 |     def get_results(self, output_layer, request_id=0):
316 |         """
317 |         Get results from the network.
318 |         :param output_layer: output layer
319 |         :param request_id: request id
320 |         :return:
321 |         """
322 |         logging.log(logging.DEBUG, "Getting Results Request Id {}".format(request_id))
323 |         return self.OpenVinoExecutable.requests[request_id].outputs[output_layer]
324 | 
325 |     def print_inference_performance_metrics(self):
326 |         """
327 |         Print Performance Data Collection
328 |         :return:
329 |         """
330 |         if self.Config.Async:
331 |             logging.log(logging.WARN, 'Async Mode Inferred Frame Count {}'.format(self.InferenceCount))
332 |         else:
333 |             logging.log(logging.WARN, "Sync Mode Inferred Frame Count {}".format(self.InferenceCount))
334 |             logging.log(logging.WARN, "Inference Per Input: {} MilliSeconds".format((self.ElapsedInferenceTime / self.InferenceCount) * 1000))
335 | 


--------------------------------------------------------------------------------
/files/README.md:
--------------------------------------------------------------------------------
1 | Copy `files/intel-openvino.sh` & `files/intel-openvino.conf` file as shown below, they set the environment variables for OpenVINO(TM) system wide.
2 | 
3 | ```bash
4 | sudo cp files/intel-openvino.sh /etc/profile.d/
5 | sudo cp files/intel-openvino.conf /etc/ld.so.conf.d/ 
6 | sudo reboot
7 | ```


--------------------------------------------------------------------------------
/files/intel-openvino.conf:
--------------------------------------------------------------------------------
1 | /opt/intel/openvino/opencv/lib
2 | /opt/intel/opencl
3 | /opt/intel/openvino/deployment_tools/inference_engine/external/hddl/lib
4 | /opt/intel/openvino/deployment_tools/inference_engine/external/gna/lib
5 | /opt/intel/openvino/deployment_tools/inference_engine/external/mkltiny_lnx/lib
6 | /opt/intel/openvino/deployment_tools/inference_engine/external/tbb/lib
7 | /opt/intel/openvino/deployment_tools/inference_engine/lib/intel64
8 | /opt/intel/openvino/openvx/lib
9 | 


--------------------------------------------------------------------------------
/files/intel-openvino.sh:
--------------------------------------------------------------------------------
 1 | export PATH="$PATH:/opt/intel/openvino/deployment_tools/model_optimizer"
 2 | export PYTHONPATH="/opt/intel/openvino/python/python3.5:/opt/intel/openvino/deployment_tools/model_optimizer:/opt/intel/openvino/python/python3:/opt/intel/openvino/deployment_tools/model_optimizer:"
 3 | export OpenCV_DIR="/opt/intel/openvino/opencv/cmake"
 4 | export InferenceEngine_DIR="/opt/intel/openvino/deployment_tools/inference_engine/share"
 5 | export IE_PLUGINS_PATH="/opt/intel/openvino/deployment_tools/inference_engine/lib/intel64"
 6 | export LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/intel/openvino/opencv/lib:/opt/intel/opencl:/opt/intel/openvino/deployment_tools/inference_engine/external/hddl/lib"
 7 | export LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/intel/openvino/deployment_tools/inference_engine/external/gna/lib:/opt/intel/openvino/deployment_tools/inference_engine/external/mkltiny_lnx/lib"
 8 | export LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/intel/openvino/deployment_tools/inference_engine/external/tbb/lib"
 9 | export LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/intel/openvino/deployment_tools/inference_engine/lib/intel64"
10 | export LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/intel/openvino/openvx/lib"
11 | export INTEL_OPENVINO_DIR="/opt/intel/openvino"
12 | export INTEL_CVSDK_DIR="/opt/intel/openvino"
13 | export HDDL_INSTALL_DIR="/opt/intel/openvino/deployment_tools/inference_engine/external/hddl"
14 | 


--------------------------------------------------------------------------------
/inference_services/README.md:
--------------------------------------------------------------------------------
 1 | # Dockerize AI Applications
 2 | 
 3 | AWS, Google Cloud & Azure already provides their services for AI. 
 4 | 
 5 | They mainly aims to enable you to use services to send data and get the predictions. 
 6 | 
 7 | Let's try to utilize this face detection modules to be used as a docker service.
 8 | 
 9 | ## Services
10 | 
11 | 1. Face Detection Service 
12 | 
13 | I want to deploy a face detection service which I can connect a network stream to get the detected faces from that video stream. 
14 | 
15 | 2. Age Gender Detection Service
16 | 
17 | I want to deploy a age-gender detection service which I can send face frames to get the age and gender data.
18 | 
19 | # System Design
20 | 
21 | ## How to send data?
22 | 
23 | JSON is used to send data, which can also include the remote video stream or remote image url to send to docker application to read from. 
24 | 
25 | ## How to receive data?
26 | 
27 | JSON files can be send to user to get the information; 
28 | 
29 | - For face detection, number of faces detected each second etc.
30 | - For age-gender detection, age and gender information.
31 | 
32 | 


--------------------------------------------------------------------------------
/inference_services/facedetection/Dockerfile:
--------------------------------------------------------------------------------
 1 | FROM ubuntu:18.04
 2 | 
 3 | MAINTAINER ONUR DUNDAR "onur.dundar1@gmail.com"
 4 | 
 5 | # ARG DOWNLOAD_LINK=~/Projects/workshop_installation/openvino_installer/l_openvino_toolkit_p_2019.2.242.tgz
 6 | ARG INSTALL_DIR=/opt/intel/openvino
 7 | ARG TEMP_DIR=/tmp/openvino_installer
 8 | 
 9 | RUN apt-get update && apt-get install -y --no-install-recommends \
10 |     wget \
11 |     cpio \
12 |     sudo \
13 |     lsb-release && \
14 |     rm -rf /var/lib/apt/lists/*
15 | 
16 | RUN mkdir -p $TEMP_DIR && cd $TEMP_DIR
17 | 
18 | COPY l_openvino_toolkit_p_2019.2.242.tgz $TEMP_DIR
19 | 
20 | WORKDIR $TEMP_DIR
21 | 
22 | RUN tar xf l_openvino_toolkit_p_2019.2.242.tgz && \
23 |     cd l_openvino_toolkit_p_2019.2.242 && \
24 |     sed -i 's/decline/accept/g' silent.cfg && \
25 |     ./install.sh -s silent.cfg && \
26 |     rm -rf $TEMP_DIR
27 | 
28 | RUN $INSTALL_DIR/install_dependencies/install_openvino_dependencies.sh
29 | 
30 | RUN apt-get update -y && \
31 |     apt-get install -y python3-pip python3-dev libgtk-3-0
32 | 
33 | WORKDIR /app
34 | COPY requirements.txt /app
35 | 
36 | RUN pip3 install -r requirements.txt
37 | 
38 | ENV PATH="$PATH:/opt/intel/openvino/deployment_tools/model_optimizer"
39 | ENV PYTHONPATH="/opt/intel/openvino/python/python3.6:/opt/intel/openvino/deployment_tools/model_optimizer:/opt/intel/openvino/python/python3:"
40 | ENV OpenCV_DIR="/opt/intel/openvino/opencv/cmake"
41 | ENV InferenceEngine_DIR="/opt/intel/openvino/deployment_tools/inference_engine/share"
42 | ENV IE_PLUGINS_PATH="/opt/intel/openvino/deployment_tools/inference_engine/lib/intel64"
43 | ENV LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/intel/openvino/opencv/lib:/opt/intel/opencl:/opt/intel/openvino/deployment_tools/inference_engine/external/hddl/lib"
44 | ENV LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/intel/openvino/deployment_tools/inference_engine/external/gna/lib:/opt/intel/openvino/deployment_tools/inference_engine/external/mkltiny_lnx/lib"
45 | ENV LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/intel/openvino/deployment_tools/inference_engine/external/tbb/lib"
46 | ENV LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/intel/openvino/deployment_tools/inference_engine/lib/intel64"
47 | ENV LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/opt/intel/openvino/openvx/lib"
48 | ENV INTEL_OPENVINO_DIR="/opt/intel/openvino"
49 | ENV INTEL_CVSDK_DIR="/opt/intel/openvino"
50 | ENV HDDL_INSTALL_DIR="/opt/intel/openvino/deployment_tools/inference_engine/external/hddl"
51 | 
52 | COPY detection /app/detection
53 | COPY utils /app/utils
54 | COPY models /app/models
55 | COPY videos /app/videos
56 | 
57 | COPY face_detection_service.py /app
58 | 
59 | EXPOSE 8000
60 | 
61 | CMD ["python3", "/app/face_detection_service.py", "-p 8000"]


--------------------------------------------------------------------------------
/inference_services/facedetection/README.md:
--------------------------------------------------------------------------------
 1 | # Face Detection Service with Docker
 2 | 
 3 | Here I have a very basic application developed with OpenVINO(TM) & Flask to start inference on given source.
 4 | 
 5 | This app can handle single request at one time, multiple requests are not possible. 
 6 | 
 7 | # Build & Start Docker with WebCam
 8 | 
 9 | Note: I had problems with webcam loading on docker so feel free to test as below.
10 | 
11 | ```bash
12 | docker build -t facedetection:latest .
13 | 
14 | docker run -d -p 8000:8000 facedetection --device=/dev/video0:/dev/video0
15 | ```
16 | 
17 | # JSON Config
18 | 
19 | JSON Configuration have to made beforeh and in order to correctly start the inference
20 | 
21 | # Curl Request to Start Face Detection Application
22 | 
23 | ```bash
24 | curl --header "Content-Type: application/json" --request POST --data '@inference_config.json' http://127.0.0.1:8000/
25 | 
26 | curl --header "Content-Type: application/json" --request POST --data '@~/Projects/face_detection/inference_services/facedetection/inference_config.json' http://127.0.0.1:8000
27 | ```
28 | 
29 | # Retrieve Status
30 | 
31 | You can retrieve the frame-id and face coordinates by a get request from:
32 | 
33 | ```bash
34 | curl --request GET http://127.0.0.1:8000/status
35 | ```
36 | 
37 | # Retrieve Results
38 | 
39 | You can retrieve the frame-id and face coordinates by a get request from:
40 | 
41 | ```bash
42 | curl --request GET http://127.0.0.1:8000/results
43 | ```
44 | 
45 | # Check Logs
46 | 
47 | ```bash
48 | curl --request GET http://127.0.0.1:8000/logs
49 | ```
50 | 
51 | # Play Video
52 | 
53 | NOT IMPLEMENTED


--------------------------------------------------------------------------------
/inference_services/facedetection/detection/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/odundar/face-detection-python/8ef8863d85c4ddd3c67512ff3e48fa4cf7c1d770/inference_services/facedetection/detection/__init__.py


--------------------------------------------------------------------------------
/inference_services/facedetection/detection/age_gender_detection_ov.py:
--------------------------------------------------------------------------------
  1 | # MIT License
  2 | #
  3 | # Copyright (c) 2019 Onur Dundar onur.dundar1@gmail.com
  4 | #
  5 | # Permission is hereby granted, free of charge, to any person obtaining a copy
  6 | # of this software and associated documentation files (the "Software"), to deal
  7 | # in the Software without restriction, including without limitation the rights
  8 | # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  9 | # copies of the Software, and to permit persons to whom the Software is
 10 | # furnished to do so, subject to the following conditions:
 11 | #
 12 | # The above copyright notice and this permission notice shall be included in all
 13 | # copies or substantial portions of the Software.
 14 | #
 15 | # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 16 | # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 17 | # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 18 | # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 19 | # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 20 | # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 21 | # SOFTWARE.
 22 | 
 23 | import json
 24 | import numpy as np
 25 | import logging
 26 | 
 27 | from .detection_base_ov import InferenceBase, InferenceConfig
 28 | 
 29 | 
 30 | class AgeGenderDetectionTypes:
 31 |     MTCNN = "mtcnn_age_gender"
 32 |     OPENMODELZOO = "omz_age_gender"
 33 | 
 34 | 
 35 | class AgeGenderConfig(InferenceConfig):
 36 |     ModelType = AgeGenderDetectionTypes.OPENMODELZOO
 37 | 
 38 |     def parse_json(self, json_file):
 39 |         try:
 40 |             logging.log(logging.INFO, "Loading JSON File {}".format(json_file))
 41 |             logging.log(logging.INFO, "Model Type {}".format(self.ModelType))
 42 | 
 43 |             with open(json_file) as json_file:
 44 |                 data = json.load(json_file)
 45 | 
 46 |                 self.ModelPath = data[self.ModelType]["model_path"]
 47 |                 self.ModelName = data[self.ModelType]["model_name"]
 48 | 
 49 |                 self.TargetDevice = data[self.ModelType]["target_device"]
 50 | 
 51 |                 if data[self.ModelType]["async"] == "True":
 52 |                     self.Async = True
 53 | 
 54 |                 self.RequestCount = int(data[self.ModelType]["request_count"])
 55 | 
 56 |                 self.BatchSize = int(data[self.ModelType]["batch_size"])
 57 | 
 58 |                 if data[self.ModelType]["cpu_extension"] == "True":
 59 |                     self.CpuExtension = True
 60 | 
 61 |                 self.CpuExtensionPath = data[self.ModelType]["cpu_extension_path"]
 62 | 
 63 |                 if data[self.ModelType]["dynamic_batch"] == "True":
 64 |                     self.DynamicBatch = True
 65 | 
 66 |                 if data[self.ModelType]["limit_cpu_threads"] == "True":
 67 |                     self.LimitCPUThreads = True
 68 | 
 69 |                 self.CPUThreadNum = int(data[self.ModelType]["number_of_cpu_threads"])
 70 | 
 71 |                 if data[self.ModelType]["bind_cpu_threads"] == "True":
 72 |                     self.LimitCPUThreads = True
 73 | 
 74 |                 self.CPUStream = data[self.ModelType]["cpu_stream"]
 75 | 
 76 |         except FileNotFoundError:
 77 |             logging.log(logging.ERROR, '{} FileNotFound'.format(json_file))
 78 |             exit(-1)
 79 | 
 80 |     def read_dict(self, data=None):
 81 |         """
 82 |         Used When JSON Already Parsed as Dict
 83 |         :return:
 84 |         """
 85 |         if data is None:
 86 |             data = dict()
 87 |         self.ModelPath = data[self.ModelType]["model_path"]
 88 |         self.ModelName = data[self.ModelType]["model_name"]
 89 | 
 90 |         self.TargetDevice = data[self.ModelType]["target_device"]
 91 | 
 92 |         if data[self.ModelType]["async"] == "True":
 93 |             self.Async = True
 94 | 
 95 |         self.RequestCount = int(data[self.ModelType]["request_count"])
 96 | 
 97 |         self.BatchSize = int(data[self.ModelType]["batch_size"])
 98 | 
 99 |         if data[self.ModelType]["cpu_extension"] == "True":
100 |             self.CpuExtension = True
101 | 
102 |         self.CpuExtensionPath = data[self.ModelType]["cpu_extension_path"]
103 | 
104 |         if data[self.ModelType]["dynamic_batch"] == "True":
105 |             self.DynamicBatch = True
106 | 
107 |         if data[self.ModelType]["limit_cpu_threads"] == "True":
108 |             self.LimitCPUThreads = True
109 | 
110 |         self.CPUThreadNum = int(data[self.ModelType]["number_of_cpu_threads"])
111 | 
112 |         if data[self.ModelType]["bind_cpu_threads"] == "True":
113 |             self.LimitCPUThreads = True
114 | 
115 |         self.CPUStream = data[self.ModelType]["cpu_stream"]
116 | 
117 | 
118 | class MTCNNAgeGenderConfig(AgeGenderConfig):
119 |     ModelType = AgeGenderDetectionTypes.MTCNN
120 | 
121 | 
122 | class MTCNNAgeGenderDetection(InferenceBase):
123 | 
124 |     Config = MTCNNAgeGenderConfig()
125 | 
126 |     def get_age_gender_data(self, request_id=0):
127 |         """
128 |         Parse Output Data for Age-Gender Detection Model
129 |         :param request_id:
130 |         :return:
131 |         """
132 |         detection = self.OpenVinoExecutable.requests[request_id].outputs[self.OutputLayer]
133 |         # Parse detection vector to get age and gender
134 |         gender_vector = detection[:, 0:2].flatten()
135 |         gender = int(np.argmax(gender_vector))
136 | 
137 |         gender_text = 'female'
138 |         if gender == 1:
139 |             gender_text = 'male'
140 | 
141 |         age_matrix = detection[:, 2:202].reshape((100, 2))
142 |         ages = np.argmax(age_matrix, axis=1)
143 |         age = int(sum(ages))
144 | 
145 |         return age, gender_text
146 | 
147 | 
148 | class AgeGenderDetection(InferenceBase):
149 | 
150 |     Config = AgeGenderConfig()
151 | 
152 |     def get_age_gender_data(self, request_id=0):
153 |         """
154 |         Parse Output Data for Age-Gender Detection Model
155 |         :param request_id:
156 |         :return:
157 |         """
158 |         age = int(self.OpenVinoExecutable.requests[request_id].outputs["age_conv3"][0][0][0][0] * 100)
159 |         genders = self.OpenVinoExecutable.requests[request_id].outputs["prob"]
160 |         # Parse detection vector to get age and gender
161 | 
162 |         gender_text = 'female'
163 |         if genders[0][0][0][0] < genders[0][1][0][0]:
164 |             gender_text = 'male'
165 | 
166 |         return age, gender_text


--------------------------------------------------------------------------------
/inference_services/facedetection/detection/detection_base_ov.py:
--------------------------------------------------------------------------------
  1 | # MIT License
  2 | #
  3 | # Copyright (c) 2019 Onur Dundar onur.dundar1@gmail.com
  4 | #
  5 | # Permission is hereby granted, free of charge, to any person obtaining a copy
  6 | # of this software and associated documentation files (the "Software"), to deal
  7 | # in the Software without restriction, including without limitation the rights
  8 | # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  9 | # copies of the Software, and to permit persons to whom the Software is
 10 | # furnished to do so, subject to the following conditions:
 11 | #
 12 | # The above copyright notice and this permission notice shall be included in all
 13 | # copies or substantial portions of the Software.
 14 | #
 15 | # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 16 | # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 17 | # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 18 | # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 19 | # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 20 | # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 21 | # SOFTWARE.
 22 | 
 23 | import time, logging, json
 24 | import cv2 as cv
 25 | import numpy as np
 26 | 
 27 | # Import OpenVINO
 28 | # Make sure environment variables set correctly for this to work
 29 | # Check on README.md file
 30 | from openvino.inference_engine import IENetwork, IECore, ExecutableNetwork
 31 | 
 32 | 
 33 | class InferenceConfig(object):
 34 |     """
 35 |     Inference Configuration Model
 36 |     """
 37 |     ModelType = ""
 38 |     ModelPath = str()
 39 |     ModelName = str()
 40 |     TargetDevice = str()
 41 |     Async = False
 42 |     RequestCount = 1
 43 |     DynamicBatch = False
 44 |     BatchSize = 1
 45 |     CpuExtension = False
 46 |     CpuExtensionPath = "/opt/intel/inference_engine/lib/intel64/libcpu_extension.so"
 47 |     LimitCPUThreads = False
 48 |     CPUThreadNum = 1
 49 |     BindCPUThreads = True
 50 |     CPUStream = "AUTO"
 51 | 
 52 |     def parse_json(self, json_file):
 53 |         """
 54 |         Parse JSON Parameters
 55 |         :param json_file:
 56 |         :return:
 57 |         """
 58 |         try:
 59 |             logging.log(logging.INFO, "Loading JSON File".format(json_file))
 60 |             with open(json_file) as json_file:
 61 |                 data = json.load(json_file)
 62 | 
 63 |                 self.ModelPath = data[self.ModelType]["model_path"]
 64 |                 self.ModelName = data[self.ModelType]["model_name"]
 65 |                 self.TargetDevice = data[self.ModelType]["target_device"]
 66 | 
 67 |                 if data[self.ModelType]["async"] == "True":
 68 |                     self.Async = True
 69 | 
 70 |                 self.RequestCount = int(data[self.ModelType]["request_count"])
 71 |                 self.BatchSize = int(data[self.ModelType]["batch_size"])
 72 | 
 73 |                 if data[self.ModelType]["cpu_extension"] == "True":
 74 |                     self.CpuExtension = True
 75 | 
 76 |                 self.CpuExtensionPath = data["cpu_extension_path"]
 77 | 
 78 |                 if data[self.ModelType]["dynamic_batch"] == "True":
 79 |                     self.DynamicBatch = True
 80 | 
 81 |                 if data[self.ModelType]["limit_cpu_threads"] == "True":
 82 |                     self.LimitCPUThreads = True
 83 | 
 84 |                 self.CPUThreadNum = int(data[self.ModelType]["cpu_thread_num"])
 85 | 
 86 |                 if data[self.ModelType]["bind_cpu_threads"] == "True":
 87 |                     self.LimitCPUThreads = True
 88 | 
 89 |                 self.CPUStream = data[self.ModelType]["cpu_stream"]
 90 | 
 91 |         except FileNotFoundError:
 92 |             logging.log(logging.ERROR,'{} FileNotFound'.format(json_file))
 93 |             exit(-1)
 94 | 
 95 |     def read_dict(self, data=None):
 96 |         """
 97 |         Used When JSON Already Parsed as Dict
 98 |         :return:
 99 |         """
100 |         if data is None:
101 |             data = dict()
102 |         self.ModelPath = data[self.ModelType]["model_path"]
103 |         self.ModelName = data[self.ModelType]["model_name"]
104 |         self.TargetDevice = data[self.ModelType]["target_device"]
105 | 
106 |         if data[self.ModelType]["async"] == "True":
107 |             self.Async = True
108 | 
109 |         self.RequestCount = int(data[self.ModelType]["request_count"])
110 |         self.BatchSize = int(data[self.ModelType]["batch_size"])
111 | 
112 |         if data[self.ModelType]["cpu_extension"] == "True":
113 |             self.CpuExtension = True
114 | 
115 |         self.CpuExtensionPath = data["cpu_extension_path"]
116 | 
117 |         if data[self.ModelType]["dynamic_batch"] == "True":
118 |             self.DynamicBatch = True
119 | 
120 |         if data[self.ModelType]["limit_cpu_threads"] == "True":
121 |             self.LimitCPUThreads = True
122 | 
123 |         self.CPUThreadNum = int(data[self.ModelType]["cpu_thread_num"])
124 | 
125 |         if data[self.ModelType]["bind_cpu_threads"] == "True":
126 |             self.LimitCPUThreads = True
127 | 
128 |         self.CPUStream = data[self.ModelType]["cpu_stream"]
129 | 
130 | 
131 | class InferenceBase(object):
132 |     """
133 |     Base Class to Load a Model with Inference Engine
134 |     """
135 | 
136 |     Config = InferenceConfig()
137 | 
138 |     '''Inference Engine Components'''
139 |     OpenVinoIE = IECore()
140 |     OpenVinoNetwork = IENetwork()
141 |     OpenVinoExecutable = ExecutableNetwork()
142 | 
143 |     '''Model Components'''
144 |     InputLayer = str()
145 |     InputLayers = list()
146 |     OutputLayer = str()
147 |     OutputLayers = list()
148 |     InputShape = None
149 |     OutputShape = None
150 | 
151 |     '''Performance Metrics Storage'''
152 |     ElapsedInferenceTime = 0.0
153 |     InferenceCount = 0.0
154 | 
155 |     def __init__(self, infer_config):
156 |         self.Config = infer_config
157 |         self.prepare_detector()
158 | 
159 |     def prepare_detector(self):
160 |         """
161 |         Load Model, Libraries According to Given Configuration.
162 |         :return:
163 |         """
164 |         if self.Config.ModelPath is None or self.Config.ModelName is None:
165 |             return None
166 | 
167 |         ''' Model File Paths '''
168 |         model_file = self.Config.ModelPath + self.Config.ModelName + '.xml'
169 |         model_weights = self.Config.ModelPath + self.Config.ModelName + '.bin'
170 | 
171 |         logging.log(logging.INFO, "Model File {}".format(model_file))
172 |         logging.log(logging.INFO, "Model Weights {}".format(model_weights))
173 | 
174 |         ''' Create IECore Object '''
175 |         self.OpenVinoIE = IECore()
176 | 
177 |         ''' If target device is CPU add extensions '''
178 |         if self.Config.CpuExtension and 'CPU' in self.Config.TargetDevice:
179 |             logging.log(logging.INFO, "Adding CPU Extensions, Path {}".format(self.Config.CpuExtensionPath))
180 |             self.OpenVinoIE.add_extension(self.Config.CpuExtensionPath, "CPU")
181 | 
182 |         ''' Try loading network '''
183 |         try:
184 |             self.OpenVinoNetwork = IENetwork(model=model_file, weights=model_weights)
185 |             logging.log(logging.INFO, "Loaded IENetwork")
186 |         except FileNotFoundError:
187 |             logging.log(logging.ERROR, FileNotFoundError.strerror + " " + FileNotFoundError.filename)
188 |             logging.log(logging.ERROR, "Exiting ....")
189 |             exit(-1)
190 | 
191 |         ''' Print supported/not-supported layers '''
192 |         if "CPU" in self.Config.TargetDevice:
193 |             supported_layers = self.OpenVinoIE.query_network(self.OpenVinoNetwork, "CPU")
194 |             not_supported_layers = [l for l in self.OpenVinoNetwork.layers.keys() if l not in supported_layers]
195 |             if len(not_supported_layers) != 0:
196 |                 logging.log(logging.WARN, "Following layers are not supported by the plugin for specified device {}:\n {}".format(self.Config.TargetDevice, ', '.join(not_supported_layers)))
197 |                 logging.log(logging.WARN, "Please try to specify cpu extensions library path in config.json file ")
198 | 
199 |         '''Input / Output Memory Allocations to feed input or get output values'''
200 |         self.InputLayer = next(iter(self.OpenVinoNetwork.inputs))
201 |         logging.log(logging.INFO, "Input Layer ".format(self.InputLayer))
202 | 
203 |         N, C, H, W = self.OpenVinoNetwork.inputs[self.InputLayer].shape
204 | 
205 |         if self.Config.BatchSize > N:
206 |             self.OpenVinoNetwork.batch_size = self.Config.BatchSize
207 |         else:
208 |             self.Config.BatchSize = self.OpenVinoNetwork.batch_size
209 | 
210 |         self.OutputLayer = next(iter(self.OpenVinoNetwork.outputs))
211 |         logging.log(logging.INFO, "Output Layer ".format(self.OutputLayer))
212 | 
213 |         self.InputLayers = list(self.OpenVinoNetwork.inputs)
214 |         logging.log(logging.INFO, "Input Layers ".format(self.InputLayers))
215 | 
216 |         self.OutputLayers = list(self.OpenVinoNetwork.outputs)
217 |         logging.log(logging.INFO, "Output Layers ".format(self.OutputLayers))
218 | 
219 |         self.InputShape = self.OpenVinoNetwork.inputs[self.InputLayer].shape
220 |         logging.log(logging.INFO, "Input Shape: {}".format(self.InputShape))
221 | 
222 |         self.OutputShape = self.OpenVinoNetwork.outputs[self.OutputLayer].shape
223 |         logging.log(logging.INFO, "Output Shape: {}".format(self.OutputShape))
224 | 
225 |         '''Set Configurations'''
226 | 
227 |         config = {}
228 | 
229 |         if self.Config.DynamicBatch:
230 |             config["DYN_BATCH_ENABLE"] = "YES"
231 |             logging.log(logging.INFO, "Enabling Dynamic Batch Mode")
232 | 
233 |         if self.Config.Async:
234 |             logging.log(logging.INFO, "Async Mode Enabled")
235 | 
236 |         self.OpenVinoExecutable = self.OpenVinoIE.load_network(network=self.OpenVinoNetwork,
237 |                                                                device_name=self.Config.TargetDevice,
238 |                                                                config=config,
239 |                                                                num_requests=self.Config.RequestCount)
240 | 
241 |         logging.log(logging.INFO, "Completed Loading Neural Network")
242 | 
243 |         return None
244 | 
245 |     def preprocess_input(self, input_data):
246 |         """
247 |         Pre-process Input According to Loaded Network
248 |         :param input_data:
249 |         :return:
250 |         """
251 | 
252 |         n, c, h, w = self.OpenVinoNetwork.inputs[self.InputLayer].shape
253 |         logging.log(logging.DEBUG, "Pre-processing Input to Shape {}".format(self.OpenVinoNetwork.inputs[self.InputLayer].shape))
254 | 
255 |         resized = cv.resize(input_data, (w, h))
256 |         color_converted = cv.cvtColor(resized, cv.COLOR_BGR2RGB)
257 |         transposed = np.transpose(color_converted, (2, 0, 1))
258 |         reshaped = np.expand_dims(transposed, axis=0)
259 | 
260 |         return reshaped
261 | 
262 |     def infer(self, input_data, request_id=0):
263 |         """
264 |         Used to send data to network and start forward propagation.
265 |         :param input_data:
266 |         :param request_id:
267 |         :return:
268 |         """
269 |         if self.Config.Async:
270 |             logging.log(logging.DEBUG, "Async Infer Request Id {}".format(request_id))
271 |             self.infer_async(input_data, request_id)
272 |         else:
273 |             logging.log(logging.DEBUG, "Infer Request Id {}".format(request_id))
274 |             self.infer_sync(input_data, request_id)
275 | 
276 |     def infer_async(self, input_data, request_id=0):
277 |         """
278 |         Start Async Infer for Given Request Id
279 |         :param input_data:
280 |         :param request_id:
281 |         :return:
282 |         """
283 |         self.InferenceCount += 1
284 |         processed_input = self.preprocess_input(input_data)
285 |         self.OpenVinoExecutable.requests[request_id].async_infer(inputs={self.InputLayer: processed_input})
286 | 
287 |     def infer_sync(self, input_data, request_id=0):
288 |         """
289 |         Start Sync Infer
290 |         :param input_data:
291 |         :param request_id:
292 |         :return:
293 |         """
294 |         self.InferenceCount += 1
295 |         processed_input = self.preprocess_input(input_data)
296 |         start = time.time()
297 |         self.OpenVinoExecutable.requests[request_id].infer(inputs={self.InputLayer: processed_input})
298 |         end = time.time()
299 |         self.ElapsedInferenceTime += (end - start)
300 | 
301 |     def request_ready(self, request_id):
302 |         """
303 |         Check if request is ready
304 |         :param request_id: id to check request
305 |         :return: bool
306 |         """
307 |         if self.Config.Async:
308 |             if self.OpenVinoExecutable.requests[request_id].wait(0) == 0:
309 |                 return True
310 |         else:
311 |             return True
312 | 
313 |         return False
314 | 
315 |     def get_results(self, output_layer, request_id=0):
316 |         """
317 |         Get results from the network.
318 |         :param output_layer: output layer
319 |         :param request_id: request id
320 |         :return:
321 |         """
322 |         logging.log(logging.DEBUG, "Getting Results Request Id {}".format(request_id))
323 |         return self.OpenVinoExecutable.requests[request_id].outputs[output_layer]
324 | 
325 |     def print_inference_performance_metrics(self):
326 |         """
327 |         Print Performance Data Collection
328 |         :return:
329 |         """
330 |         if self.Config.Async:
331 |             logging.log(logging.WARN, 'Async Mode Inferred Frame Count {}'.format(self.InferenceCount))
332 |         else:
333 |             logging.log(logging.WARN, "Sync Mode Inferred Frame Count {}".format(self.InferenceCount))
334 |             logging.log(logging.WARN, "Inference Per Input: {} MilliSeconds".format((self.ElapsedInferenceTime / self.InferenceCount) * 1000))
335 | 


--------------------------------------------------------------------------------
/inference_services/facedetection/detection/face_detection_ov.py:
--------------------------------------------------------------------------------
  1 | # MIT License
  2 | #
  3 | # Copyright (c) 2019 Onur Dundar onur.dundar1@gmail.com
  4 | #
  5 | # Permission is hereby granted, free of charge, to any person obtaining a copy
  6 | # of this software and associated documentation files (the "Software"), to deal
  7 | # in the Software without restriction, including without limitation the rights
  8 | # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  9 | # copies of the Software, and to permit persons to whom the Software is
 10 | # furnished to do so, subject to the following conditions:
 11 | #
 12 | # The above copyright notice and this permission notice shall be included in all
 13 | # copies or substantial portions of the Software.
 14 | #
 15 | # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 16 | # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 17 | # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 18 | # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 19 | # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 20 | # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 21 | # SOFTWARE.
 22 | 
 23 | import logging
 24 | import math
 25 | import json
 26 | import time
 27 | import cv2 as cv
 28 | import numpy as np
 29 | from PIL import Image
 30 | 
 31 | from openvino.inference_engine import IENetwork, IECore, ExecutableNetwork
 32 | from .detection_base_ov import InferenceConfig, InferenceBase
 33 | 
 34 | 
 35 | class FaceDetectionModelTypes:
 36 |     """
 37 |     Face Detection Model Type to Be Used
 38 |     """
 39 |     # MTCNN Face Detection
 40 |     MTCNN = 'mtcnn_facedetection'
 41 |     # Open Model Zoo Face Detection
 42 |     OPENMODELZOO = 'omz_facedetection'
 43 | 
 44 | 
 45 | class FaceDetectionConfig(InferenceConfig):
 46 |     """
 47 |     Face Detection Module Configurations based on Open Model Zoo Face Detection Model
 48 |     """
 49 |     ModelType = FaceDetectionModelTypes.OPENMODELZOO
 50 |     FaceDetectionThreshold = 1.0
 51 |     InputHeight = 720
 52 |     InputWidth = 1080
 53 | 
 54 |     def parse_json(self, json_file):
 55 |         try:
 56 |             logging.log(logging.INFO, "Loading JSON File {}".format(json_file))
 57 |             logging.log(logging.INFO, "Model Type {}".format(self.ModelType))
 58 | 
 59 |             with open(json_file) as json_file:
 60 |                 data = json.load(json_file)
 61 | 
 62 |                 self.ModelPath = data[self.ModelType]["model_path"]
 63 |                 self.ModelName = data[self.ModelType]["model_name"]
 64 | 
 65 |                 self.TargetDevice = data[self.ModelType]["target_device"]
 66 | 
 67 |                 self.FaceDetectionThreshold = data[self.ModelType]["face_detection_threshold"]
 68 | 
 69 |                 if data[self.ModelType]["async"] == "True":
 70 |                     self.Async = True
 71 | 
 72 |                 self.RequestCount = int(data[self.ModelType]["request_count"])
 73 | 
 74 |                 self.BatchSize = int(data[self.ModelType]["batch_size"])
 75 | 
 76 |                 if data[self.ModelType]["cpu_extension"] == "True":
 77 |                     self.CpuExtension = True
 78 | 
 79 |                 self.CpuExtensionPath = data[self.ModelType]["cpu_extension_path"]
 80 | 
 81 |                 if data[self.ModelType]["dynamic_batch"] == "True":
 82 |                     self.DynamicBatch = True
 83 | 
 84 |                 if data[self.ModelType]["limit_cpu_threads"] == "True":
 85 |                     self.LimitCPUThreads = True
 86 | 
 87 |                 self.CPUThreadNum = int(data[self.ModelType]["number_of_cpu_threads"])
 88 | 
 89 |                 if data[self.ModelType]["bind_cpu_threads"] == "True":
 90 |                     self.LimitCPUThreads = True
 91 | 
 92 |                 self.CPUStream = data[self.ModelType]["cpu_stream"]
 93 | 
 94 |         except FileNotFoundError:
 95 |             logging.log(logging.ERROR, '{} FileNotFound'.format(json_file))
 96 |             exit(-1)
 97 | 
 98 |     def read_dict(self, data=None):
 99 |         """
100 |         Used When JSON Already Parsed as Dict
101 |         :return:
102 |         """
103 |         if data is None:
104 |             logging.log(logging.ERROR, "No Parameters Passed")
105 |             exit(-1)
106 | 
107 |         self.ModelPath = data[self.ModelType]["model_path"]
108 |         self.ModelName = data[self.ModelType]["model_name"]
109 | 
110 |         self.TargetDevice = data[self.ModelType]["target_device"]
111 | 
112 |         self.FaceDetectionThreshold = data[self.ModelType]["face_detection_threshold"]
113 | 
114 |         if data[self.ModelType]["async"] == "True":
115 |             self.Async = True
116 | 
117 |         self.RequestCount = int(data[self.ModelType]["request_count"])
118 | 
119 |         self.BatchSize = int(data[self.ModelType]["batch_size"])
120 | 
121 |         if data[self.ModelType]["cpu_extension"] == "True":
122 |             self.CpuExtension = True
123 | 
124 |         self.CpuExtensionPath = data[self.ModelType]["cpu_extension_path"]
125 | 
126 |         if data[self.ModelType]["dynamic_batch"] == "True":
127 |             self.DynamicBatch = True
128 | 
129 |         if data[self.ModelType]["limit_cpu_threads"] == "True":
130 |             self.LimitCPUThreads = True
131 | 
132 |         self.CPUThreadNum = int(data[self.ModelType]["number_of_cpu_threads"])
133 | 
134 |         if data[self.ModelType]["bind_cpu_threads"] == "True":
135 |             self.LimitCPUThreads = True
136 | 
137 |         self.CPUStream = data[self.ModelType]["cpu_stream"]
138 | 
139 | 
140 | class OpenMZooFaceDetection(InferenceBase):
141 |     """
142 |     Face Detection Module Configured to Get Results using Open Model Zoo Face Detection Model
143 |     """
144 |     Config = FaceDetectionConfig()
145 | 
146 |     def __init__(self, config=FaceDetectionConfig()):
147 |         super(OpenMZooFaceDetection, self).__init__(config)
148 |         self.Config = config
149 | 
150 |     def get_face_detection_data(self, request_id=0):
151 |         """
152 |         Parse Face Detection Output
153 |         :param output_layer:
154 |         :param request_id:
155 |         :return: face coordinates
156 |         """
157 |         face_coordinates = []
158 | 
159 |         detections = self.get_results(self.OutputLayer, request_id)[0][0]
160 | 
161 |         logging.log(logging.INFO, "Fetched Face Detection Results")
162 | 
163 |         for detection in detections:
164 |             if detection[2] > self.Config.FaceDetectionThreshold:
165 |                 face_coordinates.append([detection[3], detection[4], detection[5], detection[6]])
166 | 
167 |         logging.log(logging.INFO, "Number of Detected Faces: {}".format(len(face_coordinates)))
168 |         return face_coordinates
169 | 
170 | 
171 | class MTCNNFaceDetectionConfig(InferenceConfig):
172 |     """
173 |     Face Detection Module Configurations based on MTCNN Face Detection Model
174 |     """
175 |     ModelType = FaceDetectionModelTypes.MTCNN
176 | 
177 |     InputHeight = 720
178 |     InputWidth = 1080
179 | 
180 |     PNetworkThreshold = 0.6
181 |     RNetworkThreshold = 0.7
182 |     ONetworkThreshold = 0.8
183 | 
184 |     NMSThresholds = [0.7, 0.7, 0.7]
185 |     MinDetectionSize = 12
186 |     Factor = 0.707
187 | 
188 |     MinimumFaceSize = 15.0
189 |     MinLength = 720
190 |     FactorCount = 0
191 | 
192 |     RInputBatchSize = 128
193 |     OInputBatchSize = 128
194 | 
195 |     PModelFileName = "det1-0001"
196 |     RModelFileName = "det2-0001"
197 |     OModelFileName = "det3-0001"
198 | 
199 |     def parse_json(self, json_file):
200 |         try:
201 |             logging.log(logging.INFO, "Loading JSON File {}".format(json_file))
202 |             logging.log(logging.INFO, "Model Type {}".format(self.ModelType))
203 |             with open(json_file) as json_file:
204 |                 data = json.load(json_file)
205 | 
206 |                 self.ModelPath = data[self.ModelType]["model_path"]
207 |                 self.PModelFileName = data[self.ModelType]["p_model_file_name"]
208 |                 self.RModelFileName = data[self.ModelType]["r_model_file_name"]
209 |                 self.OModelFileName = data[self.ModelType]["o_model_file_name"]
210 | 
211 |                 self.TargetDevice = data[self.ModelType]["target_device"]
212 | 
213 |                 if data[self.ModelType]["cpu_extension"] == "True":
214 |                     self.CpuExtension = True
215 | 
216 |                 self.CpuExtensionPath = data[self.ModelType]["cpu_extension_path"]
217 | 
218 |                 self.PNetworkThreshold = float(data[self.ModelType]["p_network_threshold"])
219 |                 self.RNetworkThreshold = float(data[self.ModelType]["r_network_threshold"])
220 |                 self.ONetworkThreshold = float(data[self.ModelType]["o_network_threshold"])
221 | 
222 |                 self.MinimumFaceSize = float(data[self.ModelType]["minimum_face_size"])
223 |                 self.MinLength = float(data[self.ModelType]["minimum_length"])
224 |                 self.FactorCount = float(data[self.ModelType]["factor_count"])
225 |                 self.Factor = float(data[self.ModelType]["factor"])
226 |                 self.MinDetectionSize = int(data[self.ModelType]["min_detection_size"])
227 | 
228 |                 self.NMSThresholds = list(data[self.ModelType]["nms_thresholds"])
229 | 
230 |                 self.RInputBatchSize = int(data[self.ModelType]["r_input_batch_size"])
231 |                 self.OInputBatchSize = int(data[self.ModelType]["o_input_batch_size"])
232 | 
233 |                 if data[self.ModelType]["limit_cpu_threads"] == "True":
234 |                     self.LimitCPUThreads = True
235 |                 self.CPUThreadNum = int(data[self.ModelType]["number_of_cpu_threads"])
236 |                 if data[self.ModelType]["bind_cpu_threads"] == "True":
237 |                     self.LimitCPUThreads = True
238 |                 self.CPUStream = data[self.ModelType]["cpu_stream"]
239 | 
240 |         except FileNotFoundError:
241 |             logging.log(logging.ERROR, '{} FileNotFound'.format(json_file))
242 |             exit(-1)
243 | 
244 |     def read_dict(self, data=None):
245 |         """
246 |         Used When JSON Already Parsed as Dict
247 |         :return:
248 |         """
249 |         if data is None:
250 |             logging.log(logging.ERROR, "No Parameters Passed")
251 |             exit(-1)
252 | 
253 |         self.ModelPath = data[self.ModelType]["model_path"]
254 |         self.PModelFileName = data[self.ModelType]["p_model_file_name"]
255 |         self.RModelFileName = data[self.ModelType]["r_model_file_name"]
256 |         self.OModelFileName = data[self.ModelType]["o_model_file_name"]
257 | 
258 |         self.TargetDevice = data[self.ModelType]["target_device"]
259 | 
260 |         if data[self.ModelType]["cpu_extension"] == "True":
261 |             self.CpuExtension = True
262 | 
263 |         self.CpuExtensionPath = data[self.ModelType]["cpu_extension_path"]
264 | 
265 |         self.PNetworkThreshold = float(data[self.ModelType]["p_network_threshold"])
266 |         self.RNetworkThreshold = float(data[self.ModelType]["r_network_threshold"])
267 |         self.ONetworkThreshold = float(data[self.ModelType]["o_network_threshold"])
268 | 
269 |         self.MinimumFaceSize = float(data[self.ModelType]["minimum_face_size"])
270 |         self.MinLength = float(data[self.ModelType]["minimum_length"])
271 |         self.FactorCount = float(data[self.ModelType]["factor_count"])
272 |         self.Factor = float(data[self.ModelType]["factor"])
273 |         self.MinDetectionSize = int(data[self.ModelType]["min_detection_size"])
274 | 
275 |         self.NMSThresholds = list(data[self.ModelType]["nms_thresholds"])
276 | 
277 |         self.RInputBatchSize = int(data[self.ModelType]["r_input_batch_size"])
278 |         self.OInputBatchSize = int(data[self.ModelType]["o_input_batch_size"])
279 | 
280 |         if data[self.ModelType]["limit_cpu_threads"] == "True":
281 |             self.LimitCPUThreads = True
282 |         self.CPUThreadNum = int(data[self.ModelType]["number_of_cpu_threads"])
283 |         if data[self.ModelType]["bind_cpu_threads"] == "True":
284 |             self.LimitCPUThreads = True
285 |         self.CPUStream = data[self.ModelType]["cpu_stream"]
286 | 
287 | 
288 | class MtCNNFaceDetection(InferenceBase):
289 | 
290 |     Config = MTCNNFaceDetectionConfig()
291 | 
292 |     OpenVinoExecutablesP = list()
293 |     OpenVinoExecutableR = ExecutableNetwork()
294 |     OpenVinoExecutableO = ExecutableNetwork()
295 | 
296 |     OpenVinoNetworkP = IENetwork()
297 |     OpenVinoNetworkR = IENetwork()
298 |     OpenVinoNetworkO = IENetwork()
299 | 
300 |     Scales = []
301 | 
302 |     RINPUT = []
303 |     OINPUT = []
304 | 
305 |     LastFaceDetections = []
306 |     LastLandmarkDetections = []
307 | 
308 |     InputLayerP = str()
309 |     InputLayerR = str()
310 |     InputLayerO = str()
311 | 
312 |     OutputLayersP = list()
313 |     OutputLayersR = list()
314 |     OutputLayersO = list()
315 | 
316 |     InputShapeP = []
317 |     InputShapeR = []
318 |     InputShapeO = []
319 | 
320 |     def __init__(self, config=MTCNNFaceDetectionConfig()):
321 |         super(MtCNNFaceDetection, self).__init__(config)
322 |         self.Config = config
323 | 
324 |     def prepare_detector(self):
325 |         """
326 |         Override Base Class Since MTCNN works with three different model
327 |         :return: None
328 |         """
329 | 
330 |         if self.Config.ModelPath is None or self.Config.ModelName is None:
331 |             return None
332 | 
333 |         logging.log(logging.INFO, "Setting Up R - O Network Input Storage")
334 |         self.RINPUT = np.zeros(dtype=float, shape=(self.Config.RInputBatchSize, 3, 24, 24))
335 |         self.OINPUT = np.zeros(dtype=float, shape=(self.Config.OInputBatchSize, 3, 48, 48))
336 | 
337 |         self.OpenVinoIE = IECore()
338 | 
339 |         if self.Config.CpuExtension and 'CPU' in self.Config.TargetDevice:
340 |             logging.log(logging.INFO, "CPU Extensions Added")
341 |             self.OpenVinoIE.add_extension(self.Config.CpuExtensionPath, "CPU")
342 | 
343 |         try:
344 |             # Model File Paths
345 |             model_file = self.Config.ModelPath + self.Config.PModelFileName + ".xml"
346 |             model_weights = self.Config.ModelPath + self.Config.PModelFileName + ".bin"
347 |             logging.log(logging.INFO, "Loading Models File {}".format(model_file))
348 |             logging.log(logging.INFO, "Loading Weights File {}".format(model_weights))
349 | 
350 |             self.OpenVinoNetworkP = IENetwork(model=model_file, weights=model_weights)
351 |             logging.log(logging.INFO, "Loading P Network")
352 | 
353 |             model_file = self.Config.ModelPath + self.Config.RModelFileName + ".xml"
354 |             model_weights = self.Config.ModelPath + self.Config.RModelFileName + ".bin"
355 |             logging.log(logging.INFO, "Loading Models File {}".format(model_file))
356 |             logging.log(logging.INFO, "Loading Weights File {}".format(model_weights))
357 | 
358 |             self.OpenVinoNetworkR = IENetwork(model=model_file, weights=model_weights)
359 |             self.OpenVinoNetworkR.batch_size = self.Config.RInputBatchSize
360 |             logging.log(logging.INFO, "Loading R Network")
361 | 
362 |             model_file = self.Config.ModelPath + self.Config.OModelFileName + ".xml"
363 |             model_weights = self.Config.ModelPath + self.Config.OModelFileName + ".bin"
364 |             logging.log(logging.INFO, "Loading Models File {}".format(model_file))
365 |             logging.log(logging.INFO, "Loading Weights File {}".format(model_weights))
366 | 
367 |             self.OpenVinoNetworkO = IENetwork(model=model_file, weights=model_weights)
368 |             self.OpenVinoNetworkO.batch_size = self.Config.OInputBatchSize
369 |             logging.log(logging.INFO, "Loading O Network")
370 | 
371 |         except FileNotFoundError:
372 |             logging.log(logging.ERROR, FileNotFoundError.strerror, " ", FileNotFoundError.filename)
373 |             exit(-1)
374 | 
375 |         if "CPU" in self.Config.TargetDevice:
376 |             supported_layers = self.OpenVinoIE.query_network(self.OpenVinoNetworkP, "CPU")
377 |             not_supported_layers = [l for l in self.OpenVinoNetworkP.layers.keys() if l not in supported_layers]
378 |             if len(not_supported_layers) != 0:
379 |                 logging.log(logging.INFO, "Following layers are not supported by the plugin for specified device {}:\n {}".
380 |                       format(self.Config.TargetDevice, ', '.join(not_supported_layers)))
381 |                 logging.log(logging.INFO, "Please try to specify cpu extensions library path in config.json file ")
382 | 
383 |         # Input / Output Memory Allocations to feed input or get output values
384 |         self.InputLayerP = next(iter(self.OpenVinoNetworkP.inputs))
385 |         self.InputLayerR = next(iter(self.OpenVinoNetworkP.inputs))
386 |         self.InputLayerO = next(iter(self.OpenVinoNetworkP.inputs))
387 | 
388 |         self.OutputLayersP = list(self.OpenVinoNetworkP.outputs)
389 |         self.OutputLayersR = list(self.OpenVinoNetworkR.outputs)
390 |         self.OutputLayersO = list(self.OpenVinoNetworkO.outputs)
391 | 
392 |         self.InputShapeP = self.OpenVinoNetworkP.inputs[self.InputLayerP].shape
393 |         self.InputShapeR = self.OpenVinoNetworkR.inputs[self.InputLayerR].shape
394 |         self.InputShapeO = self.OpenVinoNetworkO.inputs[self.InputLayerO].shape
395 | 
396 |         # Enable Dynamic Batch By Default
397 |         config = {"DYN_BATCH_ENABLED": "YES"}
398 | 
399 |         self.OpenVinoExecutableR = self.OpenVinoIE.load_network(network=self.OpenVinoNetworkR,
400 |                                                                 device_name=self.Config.TargetDevice,
401 |                                                                 config=config,
402 |                                                                 num_requests=self.Config.RequestCount)
403 |         logging.log(logging.INFO, "Created R Network Executable")
404 | 
405 |         self.OpenVinoExecutableO = self.OpenVinoIE.load_network(network=self.OpenVinoNetworkO,
406 |                                                                 device_name=self.Config.TargetDevice,
407 |                                                                 config=config,
408 |                                                                 num_requests=self.Config.RequestCount)
409 |         logging.log(logging.INFO, "Created O Network Executable")
410 | 
411 |         self.Config.MinLength = min(self.Config.InputHeight, self.Config.InputWidth)
412 |         M = self.Config.MinDetectionSize / self.Config.MinimumFaceSize
413 |         self.Config.MinLength *= M
414 | 
415 |         while self.Config.MinLength > self.Config.MinDetectionSize:
416 |             scale = (M*self.Config.Factor**self.Config.FactorCount)
417 |             self.Scales.append(scale)
418 |             self.Config.MinLength *= self.Config.Factor
419 |             self.Config.FactorCount += 1
420 | 
421 |             sw, sh = math.ceil(self.Config.InputWidth * scale), math.ceil(self.Config.InputHeight * scale)
422 | 
423 |             self.OpenVinoNetworkP.reshape({self.InputLayerP: (1, 3, sh, sw)})
424 | 
425 |             self.OpenVinoExecutablesP.append(self.OpenVinoIE.load_network(network=self.OpenVinoNetworkP,
426 |                                                                           device_name=self.Config.TargetDevice,
427 |                                                                           num_requests=self.Config.RequestCount))
428 | 
429 |         logging.log(logging.INFO, "Created Scaled P Networks {}".format(len(self.OpenVinoExecutablesP)))
430 | 
431 |     def run_mtcnn_face_detection(self, images, request_id=0):
432 |         """
433 |         Get Detected Face Coordinates
434 |         :param images:
435 |         :param request_id:
436 |         :return:
437 |         """
438 |         self.InferenceCount += 1
439 |         start_time = time.time()
440 |         bounding_boxes = []
441 |         landmarks = []
442 | 
443 |         cv_img = cv.cvtColor(images, cv.COLOR_BGR2RGB)
444 |         image = Image.fromarray(cv_img)
445 | 
446 |         none_count = 0
447 | 
448 |         for i, scale in enumerate(self.Scales):
449 |             width, height = image.size
450 |             sw, sh = math.ceil(width * scale), math.ceil(height * scale)
451 |             img = image.resize((sw, sh), Image.BILINEAR)
452 |             img = np.asarray(img, 'float32')
453 |             img = self.preprocess(img)
454 | 
455 |             output = self.OpenVinoExecutablesP[i].infer({self.InputLayerP: img})
456 | 
457 |             probs = output["prob1"][0, 1, :, :]
458 |             offsets = output["conv4_2"]
459 | 
460 |             boxes = self.generate_bboxes(probs, offsets, scale, self.Config.PNetworkThreshold)
461 | 
462 |             if len(boxes) == 0:
463 |                 bounding_boxes.append(None)
464 |                 none_count += 1
465 |             else:
466 |                 keep = self.nms(boxes[:, 0:5], overlap_threshold=0.5)
467 |                 bounding_boxes.append(boxes[keep])
468 | 
469 |         if len(bounding_boxes) > none_count:
470 |             bounding_boxes = [i for i in bounding_boxes if i is not None]
471 |             bounding_boxes = np.vstack(bounding_boxes)
472 |             keep = self.nms(bounding_boxes[:, 0:5], self.Config.NMSThresholds[0])
473 |             bounding_boxes = bounding_boxes[keep]
474 |             bounding_boxes = self.calibrate_box(bounding_boxes[:, 0:5], bounding_boxes[:, 5:])
475 |             bounding_boxes = self.convert_to_square(bounding_boxes)
476 |             bounding_boxes[:, 0:4] = np.round(bounding_boxes[:, 0:4])
477 | 
478 |             img_boxes = self.get_image_boxes(bounding_boxes, image, size=24)
479 | 
480 |             if img_boxes.shape[0] > 0:
481 |                 shp = img_boxes.shape
482 |                 self.RINPUT[0:shp[0], ] = img_boxes
483 |                 self.OpenVinoExecutableR.requests[request_id].set_batch(shp[0])
484 |                 self.OpenVinoExecutableR.requests[request_id].infer({self.InputLayerR: self.RINPUT})
485 | 
486 |                 offsets = self.OpenVinoExecutableR.requests[0].outputs['conv5_2'][:shp[0], ]
487 |                 probs = self.OpenVinoExecutableR.requests[0].outputs['prob1'][:shp[0]]
488 | 
489 |                 keep = np.where(probs[:, 1] > self.Config.RNetworkThreshold)[0]
490 |                 bounding_boxes = bounding_boxes[keep]
491 |                 bounding_boxes[:, 4] = probs[keep, 1].reshape((-1,))
492 |                 offsets = offsets[keep]
493 |                 keep = self.nms(bounding_boxes, self.Config.NMSThresholds[1])
494 |                 bounding_boxes = bounding_boxes[keep]
495 |                 bounding_boxes = self.calibrate_box(bounding_boxes, offsets[keep])
496 |                 bounding_boxes = self.convert_to_square(bounding_boxes)
497 |                 bounding_boxes[:, 0:4] = np.round(bounding_boxes[:, 0:4])
498 |                 img_boxes = self.get_image_boxes(bounding_boxes, image, size=48)
499 | 
500 |                 if img_boxes.shape[0] > 0:
501 |                     shp = img_boxes.shape
502 |                     self.OINPUT[0:shp[0], ] = img_boxes
503 | 
504 |                     self.OpenVinoExecutableO.requests[0].set_batch(shp[0])
505 |                     self.OpenVinoExecutableO.requests[0].infer({self.InputLayerO: self.OINPUT})
506 | 
507 |                     landmarks = self.OpenVinoExecutableO.requests[0].outputs['conv6_3'][:shp[0]]
508 |                     offsets = self.OpenVinoExecutableO.requests[0].outputs['conv6_2'][:shp[0]]
509 |                     probs = self.OpenVinoExecutableO.requests[0].outputs['prob1'][:shp[0]]
510 | 
511 |                     keep = np.where(probs[:, 1] > self.Config.ONetworkThreshold)[0]
512 |                     bounding_boxes = bounding_boxes[keep]
513 |                     bounding_boxes[:, 4] = probs[keep, 1].reshape((-1,))
514 |                     offsets = offsets[keep]
515 |                     landmarks = landmarks[keep]
516 |                     # compute landmark points
517 |                     width = bounding_boxes[:, 2] - bounding_boxes[:, 0] + 1.0
518 |                     height = bounding_boxes[:, 3] - bounding_boxes[:, 1] + 1.0
519 |                     xmin, ymin = bounding_boxes[:, 0], bounding_boxes[:, 1]
520 |                     landmarks[:, 0:5] = np.expand_dims(xmin, 1) + np.expand_dims(width, 1) * landmarks[:, 0:5]
521 |                     landmarks[:, 5:10] = np.expand_dims(ymin, 1) + np.expand_dims(height, 1) * landmarks[:, 5:10]
522 |                     bounding_boxes = self.calibrate_box(bounding_boxes, offsets)
523 |                     keep = self.nms(bounding_boxes, self.Config.NMSThresholds[2], mode='min')
524 |                     bounding_boxes = bounding_boxes[keep]
525 |                     landmarks = landmarks[keep]
526 | 
527 |         none_count = 0
528 | 
529 |         face_detections = []
530 |         landmark_detections = []
531 |         i = 0
532 |         for box in bounding_boxes:
533 |             if type(box) is type(None):
534 |                 none_count += 1
535 |             else:
536 |                 scale = box[4]
537 |                 xmin = float((box[0] / scale) / self.Config.InputWidth)
538 |                 ymin = float((box[1] / scale) / self.Config.InputHeight)
539 |                 xmax = float((box[2] / scale) / self.Config.InputWidth)
540 |                 ymax = float((box[3] / scale) / self.Config.InputHeight)
541 |                 face_detections.append([xmin, ymin, xmax, ymax])
542 |                 lands = []
543 |                 for l in range(5):
544 |                     lands.append(float((landmarks[i][l] / scale) / self.Config.InputWidth))
545 |                     lands.append(float((landmarks[i][l + 5] / scale) / self.Config.InputHeight))
546 | 
547 |                 landmark_detections.append(lands)
548 |                 i += 1
549 | 
550 |         if none_count == len(bounding_boxes):
551 |             return [], []
552 | 
553 |         self.LastFaceDetections = face_detections
554 |         self.LastLandmarkDetections = landmark_detections
555 | 
556 |         self.ElapsedInferenceTime += (time.time() - start_time)
557 | 
558 |     def infer(self, images, request_id=0):
559 |         """
560 |         Run inference
561 |         :param images: image to get faces
562 |         :param request_id: request id
563 |         :return:
564 |         """
565 |         self.run_mtcnn_face_detection(images, request_id=0)
566 | 
567 |     def request_ready(self, request_id):
568 |         """
569 |         This is true by default since there is no ASYNC mode for MTCNN
570 |         :param request_id:
571 |         :return:
572 |         """
573 |         return True
574 | 
575 |     def get_face_detection_data(self, request_id=0):
576 |         """
577 |         Get Latest Results for Face Coordinates
578 |         :param request_id:
579 |         :return:
580 |         """
581 |         return self.LastFaceDetections
582 | 
583 |     def get_face_landmarks_data(self, request_id=0):
584 |         """
585 |         Get Latest Results for Landmark Coordinates
586 |         :param request_id:
587 |         :return:
588 |         """
589 |         return self.LastLandmarkDetections
590 | 
591 |     @staticmethod
592 |     def preprocess(img):
593 |         """Preprocessing step before feeding the network.
594 | 
595 |         Arguments:
596 |             img: a float numpy array of shape [h, w, c].
597 | 
598 |         Returns:
599 |             a float numpy array of shape [1, c, h, w].
600 |         """
601 |         img = img.transpose((2, 0, 1))
602 |         img = np.expand_dims(img, 0)
603 |         img = (img - 127.5) * 0.0078125
604 |         return img
605 | 
606 |     @staticmethod
607 |     def generate_bboxes(probs, offsets, scale, threshold):
608 |         """Generate bounding boxes at places
609 |         where there is probably a face.
610 | 
611 |         Arguments:
612 |             probs: a float numpy array of shape [n, m].
613 |             offsets: a float numpy array of shape [1, 4, n, m].
614 |             scale: a float number,
615 |                 width and height of the image were scaled by this number.
616 |             threshold: a float number.
617 | 
618 |         Returns:
619 |             a float numpy array of shape [n_boxes, 9]
620 |         """
621 | 
622 |         # applying P-Net is equivalent, in some sense, to
623 |         # moving 12x12 window with stride 2
624 |         stride = 2
625 |         cell_size = 12
626 | 
627 |         # indices of boxes where there is probably a face
628 |         inds = np.where(probs > threshold)
629 | 
630 |         if inds[0].size == 0:
631 |             return np.array([])
632 | 
633 |         # transformations of bounding boxes
634 |         tx1, ty1, tx2, ty2 = [offsets[0, i, inds[0], inds[1]] for i in range(4)]
635 |         # they are defined as:
636 |         # w = x2 - x1 + 1
637 |         # h = y2 - y1 + 1
638 |         # x1_true = x1 + tx1*w
639 |         # x2_true = x2 + tx2*w
640 |         # y1_true = y1 + ty1*h
641 |         # y2_true = y2 + ty2*h
642 | 
643 |         offsets = np.array([tx1, ty1, tx2, ty2])
644 |         score = probs[inds[0], inds[1]]
645 | 
646 |         # P-Net is applied to scaled images
647 |         # so we need to rescale bounding boxes back
648 |         bounding_boxes = np.vstack([
649 |             np.round((stride * inds[1] + 1.0) / scale),
650 |             np.round((stride * inds[0] + 1.0) / scale),
651 |             np.round((stride * inds[1] + 1.0 + cell_size) / scale),
652 |             np.round((stride * inds[0] + 1.0 + cell_size) / scale),
653 |             score, offsets
654 |         ])
655 |         # why one is added?
656 | 
657 |         return bounding_boxes.T
658 | 
659 |     @staticmethod
660 |     def nms(boxes, overlap_threshold=0.5, mode='union'):
661 |         """Non-maximum suppression.
662 | 
663 |         Arguments:
664 |             boxes: a float numpy array of shape [n, 5],
665 |                 where each row is (xmin, ymin, xmax, ymax, score).
666 |             overlap_threshold: a float number.
667 |             mode: 'union' or 'min'.
668 | 
669 |         Returns:
670 |             list with indices of the selected boxes
671 |         """
672 | 
673 |         # if there are no boxes, return the empty list
674 |         if len(boxes) == 0:
675 |             return []
676 | 
677 |         # list of picked indices
678 |         pick = []
679 | 
680 |         # grab the coordinates of the bounding boxes
681 |         x1, y1, x2, y2, score = [boxes[:, i] for i in range(5)]
682 | 
683 |         area = (x2 - x1 + 1.0) * (y2 - y1 + 1.0)
684 |         ids = np.argsort(score)  # in increasing order
685 | 
686 |         while len(ids) > 0:
687 | 
688 |             # grab index of the largest value
689 |             last = len(ids) - 1
690 |             i = ids[last]
691 |             pick.append(i)
692 | 
693 |             # compute intersections
694 |             # of the box with the largest score
695 |             # with the rest of boxes
696 | 
697 |             # left top corner of intersection boxes
698 |             ix1 = np.maximum(x1[i], x1[ids[:last]])
699 |             iy1 = np.maximum(y1[i], y1[ids[:last]])
700 | 
701 |             # right bottom corner of intersection boxes
702 |             ix2 = np.minimum(x2[i], x2[ids[:last]])
703 |             iy2 = np.minimum(y2[i], y2[ids[:last]])
704 | 
705 |             # width and height of intersection boxes
706 |             w = np.maximum(0.0, ix2 - ix1 + 1.0)
707 |             h = np.maximum(0.0, iy2 - iy1 + 1.0)
708 | 
709 |             # intersections' areas
710 |             inter = w * h
711 |             if mode == 'min':
712 |                 overlap = inter / np.minimum(area[i], area[ids[:last]])
713 |             elif mode == 'union':
714 |                 # intersection over union (IoU)
715 |                 overlap = inter / (area[i] + area[ids[:last]] - inter)
716 | 
717 |             # delete all boxes where overlap is too big
718 |             ids = np.delete(
719 |                 ids,
720 |                 np.concatenate([[last], np.where(overlap > overlap_threshold)[0]])
721 |             )
722 | 
723 |         return pick
724 | 
725 |     @staticmethod
726 |     def calibrate_box(bboxes, offsets):
727 |         """Transform bounding boxes to be more like true bounding boxes.
728 |         'offsets' is one of the outputs of the nets.
729 | 
730 |         Arguments:
731 |             bboxes: a float numpy array of shape [n, 5].
732 |             offsets: a float numpy array of shape [n, 4].
733 | 
734 |         Returns:
735 |             a float numpy array of shape [n, 5].
736 |         """
737 |         x1, y1, x2, y2 = [bboxes[:, i] for i in range(4)]
738 |         w = x2 - x1 + 1.0
739 |         h = y2 - y1 + 1.0
740 |         w = np.expand_dims(w, 1)
741 |         h = np.expand_dims(h, 1)
742 | 
743 |         # this is what happening here:
744 |         # tx1, ty1, tx2, ty2 = [offsets[:, i] for i in range(4)]
745 |         # x1_true = x1 + tx1*w
746 |         # y1_true = y1 + ty1*h
747 |         # x2_true = x2 + tx2*w
748 |         # y2_true = y2 + ty2*h
749 |         # below is just more compact form of this
750 | 
751 |         # are offsets always such that
752 |         # x1 < x2 and y1 < y2 ?
753 | 
754 |         translation = np.hstack([w, h, w, h]) * offsets
755 |         bboxes[:, 0:4] = bboxes[:, 0:4] + translation
756 |         return bboxes
757 | 
758 |     @staticmethod
759 |     def convert_to_square(bboxes):
760 |         """Convert bounding boxes to a square form.
761 | 
762 |         Arguments:
763 |             bboxes: a float numpy array of shape [n, 5].
764 | 
765 |         Returns:
766 |             a float numpy array of shape [n, 5],
767 |                 squared bounding boxes.
768 |         """
769 | 
770 |         square_bboxes = np.zeros_like(bboxes)
771 |         x1, y1, x2, y2 = [bboxes[:, i] for i in range(4)]
772 |         h = y2 - y1 + 1.0
773 |         w = x2 - x1 + 1.0
774 |         max_side = np.maximum(h, w)
775 |         square_bboxes[:, 0] = x1 + w * 0.5 - max_side * 0.5
776 |         square_bboxes[:, 1] = y1 + h * 0.5 - max_side * 0.5
777 |         square_bboxes[:, 2] = square_bboxes[:, 0] + max_side - 1.0
778 |         square_bboxes[:, 3] = square_bboxes[:, 1] + max_side - 1.0
779 |         return square_bboxes
780 | 
781 |     @staticmethod
782 |     def correct_bboxes(bboxes, width, height):
783 |         """Crop boxes that are too big and get coordinates
784 |         with respect to cutouts.
785 | 
786 |         Arguments:
787 |             bboxes: a float numpy array of shape [n, 5],
788 |                 where each row is (xmin, ymin, xmax, ymax, score).
789 |             width: a float number.
790 |             height: a float number.
791 | 
792 |         Returns:
793 |             dy, dx, edy, edx: a int numpy arrays of shape [n],
794 |                 coordinates of the boxes with respect to the cutouts.
795 |             y, x, ey, ex: a int numpy arrays of shape [n],
796 |                 corrected ymin, xmin, ymax, xmax.
797 |             h, w: a int numpy arrays of shape [n],
798 |                 just heights and widths of boxes.
799 | 
800 |             in the following order:
801 |                 [dy, edy, dx, edx, y, ey, x, ex, w, h].
802 |         """
803 | 
804 |         x1, y1, x2, y2 = [bboxes[:, i] for i in range(4)]
805 |         w, h = x2 - x1 + 1.0, y2 - y1 + 1.0
806 |         num_boxes = bboxes.shape[0]
807 | 
808 |         # 'e' stands for end
809 |         # (x, y) -> (ex, ey)
810 |         x, y, ex, ey = x1, y1, x2, y2
811 | 
812 |         # we need to cut out a box from the image.
813 |         # (x, y, ex, ey) are corrected coordinates of the box
814 |         # in the image.
815 |         # (dx, dy, edx, edy) are coordinates of the box in the cutout
816 |         # from the image.
817 |         dx, dy = np.zeros((num_boxes,)), np.zeros((num_boxes,))
818 |         edx, edy = w.copy() - 1.0, h.copy() - 1.0
819 | 
820 |         # if box's bottom right corner is too far right
821 |         ind = np.where(ex > width - 1.0)[0]
822 |         edx[ind] = w[ind] + width - 2.0 - ex[ind]
823 |         ex[ind] = width - 1.0
824 | 
825 |         # if box's bottom right corner is too low
826 |         ind = np.where(ey > height - 1.0)[0]
827 |         edy[ind] = h[ind] + height - 2.0 - ey[ind]
828 |         ey[ind] = height - 1.0
829 | 
830 |         # if box's top left corner is too far left
831 |         ind = np.where(x < 0.0)[0]
832 |         dx[ind] = 0.0 - x[ind]
833 |         x[ind] = 0.0
834 | 
835 |         # if box's top left corner is too high
836 |         ind = np.where(y < 0.0)[0]
837 |         dy[ind] = 0.0 - y[ind]
838 |         y[ind] = 0.0
839 | 
840 |         return_list = [dy, edy, dx, edx, y, ey, x, ex, w, h]
841 |         return_list = [i.astype('int32') for i in return_list]
842 | 
843 |         return return_list
844 | 
845 |     @staticmethod
846 |     def get_image_boxes(bounding_boxes, img, size=24):
847 |         """Cut out boxes from the image.
848 | 
849 |         Arguments:
850 |             bounding_boxes: a float numpy array of shape [n, 5].
851 |             img: an instance of PIL.Image.
852 |             size: an integer, size of cutouts.
853 | 
854 |         Returns:
855 |             a float numpy array of shape [n, 3, size, size].
856 |         """
857 | 
858 |         num_boxes = len(bounding_boxes)
859 |         width, height = img.size
860 | 
861 |         [dy, edy, dx, edx, y, ey, x, ex, w, h] = MtCNNFaceDetection.correct_bboxes(bounding_boxes, width, height)
862 |         img_boxes = np.zeros((num_boxes, 3, size, size), 'float32')
863 | 
864 |         for i in range(num_boxes):
865 |             if h[i] <= 0 or w[i] <= 0:
866 |                 continue
867 |             img_box = np.zeros((h[i], w[i], 3), 'uint8')
868 | 
869 |             img_array = np.asarray(img, 'uint8')
870 |             img_box[dy[i]:(edy[i] + 1), dx[i]:(edx[i] + 1), :] = \
871 |                 img_array[y[i]:(ey[i] + 1), x[i]:(ex[i] + 1), :]
872 | 
873 |             # resize
874 |             img_box = Image.fromarray(img_box)
875 |             img_box = img_box.resize((size, size), Image.BILINEAR)
876 |             img_box = np.asarray(img_box, 'float32')
877 | 
878 |             img_boxes[i, :, :, :] = MtCNNFaceDetection.preprocess(img_box)
879 | 
880 |         return img_boxes


--------------------------------------------------------------------------------
/inference_services/facedetection/face_detection_service.py:
--------------------------------------------------------------------------------
  1 | # MIT License
  2 | #
  3 | # Copyright (c) 2019 Onur Dundar
  4 | #
  5 | # Permission is hereby granted, free of charge, to any person obtaining a copy
  6 | # of this software and associated documentation files (the "Software"), to deal
  7 | # in the Software without restriction, including without limitation the rights
  8 | # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  9 | # copies of the Software, and to permit persons to whom the Software is
 10 | # furnished to do so, subject to the following conditions:
 11 | #
 12 | # The above copyright notice and this permission notice shall be included in all
 13 | # copies or substantial portions of the Software.
 14 | #
 15 | # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 16 | # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 17 | # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 18 | # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 19 | # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 20 | # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 21 | # SOFTWARE.
 22 | 
 23 | from flask import Flask, request, jsonify, make_response, redirect
 24 | import logging
 25 | import sys
 26 | import optparse
 27 | import time
 28 | import cv2 as cv
 29 | import asyncio
 30 | import threading
 31 | 
 32 | from detection.face_detection_ov import FaceDetectionConfig, OpenMZooFaceDetection, FaceDetectionModelTypes, MtCNNFaceDetection, MTCNNFaceDetectionConfig
 33 | from detection.age_gender_detection_ov import AgeGenderConfig, MTCNNAgeGenderDetection, AgeGenderDetectionTypes, MTCNNAgeGenderConfig, AgeGenderDetection
 34 | from utils.image_utils import ImageUtil
 35 | 
 36 | app = Flask(__name__)
 37 | 
 38 | start = int(round(time.time()))
 39 | 
 40 | loop = asyncio.get_event_loop()
 41 | 
 42 | thread = threading.Thread()
 43 | 
 44 | class AppStatus:
 45 |     STARTED = "STARTED"
 46 |     FINISHED = "FINISHED"
 47 |     NOTSTARTED = "NOTSTARTED"
 48 |     STOPREQUEST = "STOPREQUESTED"
 49 | 
 50 | 
 51 | def prepare_configs():
 52 |     """
 53 |     Set Configurations for Face, Age Gender Models
 54 |     :return: face config, age_gender config
 55 |     """
 56 |     logging.getLogger(name="inference").log(logging.INFO, "Setting Configurations")
 57 | 
 58 |     if face_detection_model == FaceDetectionModelTypes.MTCNN:
 59 |         face_infer_cfg = MTCNNFaceDetectionConfig()
 60 |     else:
 61 |         face_infer_cfg = FaceDetectionConfig()
 62 | 
 63 |     face_infer_cfg.read_dict(json_req)
 64 | 
 65 |     logging.getLogger(name="inference").log(logging.INFO, "Configuration Set Completed...")
 66 | 
 67 |     return face_infer_cfg
 68 | 
 69 | 
 70 | async def inference():
 71 |     if inference_status == AppStatus.FINISHED or inference_status == AppStatus.NOTSTARTED:
 72 |         run_inference()
 73 |     else:
 74 |         logging.log(logging.WARN, "Inference Already Running ... ")
 75 |     loop.stop()
 76 |     return "OK"
 77 | 
 78 | 
 79 | def run_inference():
 80 |     """
 81 |     Runs Face Detection Application with the Requested JSON
 82 |     :return:
 83 |     """
 84 | 
 85 |     face_cfg = prepare_configs()
 86 | 
 87 |     if input_type == "video":
 88 |         logging.log(logging.INFO, "Video File Input Selected")
 89 |         capture = cv.VideoCapture(input_path)
 90 |         has_frame, frame = capture.read()
 91 |     elif input_type == "webcam":
 92 |         logging.log(logging.INFO, "Webcam Video Selected")
 93 |         capture = cv.VideoCapture(web_cam_index)
 94 |         has_frame, frame = capture.read()
 95 |     elif input_type == "image":
 96 |         logging.log(logging.INFO, "Single Image Inference Selected")
 97 |         frame = cv.imread(input_path)
 98 |     else:
 99 |         logging.log(logging.ERROR, "Invalid Input Type: {}".format(input_type))
100 |         exit(-1)
101 | 
102 |     face_cfg.InputHeight = frame.shape[0]
103 |     face_cfg.InputWidth = frame.shape[1]
104 | 
105 |     logging.getLogger(name="inference").log(logging.INFO, "Input Frame H: {} W: {}".format(face_cfg.InputHeight, face_cfg.InputWidth))
106 | 
107 |     if face_detection_model == FaceDetectionModelTypes.MTCNN:
108 |         face_infer = MtCNNFaceDetection(face_cfg)
109 |     else:
110 |         face_infer = OpenMZooFaceDetection(face_cfg)
111 | 
112 |     face_request_order = list()
113 |     face_process_order = list()
114 | 
115 |     for i in range(face_infer.Config.RequestCount):
116 |         face_request_order.append(i)
117 | 
118 |     frame_order = []
119 |     frame_id = 1
120 | 
121 |     global inference_status
122 |     inference_status = AppStatus.STARTED
123 | 
124 |     if save_roi_text:
125 |         roi_file = open(output_dir + roi_text_filename, 'w')
126 |         roi = "{};{};{};{};{}\n".format("frameid","xmin","ymin","xmax","ymax")
127 |         roi_file.write(roi)
128 | 
129 |     if save_roi_video:
130 |         fourcc = cv.VideoWriter_fourcc('X', '2', '6', '4')
131 |         roi_video = cv.VideoWriter(output_dir + roi_video_filename, fourcc, 10, (face_cfg.InputWidth, face_cfg.InputHeight ))
132 | 
133 |     if input_type == "video" or input_type == "webcam":
134 |         while has_frame:
135 | 
136 |             if inference_status == AppStatus.STOPREQUEST:
137 |                 break
138 | 
139 |             logging.log(logging.DEBUG, "Processing Frame {}".format(frame_id))
140 |             if len(face_request_order) > 0:
141 |                 req_id = face_request_order[0]
142 |                 face_request_order.pop(0)
143 |                 face_infer.infer(frame, req_id)
144 |                 face_process_order.append(req_id)
145 |                 frame_order.append(frame)
146 | 
147 |             if len(face_process_order) > 0:
148 |                 first = face_process_order[0]
149 |                 if face_infer.request_ready(request_id=first):
150 |                     detected_faces = face_infer.get_face_detection_data(first)
151 |                     if face_cfg.ModelType == FaceDetectionModelTypes.MTCNN:
152 |                         face_landmarks = face_infer.get_face_landmarks_data(first)
153 |                     face_process_order.pop(0)
154 |                     face_request_order.append(first)
155 |                     show_frame = frame_order[0]
156 |                     frame_order.pop(0)
157 |                     if len(detected_faces) > 0:
158 |                         for idx, face in enumerate(detected_faces):
159 |                             ImageUtil.draw_rectangle(show_frame, (face[0], face[1], face[2], face[3]))
160 | 
161 |                             if face_cfg.ModelType == FaceDetectionModelTypes.MTCNN:
162 |                                 for coordinate in range(0, len(face_landmarks[idx]), 2):
163 |                                     ImageUtil.draw_ellipse(show_frame, [face_landmarks[idx][coordinate],
164 |                                                                         face_landmarks[idx][coordinate + 1]])
165 | 
166 |                             if save_roi_text:
167 |                                 roi = "{};{};{};{};{}\n".format(frame_id, face[0], face[1], face[2], face[3])
168 |                                 roi_file.write(roi)
169 | 
170 |                     if save_only_frames and not save_roi_video and len(detected_faces) > 0:
171 |                         cv.imwrite(output_dir + roi_frame_filename + "_{}.png".format(frame_id), show_frame)
172 |                     elif save_roi_video:
173 |                         roi_video.write(show_frame)
174 | 
175 |                     # Required Since
176 |                     face_infer.LastFaceDetections = []
177 |                     face_infer.LastLandmarkDetections = []
178 | 
179 |             if len(face_request_order) > 0:
180 |                 has_frame, frame = capture.read()
181 |                 frame_id += 1
182 |     else:
183 |         face_infer.infer(frame)
184 |         faces = face_infer.get_face_detection_data()
185 |         if face_cfg.ModelType == FaceDetectionModelTypes.MTCNN:
186 |             landmarks = face_infer.get_face_landmarks_data()
187 | 
188 |         if len(faces) > 0:
189 |             print("Detected {} Faces with {} Threshold".format(len(faces), face_infer.Config.FaceDetectionThreshold))
190 |             for idx, face in enumerate(faces):
191 |                 ImageUtil.draw_rectangle(frame, (face[0], face[1], face[2], face[3]))
192 | 
193 |                 if face_cfg.ModelType == FaceDetectionModelTypes.MTCNN:
194 |                     for coordinate in range(0, len(landmarks[idx]), 2):
195 |                         ImageUtil.draw_ellipse(frame, [landmarks[idx][coordinate], landmarks[idx][coordinate + 1]])
196 | 
197 |                 if save_roi_text:
198 |                     roi = "{};{};{};{};{}\n".format(frame_id, face[0], face[1], face[2], face[3])
199 |                     roi_file.write(roi)
200 | 
201 |                 if save_only_frames:
202 |                     cv.imwrite(output_dir + roi_frame_filename + "_{}.png".format(frame_id), frame)
203 | 
204 |     face_infer.print_inference_performance_metrics()
205 | 
206 |     inference_status = AppStatus.FINISHED
207 | 
208 |     roi_file.close()
209 |     roi_video.release()
210 | 
211 | 
212 | inference_status = AppStatus.NOTSTARTED
213 | 
214 | input_type = "image"
215 | input_path = ''
216 | web_cam_index = 0
217 | face_detection_model = FaceDetectionModelTypes.OPENMODELZOO
218 | logfile_name = "log.txt" # "/app/log.txt"
219 | json_req = None
220 | 
221 | output_dir = "./"
222 | roi_text_filename = "inference_roi.txt"
223 | roi_video_filename = "inference_roi.mp4"
224 | roi_frame_filename = "inference_frame"
225 | 
226 | save_roi_video = False
227 | save_only_frames = False
228 | save_roi_text = True
229 | 
230 | 
231 | @app.route("/", methods=['GET', 'POST'])
232 | def start():
233 |     if request.is_json:
234 |         # Parse the JSON into a Python dictionary
235 |         req = request.json
236 |         try:
237 |             if req["log_level"] == "DEBUG":
238 |                 logging.basicConfig(filename=logfile_name,
239 |                                     level=logging.DEBUG,
240 |                                     filemode='a',
241 |                                     format='%(asctime)s,%(msecs)d %(name)s %(levelname)s %(message)s',
242 |                                     datefmt='%H:%M:%S')
243 |             elif req["log_level"] == "INFO":
244 |                 logging.basicConfig(filename=logfile_name,
245 |                                     level=logging.INFO,
246 |                                     filemode='a',
247 |                                     format='%(asctime)s,%(msecs)d %(name)s %(levelname)s %(message)s',
248 |                                     datefmt='%H:%M:%S')
249 |             elif req["log_level"] == "WARN":
250 |                 logging.basicConfig(filename=logfile_name,
251 |                                     level=logging.WARN,
252 |                                     filemode='a',
253 |                                     format='%(asctime)s,%(msecs)d %(name)s %(levelname)s %(message)s',
254 |                                     datefmt='%H:%M:%S')
255 |             else:
256 |                 logging.basicConfig(filename=logfile_name,
257 |                                     level=logging.ERROR,
258 |                                     filemode='a',
259 |                                     format='%(asctime)s,%(msecs)d %(name)s %(levelname)s %(message)s',
260 |                                     datefmt='%H:%M:%S')
261 | 
262 |             logging.log(logging.WARN, "Log Level Set to: {}".format(req["log_level"]))
263 | 
264 |             global input_path
265 |             input_path = req["input_path"]
266 | 
267 |             logging.log(logging.WARN, "Input Path: {}".format(req["input_path"]))
268 | 
269 |             global input_type
270 |             input_type = req["input_type"]
271 | 
272 |             logging.log(logging.WARN, "Input Type: {}".format(req["input_type"]))
273 | 
274 |             global web_cam_index
275 |             web_cam_index = int(req["web_cam_index"])
276 | 
277 |             logging.log(logging.WARN, "Web Cam {}".format(req["web_cam_index"]))
278 | 
279 |             global face_detection_model
280 |             if req['face_detection_model'] == FaceDetectionModelTypes.MTCNN:
281 |                 face_detection_model = FaceDetectionModelTypes.MTCNN
282 | 
283 |             logging.log(logging.WARN, "Face Detection Model {}".format(req["face_detection_model"]))
284 | 
285 |             global save_roi_video
286 |             if req["save_roi_video"] == "True":
287 |                 save_roi_video = True
288 | 
289 |             global save_only_frames
290 |             if req["save_only_frames"] == "True":
291 |                 save_only_frames = True
292 | 
293 |             global save_roi_text
294 |             if req["save_roi"] == "False":
295 |                 save_roi_text = False
296 | 
297 |             res = make_response(jsonify({"message": "INFERENCE STARTED"}), 200)
298 | 
299 |             global json_req
300 |             json_req = req
301 | 
302 |             #threading.Thread(target=run_inference()).start()
303 |             # Start Async Thread
304 |             logging.log(logging.WARN, "Starting Inference ...")
305 |             task = loop.create_task(inference())
306 | 
307 |             if not loop.is_running():
308 |                 loop.run_forever()
309 |             else:
310 |                 logging.log(logging.WARN, "Thread Loop Running ...")
311 | 
312 |             return res
313 |         except KeyError:
314 |             logging.log(logging.ERROR, "Key Not Found Error")
315 |             exit(-1)
316 |         except Exception as e:
317 |             logging.log(logging.ERROR, e.__str__())
318 |             exit(-1)
319 |         # Return a string along with an HTTP status code
320 | 
321 |     else:
322 |         # The request body wasn't JSON so return a 400 HTTP status code
323 |         return "Request was not JSON", 400
324 | 
325 | 
326 | @app.route("/status", methods=["GET"])
327 | def status():
328 |     """
329 |     Get App Status
330 |     :return:
331 |     """
332 |     logging.log(logging.WARN, "STATUS CALLED")
333 |     return jsonify(inference_status), 200
334 | 
335 | 
336 | @app.route("/stop_inference", methods=["POST"])
337 | def stop_inference():
338 |     """
339 |     Get App Status
340 |     :return:
341 |     """
342 | 
343 |     global inference_status
344 |     inference_status = AppStatus.STOPREQUEST
345 |     logging.log(logging.WARN, "STOPPING INFERENCE ... ")
346 |     return jsonify(inference_status), 200
347 | 
348 | 
349 | @app.route("/logs", methods=["GET"])
350 | def logs():
351 |     """
352 |     Show Logs
353 |     :return:
354 |     """
355 |     with open(logfile_name) as f:
356 |         file_content = f.read()
357 | 
358 |     return file_content, 200
359 | 
360 | 
361 | @app.route("/results", methods=["GET"])
362 | def results():
363 |     """
364 |     Get Latest Results
365 |     :return:
366 |     """
367 | 
368 |     roifile = output_dir + roi_text_filename
369 |     with open(roifile) as f:
370 |         file_content = f.read()
371 | 
372 |     return file_content
373 | 
374 | 
375 | @app.route('/play_roi', methods=["GET"])
376 | def play_roi():
377 |     return redirect(output_dir + roi_video_filename)
378 | 
379 | 
380 | if __name__ == '__main__':
381 |     parser = optparse.OptionParser(usage="python3 /app/face_detection_service.py -p ")
382 |     parser.add_option('-p', '--port', action='store', dest='port', help='The port to listen on.')
383 | 
384 |     (args, _) = parser.parse_args()
385 | 
386 |     if args.port is None:
387 |         print("Missing required argument: -p/--port")
388 |         sys.exit(1)
389 | 
390 |     app.run(host='0.0.0.0', port=int(args.port), debug=True, threaded=True)


--------------------------------------------------------------------------------
/inference_services/facedetection/inference_config.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "omz_facedetection" : {
 3 |     "model_path" : "/app/models/",
 4 |     "model_name" : "face-detection-retail-0013",
 5 |     "target_device" : "CPU",
 6 |     "cpu_extension" : "True",
 7 |     "cpu_extension_path" : "/opt/intel/openvino/inference_engine/lib/intel64/libcpu_extension.so",
 8 |     "face_detection_threshold" : 0.6,
 9 |     "async" : "False",
10 |     "request_count" : 1,
11 |     "dynamic_batch" : "False",
12 |     "batch_size" : 1,
13 |     "limit_cpu_threads" : "False",
14 |     "number_of_cpu_threads" : 4,
15 |     "bind_cpu_threads" : "True",
16 |     "cpu_stream" : "AUTO",
17 |     "gpu_stream" : "AUTO"
18 |   },
19 | 
20 |   "mtcnn_facedetection" : {
21 |     "model_path" : "/app/models/",
22 |     "p_model_file_name" : "det1-0001",
23 |     "r_model_file_name" : "det2-0001",
24 |     "o_model_file_name" : "det3-0001",
25 |     "target_device" : "CPU",
26 |     "cpu_extension" : "True",
27 |     "cpu_extension_path" : "/opt/intel/openvino/inference_engine/lib/intel64/libcpu_extension_sse4.so",
28 | 
29 |     "p_network_threshold" : 0.6,
30 |     "r_network_threshold" : 0.7,
31 |     "o_network_threshold" : 0.8,
32 | 
33 |     "minimum_face_size" : 15.0,
34 |     "minimum_length" : 720,
35 |     "factor_count" : 0,
36 |     "factor" : 0.707,
37 |     "min_detection_size" : 12,
38 | 
39 |     "nms_thresholds" : [0.6, 0.6, 0.6],
40 |     "r_input_batch_size" : 256,
41 |     "o_input_batch_size" : 256,
42 | 
43 |     "limit_cpu_threads" : "False",
44 |     "number_of_cpu_threads" : 4,
45 |     "bind_cpu_threads" : "True",
46 |     "cpu_stream" : "AUTO",
47 |     "gpu_stream" : "AUTO"
48 |   },
49 | 
50 |   "face_detection_model" : "mtcnn_facedetection",
51 |   "input_type" : "video",
52 |   "input_path" : "/app/videos/facedetection.mp4",
53 |   "web_cam_index" : "0",
54 |   "log_level" : "DEBUG",
55 | 
56 |   "save_roi_video" : "False",
57 |   "save_only_frames" : "False",
58 |   "save_roi" : "True"
59 | }


--------------------------------------------------------------------------------
/inference_services/facedetection/models/age-gender-recognition-retail-0013.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/odundar/face-detection-python/8ef8863d85c4ddd3c67512ff3e48fa4cf7c1d770/inference_services/facedetection/models/age-gender-recognition-retail-0013.bin


--------------------------------------------------------------------------------
/inference_services/facedetection/models/age-gender-recognition-retail-0013.xml:
--------------------------------------------------------------------------------
  1 | <?xml version="1.0" ?>
  2 | <net batch="1" name="age_gender" version="6">
  3 | 	<layers>
  4 | 		<layer id="0" name="data" precision="FP32" type="Input">
  5 | 			<output>
  6 | 				<port id="0">
  7 | 					<dim>1</dim>
  8 | 					<dim>3</dim>
  9 | 					<dim>62</dim>
 10 | 					<dim>62</dim>
 11 | 				</port>
 12 | 			</output>
 13 | 		</layer>
 14 | 		<layer id="1" name="conv1" precision="FP32" type="Convolution">
 15 | 			<data dilations="1,1" group="1" kernel="3,3" output="48" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
 16 | 			<input>
 17 | 				<port id="0">
 18 | 					<dim>1</dim>
 19 | 					<dim>3</dim>
 20 | 					<dim>62</dim>
 21 | 					<dim>62</dim>
 22 | 				</port>
 23 | 			</input>
 24 | 			<output>
 25 | 				<port id="3">
 26 | 					<dim>1</dim>
 27 | 					<dim>48</dim>
 28 | 					<dim>60</dim>
 29 | 					<dim>60</dim>
 30 | 				</port>
 31 | 			</output>
 32 | 			<blobs>
 33 | 				<weights offset="0" size="5184"/>
 34 | 				<biases offset="5184" size="192"/>
 35 | 			</blobs>
 36 | 		</layer>
 37 | 		<layer id="2" name="pool1" precision="FP32" type="Pooling">
 38 | 			<data exclude-pad="true" kernel="3,3" pads_begin="0,0" pads_end="0,0" pool-method="max" rounding_type="ceil" strides="2,2"/>
 39 | 			<input>
 40 | 				<port id="0">
 41 | 					<dim>1</dim>
 42 | 					<dim>48</dim>
 43 | 					<dim>60</dim>
 44 | 					<dim>60</dim>
 45 | 				</port>
 46 | 			</input>
 47 | 			<output>
 48 | 				<port id="1">
 49 | 					<dim>1</dim>
 50 | 					<dim>48</dim>
 51 | 					<dim>30</dim>
 52 | 					<dim>30</dim>
 53 | 				</port>
 54 | 			</output>
 55 | 		</layer>
 56 | 		<layer id="3" name="relu1" precision="FP32" type="ReLU">
 57 | 			<input>
 58 | 				<port id="0">
 59 | 					<dim>1</dim>
 60 | 					<dim>48</dim>
 61 | 					<dim>30</dim>
 62 | 					<dim>30</dim>
 63 | 				</port>
 64 | 			</input>
 65 | 			<output>
 66 | 				<port id="1">
 67 | 					<dim>1</dim>
 68 | 					<dim>48</dim>
 69 | 					<dim>30</dim>
 70 | 					<dim>30</dim>
 71 | 				</port>
 72 | 			</output>
 73 | 		</layer>
 74 | 		<layer id="4" name="conv2" precision="FP32" type="Convolution">
 75 | 			<data dilations="1,1" group="1" kernel="3,3" output="64" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
 76 | 			<input>
 77 | 				<port id="0">
 78 | 					<dim>1</dim>
 79 | 					<dim>48</dim>
 80 | 					<dim>30</dim>
 81 | 					<dim>30</dim>
 82 | 				</port>
 83 | 			</input>
 84 | 			<output>
 85 | 				<port id="3">
 86 | 					<dim>1</dim>
 87 | 					<dim>64</dim>
 88 | 					<dim>28</dim>
 89 | 					<dim>28</dim>
 90 | 				</port>
 91 | 			</output>
 92 | 			<blobs>
 93 | 				<weights offset="5376" size="110592"/>
 94 | 				<biases offset="115968" size="256"/>
 95 | 			</blobs>
 96 | 		</layer>
 97 | 		<layer id="5" name="pool2" precision="FP32" type="Pooling">
 98 | 			<data exclude-pad="true" kernel="3,3" pads_begin="0,0" pads_end="0,0" pool-method="max" rounding_type="ceil" strides="2,2"/>
 99 | 			<input>
100 | 				<port id="0">
101 | 					<dim>1</dim>
102 | 					<dim>64</dim>
103 | 					<dim>28</dim>
104 | 					<dim>28</dim>
105 | 				</port>
106 | 			</input>
107 | 			<output>
108 | 				<port id="1">
109 | 					<dim>1</dim>
110 | 					<dim>64</dim>
111 | 					<dim>14</dim>
112 | 					<dim>14</dim>
113 | 				</port>
114 | 			</output>
115 | 		</layer>
116 | 		<layer id="6" name="relu2" precision="FP32" type="ReLU">
117 | 			<input>
118 | 				<port id="0">
119 | 					<dim>1</dim>
120 | 					<dim>64</dim>
121 | 					<dim>14</dim>
122 | 					<dim>14</dim>
123 | 				</port>
124 | 			</input>
125 | 			<output>
126 | 				<port id="1">
127 | 					<dim>1</dim>
128 | 					<dim>64</dim>
129 | 					<dim>14</dim>
130 | 					<dim>14</dim>
131 | 				</port>
132 | 			</output>
133 | 		</layer>
134 | 		<layer id="7" name="conv3" precision="FP32" type="Convolution">
135 | 			<data dilations="1,1" group="1" kernel="3,3" output="96" pads_begin="1,1" pads_end="1,1" strides="1,1"/>
136 | 			<input>
137 | 				<port id="0">
138 | 					<dim>1</dim>
139 | 					<dim>64</dim>
140 | 					<dim>14</dim>
141 | 					<dim>14</dim>
142 | 				</port>
143 | 			</input>
144 | 			<output>
145 | 				<port id="3">
146 | 					<dim>1</dim>
147 | 					<dim>96</dim>
148 | 					<dim>14</dim>
149 | 					<dim>14</dim>
150 | 				</port>
151 | 			</output>
152 | 			<blobs>
153 | 				<weights offset="116224" size="221184"/>
154 | 				<biases offset="337408" size="384"/>
155 | 			</blobs>
156 | 		</layer>
157 | 		<layer id="8" name="pool3" precision="FP32" type="Pooling">
158 | 			<data exclude-pad="true" kernel="3,3" pads_begin="0,0" pads_end="0,0" pool-method="max" rounding_type="ceil" strides="2,2"/>
159 | 			<input>
160 | 				<port id="0">
161 | 					<dim>1</dim>
162 | 					<dim>96</dim>
163 | 					<dim>14</dim>
164 | 					<dim>14</dim>
165 | 				</port>
166 | 			</input>
167 | 			<output>
168 | 				<port id="1">
169 | 					<dim>1</dim>
170 | 					<dim>96</dim>
171 | 					<dim>7</dim>
172 | 					<dim>7</dim>
173 | 				</port>
174 | 			</output>
175 | 		</layer>
176 | 		<layer id="9" name="relu3" precision="FP32" type="ReLU">
177 | 			<input>
178 | 				<port id="0">
179 | 					<dim>1</dim>
180 | 					<dim>96</dim>
181 | 					<dim>7</dim>
182 | 					<dim>7</dim>
183 | 				</port>
184 | 			</input>
185 | 			<output>
186 | 				<port id="1">
187 | 					<dim>1</dim>
188 | 					<dim>96</dim>
189 | 					<dim>7</dim>
190 | 					<dim>7</dim>
191 | 				</port>
192 | 			</output>
193 | 		</layer>
194 | 		<layer id="10" name="conv4" precision="FP32" type="Convolution">
195 | 			<data dilations="1,1" group="1" kernel="3,3" output="192" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
196 | 			<input>
197 | 				<port id="0">
198 | 					<dim>1</dim>
199 | 					<dim>96</dim>
200 | 					<dim>7</dim>
201 | 					<dim>7</dim>
202 | 				</port>
203 | 			</input>
204 | 			<output>
205 | 				<port id="3">
206 | 					<dim>1</dim>
207 | 					<dim>192</dim>
208 | 					<dim>5</dim>
209 | 					<dim>5</dim>
210 | 				</port>
211 | 			</output>
212 | 			<blobs>
213 | 				<weights offset="337792" size="663552"/>
214 | 				<biases offset="1001344" size="768"/>
215 | 			</blobs>
216 | 		</layer>
217 | 		<layer id="11" name="relu4" precision="FP32" type="ReLU">
218 | 			<input>
219 | 				<port id="0">
220 | 					<dim>1</dim>
221 | 					<dim>192</dim>
222 | 					<dim>5</dim>
223 | 					<dim>5</dim>
224 | 				</port>
225 | 			</input>
226 | 			<output>
227 | 				<port id="1">
228 | 					<dim>1</dim>
229 | 					<dim>192</dim>
230 | 					<dim>5</dim>
231 | 					<dim>5</dim>
232 | 				</port>
233 | 			</output>
234 | 		</layer>
235 | 		<layer id="12" name="conv5" precision="FP32" type="Convolution">
236 | 			<data dilations="1,1" group="1" kernel="3,3" output="256" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
237 | 			<input>
238 | 				<port id="0">
239 | 					<dim>1</dim>
240 | 					<dim>192</dim>
241 | 					<dim>5</dim>
242 | 					<dim>5</dim>
243 | 				</port>
244 | 			</input>
245 | 			<output>
246 | 				<port id="3">
247 | 					<dim>1</dim>
248 | 					<dim>256</dim>
249 | 					<dim>3</dim>
250 | 					<dim>3</dim>
251 | 				</port>
252 | 			</output>
253 | 			<blobs>
254 | 				<weights offset="1002112" size="1769472"/>
255 | 				<biases offset="2771584" size="1024"/>
256 | 			</blobs>
257 | 		</layer>
258 | 		<layer id="13" name="relu5" precision="FP32" type="ReLU">
259 | 			<input>
260 | 				<port id="0">
261 | 					<dim>1</dim>
262 | 					<dim>256</dim>
263 | 					<dim>3</dim>
264 | 					<dim>3</dim>
265 | 				</port>
266 | 			</input>
267 | 			<output>
268 | 				<port id="1">
269 | 					<dim>1</dim>
270 | 					<dim>256</dim>
271 | 					<dim>3</dim>
272 | 					<dim>3</dim>
273 | 				</port>
274 | 			</output>
275 | 		</layer>
276 | 		<layer id="14" name="age_conv1" precision="FP32" type="Convolution">
277 | 			<data dilations="1,1" group="1" kernel="3,3" output="256" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
278 | 			<input>
279 | 				<port id="0">
280 | 					<dim>1</dim>
281 | 					<dim>256</dim>
282 | 					<dim>3</dim>
283 | 					<dim>3</dim>
284 | 				</port>
285 | 			</input>
286 | 			<output>
287 | 				<port id="3">
288 | 					<dim>1</dim>
289 | 					<dim>256</dim>
290 | 					<dim>1</dim>
291 | 					<dim>1</dim>
292 | 				</port>
293 | 			</output>
294 | 			<blobs>
295 | 				<weights offset="2772608" size="2359296"/>
296 | 				<biases offset="5131904" size="1024"/>
297 | 			</blobs>
298 | 		</layer>
299 | 		<layer id="15" name="relu6_a" precision="FP32" type="ReLU">
300 | 			<input>
301 | 				<port id="0">
302 | 					<dim>1</dim>
303 | 					<dim>256</dim>
304 | 					<dim>1</dim>
305 | 					<dim>1</dim>
306 | 				</port>
307 | 			</input>
308 | 			<output>
309 | 				<port id="1">
310 | 					<dim>1</dim>
311 | 					<dim>256</dim>
312 | 					<dim>1</dim>
313 | 					<dim>1</dim>
314 | 				</port>
315 | 			</output>
316 | 		</layer>
317 | 		<layer id="16" name="age_conv2" precision="FP32" type="Convolution">
318 | 			<data dilations="1,1" group="1" kernel="1,1" output="512" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
319 | 			<input>
320 | 				<port id="0">
321 | 					<dim>1</dim>
322 | 					<dim>256</dim>
323 | 					<dim>1</dim>
324 | 					<dim>1</dim>
325 | 				</port>
326 | 			</input>
327 | 			<output>
328 | 				<port id="3">
329 | 					<dim>1</dim>
330 | 					<dim>512</dim>
331 | 					<dim>1</dim>
332 | 					<dim>1</dim>
333 | 				</port>
334 | 			</output>
335 | 			<blobs>
336 | 				<weights offset="5132928" size="524288"/>
337 | 				<biases offset="5657216" size="2048"/>
338 | 			</blobs>
339 | 		</layer>
340 | 		<layer id="17" name="relu7_a" precision="FP32" type="ReLU">
341 | 			<input>
342 | 				<port id="0">
343 | 					<dim>1</dim>
344 | 					<dim>512</dim>
345 | 					<dim>1</dim>
346 | 					<dim>1</dim>
347 | 				</port>
348 | 			</input>
349 | 			<output>
350 | 				<port id="1">
351 | 					<dim>1</dim>
352 | 					<dim>512</dim>
353 | 					<dim>1</dim>
354 | 					<dim>1</dim>
355 | 				</port>
356 | 			</output>
357 | 		</layer>
358 | 		<layer id="18" name="age_conv3" precision="FP32" type="Convolution">
359 | 			<data dilations="1,1" group="1" kernel="1,1" output="1" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
360 | 			<input>
361 | 				<port id="0">
362 | 					<dim>1</dim>
363 | 					<dim>512</dim>
364 | 					<dim>1</dim>
365 | 					<dim>1</dim>
366 | 				</port>
367 | 			</input>
368 | 			<output>
369 | 				<port id="3">
370 | 					<dim>1</dim>
371 | 					<dim>1</dim>
372 | 					<dim>1</dim>
373 | 					<dim>1</dim>
374 | 				</port>
375 | 			</output>
376 | 			<blobs>
377 | 				<weights offset="5659264" size="2048"/>
378 | 				<biases offset="5661312" size="4"/>
379 | 			</blobs>
380 | 		</layer>
381 | 		<layer id="19" name="gender_conv1" precision="FP32" type="Convolution">
382 | 			<data dilations="1,1" group="1" kernel="3,3" output="256" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
383 | 			<input>
384 | 				<port id="0">
385 | 					<dim>1</dim>
386 | 					<dim>256</dim>
387 | 					<dim>3</dim>
388 | 					<dim>3</dim>
389 | 				</port>
390 | 			</input>
391 | 			<output>
392 | 				<port id="3">
393 | 					<dim>1</dim>
394 | 					<dim>256</dim>
395 | 					<dim>1</dim>
396 | 					<dim>1</dim>
397 | 				</port>
398 | 			</output>
399 | 			<blobs>
400 | 				<weights offset="5661316" size="2359296"/>
401 | 				<biases offset="8020612" size="1024"/>
402 | 			</blobs>
403 | 		</layer>
404 | 		<layer id="20" name="relu6_g" precision="FP32" type="ReLU">
405 | 			<input>
406 | 				<port id="0">
407 | 					<dim>1</dim>
408 | 					<dim>256</dim>
409 | 					<dim>1</dim>
410 | 					<dim>1</dim>
411 | 				</port>
412 | 			</input>
413 | 			<output>
414 | 				<port id="1">
415 | 					<dim>1</dim>
416 | 					<dim>256</dim>
417 | 					<dim>1</dim>
418 | 					<dim>1</dim>
419 | 				</port>
420 | 			</output>
421 | 		</layer>
422 | 		<layer id="21" name="gender_conv2" precision="FP32" type="Convolution">
423 | 			<data dilations="1,1" group="1" kernel="1,1" output="512" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
424 | 			<input>
425 | 				<port id="0">
426 | 					<dim>1</dim>
427 | 					<dim>256</dim>
428 | 					<dim>1</dim>
429 | 					<dim>1</dim>
430 | 				</port>
431 | 			</input>
432 | 			<output>
433 | 				<port id="3">
434 | 					<dim>1</dim>
435 | 					<dim>512</dim>
436 | 					<dim>1</dim>
437 | 					<dim>1</dim>
438 | 				</port>
439 | 			</output>
440 | 			<blobs>
441 | 				<weights offset="8021636" size="524288"/>
442 | 				<biases offset="8545924" size="2048"/>
443 | 			</blobs>
444 | 		</layer>
445 | 		<layer id="22" name="relu7_g" precision="FP32" type="ReLU">
446 | 			<input>
447 | 				<port id="0">
448 | 					<dim>1</dim>
449 | 					<dim>512</dim>
450 | 					<dim>1</dim>
451 | 					<dim>1</dim>
452 | 				</port>
453 | 			</input>
454 | 			<output>
455 | 				<port id="1">
456 | 					<dim>1</dim>
457 | 					<dim>512</dim>
458 | 					<dim>1</dim>
459 | 					<dim>1</dim>
460 | 				</port>
461 | 			</output>
462 | 		</layer>
463 | 		<layer id="23" name="gender_conv3" precision="FP32" type="Convolution">
464 | 			<data dilations="1,1" group="1" kernel="1,1" output="2" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
465 | 			<input>
466 | 				<port id="0">
467 | 					<dim>1</dim>
468 | 					<dim>512</dim>
469 | 					<dim>1</dim>
470 | 					<dim>1</dim>
471 | 				</port>
472 | 			</input>
473 | 			<output>
474 | 				<port id="3">
475 | 					<dim>1</dim>
476 | 					<dim>2</dim>
477 | 					<dim>1</dim>
478 | 					<dim>1</dim>
479 | 				</port>
480 | 			</output>
481 | 			<blobs>
482 | 				<weights offset="8547972" size="4096"/>
483 | 				<biases offset="8552068" size="8"/>
484 | 			</blobs>
485 | 		</layer>
486 | 		<layer id="24" name="prob" precision="FP32" type="SoftMax">
487 | 			<data axis="1"/>
488 | 			<input>
489 | 				<port id="0">
490 | 					<dim>1</dim>
491 | 					<dim>2</dim>
492 | 					<dim>1</dim>
493 | 					<dim>1</dim>
494 | 				</port>
495 | 			</input>
496 | 			<output>
497 | 				<port id="1">
498 | 					<dim>1</dim>
499 | 					<dim>2</dim>
500 | 					<dim>1</dim>
501 | 					<dim>1</dim>
502 | 				</port>
503 | 			</output>
504 | 		</layer>
505 | 	</layers>
506 | 	<edges>
507 | 		<edge from-layer="0" from-port="0" to-layer="1" to-port="0"/>
508 | 		<edge from-layer="1" from-port="3" to-layer="2" to-port="0"/>
509 | 		<edge from-layer="2" from-port="1" to-layer="3" to-port="0"/>
510 | 		<edge from-layer="3" from-port="1" to-layer="4" to-port="0"/>
511 | 		<edge from-layer="4" from-port="3" to-layer="5" to-port="0"/>
512 | 		<edge from-layer="5" from-port="1" to-layer="6" to-port="0"/>
513 | 		<edge from-layer="6" from-port="1" to-layer="7" to-port="0"/>
514 | 		<edge from-layer="7" from-port="3" to-layer="8" to-port="0"/>
515 | 		<edge from-layer="8" from-port="1" to-layer="9" to-port="0"/>
516 | 		<edge from-layer="9" from-port="1" to-layer="10" to-port="0"/>
517 | 		<edge from-layer="10" from-port="3" to-layer="11" to-port="0"/>
518 | 		<edge from-layer="11" from-port="1" to-layer="12" to-port="0"/>
519 | 		<edge from-layer="12" from-port="3" to-layer="13" to-port="0"/>
520 | 		<edge from-layer="13" from-port="1" to-layer="14" to-port="0"/>
521 | 		<edge from-layer="14" from-port="3" to-layer="15" to-port="0"/>
522 | 		<edge from-layer="15" from-port="1" to-layer="16" to-port="0"/>
523 | 		<edge from-layer="16" from-port="3" to-layer="17" to-port="0"/>
524 | 		<edge from-layer="17" from-port="1" to-layer="18" to-port="0"/>
525 | 		<edge from-layer="13" from-port="1" to-layer="19" to-port="0"/>
526 | 		<edge from-layer="19" from-port="3" to-layer="20" to-port="0"/>
527 | 		<edge from-layer="20" from-port="1" to-layer="21" to-port="0"/>
528 | 		<edge from-layer="21" from-port="3" to-layer="22" to-port="0"/>
529 | 		<edge from-layer="22" from-port="1" to-layer="23" to-port="0"/>
530 | 		<edge from-layer="23" from-port="3" to-layer="24" to-port="0"/>
531 | 	</edges>
532 | 	<meta_data>
533 | 		<MO_version value="2019.2.0-402-g82c4801"/>
534 | 		<cli_parameters>
535 | 			<blobs_as_inputs value="False"/>
536 | 			<caffe_parser_path value="DIR"/>
537 | 			<data_type value="FP32"/>
538 | 			<disable_nhwc_to_nchw value="False"/>
539 | 			<disable_omitting_optional value="False"/>
540 | 			<disable_resnet_optimization value="False"/>
541 | 			<enable_concat_optimization value="False"/>
542 | 			<enable_flattening_nested_params value="False"/>
543 | 			<enable_ssd_gluoncv value="False"/>
544 | 			<extensions value="DIR"/>
545 | 			<framework value="caffe"/>
546 | 			<freeze_placeholder_with_value value="{}"/>
547 | 			<generate_experimental_IR_V10 value="False"/>
548 | 			<input value="data"/>
549 | 			<input_model value="DIR/age_gender_net.caffemodel"/>
550 | 			<input_model_is_text value="False"/>
551 | 			<input_proto value="DIR/age_gender_net.prototxt"/>
552 | 			<input_shape value="[1,3,62,62]"/>
553 | 			<k value="DIR/CustomLayersMapping.xml"/>
554 | 			<keep_quantize_ops_in_IR value="False"/>
555 | 			<keep_shape_ops value="False"/>
556 | 			<legacy_mxnet_model value="False"/>
557 | 			<log_level value="ERROR"/>
558 | 			<mean_scale_values value="{'data': {'mean': None, 'scale': array([254.99991075])}}"/>
559 | 			<mean_values value="()"/>
560 | 			<model_name value="age-gender-recognition-retail-0013"/>
561 | 			<move_to_preprocess value="False"/>
562 | 			<output value="['prob', 'age_conv3']"/>
563 | 			<output_dir value="DIR"/>
564 | 			<placeholder_shapes value="{'data': array([ 1,  3, 62, 62])}"/>
565 | 			<remove_output_softmax value="False"/>
566 | 			<reverse_input_channels value="False"/>
567 | 			<save_params_from_nd value="False"/>
568 | 			<scale_values value="data[254.99991075003123]"/>
569 | 			<silent value="False"/>
570 | 			<version value="False"/>
571 | 			<unset unset_cli_parameters="batch, counts, disable_fusing, disable_gfusing, finegrain_fusing, generate_deprecated_IR_V2, input_checkpoint, input_meta_graph, input_symbol, mean_file, mean_file_offsets, nd_prefix_name, pretrained_model_name, saved_model_dir, saved_model_tags, scale, tensorboard_logdir, tensorflow_custom_layer_libraries, tensorflow_custom_operations_config_update, tensorflow_object_detection_api_pipeline_config, tensorflow_operation_patterns, tensorflow_subgraph_patterns, tensorflow_use_custom_operations_config"/>
572 | 		</cli_parameters>
573 | 	</meta_data>
574 | </net>
575 | 


--------------------------------------------------------------------------------
/inference_services/facedetection/models/det1-0001.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/odundar/face-detection-python/8ef8863d85c4ddd3c67512ff3e48fa4cf7c1d770/inference_services/facedetection/models/det1-0001.bin


--------------------------------------------------------------------------------
/inference_services/facedetection/models/det1-0001.mapping:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" ?>
 2 | <mapping>
 3 | 	<map>
 4 | 		<framework name="conv4_1" out_port_id="0"/>
 5 | 		<IR id="9" name="conv4_1" out_port_id="3"/>
 6 | 	</map>
 7 | 	<map>
 8 | 		<framework name="prelu1" out_port_id="0"/>
 9 | 		<IR id="2" name="prelu1" out_port_id="2"/>
10 | 	</map>
11 | 	<map>
12 | 		<framework name="prelu2" out_port_id="0"/>
13 | 		<IR id="5" name="prelu2" out_port_id="2"/>
14 | 	</map>
15 | 	<map>
16 | 		<framework name="conv3" out_port_id="0"/>
17 | 		<IR id="6" name="conv3" out_port_id="3"/>
18 | 	</map>
19 | 	<map>
20 | 		<framework name="pool1" out_port_id="0"/>
21 | 		<IR id="3" name="pool1" out_port_id="1"/>
22 | 	</map>
23 | 	<map>
24 | 		<framework name="prob1" out_port_id="0"/>
25 | 		<IR id="10" name="prob1" out_port_id="1"/>
26 | 	</map>
27 | 	<map>
28 | 		<framework name="conv4_2" out_port_id="0"/>
29 | 		<IR id="8" name="conv4_2" out_port_id="3"/>
30 | 	</map>
31 | 	<map>
32 | 		<framework name="data" out_port_id="0"/>
33 | 		<IR id="0" name="data" out_port_id="0"/>
34 | 	</map>
35 | 	<map>
36 | 		<framework name="conv1" out_port_id="0"/>
37 | 		<IR id="1" name="conv1" out_port_id="3"/>
38 | 	</map>
39 | 	<map>
40 | 		<framework name="prelu3" out_port_id="0"/>
41 | 		<IR id="7" name="prelu3" out_port_id="2"/>
42 | 	</map>
43 | 	<map>
44 | 		<framework name="conv2" out_port_id="0"/>
45 | 		<IR id="4" name="conv2" out_port_id="3"/>
46 | 	</map>
47 | </mapping>
48 | 


--------------------------------------------------------------------------------
/inference_services/facedetection/models/det1-0001.xml:
--------------------------------------------------------------------------------
  1 | <?xml version="1.0" ?>
  2 | <net batch="1" name="det1-0001" version="6">
  3 | 	<layers>
  4 | 		<layer id="0" name="data" precision="FP32" type="Input">
  5 | 			<output>
  6 | 				<port id="0">
  7 | 					<dim>1</dim>
  8 | 					<dim>3</dim>
  9 | 					<dim>12</dim>
 10 | 					<dim>12</dim>
 11 | 				</port>
 12 | 			</output>
 13 | 		</layer>
 14 | 		<layer id="1" name="conv1" precision="FP32" type="Convolution">
 15 | 			<data dilations="1,1" group="1" kernel="3,3" output="10" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
 16 | 			<input>
 17 | 				<port id="0">
 18 | 					<dim>1</dim>
 19 | 					<dim>3</dim>
 20 | 					<dim>12</dim>
 21 | 					<dim>12</dim>
 22 | 				</port>
 23 | 			</input>
 24 | 			<output>
 25 | 				<port id="3">
 26 | 					<dim>1</dim>
 27 | 					<dim>10</dim>
 28 | 					<dim>10</dim>
 29 | 					<dim>10</dim>
 30 | 				</port>
 31 | 			</output>
 32 | 			<blobs>
 33 | 				<weights offset="0" size="1080"/>
 34 | 				<biases offset="1080" size="40"/>
 35 | 			</blobs>
 36 | 		</layer>
 37 | 		<layer id="2" name="prelu1" precision="FP32" type="PReLU">
 38 | 			<data channel_shared="0" filler_type="constant" filler_value="0" max="1" mean="0" min="0" sparse="-1" std="0" variance_norm="caffe.FillerParameter.FAN_IN"/>
 39 | 			<input>
 40 | 				<port id="0">
 41 | 					<dim>1</dim>
 42 | 					<dim>10</dim>
 43 | 					<dim>10</dim>
 44 | 					<dim>10</dim>
 45 | 				</port>
 46 | 			</input>
 47 | 			<output>
 48 | 				<port id="2">
 49 | 					<dim>1</dim>
 50 | 					<dim>10</dim>
 51 | 					<dim>10</dim>
 52 | 					<dim>10</dim>
 53 | 				</port>
 54 | 			</output>
 55 | 			<blobs>
 56 | 				<weights offset="1120" size="40"/>
 57 | 			</blobs>
 58 | 		</layer>
 59 | 		<layer id="3" name="pool1" precision="FP32" type="Pooling">
 60 | 			<data exclude-pad="false" kernel="2,2" pads_begin="0,0" pads_end="0,0" pool-method="max" rounding_type="ceil" strides="2,2"/>
 61 | 			<input>
 62 | 				<port id="0">
 63 | 					<dim>1</dim>
 64 | 					<dim>10</dim>
 65 | 					<dim>10</dim>
 66 | 					<dim>10</dim>
 67 | 				</port>
 68 | 			</input>
 69 | 			<output>
 70 | 				<port id="1">
 71 | 					<dim>1</dim>
 72 | 					<dim>10</dim>
 73 | 					<dim>5</dim>
 74 | 					<dim>5</dim>
 75 | 				</port>
 76 | 			</output>
 77 | 		</layer>
 78 | 		<layer id="4" name="conv2" precision="FP32" type="Convolution">
 79 | 			<data dilations="1,1" group="1" kernel="3,3" output="16" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
 80 | 			<input>
 81 | 				<port id="0">
 82 | 					<dim>1</dim>
 83 | 					<dim>10</dim>
 84 | 					<dim>5</dim>
 85 | 					<dim>5</dim>
 86 | 				</port>
 87 | 			</input>
 88 | 			<output>
 89 | 				<port id="3">
 90 | 					<dim>1</dim>
 91 | 					<dim>16</dim>
 92 | 					<dim>3</dim>
 93 | 					<dim>3</dim>
 94 | 				</port>
 95 | 			</output>
 96 | 			<blobs>
 97 | 				<weights offset="1160" size="5760"/>
 98 | 				<biases offset="6920" size="64"/>
 99 | 			</blobs>
100 | 		</layer>
101 | 		<layer id="5" name="prelu2" precision="FP32" type="PReLU">
102 | 			<data channel_shared="0" filler_type="constant" filler_value="0" max="1" mean="0" min="0" sparse="-1" std="0" variance_norm="caffe.FillerParameter.FAN_IN"/>
103 | 			<input>
104 | 				<port id="0">
105 | 					<dim>1</dim>
106 | 					<dim>16</dim>
107 | 					<dim>3</dim>
108 | 					<dim>3</dim>
109 | 				</port>
110 | 			</input>
111 | 			<output>
112 | 				<port id="2">
113 | 					<dim>1</dim>
114 | 					<dim>16</dim>
115 | 					<dim>3</dim>
116 | 					<dim>3</dim>
117 | 				</port>
118 | 			</output>
119 | 			<blobs>
120 | 				<weights offset="6984" size="64"/>
121 | 			</blobs>
122 | 		</layer>
123 | 		<layer id="6" name="conv3" precision="FP32" type="Convolution">
124 | 			<data dilations="1,1" group="1" kernel="3,3" output="32" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
125 | 			<input>
126 | 				<port id="0">
127 | 					<dim>1</dim>
128 | 					<dim>16</dim>
129 | 					<dim>3</dim>
130 | 					<dim>3</dim>
131 | 				</port>
132 | 			</input>
133 | 			<output>
134 | 				<port id="3">
135 | 					<dim>1</dim>
136 | 					<dim>32</dim>
137 | 					<dim>1</dim>
138 | 					<dim>1</dim>
139 | 				</port>
140 | 			</output>
141 | 			<blobs>
142 | 				<weights offset="7048" size="18432"/>
143 | 				<biases offset="25480" size="128"/>
144 | 			</blobs>
145 | 		</layer>
146 | 		<layer id="7" name="prelu3" precision="FP32" type="PReLU">
147 | 			<data channel_shared="0" filler_type="constant" filler_value="0" max="1" mean="0" min="0" sparse="-1" std="0" variance_norm="caffe.FillerParameter.FAN_IN"/>
148 | 			<input>
149 | 				<port id="0">
150 | 					<dim>1</dim>
151 | 					<dim>32</dim>
152 | 					<dim>1</dim>
153 | 					<dim>1</dim>
154 | 				</port>
155 | 			</input>
156 | 			<output>
157 | 				<port id="2">
158 | 					<dim>1</dim>
159 | 					<dim>32</dim>
160 | 					<dim>1</dim>
161 | 					<dim>1</dim>
162 | 				</port>
163 | 			</output>
164 | 			<blobs>
165 | 				<weights offset="25608" size="128"/>
166 | 			</blobs>
167 | 		</layer>
168 | 		<layer id="8" name="conv4_2" precision="FP32" type="Convolution">
169 | 			<data dilations="1,1" group="1" kernel="1,1" output="4" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
170 | 			<input>
171 | 				<port id="0">
172 | 					<dim>1</dim>
173 | 					<dim>32</dim>
174 | 					<dim>1</dim>
175 | 					<dim>1</dim>
176 | 				</port>
177 | 			</input>
178 | 			<output>
179 | 				<port id="3">
180 | 					<dim>1</dim>
181 | 					<dim>4</dim>
182 | 					<dim>1</dim>
183 | 					<dim>1</dim>
184 | 				</port>
185 | 			</output>
186 | 			<blobs>
187 | 				<weights offset="25736" size="512"/>
188 | 				<biases offset="26248" size="16"/>
189 | 			</blobs>
190 | 		</layer>
191 | 		<layer id="9" name="conv4_1" precision="FP32" type="Convolution">
192 | 			<data dilations="1,1" group="1" kernel="1,1" output="2" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
193 | 			<input>
194 | 				<port id="0">
195 | 					<dim>1</dim>
196 | 					<dim>32</dim>
197 | 					<dim>1</dim>
198 | 					<dim>1</dim>
199 | 				</port>
200 | 			</input>
201 | 			<output>
202 | 				<port id="3">
203 | 					<dim>1</dim>
204 | 					<dim>2</dim>
205 | 					<dim>1</dim>
206 | 					<dim>1</dim>
207 | 				</port>
208 | 			</output>
209 | 			<blobs>
210 | 				<weights offset="26264" size="256"/>
211 | 				<biases offset="26520" size="8"/>
212 | 			</blobs>
213 | 		</layer>
214 | 		<layer id="10" name="prob1" precision="FP32" type="SoftMax">
215 | 			<data axis="1"/>
216 | 			<input>
217 | 				<port id="0">
218 | 					<dim>1</dim>
219 | 					<dim>2</dim>
220 | 					<dim>1</dim>
221 | 					<dim>1</dim>
222 | 				</port>
223 | 			</input>
224 | 			<output>
225 | 				<port id="1">
226 | 					<dim>1</dim>
227 | 					<dim>2</dim>
228 | 					<dim>1</dim>
229 | 					<dim>1</dim>
230 | 				</port>
231 | 			</output>
232 | 		</layer>
233 | 	</layers>
234 | 	<edges>
235 | 		<edge from-layer="0" from-port="0" to-layer="1" to-port="0"/>
236 | 		<edge from-layer="1" from-port="3" to-layer="2" to-port="0"/>
237 | 		<edge from-layer="2" from-port="2" to-layer="3" to-port="0"/>
238 | 		<edge from-layer="3" from-port="1" to-layer="4" to-port="0"/>
239 | 		<edge from-layer="4" from-port="3" to-layer="5" to-port="0"/>
240 | 		<edge from-layer="5" from-port="2" to-layer="6" to-port="0"/>
241 | 		<edge from-layer="6" from-port="3" to-layer="7" to-port="0"/>
242 | 		<edge from-layer="7" from-port="2" to-layer="8" to-port="0"/>
243 | 		<edge from-layer="7" from-port="2" to-layer="9" to-port="0"/>
244 | 		<edge from-layer="9" from-port="3" to-layer="10" to-port="0"/>
245 | 	</edges>
246 | 	<meta_data>
247 | 		<MO_version value="2019.2.0-436-gf5827d4"/>
248 | 		<cli_parameters>
249 | 			<blobs_as_inputs value="False"/>
250 | 			<data_type value="float"/>
251 | 			<disable_resnet_optimization value="False"/>
252 | 			<enable_concat_optimization value="False"/>
253 | 			<enable_ssd_gluoncv value="False"/>
254 | 			<extensions value="DIR"/>
255 | 			<framework value="mxnet"/>
256 | 			<freeze_placeholder_with_value value="{}"/>
257 | 			<generate_experimental_IR_V10 value="False"/>
258 | 			<input_model value="DIR/det1-0001.params"/>
259 | 			<input_shape value="[1,3,12,12]"/>
260 | 			<input_symbol value="DIR/det1-symbol.json"/>
261 | 			<keep_quantize_ops_in_IR value="False"/>
262 | 			<keep_shape_ops value="False"/>
263 | 			<legacy_mxnet_model value="False"/>
264 | 			<log_level value="ERROR"/>
265 | 			<mean_scale_values value="{}"/>
266 | 			<mean_values value="()"/>
267 | 			<move_to_preprocess value="False"/>
268 | 			<output_dir value="DIR"/>
269 | 			<placeholder_shapes value="[ 1  3 12 12]"/>
270 | 			<reverse_input_channels value="True"/>
271 | 			<save_params_from_nd value="False"/>
272 | 			<scale_values value="()"/>
273 | 			<silent value="False"/>
274 | 			<version value="False"/>
275 | 			<unset unset_cli_parameters="batch, disable_fusing, disable_gfusing, finegrain_fusing, generate_deprecated_IR_V2, input, model_name, nd_prefix_name, output, pretrained_model_name, scale"/>
276 | 		</cli_parameters>
277 | 	</meta_data>
278 | </net>
279 | 


--------------------------------------------------------------------------------
/inference_services/facedetection/models/det2-0001.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/odundar/face-detection-python/8ef8863d85c4ddd3c67512ff3e48fa4cf7c1d770/inference_services/facedetection/models/det2-0001.bin


--------------------------------------------------------------------------------
/inference_services/facedetection/models/det2-0001.mapping:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" ?>
 2 | <mapping>
 3 | 	<map>
 4 | 		<framework name="prelu3" out_port_id="0"/>
 5 | 		<IR id="8" name="prelu3" out_port_id="2"/>
 6 | 	</map>
 7 | 	<map>
 8 | 		<framework name="prelu4" out_port_id="0"/>
 9 | 		<IR id="10" name="prelu4" out_port_id="2"/>
10 | 	</map>
11 | 	<map>
12 | 		<framework name="conv1" out_port_id="0"/>
13 | 		<IR id="1" name="conv1" out_port_id="3"/>
14 | 	</map>
15 | 	<map>
16 | 		<framework name="data" out_port_id="0"/>
17 | 		<IR id="0" name="data" out_port_id="0"/>
18 | 	</map>
19 | 	<map>
20 | 		<framework name="conv4" out_port_id="0"/>
21 | 		<IR id="9" name="conv4" out_port_id="3"/>
22 | 	</map>
23 | 	<map>
24 | 		<framework name="conv5_1" out_port_id="0"/>
25 | 		<IR id="12" name="conv5_1" out_port_id="3"/>
26 | 	</map>
27 | 	<map>
28 | 		<framework name="prelu1" out_port_id="0"/>
29 | 		<IR id="2" name="prelu1" out_port_id="2"/>
30 | 	</map>
31 | 	<map>
32 | 		<framework name="pool1" out_port_id="0"/>
33 | 		<IR id="3" name="pool1" out_port_id="1"/>
34 | 	</map>
35 | 	<map>
36 | 		<framework name="pool2" out_port_id="0"/>
37 | 		<IR id="6" name="pool2" out_port_id="1"/>
38 | 	</map>
39 | 	<map>
40 | 		<framework name="conv3" out_port_id="0"/>
41 | 		<IR id="7" name="conv3" out_port_id="3"/>
42 | 	</map>
43 | 	<map>
44 | 		<framework name="conv2" out_port_id="0"/>
45 | 		<IR id="4" name="conv2" out_port_id="3"/>
46 | 	</map>
47 | 	<map>
48 | 		<framework name="prob1" out_port_id="0"/>
49 | 		<IR id="13" name="prob1" out_port_id="1"/>
50 | 	</map>
51 | 	<map>
52 | 		<framework name="conv5_2" out_port_id="0"/>
53 | 		<IR id="11" name="conv5_2" out_port_id="3"/>
54 | 	</map>
55 | 	<map>
56 | 		<framework name="prelu2" out_port_id="0"/>
57 | 		<IR id="5" name="prelu2" out_port_id="2"/>
58 | 	</map>
59 | </mapping>
60 | 


--------------------------------------------------------------------------------
/inference_services/facedetection/models/det2-0001.xml:
--------------------------------------------------------------------------------
  1 | <?xml version="1.0" ?>
  2 | <net batch="1" name="det2-0001" version="6">
  3 | 	<layers>
  4 | 		<layer id="0" name="data" precision="FP32" type="Input">
  5 | 			<output>
  6 | 				<port id="0">
  7 | 					<dim>1</dim>
  8 | 					<dim>3</dim>
  9 | 					<dim>24</dim>
 10 | 					<dim>24</dim>
 11 | 				</port>
 12 | 			</output>
 13 | 		</layer>
 14 | 		<layer id="1" name="conv1" precision="FP32" type="Convolution">
 15 | 			<data dilations="1,1" group="1" kernel="3,3" output="28" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
 16 | 			<input>
 17 | 				<port id="0">
 18 | 					<dim>1</dim>
 19 | 					<dim>3</dim>
 20 | 					<dim>24</dim>
 21 | 					<dim>24</dim>
 22 | 				</port>
 23 | 			</input>
 24 | 			<output>
 25 | 				<port id="3">
 26 | 					<dim>1</dim>
 27 | 					<dim>28</dim>
 28 | 					<dim>22</dim>
 29 | 					<dim>22</dim>
 30 | 				</port>
 31 | 			</output>
 32 | 			<blobs>
 33 | 				<weights offset="0" size="3024"/>
 34 | 				<biases offset="3024" size="112"/>
 35 | 			</blobs>
 36 | 		</layer>
 37 | 		<layer id="2" name="prelu1" precision="FP32" type="PReLU">
 38 | 			<data channel_shared="0" filler_type="constant" filler_value="0" max="1" mean="0" min="0" sparse="-1" std="0" variance_norm="caffe.FillerParameter.FAN_IN"/>
 39 | 			<input>
 40 | 				<port id="0">
 41 | 					<dim>1</dim>
 42 | 					<dim>28</dim>
 43 | 					<dim>22</dim>
 44 | 					<dim>22</dim>
 45 | 				</port>
 46 | 			</input>
 47 | 			<output>
 48 | 				<port id="2">
 49 | 					<dim>1</dim>
 50 | 					<dim>28</dim>
 51 | 					<dim>22</dim>
 52 | 					<dim>22</dim>
 53 | 				</port>
 54 | 			</output>
 55 | 			<blobs>
 56 | 				<weights offset="3136" size="112"/>
 57 | 			</blobs>
 58 | 		</layer>
 59 | 		<layer id="3" name="pool1" precision="FP32" type="Pooling">
 60 | 			<data exclude-pad="false" kernel="3,3" pads_begin="0,0" pads_end="0,0" pool-method="max" rounding_type="ceil" strides="2,2"/>
 61 | 			<input>
 62 | 				<port id="0">
 63 | 					<dim>1</dim>
 64 | 					<dim>28</dim>
 65 | 					<dim>22</dim>
 66 | 					<dim>22</dim>
 67 | 				</port>
 68 | 			</input>
 69 | 			<output>
 70 | 				<port id="1">
 71 | 					<dim>1</dim>
 72 | 					<dim>28</dim>
 73 | 					<dim>11</dim>
 74 | 					<dim>11</dim>
 75 | 				</port>
 76 | 			</output>
 77 | 		</layer>
 78 | 		<layer id="4" name="conv2" precision="FP32" type="Convolution">
 79 | 			<data dilations="1,1" group="1" kernel="3,3" output="48" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
 80 | 			<input>
 81 | 				<port id="0">
 82 | 					<dim>1</dim>
 83 | 					<dim>28</dim>
 84 | 					<dim>11</dim>
 85 | 					<dim>11</dim>
 86 | 				</port>
 87 | 			</input>
 88 | 			<output>
 89 | 				<port id="3">
 90 | 					<dim>1</dim>
 91 | 					<dim>48</dim>
 92 | 					<dim>9</dim>
 93 | 					<dim>9</dim>
 94 | 				</port>
 95 | 			</output>
 96 | 			<blobs>
 97 | 				<weights offset="3248" size="48384"/>
 98 | 				<biases offset="51632" size="192"/>
 99 | 			</blobs>
100 | 		</layer>
101 | 		<layer id="5" name="prelu2" precision="FP32" type="PReLU">
102 | 			<data channel_shared="0" filler_type="constant" filler_value="0" max="1" mean="0" min="0" sparse="-1" std="0" variance_norm="caffe.FillerParameter.FAN_IN"/>
103 | 			<input>
104 | 				<port id="0">
105 | 					<dim>1</dim>
106 | 					<dim>48</dim>
107 | 					<dim>9</dim>
108 | 					<dim>9</dim>
109 | 				</port>
110 | 			</input>
111 | 			<output>
112 | 				<port id="2">
113 | 					<dim>1</dim>
114 | 					<dim>48</dim>
115 | 					<dim>9</dim>
116 | 					<dim>9</dim>
117 | 				</port>
118 | 			</output>
119 | 			<blobs>
120 | 				<weights offset="51824" size="192"/>
121 | 			</blobs>
122 | 		</layer>
123 | 		<layer id="6" name="pool2" precision="FP32" type="Pooling">
124 | 			<data exclude-pad="false" kernel="3,3" pads_begin="0,0" pads_end="0,0" pool-method="max" rounding_type="ceil" strides="2,2"/>
125 | 			<input>
126 | 				<port id="0">
127 | 					<dim>1</dim>
128 | 					<dim>48</dim>
129 | 					<dim>9</dim>
130 | 					<dim>9</dim>
131 | 				</port>
132 | 			</input>
133 | 			<output>
134 | 				<port id="1">
135 | 					<dim>1</dim>
136 | 					<dim>48</dim>
137 | 					<dim>4</dim>
138 | 					<dim>4</dim>
139 | 				</port>
140 | 			</output>
141 | 		</layer>
142 | 		<layer id="7" name="conv3" precision="FP32" type="Convolution">
143 | 			<data dilations="1,1" group="1" kernel="2,2" output="64" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
144 | 			<input>
145 | 				<port id="0">
146 | 					<dim>1</dim>
147 | 					<dim>48</dim>
148 | 					<dim>4</dim>
149 | 					<dim>4</dim>
150 | 				</port>
151 | 			</input>
152 | 			<output>
153 | 				<port id="3">
154 | 					<dim>1</dim>
155 | 					<dim>64</dim>
156 | 					<dim>3</dim>
157 | 					<dim>3</dim>
158 | 				</port>
159 | 			</output>
160 | 			<blobs>
161 | 				<weights offset="52016" size="49152"/>
162 | 				<biases offset="101168" size="256"/>
163 | 			</blobs>
164 | 		</layer>
165 | 		<layer id="8" name="prelu3" precision="FP32" type="PReLU">
166 | 			<data channel_shared="0" filler_type="constant" filler_value="0" max="1" mean="0" min="0" sparse="-1" std="0" variance_norm="caffe.FillerParameter.FAN_IN"/>
167 | 			<input>
168 | 				<port id="0">
169 | 					<dim>1</dim>
170 | 					<dim>64</dim>
171 | 					<dim>3</dim>
172 | 					<dim>3</dim>
173 | 				</port>
174 | 			</input>
175 | 			<output>
176 | 				<port id="2">
177 | 					<dim>1</dim>
178 | 					<dim>64</dim>
179 | 					<dim>3</dim>
180 | 					<dim>3</dim>
181 | 				</port>
182 | 			</output>
183 | 			<blobs>
184 | 				<weights offset="101424" size="256"/>
185 | 			</blobs>
186 | 		</layer>
187 | 		<layer id="9" name="conv4" precision="FP32" type="FullyConnected">
188 | 			<data out-size="128"/>
189 | 			<input>
190 | 				<port id="0">
191 | 					<dim>1</dim>
192 | 					<dim>64</dim>
193 | 					<dim>3</dim>
194 | 					<dim>3</dim>
195 | 				</port>
196 | 			</input>
197 | 			<output>
198 | 				<port id="3">
199 | 					<dim>1</dim>
200 | 					<dim>128</dim>
201 | 				</port>
202 | 			</output>
203 | 			<blobs>
204 | 				<weights offset="101680" size="294912"/>
205 | 				<biases offset="396592" size="512"/>
206 | 			</blobs>
207 | 		</layer>
208 | 		<layer id="10" name="prelu4" precision="FP32" type="PReLU">
209 | 			<data channel_shared="0" filler_type="constant" filler_value="0" max="1" mean="0" min="0" sparse="-1" std="0" variance_norm="caffe.FillerParameter.FAN_IN"/>
210 | 			<input>
211 | 				<port id="0">
212 | 					<dim>1</dim>
213 | 					<dim>128</dim>
214 | 				</port>
215 | 			</input>
216 | 			<output>
217 | 				<port id="2">
218 | 					<dim>1</dim>
219 | 					<dim>128</dim>
220 | 				</port>
221 | 			</output>
222 | 			<blobs>
223 | 				<weights offset="397104" size="512"/>
224 | 			</blobs>
225 | 		</layer>
226 | 		<layer id="11" name="conv5_2" precision="FP32" type="FullyConnected">
227 | 			<data out-size="4"/>
228 | 			<input>
229 | 				<port id="0">
230 | 					<dim>1</dim>
231 | 					<dim>128</dim>
232 | 				</port>
233 | 			</input>
234 | 			<output>
235 | 				<port id="3">
236 | 					<dim>1</dim>
237 | 					<dim>4</dim>
238 | 				</port>
239 | 			</output>
240 | 			<blobs>
241 | 				<weights offset="397616" size="2048"/>
242 | 				<biases offset="399664" size="16"/>
243 | 			</blobs>
244 | 		</layer>
245 | 		<layer id="12" name="conv5_1" precision="FP32" type="FullyConnected">
246 | 			<data out-size="2"/>
247 | 			<input>
248 | 				<port id="0">
249 | 					<dim>1</dim>
250 | 					<dim>128</dim>
251 | 				</port>
252 | 			</input>
253 | 			<output>
254 | 				<port id="3">
255 | 					<dim>1</dim>
256 | 					<dim>2</dim>
257 | 				</port>
258 | 			</output>
259 | 			<blobs>
260 | 				<weights offset="399680" size="1024"/>
261 | 				<biases offset="400704" size="8"/>
262 | 			</blobs>
263 | 		</layer>
264 | 		<layer id="13" name="prob1" precision="FP32" type="SoftMax">
265 | 			<data axis="1"/>
266 | 			<input>
267 | 				<port id="0">
268 | 					<dim>1</dim>
269 | 					<dim>2</dim>
270 | 				</port>
271 | 			</input>
272 | 			<output>
273 | 				<port id="1">
274 | 					<dim>1</dim>
275 | 					<dim>2</dim>
276 | 				</port>
277 | 			</output>
278 | 		</layer>
279 | 	</layers>
280 | 	<edges>
281 | 		<edge from-layer="0" from-port="0" to-layer="1" to-port="0"/>
282 | 		<edge from-layer="1" from-port="3" to-layer="2" to-port="0"/>
283 | 		<edge from-layer="2" from-port="2" to-layer="3" to-port="0"/>
284 | 		<edge from-layer="3" from-port="1" to-layer="4" to-port="0"/>
285 | 		<edge from-layer="4" from-port="3" to-layer="5" to-port="0"/>
286 | 		<edge from-layer="5" from-port="2" to-layer="6" to-port="0"/>
287 | 		<edge from-layer="6" from-port="1" to-layer="7" to-port="0"/>
288 | 		<edge from-layer="7" from-port="3" to-layer="8" to-port="0"/>
289 | 		<edge from-layer="8" from-port="2" to-layer="9" to-port="0"/>
290 | 		<edge from-layer="9" from-port="3" to-layer="10" to-port="0"/>
291 | 		<edge from-layer="10" from-port="2" to-layer="11" to-port="0"/>
292 | 		<edge from-layer="10" from-port="2" to-layer="12" to-port="0"/>
293 | 		<edge from-layer="12" from-port="3" to-layer="13" to-port="0"/>
294 | 	</edges>
295 | 	<meta_data>
296 | 		<MO_version value="2019.2.0-436-gf5827d4"/>
297 | 		<cli_parameters>
298 | 			<blobs_as_inputs value="False"/>
299 | 			<data_type value="float"/>
300 | 			<disable_resnet_optimization value="False"/>
301 | 			<enable_concat_optimization value="False"/>
302 | 			<enable_ssd_gluoncv value="False"/>
303 | 			<extensions value="DIR"/>
304 | 			<framework value="mxnet"/>
305 | 			<freeze_placeholder_with_value value="{}"/>
306 | 			<generate_experimental_IR_V10 value="False"/>
307 | 			<input_model value="DIR/det2-0001.params"/>
308 | 			<input_shape value="[1,3,24,24]"/>
309 | 			<input_symbol value="DIR/det2-symbol.json"/>
310 | 			<keep_quantize_ops_in_IR value="False"/>
311 | 			<keep_shape_ops value="False"/>
312 | 			<legacy_mxnet_model value="False"/>
313 | 			<log_level value="ERROR"/>
314 | 			<mean_scale_values value="{}"/>
315 | 			<mean_values value="()"/>
316 | 			<move_to_preprocess value="False"/>
317 | 			<output_dir value="DIR"/>
318 | 			<placeholder_shapes value="[ 1  3 24 24]"/>
319 | 			<reverse_input_channels value="True"/>
320 | 			<save_params_from_nd value="False"/>
321 | 			<scale_values value="()"/>
322 | 			<silent value="False"/>
323 | 			<version value="False"/>
324 | 			<unset unset_cli_parameters="batch, disable_fusing, disable_gfusing, finegrain_fusing, generate_deprecated_IR_V2, input, model_name, nd_prefix_name, output, pretrained_model_name, scale"/>
325 | 		</cli_parameters>
326 | 	</meta_data>
327 | </net>
328 | 


--------------------------------------------------------------------------------
/inference_services/facedetection/models/det3-0001.bin:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/odundar/face-detection-python/8ef8863d85c4ddd3c67512ff3e48fa4cf7c1d770/inference_services/facedetection/models/det3-0001.bin


--------------------------------------------------------------------------------
/inference_services/facedetection/models/det3-0001.mapping:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" ?>
 2 | <mapping>
 3 | 	<map>
 4 | 		<framework name="conv5" out_port_id="0"/>
 5 | 		<IR id="12" name="conv5" out_port_id="3"/>
 6 | 	</map>
 7 | 	<map>
 8 | 		<framework name="prelu5" out_port_id="0"/>
 9 | 		<IR id="13" name="prelu5" out_port_id="2"/>
10 | 	</map>
11 | 	<map>
12 | 		<framework name="prelu2" out_port_id="0"/>
13 | 		<IR id="5" name="prelu2" out_port_id="2"/>
14 | 	</map>
15 | 	<map>
16 | 		<framework name="pool3" out_port_id="0"/>
17 | 		<IR id="9" name="pool3" out_port_id="1"/>
18 | 	</map>
19 | 	<map>
20 | 		<framework name="data" out_port_id="0"/>
21 | 		<IR id="0" name="data" out_port_id="0"/>
22 | 	</map>
23 | 	<map>
24 | 		<framework name="prelu4" out_port_id="0"/>
25 | 		<IR id="11" name="prelu4" out_port_id="2"/>
26 | 	</map>
27 | 	<map>
28 | 		<framework name="conv6_3" out_port_id="0"/>
29 | 		<IR id="15" name="conv6_3" out_port_id="3"/>
30 | 	</map>
31 | 	<map>
32 | 		<framework name="prelu3" out_port_id="0"/>
33 | 		<IR id="8" name="prelu3" out_port_id="2"/>
34 | 	</map>
35 | 	<map>
36 | 		<framework name="conv3" out_port_id="0"/>
37 | 		<IR id="7" name="conv3" out_port_id="3"/>
38 | 	</map>
39 | 	<map>
40 | 		<framework name="pool1" out_port_id="0"/>
41 | 		<IR id="3" name="pool1" out_port_id="1"/>
42 | 	</map>
43 | 	<map>
44 | 		<framework name="conv4" out_port_id="0"/>
45 | 		<IR id="10" name="conv4" out_port_id="3"/>
46 | 	</map>
47 | 	<map>
48 | 		<framework name="prob1" out_port_id="0"/>
49 | 		<IR id="17" name="prob1" out_port_id="1"/>
50 | 	</map>
51 | 	<map>
52 | 		<framework name="pool2" out_port_id="0"/>
53 | 		<IR id="6" name="pool2" out_port_id="1"/>
54 | 	</map>
55 | 	<map>
56 | 		<framework name="conv2" out_port_id="0"/>
57 | 		<IR id="4" name="conv2" out_port_id="3"/>
58 | 	</map>
59 | 	<map>
60 | 		<framework name="conv6_1" out_port_id="0"/>
61 | 		<IR id="16" name="conv6_1" out_port_id="3"/>
62 | 	</map>
63 | 	<map>
64 | 		<framework name="prelu1" out_port_id="0"/>
65 | 		<IR id="2" name="prelu1" out_port_id="2"/>
66 | 	</map>
67 | 	<map>
68 | 		<framework name="conv6_2" out_port_id="0"/>
69 | 		<IR id="14" name="conv6_2" out_port_id="3"/>
70 | 	</map>
71 | 	<map>
72 | 		<framework name="conv1" out_port_id="0"/>
73 | 		<IR id="1" name="conv1" out_port_id="3"/>
74 | 	</map>
75 | </mapping>
76 | 


--------------------------------------------------------------------------------
/inference_services/facedetection/models/det3-0001.xml:
--------------------------------------------------------------------------------
  1 | <?xml version="1.0" ?>
  2 | <net batch="1" name="det3-0001" version="6">
  3 | 	<layers>
  4 | 		<layer id="0" name="data" precision="FP32" type="Input">
  5 | 			<output>
  6 | 				<port id="0">
  7 | 					<dim>1</dim>
  8 | 					<dim>3</dim>
  9 | 					<dim>48</dim>
 10 | 					<dim>48</dim>
 11 | 				</port>
 12 | 			</output>
 13 | 		</layer>
 14 | 		<layer id="1" name="conv1" precision="FP32" type="Convolution">
 15 | 			<data dilations="1,1" group="1" kernel="3,3" output="32" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
 16 | 			<input>
 17 | 				<port id="0">
 18 | 					<dim>1</dim>
 19 | 					<dim>3</dim>
 20 | 					<dim>48</dim>
 21 | 					<dim>48</dim>
 22 | 				</port>
 23 | 			</input>
 24 | 			<output>
 25 | 				<port id="3">
 26 | 					<dim>1</dim>
 27 | 					<dim>32</dim>
 28 | 					<dim>46</dim>
 29 | 					<dim>46</dim>
 30 | 				</port>
 31 | 			</output>
 32 | 			<blobs>
 33 | 				<weights offset="0" size="3456"/>
 34 | 				<biases offset="3456" size="128"/>
 35 | 			</blobs>
 36 | 		</layer>
 37 | 		<layer id="2" name="prelu1" precision="FP32" type="PReLU">
 38 | 			<data channel_shared="0" filler_type="constant" filler_value="0" max="1" mean="0" min="0" sparse="-1" std="0" variance_norm="caffe.FillerParameter.FAN_IN"/>
 39 | 			<input>
 40 | 				<port id="0">
 41 | 					<dim>1</dim>
 42 | 					<dim>32</dim>
 43 | 					<dim>46</dim>
 44 | 					<dim>46</dim>
 45 | 				</port>
 46 | 			</input>
 47 | 			<output>
 48 | 				<port id="2">
 49 | 					<dim>1</dim>
 50 | 					<dim>32</dim>
 51 | 					<dim>46</dim>
 52 | 					<dim>46</dim>
 53 | 				</port>
 54 | 			</output>
 55 | 			<blobs>
 56 | 				<weights offset="3584" size="128"/>
 57 | 			</blobs>
 58 | 		</layer>
 59 | 		<layer id="3" name="pool1" precision="FP32" type="Pooling">
 60 | 			<data exclude-pad="false" kernel="3,3" pads_begin="0,0" pads_end="0,0" pool-method="max" rounding_type="ceil" strides="2,2"/>
 61 | 			<input>
 62 | 				<port id="0">
 63 | 					<dim>1</dim>
 64 | 					<dim>32</dim>
 65 | 					<dim>46</dim>
 66 | 					<dim>46</dim>
 67 | 				</port>
 68 | 			</input>
 69 | 			<output>
 70 | 				<port id="1">
 71 | 					<dim>1</dim>
 72 | 					<dim>32</dim>
 73 | 					<dim>23</dim>
 74 | 					<dim>23</dim>
 75 | 				</port>
 76 | 			</output>
 77 | 		</layer>
 78 | 		<layer id="4" name="conv2" precision="FP32" type="Convolution">
 79 | 			<data dilations="1,1" group="1" kernel="3,3" output="64" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
 80 | 			<input>
 81 | 				<port id="0">
 82 | 					<dim>1</dim>
 83 | 					<dim>32</dim>
 84 | 					<dim>23</dim>
 85 | 					<dim>23</dim>
 86 | 				</port>
 87 | 			</input>
 88 | 			<output>
 89 | 				<port id="3">
 90 | 					<dim>1</dim>
 91 | 					<dim>64</dim>
 92 | 					<dim>21</dim>
 93 | 					<dim>21</dim>
 94 | 				</port>
 95 | 			</output>
 96 | 			<blobs>
 97 | 				<weights offset="3712" size="73728"/>
 98 | 				<biases offset="77440" size="256"/>
 99 | 			</blobs>
100 | 		</layer>
101 | 		<layer id="5" name="prelu2" precision="FP32" type="PReLU">
102 | 			<data channel_shared="0" filler_type="constant" filler_value="0" max="1" mean="0" min="0" sparse="-1" std="0" variance_norm="caffe.FillerParameter.FAN_IN"/>
103 | 			<input>
104 | 				<port id="0">
105 | 					<dim>1</dim>
106 | 					<dim>64</dim>
107 | 					<dim>21</dim>
108 | 					<dim>21</dim>
109 | 				</port>
110 | 			</input>
111 | 			<output>
112 | 				<port id="2">
113 | 					<dim>1</dim>
114 | 					<dim>64</dim>
115 | 					<dim>21</dim>
116 | 					<dim>21</dim>
117 | 				</port>
118 | 			</output>
119 | 			<blobs>
120 | 				<weights offset="77696" size="256"/>
121 | 			</blobs>
122 | 		</layer>
123 | 		<layer id="6" name="pool2" precision="FP32" type="Pooling">
124 | 			<data exclude-pad="false" kernel="3,3" pads_begin="0,0" pads_end="0,0" pool-method="max" rounding_type="ceil" strides="2,2"/>
125 | 			<input>
126 | 				<port id="0">
127 | 					<dim>1</dim>
128 | 					<dim>64</dim>
129 | 					<dim>21</dim>
130 | 					<dim>21</dim>
131 | 				</port>
132 | 			</input>
133 | 			<output>
134 | 				<port id="1">
135 | 					<dim>1</dim>
136 | 					<dim>64</dim>
137 | 					<dim>10</dim>
138 | 					<dim>10</dim>
139 | 				</port>
140 | 			</output>
141 | 		</layer>
142 | 		<layer id="7" name="conv3" precision="FP32" type="Convolution">
143 | 			<data dilations="1,1" group="1" kernel="3,3" output="64" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
144 | 			<input>
145 | 				<port id="0">
146 | 					<dim>1</dim>
147 | 					<dim>64</dim>
148 | 					<dim>10</dim>
149 | 					<dim>10</dim>
150 | 				</port>
151 | 			</input>
152 | 			<output>
153 | 				<port id="3">
154 | 					<dim>1</dim>
155 | 					<dim>64</dim>
156 | 					<dim>8</dim>
157 | 					<dim>8</dim>
158 | 				</port>
159 | 			</output>
160 | 			<blobs>
161 | 				<weights offset="77952" size="147456"/>
162 | 				<biases offset="225408" size="256"/>
163 | 			</blobs>
164 | 		</layer>
165 | 		<layer id="8" name="prelu3" precision="FP32" type="PReLU">
166 | 			<data channel_shared="0" filler_type="constant" filler_value="0" max="1" mean="0" min="0" sparse="-1" std="0" variance_norm="caffe.FillerParameter.FAN_IN"/>
167 | 			<input>
168 | 				<port id="0">
169 | 					<dim>1</dim>
170 | 					<dim>64</dim>
171 | 					<dim>8</dim>
172 | 					<dim>8</dim>
173 | 				</port>
174 | 			</input>
175 | 			<output>
176 | 				<port id="2">
177 | 					<dim>1</dim>
178 | 					<dim>64</dim>
179 | 					<dim>8</dim>
180 | 					<dim>8</dim>
181 | 				</port>
182 | 			</output>
183 | 			<blobs>
184 | 				<weights offset="225664" size="256"/>
185 | 			</blobs>
186 | 		</layer>
187 | 		<layer id="9" name="pool3" precision="FP32" type="Pooling">
188 | 			<data exclude-pad="false" kernel="2,2" pads_begin="0,0" pads_end="0,0" pool-method="max" rounding_type="ceil" strides="2,2"/>
189 | 			<input>
190 | 				<port id="0">
191 | 					<dim>1</dim>
192 | 					<dim>64</dim>
193 | 					<dim>8</dim>
194 | 					<dim>8</dim>
195 | 				</port>
196 | 			</input>
197 | 			<output>
198 | 				<port id="1">
199 | 					<dim>1</dim>
200 | 					<dim>64</dim>
201 | 					<dim>4</dim>
202 | 					<dim>4</dim>
203 | 				</port>
204 | 			</output>
205 | 		</layer>
206 | 		<layer id="10" name="conv4" precision="FP32" type="Convolution">
207 | 			<data dilations="1,1" group="1" kernel="2,2" output="128" pads_begin="0,0" pads_end="0,0" strides="1,1"/>
208 | 			<input>
209 | 				<port id="0">
210 | 					<dim>1</dim>
211 | 					<dim>64</dim>
212 | 					<dim>4</dim>
213 | 					<dim>4</dim>
214 | 				</port>
215 | 			</input>
216 | 			<output>
217 | 				<port id="3">
218 | 					<dim>1</dim>
219 | 					<dim>128</dim>
220 | 					<dim>3</dim>
221 | 					<dim>3</dim>
222 | 				</port>
223 | 			</output>
224 | 			<blobs>
225 | 				<weights offset="225920" size="131072"/>
226 | 				<biases offset="356992" size="512"/>
227 | 			</blobs>
228 | 		</layer>
229 | 		<layer id="11" name="prelu4" precision="FP32" type="PReLU">
230 | 			<data channel_shared="0" filler_type="constant" filler_value="0" max="1" mean="0" min="0" sparse="-1" std="0" variance_norm="caffe.FillerParameter.FAN_IN"/>
231 | 			<input>
232 | 				<port id="0">
233 | 					<dim>1</dim>
234 | 					<dim>128</dim>
235 | 					<dim>3</dim>
236 | 					<dim>3</dim>
237 | 				</port>
238 | 			</input>
239 | 			<output>
240 | 				<port id="2">
241 | 					<dim>1</dim>
242 | 					<dim>128</dim>
243 | 					<dim>3</dim>
244 | 					<dim>3</dim>
245 | 				</port>
246 | 			</output>
247 | 			<blobs>
248 | 				<weights offset="357504" size="512"/>
249 | 			</blobs>
250 | 		</layer>
251 | 		<layer id="12" name="conv5" precision="FP32" type="FullyConnected">
252 | 			<data out-size="256"/>
253 | 			<input>
254 | 				<port id="0">
255 | 					<dim>1</dim>
256 | 					<dim>128</dim>
257 | 					<dim>3</dim>
258 | 					<dim>3</dim>
259 | 				</port>
260 | 			</input>
261 | 			<output>
262 | 				<port id="3">
263 | 					<dim>1</dim>
264 | 					<dim>256</dim>
265 | 				</port>
266 | 			</output>
267 | 			<blobs>
268 | 				<weights offset="358016" size="1179648"/>
269 | 				<biases offset="1537664" size="1024"/>
270 | 			</blobs>
271 | 		</layer>
272 | 		<layer id="13" name="prelu5" precision="FP32" type="PReLU">
273 | 			<data channel_shared="0" filler_type="constant" filler_value="0" max="1" mean="0" min="0" sparse="-1" std="0" variance_norm="caffe.FillerParameter.FAN_IN"/>
274 | 			<input>
275 | 				<port id="0">
276 | 					<dim>1</dim>
277 | 					<dim>256</dim>
278 | 				</port>
279 | 			</input>
280 | 			<output>
281 | 				<port id="2">
282 | 					<dim>1</dim>
283 | 					<dim>256</dim>
284 | 				</port>
285 | 			</output>
286 | 			<blobs>
287 | 				<weights offset="1538688" size="1024"/>
288 | 			</blobs>
289 | 		</layer>
290 | 		<layer id="14" name="conv6_2" precision="FP32" type="FullyConnected">
291 | 			<data out-size="4"/>
292 | 			<input>
293 | 				<port id="0">
294 | 					<dim>1</dim>
295 | 					<dim>256</dim>
296 | 				</port>
297 | 			</input>
298 | 			<output>
299 | 				<port id="3">
300 | 					<dim>1</dim>
301 | 					<dim>4</dim>
302 | 				</port>
303 | 			</output>
304 | 			<blobs>
305 | 				<weights offset="1539712" size="4096"/>
306 | 				<biases offset="1543808" size="16"/>
307 | 			</blobs>
308 | 		</layer>
309 | 		<layer id="15" name="conv6_3" precision="FP32" type="FullyConnected">
310 | 			<data out-size="10"/>
311 | 			<input>
312 | 				<port id="0">
313 | 					<dim>1</dim>
314 | 					<dim>256</dim>
315 | 				</port>
316 | 			</input>
317 | 			<output>
318 | 				<port id="3">
319 | 					<dim>1</dim>
320 | 					<dim>10</dim>
321 | 				</port>
322 | 			</output>
323 | 			<blobs>
324 | 				<weights offset="1543824" size="10240"/>
325 | 				<biases offset="1554064" size="40"/>
326 | 			</blobs>
327 | 		</layer>
328 | 		<layer id="16" name="conv6_1" precision="FP32" type="FullyConnected">
329 | 			<data out-size="2"/>
330 | 			<input>
331 | 				<port id="0">
332 | 					<dim>1</dim>
333 | 					<dim>256</dim>
334 | 				</port>
335 | 			</input>
336 | 			<output>
337 | 				<port id="3">
338 | 					<dim>1</dim>
339 | 					<dim>2</dim>
340 | 				</port>
341 | 			</output>
342 | 			<blobs>
343 | 				<weights offset="1554104" size="2048"/>
344 | 				<biases offset="1556152" size="8"/>
345 | 			</blobs>
346 | 		</layer>
347 | 		<layer id="17" name="prob1" precision="FP32" type="SoftMax">
348 | 			<data axis="1"/>
349 | 			<input>
350 | 				<port id="0">
351 | 					<dim>1</dim>
352 | 					<dim>2</dim>
353 | 				</port>
354 | 			</input>
355 | 			<output>
356 | 				<port id="1">
357 | 					<dim>1</dim>
358 | 					<dim>2</dim>
359 | 				</port>
360 | 			</output>
361 | 		</layer>
362 | 	</layers>
363 | 	<edges>
364 | 		<edge from-layer="0" from-port="0" to-layer="1" to-port="0"/>
365 | 		<edge from-layer="1" from-port="3" to-layer="2" to-port="0"/>
366 | 		<edge from-layer="2" from-port="2" to-layer="3" to-port="0"/>
367 | 		<edge from-layer="3" from-port="1" to-layer="4" to-port="0"/>
368 | 		<edge from-layer="4" from-port="3" to-layer="5" to-port="0"/>
369 | 		<edge from-layer="5" from-port="2" to-layer="6" to-port="0"/>
370 | 		<edge from-layer="6" from-port="1" to-layer="7" to-port="0"/>
371 | 		<edge from-layer="7" from-port="3" to-layer="8" to-port="0"/>
372 | 		<edge from-layer="8" from-port="2" to-layer="9" to-port="0"/>
373 | 		<edge from-layer="9" from-port="1" to-layer="10" to-port="0"/>
374 | 		<edge from-layer="10" from-port="3" to-layer="11" to-port="0"/>
375 | 		<edge from-layer="11" from-port="2" to-layer="12" to-port="0"/>
376 | 		<edge from-layer="12" from-port="3" to-layer="13" to-port="0"/>
377 | 		<edge from-layer="13" from-port="2" to-layer="14" to-port="0"/>
378 | 		<edge from-layer="13" from-port="2" to-layer="15" to-port="0"/>
379 | 		<edge from-layer="13" from-port="2" to-layer="16" to-port="0"/>
380 | 		<edge from-layer="16" from-port="3" to-layer="17" to-port="0"/>
381 | 	</edges>
382 | 	<meta_data>
383 | 		<MO_version value="2019.2.0-436-gf5827d4"/>
384 | 		<cli_parameters>
385 | 			<blobs_as_inputs value="False"/>
386 | 			<data_type value="float"/>
387 | 			<disable_resnet_optimization value="False"/>
388 | 			<enable_concat_optimization value="False"/>
389 | 			<enable_ssd_gluoncv value="False"/>
390 | 			<extensions value="DIR"/>
391 | 			<framework value="mxnet"/>
392 | 			<freeze_placeholder_with_value value="{}"/>
393 | 			<generate_experimental_IR_V10 value="False"/>
394 | 			<input_model value="DIR/det3-0001.params"/>
395 | 			<input_shape value="[1,3,48,48]"/>
396 | 			<input_symbol value="DIR/det3-symbol.json"/>
397 | 			<keep_quantize_ops_in_IR value="False"/>
398 | 			<keep_shape_ops value="False"/>
399 | 			<legacy_mxnet_model value="False"/>
400 | 			<log_level value="ERROR"/>
401 | 			<mean_scale_values value="{}"/>
402 | 			<mean_values value="()"/>
403 | 			<move_to_preprocess value="False"/>
404 | 			<output_dir value="DIR"/>
405 | 			<placeholder_shapes value="[ 1  3 48 48]"/>
406 | 			<reverse_input_channels value="True"/>
407 | 			<save_params_from_nd value="False"/>
408 | 			<scale_values value="()"/>
409 | 			<silent value="False"/>
410 | 			<version value="False"/>
411 | 			<unset unset_cli_parameters="batch, disable_fusing, disable_gfusing, finegrain_fusing, generate_deprecated_IR_V2, input, model_name, nd_prefix_name, output, pretrained_model_name, scale"/>
412 | 		</cli_parameters>
413 | 	</meta_data>
414 | </net>
415 | 


--------------------------------------------------------------------------------
/inference_services/facedetection/requirements.txt:
--------------------------------------------------------------------------------
1 | Flask>=1.1
2 | opencv-python
3 | pillow


--------------------------------------------------------------------------------
/inference_services/facedetection/utils/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/odundar/face-detection-python/8ef8863d85c4ddd3c67512ff3e48fa4cf7c1d770/inference_services/facedetection/utils/__init__.py


--------------------------------------------------------------------------------
/inference_services/facedetection/utils/image_utils.py:
--------------------------------------------------------------------------------
  1 | # MIT License
  2 | #
  3 | # Copyright (c) 2019 Onur Dundar onur.dundar1@gmail.com
  4 | #
  5 | # Permission is hereby granted, free of charge, to any person obtaining a copy
  6 | # of this software and associated documentation files (the "Software"), to deal
  7 | # in the Software without restriction, including without limitation the rights
  8 | # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  9 | # copies of the Software, and to permit persons to whom the Software is
 10 | # furnished to do so, subject to the following conditions:
 11 | #
 12 | # The above copyright notice and this permission notice shall be included in all
 13 | # copies or substantial portions of the Software.
 14 | #
 15 | # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 16 | # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 17 | # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 18 | # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 19 | # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 20 | # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 21 | # SOFTWARE.
 22 | 
 23 | import cv2 as cv
 24 | import numpy as np
 25 | 
 26 | 
 27 | class ImageUtil(object):
 28 |     @staticmethod
 29 |     def crop_frame(frame, coordinate, normalized=True):
 30 |         """
 31 |         Crop Frame
 32 |         :param frame: cv mat object
 33 |         :param coordinate: x,y coordinates [xmin, ymin, xmax, ymax]
 34 |         :param normalized: if values normalized
 35 |         :return:
 36 |         """
 37 | 
 38 |         x1 = coordinate[0]
 39 |         y1 = coordinate[1]
 40 |         x2 = coordinate[2]
 41 |         y2 = coordinate[3]
 42 | 
 43 |         if normalized:
 44 |             h = frame.shape[0]
 45 |             w = frame.shape[1]
 46 | 
 47 |             x1 = int(x1 * w)
 48 |             x2 = int(x2 * w)
 49 | 
 50 |             y1 = int(y1 * h)
 51 |             y2 = int(y2 * h)
 52 | 
 53 |         return frame[y1:y2, x1:x2]
 54 | 
 55 |     @staticmethod
 56 |     def draw_text(frame, text, coordinate, line_color=(0, 255, 124), normalized=True):
 57 |         """
 58 |         Draw text with cv.puttext method
 59 |         :param frame: cv mat object
 60 |         :param coordinate: x,y coordinates [xmin, ymin, xmax, ymax]
 61 |         :param normalized: if values normalized
 62 |         :param text: Text to write on image
 63 |         :param line_color: color of text
 64 |         :return:
 65 |         """
 66 | 
 67 |         x1 = coordinate[0]
 68 |         y1 = coordinate[1]
 69 |         x2 = coordinate[2]
 70 |         y2 = coordinate[3]
 71 | 
 72 |         if normalized:
 73 |             h = frame.shape[0]
 74 |             w = frame.shape[1]
 75 | 
 76 |             x1 = int(x1 * w)
 77 |             x2 = int(x2 * w)
 78 | 
 79 |             y1 = int(y1 * h)
 80 |             y2 = int(y2 * h)
 81 | 
 82 |         font = cv.FONT_HERSHEY_SIMPLEX
 83 |         bottom_left_corner_of_text = (x2, y1 + 10)
 84 |         font_scale = 0.4
 85 |         font_color = line_color
 86 |         line_type = 1
 87 | 
 88 |         cv.putText(frame,
 89 |                    text,
 90 |                    bottom_left_corner_of_text,
 91 |                    font,
 92 |                    font_scale,
 93 |                    font_color,
 94 |                    line_type)
 95 | 
 96 |     @staticmethod
 97 |     def draw_rectangles(frame, coordinates, line_color=(0, 255, 124), normalized=True):
 98 |         """
 99 |         Draw Rectangles with given Normalized
100 |         :param frame: cv mat object
101 |         :param coordinates: x,y coordinates [xmin, ymin, xmax, ymax]
102 |         :param normalized: if values normalized
103 |         :param line_color: color of rectangle
104 |         :return:
105 |         """
106 |         for coordinate in coordinates:
107 |             x1 = coordinate[0]
108 |             y1 = coordinate[1]
109 |             x2 = coordinate[2]
110 |             y2 = coordinate[3]
111 | 
112 |             if normalized:
113 |                 h = frame.shape[0]
114 |                 w = frame.shape[1]
115 | 
116 |                 x1 = int(x1 * w)
117 |                 x2 = int(x2 * w)
118 | 
119 |                 y1 = int(y1 * h)
120 |                 y2 = int(y2 * h)
121 | 
122 |             cv.rectangle(frame, (x1, y1), (x2, y2), line_color, 2)
123 | 
124 |     @staticmethod
125 |     def draw_rectangle(frame, coordinate, line_color=(0, 255, 124), normalized=True):
126 |         """
127 |         Draw Rectangle with given Normalized
128 |         :param frame: cv mat object
129 |         :param coordinate: x,y coordinates [xmin, ymin, xmax, ymax]
130 |         :param normalized: if values normalized
131 |         :param line_color: color of rectangle
132 |         :return:
133 |         """
134 | 
135 |         x1 = coordinate[0]
136 |         y1 = coordinate[1]
137 |         x2 = coordinate[2]
138 |         y2 = coordinate[3]
139 | 
140 |         if normalized:
141 |             h = frame.shape[0]
142 |             w = frame.shape[1]
143 | 
144 |             x1 = int(x1 * w)
145 |             x2 = int(x2 * w)
146 | 
147 |             y1 = int(y1 * h)
148 |             y2 = int(y2 * h)
149 | 
150 |         cv.rectangle(frame, (x1, y1), (x2, y2), line_color, 2)
151 | 
152 |     @staticmethod
153 |     def draw_ellipse(frame, coordinate, line_color=(124, 0, 0), radius=1, normalized=True):
154 |         """
155 |         Draw Circle with given values
156 |         :param frame: cv mat object
157 |         :param coordinate: x,y coordinates [xmin, ymin, xmax, ymax]
158 |         :param normalized: if values normalized
159 |         :param line_color: color of rectangle
160 |         :param radius: radius of circle
161 |         :return:
162 |         """
163 | 
164 |         x1 = coordinate[0]
165 |         y1 = coordinate[1]
166 | 
167 |         if normalized:
168 |             h = frame.shape[0]
169 |             w = frame.shape[1]
170 | 
171 |             x1 = int(x1 * w)
172 |             y1 = int(y1 * h)
173 | 
174 |         cv.circle(frame, (x1, y1), radius=radius, color=line_color, thickness=1)
175 | 


--------------------------------------------------------------------------------
/inference_services/flask_hello_world/Dockerfile:
--------------------------------------------------------------------------------
 1 | FROM ubuntu:18.04
 2 | 
 3 | MAINTAINER ONUR DUNDAR "onur.dundar1@gmail.com"
 4 | 
 5 | RUN apt-get update -y && \
 6 |     apt-get install -y python3-pip python3-dev
 7 | 
 8 | COPY ./requirements.txt /app/requirements.txt
 9 | 
10 | WORKDIR /app
11 | 
12 | RUN pip3 install -r requirements.txt
13 | 
14 | COPY flask_app.py /app/
15 | 
16 | EXPOSE 8000
17 | 
18 | CMD ["python3", "/app/flask_app.py", "-p 8000"]


--------------------------------------------------------------------------------
/inference_services/flask_hello_world/README.md:
--------------------------------------------------------------------------------
 1 | # A Basic Flask App
 2 | 
 3 | ```bash
 4 | docker build -t flask-tutorial:latest .
 5 | 
 6 | docker run -d -p 8000:8000 flask-tutorial
 7 | ```
 8 | 
 9 | 
10 | 
11 | 
12 | 
13 | 
14 | 


--------------------------------------------------------------------------------
/inference_services/flask_hello_world/flask_app.py:
--------------------------------------------------------------------------------
 1 | # MIT License
 2 | #
 3 | # Copyright (c) 2019 Onur Dundar onur.dundar1@gmail.com
 4 | #
 5 | # Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | # of this software and associated documentation files (the "Software"), to deal
 7 | # in the Software without restriction, including without limitation the rights
 8 | # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | # copies of the Software, and to permit persons to whom the Software is
10 | # furnished to do so, subject to the following conditions:
11 | #
12 | # The above copyright notice and this permission notice shall be included in all
13 | # copies or substantial portions of the Software.
14 | #
15 | # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | # SOFTWARE.
22 | 
23 | from flask import Flask
24 | import sys
25 | import optparse
26 | import time
27 | 
28 | app = Flask(__name__)
29 | 
30 | start = int(round(time.time()))
31 | 
32 | 
33 | @app.route("/")
34 | def hello_world():
35 |     return "Hello Flask"
36 | 
37 | 
38 | if __name__ == '__main__':
39 |     parser = optparse.OptionParser(usage="python simpleapp.py -p ")
40 |     parser.add_option('-p', '--port', action='store', dest='port', help='The port to listen on.')
41 |     (args, _) = parser.parse_args()
42 |     if args.port == None:
43 |         print("Missing required argument: -p/--port")
44 |         sys.exit(1)
45 |     app.run(host='0.0.0.0', port=int(args.port), debug=False)


--------------------------------------------------------------------------------
/inference_services/flask_hello_world/requirements.txt:
--------------------------------------------------------------------------------
1 | Flask>=1.1


--------------------------------------------------------------------------------
/models/README.md:
--------------------------------------------------------------------------------
 1 | # Deep Learning Models
 2 | 
 3 | In this face detection applications, I used models from Intel's Open Model Zoo and from `deepinsight` github repository.
 4 | 
 5 | ## Open Model Zoo Face & Age-Gender Detection Models
 6 | 
 7 | There are numerous PoC type of DL models by intel in the following repository:
 8 | 
 9 | https://github.com/opencv/open_model_zoo
10 | 
11 | I have used face detection and age-gender detection models respectively:
12 | 
13 | - https://github.com/opencv/open_model_zoo/tree/master/intel_models/face-detection-retail-0004
14 | - https://github.com/opencv/open_model_zoo/tree/master/intel_models/age-gender-recognition-retail-0013
15 | 
16 | These models can be downloaded by OpenVINO(TM) Toolkit model downloader using below commands:
17 | 
18 | ```bash
19 | python3 /opt/intel/openvino/deployment_tools/tools/model_downloader/downloader.py --name age-gender-recognition-retail-0013 --output_dir openvino_models/
20 | python3 /opt/intel/openvino/deployment_tools/tools/model_downloader/downloader.py --name face-detection-retail-0004 --output_dir openvino_models/
21 | ```
22 | 
23 | You can use the models from their downloaded directory. Each has FP16 version as well. They are ready to be used with Inference Engine no extra work required.
24 | 
25 | Please also check the descriptions from the `description/face-detection-retail-0004.md` file to understand their input and outputs.
26 | 
27 | ## MTCNN Face & Age-Gender Detection Models
28 | 
29 | ### Face Detection Model
30 | 
31 | Source of Face Detection Model:
32 | 
33 | - https://github.com/YYuanAnyVision/mxnet_mtcnn_face_detection
34 | 
35 | Get Models and convert them using Model Optimizer.
36 | 
37 | Models are being trained using MxNet* framework therefore we will check guidance for conversion from MxNet conversion guideline:
38 | 
39 | - https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_convert_model_Convert_Model_From_MxNet.html
40 | 
41 | ```bash
42 | git clone https://github.com/YYuanAnyVision/mxnet_mtcnn_face_detection.git
43 | 
44 | python3 /opt/intel/openvino/deployment_tools/model_optimizer/mo_mxnet.py --input_model mxnet_mtcnn_face_detection/model/det1-0001.params --input_symbol mxnet_mtcnn_face_detection/model/det1-symbol.json --input_shape [1,3,12,12] --output_dir FP32/ --reverse_input_channels
45 | 
46 | python3 /opt/intel/openvino/deployment_tools/model_optimizer/mo_mxnet.py --input_model mxnet_mtcnn_face_detection/model/det2-0001.params --input_symbol mxnet_mtcnn_face_detection/model/det2-symbol.json --input_shape [1,3,24,24] --output_dir FP32/ --reverse_input_channels
47 | 
48 | python3 /opt/intel/openvino/deployment_tools/model_optimizer/mo_mxnet.py --input_model mxnet_mtcnn_face_detection/model/det3-0001.params --input_symbol mxnet_mtcnn_face_detection/model/det3-symbol.json --input_shape [1,3,48,48] --output_dir FP32/ --reverse_input_channels
49 | ```
50 | 
51 | You can also change FP32 to FP16 and make other corrections. 
52 | 
53 | ### Age Gender Model
54 | 
55 | - https://github.com/deepinsight/insightface/tree/master/gender-age
56 | 
57 | Pre-trained Model URL:
58 | 
59 | https://www.dropbox.com/s/2xq8mcao6z14e3u/gamodel-r50.zip?dl=0
60 | 
61 | You can convert models using Model Optimizer to make them ready to be used with OpenVINO(TM)
62 | 
63 | Deepinsight models are being trained using MxNet* framework therefore we will check guidance for conversion from MxNet conversion guideline:
64 | 
65 | - https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_convert_model_Convert_Model_From_MxNet.html
66 | 
67 | ```bash
68 | unzip gamodel-r50.zip
69 | 
70 | cd gamodel-r50
71 | 
72 | python3 /opt/intel/openvino/deployment_tools/model_optimizer/mo_mxnet.py --input_model model-0000.params --input_shape [1,3,112,112] --output_dir FP32 --data_type FP32 --scale 0.0399 --mean_values [127.5,127.5,127.5]
73 | ```
74 | 
75 | Important part here is the --input_shape, --mean_values and --scale parameters, you should investigate what they should be from the model descriptions page. Otherwise you will get faulty output.
76 | 
77 | # Important Notes for Model Conversion
78 | 
79 | Important factor while converting models to IR representations is that, all layers should be supported by Intel(R) Disribution of OpenVINO(TM) Model Optimizer otherwise certain errors will be occured.
80 | 
81 | If layers not supported, you should follow some additional development process and extend OpenVINO(TM) Toolkit Model Optimizer and add layer primitive implementation to use it in the runtime.
82 | 
83 | Many of the layer implementations are supported for MxNet*, Tensorflow*, Caffe*, ONNX* and Kaldi* 
84 | 
85 | Below are the guidelines to follow from documentation to learn about the model conversion process.
86 | 
87 | - Here is the general guideline for conversion process:
88 | 
89 |     - https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_Prepare_Trained_Model.html
90 |     - https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_convert_model_Converting_Model_General.html
91 | 
92 | - Here you can find the list of supported layers for each framework:
93 | 
94 |     - https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_Supported_Frameworks_Layers.html
95 | 
96 | If there are custom layers being used you need to add those layers with using defined steps in OpenVINO(TM) Toolkit documentation.
97 | 
98 | - Adding Custom Layers: https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_customize_model_optimizer_Customize_Model_Optimizer.html


--------------------------------------------------------------------------------
/utils/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/odundar/face-detection-python/8ef8863d85c4ddd3c67512ff3e48fa4cf7c1d770/utils/__init__.py


--------------------------------------------------------------------------------
/utils/image_utils.py:
--------------------------------------------------------------------------------
  1 | # MIT License
  2 | #
  3 | # Copyright (c) 2019 Onur Dundar onur.dundar1@gmail.com
  4 | #
  5 | # Permission is hereby granted, free of charge, to any person obtaining a copy
  6 | # of this software and associated documentation files (the "Software"), to deal
  7 | # in the Software without restriction, including without limitation the rights
  8 | # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  9 | # copies of the Software, and to permit persons to whom the Software is
 10 | # furnished to do so, subject to the following conditions:
 11 | #
 12 | # The above copyright notice and this permission notice shall be included in all
 13 | # copies or substantial portions of the Software.
 14 | #
 15 | # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 16 | # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 17 | # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 18 | # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 19 | # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 20 | # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 21 | # SOFTWARE.
 22 | 
 23 | import cv2 as cv
 24 | import numpy as np
 25 | 
 26 | 
 27 | class ImageUtil(object):
 28 |     @staticmethod
 29 |     def crop_frame(frame, coordinate, normalized=True):
 30 |         """
 31 |         Crop Frame
 32 |         :param frame: cv mat object
 33 |         :param coordinate: x,y coordinates [xmin, ymin, xmax, ymax]
 34 |         :param normalized: if values normalized
 35 |         :return:
 36 |         """
 37 | 
 38 |         x1 = coordinate[0]
 39 |         y1 = coordinate[1]
 40 |         x2 = coordinate[2]
 41 |         y2 = coordinate[3]
 42 | 
 43 |         if normalized:
 44 |             h = frame.shape[0]
 45 |             w = frame.shape[1]
 46 | 
 47 |             x1 = int(x1 * w)
 48 |             x2 = int(x2 * w)
 49 | 
 50 |             y1 = int(y1 * h)
 51 |             y2 = int(y2 * h)
 52 | 
 53 |         return frame[y1:y2, x1:x2]
 54 | 
 55 |     @staticmethod
 56 |     def draw_text(frame, text, coordinate, line_color=(0, 255, 124), normalized=True):
 57 |         """
 58 |         Draw text with cv.puttext method
 59 |         :param frame: cv mat object
 60 |         :param coordinate: x,y coordinates [xmin, ymin, xmax, ymax]
 61 |         :param normalized: if values normalized
 62 |         :param text: Text to write on image
 63 |         :param line_color: color of text
 64 |         :return:
 65 |         """
 66 | 
 67 |         x1 = coordinate[0]
 68 |         y1 = coordinate[1]
 69 |         x2 = coordinate[2]
 70 |         y2 = coordinate[3]
 71 | 
 72 |         if normalized:
 73 |             h = frame.shape[0]
 74 |             w = frame.shape[1]
 75 | 
 76 |             x1 = int(x1 * w)
 77 |             x2 = int(x2 * w)
 78 | 
 79 |             y1 = int(y1 * h)
 80 |             y2 = int(y2 * h)
 81 | 
 82 |         font = cv.FONT_HERSHEY_SIMPLEX
 83 |         bottom_left_corner_of_text = (x2, y1 + 10)
 84 |         font_scale = 0.4
 85 |         font_color = line_color
 86 |         line_type = 1
 87 | 
 88 |         cv.putText(frame,
 89 |                    text,
 90 |                    bottom_left_corner_of_text,
 91 |                    font,
 92 |                    font_scale,
 93 |                    font_color,
 94 |                    line_type)
 95 | 
 96 |     @staticmethod
 97 |     def draw_rectangles(frame, coordinates, line_color=(0, 255, 124), normalized=True):
 98 |         """
 99 |         Draw Rectangles with given Normalized
100 |         :param frame: cv mat object
101 |         :param coordinates: x,y coordinates [xmin, ymin, xmax, ymax]
102 |         :param normalized: if values normalized
103 |         :param line_color: color of rectangle
104 |         :return:
105 |         """
106 |         for coordinate in coordinates:
107 |             x1 = coordinate[0]
108 |             y1 = coordinate[1]
109 |             x2 = coordinate[2]
110 |             y2 = coordinate[3]
111 | 
112 |             if normalized:
113 |                 h = frame.shape[0]
114 |                 w = frame.shape[1]
115 | 
116 |                 x1 = int(x1 * w)
117 |                 x2 = int(x2 * w)
118 | 
119 |                 y1 = int(y1 * h)
120 |                 y2 = int(y2 * h)
121 | 
122 |             cv.rectangle(frame, (x1, y1), (x2, y2), line_color, 2)
123 | 
124 |     @staticmethod
125 |     def draw_rectangle(frame, coordinate, line_color=(0, 255, 124), normalized=True):
126 |         """
127 |         Draw Rectangle with given Normalized
128 |         :param frame: cv mat object
129 |         :param coordinate: x,y coordinates [xmin, ymin, xmax, ymax]
130 |         :param normalized: if values normalized
131 |         :param line_color: color of rectangle
132 |         :return:
133 |         """
134 | 
135 |         x1 = coordinate[0]
136 |         y1 = coordinate[1]
137 |         x2 = coordinate[2]
138 |         y2 = coordinate[3]
139 | 
140 |         if normalized:
141 |             h = frame.shape[0]
142 |             w = frame.shape[1]
143 | 
144 |             x1 = int(x1 * w)
145 |             x2 = int(x2 * w)
146 | 
147 |             y1 = int(y1 * h)
148 |             y2 = int(y2 * h)
149 | 
150 |         cv.rectangle(frame, (x1, y1), (x2, y2), line_color, 2)
151 | 
152 |     @staticmethod
153 |     def draw_ellipse(frame, coordinate, line_color=(124, 0, 0), radius=1, normalized=True):
154 |         """
155 |         Draw Circle with given values
156 |         :param frame: cv mat object
157 |         :param coordinate: x,y coordinates [xmin, ymin, xmax, ymax]
158 |         :param normalized: if values normalized
159 |         :param line_color: color of rectangle
160 |         :param radius: radius of circle
161 |         :return:
162 |         """
163 | 
164 |         x1 = coordinate[0]
165 |         y1 = coordinate[1]
166 | 
167 |         if normalized:
168 |             h = frame.shape[0]
169 |             w = frame.shape[1]
170 | 
171 |             x1 = int(x1 * w)
172 |             y1 = int(y1 * h)
173 | 
174 |         cv.circle(frame, (x1, y1), radius=radius, color=line_color, thickness=1)
175 | 


--------------------------------------------------------------------------------