├── 001.jpg ├── 002.jpg ├── LICENSE ├── README.md ├── annotations ├── creat_name.py ├── label_map_person.pbtxt └── trainval_person.txt ├── creat_name.py ├── embedded_ssd_mobilenet_v1_coco.config ├── label_map_person.pbtxt ├── object_detection ├── CONTRIBUTING.md ├── __init__.py ├── anchor_generators │ ├── __init__.py │ ├── grid_anchor_generator.py │ ├── grid_anchor_generator_test.py │ ├── multiple_grid_anchor_generator.py │ ├── multiple_grid_anchor_generator_test.py │ ├── multiscale_grid_anchor_generator.py │ └── multiscale_grid_anchor_generator_test.py ├── box_coders │ ├── __init__.py │ ├── faster_rcnn_box_coder.py │ ├── faster_rcnn_box_coder_test.py │ ├── keypoint_box_coder.py │ ├── keypoint_box_coder_test.py │ ├── mean_stddev_box_coder.py │ ├── mean_stddev_box_coder_test.py │ ├── square_box_coder.py │ └── square_box_coder_test.py ├── builders │ ├── __init__.py │ ├── anchor_generator_builder.py │ ├── anchor_generator_builder_test.py │ ├── box_coder_builder.py │ ├── box_coder_builder_test.py │ ├── box_predictor_builder.py │ ├── box_predictor_builder_test.py │ ├── dataset_builder.py │ ├── dataset_builder_test.py │ ├── graph_rewriter_builder.py │ ├── graph_rewriter_builder_test.py │ ├── hyperparams_builder.py │ ├── hyperparams_builder_test.py │ ├── image_resizer_builder.py │ ├── image_resizer_builder_test.py │ ├── input_reader_builder.py │ ├── input_reader_builder_test.py │ ├── losses_builder.py │ ├── losses_builder_test.py │ ├── matcher_builder.py │ ├── matcher_builder_test.py │ ├── model_builder.py │ ├── model_builder_test.py │ ├── optimizer_builder.py │ ├── optimizer_builder_test.py │ ├── post_processing_builder.py │ ├── post_processing_builder_test.py │ ├── preprocessor_builder.py │ ├── preprocessor_builder_test.py │ ├── region_similarity_calculator_builder.py │ └── region_similarity_calculator_builder_test.py ├── core │ ├── __init__.py │ ├── anchor_generator.py │ ├── balanced_positive_negative_sampler.py │ ├── balanced_positive_negative_sampler_test.py │ ├── batcher.py │ ├── batcher_test.py │ ├── box_coder.py │ ├── box_coder_test.py │ ├── box_list.py │ ├── box_list_ops.py │ ├── box_list_ops_test.py │ ├── box_list_test.py │ ├── box_predictor.py │ ├── data_decoder.py │ ├── data_parser.py │ ├── freezable_batch_norm.py │ ├── freezable_batch_norm_test.py │ ├── keypoint_ops.py │ ├── keypoint_ops_test.py │ ├── losses.py │ ├── losses_test.py │ ├── matcher.py │ ├── matcher_test.py │ ├── minibatch_sampler.py │ ├── minibatch_sampler_test.py │ ├── model.py │ ├── post_processing.py │ ├── post_processing_test.py │ ├── prefetcher.py │ ├── prefetcher_test.py │ ├── preprocessor.py │ ├── preprocessor_cache.py │ ├── preprocessor_test.py │ ├── region_similarity_calculator.py │ ├── region_similarity_calculator_test.py │ ├── standard_fields.py │ ├── target_assigner.py │ └── target_assigner_test.py ├── create_tf_record.py ├── data_decoders │ ├── __init__.py │ ├── tf_example_decoder.py │ └── tf_example_decoder_test.py ├── dataset_tools │ ├── __init__.py │ ├── create_coco_tf_record.py │ ├── create_coco_tf_record_test.py │ ├── create_kitti_tf_record.py │ ├── create_kitti_tf_record_test.py │ ├── create_oid_tf_record.py │ ├── create_pascal_tf_record.py │ ├── create_pascal_tf_record_test.py │ ├── create_pet_tf_record.py │ ├── create_pycocotools_package.sh │ ├── download_and_preprocess_mscoco.sh │ ├── oid_hierarchical_labels_expansion.py │ ├── oid_hierarchical_labels_expansion_test.py │ ├── oid_tfrecord_creation.py │ ├── oid_tfrecord_creation_test.py │ ├── tf_record_creation_util.py │ └── 
tf_record_creation_util_test.py ├── dockerfiles │ └── android │ │ ├── Dockerfile │ │ └── README.md ├── eval_util.py ├── eval_util_test.py ├── export_inference_graph.py ├── export_inference_graph.sh ├── export_tflite_ssd_graph.py ├── export_tflite_ssd_graph_lib.py ├── export_tflite_ssd_graph_lib_test.py ├── exporter.py ├── exporter_test.py ├── inference │ ├── __init__.py │ ├── detection_inference.py │ ├── detection_inference_test.py │ └── infer_detections.py ├── inputs.py ├── inputs_test.py ├── legacy │ ├── __init__.py │ ├── eval.py │ ├── evaluator.py │ ├── train.py │ ├── trainer.py │ └── trainer_test.py ├── matchers │ ├── __init__.py │ ├── argmax_matcher.py │ ├── argmax_matcher_test.py │ ├── bipartite_matcher.py │ └── bipartite_matcher_test.py ├── meta_architectures │ ├── __init__.py │ ├── faster_rcnn_meta_arch.py │ ├── faster_rcnn_meta_arch_test.py │ ├── faster_rcnn_meta_arch_test_lib.py │ ├── rfcn_meta_arch.py │ ├── rfcn_meta_arch_test.py │ ├── ssd_meta_arch.py │ └── ssd_meta_arch_test.py ├── metrics │ ├── __init__.py │ ├── coco_evaluation.py │ ├── coco_evaluation_test.py │ ├── coco_tools.py │ ├── coco_tools_test.py │ ├── io_utils.py │ ├── offline_eval_map_corloc.py │ ├── offline_eval_map_corloc_test.py │ ├── oid_od_challenge_evaluation.py │ ├── oid_od_challenge_evaluation_utils.py │ ├── oid_od_challenge_evaluation_utils_test.py │ ├── oid_vrd_challenge_evaluation.py │ ├── oid_vrd_challenge_evaluation_utils.py │ ├── oid_vrd_challenge_evaluation_utils_test.py │ ├── tf_example_parser.py │ └── tf_example_parser_test.py ├── model_hparams.py ├── model_lib.py ├── model_lib_test.py ├── model_main.py ├── model_tpu_main.py ├── models │ ├── __init__.py │ ├── embedded_ssd_mobilenet_v1_feature_extractor.py │ ├── embedded_ssd_mobilenet_v1_feature_extractor_test.py │ ├── faster_rcnn_inception_resnet_v2_feature_extractor.py │ ├── faster_rcnn_inception_resnet_v2_feature_extractor_test.py │ ├── faster_rcnn_inception_v2_feature_extractor.py │ ├── faster_rcnn_inception_v2_feature_extractor_test.py │ ├── faster_rcnn_mobilenet_v1_feature_extractor.py │ ├── faster_rcnn_mobilenet_v1_feature_extractor_test.py │ ├── faster_rcnn_nas_feature_extractor.py │ ├── faster_rcnn_nas_feature_extractor_test.py │ ├── faster_rcnn_pnas_feature_extractor.py │ ├── faster_rcnn_pnas_feature_extractor_test.py │ ├── faster_rcnn_resnet_v1_feature_extractor.py │ ├── faster_rcnn_resnet_v1_feature_extractor_test.py │ ├── feature_map_generators.py │ ├── feature_map_generators_test.py │ ├── ssd_feature_extractor_test.py │ ├── ssd_inception_v2_feature_extractor.py │ ├── ssd_inception_v2_feature_extractor_test.py │ ├── ssd_inception_v3_feature_extractor.py │ ├── ssd_inception_v3_feature_extractor_test.py │ ├── ssd_mobilenet_v1_feature_extractor.py │ ├── ssd_mobilenet_v1_feature_extractor_test.py │ ├── ssd_mobilenet_v1_fpn_feature_extractor.py │ ├── ssd_mobilenet_v1_fpn_feature_extractor_test.py │ ├── ssd_mobilenet_v1_ppn_feature_extractor.py │ ├── ssd_mobilenet_v1_ppn_feature_extractor_test.py │ ├── ssd_mobilenet_v2_feature_extractor.py │ ├── ssd_mobilenet_v2_feature_extractor_test.py │ ├── ssd_resnet_v1_fpn_feature_extractor.py │ ├── ssd_resnet_v1_fpn_feature_extractor_test.py │ ├── ssd_resnet_v1_fpn_feature_extractor_testbase.py │ ├── ssd_resnet_v1_ppn_feature_extractor.py │ ├── ssd_resnet_v1_ppn_feature_extractor_test.py │ └── ssd_resnet_v1_ppn_feature_extractor_testbase.py ├── object_detection.py ├── predictors │ ├── __init__.py │ ├── convolutional_box_predictor.py │ ├── convolutional_box_predictor_test.py │ ├── heads │ │ ├── 
__init__.py │ │ ├── box_head.py │ │ ├── box_head_test.py │ │ ├── class_head.py │ │ ├── class_head_test.py │ │ ├── head.py │ │ ├── keypoint_head.py │ │ ├── keypoint_head_test.py │ │ ├── mask_head.py │ │ └── mask_head_test.py │ ├── mask_rcnn_box_predictor.py │ ├── mask_rcnn_box_predictor_test.py │ ├── rfcn_box_predictor.py │ └── rfcn_box_predictor_test.py ├── protos │ ├── __init__.py │ ├── anchor_generator.proto │ ├── anchor_generator_pb2.py │ ├── argmax_matcher.proto │ ├── argmax_matcher_pb2.py │ ├── bipartite_matcher.proto │ ├── bipartite_matcher_pb2.py │ ├── box_coder.proto │ ├── box_coder_pb2.py │ ├── box_predictor.proto │ ├── box_predictor_pb2.py │ ├── eval.proto │ ├── eval_pb2.py │ ├── faster_rcnn.proto │ ├── faster_rcnn_box_coder.proto │ ├── faster_rcnn_box_coder_pb2.py │ ├── faster_rcnn_pb2.py │ ├── graph_rewriter.proto │ ├── graph_rewriter_pb2.py │ ├── grid_anchor_generator.proto │ ├── grid_anchor_generator_pb2.py │ ├── hyperparams.proto │ ├── hyperparams_pb2.py │ ├── image_resizer.proto │ ├── image_resizer_pb2.py │ ├── input_reader.proto │ ├── input_reader_pb2.py │ ├── keypoint_box_coder.proto │ ├── keypoint_box_coder_pb2.py │ ├── losses.proto │ ├── losses_pb2.py │ ├── matcher.proto │ ├── matcher_pb2.py │ ├── mean_stddev_box_coder.proto │ ├── mean_stddev_box_coder_pb2.py │ ├── model.proto │ ├── model_pb2.py │ ├── multiscale_anchor_generator.proto │ ├── multiscale_anchor_generator_pb2.py │ ├── optimizer.proto │ ├── optimizer_pb2.py │ ├── pipeline.proto │ ├── pipeline_pb2.py │ ├── post_processing.proto │ ├── post_processing_pb2.py │ ├── preprocessor.proto │ ├── preprocessor_pb2.py │ ├── region_similarity_calculator.proto │ ├── region_similarity_calculator_pb2.py │ ├── square_box_coder.proto │ ├── square_box_coder_pb2.py │ ├── ssd.proto │ ├── ssd_anchor_generator.proto │ ├── ssd_anchor_generator_pb2.py │ ├── ssd_pb2.py │ ├── string_int_label_map.proto │ ├── string_int_label_map_pb2.py │ ├── train.proto │ └── train_pb2.py ├── samples │ └── cloud │ │ └── cloud.yml ├── train.py ├── train.sh ├── trainer.py └── utils │ ├── __init__.py │ ├── category_util.py │ ├── category_util_test.py │ ├── config_util.py │ ├── config_util_test.py │ ├── context_manager.py │ ├── context_manager_test.py │ ├── dataset_util.py │ ├── dataset_util_test.py │ ├── json_utils.py │ ├── json_utils_test.py │ ├── label_map_util.py │ ├── label_map_util_test.py │ ├── learning_schedules.py │ ├── learning_schedules_test.py │ ├── metrics.py │ ├── metrics_test.py │ ├── np_box_list.py │ ├── np_box_list_ops.py │ ├── np_box_list_ops_test.py │ ├── np_box_list_test.py │ ├── np_box_mask_list.py │ ├── np_box_mask_list_ops.py │ ├── np_box_mask_list_ops_test.py │ ├── np_box_mask_list_test.py │ ├── np_box_ops.py │ ├── np_box_ops_test.py │ ├── np_mask_ops.py │ ├── np_mask_ops_test.py │ ├── object_detection_evaluation.py │ ├── object_detection_evaluation_test.py │ ├── ops.py │ ├── ops_test.py │ ├── per_image_evaluation.py │ ├── per_image_evaluation_test.py │ ├── per_image_vrd_evaluation.py │ ├── per_image_vrd_evaluation_test.py │ ├── shape_utils.py │ ├── shape_utils_test.py │ ├── static_shape.py │ ├── static_shape_test.py │ ├── test_case.py │ ├── test_utils.py │ ├── test_utils_test.py │ ├── variables_helper.py │ ├── variables_helper_test.py │ ├── visualization_utils.py │ ├── visualization_utils_test.py │ ├── vrd_evaluation.py │ └── vrd_evaluation_test.py ├── oilplot_pr.png ├── oiltank_155.jpg ├── readme_ch.md ├── setup.py ├── slim ├── WORKSPACE ├── __init__.py ├── datasets │ ├── __init__.py │ ├── build_imagenet_data.py │ ├── cifar10.py │ 
├── dataset_classification.py │ ├── dataset_factory.py │ ├── dataset_utils.py │ ├── download_and_convert_cifar10.py │ ├── download_and_convert_flowers.py │ ├── download_and_convert_imagenet.sh │ ├── download_and_convert_mnist.py │ ├── download_imagenet.sh │ ├── flowers.py │ ├── imagenet.py │ ├── imagenet_2012_validation_synset_labels.txt │ ├── imagenet_lsvrc_2015_synsets.txt │ ├── imagenet_metadata.txt │ ├── mnist.py │ ├── preprocess_imagenet_validation_data.py │ └── process_bounding_boxes.py ├── deployment │ ├── __init__.py │ ├── model_deploy.py │ └── model_deploy_test.py ├── download_and_convert_data.py ├── eval_image_classifier.py ├── export_inference_graph.py ├── export_inference_graph_test.py ├── exporter.py ├── nets │ ├── __init__.py │ ├── alexnet.py │ ├── alexnet_test.py │ ├── cifarnet.py │ ├── cyclegan.py │ ├── cyclegan_test.py │ ├── dcgan.py │ ├── dcgan_test.py │ ├── inception.py │ ├── inception_resnet_v2.py │ ├── inception_resnet_v2_test.py │ ├── inception_utils.py │ ├── inception_v1.py │ ├── inception_v1_test.py │ ├── inception_v2.py │ ├── inception_v2_test.py │ ├── inception_v3.py │ ├── inception_v3_test.py │ ├── inception_v4.py │ ├── inception_v4_test.py │ ├── lenet.py │ ├── mobilenet │ │ ├── README.md │ │ ├── __init__.py │ │ ├── conv_blocks.py │ │ ├── madds_top1_accuracy.png │ │ ├── mnet_v1_vs_v2_pixel1_latency.png │ │ ├── mobilenet.py │ │ ├── mobilenet_example.ipynb │ │ ├── mobilenet_v2.py │ │ └── mobilenet_v2_test.py │ ├── mobilenet_v1.md │ ├── mobilenet_v1.png │ ├── mobilenet_v1.py │ ├── mobilenet_v1_eval.py │ ├── mobilenet_v1_test.py │ ├── mobilenet_v1_train.py │ ├── nasnet │ │ ├── README.md │ │ ├── __init__.py │ │ ├── nasnet.py │ │ ├── nasnet_test.py │ │ ├── nasnet_utils.py │ │ ├── nasnet_utils_test.py │ │ ├── pnasnet.py │ │ └── pnasnet_test.py │ ├── nets_factory.py │ ├── nets_factory_test.py │ ├── overfeat.py │ ├── overfeat_test.py │ ├── pix2pix.py │ ├── pix2pix_test.py │ ├── resnet_utils.py │ ├── resnet_v1.py │ ├── resnet_v1_test.py │ ├── resnet_v2.py │ ├── resnet_v2_test.py │ ├── vgg.py │ └── vgg_test.py ├── preprocessing │ ├── __init__.py │ ├── cifarnet_preprocessing.py │ ├── inception_preprocessing.py │ ├── lenet_preprocessing.py │ ├── preprocessing_factory.py │ └── vgg_preprocessing.py ├── scripts │ ├── export_mobilenet.sh │ ├── finetune_inception_resnet_v2_on_flowers.sh │ ├── finetune_inception_v1_on_flowers.sh │ ├── finetune_inception_v3_on_flowers.sh │ ├── finetune_resnet_v1_50_on_flowers.sh │ ├── train_cifarnet_on_cifar10.sh │ └── train_lenet_on_mnist.sh ├── setup.py ├── test_images_classifier.py ├── train_image_classifier.py └── train_image_classifier_defind.py ├── trainval_person.txt ├── zcreate_record.sh ├── zfrozen.sh └── ztrain.sh /001.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/001.jpg -------------------------------------------------------------------------------- /002.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/002.jpg -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2017 Nick Bourdakos 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the 
"Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 22 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # Embedded target detection based on mobilenet SSD 2 | 1. The performance of this model for embedded design in small object detection will be better, such as Northwest University of technology aircraft data set (sparse small target). 3 | 4 | 2. In the detection of the new aspect ratio, the coarse and large resolution channel is used to add attention, and the performance of the sample layer target is improved greatly (multi-scale: playground, aircraft, aisle). 5 | 6 | 3. In our model, we first use the deconvolution structure for multi-source rough high-resolution, and the sampling layer is faster. 7 | 8 | 4. Up sampling adopts label smoothing and training initialization weight, resulting in loss transformation modification, which makes frame drawing more accurate。 9 | 10 | ## VOC Dataset 11 | voc2007 format 12 | 13 | ## Training 14 | Tensorflow-gpu==1.10.0&Tensorflow-gpu==1.12.0 15 | cuda =8/9 16 | opencv-python==3.4.0 17 | pillow 18 | matplotlib 19 | 20 | 1、datsets 21 | imges ,imgs files; 22 | ammitations,xml files; 23 | 24 | 2、label_map_person.txt ;id,name. 25 | creat_name.py 26 | 27 | slim files 28 | python setup.py build 29 | python setup.py install 30 | 31 | python setup.py build 32 | python setup.py install 33 | 34 | 3、object_detection 35 | create_tf_record.py,146、149、162、167 rows 36 | train.record 37 | val.record 38 | 39 | 4、embedded_ssd_mobilenet_v1_coco.config中9、141、146、156、172、182、184 rows。 40 | 41 | 5、object_detection 42 | train.sh 43 | 44 | 6、reference resources readme_ch.md 45 | 46 | ## Evaluation 47 | python export_inference_graph.py --input_type image_tensor --pipeline_config_path ./rfcn_resnet101_coco.config 48 | --trained_checkpoint_prefix ./models/train/model.ckpt-5000 --output_directory ./fine_tuned_model 49 | 50 | ## Citing mini_SSD 51 | This project realizes high-speed detection of mobile terminal from the comprehensive optimization method of engineering hardware. I declare that this model is modified by referring to a sub model of Google's object detection API model and integrating mobilnetv1 and slim methods. It is mainly for an engineering product. We realize the use of embedded system, taking into account the calculation balance burden and thread synchronization between chip modules We have made the corresponding design. 52 | 53 | At present, there are still some small problems in speed and accuracy. 
46 | ## Evaluation 47 | Export a frozen inference graph from a trained checkpoint (adjust the config and checkpoint paths to your own training run): 48 | python export_inference_graph.py --input_type image_tensor --pipeline_config_path ./rfcn_resnet101_coco.config --trained_checkpoint_prefix ./models/train/model.ckpt-5000 --output_directory ./fine_tuned_model 49 | 50 | ## Citing mini_SSD 51 | This project aims at high-speed detection on mobile devices through combined engineering and hardware optimization. The model is a modification of a sub-model of Google's Object Detection API that integrates MobileNetV1 and slim. It was built for an engineering product running on an embedded system, and the design balances the computational load and thread synchronization between the chip modules. 52 | 53 | There are still some small issues with speed and accuracy; feedback that helps reach the goal of 95 fps is welcome. The biggest advantage of the model is that its weight file is roughly 1/100 the size of an ordinary model while the speed remains competitive: for ordinary problems the model can be deployed within about 5 MB, and the weights are generally under 2 MB. 54 | 55 | On a single PC with an i7 CPU, inference takes about 300 ms on 1200x960 images; other relevant figures will be added later. The accuracy and speed can still be optimized further, and the details will follow in the second edition. The open-source release is intended to help deploy a large model on ARM Linux and to let you build your own ideas on top of it. To use the model on ARM, the TensorFlow source must be compiled and TF deployed on the target board. 56 | 57 | If you are not familiar with Google's Object Detection API, please follow this tutorial closely; otherwise mismatches between the various components will lead to compilation problems. 58 | 59 | ![result](https://github.com/Eric3911/miniDetection/blob/master/oilplot_pr.png) 60 | ![result](https://github.com/Eric3911/miniDetection/blob/master/oiltank_155.jpg) 61 | ![result](https://github.com/Eric3911/mini_SSD/blob/master/001.jpg) 62 |
-------------------------------------------------------------------------------- /annotations/creat_name.py: --------------------------------------------------------------------------------
1 | # 2. Script to generate the name list from the annotation files 2 | import os 3 | imglst = os.listdir("./annotations/xmls/") 4 | with open("./annotations/trainval_person.txt","w") as ff: 5 | for img_path in imglst: 6 | name = img_path.split(".")[0] 7 | print(name) 8 | ff.write(name+"\n")
-------------------------------------------------------------------------------- /annotations/label_map_person.pbtxt: --------------------------------------------------------------------------------
1 | item { 2 | id: 1 3 | name: 'Person' 4 | } 5 |
-------------------------------------------------------------------------------- /annotations/trainval_person.txt: --------------------------------------------------------------------------------
https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/annotations/trainval_person.txt
-------------------------------------------------------------------------------- /creat_name.py: --------------------------------------------------------------------------------
1 | # 2. Script to generate the name list from the annotation files 2 | import os 3 | imglst = os.listdir("./annotations/xmls/") 4 | with open("./annotations/trainval_person.txt","w") as ff: 5 | for img_path in imglst: 6 | name = img_path.split(".")[0] 7 | print(name) 8 | ff.write(name+"\n")
-------------------------------------------------------------------------------- /label_map_person.pbtxt: --------------------------------------------------------------------------------
1 | item { 2 | id: 1 3 | name: 'Person' 4 | } 5 |
-------------------------------------------------------------------------------- /object_detection/CONTRIBUTING.md: --------------------------------------------------------------------------------
1 | # Contributing to the Tensorflow Object Detection API 2 | 3 | Patches to Tensorflow Object Detection API are welcome! 4 | 5 | We require contributors to fill out either the individual or corporate 6 | Contributor License Agreement (CLA).
7 | 8 | * If you are an individual writing original source code and you're sure you own the intellectual property, then you'll need to sign an [individual CLA](http://code.google.com/legal/individual-cla-v1.0.html). 9 | * If you work for a company that wants to allow you to contribute your work, then you'll need to sign a [corporate CLA](http://code.google.com/legal/corporate-cla-v1.0.html). 10 | 11 | Please follow the 12 | [Tensorflow contributing guidelines](https://github.com/tensorflow/tensorflow/blob/master/CONTRIBUTING.md) 13 | when submitting pull requests. 14 | -------------------------------------------------------------------------------- /object_detection/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/__init__.py -------------------------------------------------------------------------------- /object_detection/anchor_generators/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/anchor_generators/__init__.py -------------------------------------------------------------------------------- /object_detection/box_coders/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/box_coders/__init__.py -------------------------------------------------------------------------------- /object_detection/box_coders/mean_stddev_box_coder.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """Mean stddev box coder. 17 | 18 | This box coder use the following coding schema to encode boxes: 19 | rel_code = (box_corner - anchor_corner_mean) / anchor_corner_stddev. 20 | """ 21 | from object_detection.core import box_coder 22 | from object_detection.core import box_list 23 | 24 | 25 | class MeanStddevBoxCoder(box_coder.BoxCoder): 26 | """Mean stddev box coder.""" 27 | 28 | def __init__(self, stddev=0.01): 29 | """Constructor for MeanStddevBoxCoder. 30 | 31 | Args: 32 | stddev: The standard deviation used to encode and decode boxes. 33 | """ 34 | self._stddev = stddev 35 | 36 | @property 37 | def code_size(self): 38 | return 4 39 | 40 | def _encode(self, boxes, anchors): 41 | """Encode a box collection with respect to anchor collection. 42 | 43 | Args: 44 | boxes: BoxList holding N boxes to be encoded. 45 | anchors: BoxList of N anchors. 
46 | 47 | Returns: 48 | a tensor representing N anchor-encoded boxes 49 | 50 | Raises: 51 | ValueError: if the anchors still have deprecated stddev field. 52 | """ 53 | box_corners = boxes.get() 54 | if anchors.has_field('stddev'): 55 | raise ValueError("'stddev' is a parameter of MeanStddevBoxCoder and " 56 | "should not be specified in the box list.") 57 | means = anchors.get() 58 | return (box_corners - means) / self._stddev 59 | 60 | def _decode(self, rel_codes, anchors): 61 | """Decode. 62 | 63 | Args: 64 | rel_codes: a tensor representing N anchor-encoded boxes. 65 | anchors: BoxList of anchors. 66 | 67 | Returns: 68 | boxes: BoxList holding N bounding boxes 69 | 70 | Raises: 71 | ValueError: if the anchors still have deprecated stddev field and expects 72 | the decode method to use stddev value from that field. 73 | """ 74 | means = anchors.get() 75 | if anchors.has_field('stddev'): 76 | raise ValueError("'stddev' is a parameter of MeanStddevBoxCoder and " 77 | "should not be specified in the box list.") 78 | box_corners = rel_codes * self._stddev + means 79 | return box_list.BoxList(box_corners) 80 | -------------------------------------------------------------------------------- /object_detection/box_coders/mean_stddev_box_coder_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 
14 | # ============================================================================== 15 | 16 | """Tests for object_detection.box_coder.mean_stddev_boxcoder.""" 17 | 18 | import tensorflow as tf 19 | 20 | from object_detection.box_coders import mean_stddev_box_coder 21 | from object_detection.core import box_list 22 | 23 | 24 | class MeanStddevBoxCoderTest(tf.test.TestCase): 25 | 26 | def testGetCorrectRelativeCodesAfterEncoding(self): 27 | box_corners = [[0.0, 0.0, 0.5, 0.5], [0.0, 0.0, 0.5, 0.5]] 28 | boxes = box_list.BoxList(tf.constant(box_corners)) 29 | expected_rel_codes = [[0.0, 0.0, 0.0, 0.0], [-5.0, -5.0, -5.0, -3.0]] 30 | prior_means = tf.constant([[0.0, 0.0, 0.5, 0.5], [0.5, 0.5, 1.0, 0.8]]) 31 | priors = box_list.BoxList(prior_means) 32 | 33 | coder = mean_stddev_box_coder.MeanStddevBoxCoder(stddev=0.1) 34 | rel_codes = coder.encode(boxes, priors) 35 | with self.test_session() as sess: 36 | rel_codes_out = sess.run(rel_codes) 37 | self.assertAllClose(rel_codes_out, expected_rel_codes) 38 | 39 | def testGetCorrectBoxesAfterDecoding(self): 40 | rel_codes = tf.constant([[0.0, 0.0, 0.0, 0.0], [-5.0, -5.0, -5.0, -3.0]]) 41 | expected_box_corners = [[0.0, 0.0, 0.5, 0.5], [0.0, 0.0, 0.5, 0.5]] 42 | prior_means = tf.constant([[0.0, 0.0, 0.5, 0.5], [0.5, 0.5, 1.0, 0.8]]) 43 | priors = box_list.BoxList(prior_means) 44 | 45 | coder = mean_stddev_box_coder.MeanStddevBoxCoder(stddev=0.1) 46 | decoded_boxes = coder.decode(rel_codes, priors) 47 | decoded_box_corners = decoded_boxes.get() 48 | with self.test_session() as sess: 49 | decoded_out = sess.run(decoded_box_corners) 50 | self.assertAllClose(decoded_out, expected_box_corners) 51 | 52 | 53 | if __name__ == '__main__': 54 | tf.test.main() 55 | -------------------------------------------------------------------------------- /object_detection/builders/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/builders/__init__.py -------------------------------------------------------------------------------- /object_detection/builders/box_coder_builder.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """A function to build an object detection box coder from configuration.""" 17 | from object_detection.box_coders import faster_rcnn_box_coder 18 | from object_detection.box_coders import keypoint_box_coder 19 | from object_detection.box_coders import mean_stddev_box_coder 20 | from object_detection.box_coders import square_box_coder 21 | from object_detection.protos import box_coder_pb2 22 | 23 | 24 | def build(box_coder_config): 25 | """Builds a box coder object based on the box coder config. 
26 | 27 | Args: 28 | box_coder_config: A box_coder.proto object containing the config for the 29 | desired box coder. 30 | 31 | Returns: 32 | BoxCoder based on the config. 33 | 34 | Raises: 35 | ValueError: On empty box coder proto. 36 | """ 37 | if not isinstance(box_coder_config, box_coder_pb2.BoxCoder): 38 | raise ValueError('box_coder_config not of type box_coder_pb2.BoxCoder.') 39 | 40 | if box_coder_config.WhichOneof('box_coder_oneof') == 'faster_rcnn_box_coder': 41 | return faster_rcnn_box_coder.FasterRcnnBoxCoder(scale_factors=[ 42 | box_coder_config.faster_rcnn_box_coder.y_scale, 43 | box_coder_config.faster_rcnn_box_coder.x_scale, 44 | box_coder_config.faster_rcnn_box_coder.height_scale, 45 | box_coder_config.faster_rcnn_box_coder.width_scale 46 | ]) 47 | if box_coder_config.WhichOneof('box_coder_oneof') == 'keypoint_box_coder': 48 | return keypoint_box_coder.KeypointBoxCoder( 49 | box_coder_config.keypoint_box_coder.num_keypoints, 50 | scale_factors=[ 51 | box_coder_config.keypoint_box_coder.y_scale, 52 | box_coder_config.keypoint_box_coder.x_scale, 53 | box_coder_config.keypoint_box_coder.height_scale, 54 | box_coder_config.keypoint_box_coder.width_scale 55 | ]) 56 | if (box_coder_config.WhichOneof('box_coder_oneof') == 57 | 'mean_stddev_box_coder'): 58 | return mean_stddev_box_coder.MeanStddevBoxCoder( 59 | stddev=box_coder_config.mean_stddev_box_coder.stddev) 60 | if box_coder_config.WhichOneof('box_coder_oneof') == 'square_box_coder': 61 | return square_box_coder.SquareBoxCoder(scale_factors=[ 62 | box_coder_config.square_box_coder.y_scale, 63 | box_coder_config.square_box_coder.x_scale, 64 | box_coder_config.square_box_coder.length_scale 65 | ]) 66 | raise ValueError('Empty box coder.') 67 | -------------------------------------------------------------------------------- /object_detection/builders/graph_rewriter_builder.py: -------------------------------------------------------------------------------- 1 | # Copyright 2018 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | """Functions for quantized training and evaluation.""" 16 | 17 | import tensorflow as tf 18 | 19 | 20 | def build(graph_rewriter_config, is_training): 21 | """Returns a function that modifies default graph based on options. 22 | 23 | Args: 24 | graph_rewriter_config: graph_rewriter_pb2.GraphRewriter proto. 25 | is_training: whether in training of eval mode. 
26 | """ 27 | def graph_rewrite_fn(): 28 | """Function to quantize weights and activation of the default graph.""" 29 | if (graph_rewriter_config.quantization.weight_bits != 8 or 30 | graph_rewriter_config.quantization.activation_bits != 8): 31 | raise ValueError('Only 8bit quantization is supported') 32 | 33 | # Quantize the graph by inserting quantize ops for weights and activations 34 | if is_training: 35 | tf.contrib.quantize.create_training_graph( 36 | input_graph=tf.get_default_graph(), 37 | quant_delay=graph_rewriter_config.quantization.delay) 38 | else: 39 | tf.contrib.quantize.create_eval_graph(input_graph=tf.get_default_graph()) 40 | 41 | tf.contrib.layers.summarize_collection('quant_vars') 42 | return graph_rewrite_fn 43 | -------------------------------------------------------------------------------- /object_detection/builders/graph_rewriter_builder_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2018 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | """Tests for graph_rewriter_builder.""" 16 | import mock 17 | import tensorflow as tf 18 | from object_detection.builders import graph_rewriter_builder 19 | from object_detection.protos import graph_rewriter_pb2 20 | 21 | 22 | class QuantizationBuilderTest(tf.test.TestCase): 23 | 24 | def testQuantizationBuilderSetsUpCorrectTrainArguments(self): 25 | with mock.patch.object( 26 | tf.contrib.quantize, 'create_training_graph') as mock_quant_fn: 27 | with mock.patch.object(tf.contrib.layers, 28 | 'summarize_collection') as mock_summarize_col: 29 | graph_rewriter_proto = graph_rewriter_pb2.GraphRewriter() 30 | graph_rewriter_proto.quantization.delay = 10 31 | graph_rewriter_proto.quantization.weight_bits = 8 32 | graph_rewriter_proto.quantization.activation_bits = 8 33 | graph_rewrite_fn = graph_rewriter_builder.build( 34 | graph_rewriter_proto, is_training=True) 35 | graph_rewrite_fn() 36 | _, kwargs = mock_quant_fn.call_args 37 | self.assertEqual(kwargs['input_graph'], tf.get_default_graph()) 38 | self.assertEqual(kwargs['quant_delay'], 10) 39 | mock_summarize_col.assert_called_with('quant_vars') 40 | 41 | def testQuantizationBuilderSetsUpCorrectEvalArguments(self): 42 | with mock.patch.object(tf.contrib.quantize, 43 | 'create_eval_graph') as mock_quant_fn: 44 | with mock.patch.object(tf.contrib.layers, 45 | 'summarize_collection') as mock_summarize_col: 46 | graph_rewriter_proto = graph_rewriter_pb2.GraphRewriter() 47 | graph_rewriter_proto.quantization.delay = 10 48 | graph_rewrite_fn = graph_rewriter_builder.build( 49 | graph_rewriter_proto, is_training=False) 50 | graph_rewrite_fn() 51 | _, kwargs = mock_quant_fn.call_args 52 | self.assertEqual(kwargs['input_graph'], tf.get_default_graph()) 53 | mock_summarize_col.assert_called_with('quant_vars') 54 | 55 | 56 | if __name__ == '__main__': 57 | 
tf.test.main() 58 | -------------------------------------------------------------------------------- /object_detection/builders/input_reader_builder.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """Input reader builder. 17 | 18 | Creates data sources for DetectionModels from an InputReader config. See 19 | input_reader.proto for options. 20 | 21 | Note: If users wishes to also use their own InputReaders with the Object 22 | Detection configuration framework, they should define their own builder function 23 | that wraps the build function. 24 | """ 25 | 26 | import tensorflow as tf 27 | 28 | from object_detection.data_decoders import tf_example_decoder 29 | from object_detection.protos import input_reader_pb2 30 | 31 | parallel_reader = tf.contrib.slim.parallel_reader 32 | 33 | 34 | def build(input_reader_config): 35 | """Builds a tensor dictionary based on the InputReader config. 36 | 37 | Args: 38 | input_reader_config: A input_reader_pb2.InputReader object. 39 | 40 | Returns: 41 | A tensor dict based on the input_reader_config. 42 | 43 | Raises: 44 | ValueError: On invalid input reader proto. 45 | ValueError: If no input paths are specified. 46 | """ 47 | if not isinstance(input_reader_config, input_reader_pb2.InputReader): 48 | raise ValueError('input_reader_config not of type ' 49 | 'input_reader_pb2.InputReader.') 50 | 51 | if input_reader_config.WhichOneof('input_reader') == 'tf_record_input_reader': 52 | config = input_reader_config.tf_record_input_reader 53 | if not config.input_path: 54 | raise ValueError('At least one input path must be specified in ' 55 | '`input_reader_config`.') 56 | _, string_tensor = parallel_reader.parallel_read( 57 | config.input_path[:], # Convert `RepeatedScalarContainer` to list. 
58 | reader_class=tf.TFRecordReader, 59 | num_epochs=(input_reader_config.num_epochs 60 | if input_reader_config.num_epochs else None), 61 | num_readers=input_reader_config.num_readers, 62 | shuffle=input_reader_config.shuffle, 63 | dtypes=[tf.string, tf.string], 64 | capacity=input_reader_config.queue_capacity, 65 | min_after_dequeue=input_reader_config.min_after_dequeue) 66 | 67 | label_map_proto_file = None 68 | if input_reader_config.HasField('label_map_path'): 69 | label_map_proto_file = input_reader_config.label_map_path 70 | decoder = tf_example_decoder.TfExampleDecoder( 71 | load_instance_masks=input_reader_config.load_instance_masks, 72 | instance_mask_type=input_reader_config.mask_type, 73 | label_map_proto_file=label_map_proto_file) 74 | return decoder.decode(string_tensor) 75 | 76 | raise ValueError('Unsupported input_reader_config.') 77 | -------------------------------------------------------------------------------- /object_detection/builders/matcher_builder.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """A function to build an object detection matcher from configuration.""" 17 | 18 | from object_detection.matchers import argmax_matcher 19 | from object_detection.matchers import bipartite_matcher 20 | from object_detection.protos import matcher_pb2 21 | 22 | 23 | def build(matcher_config): 24 | """Builds a matcher object based on the matcher config. 25 | 26 | Args: 27 | matcher_config: A matcher.proto object containing the config for the desired 28 | Matcher. 29 | 30 | Returns: 31 | Matcher based on the config. 32 | 33 | Raises: 34 | ValueError: On empty matcher proto. 
35 | """ 36 | if not isinstance(matcher_config, matcher_pb2.Matcher): 37 | raise ValueError('matcher_config not of type matcher_pb2.Matcher.') 38 | if matcher_config.WhichOneof('matcher_oneof') == 'argmax_matcher': 39 | matcher = matcher_config.argmax_matcher 40 | matched_threshold = unmatched_threshold = None 41 | if not matcher.ignore_thresholds: 42 | matched_threshold = matcher.matched_threshold 43 | unmatched_threshold = matcher.unmatched_threshold 44 | return argmax_matcher.ArgMaxMatcher( 45 | matched_threshold=matched_threshold, 46 | unmatched_threshold=unmatched_threshold, 47 | negatives_lower_than_unmatched=matcher.negatives_lower_than_unmatched, 48 | force_match_for_each_row=matcher.force_match_for_each_row, 49 | use_matmul_gather=matcher.use_matmul_gather) 50 | if matcher_config.WhichOneof('matcher_oneof') == 'bipartite_matcher': 51 | matcher = matcher_config.bipartite_matcher 52 | return bipartite_matcher.GreedyBipartiteMatcher(matcher.use_matmul_gather) 53 | raise ValueError('Empty matcher.') 54 | -------------------------------------------------------------------------------- /object_detection/builders/region_similarity_calculator_builder.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """Builder for region similarity calculators.""" 17 | 18 | from object_detection.core import region_similarity_calculator 19 | from object_detection.protos import region_similarity_calculator_pb2 20 | 21 | 22 | def build(region_similarity_calculator_config): 23 | """Builds region similarity calculator based on the configuration. 24 | 25 | Builds one of [IouSimilarity, IoaSimilarity, NegSqDistSimilarity] objects. See 26 | core/region_similarity_calculator.proto for details. 27 | 28 | Args: 29 | region_similarity_calculator_config: RegionSimilarityCalculator 30 | configuration proto. 31 | 32 | Returns: 33 | region_similarity_calculator: RegionSimilarityCalculator object. 34 | 35 | Raises: 36 | ValueError: On unknown region similarity calculator. 
37 | """ 38 | 39 | if not isinstance( 40 | region_similarity_calculator_config, 41 | region_similarity_calculator_pb2.RegionSimilarityCalculator): 42 | raise ValueError( 43 | 'region_similarity_calculator_config not of type ' 44 | 'region_similarity_calculator_pb2.RegionsSimilarityCalculator') 45 | 46 | similarity_calculator = region_similarity_calculator_config.WhichOneof( 47 | 'region_similarity') 48 | if similarity_calculator == 'iou_similarity': 49 | return region_similarity_calculator.IouSimilarity() 50 | if similarity_calculator == 'ioa_similarity': 51 | return region_similarity_calculator.IoaSimilarity() 52 | if similarity_calculator == 'neg_sq_dist_similarity': 53 | return region_similarity_calculator.NegSqDistSimilarity() 54 | if similarity_calculator == 'thresholded_iou_similarity': 55 | return region_similarity_calculator.ThresholdedIouSimilarity( 56 | region_similarity_calculator_config.thresholded_iou_similarity.threshold 57 | ) 58 | 59 | raise ValueError('Unknown region similarity calculator.') 60 | -------------------------------------------------------------------------------- /object_detection/builders/region_similarity_calculator_builder_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 
14 | # ============================================================================== 15 | 16 | """Tests for region_similarity_calculator_builder.""" 17 | 18 | import tensorflow as tf 19 | 20 | from google.protobuf import text_format 21 | from object_detection.builders import region_similarity_calculator_builder 22 | from object_detection.core import region_similarity_calculator 23 | from object_detection.protos import region_similarity_calculator_pb2 as sim_calc_pb2 24 | 25 | 26 | class RegionSimilarityCalculatorBuilderTest(tf.test.TestCase): 27 | 28 | def testBuildIoaSimilarityCalculator(self): 29 | similarity_calc_text_proto = """ 30 | ioa_similarity { 31 | } 32 | """ 33 | similarity_calc_proto = sim_calc_pb2.RegionSimilarityCalculator() 34 | text_format.Merge(similarity_calc_text_proto, similarity_calc_proto) 35 | similarity_calc = region_similarity_calculator_builder.build( 36 | similarity_calc_proto) 37 | self.assertTrue(isinstance(similarity_calc, 38 | region_similarity_calculator.IoaSimilarity)) 39 | 40 | def testBuildIouSimilarityCalculator(self): 41 | similarity_calc_text_proto = """ 42 | iou_similarity { 43 | } 44 | """ 45 | similarity_calc_proto = sim_calc_pb2.RegionSimilarityCalculator() 46 | text_format.Merge(similarity_calc_text_proto, similarity_calc_proto) 47 | similarity_calc = region_similarity_calculator_builder.build( 48 | similarity_calc_proto) 49 | self.assertTrue(isinstance(similarity_calc, 50 | region_similarity_calculator.IouSimilarity)) 51 | 52 | def testBuildNegSqDistSimilarityCalculator(self): 53 | similarity_calc_text_proto = """ 54 | neg_sq_dist_similarity { 55 | } 56 | """ 57 | similarity_calc_proto = sim_calc_pb2.RegionSimilarityCalculator() 58 | text_format.Merge(similarity_calc_text_proto, similarity_calc_proto) 59 | similarity_calc = region_similarity_calculator_builder.build( 60 | similarity_calc_proto) 61 | self.assertTrue(isinstance(similarity_calc, 62 | region_similarity_calculator. 63 | NegSqDistSimilarity)) 64 | 65 | 66 | if __name__ == '__main__': 67 | tf.test.main() 68 | -------------------------------------------------------------------------------- /object_detection/core/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /object_detection/core/box_coder_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 
14 | # ============================================================================== 15 | 16 | """Tests for object_detection.core.box_coder.""" 17 | 18 | import tensorflow as tf 19 | 20 | from object_detection.core import box_coder 21 | from object_detection.core import box_list 22 | 23 | 24 | class MockBoxCoder(box_coder.BoxCoder): 25 | """Test BoxCoder that encodes/decodes using the multiply-by-two function.""" 26 | 27 | def code_size(self): 28 | return 4 29 | 30 | def _encode(self, boxes, anchors): 31 | return 2.0 * boxes.get() 32 | 33 | def _decode(self, rel_codes, anchors): 34 | return box_list.BoxList(rel_codes / 2.0) 35 | 36 | 37 | class BoxCoderTest(tf.test.TestCase): 38 | 39 | def test_batch_decode(self): 40 | mock_anchor_corners = tf.constant( 41 | [[0, 0.1, 0.2, 0.3], [0.2, 0.4, 0.4, 0.6]], tf.float32) 42 | mock_anchors = box_list.BoxList(mock_anchor_corners) 43 | mock_box_coder = MockBoxCoder() 44 | 45 | expected_boxes = [[[0.0, 0.1, 0.5, 0.6], [0.5, 0.6, 0.7, 0.8]], 46 | [[0.1, 0.2, 0.3, 0.4], [0.7, 0.8, 0.9, 1.0]]] 47 | 48 | encoded_boxes_list = [mock_box_coder.encode( 49 | box_list.BoxList(tf.constant(boxes)), mock_anchors) 50 | for boxes in expected_boxes] 51 | encoded_boxes = tf.stack(encoded_boxes_list) 52 | decoded_boxes = box_coder.batch_decode( 53 | encoded_boxes, mock_box_coder, mock_anchors) 54 | 55 | with self.test_session() as sess: 56 | decoded_boxes_result = sess.run(decoded_boxes) 57 | self.assertAllClose(expected_boxes, decoded_boxes_result) 58 | 59 | 60 | if __name__ == '__main__': 61 | tf.test.main() 62 | -------------------------------------------------------------------------------- /object_detection/core/data_decoder.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """Interface for data decoders. 17 | 18 | Data decoders decode the input data and return a dictionary of tensors keyed by 19 | the entries in core.reader.Fields. 20 | """ 21 | from abc import ABCMeta 22 | from abc import abstractmethod 23 | 24 | 25 | class DataDecoder(object): 26 | """Interface for data decoders.""" 27 | __metaclass__ = ABCMeta 28 | 29 | @abstractmethod 30 | def decode(self, data): 31 | """Return a single image and associated labels. 32 | 33 | Args: 34 | data: a string tensor holding a serialized protocol buffer corresponding 35 | to data for a single image. 36 | 37 | Returns: 38 | tensor_dict: a dictionary containing tensors. Possible keys are defined in 39 | reader.Fields. 40 | """ 41 | pass 42 | -------------------------------------------------------------------------------- /object_detection/core/data_parser.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 
2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | """Interface for data parsers. 16 | 17 | Data parser parses input data and returns a dictionary of numpy arrays 18 | keyed by the entries in standard_fields.py. Since the parser parses records 19 | to numpy arrays (materialized tensors) directly, it is used to read data for 20 | evaluation/visualization; to parse the data during training, DataDecoder should 21 | be used. 22 | """ 23 | from abc import ABCMeta 24 | from abc import abstractmethod 25 | 26 | 27 | class DataToNumpyParser(object): 28 | __metaclass__ = ABCMeta 29 | 30 | @abstractmethod 31 | def parse(self, input_data): 32 | """Parses input and returns a numpy array or a dictionary of numpy arrays. 33 | 34 | Args: 35 | input_data: an input data 36 | 37 | Returns: 38 | A numpy array or a dictionary of numpy arrays or None, if input 39 | cannot be parsed. 40 | """ 41 | pass 42 | -------------------------------------------------------------------------------- /object_detection/core/freezable_batch_norm.py: -------------------------------------------------------------------------------- 1 | # Copyright 2018 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """A freezable batch norm layer that uses Keras batch normalization.""" 17 | import tensorflow as tf 18 | 19 | 20 | class FreezableBatchNorm(tf.keras.layers.BatchNormalization): 21 | """Batch normalization layer (Ioffe and Szegedy, 2014). 22 | 23 | This is a `freezable` batch norm layer that supports setting the `training` 24 | parameter in the __init__ method rather than having to set it either via 25 | the Keras learning phase or via the `call` method parameter. This layer will 26 | forward all other parameters to the default Keras `BatchNormalization` 27 | layer 28 | 29 | This is class is necessary because Object Detection model training sometimes 30 | requires batch normalization layers to be `frozen` and used as if it was 31 | evaluation time, despite still training (and potentially using dropout layers) 32 | 33 | Like the default Keras BatchNormalization layer, this will normalize the 34 | activations of the previous layer at each batch, 35 | i.e. 
applies a transformation that maintains the mean activation 36 | close to 0 and the activation standard deviation close to 1. 37 | 38 | Arguments: 39 | training: Boolean or None. If True, the batch normalization layer will 40 | normalize the input batch using the batch mean and standard deviation, 41 | and update the total moving mean and standard deviations. If False, the 42 | layer will normalize using the moving average and std. dev, without 43 | updating the learned avg and std. dev. 44 | If None, the layer will follow the keras BatchNormalization layer 45 | strategy of checking the Keras learning phase at `call` time to decide 46 | what to do. 47 | **kwargs: The keyword arguments to forward to the keras BatchNormalization 48 | layer constructor. 49 | 50 | Input shape: 51 | Arbitrary. Use the keyword argument `input_shape` 52 | (tuple of integers, does not include the samples axis) 53 | when using this layer as the first layer in a model. 54 | 55 | Output shape: 56 | Same shape as input. 57 | 58 | References: 59 | - [Batch Normalization: Accelerating Deep Network Training by Reducing 60 | Internal Covariate Shift](https://arxiv.org/abs/1502.03167) 61 | """ 62 | 63 | def __init__(self, training=None, **kwargs): 64 | super(FreezableBatchNorm, self).__init__(**kwargs) 65 | self._training = training 66 | 67 | def call(self, inputs, training=None): 68 | if training is None: 69 | training = self._training 70 | return super(FreezableBatchNorm, self).call(inputs, training=training) 71 | -------------------------------------------------------------------------------- /object_detection/core/minibatch_sampler.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """Base minibatch sampler module. 17 | 18 | The job of the minibatch_sampler is to subsample a minibatch based on some 19 | criterion. 20 | 21 | The main function call is: 22 | subsample(indicator, batch_size, **params). 23 | Indicator is a 1d boolean tensor where True denotes which examples can be 24 | sampled. It returns a boolean indicator where True denotes an example has been 25 | sampled.. 26 | 27 | Subclasses should implement the Subsample function and can make use of the 28 | @staticmethod SubsampleIndicator. 29 | """ 30 | 31 | from abc import ABCMeta 32 | from abc import abstractmethod 33 | 34 | import tensorflow as tf 35 | 36 | from object_detection.utils import ops 37 | 38 | 39 | class MinibatchSampler(object): 40 | """Abstract base class for subsampling minibatches.""" 41 | __metaclass__ = ABCMeta 42 | 43 | def __init__(self): 44 | """Constructs a minibatch sampler.""" 45 | pass 46 | 47 | @abstractmethod 48 | def subsample(self, indicator, batch_size, **params): 49 | """Returns subsample of entries in indicator. 
50 | 51 | Args: 52 | indicator: boolean tensor of shape [N] whose True entries can be sampled. 53 | batch_size: desired batch size. 54 | **params: additional keyword arguments for specific implementations of 55 | the MinibatchSampler. 56 | 57 | Returns: 58 | sample_indicator: boolean tensor of shape [N] whose True entries have been 59 | sampled. If sum(indicator) >= batch_size, sum(is_sampled) = batch_size 60 | """ 61 | pass 62 | 63 | @staticmethod 64 | def subsample_indicator(indicator, num_samples): 65 | """Subsample indicator vector. 66 | 67 | Given a boolean indicator vector with M elements set to `True`, the function 68 | assigns all but `num_samples` of these previously `True` elements to 69 | `False`. If `num_samples` is greater than M, the original indicator vector 70 | is returned. 71 | 72 | Args: 73 | indicator: a 1-dimensional boolean tensor indicating which elements 74 | are allowed to be sampled and which are not. 75 | num_samples: int32 scalar tensor 76 | 77 | Returns: 78 | a boolean tensor with the same shape as input (indicator) tensor 79 | """ 80 | indices = tf.where(indicator) 81 | indices = tf.random_shuffle(indices) 82 | indices = tf.reshape(indices, [-1]) 83 | 84 | num_samples = tf.minimum(tf.size(indices), num_samples) 85 | selected_indices = tf.slice(indices, [0], tf.reshape(num_samples, [1])) 86 | 87 | selected_indicator = ops.indices_to_dense_vector(selected_indices, 88 | tf.shape(indicator)[0]) 89 | 90 | return tf.equal(selected_indicator, 1) 91 | -------------------------------------------------------------------------------- /object_detection/core/prefetcher.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """Provides functions to prefetch tensors to feed into models.""" 17 | import tensorflow as tf 18 | 19 | 20 | def prefetch(tensor_dict, capacity): 21 | """Creates a prefetch queue for tensors. 22 | 23 | Creates a FIFO queue to asynchronously enqueue tensor_dicts and returns a 24 | dequeue op that evaluates to a tensor_dict. This function is useful in 25 | prefetching preprocessed tensors so that the data is readily available for 26 | consumers. 27 | 28 | Example input pipeline when you don't need batching: 29 | ---------------------------------------------------- 30 | key, string_tensor = slim.parallel_reader.parallel_read(...) 31 | tensor_dict = decoder.decode(string_tensor) 32 | tensor_dict = preprocessor.preprocess(tensor_dict, ...) 33 | prefetch_queue = prefetcher.prefetch(tensor_dict, capacity=20) 34 | tensor_dict = prefetch_queue.dequeue() 35 | outputs = Model(tensor_dict) 36 | ... 37 | ---------------------------------------------------- 38 | 39 | For input pipelines with batching, refer to core/batcher.py 40 | 41 | Args: 42 | tensor_dict: a dictionary of tensors to prefetch. 
43 | capacity: the size of the prefetch queue. 44 | 45 | Returns: 46 | a FIFO prefetcher queue 47 | """ 48 | names = list(tensor_dict.keys()) 49 | dtypes = [t.dtype for t in tensor_dict.values()] 50 | shapes = [t.get_shape() for t in tensor_dict.values()] 51 | prefetch_queue = tf.PaddingFIFOQueue(capacity, dtypes=dtypes, 52 | shapes=shapes, 53 | names=names, 54 | name='prefetch_queue') 55 | enqueue_op = prefetch_queue.enqueue(tensor_dict) 56 | tf.train.queue_runner.add_queue_runner(tf.train.queue_runner.QueueRunner( 57 | prefetch_queue, [enqueue_op])) 58 | tf.summary.scalar('queue/%s/fraction_of_%d_full' % (prefetch_queue.name, 59 | capacity), 60 | tf.to_float(prefetch_queue.size()) * (1. / capacity)) 61 | return prefetch_queue 62 | -------------------------------------------------------------------------------- /object_detection/data_decoders/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/data_decoders/__init__.py -------------------------------------------------------------------------------- /object_detection/dataset_tools/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/dataset_tools/__init__.py -------------------------------------------------------------------------------- /object_detection/dataset_tools/create_pycocotools_package.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | # Copyright 2018 The TensorFlow Authors. All Rights Reserved. 3 | # 4 | # Licensed under the Apache License, Version 2.0 (the "License"); 5 | # you may not use this file except in compliance with the License. 6 | # You may obtain a copy of the License at 7 | # 8 | # http://www.apache.org/licenses/LICENSE-2.0 9 | # 10 | # Unless required by applicable law or agreed to in writing, software 11 | # distributed under the License is distributed on an "AS IS" BASIS, 12 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 | # See the License for the specific language governing permissions and 14 | # limitations under the License. 15 | # ============================================================================== 16 | 17 | # Script to download pycocotools and make package for CMLE jobs. 18 | # 19 | # usage: 20 | # bash object_detection/dataset_tools/create_pycocotools_package.sh \ 21 | # /tmp/pycocotools 22 | set -e 23 | 24 | if [ -z "$1" ]; then 25 | echo "usage create_pycocotools_package.sh [output dir]" 26 | exit 27 | fi 28 | 29 | # Create the output directory. 
30 | OUTPUT_DIR="${1%/}" 31 | SCRATCH_DIR="${OUTPUT_DIR}/raw" 32 | mkdir -p "${OUTPUT_DIR}" 33 | mkdir -p "${SCRATCH_DIR}" 34 | 35 | cd ${SCRATCH_DIR} 36 | git clone https://github.com/cocodataset/cocoapi.git 37 | cd cocoapi/PythonAPI && mv ../common ./ 38 | 39 | sed "s/\.\.\/common/common/g" setup.py > setup.py.updated 40 | cp -f setup.py.updated setup.py 41 | rm setup.py.updated 42 | 43 | sed "s/\.\.\/common/common/g" pycocotools/_mask.pyx > _mask.pyx.updated 44 | cp -f _mask.pyx.updated pycocotools/_mask.pyx 45 | rm _mask.pyx.updated 46 | 47 | sed "s/import matplotlib\.pyplot as plt/import matplotlib\nmatplotlib\.use\(\'Agg\'\)\nimport matplotlib\.pyplot as plt/g" pycocotools/coco.py > coco.py.updated 48 | cp -f coco.py.updated pycocotools/coco.py 49 | rm coco.py.updated 50 | 51 | cd "${OUTPUT_DIR}" 52 | tar -czf pycocotools-2.0.tar.gz -C "${SCRATCH_DIR}/cocoapi/" PythonAPI/ 53 | rm -rf ${SCRATCH_DIR} 54 | -------------------------------------------------------------------------------- /object_detection/dataset_tools/oid_hierarchical_labels_expansion_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 
14 | # ============================================================================== 15 | """Tests for the OpenImages label expansion (OIDHierarchicalLabelsExpansion).""" 16 | 17 | from __future__ import absolute_import 18 | from __future__ import division 19 | from __future__ import print_function 20 | 21 | import tensorflow as tf 22 | 23 | from object_detection.dataset_tools import oid_hierarchical_labels_expansion 24 | 25 | 26 | def create_test_data(): 27 | hierarchy = { 28 | 'LabelName': 29 | 'a', 30 | 'Subcategory': [{ 31 | 'LabelName': 'b' 32 | }, { 33 | 'LabelName': 'c', 34 | 'Subcategory': [{ 35 | 'LabelName': 'd' 36 | }, { 37 | 'LabelName': 'e' 38 | }] 39 | }, { 40 | 'LabelName': 'f', 41 | 'Subcategory': [{ 42 | 'LabelName': 'd' 43 | },] 44 | }] 45 | } 46 | bbox_rows = [ 47 | '123,xclick,b,1,0.1,0.2,0.1,0.2,1,1,0,0,0', 48 | '123,xclick,d,1,0.2,0.3,0.1,0.2,1,1,0,0,0' 49 | ] 50 | label_rows = [ 51 | '123,verification,b,0', '123,verification,c,0', '124,verification,d,1' 52 | ] 53 | return hierarchy, bbox_rows, label_rows 54 | 55 | 56 | class HierarchicalLabelsExpansionTest(tf.test.TestCase): 57 | 58 | def test_bbox_expansion(self): 59 | hierarchy, bbox_rows, _ = create_test_data() 60 | expansion_generator = ( 61 | oid_hierarchical_labels_expansion.OIDHierarchicalLabelsExpansion( 62 | hierarchy)) 63 | all_result_rows = [] 64 | for row in bbox_rows: 65 | all_result_rows.extend(expansion_generator.expand_boxes_from_csv(row)) 66 | self.assertItemsEqual([ 67 | '123,xclick,b,1,0.1,0.2,0.1,0.2,1,1,0,0,0', 68 | '123,xclick,d,1,0.2,0.3,0.1,0.2,1,1,0,0,0', 69 | '123,xclick,f,1,0.2,0.3,0.1,0.2,1,1,0,0,0', 70 | '123,xclick,c,1,0.2,0.3,0.1,0.2,1,1,0,0,0' 71 | ], all_result_rows) 72 | 73 | def test_labels_expansion(self): 74 | hierarchy, _, label_rows = create_test_data() 75 | expansion_generator = ( 76 | oid_hierarchical_labels_expansion.OIDHierarchicalLabelsExpansion( 77 | hierarchy)) 78 | all_result_rows = [] 79 | for row in label_rows: 80 | all_result_rows.extend(expansion_generator.expand_labels_from_csv(row)) 81 | self.assertItemsEqual([ 82 | '123,verification,b,0', '123,verification,c,0', '123,verification,d,0', 83 | '123,verification,e,0', '124,verification,d,1', '124,verification,f,1', 84 | '124,verification,c,1' 85 | ], all_result_rows) 86 | 87 | if __name__ == '__main__': 88 | tf.test.main() 89 | -------------------------------------------------------------------------------- /object_detection/dataset_tools/tf_record_creation_util.py: -------------------------------------------------------------------------------- 1 | # Copyright 2018 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | r"""Utilities for creating TFRecords of TF examples for the Open Images dataset. 
16 | """ 17 | from __future__ import absolute_import 18 | from __future__ import division 19 | from __future__ import print_function 20 | 21 | import tensorflow as tf 22 | 23 | 24 | def open_sharded_output_tfrecords(exit_stack, base_path, num_shards): 25 | """Opens all TFRecord shards for writing and adds them to an exit stack. 26 | 27 | Args: 28 | exit_stack: A contextlib2.ExitStack used to automatically close the TFRecords 29 | opened in this function. 30 | base_path: The base path for all shards. 31 | num_shards: The number of shards. 32 | 33 | Returns: 34 | The list of opened TFRecords. Position k in the list corresponds to shard k. 35 | """ 36 | tf_record_output_filenames = [ 37 | '{}-{:05d}-of-{:05d}'.format(base_path, idx, num_shards) 38 | for idx in range(num_shards) 39 | ] 40 | 41 | tfrecords = [ 42 | exit_stack.enter_context(tf.python_io.TFRecordWriter(file_name)) 43 | for file_name in tf_record_output_filenames 44 | ] 45 | 46 | return tfrecords 47 | -------------------------------------------------------------------------------- /object_detection/dataset_tools/tf_record_creation_util_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2018 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | """Tests for tf_record_creation_util.py.""" 16 | 17 | import os 18 | import contextlib2 19 | import tensorflow as tf 20 | 21 | from object_detection.dataset_tools import tf_record_creation_util 22 | 23 | 24 | class OpenOutputTfrecordsTests(tf.test.TestCase): 25 | 26 | def test_sharded_tfrecord_writes(self): 27 | with contextlib2.ExitStack() as tf_record_close_stack: 28 | output_tfrecords = tf_record_creation_util.open_sharded_output_tfrecords( 29 | tf_record_close_stack, 30 | os.path.join(tf.test.get_temp_dir(), 'test.tfrec'), 10) 31 | for idx in range(10): 32 | output_tfrecords[idx].write('test_{}'.format(idx)) 33 | 34 | for idx in range(10): 35 | tf_record_path = '{}-{:05d}-of-00010'.format( 36 | os.path.join(tf.test.get_temp_dir(), 'test.tfrec'), idx) 37 | records = list(tf.python_io.tf_record_iterator(tf_record_path)) 38 | self.assertAllEqual(records, ['test_{}'.format(idx)]) 39 | 40 | 41 | if __name__ == '__main__': 42 | tf.test.main() 43 | -------------------------------------------------------------------------------- /object_detection/dockerfiles/android/README.md: -------------------------------------------------------------------------------- 1 | # Dockerfile for the TPU and TensorFlow Lite Object Detection tutorial 2 | 3 | This Docker image automates the setup involved with training 4 | object detection models on Google Cloud and building the Android TensorFlow Lite 5 | demo app. 
We recommend using this container if you decide to work through our 6 | tutorial on ["Training and serving a real-time mobile object detector in 7 | 30 minutes with Cloud TPUs"](https://medium.com/tensorflow/training-and-serving-a-realtime-mobile-object-detector-in-30-minutes-with-cloud-tpus-b78971cf1193), though of course it may be useful even if you would 8 | like to use the Object Detection API outside the context of the tutorial. 9 | 10 | A couple words of warning: 11 | 12 | 1. Docker containers do not have persistent storage. This means that any changes 13 | you make to files inside the container will not persist if you restart 14 | the container. When running through the tutorial, 15 | **do not close the container**. 16 | 2. To be able to deploy the [Android app]( 17 | https://github.com/tensorflow/tensorflow/tree/master/tensorflow/contrib/lite/examples/android/app) 18 | (which you will build at the end of the tutorial), 19 | you will need to kill any instances of `adb` running on the host machine. You 20 | can accomplish this by closing all instances of Android Studio, and then 21 | running `adb kill-server`. 22 | 23 | You can install Docker by following the [instructions here]( 24 | https://docs.docker.com/install/). 25 | 26 | ## Running The Container 27 | 28 | From this directory, build the Dockerfile as follows (this takes a while): 29 | 30 | ``` 31 | docker build --tag detect-tf . 32 | ``` 33 | 34 | Run the container: 35 | 36 | ``` 37 | docker run --rm -it --privileged -p 6006:6006 detect-tf 38 | ``` 39 | 40 | When running the container, you will find yourself inside the `/tensorflow` 41 | directory, which is the path to the TensorFlow [source 42 | tree](https://github.com/tensorflow/tensorflow). 43 | 44 | ## Text Editing 45 | 46 | The tutorial also 47 | requires you to occasionally edit files inside the source tree. 48 | This Docker image comes with `vim`, `nano`, and `emacs` preinstalled for your 49 | convenience. 50 | 51 | ## What's In This Container 52 | 53 | This container is derived from the nightly build of TensorFlow, and contains the 54 | sources for TensorFlow at `/tensorflow`, as well as the 55 | [TensorFlow Models](https://github.com/tensorflow/models) which are available at 56 | `/tensorflow/models` (and contain the Object Detection API as a subdirectory 57 | at `/tensorflow/models/research/object_detection`). 58 | The Oxford-IIIT Pets dataset, the COCO pre-trained SSD + MobileNet (v1) 59 | checkpoint, and an example 60 | trained model are all available in `/tmp` in their respective folders. 61 | 62 | This container also has the `gsutil` and `gcloud` utilities, the `bazel` build 63 | tool, and all dependencies necessary to use the Object Detection API, and 64 | compile and install the TensorFlow Lite Android demo app. 65 | 66 | At various points throughout the tutorial, you may see references to the 67 | *research directory*. This refers to the `research` folder within the 68 | models repository, located at 69 | `/tensorflow/models/research`. 70 | -------------------------------------------------------------------------------- /object_detection/export_inference_graph.py: -------------------------------------------------------------------------------- 1 | import tensorflow as tf 2 | from google.protobuf import text_format 3 | from object_detection import exporter 4 | from object_detection.protos import pipeline_pb2 5 | 6 | slim = tf.contrib.slim 7 | flags = tf.app.flags 8 | 9 | flags.DEFINE_string('input_type', 'image_tensor', 'Type of input node. 
Can be ' 10 | 'one of [`image_tensor`, `encoded_image_string_tensor`, ' 11 | '`tf_example`]') 12 | flags.DEFINE_string('input_shape', None, 13 | 'If input_type is `image_tensor`, this can explicitly set ' 14 | 'the shape of this input tensor to a fixed size. The ' 15 | 'dimensions are to be provided as a comma-separated list ' 16 | 'of integers. A value of -1 can be used for unknown ' 17 | 'dimensions. If not specified, for an `image_tensor, the ' 18 | 'default shape will be partially specified as ' 19 | '`[None, None, None, 3]`.') 20 | flags.DEFINE_string('pipeline_config_path', None, 21 | 'Path to a pipeline_pb2.TrainEvalPipelineConfig config ' 22 | 'file.') 23 | flags.DEFINE_string('trained_checkpoint_prefix', None, 24 | 'Path to trained checkpoint, typically of the form ' 25 | 'path/to/model.ckpt') 26 | flags.DEFINE_string('output_directory', None, 'Path to write outputs.') 27 | flags.DEFINE_string('config_override', '', 28 | 'pipeline_pb2.TrainEvalPipelineConfig ' 29 | 'text proto to override pipeline_config_path.') 30 | flags.DEFINE_boolean('write_inference_graph', False, 31 | 'If true, writes inference graph to disk.') 32 | tf.app.flags.mark_flag_as_required('pipeline_config_path') 33 | tf.app.flags.mark_flag_as_required('trained_checkpoint_prefix') 34 | tf.app.flags.mark_flag_as_required('output_directory') 35 | FLAGS = flags.FLAGS 36 | 37 | 38 | def main(_): 39 | pipeline_config = pipeline_pb2.TrainEvalPipelineConfig() 40 | with tf.gfile.GFile(FLAGS.pipeline_config_path, 'r') as f: 41 | text_format.Merge(f.read(), pipeline_config) 42 | text_format.Merge(FLAGS.config_override, pipeline_config) 43 | if FLAGS.input_shape: 44 | input_shape = [ 45 | int(dim) if dim != '-1' else None 46 | for dim in FLAGS.input_shape.split(',') 47 | ] 48 | else: 49 | input_shape = None 50 | exporter.export_inference_graph( 51 | FLAGS.input_type, pipeline_config, FLAGS.trained_checkpoint_prefix, 52 | FLAGS.output_directory, input_shape=input_shape, 53 | write_inference_graph=FLAGS.write_inference_graph) 54 | 55 | 56 | if __name__ == '__main__': 57 | tf.app.run() 58 | -------------------------------------------------------------------------------- /object_detection/export_inference_graph.sh: -------------------------------------------------------------------------------- 1 | python export_inference_graph.py --input_type image_tensor --pipeline_config_path=/path/to/ssd_inception_v2.config --trained_checkpoint_prefix=/path/to/model.ckpt --output_directory=/path/to/exported_model_directory -------------------------------------------------------------------------------- /object_detection/inference/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/inference/__init__.py -------------------------------------------------------------------------------- /object_detection/legacy/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/legacy/__init__.py -------------------------------------------------------------------------------- /object_detection/matchers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/matchers/__init__.py 
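A minimal sketch of how the graph produced by export_inference_graph.py / export_inference_graph.sh above is typically consumed (this snippet is not part of the repository; it assumes the default tensor names that exporter.py attaches for `image_tensor` inputs, and the frozen-graph path below is a placeholder):

import numpy as np
import tensorflow as tf

# Placeholder path: the exporter writes frozen_inference_graph.pb into the
# --output_directory passed on the command line.
GRAPH_PATH = '/path/to/exported_model_directory/frozen_inference_graph.pb'

# Load the serialized GraphDef and import it into a fresh graph.
graph_def = tf.GraphDef()
with tf.gfile.GFile(GRAPH_PATH, 'rb') as fid:
  graph_def.ParseFromString(fid.read())

with tf.Graph().as_default() as graph:
  tf.import_graph_def(graph_def, name='')

with tf.Session(graph=graph) as sess:
  # Dummy uint8 batch of one 300x300 RGB image; replace with real image data.
  image = np.zeros((1, 300, 300, 3), dtype=np.uint8)
  boxes, scores, classes, num = sess.run(
      [graph.get_tensor_by_name('detection_boxes:0'),
       graph.get_tensor_by_name('detection_scores:0'),
       graph.get_tensor_by_name('detection_classes:0'),
       graph.get_tensor_by_name('num_detections:0')],
      feed_dict={graph.get_tensor_by_name('image_tensor:0'): image})
  print('num detections:', int(num[0]))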
-------------------------------------------------------------------------------- /object_detection/matchers/bipartite_matcher.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """Bipartite matcher implementation.""" 17 | 18 | import tensorflow as tf 19 | 20 | from tensorflow.contrib.image.python.ops import image_ops 21 | from object_detection.core import matcher 22 | 23 | 24 | class GreedyBipartiteMatcher(matcher.Matcher): 25 | """Wraps a Tensorflow greedy bipartite matcher.""" 26 | 27 | def __init__(self, use_matmul_gather=False): 28 | """Constructs a Matcher. 29 | 30 | Args: 31 | use_matmul_gather: Force constructed match objects to use matrix 32 | multiplication based gather instead of standard tf.gather. 33 | (Default: False). 34 | """ 35 | super(GreedyBipartiteMatcher, self).__init__( 36 | use_matmul_gather=use_matmul_gather) 37 | 38 | def _match(self, similarity_matrix, num_valid_rows=-1): 39 | """Bipartite matches a collection rows and columns. A greedy bi-partite. 40 | 41 | TODO(rathodv): Add num_valid_columns options to match only that many columns 42 | with all the rows. 43 | 44 | Args: 45 | similarity_matrix: Float tensor of shape [N, M] with pairwise similarity 46 | where higher values mean more similar. 47 | num_valid_rows: A scalar or a 1-D tensor with one element describing the 48 | number of valid rows of similarity_matrix to consider for the bipartite 49 | matching. If set to be negative, then all rows from similarity_matrix 50 | are used. 51 | 52 | Returns: 53 | match_results: int32 tensor of shape [M] with match_results[i]=-1 54 | meaning that column i is not matched and otherwise that it is matched to 55 | row match_results[i]. 56 | """ 57 | # Convert similarity matrix to distance matrix as tf.image.bipartite tries 58 | # to find minimum distance matches. 59 | distance_matrix = -1 * similarity_matrix 60 | _, match_results = image_ops.bipartite_match( 61 | distance_matrix, num_valid_rows) 62 | match_results = tf.reshape(match_results, [-1]) 63 | match_results = tf.cast(match_results, tf.int32) 64 | return match_results 65 | -------------------------------------------------------------------------------- /object_detection/matchers/bipartite_matcher_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 
5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """Tests for object_detection.core.bipartite_matcher.""" 17 | 18 | import tensorflow as tf 19 | 20 | from object_detection.matchers import bipartite_matcher 21 | 22 | 23 | class GreedyBipartiteMatcherTest(tf.test.TestCase): 24 | 25 | def test_get_expected_matches_when_all_rows_are_valid(self): 26 | similarity_matrix = tf.constant([[0.50, 0.1, 0.8], [0.15, 0.2, 0.3]]) 27 | num_valid_rows = 2 28 | expected_match_results = [-1, 1, 0] 29 | 30 | matcher = bipartite_matcher.GreedyBipartiteMatcher() 31 | match = matcher.match(similarity_matrix, num_valid_rows=num_valid_rows) 32 | with self.test_session() as sess: 33 | match_results_out = sess.run(match._match_results) 34 | self.assertAllEqual(match_results_out, expected_match_results) 35 | 36 | def test_get_expected_matches_with_valid_rows_set_to_minus_one(self): 37 | similarity_matrix = tf.constant([[0.50, 0.1, 0.8], [0.15, 0.2, 0.3]]) 38 | num_valid_rows = -1 39 | expected_match_results = [-1, 1, 0] 40 | 41 | matcher = bipartite_matcher.GreedyBipartiteMatcher() 42 | match = matcher.match(similarity_matrix, num_valid_rows=num_valid_rows) 43 | with self.test_session() as sess: 44 | match_results_out = sess.run(match._match_results) 45 | self.assertAllEqual(match_results_out, expected_match_results) 46 | 47 | def test_get_no_matches_with_zero_valid_rows(self): 48 | similarity_matrix = tf.constant([[0.50, 0.1, 0.8], [0.15, 0.2, 0.3]]) 49 | num_valid_rows = 0 50 | expected_match_results = [-1, -1, -1] 51 | 52 | matcher = bipartite_matcher.GreedyBipartiteMatcher() 53 | match = matcher.match(similarity_matrix, num_valid_rows=num_valid_rows) 54 | with self.test_session() as sess: 55 | match_results_out = sess.run(match._match_results) 56 | self.assertAllEqual(match_results_out, expected_match_results) 57 | 58 | def test_get_expected_matches_with_only_one_valid_row(self): 59 | similarity_matrix = tf.constant([[0.50, 0.1, 0.8], [0.15, 0.2, 0.3]]) 60 | num_valid_rows = 1 61 | expected_match_results = [-1, -1, 0] 62 | 63 | matcher = bipartite_matcher.GreedyBipartiteMatcher() 64 | match = matcher.match(similarity_matrix, num_valid_rows=num_valid_rows) 65 | with self.test_session() as sess: 66 | match_results_out = sess.run(match._match_results) 67 | self.assertAllEqual(match_results_out, expected_match_results) 68 | 69 | 70 | if __name__ == '__main__': 71 | tf.test.main() 72 | -------------------------------------------------------------------------------- /object_detection/meta_architectures/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/meta_architectures/__init__.py -------------------------------------------------------------------------------- /object_detection/meta_architectures/rfcn_meta_arch_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 
2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """Tests for object_detection.meta_architectures.rfcn_meta_arch.""" 17 | 18 | import tensorflow as tf 19 | 20 | from object_detection.meta_architectures import faster_rcnn_meta_arch_test_lib 21 | from object_detection.meta_architectures import rfcn_meta_arch 22 | 23 | 24 | class RFCNMetaArchTest( 25 | faster_rcnn_meta_arch_test_lib.FasterRCNNMetaArchTestBase): 26 | 27 | def _get_second_stage_box_predictor_text_proto(self): 28 | box_predictor_text_proto = """ 29 | rfcn_box_predictor { 30 | conv_hyperparams { 31 | op: CONV 32 | activation: NONE 33 | regularizer { 34 | l2_regularizer { 35 | weight: 0.0005 36 | } 37 | } 38 | initializer { 39 | variance_scaling_initializer { 40 | factor: 1.0 41 | uniform: true 42 | mode: FAN_AVG 43 | } 44 | } 45 | } 46 | } 47 | """ 48 | return box_predictor_text_proto 49 | 50 | def _get_model(self, box_predictor, **common_kwargs): 51 | return rfcn_meta_arch.RFCNMetaArch( 52 | second_stage_rfcn_box_predictor=box_predictor, **common_kwargs) 53 | 54 | def _get_box_classifier_features_shape(self, 55 | image_size, 56 | batch_size, 57 | max_num_proposals, 58 | initial_crop_size, 59 | maxpool_stride, 60 | num_features): 61 | return (batch_size, image_size, image_size, num_features) 62 | 63 | 64 | if __name__ == '__main__': 65 | tf.test.main() 66 | -------------------------------------------------------------------------------- /object_detection/metrics/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/metrics/__init__.py -------------------------------------------------------------------------------- /object_detection/metrics/io_utils.py: -------------------------------------------------------------------------------- 1 | # Copyright 2018 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | """Common IO utils used in offline metric computation. 
16 | """ 17 | 18 | from __future__ import absolute_import 19 | from __future__ import division 20 | from __future__ import print_function 21 | 22 | import csv 23 | 24 | 25 | def write_csv(fid, metrics): 26 | """Writes metrics key-value pairs to CSV file. 27 | 28 | Args: 29 | fid: File identifier of an opened file. 30 | metrics: A dictionary with metrics to be written. 31 | """ 32 | metrics_writer = csv.writer(fid, delimiter=',') 33 | for metric_name, metric_value in metrics.items(): 34 | metrics_writer.writerow([metric_name, str(metric_value)]) 35 | -------------------------------------------------------------------------------- /object_detection/metrics/offline_eval_map_corloc_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | """Tests for utilities in offline_eval_map_corloc binary.""" 16 | 17 | import tensorflow as tf 18 | 19 | from object_detection.metrics import offline_eval_map_corloc as offline_eval 20 | 21 | 22 | class OfflineEvalMapCorlocTest(tf.test.TestCase): 23 | 24 | def test_generateShardedFilenames(self): 25 | test_filename = '/path/to/file' 26 | result = offline_eval._generate_sharded_filenames(test_filename) 27 | self.assertEqual(result, [test_filename]) 28 | 29 | test_filename = '/path/to/file-00000-of-00050' 30 | result = offline_eval._generate_sharded_filenames(test_filename) 31 | self.assertEqual(result, [test_filename]) 32 | 33 | result = offline_eval._generate_sharded_filenames('/path/to/@3.record') 34 | self.assertEqual(result, [ 35 | '/path/to/-00000-of-00003.record', '/path/to/-00001-of-00003.record', 36 | '/path/to/-00002-of-00003.record' 37 | ]) 38 | 39 | result = offline_eval._generate_sharded_filenames('/path/to/abc@3') 40 | self.assertEqual(result, [ 41 | '/path/to/abc-00000-of-00003', '/path/to/abc-00001-of-00003', 42 | '/path/to/abc-00002-of-00003' 43 | ]) 44 | 45 | result = offline_eval._generate_sharded_filenames('/path/to/@1') 46 | self.assertEqual(result, ['/path/to/-00000-of-00001']) 47 | 48 | def test_generateFilenames(self): 49 | test_filenames = ['/path/to/file', '/path/to/@3.record'] 50 | result = offline_eval._generate_filenames(test_filenames) 51 | self.assertEqual(result, [ 52 | '/path/to/file', '/path/to/-00000-of-00003.record', 53 | '/path/to/-00001-of-00003.record', '/path/to/-00002-of-00003.record' 54 | ]) 55 | 56 | 57 | if __name__ == '__main__': 58 | tf.test.main() 59 | -------------------------------------------------------------------------------- /object_detection/model_hparams.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 
2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | """Hyperparameters for the object detection model in TF.learn. 16 | 17 | This file consolidates and documents the hyperparameters used by the model. 18 | """ 19 | 20 | from __future__ import absolute_import 21 | from __future__ import division 22 | from __future__ import print_function 23 | 24 | import tensorflow as tf 25 | 26 | 27 | def create_hparams(hparams_overrides=None): 28 | """Returns hyperparameters, including any flag value overrides. 29 | 30 | Args: 31 | hparams_overrides: Optional hparams overrides, represented as a 32 | string containing comma-separated hparam_name=value pairs. 33 | 34 | Returns: 35 | The hyperparameters as a tf.HParams object. 36 | """ 37 | hparams = tf.contrib.training.HParams( 38 | # Whether a fine tuning checkpoint (provided in the pipeline config) 39 | # should be loaded for training. 40 | load_pretrained=True) 41 | # Override any of the preceding hyperparameter values. 42 | if hparams_overrides: 43 | hparams = hparams.parse(hparams_overrides) 44 | return hparams 45 | -------------------------------------------------------------------------------- /object_detection/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/models/__init__.py -------------------------------------------------------------------------------- /object_detection/models/ssd_mobilenet_v1_ppn_feature_extractor.py: -------------------------------------------------------------------------------- 1 | # Copyright 2018 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 
14 | # ============================================================================== 15 | 16 | """SSDFeatureExtractor for MobilenetV1 PPN features.""" 17 | 18 | import tensorflow as tf 19 | 20 | from object_detection.meta_architectures import ssd_meta_arch 21 | from object_detection.models import feature_map_generators 22 | from object_detection.utils import context_manager 23 | from object_detection.utils import ops 24 | from object_detection.utils import shape_utils 25 | from nets import mobilenet_v1 26 | 27 | slim = tf.contrib.slim 28 | 29 | 30 | class SSDMobileNetV1PpnFeatureExtractor(ssd_meta_arch.SSDFeatureExtractor): 31 | """SSD Feature Extractor using MobilenetV1 PPN features.""" 32 | 33 | def preprocess(self, resized_inputs): 34 | """SSD preprocessing. 35 | 36 | Maps pixel values to the range [-1, 1]. 37 | 38 | Args: 39 | resized_inputs: a [batch, height, width, channels] float tensor 40 | representing a batch of images. 41 | 42 | Returns: 43 | preprocessed_inputs: a [batch, height, width, channels] float tensor 44 | representing a batch of images. 45 | """ 46 | return (2.0 / 255.0) * resized_inputs - 1.0 47 | 48 | def extract_features(self, preprocessed_inputs): 49 | """Extract features from preprocessed inputs. 50 | 51 | Args: 52 | preprocessed_inputs: a [batch, height, width, channels] float tensor 53 | representing a batch of images. 54 | 55 | Returns: 56 | feature_maps: a list of tensors where the ith tensor has shape 57 | [batch, height_i, width_i, depth_i] 58 | """ 59 | preprocessed_inputs = shape_utils.check_min_image_dim( 60 | 33, preprocessed_inputs) 61 | 62 | with tf.variable_scope('MobilenetV1', 63 | reuse=self._reuse_weights) as scope: 64 | with slim.arg_scope( 65 | mobilenet_v1.mobilenet_v1_arg_scope( 66 | is_training=None, regularize_depthwise=True)): 67 | with (slim.arg_scope(self._conv_hyperparams_fn()) 68 | if self._override_base_feature_extractor_hyperparams 69 | else context_manager.IdentityContextManager()): 70 | _, image_features = mobilenet_v1.mobilenet_v1_base( 71 | ops.pad_to_multiple(preprocessed_inputs, self._pad_to_multiple), 72 | final_endpoint='Conv2d_13_pointwise', 73 | min_depth=self._min_depth, 74 | depth_multiplier=self._depth_multiplier, 75 | use_explicit_padding=self._use_explicit_padding, 76 | scope=scope) 77 | with slim.arg_scope(self._conv_hyperparams_fn()): 78 | feature_maps = feature_map_generators.pooling_pyramid_feature_maps( 79 | base_feature_map_depth=0, 80 | num_layers=6, 81 | image_features={ 82 | 'image_features': image_features['Conv2d_11_pointwise'] 83 | }) 84 | return feature_maps.values() 85 | -------------------------------------------------------------------------------- /object_detection/models/ssd_resnet_v1_fpn_feature_extractor_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 
14 | # ============================================================================== 15 | """Tests for ssd resnet v1 FPN feature extractors.""" 16 | import tensorflow as tf 17 | 18 | from object_detection.models import ssd_resnet_v1_fpn_feature_extractor 19 | from object_detection.models import ssd_resnet_v1_fpn_feature_extractor_testbase 20 | 21 | 22 | class SSDResnet50V1FeatureExtractorTest( 23 | ssd_resnet_v1_fpn_feature_extractor_testbase. 24 | SSDResnetFPNFeatureExtractorTestBase): 25 | """SSDResnet50v1Fpn feature extractor test.""" 26 | 27 | def _create_feature_extractor(self, depth_multiplier, pad_to_multiple, 28 | use_explicit_padding=False): 29 | min_depth = 32 30 | is_training = True 31 | return ssd_resnet_v1_fpn_feature_extractor.SSDResnet50V1FpnFeatureExtractor( 32 | is_training, depth_multiplier, min_depth, pad_to_multiple, 33 | self.conv_hyperparams_fn, use_explicit_padding=use_explicit_padding) 34 | 35 | def _resnet_scope_name(self): 36 | return 'resnet_v1_50' 37 | 38 | 39 | class SSDResnet101V1FeatureExtractorTest( 40 | ssd_resnet_v1_fpn_feature_extractor_testbase. 41 | SSDResnetFPNFeatureExtractorTestBase): 42 | """SSDResnet101v1Fpn feature extractor test.""" 43 | 44 | def _create_feature_extractor(self, depth_multiplier, pad_to_multiple, 45 | use_explicit_padding=False): 46 | min_depth = 32 47 | is_training = True 48 | return ( 49 | ssd_resnet_v1_fpn_feature_extractor.SSDResnet101V1FpnFeatureExtractor( 50 | is_training, 51 | depth_multiplier, 52 | min_depth, 53 | pad_to_multiple, 54 | self.conv_hyperparams_fn, 55 | use_explicit_padding=use_explicit_padding)) 56 | 57 | def _resnet_scope_name(self): 58 | return 'resnet_v1_101' 59 | 60 | 61 | class SSDResnet152V1FeatureExtractorTest( 62 | ssd_resnet_v1_fpn_feature_extractor_testbase. 63 | SSDResnetFPNFeatureExtractorTestBase): 64 | """SSDResnet152v1Fpn feature extractor test.""" 65 | 66 | def _create_feature_extractor(self, depth_multiplier, pad_to_multiple, 67 | use_explicit_padding=False): 68 | min_depth = 32 69 | is_training = True 70 | return ( 71 | ssd_resnet_v1_fpn_feature_extractor.SSDResnet152V1FpnFeatureExtractor( 72 | is_training, 73 | depth_multiplier, 74 | min_depth, 75 | pad_to_multiple, 76 | self.conv_hyperparams_fn, 77 | use_explicit_padding=use_explicit_padding)) 78 | 79 | def _resnet_scope_name(self): 80 | return 'resnet_v1_152' 81 | 82 | 83 | if __name__ == '__main__': 84 | tf.test.main() 85 | -------------------------------------------------------------------------------- /object_detection/models/ssd_resnet_v1_ppn_feature_extractor_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2018 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 
14 | # ============================================================================== 15 | """Tests for ssd resnet v1 feature extractors.""" 16 | import tensorflow as tf 17 | 18 | from object_detection.models import ssd_resnet_v1_ppn_feature_extractor 19 | from object_detection.models import ssd_resnet_v1_ppn_feature_extractor_testbase 20 | 21 | 22 | class SSDResnet50V1PpnFeatureExtractorTest( 23 | ssd_resnet_v1_ppn_feature_extractor_testbase. 24 | SSDResnetPpnFeatureExtractorTestBase): 25 | """SSDResnet50v1 feature extractor test.""" 26 | 27 | def _create_feature_extractor(self, depth_multiplier, pad_to_multiple, 28 | use_explicit_padding=False): 29 | min_depth = 32 30 | is_training = True 31 | return ssd_resnet_v1_ppn_feature_extractor.SSDResnet50V1PpnFeatureExtractor( 32 | is_training, 33 | depth_multiplier, 34 | min_depth, 35 | pad_to_multiple, 36 | self.conv_hyperparams_fn, 37 | use_explicit_padding=use_explicit_padding) 38 | 39 | def _scope_name(self): 40 | return 'resnet_v1_50' 41 | 42 | 43 | class SSDResnet101V1PpnFeatureExtractorTest( 44 | ssd_resnet_v1_ppn_feature_extractor_testbase. 45 | SSDResnetPpnFeatureExtractorTestBase): 46 | """SSDResnet101v1 feature extractor test.""" 47 | 48 | def _create_feature_extractor(self, depth_multiplier, pad_to_multiple, 49 | use_explicit_padding=False): 50 | min_depth = 32 51 | is_training = True 52 | return ( 53 | ssd_resnet_v1_ppn_feature_extractor.SSDResnet101V1PpnFeatureExtractor( 54 | is_training, 55 | depth_multiplier, 56 | min_depth, 57 | pad_to_multiple, 58 | self.conv_hyperparams_fn, 59 | use_explicit_padding=use_explicit_padding)) 60 | 61 | def _scope_name(self): 62 | return 'resnet_v1_101' 63 | 64 | 65 | class SSDResnet152V1PpnFeatureExtractorTest( 66 | ssd_resnet_v1_ppn_feature_extractor_testbase. 67 | SSDResnetPpnFeatureExtractorTestBase): 68 | """SSDResnet152v1 feature extractor test.""" 69 | 70 | def _create_feature_extractor(self, depth_multiplier, pad_to_multiple, 71 | use_explicit_padding=False): 72 | min_depth = 32 73 | is_training = True 74 | return ( 75 | ssd_resnet_v1_ppn_feature_extractor.SSDResnet152V1PpnFeatureExtractor( 76 | is_training, 77 | depth_multiplier, 78 | min_depth, 79 | pad_to_multiple, 80 | self.conv_hyperparams_fn, 81 | use_explicit_padding=use_explicit_padding)) 82 | 83 | def _scope_name(self): 84 | return 'resnet_v1_152' 85 | 86 | 87 | if __name__ == '__main__': 88 | tf.test.main() 89 | -------------------------------------------------------------------------------- /object_detection/models/ssd_resnet_v1_ppn_feature_extractor_testbase.py: -------------------------------------------------------------------------------- 1 | # Copyright 2018 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 
14 | # ============================================================================== 15 | """Tests for ssd resnet v1 feature extractors.""" 16 | import abc 17 | import numpy as np 18 | 19 | from object_detection.models import ssd_feature_extractor_test 20 | 21 | 22 | class SSDResnetPpnFeatureExtractorTestBase( 23 | ssd_feature_extractor_test.SsdFeatureExtractorTestBase): 24 | """Helper test class for SSD Resnet PPN feature extractors.""" 25 | 26 | @abc.abstractmethod 27 | def _scope_name(self): 28 | pass 29 | 30 | def test_extract_features_returns_correct_shapes_289(self): 31 | image_height = 289 32 | image_width = 289 33 | depth_multiplier = 1.0 34 | pad_to_multiple = 1 35 | expected_feature_map_shape = [(2, 19, 19, 1024), (2, 10, 10, 1024), 36 | (2, 5, 5, 1024), (2, 3, 3, 1024), 37 | (2, 2, 2, 1024), (2, 1, 1, 1024)] 38 | self.check_extract_features_returns_correct_shape( 39 | 2, image_height, image_width, depth_multiplier, pad_to_multiple, 40 | expected_feature_map_shape) 41 | 42 | def test_extract_features_returns_correct_shapes_with_dynamic_inputs(self): 43 | image_height = 289 44 | image_width = 289 45 | depth_multiplier = 1.0 46 | pad_to_multiple = 1 47 | expected_feature_map_shape = [(2, 19, 19, 1024), (2, 10, 10, 1024), 48 | (2, 5, 5, 1024), (2, 3, 3, 1024), 49 | (2, 2, 2, 1024), (2, 1, 1, 1024)] 50 | self.check_extract_features_returns_correct_shapes_with_dynamic_inputs( 51 | 2, image_height, image_width, depth_multiplier, pad_to_multiple, 52 | expected_feature_map_shape) 53 | 54 | def test_extract_features_raises_error_with_invalid_image_size(self): 55 | image_height = 32 56 | image_width = 32 57 | depth_multiplier = 1.0 58 | pad_to_multiple = 1 59 | self.check_extract_features_raises_error_with_invalid_image_size( 60 | image_height, image_width, depth_multiplier, pad_to_multiple) 61 | 62 | def test_preprocess_returns_correct_value_range(self): 63 | image_height = 128 64 | image_width = 128 65 | depth_multiplier = 1 66 | pad_to_multiple = 1 67 | test_image = np.random.rand(4, image_height, image_width, 3) 68 | feature_extractor = self._create_feature_extractor(depth_multiplier, 69 | pad_to_multiple) 70 | preprocessed_image = feature_extractor.preprocess(test_image) 71 | self.assertAllClose(preprocessed_image, 72 | test_image - [[123.68, 116.779, 103.939]]) 73 | 74 | def test_variables_only_created_in_scope(self): 75 | depth_multiplier = 1 76 | pad_to_multiple = 1 77 | self.check_feature_extractor_variables_under_scope( 78 | depth_multiplier, pad_to_multiple, self._scope_name()) 79 | -------------------------------------------------------------------------------- /object_detection/predictors/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/predictors/__init__.py -------------------------------------------------------------------------------- /object_detection/predictors/heads/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/predictors/heads/__init__.py -------------------------------------------------------------------------------- /object_detection/predictors/heads/head.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 
2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | """Base head class. 17 | 18 | All the different kinds of prediction heads in different models will inherit 19 | from this class. What is in common between all head classes is that they have a 20 | `predict` function that receives `features` as its first argument. 21 | 22 | How to add a new prediction head to an existing meta architecture? 23 | For example, how can we add a `3d shape` prediction head to Mask RCNN? 24 | 25 | We have to take the following steps to add a new prediction head to an 26 | existing meta arch: 27 | (a) Add a class for predicting the head. This class should inherit from the 28 | `Head` class below and have a `predict` function that receives the features 29 | and predicts the output. The output is always a tf.float32 tensor. 30 | (b) Add the head to the meta architecture. For example in case of Mask RCNN, 31 | go to box_predictor_builder and put in the logic for adding the new head to the 32 | Mask RCNN box predictor. 33 | (c) Add the logic for computing the loss for the new head. 34 | (d) Add the necessary metrics for the new head. 35 | (e) (optional) Add visualization for the new head. 36 | """ 37 | from abc import abstractmethod 38 | 39 | 40 | class Head(object): 41 | """Mask RCNN head base class.""" 42 | 43 | def __init__(self): 44 | """Constructor.""" 45 | pass 46 | 47 | @abstractmethod 48 | def predict(self, features, num_predictions_per_location): 49 | """Returns the head's predictions. 50 | 51 | Args: 52 | features: A float tensor of features. 53 | num_predictions_per_location: Int containing number of predictions per 54 | location. 55 | 56 | Returns: 57 | A tf.float32 tensor. 58 | """ 59 | pass 60 | -------------------------------------------------------------------------------- /object_detection/predictors/heads/keypoint_head_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 
14 | # ============================================================================== 15 | 16 | """Tests for object_detection.predictors.heads.keypoint_head.""" 17 | import tensorflow as tf 18 | 19 | from google.protobuf import text_format 20 | from object_detection.builders import hyperparams_builder 21 | from object_detection.predictors.heads import keypoint_head 22 | from object_detection.protos import hyperparams_pb2 23 | from object_detection.utils import test_case 24 | 25 | 26 | class MaskRCNNKeypointHeadTest(test_case.TestCase): 27 | 28 | def _build_arg_scope_with_hyperparams(self, 29 | op_type=hyperparams_pb2.Hyperparams.FC): 30 | hyperparams = hyperparams_pb2.Hyperparams() 31 | hyperparams_text_proto = """ 32 | activation: NONE 33 | regularizer { 34 | l2_regularizer { 35 | } 36 | } 37 | initializer { 38 | truncated_normal_initializer { 39 | } 40 | } 41 | """ 42 | text_format.Merge(hyperparams_text_proto, hyperparams) 43 | hyperparams.op = op_type 44 | return hyperparams_builder.build(hyperparams, is_training=True) 45 | 46 | def test_prediction_size(self): 47 | keypoint_prediction_head = keypoint_head.MaskRCNNKeypointHead( 48 | conv_hyperparams_fn=self._build_arg_scope_with_hyperparams()) 49 | roi_pooled_features = tf.random_uniform( 50 | [64, 14, 14, 1024], minval=-2.0, maxval=2.0, dtype=tf.float32) 51 | prediction = keypoint_prediction_head.predict( 52 | features=roi_pooled_features, num_predictions_per_location=1) 53 | self.assertAllEqual([64, 1, 17, 56, 56], prediction.get_shape().as_list()) 54 | 55 | 56 | if __name__ == '__main__': 57 | tf.test.main() 58 | -------------------------------------------------------------------------------- /object_detection/predictors/rfcn_box_predictor_test.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 
14 | # ============================================================================== 15 | 16 | """Tests for object_detection.predictors.rfcn_box_predictor.""" 17 | import numpy as np 18 | import tensorflow as tf 19 | 20 | from google.protobuf import text_format 21 | from object_detection.builders import hyperparams_builder 22 | from object_detection.predictors import rfcn_box_predictor as box_predictor 23 | from object_detection.protos import hyperparams_pb2 24 | from object_detection.utils import test_case 25 | 26 | 27 | class RfcnBoxPredictorTest(test_case.TestCase): 28 | 29 | def _build_arg_scope_with_conv_hyperparams(self): 30 | conv_hyperparams = hyperparams_pb2.Hyperparams() 31 | conv_hyperparams_text_proto = """ 32 | regularizer { 33 | l2_regularizer { 34 | } 35 | } 36 | initializer { 37 | truncated_normal_initializer { 38 | } 39 | } 40 | """ 41 | text_format.Merge(conv_hyperparams_text_proto, conv_hyperparams) 42 | return hyperparams_builder.build(conv_hyperparams, is_training=True) 43 | 44 | def test_get_correct_box_encoding_and_class_prediction_shapes(self): 45 | 46 | def graph_fn(image_features, proposal_boxes): 47 | rfcn_box_predictor = box_predictor.RfcnBoxPredictor( 48 | is_training=False, 49 | num_classes=2, 50 | conv_hyperparams_fn=self._build_arg_scope_with_conv_hyperparams(), 51 | num_spatial_bins=[3, 3], 52 | depth=4, 53 | crop_size=[12, 12], 54 | box_code_size=4 55 | ) 56 | box_predictions = rfcn_box_predictor.predict( 57 | [image_features], num_predictions_per_location=[1], 58 | scope='BoxPredictor', 59 | proposal_boxes=proposal_boxes) 60 | box_encodings = tf.concat( 61 | box_predictions[box_predictor.BOX_ENCODINGS], axis=1) 62 | class_predictions_with_background = tf.concat( 63 | box_predictions[box_predictor.CLASS_PREDICTIONS_WITH_BACKGROUND], 64 | axis=1) 65 | return (box_encodings, class_predictions_with_background) 66 | 67 | image_features = np.random.rand(4, 8, 8, 64).astype(np.float32) 68 | proposal_boxes = np.random.rand(4, 2, 4).astype(np.float32) 69 | (box_encodings, class_predictions_with_background) = self.execute( 70 | graph_fn, [image_features, proposal_boxes]) 71 | 72 | self.assertAllEqual(box_encodings.shape, [8, 1, 2, 4]) 73 | self.assertAllEqual(class_predictions_with_background.shape, [8, 1, 3]) 74 | 75 | 76 | if __name__ == '__main__': 77 | tf.test.main() 78 | -------------------------------------------------------------------------------- /object_detection/protos/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Eric3911/Mini-SSD/6fb6e1bce3ab6e4adb832b37e78325803c7424b6/object_detection/protos/__init__.py -------------------------------------------------------------------------------- /object_detection/protos/anchor_generator.proto: -------------------------------------------------------------------------------- 1 | syntax = "proto2"; 2 | 3 | package object_detection.protos; 4 | 5 | import "object_detection/protos/grid_anchor_generator.proto"; 6 | import "object_detection/protos/ssd_anchor_generator.proto"; 7 | import "object_detection/protos/multiscale_anchor_generator.proto"; 8 | 9 | // Configuration proto for the anchor generator to use in the object detection 10 | // pipeline. See core/anchor_generator.py for details. 
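// Example (illustrative sketch, assuming the field names defined in
// ssd_anchor_generator.proto): a text-format pipeline config populates exactly
// one branch of the oneof below, e.g.
//
//   anchor_generator {
//     ssd_anchor_generator {
//       num_layers: 6
//       min_scale: 0.2
//       max_scale: 0.95
//       aspect_ratios: 1.0
//       aspect_ratios: 2.0
//       aspect_ratios: 0.5
//     }
//   }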
11 | message AnchorGenerator { 12 | oneof anchor_generator_oneof { 13 | GridAnchorGenerator grid_anchor_generator = 1; 14 | SsdAnchorGenerator ssd_anchor_generator = 2; 15 | MultiscaleAnchorGenerator multiscale_anchor_generator = 3; 16 | } 17 | } 18 | -------------------------------------------------------------------------------- /object_detection/protos/argmax_matcher.proto: -------------------------------------------------------------------------------- 1 | syntax = "proto2"; 2 | 3 | package object_detection.protos; 4 | 5 | // Configuration proto for ArgMaxMatcher. See 6 | // matchers/argmax_matcher.py for details. 7 | message ArgMaxMatcher { 8 | // Threshold for positive matches. 9 | optional float matched_threshold = 1 [default = 0.5]; 10 | 11 | // Threshold for negative matches. 12 | optional float unmatched_threshold = 2 [default = 0.5]; 13 | 14 | // Whether to construct ArgMaxMatcher without thresholds. 15 | optional bool ignore_thresholds = 3 [default = false]; 16 | 17 | // If True, then negative matches are the ones below the unmatched_threshold, 18 | // whereas ignored matches are in between the matched and unmatched 19 | // threshold. If False, then negative matches are in between the matched 20 | // and unmatched threshold, and everything lower than unmatched is ignored. 21 | optional bool negatives_lower_than_unmatched = 4 [default = true]; 22 | 23 | // Whether to ensure each row is matched to at least one column. 24 | optional bool force_match_for_each_row = 5 [default = false]; 25 | 26 | // Force constructed match objects to use matrix multiplication based gather 27 | // instead of standard tf.gather. 28 | optional bool use_matmul_gather = 6 [default = false]; 29 | } 30 | -------------------------------------------------------------------------------- /object_detection/protos/bipartite_matcher.proto: -------------------------------------------------------------------------------- 1 | syntax = "proto2"; 2 | 3 | package object_detection.protos; 4 | 5 | // Configuration proto for bipartite matcher. See 6 | // matchers/bipartite_matcher.py for details. 7 | message BipartiteMatcher { 8 | // Force constructed match objects to use matrix multiplication based gather 9 | // instead of standard tf.gather. 10 | optional bool use_matmul_gather = 6 [default = false]; 11 | } 12 | -------------------------------------------------------------------------------- /object_detection/protos/bipartite_matcher_pb2.py: -------------------------------------------------------------------------------- 1 | # Generated by the protocol buffer compiler. DO NOT EDIT!
2 | # source: object_detection/protos/bipartite_matcher.proto 3 | 4 | import sys 5 | _b=sys.version_info[0]<3 and (lambda x:x) or (lambda x:x.encode('latin1')) 6 | from google.protobuf import descriptor as _descriptor 7 | from google.protobuf import message as _message 8 | from google.protobuf import reflection as _reflection 9 | from google.protobuf import symbol_database as _symbol_database 10 | from google.protobuf import descriptor_pb2 11 | # @@protoc_insertion_point(imports) 12 | 13 | _sym_db = _symbol_database.Default() 14 | 15 | 16 | 17 | 18 | DESCRIPTOR = _descriptor.FileDescriptor( 19 | name='object_detection/protos/bipartite_matcher.proto', 20 | package='object_detection.protos', 21 | syntax='proto2', 22 | serialized_pb=_b('\n/object_detection/protos/bipartite_matcher.proto\x12\x17object_detection.protos\"4\n\x10\x42ipartiteMatcher\x12 \n\x11use_matmul_gather\x18\x06 \x01(\x08:\x05\x66\x61lse') 23 | ) 24 | 25 | 26 | 27 | 28 | _BIPARTITEMATCHER = _descriptor.Descriptor( 29 | name='BipartiteMatcher', 30 | full_name='object_detection.protos.BipartiteMatcher', 31 | filename=None, 32 | file=DESCRIPTOR, 33 | containing_type=None, 34 | fields=[ 35 | _descriptor.FieldDescriptor( 36 | name='use_matmul_gather', full_name='object_detection.protos.BipartiteMatcher.use_matmul_gather', index=0, 37 | number=6, type=8, cpp_type=7, label=1, 38 | has_default_value=True, default_value=False, 39 | message_type=None, enum_type=None, containing_type=None, 40 | is_extension=False, extension_scope=None, 41 | options=None), 42 | ], 43 | extensions=[ 44 | ], 45 | nested_types=[], 46 | enum_types=[ 47 | ], 48 | options=None, 49 | is_extendable=False, 50 | syntax='proto2', 51 | extension_ranges=[], 52 | oneofs=[ 53 | ], 54 | serialized_start=76, 55 | serialized_end=128, 56 | ) 57 | 58 | DESCRIPTOR.message_types_by_name['BipartiteMatcher'] = _BIPARTITEMATCHER 59 | _sym_db.RegisterFileDescriptor(DESCRIPTOR) 60 | 61 | BipartiteMatcher = _reflection.GeneratedProtocolMessageType('BipartiteMatcher', (_message.Message,), dict( 62 | DESCRIPTOR = _BIPARTITEMATCHER, 63 | __module__ = 'object_detection.protos.bipartite_matcher_pb2' 64 | # @@protoc_insertion_point(class_scope:object_detection.protos.BipartiteMatcher) 65 | )) 66 | _sym_db.RegisterMessage(BipartiteMatcher) 67 | 68 | 69 | # @@protoc_insertion_point(module_scope) 70 | -------------------------------------------------------------------------------- /object_detection/protos/box_coder.proto: -------------------------------------------------------------------------------- 1 | syntax = "proto2"; 2 | 3 | package object_detection.protos; 4 | 5 | import "object_detection/protos/faster_rcnn_box_coder.proto"; 6 | import "object_detection/protos/keypoint_box_coder.proto"; 7 | import "object_detection/protos/mean_stddev_box_coder.proto"; 8 | import "object_detection/protos/square_box_coder.proto"; 9 | 10 | // Configuration proto for the box coder to be used in the object detection 11 | // pipeline. See core/box_coder.py for details. 
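// Example (illustrative sketch, assuming the scale fields defined in
// faster_rcnn_box_coder.proto): a text-format pipeline config selects exactly
// one branch of the oneof below, e.g.
//
//   box_coder {
//     faster_rcnn_box_coder {
//       y_scale: 10.0
//       x_scale: 10.0
//       height_scale: 5.0
//       width_scale: 5.0
//     }
//   }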
12 | message BoxCoder { 13 | oneof box_coder_oneof { 14 | FasterRcnnBoxCoder faster_rcnn_box_coder = 1; 15 | MeanStddevBoxCoder mean_stddev_box_coder = 2; 16 | SquareBoxCoder square_box_coder = 3; 17 | KeypointBoxCoder keypoint_box_coder = 4; 18 | } 19 | } 20 | -------------------------------------------------------------------------------- /object_detection/protos/eval.proto: -------------------------------------------------------------------------------- 1 | syntax = "proto2"; 2 | 3 | package object_detection.protos; 4 | 5 | // Message for configuring DetectionModel evaluation jobs (eval.py). 6 | message EvalConfig { 7 | // Number of visualization images to generate. 8 | optional uint32 num_visualizations = 1 [default=10]; 9 | 10 | // Number of examples to process for evaluation. 11 | optional uint32 num_examples = 2 [default=5000]; 12 | 13 | // How often to run evaluation. 14 | optional uint32 eval_interval_secs = 3 [default=300]; 15 | 16 | // Maximum number of times to run evaluation. If set to 0, will run forever. 17 | optional uint32 max_evals = 4 [default=0]; 18 | 19 | // Whether the TensorFlow graph used for evaluation should be saved to disk. 20 | optional bool save_graph = 5 [default=false]; 21 | 22 | // Path to directory to store visualizations in. If empty, visualization 23 | // images are not exported (only shown on TensorBoard). 24 | optional string visualization_export_dir = 6 [default=""]; 25 | 26 | // BNS name of the TensorFlow master. 27 | optional string eval_master = 7 [default=""]; 28 | 29 | // Type of metrics to use for evaluation. 30 | repeated string metrics_set = 8; 31 | 32 | // Path to export detections to, in COCO-compatible JSON format. 33 | optional string export_path = 9 [default='']; 34 | 35 | // Option to not read groundtruth labels and only export detections to a 36 | // COCO-compatible JSON file. 37 | optional bool ignore_groundtruth = 10 [default=false]; 38 | 39 | // Use exponential moving averages of variables for evaluation. 40 | // TODO(rathodv): When this is false, make sure the model is constructed 41 | // without moving averages in restore_fn. 42 | optional bool use_moving_averages = 11 [default=false]; 43 | 44 | // Whether to evaluate instance masks. 45 | // Note that since there is no evaluation code currently for instance 46 | // segmentation, this option is unused. 47 | optional bool eval_instance_masks = 12 [default=false]; 48 | 49 | // Minimum score threshold for a detected object box to be visualized. 50 | optional float min_score_threshold = 13 [default=0.5]; 51 | 52 | // Maximum number of detections to visualize. 53 | optional int32 max_num_boxes_to_visualize = 14 [default=20]; 54 | 55 | // When drawing a single detection, each label is by default visualized as 56 | //