├── .gitignore ├── README.md ├── data_process └── script │ └── data_preprocessing.py ├── grasp_env.yaml ├── grasp_multiObject_multiGrasp ├── data │ ├── demo │ │ ├── mask.jpg │ │ ├── pcd0100r_rgd_preprocessed_1.png │ │ ├── pcd0266r_rgd_preprocessed_1.png │ │ ├── pcd0882r_rgd_preprocessed_1.png │ │ ├── results_all_cls │ │ │ ├── pcd0100r_rgd_preprocessed_1.png │ │ │ ├── pcd0266r_rgd_preprocessed_1.png │ │ │ ├── pcd0882r_rgd_preprocessed_1.png │ │ │ ├── rgd_0000Cropped320.png │ │ │ ├── scene_0022+0028.png │ │ │ ├── scene_0036+0061.png │ │ │ ├── scene_0065+0032.png │ │ │ ├── scene_0087+0049.png │ │ │ ├── scene_0108+0036.png │ │ │ ├── scene_0129+0058.png │ │ │ ├── scene_0156+0010.png │ │ │ └── scene_0174+0092.png │ │ ├── rgd_0000Cropped320.png │ │ ├── scene_0022+0011.png │ │ ├── scene_0022+0028.png │ │ ├── scene_0036+0061.png │ │ ├── scene_0065+0032.png │ │ ├── scene_0087+0049.png │ │ ├── scene_0108+0036.png │ │ ├── scene_0129+0058.png │ │ ├── scene_0156+0010.png │ │ └── scene_0174+0092.png │ └── scripts │ │ ├── dataPreprocessingTest_fasterrcnn_split.m │ │ ├── dataPreprocessingTest_fasterrcnn_split.m.backup │ │ ├── dataPreprocessing_fasterrcnn.m │ │ ├── fetch_faster_rcnn_models.sh │ │ └── log.txt ├── experiments │ ├── cfgs │ │ ├── res101-lg.yml │ │ ├── res101.yml │ │ ├── res50.yml │ │ └── vgg16.yml │ ├── logs │ │ └── .gitignore │ └── scripts │ │ ├── convert_vgg16.sh │ │ ├── test_faster_rcnn.sh │ │ ├── train_faster_rcnn.sh │ │ └── train_faster_rcnn.sh~ ├── lib │ ├── Makefile │ ├── datasets │ │ ├── VOCdevkit-matlab-wrapper │ │ │ ├── get_voc_opts.m │ │ │ ├── voc_eval.m │ │ │ └── xVOCap.m │ │ ├── __init__.py │ │ ├── __pycache__ │ │ │ ├── __init__.cpython-36.pyc │ │ │ ├── coco.cpython-36.pyc │ │ │ ├── ds_utils.cpython-36.pyc │ │ │ ├── factory.cpython-36.pyc │ │ │ ├── graspRGB.cpython-36.pyc │ │ │ ├── imdb.cpython-36.pyc │ │ │ ├── pascal_voc.cpython-36.pyc │ │ │ └── voc_eval.cpython-36.pyc │ │ ├── coco.py │ │ ├── ds_utils.py │ │ ├── factory.py │ │ ├── graspRGB.py │ │ ├── imdb.py │ │ ├── pascal_voc.py │ │ ├── tools │ │ │ └── mcg_munge.py │ │ └── voc_eval.py │ ├── layer_utils │ │ ├── __init__.py │ │ ├── __pycache__ │ │ │ ├── __init__.cpython-36.pyc │ │ │ ├── anchor_target_layer.cpython-36.pyc │ │ │ ├── generate_anchors.cpython-36.pyc │ │ │ ├── proposal_layer.cpython-36.pyc │ │ │ ├── proposal_target_layer.cpython-36.pyc │ │ │ ├── proposal_top_layer.cpython-36.pyc │ │ │ └── snippets.cpython-36.pyc │ │ ├── anchor_target_layer.py │ │ ├── generate_anchors.py │ │ ├── proposal_layer.py │ │ ├── proposal_target_layer.py │ │ ├── proposal_top_layer.py │ │ └── snippets.py │ ├── model │ │ ├── __init__.py │ │ ├── __pycache__ │ │ │ ├── __init__.cpython-36.pyc │ │ │ ├── __init__.cpython-37.pyc │ │ │ ├── bbox_transform.cpython-36.pyc │ │ │ ├── config.cpython-36.pyc │ │ │ ├── config.cpython-37.pyc │ │ │ ├── nms_wrapper.cpython-36.pyc │ │ │ ├── test.cpython-36.pyc │ │ │ └── train_val.cpython-36.pyc │ │ ├── bbox_transform.py │ │ ├── config.py │ │ ├── nms_wrapper.py │ │ ├── test.py │ │ └── train_val.py │ ├── nets │ │ ├── __init__.py │ │ ├── __pycache__ │ │ │ ├── __init__.cpython-36.pyc │ │ │ ├── network.cpython-36.pyc │ │ │ ├── resnet_v1.cpython-36.pyc │ │ │ └── vgg16.cpython-36.pyc │ │ ├── network.py │ │ ├── resnet_v1.py │ │ └── vgg16.py │ ├── nms │ │ ├── .gitignore │ │ ├── __init__.py │ │ ├── __pycache__ │ │ │ └── __init__.cpython-36.pyc │ │ ├── cpu_nms.c │ │ ├── cpu_nms.pyx │ │ ├── gpu_nms.cpp │ │ ├── gpu_nms.hpp │ │ ├── gpu_nms.pyx │ │ ├── nms_kernel.cu │ │ └── py_cpu_nms.py │ ├── roi_data_layer │ │ ├── __init__.py │ │ 
├── __pycache__ │ │ │ ├── __init__.cpython-36.pyc │ │ │ ├── layer.cpython-36.pyc │ │ │ ├── minibatch.cpython-36.pyc │ │ │ └── roidb.cpython-36.pyc │ │ ├── layer.py │ │ ├── minibatch.py │ │ └── roidb.py │ ├── setup.py │ └── utils │ │ ├── .gitignore │ │ ├── __init__.py │ │ ├── __pycache__ │ │ ├── __init__.cpython-36.pyc │ │ ├── blob.cpython-36.pyc │ │ ├── boxes_grid.cpython-36.pyc │ │ └── timer.cpython-36.pyc │ │ ├── bbox.pyx │ │ ├── blob.py │ │ ├── boxes_grid.py │ │ ├── nms.py │ │ ├── nms.pyx │ │ └── timer.py └── tools │ ├── __pycache__ │ ├── _init_paths.cpython-36.pyc │ └── _init_paths.cpython-37.pyc │ ├── _init_paths.py │ ├── _init_paths.pyc │ ├── demo_graspRGD.py │ ├── demo_graspRGD_vis_mask.py │ ├── demo_graspRGD_vis_select.py │ ├── graspnet_config.py │ ├── mask_gen.py │ ├── predict_graspRGD.py │ ├── result │ ├── FPPI.npy │ ├── analysis.py │ ├── miss_rate.npy │ ├── total_false_positive_num.npy │ ├── total_gt_num.npy │ ├── total_missed_gt_grasp_num.npy │ └── total_proposed_num.npy │ ├── test_graspRGD.py │ └── trainval_net.py └── requirements.txt /.gitignore: -------------------------------------------------------------------------------- 1 | *.so 2 | *.pyc 3 | grasp_multiObject_multiGrasp/data/coco/ 4 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # rectangle-graspnet-multiObject-multiGrasp 2 | 3 | ### Introduction 4 | **rectangle-graspnet-multiObject-multiGrasp** is a modified version of [grasp_multiObject_multiGrasp](https://github.com/ivalab/grasp_multiObject_multiGrasp) by [fujenchu](https://github.com/fujenchu). We have made some adjustments to the original code so that it can be applied to the [graspnet](https://github.com/Fang-Haoshu/graspnetAPI) dataset. 5 | 6 | ### Acknowledgement 7 | 8 | The code in this repo is mainly based on [grasp_multiObject_multiGrasp](https://github.com/ivalab/grasp_multiObject_multiGrasp). 9 | 10 | ### Install 11 | 12 | 1. Clone the code 13 | ``` 14 | git clone https://github.com/graspnet/rectangle-graspnet-multiObject-multiGrasp 15 | cd rectangle-graspnet-multiObject-multiGrasp/grasp_multiObject_multiGrasp 16 | ``` 17 | 18 | 2. Prepare the environment (requires Anaconda or Miniconda) 19 | ``` 20 | conda env create -f grasp_env.yaml 21 | conda activate grasp 22 | ``` 23 | 24 | 3. Build the Cython modules 25 | ``` 26 | cd lib 27 | make clean 28 | make 29 | cd .. 30 | ``` 31 | 32 | 4. Install the [Python COCO API](https://github.com/cocodataset/cocoapi) 33 | ``` 34 | cd data 35 | git clone https://github.com/pdollar/coco.git 36 | cd coco/PythonAPI 37 | make 38 | cd ../../../..
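# Note (for reference): 'make' in cocoapi/PythonAPI builds pycocotools in
# place, and the four '..' levels return from data/coco/PythonAPI to the
# repository root.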
39 | ``` 40 | 41 | ### Graspnet Dataset 42 | 43 | ``` 44 | mkdir graspnet_dataset 45 | ``` 46 | 47 | Then download the graspnet dataset from `https://graspnet.net/datasets.html` 48 | 49 | - Move the dataset to [./graspnet_dataset](./graspnet_dataset) 50 | 51 | - Or link the graspnet dataset to [./graspnet_dataset](./graspnet_dataset) by 52 | 53 | ``` 54 | ln -s /path/to/graspnet ./graspnet_dataset 55 | ``` 56 | 57 | - Or modify GRASPNET_ROOT in [grasp_multiObject_multiGrasp/tools/graspnet_config.py](grasp_multiObject_multiGrasp/tools/graspnet_config.py) directly 58 | 59 | **NOTICE:** Your dataset path must match the following structure 60 | 61 | ``` 62 | graspnet_dataset 63 | |-- scenes 64 | |-- scene_0000 65 | | |-- object_id_list.txt 66 | | |-- rs_wrt_kn.npy 67 | | |-- kinect 68 | | | |-- rgb 69 | | | | |-- 0000.png to 0255.png 70 | | | `-- depth 71 | | | | |-- 0000.png to 0255.png 72 | | | `-- label 73 | | | | |-- 0000.png to 0255.png 74 | | | `-- annotations 75 | | | | |-- 0000.xml to 0255.xml 76 | | | `-- meta 77 | | | | |-- 0000.mat to 0255.mat 78 | | | `-- rect 79 | | | | |-- 0000.npy to 0255.npy 80 | | | `-- camK.npy 81 | | | `-- camera_poses.npy 82 | | | `-- cam0_wrt_table.npy 83 | | | 84 | | `-- realsense 85 | | |-- same structure as kinect 86 | | 87 | | 88 | `-- scene_0001 89 | | 90 | `-- ... ... 91 | | 92 | `-- scene_0189 93 | ``` 94 | 95 | 96 | 97 | ### Demo 98 | 99 | 1. Download the pretrained model 100 | 101 | - Download the model from [Google Drive](https://drive.google.com/file/d/1QrjLDKr8eHgN0rM48YpWXY-sN89zJNim/view?usp=sharing), [JBOX](https://jbox.sjtu.edu.cn/l/J5z6gE), or [Baidu Pan (Password: v9j7)](https://pan.baidu.com/s/19Vp8DWbpFdDQfeICVwRTew) 102 | - Move it to [grasp_multiObject_multiGrasp/output/res50/train/default/](grasp_multiObject_multiGrasp/output/res50/train/default/) 103 | 104 | 2. Run the demo 105 | 106 | ``` 107 | cd grasp_multiObject_multiGrasp/tools 108 | python demo_graspRGD.py --net res50 --dataset grasp 109 | cd ../.. 110 | ``` 111 | 112 | ### Data Preprocessing 113 | 114 | 1. Choose the camera type by changing CAMERA_NAME (line 2) in [grasp_multiObject_multiGrasp/tools/graspnet_config.py](grasp_multiObject_multiGrasp/tools/graspnet_config.py) 115 | 2. Run the data preprocessing script 116 | ``` 117 | cd data_process/script 118 | python data_preprocessing.py 119 | cd .. 120 | ``` 121 | 122 | 3. Move the processed data 123 | 124 | ``` 125 | mv grasp_data ../grasp_multiObject_multiGrasp/ 126 | cd .. 127 | ``` 128 | 129 | ### Training 130 | 131 | 1. Download the `res50` pretrained model 132 | 133 | - Download the model from [Google Drive](https://drive.google.com/file/d/1srBA9KQZJnuI59kZUZ7lGWWN6bcTzVNC/view?usp=sharing), [JBOX](https://jbox.sjtu.edu.cn/l/Vooj01), or [Baidu Pan (Password: tl84)](https://pan.baidu.com/s/1PhGBwKVd5o0Q9qNIy8AI4Q) 134 | 135 | - Move the `res50.ckpt` file to [grasp_multiObject_multiGrasp/data/imagenet_weights/](grasp_multiObject_multiGrasp/data/imagenet_weights/) 136 | 137 | 2. If you stored the pretrained demo model in [grasp_multiObject_multiGrasp/output/res50/train/default/](grasp_multiObject_multiGrasp/output/res50/train/default/) 138 | 139 | - Make sure [grasp_multiObject_multiGrasp/output/res50/train/default/](grasp_multiObject_multiGrasp/output/res50/train/default/) is empty before training 140 | 141 | - You can rename the directory.
For example: 142 | 143 | ``` 144 | mv grasp_multiObject_multiGrasp/output/res50 grasp_multiObject_multiGrasp/output/res50_pretrained 145 | ``` 146 | 147 | - Or you can move the directory [grasp_multiObject_multiGrasp/output/res50/](grasp_multiObject_multiGrasp/output/res50/) to somewhere else 148 | 149 | 3. Training 150 | ``` 151 | cd grasp_multiObject_multiGrasp 152 | ./experiments/scripts/train_faster_rcnn.sh 0 graspRGB res50 153 | ``` -------------------------------------------------------------------------------- /data_process/script/data_preprocessing.py: -------------------------------------------------------------------------------- 1 | import numpy as np 2 | import os 3 | import cv2 4 | import random 5 | import sys 6 | sys.path.append(os.path.join('..', '..', 'grasp_multiObject_multiGrasp', 'tools')) 7 | import graspnet_config 8 | 9 | if not os.path.exists(os.path.join('..', 'grasp_data')): 10 | os.mkdir(os.path.join('..', 'grasp_data')) 11 | 12 | if not os.path.exists(os.path.join('..', 'grasp_data', 'Images')): 13 | os.mkdir(os.path.join('..', 'grasp_data', 'Images')) 14 | 15 | if not os.path.exists(os.path.join('..', 'grasp_data', 'ImageSets')): 16 | os.mkdir(os.path.join('..', 'grasp_data', 'ImageSets')) 17 | 18 | if not os.path.exists(os.path.join('..', 'grasp_data', 'Annotations')): 19 | os.mkdir(os.path.join('..', 'grasp_data', 'Annotations')) 20 | 21 | # scene_name_list = os.listdir('../scenes/') # ['scene_0023', 'scene_0022', 'scene_0021', ...] 22 | # scene_name_list.sort() 23 | scene_name_list = [] 24 | for i in range(0, 100): 25 | # for i in [108, 129]: 26 | scene_name_list.append('scene_{}'.format(str(i).zfill(4))) 27 | 28 | print('************************************************') 29 | print('************************************************') 30 | print('The number of scenes is: {}'.format(len(scene_name_list))) 31 | print('************************************************') 32 | print('************************************************') 33 | 34 | train_total_number = 0 # number of images used for training in all scenes 35 | test_total_number = 0 # number of images used for testing in all scenes 36 | 37 | f_scene_skip = open('scene_skip.txt', 'a') 38 | f_image_skip = open('image_skip.txt', 'a') 39 | 40 | for scene_name in scene_name_list: 41 | scene_index = scene_name[-4:] 42 | 43 | print('------------------------------------------') 44 | print('Processing scene: {}'.format(scene_index)) 45 | try: 46 | # rgb_name_list = os.listdir('/DATA2/Benchmark/graspnet/scenes/' + scene_name + '/kinect/rgb/') 47 | rgb_name_list = os.listdir(os.path.join(graspnet_config.GRASPNET_ROOT, 'scenes', scene_name, graspnet_config.CAMERA_NAME, 'rgb')) # ['0001.png', '0002.png', ...] 
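# ----------------------------------------------------------------------
# Worked example (illustrative numbers, not taken from the dataset) of the
# rect -> annotation conversion performed below. For a grasp label with
#   center = (640, 360), open point = (690, 360), height = 40, score = 0.9
# the code computes width = 2*sqrt(50^2 + 0^2) = 100, theta = 0 degrees,
# rotation_class = round((0 + 90) / 10) + 1 = 10, and writes the line
#   "10 590.0 340.0 690.0 380.0"   (rotation_class x_min y_min x_max y_max)
# to the per-image annotation file.
# ----------------------------------------------------------------------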
48 | rgb_name_list.sort() 49 | except Exception: 50 | print('scene {} skipped'.format(scene_index)) 51 | f_scene_skip.write('{}\n'.format(scene_name)) 52 | continue 53 | 54 | # lists used to record the train/test split 55 | log_train_list = [] 56 | log_test_list = [] 57 | 58 | grasp_num = 256 # number of images with rectangle grasps in the scene 59 | test_num = int(grasp_num / 5) # number of images used for testing in the scene 60 | train_num = grasp_num - test_num # number of images used for training in the scene 61 | test_count = 0 62 | train_count = 0 63 | 64 | if os.path.exists(os.path.join(graspnet_config.GRASPNET_ROOT, 'scenes', scene_name, graspnet_config.CAMERA_NAME, 'rect', scene_index)): 65 | # if os.path.exists('/DATA2/Benchmark/graspnet/scenes/' + scene_name + '/kinect/rect/' + scene_index): 66 | grasp_base_path = os.path.join(graspnet_config.GRASPNET_ROOT, 'scenes', scene_name, graspnet_config.CAMERA_NAME, 'rect', scene_index) 67 | # grasp_base_path = '/DATA2/Benchmark/graspnet/scenes/' + scene_name + '/kinect/rect/' + scene_index + '/' 68 | else: 69 | grasp_base_path = os.path.join(graspnet_config.GRASPNET_ROOT, 'scenes', scene_name, graspnet_config.CAMERA_NAME, 'rect') 70 | # grasp_base_path = '/DATA2/Benchmark/graspnet/scenes/' + scene_name + '/kinect/rect/' 71 | 72 | for rgb_name in rgb_name_list: 73 | img_index = rgb_name[:4] # 0000 / 0001 / 0002 ... 74 | rgb_path = os.path.join(graspnet_config.GRASPNET_ROOT, 'scenes', scene_name, graspnet_config.CAMERA_NAME, 'rgb', rgb_name) # '../scenes/scene_0021/kinect/rgb/0000.png' 75 | # rgb_path = '/DATA2/Benchmark/graspnet/scenes/' + scene_name + '/kinect/rgb/' + rgb_name 76 | depth_path = os.path.join(graspnet_config.GRASPNET_ROOT, 'scenes', scene_name, graspnet_config.CAMERA_NAME, 'depth', rgb_name) # '../scenes/scene_0021/kinect/depth/0000.png' 77 | # depth_path = '/DATA2/Benchmark/graspnet/scenes/' + scene_name + '/kinect/depth/' + rgb_name 78 | grasp_path = os.path.join(grasp_base_path, img_index+'.npy') # '../scenes/scene_0021/kinect/rect/(0021/)0000.npy' 79 | # grasp_path = grasp_base_path + img_index + '.npy' 80 | img_name = scene_name + '+' + img_index # 'scene_0021+0000' 81 | img_path = os.path.join('..', 'grasp_data', 'Images', img_name+'.png') 82 | anno_path = os.path.join('..', 'grasp_data', 'Annotations', img_name+'.txt') 83 | 84 | try: 85 | grasp = np.load(grasp_path) # load the grasp annotations, shape: (*, 6) 86 | rgb_img = cv2.imread(rgb_path, cv2.IMREAD_UNCHANGED) # load the RGB information 87 | b_img, g_img, r_img = cv2.split(rgb_img) 88 | depth_img = cv2.imread(depth_path, cv2.IMREAD_UNCHANGED) # load the depth information 89 | except Exception: 90 | print('{} skipped'.format(img_name)) 91 | f_image_skip.write('{}\n'.format(img_name)) 92 | continue 93 | 94 | reshaped_r_img = r_img.reshape((r_img.shape[0], r_img.shape[1], 1)) 95 | reshaped_g_img = g_img.reshape((g_img.shape[0], g_img.shape[1], 1)) 96 | reshaped_depth_img = depth_img.reshape((depth_img.shape[0], depth_img.shape[1], 1)) 97 | # img = np.concatenate((rgb_img, reshaped_depth_img), axis=-1) # RGB-D 98 | img = np.concatenate((reshaped_depth_img, reshaped_g_img, reshaped_r_img), axis=-1) # RGD 99 | 100 | # Processing grasp 101 | mask = grasp[:, 5] > 0.8 102 | grasp = grasp[mask] 103 | center_x = grasp[:, 0] # shape: (*, ) 104 | center_y = grasp[:, 1] # shape: (*, ) 105 | open_point_x = grasp[:, 2] # shape: (*, ) 106 | open_point_y = grasp[:, 3] # shape: (*, ) 107 | height = grasp[:, 4] # height of the rectangle, shape: (*, ) 108 | score = grasp[:, 5] # shape: (*, ) 109 | 110 | 111 | width = 2
* np.sqrt(np.square(open_point_x - center_x) + np.square(open_point_y - center_y)) # width of the rectangle, shape: (*, ) 112 | theta = np.zeros(width.shape) # rotation angle of the rectangle 113 | 114 | rotation_class = np.zeros(theta.shape, dtype='int32') # rotation class of the rectangle 115 | x_min = center_x - width / 2 116 | y_min = center_y - height / 2 117 | x_max = center_x + width / 2 118 | y_max = center_y + height / 2 119 | 120 | f_anno = open(anno_path, 'w') 121 | 122 | for i in range(theta.shape[0]): 123 | if center_x[i] > open_point_x[i]: 124 | theta[i] = np.arctan((open_point_y[i] - center_y[i]) / (center_x[i] - open_point_x[i])) * 180 / np.pi 125 | elif center_x[i] < open_point_x[i]: 126 | theta[i] = np.arctan((center_y[i] - open_point_y[i]) / (open_point_x[i] - center_x[i])) * 180 / np.pi 127 | else: 128 | theta[i] = -90.0 129 | rotation_class[i] = int(round((theta[i] + 90) / 10) + 1) 130 | if x_min[i] < 0 or y_min[i] < 0 or x_max[i] > 1280 or y_max[i] > 720: 131 | continue 132 | f_anno.write('{} {} {} {} {}\n'.format(rotation_class[i], x_min[i], y_min[i], x_max[i], y_max[i])) 133 | 134 | f_anno.close() 135 | 136 | cv2.imwrite(img_path, img) # write the RGD image 137 | tmp_num = random.randint(1, 5) 138 | if (test_count >= test_num) or ((train_count < train_num) and (not tmp_num == 1)): 139 | is_training = True 140 | else: 141 | is_training = False 142 | if is_training: 143 | log_train_list.append(img_name) 144 | log_train_list.append('\n') 145 | train_total_number += 1 146 | train_count += 1 147 | else: 148 | log_test_list.append(img_name) 149 | log_test_list.append('\n') 150 | test_total_number += 1 151 | test_count += 1 152 | 153 | # record the list 154 | f_train = open(os.path.join('..', 'grasp_data', 'ImageSets', 'train.txt'), 'a') 155 | # f_train = open('../grasp_data/ImageSets/train.txt', 'a') 156 | f_train.writelines(log_train_list) 157 | f_train.close() 158 | f_test = open(os.path.join('..', 'grasp_data', 'ImageSets', 'test.txt'), 'a') 159 | # f_test = open('../grasp_data/ImageSets/test.txt', 'a') 160 | f_test.writelines(log_test_list) 161 | f_test.close() 162 | print('scene {} done'.format(scene_index)) 163 | print('{} images for training in scene {}'.format(train_count, scene_index)) 164 | print('{} images for testing in scene {}'.format(test_count, scene_index)) 165 | 166 | f_image_skip.close() 167 | f_scene_skip.close() 168 | 169 | print('The number of images for training: {}'.format(train_total_number)) 170 | print('The number of images for testing: {}'.format(test_total_number)) 171 | print('------------------------------------------') 172 | -------------------------------------------------------------------------------- /grasp_env.yaml: -------------------------------------------------------------------------------- 1 | name: grasp 2 | channels: 3 | - defaults 4 | dependencies: 5 | - _libgcc_mutex=0.1=main 6 | - _tflow_select=2.1.0=gpu 7 | - absl-py=0.9.0=py36_0 8 | - astor=0.8.1=py36_0 9 | - blas=1.0=mkl 10 | - c-ares=1.15.0=h7b6447c_1001 11 | - ca-certificates=2020.7.22=0 12 | - certifi=2020.6.20=py36_0 13 | - cudatoolkit=10.1.243=h6bb024c_0 14 | - cudnn=7.6.5=cuda10.1_0 15 | - cupti=10.1.168=0 16 | - cycler=0.10.0=py36_0 17 | - cython=0.29.21=py36he6710b0_0 18 | - dbus=1.13.16=hb2f20db_0 19 | - expat=2.2.9=he6710b0_2 20 | - fontconfig=2.13.0=h9420a91_0 21 | - freetype=2.10.2=h5ab3b9f_0 22 | - gast=0.4.0=py_0 23 | - geos=3.8.0=he6710b0_0 24 | - glib=2.65.0=h3eb4bd4_0 25 | - google-pasta=0.2.0=py_0 26 | - grpcio=1.31.0=py36hf8bcb03_0 27 | - 
gst-plugins-base=1.14.0=hbbd80ab_1 28 | - gstreamer=1.14.0=hb31296c_0 29 | - h5py=2.10.0=py36hd6299e0_1 30 | - hdf5=1.10.6=hb1b8bf9_0 31 | - icu=58.2=he6710b0_3 32 | - importlib-metadata=1.7.0=py36_0 33 | - intel-openmp=2020.2=254 34 | - jpeg=9b=h024ee3a_2 35 | - keras-applications=1.0.8=py_1 36 | - keras-preprocessing=1.1.0=py_1 37 | - kiwisolver=1.2.0=py36hfd86e86_0 38 | - lcms2=2.11=h396b838_0 39 | - ld_impl_linux-64=2.33.1=h53a641e_7 40 | - libedit=3.1.20191231=h14c3975_1 41 | - libffi=3.3=he6710b0_2 42 | - libgcc-ng=9.1.0=hdf63c60_0 43 | - libgfortran-ng=7.3.0=hdf63c60_0 44 | - libpng=1.6.37=hbc83047_0 45 | - libprotobuf=3.12.4=hd408876_0 46 | - libstdcxx-ng=9.1.0=hdf63c60_0 47 | - libtiff=4.1.0=h2733197_1 48 | - libuuid=1.0.3=h1bed415_2 49 | - libxcb=1.14=h7b6447c_0 50 | - libxml2=2.9.10=he19cac6_1 51 | - lz4-c=1.9.2=he6710b0_1 52 | - markdown=3.2.2=py36_0 53 | - matplotlib=3.2.2=0 54 | - matplotlib-base=3.2.2=py36hef1b27d_0 55 | - mkl=2020.2=256 56 | - mkl-service=2.3.0=py36he904b0f_0 57 | - mkl_fft=1.1.0=py36h23d657b_0 58 | - mkl_random=1.1.1=py36h0573a6f_0 59 | - ncurses=6.2=he6710b0_1 60 | - numpy=1.16.0=py36h7e9f1db_1 61 | - numpy-base=1.16.0=py36hde5b4d6_1 62 | - olefile=0.46=py36_0 63 | - openssl=1.1.1g=h7b6447c_0 64 | - pcre=8.44=he6710b0_0 65 | - pillow=7.2.0=py36hb39fc2d_0 66 | - pip=20.2.2=py36_0 67 | - protobuf=3.12.4=py36he6710b0_0 68 | - pyparsing=2.4.7=py_0 69 | - pyqt=5.9.2=py36h05f1152_2 70 | - python=3.6.10=h7579374_2 71 | - python-dateutil=2.8.1=py_0 72 | - pyyaml=5.3.1=py36h7b6447c_1 73 | - qt=5.9.7=h5867ecd_1 74 | - readline=8.0=h7b6447c_0 75 | - scipy=1.5.2=py36h0b6359f_0 76 | - setuptools=49.6.0=py36_0 77 | - shapely=1.7.0=py36h98ec03d_0 78 | - sip=4.19.8=py36hf484d3e_0 79 | - six=1.15.0=py_0 80 | - sqlite=3.33.0=h62c20be_0 81 | - tensorboard=1.14.0=py36hf484d3e_0 82 | - tensorflow=1.14.0=gpu_py36h3fb9ad6_0 83 | - tensorflow-base=1.14.0=gpu_py36he45bfe2_0 84 | - tensorflow-estimator=1.14.0=py_0 85 | - tensorflow-gpu=1.14.0=h0d30ee6_0 86 | - termcolor=1.1.0=py36_1 87 | - tk=8.6.10=hbc83047_0 88 | - tornado=6.0.4=py36h7b6447c_1 89 | - werkzeug=1.0.1=py_0 90 | - wheel=0.35.1=py_0 91 | - wrapt=1.12.1=py36h7b6447c_1 92 | - xz=5.2.5=h7b6447c_0 93 | - yaml=0.2.5=h7b6447c_0 94 | - zipp=3.1.0=py_0 95 | - zlib=1.2.11=h7b6447c_3 96 | - zstd=1.4.5=h9ceee32_0 97 | - pip: 98 | - easydict==1.9 99 | - opencv-python==4.3.0.36 100 | prefix: /home/xusheng/miniconda3/envs/grasp 101 | 102 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/mask.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/mask.jpg -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/pcd0100r_rgd_preprocessed_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/pcd0100r_rgd_preprocessed_1.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/pcd0266r_rgd_preprocessed_1.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/pcd0266r_rgd_preprocessed_1.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/pcd0882r_rgd_preprocessed_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/pcd0882r_rgd_preprocessed_1.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/results_all_cls/pcd0100r_rgd_preprocessed_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/results_all_cls/pcd0100r_rgd_preprocessed_1.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/results_all_cls/pcd0266r_rgd_preprocessed_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/results_all_cls/pcd0266r_rgd_preprocessed_1.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/results_all_cls/pcd0882r_rgd_preprocessed_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/results_all_cls/pcd0882r_rgd_preprocessed_1.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/results_all_cls/rgd_0000Cropped320.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/results_all_cls/rgd_0000Cropped320.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0022+0028.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0022+0028.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0036+0061.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0036+0061.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0065+0032.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0065+0032.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0087+0049.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0087+0049.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0108+0036.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0108+0036.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0129+0058.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0129+0058.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0156+0010.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0156+0010.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0174+0092.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/results_all_cls/scene_0174+0092.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/rgd_0000Cropped320.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/rgd_0000Cropped320.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/scene_0022+0011.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/scene_0022+0011.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/scene_0022+0028.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/scene_0022+0028.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/scene_0036+0061.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/scene_0036+0061.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/scene_0065+0032.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/scene_0065+0032.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/scene_0087+0049.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/scene_0087+0049.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/scene_0108+0036.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/scene_0108+0036.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/scene_0129+0058.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/scene_0129+0058.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/scene_0156+0010.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/scene_0156+0010.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/demo/scene_0174+0092.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/data/demo/scene_0174+0092.png -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/scripts/dataPreprocessingTest_fasterrcnn_split.m: -------------------------------------------------------------------------------- 1 | %% script to test dataPreprocessing 2 | %% created by Fu-Jen Chu on 09/15/2016 3 | 4 | close all 5 | clear 6 | 7 | %parpool(4) 8 | %addpath('/media/fujenchu/home3/data/grasps/') 9 | 10 | 11 | % generate list for splits 12 | list = [100:949 1000:1034]; 13 | 
list_idx = randperm(length(list)); 14 | train_list_idx = list_idx(length(list)/5+1:end); 15 | test_list_idx = list_idx(1:length(list)/5); 16 | train_list = list(train_list_idx); 17 | test_list = list(test_list_idx); 18 | 19 | 20 | for folder = 1:1 21 | display(['processing folder ' int2str(folder)]) 22 | 23 | imgDataDir = ['/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/grasps/' sprintf('%02d',folder)]; 24 | txtDataDir = ['/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/grasps/' sprintf('%02d',folder)]; 25 | 26 | %imgDataOutDir = ['/home/fujenchu/projects/deepLearning/tensorflow-finetune-flickr-style-master/data/grasps/' sprintf('%02d',folder) '_Cropped320_rgd']; 27 | imgDataOutDir = '/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/Images'; 28 | annotationDataOutDir = '/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/Annotations'; 29 | imgSetTrain = '/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/ImageSets/train.txt'; 30 | imgSetTest = '/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/ImageSets/test.txt'; 31 | 32 | imgFiles = dir([imgDataDir '/*.png']); 33 | txtFiles = dir([txtDataDir '/*pos.txt']); 34 | 35 | logfileID = fopen('log.txt','a'); 36 | mainfileID = fopen(['/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/grasps/scripts/trainttt' sprintf('%02d',folder) '.txt'],'a'); 37 | for idx = 1:length(imgFiles) 38 | %% display progress 39 | tic 40 | display(['processing folder: ' sprintf('%02d',folder) ', imgFiles: ' int2str(idx)]) 41 | 42 | %% reading data 43 | imgName = imgFiles(idx).name; 44 | [pathstr,imgname] = fileparts(imgName); 45 | 46 | filenum = str2num(imgname(4:7)); 47 | if(any(test_list == filenum)) 48 | file_writeID = fopen(imgSetTest,'a'); 49 | fprintf(file_writeID, '%s\n', [imgname '_preprocessed_1' ] ); 50 | fclose(file_writeID); 51 | is_training = 0; 52 | else 53 | is_training = 1; 54 | end 55 | 56 | txtName = txtFiles(idx).name; 57 | [pathstr,txtname] = fileparts(txtName); 58 | 59 | img = imread([imgDataDir '/' imgname '.png']); 60 | fileID = fopen([txtDataDir '/' txtname '.txt'],'r'); 61 | sizeA = [2 100]; 62 | bbsIn_all = fscanf(fileID, '%f %f', sizeA); 63 | fclose(fileID); 64 | 65 | %% data pre-processing 66 | [imagesOut bbsOut] = dataPreprocessing_fasterrcnn(img, bbsIn_all, 227, 5, 5); 67 | 68 | % for each augmented image 69 | for i = 1:1:size(imagesOut,2) 70 | 71 | % for each bbs 72 | file_writeID = fopen([annotationDataOutDir '/' imgname '_preprocessed_' int2str(i) '.txt'],'w'); 73 | printCount = 0; 74 | for ibbs = 1:1:size(bbsOut{i},2) 75 | A = bbsOut{i}{ibbs}; 76 | xy_ctr = sum(A,2)/4; x_ctr = xy_ctr(1); y_ctr = xy_ctr(2); 77 | width = sqrt(sum((A(:,1) - A(:,2)).^2)); height = sqrt(sum((A(:,2) - A(:,3)).^2)); 78 | if(A(1,1) > A(1,2)) 79 | theta = atan((A(2,2)-A(2,1))/(A(1,1)-A(1,2))); 80 | else 81 | theta = atan((A(2,1)-A(2,2))/(A(1,2)-A(1,1))); % note y is facing down 82 | end 83 | 84 | % process to fasterrcnn 85 | x_min = x_ctr - width/2; x_max = x_ctr + width/2; 86 | y_min = y_ctr - height/2; y_max = y_ctr + height/2; 87 | %if(x_min < 0 || y_min < 0 || x_max > 227 || y_max > 227) display('yoooooooo'); end 88 | if((x_min < 0 && x_max < 0) || (y_min > 227 && y_max > 227) || (x_min > 227 && x_max > 227) || (y_min < 0 && y_max < 0)) display('xxxxxxxxx'); break; end 89 | cls = round((theta/pi*180+90)/10) + 1; 90 | 91 | % write as lefttop rightdown, Xmin Ymin Xmax Ymax, ex: 261 109 511 705 (x horizontal, y vertical) 92 | fprintf(file_writeID, '%d %f %f %f %f\n', cls, x_min, y_min, x_max, y_max ); 93 |
printCount = printCount+1; 94 | end 95 | if(printCount == 0) fprintf(logfileID, '%s\n', [imgname '_preprocessed_' int2str(i) ]);end 96 | 97 | fclose(file_writeID); 98 | imwrite(imagesOut{i}, [imgDataOutDir '/' imgname '_preprocessed_' int2str(i) '.png']); 99 | 100 | % write filename to imageSet 101 | if(is_training) 102 | file_writeID = fopen(imgSetTrain,'a'); 103 | fprintf(file_writeID, '%s\n', [imgname '_preprocessed_' int2str(i) ] ); 104 | fclose(file_writeID); 105 | end 106 | 107 | end 108 | 109 | 110 | toc 111 | end 112 | fclose(mainfileID); 113 | 114 | end 115 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/scripts/dataPreprocessingTest_fasterrcnn_split.m.backup: -------------------------------------------------------------------------------- 1 | %% script to test dataPreprocessing 2 | %% created by Fu-Jen Chu on 09/15/2016 3 | 4 | close all 5 | clear 6 | 7 | %parpool(4) 8 | %addpath('/media/fujenchu/home3/data/grasps/') 9 | 10 | 11 | % generate list for splits 12 | list = [100:949 1000:1034]; 13 | list_idx = randperm(length(list)); 14 | train_list_idx = list_idx(length(list)/5+1:end); 15 | test_list_idx = list_idx(1:length(list)/5); 16 | train_list = list(train_list_idx); 17 | test_list = list(test_list_idx); 18 | 19 | 20 | for folder = 1:1 21 | display(['processing folder ' int2str(folder)]) 22 | 23 | imgDataDir = ['/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/grasps/' sprintf('%02d',folder)]; 24 | txtDataDir = ['/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/grasps/' sprintf('%02d',folder)]; 25 | 26 | %imgDataOutDir = ['/home/fujenchu/projects/deepLearning/tensorflow-finetune-flickr-style-master/data/grasps/' sprintf('%02d',folder) '_Cropped320_rgd']; 27 | imgDataOutDir = '/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/Images'; 28 | annotationDataOutDir = '/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/Annotations'; 29 | imgSetTrain = '/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/ImageSets/train.txt'; 30 | imgSetTest = '/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/ImageSets/test.txt'; 31 | 32 | imgFiles = dir([imgDataDir '/*.png']); 33 | txtFiles = dir([txtDataDir '/*pos.txt']); 34 | 35 | logfileID = fopen('log.txt','a'); 36 | mainfileID = fopen(['/SSD2/xusheng/Grasp/grasp_multiObject_multiGrasp/grasp_data/grasps/scripts/trainttt' sprintf('%02d',folder) '.txt'],'a'); 37 | for idx = 1:length(imgFiles) 38 | %% display progress 39 | tic 40 | display(['processing folder: ' sprintf('%02d',folder) ', imgFiles: ' int2str(idx)]) 41 | 42 | %% reading data 43 | imgName = imgFiles(idx).name; 44 | [pathstr,imgname] = fileparts(imgName); 45 | 46 | filenum = str2num(imgname(4:7)); 47 | if(any(test_list == filenum)) 48 | file_writeID = fopen(imgSetTest,'a'); 49 | fprintf(file_writeID, '%s\n', [imgDataDir(1:end-3) 'Cropped320_rgd/' imgname '_preprocessed_1.png' ] ); 50 | fclose(file_writeID); 51 | continue; 52 | end 53 | 54 | txtName = txtFiles(idx).name; 55 | [pathstr,txtname] = fileparts(txtName); 56 | 57 | img = imread([imgDataDir '/' imgname '.png']); 58 | fileID = fopen([txtDataDir '/' txtname '.txt'],'r'); 59 | sizeA = [2 100]; 60 | bbsIn_all = fscanf(fileID, '%f %f', sizeA); 61 | fclose(fileID); 62 | 63 | %% data pre-processing 64 | [imagesOut bbsOut] = dataPreprocessing_fasterrcnn(img, bbsIn_all, 227, 5, 5); 65 | 66 | % for each augmented image 67 | for i = 1:1:size(imagesOut,2) 68 | 69 | % for each bbs 70 | file_writeID = 
fopen([annotationDataOutDir '/' imgname '_preprocessed_' int2str(i) '.txt'],'w'); 71 | printCount = 0; 72 | for ibbs = 1:1:size(bbsOut{i},2) 73 | A = bbsOut{i}{ibbs}; 74 | xy_ctr = sum(A,2)/4; x_ctr = xy_ctr(1); y_ctr = xy_ctr(2); 75 | width = sqrt(sum((A(:,1) - A(:,2)).^2)); height = sqrt(sum((A(:,2) - A(:,3)).^2)); 76 | if(A(1,1) > A(1,2)) 77 | theta = atan((A(2,2)-A(2,1))/(A(1,1)-A(1,2))); 78 | else 79 | theta = atan((A(2,1)-A(2,2))/(A(1,2)-A(1,1))); % note y is facing down 80 | end 81 | 82 | % process to fasterrcnn 83 | x_min = x_ctr - width/2; x_max = x_ctr + width/2; 84 | y_min = y_ctr - height/2; y_max = y_ctr + height/2; 85 | %if(x_min < 0 || y_min < 0 || x_max > 227 || y_max > 227) display('yoooooooo'); end 86 | if((x_min < 0 && x_max < 0) || (y_min > 227 && y_max > 227) || (x_min > 227 && x_max > 227) || (y_min < 0 && y_max < 0)) display('xxxxxxxxx'); break; end 87 | cls = round((theta/pi*180+90)/10) + 1; 88 | 89 | % write as lefttop rightdown, Xmin Ymin Xmax Ymax, ex: 261 109 511 705 (x horizontal, y vertical) 90 | fprintf(file_writeID, '%d %f %f %f %f\n', cls, x_min, y_min, x_max, y_max ); 91 | printCount = printCount+1; 92 | end 93 | if(printCount == 0) fprintf(logfileID, '%s\n', [imgname '_preprocessed_' int2str(i) ]);end 94 | 95 | fclose(file_writeID); 96 | imwrite(imagesOut{i}, [imgDataOutDir '/' imgname '_preprocessed_' int2str(i) '.png']); 97 | 98 | % write filename to imageSet 99 | file_writeID = fopen(imgSetTrain,'a'); 100 | fprintf(file_writeID, '%s\n', [imgname '_preprocessed_' int2str(i) ] ); 101 | fclose(file_writeID); 102 | 103 | end 104 | 105 | 106 | toc 107 | end 108 | fclose(mainfileID); 109 | 110 | end 111 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/scripts/dataPreprocessing_fasterrcnn.m: -------------------------------------------------------------------------------- 1 | function [imagesOut bbsOut] = dataPreprocessing( imageIn, bbsIn_all, cropSize, translationShiftNumber, roatateAngleNumber) 2 | % dataPreprocessing function performs 3 | % 1) cropping 4 | % 2) padding 5 | % 3) rotation 6 | % 4) shifting 7 | % 8 | % for an input image with bbs given as 4 points, 9 | % dataPreprocessing outputs a set of images with corresponding bbs.
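% Example call (illustrative; the file names are placeholders following the
% calling script's Cornell-style conventions, not files shipped with this repo):
%   img = imread('pcd0100r.png');
%   fid = fopen('pcd0100cpos.txt', 'r');
%   bbs = fscanf(fid, '%f %f', [2 100]); fclose(fid);
%   [imgs, bbsOut] = dataPreprocessing_fasterrcnn(img, bbs, 227, 5, 5);
% This yields 5*5*5 = 125 randomly rotated/shifted 227x227 images, each with
% its grasp rectangles transformed by the same rotation and shift.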
10 | % 11 | % 12 | % Inputs: 13 | % imageIn: input image (480 by 640 by 3) 14 | % bbsIn: bounding box (2 by 4) 15 | % cropSize: output image size 16 | % shift: shifting offset 17 | % rotate: rotation angle 18 | % 19 | % Outputs: 20 | % imagesOut: output images (n images) 21 | % bbsOut: output bbs according to shift and rotation 22 | % 23 | %% created by Fu-Jen Chu on 09/15/2016 24 | 25 | debug_dev = 0; 26 | debug = 0; 27 | %% show image and bbs 28 | if(debug_dev) 29 | figure(1); imshow(imageIn); hold on; 30 | x = bbsIn_all(1, [1:3]); 31 | y = bbsIn_all(2, [1:3]); 32 | plot(x,y); hold off; 33 | end 34 | 35 | %% crop image and padding image 36 | % cropping to 321 by 321 from center 37 | imgCrop = imcrop(imageIn, [145 65 351 351]); 38 | 39 | % padding to 501 by 501 40 | imgPadding = padarray(imgCrop, [75 75], 'replicate', 'both'); 41 | 42 | count = 1; 43 | for i_rotate = 1:roatateAngleNumber*translationShiftNumber*translationShiftNumber 44 | % random roatateAngle 45 | theta = randi(360)-1; 46 | %theta = 0; 47 | 48 | % random translationShift 49 | dx = randi(101)-51; 50 | %dx = 0; 51 | 52 | %% rotation and shifting 53 | % random translationShift 54 | dy = randi(101)-51; 55 | %dy = 0; 56 | 57 | imgRotate = imrotate(imgPadding, theta); 58 | if(debug_dev)figure(2); imshow(imgRotate);end 59 | imgCropRotate = imcrop(imgRotate, [size(imgRotate,1)/2-160-dx size(imgRotate,1)/2-160-dy 320 320]); 60 | if(debug_dev)figure(3); imshow(imgCropRotate);end 61 | imgResize = imresize(imgCropRotate, [cropSize cropSize]); 62 | if(debug)figure(4); imshow(imgResize); hold on;end 63 | 64 | %% modify bbs 65 | [m, n] = size(bbsIn_all); 66 | bbsNum = n/4; 67 | 68 | countbbs = 1; 69 | for idx = 1:bbsNum 70 | bbsIn = bbsIn_all(:,idx*4-3:idx*4); 71 | if(sum(sum(isnan(bbsIn)))) continue; end 72 | 73 | bbsInShift = bbsIn - repmat([320; 240], 1, 4); 74 | R = [cos(theta/180*pi) -sin(theta/180*pi); sin(theta/180*pi) cos(theta/180*pi)]; 75 | bbsRotated = (bbsInShift'*R)'; 76 | bbsInShiftBack = (bbsRotated + repmat([160; 160], 1, 4) + repmat([dx; dy], 1, 4))*cropSize/320; 77 | if(debug) 78 | figure(4) 79 | x = bbsInShiftBack(1, [1:4 1]); 80 | y = bbsInShiftBack(2, [1:4 1]); 81 | plot(x,y); hold on; pause(0.01); 82 | end 83 | bbsOut{count}{countbbs} = bbsInShiftBack; 84 | countbbs = countbbs + 1; 85 | end 86 | 87 | imagesOut{count} = imgResize; 88 | count = count +1; 89 | 90 | 91 | end 92 | 93 | 94 | 95 | end 96 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/scripts/fetch_faster_rcnn_models.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )/../" && pwd )" 4 | cd $DIR 5 | 6 | NET=res101 7 | FILE=voc_0712_80k-110k.tgz 8 | # replace it with gs11655.sp.cs.cmu.edu if ladoga.graphics.cs.cmu.edu does not work 9 | URL=http://ladoga.graphics.cs.cmu.edu/xinleic/tf-faster-rcnn/$NET/$FILE 10 | CHECKSUM=cb32e9df553153d311cc5095b2f8c340 11 | 12 | if [ -f $FILE ]; then 13 | echo "File already exists. Checking md5..." 14 | os=`uname -s` 15 | if [ "$os" = "Linux" ]; then 16 | checksum=`md5sum $FILE | awk '{ print $1 }'` 17 | elif [ "$os" = "Darwin" ]; then 18 | checksum=`cat $FILE | md5` 19 | fi 20 | if [ "$checksum" = "$CHECKSUM" ]; then 21 | echo "Checksum is correct. No need to download." 22 | exit 0 23 | else 24 | echo "Checksum is incorrect. Need to download again." 
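# (note) nothing is removed at this point: the script simply falls through
# to the unconditional wget below, whose -O flag overwrites the corrupt file.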
25 | fi 26 | fi 27 | 28 | echo "Downloading ResNet-101 Faster R-CNN models pre-trained on VOC 07+12 (340M)..." 29 | 30 | wget $URL -O $FILE 31 | 32 | echo "Unzipping..." 33 | 34 | tar zxvf $FILE 35 | 36 | echo "Done. Please run this command again to verify that checksum = $CHECKSUM." 37 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/data/scripts/log.txt: -------------------------------------------------------------------------------- 1 | pcd0117r_preprocessed_21 2 | pcd0117r_preprocessed_28 3 | pcd0117r_preprocessed_33 4 | pcd0117r_preprocessed_64 5 | pcd0117r_preprocessed_65 6 | pcd0117r_preprocessed_68 7 | pcd0117r_preprocessed_73 8 | pcd0117r_preprocessed_75 9 | pcd0117r_preprocessed_78 10 | pcd0117r_preprocessed_81 11 | pcd0117r_preprocessed_108 12 | pcd0117r_preprocessed_116 13 | pcd0117r_preprocessed_123 14 | pcd0117r_preprocessed_2 15 | pcd0117r_preprocessed_70 16 | pcd0117r_preprocessed_73 17 | pcd0117r_preprocessed_98 18 | pcd0117r_preprocessed_113 19 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/experiments/cfgs/res101-lg.yml: -------------------------------------------------------------------------------- 1 | EXP_DIR: res101-lg 2 | TRAIN: 3 | HAS_RPN: True 4 | IMS_PER_BATCH: 1 5 | BBOX_NORMALIZE_TARGETS_PRECOMPUTED: True 6 | RPN_POSITIVE_OVERLAP: 0.7 7 | RPN_BATCHSIZE: 256 8 | PROPOSAL_METHOD: gt 9 | BG_THRESH_LO: 0.0 10 | DISPLAY: 20 11 | BATCH_SIZE: 256 12 | WEIGHT_DECAY: 0.0001 13 | DOUBLE_BIAS: False 14 | SNAPSHOT_PREFIX: res101_faster_rcnn 15 | SCALES: [800] 16 | MAX_SIZE: 1333 17 | TEST: 18 | HAS_RPN: True 19 | SCALES: [800] 20 | MAX_SIZE: 1333 21 | RPN_POST_NMS_TOP_N: 1000 22 | POOLING_MODE: crop 23 | ANCHOR_SCALES: [2,4,8,16,32] 24 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/experiments/cfgs/res101.yml: -------------------------------------------------------------------------------- 1 | EXP_DIR: res101 2 | TRAIN: 3 | HAS_RPN: True 4 | IMS_PER_BATCH: 1 5 | BBOX_NORMALIZE_TARGETS_PRECOMPUTED: True 6 | RPN_POSITIVE_OVERLAP: 0.7 7 | RPN_BATCHSIZE: 256 8 | PROPOSAL_METHOD: gt 9 | BG_THRESH_LO: 0.0 10 | DISPLAY: 20 11 | BATCH_SIZE: 256 12 | WEIGHT_DECAY: 0.0001 13 | DOUBLE_BIAS: False 14 | SNAPSHOT_PREFIX: res101_faster_rcnn 15 | TEST: 16 | HAS_RPN: True 17 | POOLING_MODE: crop 18 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/experiments/cfgs/res50.yml: -------------------------------------------------------------------------------- 1 | EXP_DIR: res50 2 | TRAIN: 3 | HAS_RPN: True 4 | IMS_PER_BATCH: 1 5 | BBOX_NORMALIZE_TARGETS_PRECOMPUTED: True 6 | RPN_POSITIVE_OVERLAP: 0.7 7 | RPN_BATCHSIZE: 256 8 | PROPOSAL_METHOD: gt 9 | BG_THRESH_LO: 0.0 10 | DISPLAY: 20 11 | BATCH_SIZE: 256 12 | WEIGHT_DECAY: 0.0001 13 | DOUBLE_BIAS: False 14 | SNAPSHOT_PREFIX: res50_faster_rcnn 15 | TEST: 16 | HAS_RPN: True 17 | POOLING_MODE: crop 18 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/experiments/cfgs/vgg16.yml: -------------------------------------------------------------------------------- 1 | EXP_DIR: vgg16 2 | TRAIN: 3 | HAS_RPN: True 4 | IMS_PER_BATCH: 1 5 | BBOX_NORMALIZE_TARGETS_PRECOMPUTED: True 6 | RPN_POSITIVE_OVERLAP: 0.7 7 | RPN_BATCHSIZE: 256 8 | PROPOSAL_METHOD: gt 9 | BG_THRESH_LO: 0.0 10 | DISPLAY: 20 11 | BATCH_SIZE: 256 12 | SNAPSHOT_PREFIX:
vgg16_faster_rcnn 13 | TEST: 14 | HAS_RPN: True 15 | POOLING_MODE: crop 16 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/experiments/logs/.gitignore: -------------------------------------------------------------------------------- 1 | *.txt.* 2 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/experiments/scripts/convert_vgg16.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | set -x 4 | set -e 5 | 6 | export PYTHONUNBUFFERED="True" 7 | 8 | GPU_ID=$1 9 | DATASET=$2 10 | NET=vgg16 11 | 12 | array=( $@ ) 13 | len=${#array[@]} 14 | EXTRA_ARGS=${array[@]:2:$len} 15 | EXTRA_ARGS_SLUG=${EXTRA_ARGS// /_} 16 | 17 | case ${DATASET} in 18 | pascal_voc) 19 | TRAIN_IMDB="voc_2007_trainval" 20 | TEST_IMDB="voc_2007_test" 21 | STEPSIZE=50000 22 | ITERS=70000 23 | ANCHORS="[8,16,32]" 24 | RATIOS="[0.5,1,2]" 25 | ;; 26 | pascal_voc_0712) 27 | TRAIN_IMDB="voc_2007_trainval+voc_2012_trainval" 28 | TEST_IMDB="voc_2007_test" 29 | STEPSIZE=80000 30 | ITERS=110000 31 | ANCHORS="[8,16,32]" 32 | RATIOS="[0.5,1,2]" 33 | ;; 34 | coco) 35 | TRAIN_IMDB="coco_2014_train+coco_2014_valminusminival" 36 | TEST_IMDB="coco_2014_minival" 37 | STEPSIZE=350000 38 | ITERS=490000 39 | ANCHORS="[4,8,16,32]" 40 | RATIOS="[0.5,1,2]" 41 | ;; 42 | *) 43 | echo "No dataset given" 44 | exit 45 | ;; 46 | esac 47 | 48 | set +x 49 | NET_FINAL=${NET}_faster_rcnn_iter_${ITERS} 50 | set -x 51 | 52 | if [ ! -f ${NET_FINAL}.index ]; then 53 | if [[ ! -z ${EXTRA_ARGS_SLUG} ]]; then 54 | CUDA_VISIBLE_DEVICES=${GPU_ID} time python ./tools/convert_from_depre.py \ 55 | --snapshot ${NET_FINAL} \ 56 | --imdb ${TRAIN_IMDB} \ 57 | --iters ${ITERS} \ 58 | --cfg experiments/cfgs/${NET}.yml \ 59 | --tag ${EXTRA_ARGS_SLUG} \ 60 | --set ANCHOR_SCALES ${ANCHORS} ANCHOR_RATIOS ${RATIOS} TRAIN.STEPSIZE ${STEPSIZE} ${EXTRA_ARGS} 61 | else 62 | CUDA_VISIBLE_DEVICES=${GPU_ID} time python ./tools/convert_from_depre.py \ 63 | --snapshot ${NET_FINAL} \ 64 | --imdb ${TRAIN_IMDB} \ 65 | --iters ${ITERS} \ 66 | --cfg experiments/cfgs/${NET}.yml \ 67 | --set ANCHOR_SCALES ${ANCHORS} ANCHOR_RATIOS ${RATIOS} TRAIN.STEPSIZE ${STEPSIZE} ${EXTRA_ARGS} 68 | fi 69 | fi 70 | 71 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/experiments/scripts/test_faster_rcnn.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | set -x 4 | set -e 5 | 6 | export PYTHONUNBUFFERED="True" 7 | 8 | GPU_ID=$1 9 | DATASET=$2 10 | NET=$3 11 | 12 | array=( $@ ) 13 | len=${#array[@]} 14 | EXTRA_ARGS=${array[@]:3:$len} 15 | EXTRA_ARGS_SLUG=${EXTRA_ARGS// /_} 16 | 17 | case ${DATASET} in 18 | pascal_voc) 19 | TRAIN_IMDB="voc_2007_trainval" 20 | TEST_IMDB="voc_2007_test" 21 | ITERS=70000 22 | ANCHORS="[8,16,32]" 23 | RATIOS="[0.5,1,2]" 24 | ;; 25 | pascal_voc_0712) 26 | TRAIN_IMDB="voc_2007_trainval+voc_2012_trainval" 27 | TEST_IMDB="voc_2007_test" 28 | ITERS=110000 29 | ANCHORS="[8,16,32]" 30 | RATIOS="[0.5,1,2]" 31 | ;; 32 | coco) 33 | TRAIN_IMDB="coco_2014_train+coco_2014_valminusminival" 34 | TEST_IMDB="coco_2014_minival" 35 | ITERS=490000 36 | ANCHORS="[4,8,16,32]" 37 | RATIOS="[0.5,1,2]" 38 | ;; 39 | *) 40 | echo "No dataset given" 41 | exit 42 | ;; 43 | esac 44 | 45 | LOG="experiments/logs/test_${NET}_${TRAIN_IMDB}_${EXTRA_ARGS_SLUG}.txt.`date +'%Y-%m-%d_%H-%M-%S'`" 46 | exec &> >(tee -a "$LOG") 
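# usage (illustrative): ./experiments/scripts/test_faster_rcnn.sh <GPU_ID> <DATASET> <NET>
# e.g.: ./experiments/scripts/test_faster_rcnn.sh 0 pascal_voc res101
# Note that the case statement above only covers pascal_voc, pascal_voc_0712
# and coco; unlike train_faster_rcnn.sh it has no graspRGB entry, so a
# graspRGB case would have to be added before evaluating the grasp models.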
47 | echo Logging output to "$LOG" 48 | 49 | set +x 50 | if [[ ! -z ${EXTRA_ARGS_SLUG} ]]; then 51 | NET_FINAL=output/${NET}/${TRAIN_IMDB}/${EXTRA_ARGS_SLUG}/${NET}_faster_rcnn_iter_${ITERS}.ckpt 52 | else 53 | NET_FINAL=output/${NET}/${TRAIN_IMDB}/default/${NET}_faster_rcnn_iter_${ITERS}.ckpt 54 | fi 55 | set -x 56 | 57 | if [[ ! -z ${EXTRA_ARGS_SLUG} ]]; then 58 | CUDA_VISIBLE_DEVICES=${GPU_ID} time python ./tools/test_net.py \ 59 | --imdb ${TEST_IMDB} \ 60 | --model ${NET_FINAL} \ 61 | --cfg experiments/cfgs/${NET}.yml \ 62 | --tag ${EXTRA_ARGS_SLUG} \ 63 | --net ${NET} \ 64 | --set ANCHOR_SCALES ${ANCHORS} ANCHOR_RATIOS ${RATIOS} ${EXTRA_ARGS} 65 | else 66 | CUDA_VISIBLE_DEVICES=${GPU_ID} time python ./tools/test_net.py \ 67 | --imdb ${TEST_IMDB} \ 68 | --model ${NET_FINAL} \ 69 | --cfg experiments/cfgs/${NET}.yml \ 70 | --net ${NET} \ 71 | --set ANCHOR_SCALES ${ANCHORS} ANCHOR_RATIOS ${RATIOS} ${EXTRA_ARGS} 72 | fi 73 | 74 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/experiments/scripts/train_faster_rcnn.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | set -x 4 | set -e 5 | 6 | export PYTHONUNBUFFERED="True" 7 | 8 | GPU_ID=$1 9 | DATASET=$2 10 | NET=$3 11 | 12 | array=( $@ ) 13 | len=${#array[@]} 14 | EXTRA_ARGS=${array[@]:3:$len} 15 | EXTRA_ARGS_SLUG=${EXTRA_ARGS// /_} 16 | 17 | echo ${DATASET} 18 | case ${DATASET} in 19 | graspRGB) 20 | TRAIN_IMDB="graspRGB_train" 21 | TEST_IMDB="graspRGB_test" 22 | STEPSIZE=50000 23 | ITERS=240000 24 | #ANCHORS="[2,4,8,16,32]" 25 | ANCHORS="[8,16,32]" 26 | RATIOS="[0.5,1,2]" 27 | ;; 28 | pascal_voc) 29 | TRAIN_IMDB="voc_2007_trainval" 30 | TEST_IMDB="voc_2007_test" 31 | STEPSIZE=50000 32 | ITERS=70000 33 | ANCHORS="[8,16,32]" 34 | RATIOS="[0.5,1,2]" 35 | ;; 36 | pascal_voc_0712) 37 | TRAIN_IMDB="voc_2007_trainval+voc_2012_trainval" 38 | TEST_IMDB="voc_2007_test" 39 | STEPSIZE=80000 40 | ITERS=110000 41 | ANCHORS="[8,16,32]" 42 | RATIOS="[0.5,1,2]" 43 | ;; 44 | coco) 45 | TRAIN_IMDB="coco_2014_train+coco_2014_valminusminival" 46 | TEST_IMDB="coco_2014_minival" 47 | STEPSIZE=350000 48 | ITERS=490000 49 | ANCHORS="[4,8,16,32]" 50 | RATIOS="[0.5,1,2]" 51 | ;; 52 | *) 53 | echo "No dataset given" 54 | exit 55 | ;; 56 | esac 57 | 58 | LOG="experiments/logs/${NET}_${TRAIN_IMDB}_${EXTRA_ARGS_SLUG}_${NET}.txt.`date +'%Y-%m-%d_%H-%M-%S'`" 59 | exec &> >(tee -a "$LOG") 60 | echo Logging output to "$LOG" 61 | 62 | set +x 63 | if [[ ! -z ${EXTRA_ARGS_SLUG} ]]; then 64 | NET_FINAL=output/${NET}/${TRAIN_IMDB}/${EXTRA_ARGS_SLUG}/${NET}_faster_rcnn_iter_${ITERS}.ckpt 65 | else 66 | NET_FINAL=output/${NET}/${TRAIN_IMDB}/default/${NET}_faster_rcnn_iter_${ITERS}.ckpt 67 | fi 68 | set -x 69 | 70 | if [ ! -f ${NET_FINAL}.index ]; then 71 | if [[ ! 
-z ${EXTRA_ARGS_SLUG} ]]; then 72 | CUDA_VISIBLE_DEVICES=${GPU_ID} time python ./tools/trainval_net.py \ 73 | --weight data/imagenet_weights/${NET}.ckpt \ 74 | --imdb ${TRAIN_IMDB} \ 75 | --imdbval ${TEST_IMDB} \ 76 | --iters ${ITERS} \ 77 | --cfg experiments/cfgs/${NET}.yml \ 78 | --tag ${EXTRA_ARGS_SLUG} \ 79 | --net ${NET} \ 80 | --set ANCHOR_SCALES ${ANCHORS} ANCHOR_RATIOS ${RATIOS} TRAIN.STEPSIZE ${STEPSIZE} ${EXTRA_ARGS} 81 | else 82 | CUDA_VISIBLE_DEVICES=${GPU_ID} time python ./tools/trainval_net.py \ 83 | --weight data/imagenet_weights/${NET}.ckpt \ 84 | --imdb ${TRAIN_IMDB} \ 85 | --imdbval ${TEST_IMDB} \ 86 | --iters ${ITERS} \ 87 | --cfg experiments/cfgs/${NET}.yml \ 88 | --net ${NET} \ 89 | --set ANCHOR_SCALES ${ANCHORS} ANCHOR_RATIOS ${RATIOS} TRAIN.STEPSIZE ${STEPSIZE} ${EXTRA_ARGS} 90 | fi 91 | fi 92 | 93 | ./experiments/scripts/test_faster_rcnn.sh $@ 94 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/experiments/scripts/train_faster_rcnn.sh~: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | set -x 4 | set -e 5 | 6 | export PYTHONUNBUFFERED="True" 7 | 8 | GPU_ID=$1 9 | DATASET=$2 10 | NET=$3 11 | 12 | array=( $@ ) 13 | len=${#array[@]} 14 | EXTRA_ARGS=${array[@]:3:$len} 15 | EXTRA_ARGS_SLUG=${EXTRA_ARGS// /_} 16 | 17 | case ${DATASET} in 18 | graspRGB) 19 | TRAIN_IMDB="graspRGB_train" 20 | TEST_IMDB="graspRGB_test" 21 | STEPSIZE=50000 22 | ITERS=160000 23 | #ANCHORS="[2,4,8,16,32]" 24 | ANCHORS="[8,16,32]" 25 | RATIOS="[0.5,1,2]" 26 | ;; 27 | pascal_voc) 28 | TRAIN_IMDB="voc_2007_trainval" 29 | TEST_IMDB="voc_2007_test" 30 | STEPSIZE=50000 31 | ITERS=70000 32 | ANCHORS="[8,16,32]" 33 | RATIOS="[0.5,1,2]" 34 | ;; 35 | pascal_voc_0712) 36 | TRAIN_IMDB="voc_2007_trainval+voc_2012_trainval" 37 | TEST_IMDB="voc_2007_test" 38 | STEPSIZE=80000 39 | ITERS=110000 40 | ANCHORS="[8,16,32]" 41 | RATIOS="[0.5,1,2]" 42 | ;; 43 | coco) 44 | TRAIN_IMDB="coco_2014_train+coco_2014_valminusminival" 45 | TEST_IMDB="coco_2014_minival" 46 | STEPSIZE=350000 47 | ITERS=490000 48 | ANCHORS="[4,8,16,32]" 49 | RATIOS="[0.5,1,2]" 50 | ;; 51 | *) 52 | echo "No dataset given" 53 | exit 54 | ;; 55 | esac 56 | 57 | LOG="experiments/logs/${NET}_${TRAIN_IMDB}_${EXTRA_ARGS_SLUG}_${NET}.txt.`date +'%Y-%m-%d_%H-%M-%S'`" 58 | exec &> >(tee -a "$LOG") 59 | echo Logging output to "$LOG" 60 | 61 | set +x 62 | if [[ ! -z ${EXTRA_ARGS_SLUG} ]]; then 63 | NET_FINAL=output/${NET}/${TRAIN_IMDB}/${EXTRA_ARGS_SLUG}/${NET}_faster_rcnn_iter_${ITERS}.ckpt 64 | else 65 | NET_FINAL=output/${NET}/${TRAIN_IMDB}/default/${NET}_faster_rcnn_iter_${ITERS}.ckpt 66 | fi 67 | set -x 68 | 69 | if [ ! -f ${NET_FINAL}.index ]; then 70 | if [[ ! 
-z ${EXTRA_ARGS_SLUG} ]]; then 71 | CUDA_VISIBLE_DEVICES=${GPU_ID} time python ./tools/trainval_net.py \ 72 | --weight data/imagenet_weights/${NET}.ckpt \ 73 | --imdb ${TRAIN_IMDB} \ 74 | --imdbval ${TEST_IMDB} \ 75 | --iters ${ITERS} \ 76 | --cfg experiments/cfgs/${NET}.yml \ 77 | --tag ${EXTRA_ARGS_SLUG} \ 78 | --net ${NET} \ 79 | --set ANCHOR_SCALES ${ANCHORS} ANCHOR_RATIOS ${RATIOS} TRAIN.STEPSIZE ${STEPSIZE} ${EXTRA_ARGS} 80 | else 81 | CUDA_VISIBLE_DEVICES=${GPU_ID} time python ./tools/trainval_net.py \ 82 | --weight data/imagenet_weights/${NET}.ckpt \ 83 | --imdb ${TRAIN_IMDB} \ 84 | --imdbval ${TEST_IMDB} \ 85 | --iters ${ITERS} \ 86 | --cfg experiments/cfgs/${NET}.yml \ 87 | --net ${NET} \ 88 | --set ANCHOR_SCALES ${ANCHORS} ANCHOR_RATIOS ${RATIOS} TRAIN.STEPSIZE ${STEPSIZE} ${EXTRA_ARGS} 89 | fi 90 | fi 91 | 92 | ./experiments/scripts/test_faster_rcnn.sh $@ 93 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/Makefile: -------------------------------------------------------------------------------- 1 | all: 2 | python setup.py build_ext --inplace 3 | rm -rf build 4 | clean: 5 | rm -rf */*.pyc 6 | rm -rf */*.so 7 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/VOCdevkit-matlab-wrapper/get_voc_opts.m: -------------------------------------------------------------------------------- 1 | function VOCopts = get_voc_opts(path) 2 | 3 | tmp = pwd; 4 | cd(path); 5 | try 6 | addpath('VOCcode'); 7 | VOCinit; 8 | catch 9 | rmpath('VOCcode'); 10 | cd(tmp); 11 | error(sprintf('VOCcode directory not found under %s', path)); 12 | end 13 | rmpath('VOCcode'); 14 | cd(tmp); 15 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/VOCdevkit-matlab-wrapper/voc_eval.m: -------------------------------------------------------------------------------- 1 | function res = voc_eval(path, comp_id, test_set, output_dir) 2 | 3 | VOCopts = get_voc_opts(path); 4 | VOCopts.testset = test_set; 5 | 6 | for i = 1:length(VOCopts.classes) 7 | cls = VOCopts.classes{i}; 8 | res(i) = voc_eval_cls(cls, VOCopts, comp_id, output_dir); 9 | end 10 | 11 | fprintf('\n~~~~~~~~~~~~~~~~~~~~\n'); 12 | fprintf('Results:\n'); 13 | aps = [res(:).ap]'; 14 | fprintf('%.1f\n', aps * 100); 15 | fprintf('%.1f\n', mean(aps) * 100); 16 | fprintf('~~~~~~~~~~~~~~~~~~~~\n'); 17 | 18 | function res = voc_eval_cls(cls, VOCopts, comp_id, output_dir) 19 | 20 | test_set = VOCopts.testset; 21 | year = VOCopts.dataset(4:end); 22 | 23 | addpath(fullfile(VOCopts.datadir, 'VOCcode')); 24 | 25 | res_fn = sprintf(VOCopts.detrespath, comp_id, cls); 26 | 27 | recall = []; 28 | prec = []; 29 | ap = 0; 30 | ap_auc = 0; 31 | 32 | do_eval = (str2num(year) <= 2007) | ~strcmp(test_set, 'test'); 33 | if do_eval 34 | % Bug in VOCevaldet requires that tic has been called first 35 | tic; 36 | [recall, prec, ap] = VOCevaldet(VOCopts, comp_id, cls, true); 37 | ap_auc = xVOCap(recall, prec); 38 | 39 | % force plot limits 40 | ylim([0 1]); 41 | xlim([0 1]); 42 | 43 | print(gcf, '-djpeg', '-r0', ... 44 | [output_dir '/' cls '_pr.jpg']); 45 | end 46 | fprintf('!!! %s : %.4f %.4f\n', cls, ap, ap_auc); 47 | 48 | res.recall = recall; 49 | res.prec = prec; 50 | res.ap = ap; 51 | res.ap_auc = ap_auc; 52 | 53 | save([output_dir '/' cls '_pr.mat'], ... 
54 | 'res', 'recall', 'prec', 'ap', 'ap_auc'); 55 | 56 | rmpath(fullfile(VOCopts.datadir, 'VOCcode')); 57 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/VOCdevkit-matlab-wrapper/xVOCap.m: -------------------------------------------------------------------------------- 1 | function ap = xVOCap(rec,prec) 2 | % From the PASCAL VOC 2011 devkit 3 | 4 | mrec=[0 ; rec ; 1]; 5 | mpre=[0 ; prec ; 0]; 6 | for i=numel(mpre)-1:-1:1 7 | mpre(i)=max(mpre(i),mpre(i+1)); 8 | end 9 | i=find(mrec(2:end)~=mrec(1:end-1))+1; 10 | ap=sum((mrec(i)-mrec(i-1)).*mpre(i)); 11 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/__pycache__/__init__.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/datasets/__pycache__/__init__.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/__pycache__/coco.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/datasets/__pycache__/coco.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/__pycache__/ds_utils.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/datasets/__pycache__/ds_utils.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/__pycache__/factory.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/datasets/__pycache__/factory.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/__pycache__/graspRGB.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/datasets/__pycache__/graspRGB.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/__pycache__/imdb.cpython-36.pyc: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/datasets/__pycache__/imdb.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/__pycache__/pascal_voc.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/datasets/__pycache__/pascal_voc.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/__pycache__/voc_eval.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/datasets/__pycache__/voc_eval.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/ds_utils.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast/er R-CNN 3 | # Licensed under The MIT License [see LICENSE for details] 4 | # Written by Ross Girshick 5 | # -------------------------------------------------------- 6 | from __future__ import absolute_import 7 | from __future__ import division 8 | from __future__ import print_function 9 | 10 | import numpy as np 11 | 12 | 13 | def unique_boxes(boxes, scale=1.0): 14 | """Return indices of unique boxes.""" 15 | v = np.array([1, 1e3, 1e6, 1e9]) 16 | hashes = np.round(boxes * scale).dot(v) 17 | _, index = np.unique(hashes, return_index=True) 18 | return np.sort(index) 19 | 20 | 21 | def xywh_to_xyxy(boxes): 22 | """Convert [x y w h] box format to [x1 y1 x2 y2] format.""" 23 | return np.hstack((boxes[:, 0:2], boxes[:, 0:2] + boxes[:, 2:4] - 1)) 24 | 25 | 26 | def xyxy_to_xywh(boxes): 27 | """Convert [x1 y1 x2 y2] box format to [x y w h] format.""" 28 | return np.hstack((boxes[:, 0:2], boxes[:, 2:4] - boxes[:, 0:2] + 1)) 29 | 30 | 31 | def validate_boxes(boxes, width=0, height=0): 32 | """Check that a set of boxes are valid.""" 33 | x1 = boxes[:, 0] 34 | y1 = boxes[:, 1] 35 | x2 = boxes[:, 2] 36 | y2 = boxes[:, 3] 37 | assert (x1 >= 0).all() 38 | assert (y1 >= 0).all() 39 | assert (x2 >= x1).all() 40 | assert (y2 >= y1).all() 41 | assert (x2 < width).all() 42 | assert (y2 < height).all() 43 | 44 | 45 | def filter_small_boxes(boxes, min_size): 46 | w = boxes[:, 2] - boxes[:, 0] 47 | h = boxes[:, 3] - boxes[:, 1] 48 | keep = np.where((w >= min_size) & (h > min_size))[0] 49 | return keep 50 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/factory.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | 8 | """Factory method for easily getting imdbs by name.""" 9 | from __future__ 
import absolute_import 10 | from __future__ import division 11 | from __future__ import print_function 12 | from datasets.graspRGB import graspRGB 13 | 14 | __sets = {} 15 | from datasets.pascal_voc import pascal_voc 16 | from datasets.coco import coco 17 | 18 | import numpy as np 19 | import os 20 | 21 | # Set up voc_<year>_<split> 22 | for year in ['2007', '2012']: 23 | for split in ['train', 'val', 'trainval', 'test']: 24 | name = 'voc_{}_{}'.format(year, split) 25 | __sets[name] = (lambda split=split, year=year: pascal_voc(split, year)) 26 | 27 | # Set up coco_2014_<split> 28 | for year in ['2014']: 29 | for split in ['train', 'val', 'minival', 'valminusminival', 'trainval']: 30 | name = 'coco_{}_{}'.format(year, split) 31 | __sets[name] = (lambda split=split, year=year: coco(split, year)) 32 | 33 | # Set up coco_2015_<split> 34 | for year in ['2015']: 35 | for split in ['test', 'test-dev']: 36 | name = 'coco_{}_{}'.format(year, split) 37 | __sets[name] = (lambda split=split, year=year: coco(split, year)) 38 | 39 | # Set up graspRGB_<split> using selective search "fast" mode # added by FC 40 | # graspRGB_devkit_path = '/home/xusheng/Grasp/grasp_multiObject_multiGrasp' 41 | graspRGB_devkit_path = os.path.abspath(os.path.join(os.path.split(os.path.abspath(__file__))[0], '..', '..')) 42 | for split in ['train', 'test']: 43 | name = '{}_{}'.format('graspRGB', split) 44 | __sets[name] = (lambda split=split: graspRGB(split, graspRGB_devkit_path)) 45 | 46 | def get_imdb(name): 47 | """Get an imdb (image database) by name.""" 48 | if name not in __sets: 49 | raise KeyError('Unknown dataset: {}'.format(name)) 50 | return __sets[name]() 51 | 52 | 53 | def list_imdbs(): 54 | """List all registered imdbs.""" 55 | return list(__sets.keys()) 56 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/imdb.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick and Xinlei Chen 6 | # -------------------------------------------------------- 7 | from __future__ import absolute_import 8 | from __future__ import division 9 | from __future__ import print_function 10 | 11 | import os 12 | import os.path as osp 13 | import PIL 14 | from utils.cython_bbox import bbox_overlaps 15 | import numpy as np 16 | import scipy.sparse 17 | from model.config import cfg 18 | 19 | 20 | class imdb(object): 21 | """Image database.""" 22 | 23 | def __init__(self, name, classes=None): 24 | self._name = name 25 | self._num_classes = 0 26 | if not classes: 27 | self._classes = [] 28 | else: 29 | self._classes = classes 30 | self._image_index = [] 31 | self._obj_proposer = 'gt' 32 | self._roidb = None 33 | self._roidb_handler = self.default_roidb 34 | # Use this dict for storing dataset specific config options 35 | self.config = {} 36 | 37 | @property 38 | def name(self): 39 | return self._name 40 | 41 | @property 42 | def num_classes(self): 43 | return len(self._classes) 44 | 45 | @property 46 | def classes(self): 47 | return self._classes 48 | 49 | @property 50 | def image_index(self): 51 | return self._image_index 52 | 53 | @property 54 | def roidb_handler(self): 55 | return self._roidb_handler 56 | 57 | @roidb_handler.setter 58 | def roidb_handler(self, val): 59 | self._roidb_handler = val 60 | 61 | def set_proposal_method(self, method): 62 | method =
eval('self.' + method + '_roidb') 63 | self.roidb_handler = method 64 | 65 | @property 66 | def roidb(self): 67 | # A roidb is a list of dictionaries, each with the following keys: 68 | # boxes 69 | # gt_overlaps 70 | # gt_classes 71 | # flipped 72 | if self._roidb is not None: 73 | return self._roidb 74 | self._roidb = self.roidb_handler() 75 | return self._roidb 76 | 77 | @property 78 | def cache_path(self): 79 | cache_path = osp.abspath(osp.join(cfg.DATA_DIR, 'cache')) 80 | if not os.path.exists(cache_path): 81 | os.makedirs(cache_path) 82 | return cache_path 83 | 84 | @property 85 | def num_images(self): 86 | return len(self.image_index) 87 | 88 | def image_path_at(self, i): 89 | raise NotImplementedError 90 | 91 | def default_roidb(self): 92 | raise NotImplementedError 93 | 94 | def evaluate_detections(self, all_boxes, output_dir=None): 95 | """ 96 | all_boxes is a list of length number-of-classes. 97 | Each list element is a list of length number-of-images. 98 | Each of those list elements is either an empty list [] 99 | or a numpy array of detection. 100 | 101 | all_boxes[class][image] = [] or np.array of shape #dets x 5 102 | """ 103 | raise NotImplementedError 104 | 105 | def _get_widths(self): 106 | return [PIL.Image.open(self.image_path_at(i)).size[0] 107 | for i in range(self.num_images)] 108 | 109 | def append_flipped_images(self): 110 | num_images = self.num_images 111 | widths = self._get_widths() 112 | for i in range(num_images): 113 | boxes = self.roidb[i]['boxes'].copy() 114 | oldx1 = boxes[:, 0].copy() 115 | oldx2 = boxes[:, 2].copy() 116 | boxes[:, 0] = widths[i] - oldx2 - 1 117 | boxes[:, 2] = widths[i] - oldx1 - 1 118 | assert (boxes[:, 2] >= boxes[:, 0]).all() 119 | entry = {'boxes': boxes, 120 | 'gt_overlaps': self.roidb[i]['gt_overlaps'], 121 | 'gt_classes': self.roidb[i]['gt_classes'], 122 | 'flipped': True} 123 | self.roidb.append(entry) 124 | self._image_index = self._image_index * 2 125 | 126 | def evaluate_recall(self, candidate_boxes=None, thresholds=None, 127 | area='all', limit=None): 128 | """Evaluate detection proposal recall metrics. 
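Unless an explicit thresholds vector is supplied, recall is measured at IoU thresholds 0.5, 0.55, ..., 0.95, and 'ar' is simply the mean of those recall values; a trapezoidal variant is left commented out near the end of this method.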
129 | 130 | Returns: 131 | results: dictionary of results with keys 132 | 'ar': average recall 133 | 'recalls': vector recalls at each IoU overlap threshold 134 | 'thresholds': vector of IoU overlap thresholds 135 | 'gt_overlaps': vector of all ground-truth overlaps 136 | """ 137 | # Record max overlap value for each gt box 138 | # Return vector of overlap values 139 | areas = {'all': 0, 'small': 1, 'medium': 2, 'large': 3, 140 | '96-128': 4, '128-256': 5, '256-512': 6, '512-inf': 7} 141 | area_ranges = [[0 ** 2, 1e5 ** 2], # all 142 | [0 ** 2, 32 ** 2], # small 143 | [32 ** 2, 96 ** 2], # medium 144 | [96 ** 2, 1e5 ** 2], # large 145 | [96 ** 2, 128 ** 2], # 96-128 146 | [128 ** 2, 256 ** 2], # 128-256 147 | [256 ** 2, 512 ** 2], # 256-512 148 | [512 ** 2, 1e5 ** 2], # 512-inf 149 | ] 150 | assert area in areas, 'unknown area range: {}'.format(area) 151 | area_range = area_ranges[areas[area]] 152 | gt_overlaps = np.zeros(0) 153 | num_pos = 0 154 | for i in range(self.num_images): 155 | # Checking for max_overlaps == 1 avoids including crowd annotations 156 | # (...pretty hacking :/) 157 | max_gt_overlaps = self.roidb[i]['gt_overlaps'].toarray().max(axis=1) 158 | gt_inds = np.where((self.roidb[i]['gt_classes'] > 0) & 159 | (max_gt_overlaps == 1))[0] 160 | gt_boxes = self.roidb[i]['boxes'][gt_inds, :] 161 | gt_areas = self.roidb[i]['seg_areas'][gt_inds] 162 | valid_gt_inds = np.where((gt_areas >= area_range[0]) & 163 | (gt_areas <= area_range[1]))[0] 164 | gt_boxes = gt_boxes[valid_gt_inds, :] 165 | num_pos += len(valid_gt_inds) 166 | 167 | if candidate_boxes is None: 168 | # If candidate_boxes is not supplied, the default is to use the 169 | # non-ground-truth boxes from this roidb 170 | non_gt_inds = np.where(self.roidb[i]['gt_classes'] == 0)[0] 171 | boxes = self.roidb[i]['boxes'][non_gt_inds, :] 172 | else: 173 | boxes = candidate_boxes[i] 174 | if boxes.shape[0] == 0: 175 | continue 176 | if limit is not None and boxes.shape[0] > limit: 177 | boxes = boxes[:limit, :] 178 | 179 | overlaps = bbox_overlaps(boxes.astype(np.float), 180 | gt_boxes.astype(np.float)) 181 | 182 | _gt_overlaps = np.zeros((gt_boxes.shape[0])) 183 | for j in range(gt_boxes.shape[0]): 184 | # find which proposal box maximally covers each gt box 185 | argmax_overlaps = overlaps.argmax(axis=0) 186 | # and get the iou amount of coverage for each gt box 187 | max_overlaps = overlaps.max(axis=0) 188 | # find which gt box is 'best' covered (i.e. 
'best' = most iou) 189 | gt_ind = max_overlaps.argmax() 190 | gt_ovr = max_overlaps.max() 191 | assert (gt_ovr >= 0) 192 | # find the proposal box that covers the best covered gt box 193 | box_ind = argmax_overlaps[gt_ind] 194 | # record the iou coverage of this gt box 195 | _gt_overlaps[j] = overlaps[box_ind, gt_ind] 196 | assert (_gt_overlaps[j] == gt_ovr) 197 | # mark the proposal box and the gt box as used 198 | overlaps[box_ind, :] = -1 199 | overlaps[:, gt_ind] = -1 200 | # append recorded iou coverage level 201 | gt_overlaps = np.hstack((gt_overlaps, _gt_overlaps)) 202 | 203 | gt_overlaps = np.sort(gt_overlaps) 204 | if thresholds is None: 205 | step = 0.05 206 | thresholds = np.arange(0.5, 0.95 + 1e-5, step) 207 | recalls = np.zeros_like(thresholds) 208 | # compute recall for each iou threshold 209 | for i, t in enumerate(thresholds): 210 | recalls[i] = (gt_overlaps >= t).sum() / float(num_pos) 211 | # ar = 2 * np.trapz(recalls, thresholds) 212 | ar = recalls.mean() 213 | return {'ar': ar, 'recalls': recalls, 'thresholds': thresholds, 214 | 'gt_overlaps': gt_overlaps} 215 | 216 | def create_roidb_from_box_list(self, box_list, gt_roidb): 217 | assert len(box_list) == self.num_images, \ 218 | 'Number of boxes must match number of ground-truth images' 219 | roidb = [] 220 | for i in range(self.num_images): 221 | boxes = box_list[i] 222 | num_boxes = boxes.shape[0] 223 | overlaps = np.zeros((num_boxes, self.num_classes), dtype=np.float32) 224 | 225 | if gt_roidb is not None and gt_roidb[i]['boxes'].size > 0: 226 | gt_boxes = gt_roidb[i]['boxes'] 227 | gt_classes = gt_roidb[i]['gt_classes'] 228 | gt_overlaps = bbox_overlaps(boxes.astype(np.float), 229 | gt_boxes.astype(np.float)) 230 | argmaxes = gt_overlaps.argmax(axis=1) 231 | maxes = gt_overlaps.max(axis=1) 232 | I = np.where(maxes > 0)[0] 233 | overlaps[I, gt_classes[argmaxes[I]]] = maxes[I] 234 | 235 | overlaps = scipy.sparse.csr_matrix(overlaps) 236 | roidb.append({ 237 | 'boxes': boxes, 238 | 'gt_classes': np.zeros((num_boxes,), dtype=np.int32), 239 | 'gt_overlaps': overlaps, 240 | 'flipped': False, 241 | 'seg_areas': np.zeros((num_boxes,), dtype=np.float32), 242 | }) 243 | return roidb 244 | 245 | @staticmethod 246 | def merge_roidbs(a, b): 247 | assert len(a) == len(b) 248 | for i in range(len(a)): 249 | a[i]['boxes'] = np.vstack((a[i]['boxes'], b[i]['boxes'])) 250 | a[i]['gt_classes'] = np.hstack((a[i]['gt_classes'], 251 | b[i]['gt_classes'])) 252 | a[i]['gt_overlaps'] = scipy.sparse.vstack([a[i]['gt_overlaps'], 253 | b[i]['gt_overlaps']]) 254 | a[i]['seg_areas'] = np.hstack((a[i]['seg_areas'], 255 | b[i]['seg_areas'])) 256 | return a 257 | 258 | def competition_mode(self, on): 259 | """Turn competition mode on or off.""" 260 | pass 261 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/tools/mcg_munge.py: -------------------------------------------------------------------------------- 1 | import os 2 | import sys 3 | 4 | """Hacky tool to convert file system layout of MCG boxes downloaded from 5 | http://www.eecs.berkeley.edu/Research/Projects/CS/vision/grouping/mcg/ 6 | so that it's consistent with those computed by Jan Hosang (see: 7 | http://www.mpi-inf.mpg.de/departments/computer-vision-and-multimodal- 8 | computing/research/object-recognition-and-scene-understanding/how- 9 | good-are-detection-proposals-really/) 10 | 11 | NB: Boxes from the MCG website are in (y1, x1, y2, x2) order. 12 | Boxes from Hosang et al. are in (x1, y1, x2, y2) order. 
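Note that this script only relocates the .mat files; it does not reorder box columns. If a consumer needs the Hosang layout, a NumPy fancy index such as boxes[:, [1, 0, 3, 2]] (a hypothetical one-liner, not part of this tool) turns (y1, x1, y2, x2) into (x1, y1, x2, y2).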
13 | """ 14 | 15 | def munge(src_dir): 16 | # stored as: ./MCG-COCO-val2014-boxes/COCO_val2014_000000193401.mat 17 | # want: ./MCG/mat/COCO_val2014_0/COCO_val2014_000000141/COCO_val2014_000000141334.mat 18 | 19 | files = os.listdir(src_dir) 20 | for fn in files: 21 | base, ext = os.path.splitext(fn) 22 | # first 14 chars / first 22 chars / all chars + .mat 23 | # COCO_val2014_0/COCO_val2014_000000447/COCO_val2014_000000447991.mat 24 | first = base[:14] 25 | second = base[:22] 26 | dst_dir = os.path.join('MCG', 'mat', first, second) 27 | if not os.path.exists(dst_dir): 28 | os.makedirs(dst_dir) 29 | src = os.path.join(src_dir, fn) 30 | dst = os.path.join(dst_dir, fn) 31 | print 'MV: {} -> {}'.format(src, dst) 32 | os.rename(src, dst) 33 | 34 | if __name__ == '__main__': 35 | # src_dir should look something like: 36 | # src_dir = 'MCG-COCO-val2014-boxes' 37 | src_dir = sys.argv[1] 38 | munge(src_dir) 39 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/datasets/voc_eval.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast/er R-CNN 3 | # Licensed under The MIT License [see LICENSE for details] 4 | # Written by Bharath Hariharan 5 | # -------------------------------------------------------- 6 | from __future__ import absolute_import 7 | from __future__ import division 8 | from __future__ import print_function 9 | 10 | import xml.etree.ElementTree as ET 11 | import os 12 | import pickle 13 | import numpy as np 14 | 15 | def parse_rec(filename): 16 | """ Parse a PASCAL VOC xml file """ 17 | tree = ET.parse(filename) 18 | objects = [] 19 | for obj in tree.findall('object'): 20 | obj_struct = {} 21 | obj_struct['name'] = obj.find('name').text 22 | obj_struct['pose'] = obj.find('pose').text 23 | obj_struct['truncated'] = int(obj.find('truncated').text) 24 | obj_struct['difficult'] = int(obj.find('difficult').text) 25 | bbox = obj.find('bndbox') 26 | obj_struct['bbox'] = [int(bbox.find('xmin').text), 27 | int(bbox.find('ymin').text), 28 | int(bbox.find('xmax').text), 29 | int(bbox.find('ymax').text)] 30 | objects.append(obj_struct) 31 | 32 | return objects 33 | 34 | 35 | def voc_ap(rec, prec, use_07_metric=False): 36 | """ ap = voc_ap(rec, prec, [use_07_metric]) 37 | Compute VOC AP given precision and recall. 38 | If use_07_metric is true, uses the 39 | VOC 07 11 point method (default:False). 40 | """ 41 | if use_07_metric: 42 | # 11 point metric 43 | ap = 0. 44 | for t in np.arange(0., 1.1, 0.1): 45 | if np.sum(rec >= t) == 0: 46 | p = 0 47 | else: 48 | p = np.max(prec[rec >= t]) 49 | ap = ap + p / 11. 
50 | else: 51 | # correct AP calculation 52 | # first append sentinel values at the end 53 | mrec = np.concatenate(([0.], rec, [1.])) 54 | mpre = np.concatenate(([0.], prec, [0.])) 55 | 56 | # compute the precision envelope 57 | for i in range(mpre.size - 1, 0, -1): 58 | mpre[i - 1] = np.maximum(mpre[i - 1], mpre[i]) 59 | 60 | # to calculate area under PR curve, look for points 61 | # where X axis (recall) changes value 62 | i = np.where(mrec[1:] != mrec[:-1])[0] 63 | 64 | # and sum (\Delta recall) * prec 65 | ap = np.sum((mrec[i + 1] - mrec[i]) * mpre[i + 1]) 66 | return ap 67 | 68 | 69 | def voc_eval(detpath, 70 | annopath, 71 | imagesetfile, 72 | classname, 73 | cachedir, 74 | ovthresh=0.5, 75 | use_07_metric=False): 76 | """rec, prec, ap = voc_eval(detpath, 77 | annopath, 78 | imagesetfile, 79 | classname, 80 | [ovthresh], 81 | [use_07_metric]) 82 | 83 | Top level function that does the PASCAL VOC evaluation. 84 | 85 | detpath: Path to detections 86 | detpath.format(classname) should produce the detection results file. 87 | annopath: Path to annotations 88 | annopath.format(imagename) should be the xml annotations file. 89 | imagesetfile: Text file containing the list of images, one image per line. 90 | classname: Category name (duh) 91 | cachedir: Directory for caching the annotations 92 | [ovthresh]: Overlap threshold (default = 0.5) 93 | [use_07_metric]: Whether to use VOC07's 11 point AP computation 94 | (default False) 95 | """ 96 | # assumes detections are in detpath.format(classname) 97 | # assumes annotations are in annopath.format(imagename) 98 | # assumes imagesetfile is a text file with each line an image name 99 | # cachedir caches the annotations in a pickle file 100 | 101 | # first load gt 102 | if not os.path.isdir(cachedir): 103 | os.mkdir(cachedir) 104 | cachefile = os.path.join(cachedir, 'annots.pkl') 105 | # read list of images 106 | with open(imagesetfile, 'r') as f: 107 | lines = f.readlines() 108 | imagenames = [x.strip() for x in lines] 109 | 110 | if not os.path.isfile(cachefile): 111 | # load annots 112 | recs = {} 113 | for i, imagename in enumerate(imagenames): 114 | recs[imagename] = parse_rec(annopath.format(imagename)) 115 | if i % 100 == 0: 116 | print('Reading annotation for {:d}/{:d}'.format( 117 | i + 1, len(imagenames))) 118 | # save 119 | print('Saving cached annotations to {:s}'.format(cachefile)) 120 | with open(cachefile, 'wb') as f: 121 | pickle.dump(recs, f) 122 | else: 123 | # load 124 | with open(cachefile, 'rb') as f: 125 | try: 126 | recs = pickle.load(f) 127 | except: 128 | recs = pickle.load(f, encoding='bytes') 129 | 130 | # extract gt objects for this class 131 | class_recs = {} 132 | npos = 0 133 | for imagename in imagenames: 134 | R = [obj for obj in recs[imagename] if obj['name'] == classname] 135 | bbox = np.array([x['bbox'] for x in R]) 136 | difficult = np.array([x['difficult'] for x in R]).astype(np.bool) 137 | det = [False] * len(R) 138 | npos = npos + sum(~difficult) 139 | class_recs[imagename] = {'bbox': bbox, 140 | 'difficult': difficult, 141 | 'det': det} 142 | 143 | # read dets 144 | detfile = detpath.format(classname) 145 | with open(detfile, 'r') as f: 146 | lines = f.readlines() 147 | 148 | splitlines = [x.strip().split(' ') for x in lines] 149 | image_ids = [x[0] for x in splitlines] 150 | confidence = np.array([float(x[1]) for x in splitlines]) 151 | BB = np.array([[float(z) for z in x[2:]] for x in splitlines]) 152 | 153 | nd = len(image_ids) 154 | tp = np.zeros(nd) 155 | fp = np.zeros(nd) 156 | 157 | if BB.shape[0] >
0: 158 | # sort by confidence 159 | sorted_ind = np.argsort(-confidence) 160 | sorted_scores = np.sort(-confidence) 161 | BB = BB[sorted_ind, :] 162 | image_ids = [image_ids[x] for x in sorted_ind] 163 | 164 | # go down dets and mark TPs and FPs 165 | for d in range(nd): 166 | R = class_recs[image_ids[d]] 167 | bb = BB[d, :].astype(float) 168 | ovmax = -np.inf 169 | BBGT = R['bbox'].astype(float) 170 | 171 | if BBGT.size > 0: 172 | # compute overlaps 173 | # intersection 174 | ixmin = np.maximum(BBGT[:, 0], bb[0]) 175 | iymin = np.maximum(BBGT[:, 1], bb[1]) 176 | ixmax = np.minimum(BBGT[:, 2], bb[2]) 177 | iymax = np.minimum(BBGT[:, 3], bb[3]) 178 | iw = np.maximum(ixmax - ixmin + 1., 0.) 179 | ih = np.maximum(iymax - iymin + 1., 0.) 180 | inters = iw * ih 181 | 182 | # union 183 | uni = ((bb[2] - bb[0] + 1.) * (bb[3] - bb[1] + 1.) + 184 | (BBGT[:, 2] - BBGT[:, 0] + 1.) * 185 | (BBGT[:, 3] - BBGT[:, 1] + 1.) - inters) 186 | 187 | overlaps = inters / uni 188 | ovmax = np.max(overlaps) 189 | jmax = np.argmax(overlaps) 190 | 191 | if ovmax > ovthresh: 192 | if not R['difficult'][jmax]: 193 | if not R['det'][jmax]: 194 | tp[d] = 1. 195 | R['det'][jmax] = 1 196 | else: 197 | fp[d] = 1. 198 | else: 199 | fp[d] = 1. 200 | 201 | # compute precision recall 202 | fp = np.cumsum(fp) 203 | tp = np.cumsum(tp) 204 | rec = tp / float(npos) 205 | # avoid divide by zero in case the first detection matches a difficult 206 | # ground truth 207 | prec = tp / np.maximum(tp + fp, np.finfo(np.float64).eps) 208 | ap = voc_ap(rec, prec, use_07_metric) 209 | 210 | return rec, prec, ap 211 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/layer_utils/__init__.py -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/__init__.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/__init__.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/anchor_target_layer.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/anchor_target_layer.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/generate_anchors.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/generate_anchors.cpython-36.pyc -------------------------------------------------------------------------------- 
/grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/proposal_layer.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/proposal_layer.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/proposal_target_layer.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/proposal_target_layer.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/proposal_top_layer.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/proposal_top_layer.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/snippets.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/layer_utils/__pycache__/snippets.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/anchor_target_layer.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Faster R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick and Xinlei Chen 6 | # -------------------------------------------------------- 7 | from __future__ import absolute_import 8 | from __future__ import division 9 | from __future__ import print_function 10 | 11 | import os 12 | from model.config import cfg 13 | import numpy as np 14 | import numpy.random as npr 15 | from utils.cython_bbox import bbox_overlaps 16 | from model.bbox_transform import bbox_transform 17 | 18 | def anchor_target_layer(rpn_cls_score, gt_boxes, im_info, _feat_stride, all_anchors, num_anchors): 19 | """Same as the anchor target layer in original Fast/er RCNN """ 20 | A = num_anchors 21 | total_anchors = all_anchors.shape[0] 22 | K = total_anchors / num_anchors 23 | im_info = im_info[0] 24 | 25 | # allow boxes to sit over the edge by a small amount 26 | _allowed_border = 0 27 | 28 | # map of shape (..., H, W) 29 | height, width = rpn_cls_score.shape[1:3] 30 | 31 | # only keep anchors inside the image 32 | inds_inside = np.where( 33 | (all_anchors[:, 0] >= -_allowed_border) & 34 | (all_anchors[:, 1] >= -_allowed_border) & 35 | (all_anchors[:, 2] < im_info[1] + _allowed_border) & # width 36 | (all_anchors[:, 3] < im_info[0] + _allowed_border) # height 37 | )[0] 38 | 39 | # keep only inside anchors 40 | anchors = all_anchors[inds_inside, :] 41 | 42 | # label: 1 is positive, 0 is negative, 
-1 is dont care 43 | labels = np.empty((len(inds_inside),), dtype=np.float32) 44 | labels.fill(-1) 45 | 46 | # overlaps between the anchors and the gt boxes 47 | # overlaps (ex, gt) 48 | overlaps = bbox_overlaps( 49 | np.ascontiguousarray(anchors, dtype=np.float), 50 | np.ascontiguousarray(gt_boxes, dtype=np.float)) 51 | argmax_overlaps = overlaps.argmax(axis=1) 52 | max_overlaps = overlaps[np.arange(len(inds_inside)), argmax_overlaps] 53 | gt_argmax_overlaps = overlaps.argmax(axis=0) 54 | gt_max_overlaps = overlaps[gt_argmax_overlaps, 55 | np.arange(overlaps.shape[1])] 56 | gt_argmax_overlaps = np.where(overlaps == gt_max_overlaps)[0] 57 | 58 | if not cfg.TRAIN.RPN_CLOBBER_POSITIVES: 59 | # assign bg labels first so that positive labels can clobber them 60 | # first set the negatives 61 | labels[max_overlaps < cfg.TRAIN.RPN_NEGATIVE_OVERLAP] = 0 62 | 63 | # fg label: for each gt, anchor with highest overlap 64 | labels[gt_argmax_overlaps] = 1 65 | 66 | # fg label: above threshold IOU 67 | labels[max_overlaps >= cfg.TRAIN.RPN_POSITIVE_OVERLAP] = 1 68 | 69 | if cfg.TRAIN.RPN_CLOBBER_POSITIVES: 70 | # assign bg labels last so that negative labels can clobber positives 71 | labels[max_overlaps < cfg.TRAIN.RPN_NEGATIVE_OVERLAP] = 0 72 | 73 | # subsample positive labels if we have too many 74 | num_fg = int(cfg.TRAIN.RPN_FG_FRACTION * cfg.TRAIN.RPN_BATCHSIZE) 75 | fg_inds = np.where(labels == 1)[0] 76 | if len(fg_inds) > num_fg: 77 | disable_inds = npr.choice( 78 | fg_inds, size=(len(fg_inds) - num_fg), replace=False) 79 | labels[disable_inds] = -1 80 | 81 | # subsample negative labels if we have too many 82 | num_bg = cfg.TRAIN.RPN_BATCHSIZE - np.sum(labels == 1) 83 | bg_inds = np.where(labels == 0)[0] 84 | if len(bg_inds) > num_bg: 85 | disable_inds = npr.choice( 86 | bg_inds, size=(len(bg_inds) - num_bg), replace=False) 87 | labels[disable_inds] = -1 88 | 89 | bbox_targets = np.zeros((len(inds_inside), 4), dtype=np.float32) 90 | bbox_targets = _compute_targets(anchors, gt_boxes[argmax_overlaps, :]) 91 | 92 | bbox_inside_weights = np.zeros((len(inds_inside), 4), dtype=np.float32) 93 | # only the positive ones have regression targets 94 | bbox_inside_weights[labels == 1, :] = np.array(cfg.TRAIN.RPN_BBOX_INSIDE_WEIGHTS) 95 | 96 | bbox_outside_weights = np.zeros((len(inds_inside), 4), dtype=np.float32) 97 | if cfg.TRAIN.RPN_POSITIVE_WEIGHT < 0: 98 | # uniform weighting of examples (given non-uniform sampling) 99 | num_examples = np.sum(labels >= 0) 100 | positive_weights = np.ones((1, 4)) * 1.0 / num_examples 101 | negative_weights = np.ones((1, 4)) * 1.0 / num_examples 102 | else: 103 | assert ((cfg.TRAIN.RPN_POSITIVE_WEIGHT > 0) & 104 | (cfg.TRAIN.RPN_POSITIVE_WEIGHT < 1)) 105 | positive_weights = (cfg.TRAIN.RPN_POSITIVE_WEIGHT / 106 | np.sum(labels == 1)) 107 | negative_weights = ((1.0 - cfg.TRAIN.RPN_POSITIVE_WEIGHT) / 108 | np.sum(labels == 0)) 109 | bbox_outside_weights[labels == 1, :] = positive_weights 110 | bbox_outside_weights[labels == 0, :] = negative_weights 111 | 112 | # map up to original set of anchors 113 | labels = _unmap(labels, total_anchors, inds_inside, fill=-1) 114 | bbox_targets = _unmap(bbox_targets, total_anchors, inds_inside, fill=0) 115 | bbox_inside_weights = _unmap(bbox_inside_weights, total_anchors, inds_inside, fill=0) 116 | bbox_outside_weights = _unmap(bbox_outside_weights, total_anchors, inds_inside, fill=0) 117 | 118 | # labels 119 | labels = labels.reshape((1, height, width, A)).transpose(0, 3, 1, 2) 120 | labels = labels.reshape((1, 1, A * height, width)) 
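# Sanity check on the two reshapes above (hypothetical sizes, not from
# this repo): the labels move from a flat (height * width * A,) vector to
# (1, A, height, width) and then to (1, 1, A * height, width), so with
# height=38, width=50 and A=9 the shape here would be (1, 1, 342, 50).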
121 | rpn_labels = labels 122 | 123 | # bbox_targets 124 | bbox_targets = bbox_targets \ 125 | .reshape((1, height, width, A * 4)) 126 | 127 | rpn_bbox_targets = bbox_targets 128 | # bbox_inside_weights 129 | bbox_inside_weights = bbox_inside_weights \ 130 | .reshape((1, height, width, A * 4)) 131 | 132 | rpn_bbox_inside_weights = bbox_inside_weights 133 | 134 | # bbox_outside_weights 135 | bbox_outside_weights = bbox_outside_weights \ 136 | .reshape((1, height, width, A * 4)) 137 | 138 | rpn_bbox_outside_weights = bbox_outside_weights 139 | return rpn_labels, rpn_bbox_targets, rpn_bbox_inside_weights, rpn_bbox_outside_weights 140 | 141 | 142 | def _unmap(data, count, inds, fill=0): 143 | """ Unmap a subset of item (data) back to the original set of items (of 144 | size count) """ 145 | if len(data.shape) == 1: 146 | ret = np.empty((count,), dtype=np.float32) 147 | ret.fill(fill) 148 | ret[inds] = data 149 | else: 150 | ret = np.empty((count,) + data.shape[1:], dtype=np.float32) 151 | ret.fill(fill) 152 | ret[inds, :] = data 153 | return ret 154 | 155 | 156 | def _compute_targets(ex_rois, gt_rois): 157 | """Compute bounding-box regression targets for an image.""" 158 | 159 | assert ex_rois.shape[0] == gt_rois.shape[0] 160 | assert ex_rois.shape[1] == 4 161 | assert gt_rois.shape[1] == 5 162 | 163 | return bbox_transform(ex_rois, gt_rois[:, :4]).astype(np.float32, copy=False) 164 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/generate_anchors.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Faster R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick and Sean Bell 6 | # -------------------------------------------------------- 7 | from __future__ import absolute_import 8 | from __future__ import division 9 | from __future__ import print_function 10 | 11 | import numpy as np 12 | 13 | 14 | # Verify that we compute the same anchors as Shaoqing's matlab implementation: 15 | # 16 | # >> load output/rpn_cachedir/faster_rcnn_VOC2007_ZF_stage1_rpn/anchors.mat 17 | # >> anchors 18 | # 19 | # anchors = 20 | # 21 | # -83 -39 100 56 22 | # -175 -87 192 104 23 | # -359 -183 376 200 24 | # -55 -55 72 72 25 | # -119 -119 136 136 26 | # -247 -247 264 264 27 | # -35 -79 52 96 28 | # -79 -167 96 184 29 | # -167 -343 184 360 30 | 31 | # array([[ -83., -39., 100., 56.], 32 | # [-175., -87., 192., 104.], 33 | # [-359., -183., 376., 200.], 34 | # [ -55., -55., 72., 72.], 35 | # [-119., -119., 136., 136.], 36 | # [-247., -247., 264., 264.], 37 | # [ -35., -79., 52., 96.], 38 | # [ -79., -167., 96., 184.], 39 | # [-167., -343., 184., 360.]]) 40 | 41 | def generate_anchors(base_size=16, ratios=[0.5, 1, 2], 42 | scales=2 ** np.arange(3, 6)): 43 | """ 44 | Generate anchor (reference) windows by enumerating aspect ratios X 45 | scales wrt a reference (0, 0, 15, 15) window. 46 | """ 47 | 48 | base_anchor = np.array([1, 1, base_size, base_size]) - 1 49 | ratio_anchors = _ratio_enum(base_anchor, ratios) 50 | anchors = np.vstack([_scale_enum(ratio_anchors[i, :], scales) 51 | for i in range(ratio_anchors.shape[0])]) 52 | return anchors 53 | 54 | 55 | def _whctrs(anchor): 56 | """ 57 | Return width, height, x center, and y center for an anchor (window). 
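For example, the base 16 x 16 anchor [0, 0, 15, 15] yields (w, h, x_ctr, y_ctr) = (16, 16, 7.5, 7.5).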
58 | """ 59 | 60 | w = anchor[2] - anchor[0] + 1 61 | h = anchor[3] - anchor[1] + 1 62 | x_ctr = anchor[0] + 0.5 * (w - 1) 63 | y_ctr = anchor[1] + 0.5 * (h - 1) 64 | return w, h, x_ctr, y_ctr 65 | 66 | 67 | def _mkanchors(ws, hs, x_ctr, y_ctr): 68 | """ 69 | Given a vector of widths (ws) and heights (hs) around a center 70 | (x_ctr, y_ctr), output a set of anchors (windows). 71 | """ 72 | 73 | ws = ws[:, np.newaxis] 74 | hs = hs[:, np.newaxis] 75 | anchors = np.hstack((x_ctr - 0.5 * (ws - 1), 76 | y_ctr - 0.5 * (hs - 1), 77 | x_ctr + 0.5 * (ws - 1), 78 | y_ctr + 0.5 * (hs - 1))) 79 | return anchors 80 | 81 | 82 | def _ratio_enum(anchor, ratios): 83 | """ 84 | Enumerate a set of anchors for each aspect ratio wrt an anchor. 85 | """ 86 | 87 | w, h, x_ctr, y_ctr = _whctrs(anchor) 88 | size = w * h 89 | size_ratios = size / ratios 90 | ws = np.round(np.sqrt(size_ratios)) 91 | hs = np.round(ws * ratios) 92 | anchors = _mkanchors(ws, hs, x_ctr, y_ctr) 93 | return anchors 94 | 95 | 96 | def _scale_enum(anchor, scales): 97 | """ 98 | Enumerate a set of anchors for each scale wrt an anchor. 99 | """ 100 | 101 | w, h, x_ctr, y_ctr = _whctrs(anchor) 102 | ws = w * scales 103 | hs = h * scales 104 | anchors = _mkanchors(ws, hs, x_ctr, y_ctr) 105 | return anchors 106 | 107 | 108 | if __name__ == '__main__': 109 | import time 110 | 111 | t = time.time() 112 | a = generate_anchors() 113 | print(time.time() - t) 114 | print(a) 115 | from IPython import embed; 116 | 117 | embed() 118 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/proposal_layer.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Faster R-CNN 3 | # Licensed under The MIT License [see LICENSE for details] 4 | # Written by Ross Girshick and Xinlei Chen 5 | # -------------------------------------------------------- 6 | from __future__ import absolute_import 7 | from __future__ import division 8 | from __future__ import print_function 9 | 10 | import numpy as np 11 | from model.config import cfg 12 | from model.bbox_transform import bbox_transform_inv, clip_boxes 13 | from model.nms_wrapper import nms 14 | 15 | 16 | def proposal_layer(rpn_cls_prob, rpn_bbox_pred, im_info, cfg_key, _feat_stride, anchors, num_anchors): 17 | """A simplified version compared to fast/er RCNN 18 | For details please see the technical report 19 | """ 20 | if type(cfg_key) == bytes: 21 | cfg_key = cfg_key.decode('utf-8') 22 | pre_nms_topN = cfg[cfg_key].RPN_PRE_NMS_TOP_N 23 | post_nms_topN = cfg[cfg_key].RPN_POST_NMS_TOP_N 24 | nms_thresh = cfg[cfg_key].RPN_NMS_THRESH 25 | 26 | im_info = im_info[0] 27 | # Get the scores and bounding boxes 28 | scores = rpn_cls_prob[:, :, :, num_anchors:] 29 | rpn_bbox_pred = rpn_bbox_pred.reshape((-1, 4)) 30 | scores = scores.reshape((-1, 1)) 31 | proposals = bbox_transform_inv(anchors, rpn_bbox_pred) 32 | proposals = clip_boxes(proposals, im_info[:2]) 33 | 34 | # Pick the top region proposals 35 | order = scores.ravel().argsort()[::-1] 36 | if pre_nms_topN > 0: 37 | order = order[:pre_nms_topN] 38 | proposals = proposals[order, :] 39 | scores = scores[order] 40 | 41 | # Non-maximal suppression 42 | keep = nms(np.hstack((proposals, scores)), nms_thresh) 43 | 44 | # Pick th top region proposals after NMS 45 | if post_nms_topN > 0: 46 | keep = keep[:post_nms_topN] 47 | proposals = proposals[keep, :] 48 | scores = scores[keep] 49 | 50 | # Only support 
single image as input 51 | batch_inds = np.zeros((proposals.shape[0], 1), dtype=np.float32) 52 | blob = np.hstack((batch_inds, proposals.astype(np.float32, copy=False))) 53 | 54 | return blob, scores 55 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/proposal_target_layer.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Faster R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick, Sean Bell and Xinlei Chen 6 | # -------------------------------------------------------- 7 | from __future__ import absolute_import 8 | from __future__ import division 9 | from __future__ import print_function 10 | 11 | import numpy as np 12 | import numpy.random as npr 13 | from model.config import cfg 14 | from model.bbox_transform import bbox_transform 15 | from utils.cython_bbox import bbox_overlaps 16 | 17 | 18 | def proposal_target_layer(rpn_rois, rpn_scores, gt_boxes, _num_classes): 19 | """ 20 | Assign object detection proposals to ground-truth targets. Produces proposal 21 | classification labels and bounding-box regression targets. 22 | """ 23 | 24 | # Proposal ROIs (0, x1, y1, x2, y2) coming from RPN 25 | # (i.e., rpn.proposal_layer.ProposalLayer), or any other source 26 | all_rois = rpn_rois 27 | all_scores = rpn_scores 28 | 29 | # Include ground-truth boxes in the set of candidate rois 30 | if cfg.TRAIN.USE_GT: 31 | zeros = np.zeros((gt_boxes.shape[0], 1), dtype=gt_boxes.dtype) 32 | all_rois = np.vstack( 33 | (all_rois, np.hstack((zeros, gt_boxes[:, :-1]))) 34 | ) 35 | # not sure if it a wise appending, but anyway i am not using it 36 | all_scores = np.vstack((all_scores, zeros)) 37 | 38 | num_images = 1 39 | rois_per_image = cfg.TRAIN.BATCH_SIZE / num_images 40 | fg_rois_per_image = np.round(cfg.TRAIN.FG_FRACTION * rois_per_image) 41 | 42 | # Sample rois with classification labels and bounding box regression 43 | # targets 44 | labels, rois, roi_scores, bbox_targets, bbox_inside_weights = _sample_rois( 45 | all_rois, all_scores, gt_boxes, fg_rois_per_image, 46 | rois_per_image, _num_classes) 47 | 48 | rois = rois.reshape(-1, 5) 49 | roi_scores = roi_scores.reshape(-1) 50 | labels = labels.reshape(-1, 1) 51 | bbox_targets = bbox_targets.reshape(-1, _num_classes * 4) 52 | bbox_inside_weights = bbox_inside_weights.reshape(-1, _num_classes * 4) 53 | bbox_outside_weights = np.array(bbox_inside_weights > 0).astype(np.float32) 54 | 55 | return rois, roi_scores, labels, bbox_targets, bbox_inside_weights, bbox_outside_weights 56 | 57 | 58 | def _get_bbox_regression_labels(bbox_target_data, num_classes): 59 | """Bounding-box regression targets (bbox_target_data) are stored in a 60 | compact form N x (class, tx, ty, tw, th) 61 | 62 | This function expands those targets into the 4-of-4*K representation used 63 | by the network (i.e. only one class has non-zero targets). 
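For example (hypothetical numbers): with num_classes = 4, a row whose class entry is 2 fills only columns 8..11 of its 16-wide target row, and only those inside-weight entries are set to cfg.TRAIN.BBOX_INSIDE_WEIGHTS.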
64 | 65 | Returns: 66 | bbox_target (ndarray): N x 4K blob of regression targets 67 | bbox_inside_weights (ndarray): N x 4K blob of loss weights 68 | """ 69 | 70 | clss = bbox_target_data[:, 0] 71 | bbox_targets = np.zeros((clss.size, 4 * num_classes), dtype=np.float32) 72 | bbox_inside_weights = np.zeros(bbox_targets.shape, dtype=np.float32) 73 | inds = np.where(clss > 0)[0] 74 | for ind in inds: 75 | cls = clss[ind] 76 | start = int(4 * cls) 77 | end = start + 4 78 | bbox_targets[ind, start:end] = bbox_target_data[ind, 1:] 79 | bbox_inside_weights[ind, start:end] = cfg.TRAIN.BBOX_INSIDE_WEIGHTS 80 | return bbox_targets, bbox_inside_weights 81 | 82 | 83 | def _compute_targets(ex_rois, gt_rois, labels): 84 | """Compute bounding-box regression targets for an image.""" 85 | 86 | assert ex_rois.shape[0] == gt_rois.shape[0] 87 | assert ex_rois.shape[1] == 4 88 | assert gt_rois.shape[1] == 4 89 | 90 | targets = bbox_transform(ex_rois, gt_rois) 91 | if cfg.TRAIN.BBOX_NORMALIZE_TARGETS_PRECOMPUTED: 92 | # Optionally normalize targets by a precomputed mean and stdev 93 | targets = ((targets - np.array(cfg.TRAIN.BBOX_NORMALIZE_MEANS)) 94 | / np.array(cfg.TRAIN.BBOX_NORMALIZE_STDS)) 95 | return np.hstack( 96 | (labels[:, np.newaxis], targets)).astype(np.float32, copy=False) 97 | 98 | 99 | def _sample_rois(all_rois, all_scores, gt_boxes, fg_rois_per_image, rois_per_image, num_classes): 100 | """Generate a random sample of RoIs comprising foreground and background 101 | examples. 102 | """ 103 | # overlaps: (rois x gt_boxes) 104 | overlaps = bbox_overlaps( 105 | np.ascontiguousarray(all_rois[:, 1:5], dtype=np.float), 106 | np.ascontiguousarray(gt_boxes[:, :4], dtype=np.float)) 107 | gt_assignment = overlaps.argmax(axis=1) 108 | max_overlaps = overlaps.max(axis=1) 109 | labels = gt_boxes[gt_assignment, 4] 110 | 111 | # Select foreground RoIs as those with >= FG_THRESH overlap 112 | fg_inds = np.where(max_overlaps >= cfg.TRAIN.FG_THRESH)[0] 113 | # Guard against the case when an image has fewer than fg_rois_per_image 114 | # Select background RoIs as those within [BG_THRESH_LO, BG_THRESH_HI) 115 | bg_inds = np.where((max_overlaps < cfg.TRAIN.BG_THRESH_HI) & 116 | (max_overlaps >= cfg.TRAIN.BG_THRESH_LO))[0] 117 | 118 | # Small modification to the original version where we ensure a fixed number of regions are sampled 119 | if fg_inds.size > 0 and bg_inds.size > 0: 120 | fg_rois_per_image = min(fg_rois_per_image, fg_inds.size) 121 | fg_inds = npr.choice(fg_inds, size=int(fg_rois_per_image), replace=False) 122 | bg_rois_per_image = rois_per_image - fg_rois_per_image 123 | to_replace = bg_inds.size < bg_rois_per_image 124 | bg_inds = npr.choice(bg_inds, size=int(bg_rois_per_image), replace=to_replace) 125 | elif fg_inds.size > 0: 126 | to_replace = fg_inds.size < rois_per_image 127 | fg_inds = npr.choice(fg_inds, size=int(rois_per_image), replace=to_replace) 128 | fg_rois_per_image = rois_per_image 129 | elif bg_inds.size > 0: 130 | to_replace = bg_inds.size < rois_per_image 131 | bg_inds = npr.choice(bg_inds, size=int(rois_per_image), replace=to_replace) 132 | fg_rois_per_image = 0 133 | else: 134 | import pdb 135 | pdb.set_trace() 136 | 137 | # The indices that we're selecting (both fg and bg) 138 | keep_inds = np.append(fg_inds, bg_inds) 139 | # Select sampled values from various arrays: 140 | labels = labels[keep_inds] 141 | # Clamp labels for the background RoIs to 0 142 | labels[int(fg_rois_per_image):] = 0 143 | rois = all_rois[keep_inds] 144 | roi_scores = all_scores[keep_inds] 145 | 146 | 
bbox_target_data = _compute_targets( 147 | rois[:, 1:5], gt_boxes[gt_assignment[keep_inds], :4], labels) 148 | 149 | bbox_targets, bbox_inside_weights = \ 150 | _get_bbox_regression_labels(bbox_target_data, num_classes) 151 | 152 | return labels, rois, roi_scores, bbox_targets, bbox_inside_weights 153 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/proposal_top_layer.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Faster R-CNN 3 | # Licensed under The MIT License [see LICENSE for details] 4 | # Written by Xinlei Chen 5 | # -------------------------------------------------------- 6 | from __future__ import absolute_import 7 | from __future__ import division 8 | from __future__ import print_function 9 | 10 | import numpy as np 11 | from model.config import cfg 12 | from model.bbox_transform import bbox_transform_inv, clip_boxes 13 | import numpy.random as npr 14 | 15 | def proposal_top_layer(rpn_cls_prob, rpn_bbox_pred, im_info, _feat_stride, anchors, num_anchors): 16 | """A layer that just selects the top region proposals 17 | without using non-maximal suppression, 18 | For details please see the technical report 19 | """ 20 | rpn_top_n = cfg.TEST.RPN_TOP_N 21 | im_info = im_info[0] 22 | 23 | scores = rpn_cls_prob[:, :, :, num_anchors:] 24 | 25 | rpn_bbox_pred = rpn_bbox_pred.reshape((-1, 4)) 26 | scores = scores.reshape((-1, 1)) 27 | 28 | length = scores.shape[0] 29 | if length < rpn_top_n: 30 | # Random selection, maybe unnecessary and loses good proposals 31 | # But such case rarely happens 32 | top_inds = npr.choice(length, size=rpn_top_n, replace=True) 33 | else: 34 | top_inds = scores.argsort(0)[::-1] 35 | top_inds = top_inds[:rpn_top_n] 36 | top_inds = top_inds.reshape(rpn_top_n, ) 37 | 38 | # Do the selection here 39 | anchors = anchors[top_inds, :] 40 | rpn_bbox_pred = rpn_bbox_pred[top_inds, :] 41 | scores = scores[top_inds] 42 | 43 | # Convert anchors into proposals via bbox transformations 44 | proposals = bbox_transform_inv(anchors, rpn_bbox_pred) 45 | 46 | # Clip predicted boxes to image 47 | proposals = clip_boxes(proposals, im_info[:2]) 48 | 49 | # Output rois blob 50 | # Our RPN implementation only supports a single input image, so all 51 | # batch inds are 0 52 | batch_inds = np.zeros((proposals.shape[0], 1), dtype=np.float32) 53 | blob = np.hstack((batch_inds, proposals.astype(np.float32, copy=False))) 54 | return blob, scores 55 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/layer_utils/snippets.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Tensorflow Faster R-CNN 3 | # Licensed under The MIT License [see LICENSE for details] 4 | # Written by Xinlei Chen 5 | # -------------------------------------------------------- 6 | from __future__ import absolute_import 7 | from __future__ import division 8 | from __future__ import print_function 9 | 10 | import numpy as np 11 | import numpy.random as npr 12 | from model.config import cfg 13 | from layer_utils.generate_anchors import generate_anchors 14 | from model.bbox_transform import bbox_transform_inv, clip_boxes 15 | from utils.cython_bbox import bbox_overlaps 16 | 17 | def generate_anchors_pre(height, width, feat_stride, anchor_scales=(8,16,32), 
anchor_ratios=(0.5,1,2)): 18 | """ A wrapper function to generate anchors given different scales 19 | Also return the number of anchors in variable 'length' 20 | """ 21 | anchors = generate_anchors(ratios=np.array(anchor_ratios), scales=np.array(anchor_scales)) 22 | A = anchors.shape[0] 23 | shift_x = np.arange(0, width) * feat_stride 24 | shift_y = np.arange(0, height) * feat_stride 25 | shift_x, shift_y = np.meshgrid(shift_x, shift_y) 26 | shifts = np.vstack((shift_x.ravel(), shift_y.ravel(), shift_x.ravel(), shift_y.ravel())).transpose() 27 | K = shifts.shape[0] 28 | # width changes faster, so here it is H, W, C 29 | anchors = anchors.reshape((1, A, 4)) + shifts.reshape((1, K, 4)).transpose((1, 0, 2)) 30 | anchors = anchors.reshape((K * A, 4)).astype(np.float32, copy=False) 31 | length = np.int32(anchors.shape[0]) 32 | 33 | return anchors, length 34 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/model/__init__.py: -------------------------------------------------------------------------------- 1 | from . import config 2 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/model/__pycache__/__init__.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/model/__pycache__/__init__.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/model/__pycache__/__init__.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/model/__pycache__/__init__.cpython-37.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/model/__pycache__/bbox_transform.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/model/__pycache__/bbox_transform.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/model/__pycache__/config.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/model/__pycache__/config.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/model/__pycache__/config.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/model/__pycache__/config.cpython-37.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/model/__pycache__/nms_wrapper.cpython-36.pyc: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/model/__pycache__/nms_wrapper.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/model/__pycache__/test.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/model/__pycache__/test.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/model/__pycache__/train_val.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/model/__pycache__/train_val.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/model/bbox_transform.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | from __future__ import absolute_import 8 | from __future__ import division 9 | from __future__ import print_function 10 | 11 | import numpy as np 12 | 13 | def bbox_transform(ex_rois, gt_rois): 14 | ex_widths = ex_rois[:, 2] - ex_rois[:, 0] + 1.0 15 | ex_heights = ex_rois[:, 3] - ex_rois[:, 1] + 1.0 16 | ex_ctr_x = ex_rois[:, 0] + 0.5 * ex_widths 17 | ex_ctr_y = ex_rois[:, 1] + 0.5 * ex_heights 18 | 19 | gt_widths = gt_rois[:, 2] - gt_rois[:, 0] + 1.0 20 | gt_heights = gt_rois[:, 3] - gt_rois[:, 1] + 1.0 21 | gt_ctr_x = gt_rois[:, 0] + 0.5 * gt_widths 22 | gt_ctr_y = gt_rois[:, 1] + 0.5 * gt_heights 23 | 24 | targets_dx = (gt_ctr_x - ex_ctr_x) / ex_widths 25 | targets_dy = (gt_ctr_y - ex_ctr_y) / ex_heights 26 | targets_dw = np.log(gt_widths / ex_widths) 27 | targets_dh = np.log(gt_heights / ex_heights) 28 | 29 | targets = np.vstack( 30 | (targets_dx, targets_dy, targets_dw, targets_dh)).transpose() 31 | return targets 32 | 33 | 34 | def bbox_transform_inv(boxes, deltas): 35 | if boxes.shape[0] == 0: 36 | return np.zeros((0, deltas.shape[1]), dtype=deltas.dtype) 37 | 38 | boxes = boxes.astype(deltas.dtype, copy=False) 39 | widths = boxes[:, 2] - boxes[:, 0] + 1.0 40 | heights = boxes[:, 3] - boxes[:, 1] + 1.0 41 | ctr_x = boxes[:, 0] + 0.5 * widths 42 | ctr_y = boxes[:, 1] + 0.5 * heights 43 | 44 | dx = deltas[:, 0::4] 45 | dy = deltas[:, 1::4] 46 | dw = deltas[:, 2::4] 47 | dh = deltas[:, 3::4] 48 | 49 | pred_ctr_x = dx * widths[:, np.newaxis] + ctr_x[:, np.newaxis] 50 | pred_ctr_y = dy * heights[:, np.newaxis] + ctr_y[:, np.newaxis] 51 | pred_w = np.exp(dw) * widths[:, np.newaxis] 52 | pred_h = np.exp(dh) * heights[:, np.newaxis] 53 | 54 | pred_boxes = np.zeros(deltas.shape, dtype=deltas.dtype) 55 | # x1 56 | pred_boxes[:, 0::4] = pred_ctr_x - 0.5 * pred_w 57 | # y1 58 | pred_boxes[:, 1::4] = pred_ctr_y - 0.5 * pred_h 59 | # x2 60 | pred_boxes[:, 2::4] = 
pred_ctr_x + 0.5 * pred_w 61 | # y2 62 | pred_boxes[:, 3::4] = pred_ctr_y + 0.5 * pred_h 63 | 64 | return pred_boxes 65 | 66 | 67 | def clip_boxes(boxes, im_shape): 68 | """ 69 | Clip boxes to image boundaries. 70 | """ 71 | 72 | # x1 >= 0 73 | boxes[:, 0::4] = np.maximum(np.minimum(boxes[:, 0::4], im_shape[1] - 1), 0) 74 | # y1 >= 0 75 | boxes[:, 1::4] = np.maximum(np.minimum(boxes[:, 1::4], im_shape[0] - 1), 0) 76 | # x2 < im_shape[1] 77 | boxes[:, 2::4] = np.maximum(np.minimum(boxes[:, 2::4], im_shape[1] - 1), 0) 78 | # y2 < im_shape[0] 79 | boxes[:, 3::4] = np.maximum(np.minimum(boxes[:, 3::4], im_shape[0] - 1), 0) 80 | return boxes 81 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/model/nms_wrapper.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | from __future__ import absolute_import 8 | from __future__ import division 9 | from __future__ import print_function 10 | 11 | from model.config import cfg 12 | from nms.gpu_nms import gpu_nms 13 | from nms.cpu_nms import cpu_nms 14 | 15 | def nms(dets, thresh, force_cpu=False): 16 | """Dispatch to either CPU or GPU NMS implementations.""" 17 | 18 | if dets.shape[0] == 0: 19 | return [] 20 | if cfg.USE_GPU_NMS and not force_cpu: 21 | return gpu_nms(dets, thresh, device_id=cfg.GPU_ID) 22 | else: 23 | return cpu_nms(dets, thresh) 24 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/model/test.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Tensorflow Faster R-CNN 3 | # Licensed under The MIT License [see LICENSE for details] 4 | # Written by Xinlei Chen 5 | # -------------------------------------------------------- 6 | from __future__ import absolute_import 7 | from __future__ import division 8 | from __future__ import print_function 9 | 10 | import cv2 11 | import numpy as np 12 | try: 13 | import cPickle as pickle 14 | except ImportError: 15 | import pickle 16 | import os 17 | import math 18 | 19 | from utils.timer import Timer 20 | from utils.cython_nms import nms, nms_new 21 | from utils.boxes_grid import get_boxes_grid 22 | from utils.blob import im_list_to_blob 23 | 24 | from model.config import cfg, get_output_dir 25 | from model.bbox_transform import clip_boxes, bbox_transform_inv 26 | 27 | def _get_image_blob(im): 28 | """Converts an image into a network input. 
29 | Arguments: 30 | im (ndarray): a color image in BGR order 31 | Returns: 32 | blob (ndarray): a data blob holding an image pyramid 33 | im_scale_factors (list): list of image scales (relative to im) used 34 | in the image pyramid 35 | """ 36 | im_orig = im.astype(np.float32, copy=True) 37 | im_orig -= cfg.PIXEL_MEANS 38 | 39 | im_shape = im_orig.shape 40 | im_size_min = np.min(im_shape[0:2]) 41 | im_size_max = np.max(im_shape[0:2]) 42 | 43 | processed_ims = [] 44 | im_scale_factors = [] 45 | 46 | for target_size in cfg.TEST.SCALES: 47 | im_scale = float(target_size) / float(im_size_min) 48 | # Prevent the biggest axis from being more than MAX_SIZE 49 | if np.round(im_scale * im_size_max) > cfg.TEST.MAX_SIZE: 50 | im_scale = float(cfg.TEST.MAX_SIZE) / float(im_size_max) 51 | im = cv2.resize(im_orig, None, None, fx=im_scale, fy=im_scale, 52 | interpolation=cv2.INTER_LINEAR) 53 | im_scale_factors.append(im_scale) 54 | processed_ims.append(im) 55 | 56 | # Create a blob to hold the input images 57 | blob = im_list_to_blob(processed_ims) 58 | 59 | return blob, np.array(im_scale_factors) 60 | 61 | def _get_blobs(im): 62 | """Convert an image and RoIs within that image into network inputs.""" 63 | blobs = {} 64 | blobs['data'], im_scale_factors = _get_image_blob(im) 65 | 66 | return blobs, im_scale_factors 67 | 68 | def _clip_boxes(boxes, im_shape): 69 | """Clip boxes to image boundaries.""" 70 | # x1 >= 0 71 | boxes[:, 0::4] = np.maximum(boxes[:, 0::4], 0) 72 | # y1 >= 0 73 | boxes[:, 1::4] = np.maximum(boxes[:, 1::4], 0) 74 | # x2 < im_shape[1] 75 | boxes[:, 2::4] = np.minimum(boxes[:, 2::4], im_shape[1] - 1) 76 | # y2 < im_shape[0] 77 | boxes[:, 3::4] = np.minimum(boxes[:, 3::4], im_shape[0] - 1) 78 | return boxes 79 | 80 | def _rescale_boxes(boxes, inds, scales): 81 | """Rescale boxes according to image rescaling.""" 82 | for i in range(boxes.shape[0]): 83 | boxes[i,:] = boxes[i,:] / scales[int(inds[i])] 84 | 85 | return boxes 86 | 87 | def im_detect(sess, net, im): 88 | blobs, im_scales = _get_blobs(im) 89 | assert len(im_scales) == 1, "Only single-image batch implemented" 90 | 91 | im_blob = blobs['data'] 92 | # seems to have height, width, and image scales 93 | # still not sure about the scale, maybe full image it is 1. 94 | blobs['im_info'] = np.array([[im_blob.shape[1], im_blob.shape[2], im_scales[0]]], dtype=np.float32) 95 | 96 | _, scores, bbox_pred, rois = net.test_image(sess, blobs['data'], blobs['im_info']) 97 | 98 | boxes = rois[:, 1:5] / im_scales[0] 99 | # print(scores.shape, bbox_pred.shape, rois.shape, boxes.shape) 100 | scores = np.reshape(scores, [scores.shape[0], -1]) 101 | bbox_pred = np.reshape(bbox_pred, [bbox_pred.shape[0], -1]) 102 | if cfg.TEST.BBOX_REG: 103 | # Apply bounding-box regression deltas 104 | box_deltas = bbox_pred 105 | pred_boxes = bbox_transform_inv(boxes, box_deltas) 106 | pred_boxes = _clip_boxes(pred_boxes, im.shape) 107 | else: 108 | # Simply repeat the boxes, once for each class 109 | pred_boxes = np.tile(boxes, (1, scores.shape[1])) 110 | 111 | return scores, pred_boxes 112 | 113 | def apply_nms(all_boxes, thresh): 114 | """Apply non-maximum suppression to all predicted boxes output by the 115 | test_net method. 
116 | """ 117 | num_classes = len(all_boxes) 118 | num_images = len(all_boxes[0]) 119 | nms_boxes = [[[] for _ in range(num_images)] for _ in range(num_classes)] 120 | for cls_ind in range(num_classes): 121 | for im_ind in range(num_images): 122 | dets = all_boxes[cls_ind][im_ind] 123 | if dets == []: 124 | continue 125 | 126 | x1 = dets[:, 0] 127 | y1 = dets[:, 1] 128 | x2 = dets[:, 2] 129 | y2 = dets[:, 3] 130 | scores = dets[:, 4] 131 | inds = np.where((x2 > x1) & (y2 > y1) & (scores > cfg.TEST.DET_THRESHOLD))[0] 132 | dets = dets[inds,:] 133 | if dets == []: 134 | continue 135 | 136 | keep = nms(dets, thresh) 137 | if len(keep) == 0: 138 | continue 139 | nms_boxes[cls_ind][im_ind] = dets[keep, :].copy() 140 | return nms_boxes 141 | 142 | def test_net(sess, net, imdb, weights_filename, max_per_image=100, thresh=0.05): 143 | np.random.seed(cfg.RNG_SEED) 144 | """Test a Fast R-CNN network on an image database.""" 145 | num_images = len(imdb.image_index) 146 | # all detections are collected into: 147 | # all_boxes[cls][image] = N x 5 array of detections in 148 | # (x1, y1, x2, y2, score) 149 | all_boxes = [[[] for _ in range(num_images)] 150 | for _ in range(imdb.num_classes)] 151 | 152 | output_dir = get_output_dir(imdb, weights_filename) 153 | # timers 154 | _t = {'im_detect' : Timer(), 'misc' : Timer()} 155 | 156 | for i in range(num_images): 157 | im = cv2.imread(imdb.image_path_at(i), cv2.IMREAD_UNCHANGED) 158 | 159 | _t['im_detect'].tic() 160 | scores, boxes = im_detect(sess, net, im) 161 | _t['im_detect'].toc() 162 | 163 | _t['misc'].tic() 164 | 165 | # skip j = 0, because it's the background class 166 | for j in range(1, imdb.num_classes): 167 | inds = np.where(scores[:, j] > thresh)[0] 168 | cls_scores = scores[inds, j] 169 | cls_boxes = boxes[inds, j*4:(j+1)*4] 170 | cls_dets = np.hstack((cls_boxes, cls_scores[:, np.newaxis])) \ 171 | .astype(np.float32, copy=False) 172 | keep = nms(cls_dets, cfg.TEST.NMS) 173 | cls_dets = cls_dets[keep, :] 174 | all_boxes[j][i] = cls_dets 175 | 176 | # Limit to max_per_image detections *over all classes* 177 | if max_per_image > 0: 178 | image_scores = np.hstack([all_boxes[j][i][:, -1] 179 | for j in range(1, imdb.num_classes)]) 180 | if len(image_scores) > max_per_image: 181 | image_thresh = np.sort(image_scores)[-max_per_image] 182 | for j in range(1, imdb.num_classes): 183 | keep = np.where(all_boxes[j][i][:, -1] >= image_thresh)[0] 184 | all_boxes[j][i] = all_boxes[j][i][keep, :] 185 | _t['misc'].toc() 186 | 187 | print('im_detect: {:d}/{:d} {:.3f}s {:.3f}s' \ 188 | .format(i + 1, num_images, _t['im_detect'].average_time, 189 | _t['misc'].average_time)) 190 | 191 | det_file = os.path.join(output_dir, 'detections.pkl') 192 | with open(det_file, 'wb') as f: 193 | pickle.dump(all_boxes, f, pickle.HIGHEST_PROTOCOL) 194 | 195 | print('Evaluating detections') 196 | imdb.evaluate_detections(all_boxes, output_dir) 197 | 198 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nets/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/nets/__init__.py -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nets/__pycache__/__init__.cpython-36.pyc: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/nets/__pycache__/__init__.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nets/__pycache__/network.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/nets/__pycache__/network.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nets/__pycache__/resnet_v1.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/nets/__pycache__/resnet_v1.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nets/__pycache__/vgg16.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/nets/__pycache__/vgg16.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nets/vgg16.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Tensorflow Faster R-CNN 3 | # Licensed under The MIT License [see LICENSE for details] 4 | # Written by Xinlei Chen 5 | # -------------------------------------------------------- 6 | from __future__ import absolute_import 7 | from __future__ import division 8 | from __future__ import print_function 9 | 10 | import tensorflow as tf 11 | import tensorflow.contrib.slim as slim 12 | from tensorflow.contrib.slim import losses 13 | from tensorflow.contrib.slim import arg_scope 14 | import numpy as np 15 | 16 | from nets.network import Network 17 | from model.config import cfg 18 | 19 | class vgg16(Network): 20 | def __init__(self, batch_size=1): 21 | Network.__init__(self, batch_size=batch_size) 22 | 23 | def build_network(self, sess, is_training=True): 24 | with tf.variable_scope('vgg_16', 'vgg_16'): 25 | # select initializers 26 | if cfg.TRAIN.TRUNCATED: 27 | initializer = tf.truncated_normal_initializer(mean=0.0, stddev=0.01) 28 | initializer_bbox = tf.truncated_normal_initializer(mean=0.0, stddev=0.001) 29 | else: 30 | initializer = tf.random_normal_initializer(mean=0.0, stddev=0.01) 31 | initializer_bbox = tf.random_normal_initializer(mean=0.0, stddev=0.001) 32 | 33 | net = slim.repeat(self._image, 2, slim.conv2d, 64, [3, 3], 34 | trainable=False, scope='conv1') 35 | net = slim.max_pool2d(net, [2, 2], padding='SAME', scope='pool1') 36 | net = slim.repeat(net, 2, slim.conv2d, 128, [3, 3], 37 | trainable=False, scope='conv2') 38 | net = slim.max_pool2d(net, [2, 2], padding='SAME', scope='pool2') 39 | net = slim.repeat(net, 3, slim.conv2d, 256, [3, 3], 40 | trainable=is_training, scope='conv3') 41 | net = slim.max_pool2d(net, [2, 2], padding='SAME', scope='pool3') 42 | net = slim.repeat(net, 3, slim.conv2d, 512, [3, 3], 43 | 
trainable=is_training, scope='conv4') 44 | net = slim.max_pool2d(net, [2, 2], padding='SAME', scope='pool4') 45 | net = slim.repeat(net, 3, slim.conv2d, 512, [3, 3], 46 | trainable=is_training, scope='conv5') 47 | self._act_summaries.append(net) 48 | self._layers['head'] = net 49 | # build the anchors for the image 50 | self._anchor_component() 51 | 52 | # rpn 53 | rpn = slim.conv2d(net, 512, [3, 3], trainable=is_training, weights_initializer=initializer, scope="rpn_conv/3x3") 54 | self._act_summaries.append(rpn) 55 | rpn_cls_score = slim.conv2d(rpn, self._num_anchors * 2, [1, 1], trainable=is_training, 56 | weights_initializer=initializer, 57 | padding='VALID', activation_fn=None, scope='rpn_cls_score') 58 | # change it so that the score has 2 as its channel size 59 | rpn_cls_score_reshape = self._reshape_layer(rpn_cls_score, 2, 'rpn_cls_score_reshape') 60 | rpn_cls_prob_reshape = self._softmax_layer(rpn_cls_score_reshape, "rpn_cls_prob_reshape") 61 | rpn_cls_prob = self._reshape_layer(rpn_cls_prob_reshape, self._num_anchors * 2, "rpn_cls_prob") 62 | rpn_bbox_pred = slim.conv2d(rpn, self._num_anchors * 4, [1, 1], trainable=is_training, 63 | weights_initializer=initializer, 64 | padding='VALID', activation_fn=None, scope='rpn_bbox_pred') 65 | if is_training: 66 | rois, roi_scores = self._proposal_layer(rpn_cls_prob, rpn_bbox_pred, "rois") 67 | rpn_labels = self._anchor_target_layer(rpn_cls_score, "anchor") 68 | # Try to have a deterministic order for the computing graph, for reproducibility 69 | with tf.control_dependencies([rpn_labels]): 70 | rois, _ = self._proposal_target_layer(rois, roi_scores, "rpn_rois") 71 | else: 72 | if cfg.TEST.MODE == 'nms': 73 | rois, _ = self._proposal_layer(rpn_cls_prob, rpn_bbox_pred, "rois") 74 | elif cfg.TEST.MODE == 'top': 75 | rois, _ = self._proposal_top_layer(rpn_cls_prob, rpn_bbox_pred, "rois") 76 | else: 77 | raise NotImplementedError 78 | 79 | # rcnn 80 | if cfg.POOLING_MODE == 'crop': 81 | pool5 = self._crop_pool_layer(net, rois, "pool5") 82 | else: 83 | raise NotImplementedError 84 | 85 | pool5_flat = slim.flatten(pool5, scope='flatten') 86 | fc6 = slim.fully_connected(pool5_flat, 4096, scope='fc6') 87 | if is_training: 88 | fc6 = slim.dropout(fc6, keep_prob=0.5, is_training=True, scope='dropout6') 89 | fc7 = slim.fully_connected(fc6, 4096, scope='fc7') 90 | if is_training: 91 | fc7 = slim.dropout(fc7, keep_prob=0.5, is_training=True, scope='dropout7') 92 | cls_score = slim.fully_connected(fc7, self._num_classes, 93 | weights_initializer=initializer, 94 | trainable=is_training, 95 | activation_fn=None, scope='cls_score') 96 | cls_prob = self._softmax_layer(cls_score, "cls_prob") 97 | bbox_pred = slim.fully_connected(fc7, self._num_classes * 4, 98 | weights_initializer=initializer_bbox, 99 | trainable=is_training, 100 | activation_fn=None, scope='bbox_pred') 101 | 102 | self._predictions["rpn_cls_score"] = rpn_cls_score 103 | self._predictions["rpn_cls_score_reshape"] = rpn_cls_score_reshape 104 | self._predictions["rpn_cls_prob"] = rpn_cls_prob 105 | self._predictions["rpn_bbox_pred"] = rpn_bbox_pred 106 | self._predictions["cls_score"] = cls_score 107 | self._predictions["cls_prob"] = cls_prob 108 | self._predictions["bbox_pred"] = bbox_pred 109 | self._predictions["rois"] = rois 110 | 111 | self._score_summaries.update(self._predictions) 112 | 113 | return rois, cls_prob, bbox_pred 114 | 115 | def get_variables_to_restore(self, variables, var_keep_dic): 116 | variables_to_restore = [] 117 | 118 | for v in variables: 119 | # exclude the conv
weights that are fc weights in vgg16 120 | if v.name == 'vgg_16/fc6/weights:0' or v.name == 'vgg_16/fc7/weights:0': 121 | self._variables_to_fix[v.name] = v 122 | continue 123 | # exclude the first conv layer to swap RGB to BGR 124 | if v.name == 'vgg_16/conv1/conv1_1/weights:0': 125 | self._variables_to_fix[v.name] = v 126 | continue 127 | if v.name.split(':')[0] in var_keep_dic: 128 | print('Variables restored: %s' % v.name) 129 | variables_to_restore.append(v) 130 | 131 | return variables_to_restore 132 | 133 | def fix_variables(self, sess, pretrained_model): 134 | print('Fix VGG16 layers...') 135 | with tf.variable_scope('Fix_VGG16') as scope: 136 | with tf.device("/cpu:0"): 137 | # fix the vgg16 issue from conv weights to fc weights 138 | # fix RGB to BGR 139 | fc6_conv = tf.get_variable("fc6_conv", [7, 7, 512, 4096], trainable=False) 140 | fc7_conv = tf.get_variable("fc7_conv", [1, 1, 4096, 4096], trainable=False) 141 | conv1_rgb = tf.get_variable("conv1_rgb", [3, 3, 3, 64], trainable=False) 142 | restorer_fc = tf.train.Saver({"vgg_16/fc6/weights": fc6_conv, 143 | "vgg_16/fc7/weights": fc7_conv, 144 | "vgg_16/conv1/conv1_1/weights": conv1_rgb}) 145 | restorer_fc.restore(sess, pretrained_model) 146 | 147 | sess.run(tf.assign(self._variables_to_fix['vgg_16/fc6/weights:0'], tf.reshape(fc6_conv, 148 | self._variables_to_fix['vgg_16/fc6/weights:0'].get_shape()))) 149 | sess.run(tf.assign(self._variables_to_fix['vgg_16/fc7/weights:0'], tf.reshape(fc7_conv, 150 | self._variables_to_fix['vgg_16/fc7/weights:0'].get_shape()))) 151 | sess.run(tf.assign(self._variables_to_fix['vgg_16/conv1/conv1_1/weights:0'], 152 | tf.reverse(conv1_rgb, [2]))) -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nms/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/nms/.gitignore -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nms/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/nms/__init__.py -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nms/__pycache__/__init__.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/nms/__pycache__/__init__.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nms/cpu_nms.pyx: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | 8 | import numpy as np 9 | cimport numpy as np 10 | 11 | cdef inline np.float32_t max(np.float32_t a, np.float32_t b): 12 | return a if a >= b else b 13 | 14 | cdef inline np.float32_t
min(np.float32_t a, np.float32_t b): 15 | return a if a <= b else b 16 | 17 | def cpu_nms(np.ndarray[np.float32_t, ndim=2] dets, np.float thresh): 18 | cdef np.ndarray[np.float32_t, ndim=1] x1 = dets[:, 0] 19 | cdef np.ndarray[np.float32_t, ndim=1] y1 = dets[:, 1] 20 | cdef np.ndarray[np.float32_t, ndim=1] x2 = dets[:, 2] 21 | cdef np.ndarray[np.float32_t, ndim=1] y2 = dets[:, 3] 22 | cdef np.ndarray[np.float32_t, ndim=1] scores = dets[:, 4] 23 | 24 | cdef np.ndarray[np.float32_t, ndim=1] areas = (x2 - x1 + 1) * (y2 - y1 + 1) 25 | cdef np.ndarray[np.int_t, ndim=1] order = scores.argsort()[::-1] 26 | 27 | cdef int ndets = dets.shape[0] 28 | cdef np.ndarray[np.int_t, ndim=1] suppressed = \ 29 | np.zeros((ndets), dtype=np.int) 30 | 31 | # nominal indices 32 | cdef int _i, _j 33 | # sorted indices 34 | cdef int i, j 35 | # temp variables for box i's (the box currently under consideration) 36 | cdef np.float32_t ix1, iy1, ix2, iy2, iarea 37 | # variables for computing overlap with box j (lower scoring box) 38 | cdef np.float32_t xx1, yy1, xx2, yy2 39 | cdef np.float32_t w, h 40 | cdef np.float32_t inter, ovr 41 | 42 | keep = [] 43 | for _i in range(ndets): 44 | i = order[_i] 45 | if suppressed[i] == 1: 46 | continue 47 | keep.append(i) 48 | ix1 = x1[i] 49 | iy1 = y1[i] 50 | ix2 = x2[i] 51 | iy2 = y2[i] 52 | iarea = areas[i] 53 | for _j in range(_i + 1, ndets): 54 | j = order[_j] 55 | if suppressed[j] == 1: 56 | continue 57 | xx1 = max(ix1, x1[j]) 58 | yy1 = max(iy1, y1[j]) 59 | xx2 = min(ix2, x2[j]) 60 | yy2 = min(iy2, y2[j]) 61 | w = max(0.0, xx2 - xx1 + 1) 62 | h = max(0.0, yy2 - yy1 + 1) 63 | inter = w * h 64 | ovr = inter / (iarea + areas[j] - inter) 65 | if ovr >= thresh: 66 | suppressed[j] = 1 67 | 68 | return keep 69 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nms/gpu_nms.hpp: -------------------------------------------------------------------------------- 1 | void _nms(int* keep_out, int* num_out, const float* boxes_host, int boxes_num, 2 | int boxes_dim, float nms_overlap_thresh, int device_id); 3 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nms/gpu_nms.pyx: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Faster R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | 8 | import numpy as np 9 | cimport numpy as np 10 | 11 | assert sizeof(int) == sizeof(np.int32_t) 12 | 13 | cdef extern from "gpu_nms.hpp": 14 | void _nms(np.int32_t*, int*, np.float32_t*, int, int, float, int) 15 | 16 | def gpu_nms(np.ndarray[np.float32_t, ndim=2] dets, np.float thresh, 17 | np.int32_t device_id=0): 18 | cdef int boxes_num = dets.shape[0] 19 | cdef int boxes_dim = dets.shape[1] 20 | cdef int num_out 21 | cdef np.ndarray[np.int32_t, ndim=1] \ 22 | keep = np.zeros(boxes_num, dtype=np.int32) 23 | cdef np.ndarray[np.float32_t, ndim=1] \ 24 | scores = dets[:, 4] 25 | cdef np.ndarray[np.int_t, ndim=1] \ 26 | order = scores.argsort()[::-1] 27 | cdef np.ndarray[np.float32_t, ndim=2] \ 28 | sorted_dets = dets[order, :] 29 | _nms(&keep[0], &num_out, &sorted_dets[0, 0], boxes_num, boxes_dim, thresh, device_id) 30 | keep = keep[:num_out] 31 | return list(order[keep]) 32 | 
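The Cython wrapper above sorts the detections by score before calling into the CUDA kernel, so the indices the kernel keeps refer to the sorted array and have to be mapped back through `order` to recover the caller's indexing (hence the final `return list(order[keep])`). A minimal NumPy sketch of that bookkeeping, with dummy data standing in for the kernel's output:

import numpy as np

scores = np.array([0.2, 0.9, 0.5], dtype=np.float32)
order = scores.argsort()[::-1]      # [1, 2, 0]: detection indices, highest score first
keep_sorted = np.array([0, 1])      # suppose the kernel kept the first two *sorted* boxes
keep_original = order[keep_sorted]  # [1, 2]: the same boxes in the caller's indexing
print(list(keep_original))          # mirrors gpu_nms's final list(order[keep])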
-------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nms/nms_kernel.cu: -------------------------------------------------------------------------------- 1 | // ------------------------------------------------------------------ 2 | // Faster R-CNN 3 | // Copyright (c) 2015 Microsoft 4 | // Licensed under The MIT License [see fast-rcnn/LICENSE for details] 5 | // Written by Shaoqing Ren 6 | // ------------------------------------------------------------------ 7 | 8 | #include "gpu_nms.hpp" 9 | #include <vector> 10 | #include <iostream> 11 | 12 | #define CUDA_CHECK(condition) \ 13 | /* Code block avoids redefinition of cudaError_t error */ \ 14 | do { \ 15 | cudaError_t error = condition; \ 16 | if (error != cudaSuccess) { \ 17 | std::cout << cudaGetErrorString(error) << std::endl; \ 18 | } \ 19 | } while (0) 20 | 21 | #define DIVUP(m,n) ((m) / (n) + ((m) % (n) > 0)) 22 | int const threadsPerBlock = sizeof(unsigned long long) * 8; 23 | 24 | __device__ inline float devIoU(float const * const a, float const * const b) { 25 | float left = max(a[0], b[0]), right = min(a[2], b[2]); 26 | float top = max(a[1], b[1]), bottom = min(a[3], b[3]); 27 | float width = max(right - left + 1, 0.f), height = max(bottom - top + 1, 0.f); 28 | float interS = width * height; 29 | float Sa = (a[2] - a[0] + 1) * (a[3] - a[1] + 1); 30 | float Sb = (b[2] - b[0] + 1) * (b[3] - b[1] + 1); 31 | return interS / (Sa + Sb - interS); 32 | } 33 | 34 | __global__ void nms_kernel(const int n_boxes, const float nms_overlap_thresh, 35 | const float *dev_boxes, unsigned long long *dev_mask) { 36 | const int row_start = blockIdx.y; 37 | const int col_start = blockIdx.x; 38 | 39 | // if (row_start > col_start) return; 40 | 41 | const int row_size = 42 | min(n_boxes - row_start * threadsPerBlock, threadsPerBlock); 43 | const int col_size = 44 | min(n_boxes - col_start * threadsPerBlock, threadsPerBlock); 45 | 46 | __shared__ float block_boxes[threadsPerBlock * 5]; 47 | if (threadIdx.x < col_size) { 48 | block_boxes[threadIdx.x * 5 + 0] = 49 | dev_boxes[(threadsPerBlock * col_start + threadIdx.x) * 5 + 0]; 50 | block_boxes[threadIdx.x * 5 + 1] = 51 | dev_boxes[(threadsPerBlock * col_start + threadIdx.x) * 5 + 1]; 52 | block_boxes[threadIdx.x * 5 + 2] = 53 | dev_boxes[(threadsPerBlock * col_start + threadIdx.x) * 5 + 2]; 54 | block_boxes[threadIdx.x * 5 + 3] = 55 | dev_boxes[(threadsPerBlock * col_start + threadIdx.x) * 5 + 3]; 56 | block_boxes[threadIdx.x * 5 + 4] = 57 | dev_boxes[(threadsPerBlock * col_start + threadIdx.x) * 5 + 4]; 58 | } 59 | __syncthreads(); 60 | 61 | if (threadIdx.x < row_size) { 62 | const int cur_box_idx = threadsPerBlock * row_start + threadIdx.x; 63 | const float *cur_box = dev_boxes + cur_box_idx * 5; 64 | int i = 0; 65 | unsigned long long t = 0; 66 | int start = 0; 67 | if (row_start == col_start) { 68 | start = threadIdx.x + 1; 69 | } 70 | for (i = start; i < col_size; i++) { 71 | if (devIoU(cur_box, block_boxes + i * 5) > nms_overlap_thresh) { 72 | t |= 1ULL << i; 73 | } 74 | } 75 | const int col_blocks = DIVUP(n_boxes, threadsPerBlock); 76 | dev_mask[cur_box_idx * col_blocks + col_start] = t; 77 | } 78 | } 79 | 80 | void _set_device(int device_id) { 81 | int current_device; 82 | CUDA_CHECK(cudaGetDevice(&current_device)); 83 | if (current_device == device_id) { 84 | return; 85 | } 86 | // The call to cudaSetDevice must come before any calls to Get, which 87 | // may perform initialization using the GPU.
88 | CUDA_CHECK(cudaSetDevice(device_id)); 89 | } 90 | 91 | void _nms(int* keep_out, int* num_out, const float* boxes_host, int boxes_num, 92 | int boxes_dim, float nms_overlap_thresh, int device_id) { 93 | _set_device(device_id); 94 | 95 | float* boxes_dev = NULL; 96 | unsigned long long* mask_dev = NULL; 97 | 98 | const int col_blocks = DIVUP(boxes_num, threadsPerBlock); 99 | 100 | CUDA_CHECK(cudaMalloc(&boxes_dev, 101 | boxes_num * boxes_dim * sizeof(float))); 102 | CUDA_CHECK(cudaMemcpy(boxes_dev, 103 | boxes_host, 104 | boxes_num * boxes_dim * sizeof(float), 105 | cudaMemcpyHostToDevice)); 106 | 107 | CUDA_CHECK(cudaMalloc(&mask_dev, 108 | boxes_num * col_blocks * sizeof(unsigned long long))); 109 | 110 | dim3 blocks(DIVUP(boxes_num, threadsPerBlock), 111 | DIVUP(boxes_num, threadsPerBlock)); 112 | dim3 threads(threadsPerBlock); 113 | nms_kernel<<<blocks, threads>>>(boxes_num, 114 | nms_overlap_thresh, 115 | boxes_dev, 116 | mask_dev); 117 | 118 | std::vector<unsigned long long> mask_host(boxes_num * col_blocks); 119 | CUDA_CHECK(cudaMemcpy(&mask_host[0], 120 | mask_dev, 121 | sizeof(unsigned long long) * boxes_num * col_blocks, 122 | cudaMemcpyDeviceToHost)); 123 | 124 | std::vector<unsigned long long> remv(col_blocks); 125 | memset(&remv[0], 0, sizeof(unsigned long long) * col_blocks); 126 | 127 | int num_to_keep = 0; 128 | for (int i = 0; i < boxes_num; i++) { 129 | int nblock = i / threadsPerBlock; 130 | int inblock = i % threadsPerBlock; 131 | 132 | if (!(remv[nblock] & (1ULL << inblock))) { 133 | keep_out[num_to_keep++] = i; 134 | unsigned long long *p = &mask_host[0] + i * col_blocks; 135 | for (int j = nblock; j < col_blocks; j++) { 136 | remv[j] |= p[j]; 137 | } 138 | } 139 | } 140 | *num_out = num_to_keep; 141 | 142 | CUDA_CHECK(cudaFree(boxes_dev)); 143 | CUDA_CHECK(cudaFree(mask_dev)); 144 | } 145 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/nms/py_cpu_nms.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | 8 | import numpy as np 9 | 10 | def py_cpu_nms(dets, thresh): 11 | """Pure Python NMS baseline.""" 12 | x1 = dets[:, 0] 13 | y1 = dets[:, 1] 14 | x2 = dets[:, 2] 15 | y2 = dets[:, 3] 16 | scores = dets[:, 4] 17 | 18 | areas = (x2 - x1 + 1) * (y2 - y1 + 1) 19 | order = scores.argsort()[::-1] 20 | 21 | keep = [] 22 | while order.size > 0: 23 | i = order[0] 24 | keep.append(i) 25 | xx1 = np.maximum(x1[i], x1[order[1:]]) 26 | yy1 = np.maximum(y1[i], y1[order[1:]]) 27 | xx2 = np.minimum(x2[i], x2[order[1:]]) 28 | yy2 = np.minimum(y2[i], y2[order[1:]]) 29 | 30 | w = np.maximum(0.0, xx2 - xx1 + 1) 31 | h = np.maximum(0.0, yy2 - yy1 + 1) 32 | inter = w * h 33 | ovr = inter / (areas[i] + areas[order[1:]] - inter) 34 | 35 | inds = np.where(ovr <= thresh)[0] 36 | order = order[inds + 1] 37 | 38 | return keep 39 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/roi_data_layer/__init__.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | #
-------------------------------------------------------- 7 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/roi_data_layer/__pycache__/__init__.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/roi_data_layer/__pycache__/__init__.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/roi_data_layer/__pycache__/layer.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/roi_data_layer/__pycache__/layer.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/roi_data_layer/__pycache__/minibatch.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/roi_data_layer/__pycache__/minibatch.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/roi_data_layer/__pycache__/roidb.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/roi_data_layer/__pycache__/roidb.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/roi_data_layer/layer.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick and Xinlei Chen 6 | # -------------------------------------------------------- 7 | 8 | """The data layer used during training to train a Fast R-CNN network. 9 | 10 | RoIDataLayer implements a Caffe Python layer. 
11 | """ 12 | from __future__ import absolute_import 13 | from __future__ import division 14 | from __future__ import print_function 15 | 16 | from model.config import cfg 17 | from roi_data_layer.minibatch import get_minibatch 18 | import numpy as np 19 | import time 20 | 21 | class RoIDataLayer(object): 22 | """Fast R-CNN data layer used for training.""" 23 | 24 | def __init__(self, roidb, num_classes, random=False): 25 | """Set the roidb to be used by this layer during training.""" 26 | self._roidb = roidb 27 | self._num_classes = num_classes 28 | # Also set a random flag 29 | self._random = random 30 | self._shuffle_roidb_inds() 31 | 32 | def _shuffle_roidb_inds(self): 33 | """Randomly permute the training roidb.""" 34 | # If the random flag is set, 35 | # then the database is shuffled according to system time 36 | # Useful for the validation set 37 | if self._random: 38 | st0 = np.random.get_state() 39 | millis = int(round(time.time() * 1000)) % 4294967295 40 | np.random.seed(millis) 41 | 42 | if cfg.TRAIN.ASPECT_GROUPING: 43 | widths = np.array([r['width'] for r in self._roidb]) 44 | heights = np.array([r['height'] for r in self._roidb]) 45 | horz = (widths >= heights) 46 | vert = np.logical_not(horz) 47 | horz_inds = np.where(horz)[0] 48 | vert_inds = np.where(vert)[0] 49 | inds = np.hstack(( 50 | np.random.permutation(horz_inds), 51 | np.random.permutation(vert_inds))) 52 | inds = np.reshape(inds, (-1, 2)) 53 | row_perm = np.random.permutation(np.arange(inds.shape[0])) 54 | inds = np.reshape(inds[row_perm, :], (-1,)) 55 | self._perm = inds 56 | else: 57 | self._perm = np.random.permutation(np.arange(len(self._roidb))) 58 | # Restore the random state 59 | if self._random: 60 | np.random.set_state(st0) 61 | 62 | self._cur = 0 63 | 64 | def _get_next_minibatch_inds(self): 65 | """Return the roidb indices for the next minibatch.""" 66 | 67 | if self._cur + cfg.TRAIN.IMS_PER_BATCH >= len(self._roidb): 68 | self._shuffle_roidb_inds() 69 | 70 | #print (len(self._perm)) 71 | 72 | db_inds = self._perm[self._cur:self._cur + cfg.TRAIN.IMS_PER_BATCH] 73 | self._cur += cfg.TRAIN.IMS_PER_BATCH 74 | 75 | return db_inds 76 | 77 | def _get_next_minibatch(self): 78 | """Return the blobs to be used for the next minibatch. 79 | 80 | If cfg.TRAIN.USE_PREFETCH is True, then blobs will be computed in a 81 | separate process and made available through self._blob_queue. 
82 | """ 83 | db_inds = self._get_next_minibatch_inds() 84 | minibatch_db = [self._roidb[i] for i in db_inds] 85 | return get_minibatch(minibatch_db, self._num_classes) 86 | 87 | def forward(self): 88 | """Get blobs and copy them into this layer's top blob vector.""" 89 | blobs = self._get_next_minibatch() 90 | return blobs 91 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/roi_data_layer/minibatch.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick and Xinlei Chen 6 | # -------------------------------------------------------- 7 | 8 | """Compute minibatch blobs for training a Fast R-CNN network.""" 9 | from __future__ import absolute_import 10 | from __future__ import division 11 | from __future__ import print_function 12 | 13 | import numpy as np 14 | import numpy.random as npr 15 | import cv2 16 | from model.config import cfg 17 | from utils.blob import prep_im_for_blob, im_list_to_blob 18 | 19 | def get_minibatch(roidb, num_classes): 20 | """Given a roidb, construct a minibatch sampled from it.""" 21 | num_images = len(roidb) 22 | # Sample random scales to use for each image in this batch 23 | random_scale_inds = npr.randint(0, high=len(cfg.TRAIN.SCALES), 24 | size=num_images) 25 | assert(cfg.TRAIN.BATCH_SIZE % num_images == 0), \ 26 | 'num_images ({}) must divide BATCH_SIZE ({})'. \ 27 | format(num_images, cfg.TRAIN.BATCH_SIZE) 28 | 29 | # Get the input image blob, formatted for caffe 30 | im_blob, im_scales = _get_image_blob(roidb, random_scale_inds) 31 | 32 | blobs = {'data': im_blob} 33 | 34 | assert len(im_scales) == 1, "Single batch only" 35 | assert len(roidb) == 1, "Single batch only" 36 | 37 | # gt boxes: (x1, y1, x2, y2, cls) 38 | if cfg.TRAIN.USE_ALL_GT: 39 | # Include all ground truth boxes 40 | gt_inds = np.where(roidb[0]['gt_classes'] != 0)[0] 41 | else: 42 | # For the COCO ground truth boxes, exclude the ones that are ''iscrowd'' 43 | gt_inds = np.where(roidb[0]['gt_classes'] != 0 & np.all(roidb[0]['gt_overlaps'].toarray() > -1.0, axis=1))[0] 44 | gt_boxes = np.empty((len(gt_inds), 5), dtype=np.float32) 45 | gt_boxes[:, 0:4] = roidb[0]['boxes'][gt_inds, :] * im_scales[0] 46 | gt_boxes[:, 4] = roidb[0]['gt_classes'][gt_inds] 47 | blobs['gt_boxes'] = gt_boxes 48 | blobs['im_info'] = np.array( 49 | [[im_blob.shape[1], im_blob.shape[2], im_scales[0]]], 50 | dtype=np.float32) 51 | 52 | return blobs 53 | 54 | def _get_image_blob(roidb, scale_inds): 55 | """Builds an input blob from the images in the roidb at the specified 56 | scales. 
57 | """ 58 | num_images = len(roidb) 59 | processed_ims = [] 60 | im_scales = [] 61 | for i in range(num_images): 62 | im = cv2.imread(roidb[i]['image'], cv2.IMREAD_UNCHANGED) 63 | if roidb[i]['flipped']: 64 | im = im[:, ::-1, :] 65 | target_size = cfg.TRAIN.SCALES[scale_inds[i]] 66 | im, im_scale = prep_im_for_blob(im, cfg.PIXEL_MEANS, target_size, 67 | cfg.TRAIN.MAX_SIZE) 68 | im_scales.append(im_scale) 69 | processed_ims.append(im) 70 | 71 | # Create a blob to hold the input images 72 | blob = im_list_to_blob(processed_ims) 73 | 74 | return blob, im_scales 75 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/roi_data_layer/roidb.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | 8 | """Transform a roidb into a trainable roidb by adding a bunch of metadata.""" 9 | from __future__ import absolute_import 10 | from __future__ import division 11 | from __future__ import print_function 12 | 13 | import numpy as np 14 | from model.config import cfg 15 | from model.bbox_transform import bbox_transform 16 | from utils.cython_bbox import bbox_overlaps 17 | import PIL 18 | 19 | def prepare_roidb(imdb): 20 | """Enrich the imdb's roidb by adding some derived quantities that 21 | are useful for training. This function precomputes the maximum 22 | overlap, taken over ground-truth boxes, between each ROI and 23 | each ground-truth box. The class with maximum overlap is also 24 | recorded. 25 | """ 26 | roidb = imdb.roidb 27 | if not (imdb.name.startswith('coco')): 28 | sizes = [PIL.Image.open(imdb.image_path_at(i)).size 29 | for i in range(imdb.num_images)] 30 | for i in range(len(imdb.image_index)): 31 | roidb[i]['image'] = imdb.image_path_at(i) 32 | if not (imdb.name.startswith('coco')): 33 | roidb[i]['width'] = sizes[i][0] 34 | roidb[i]['height'] = sizes[i][1] 35 | # need gt_overlaps as a dense array for argmax 36 | gt_overlaps = roidb[i]['gt_overlaps'].toarray() 37 | # max overlap with gt over classes (columns) 38 | max_overlaps = gt_overlaps.max(axis=1) 39 | # gt class that had the max overlap 40 | max_classes = gt_overlaps.argmax(axis=1) 41 | roidb[i]['max_classes'] = max_classes 42 | roidb[i]['max_overlaps'] = max_overlaps 43 | # sanity checks 44 | # max overlap of 0 => class should be zero (background) 45 | zero_inds = np.where(max_overlaps == 0)[0] 46 | assert all(max_classes[zero_inds] == 0) 47 | # max overlap > 0 => class should not be zero (must be a fg class) 48 | nonzero_inds = np.where(max_overlaps > 0)[0] 49 | assert all(max_classes[nonzero_inds] != 0) 50 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/setup.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | 8 | import os 9 | from os.path import join as pjoin 10 | import numpy as np 11 | from distutils.core import setup 12 | from distutils.extension import Extension 13 | from Cython.Distutils 
import build_ext 14 | 15 | def find_in_path(name, path): 16 | "Find a file in a search path" 17 | # adapted from http://code.activestate.com/recipes/52224-find-a-file-given-a-search-path/ 18 | for dir in path.split(os.pathsep): 19 | binpath = pjoin(dir, name) 20 | if os.path.exists(binpath): 21 | return os.path.abspath(binpath) 22 | return None 23 | 24 | def locate_cuda(): 25 | """Locate the CUDA environment on the system 26 | 27 | Returns a dict with keys 'home', 'nvcc', 'include', and 'lib64' 28 | and values giving the absolute path to each directory. 29 | 30 | Starts by looking for the CUDAHOME env variable. If not found, everything 31 | is based on finding 'nvcc' in the PATH. 32 | """ 33 | 34 | # first check if the CUDAHOME env variable is in use 35 | if 'CUDAHOME' in os.environ: 36 | home = os.environ['CUDAHOME'] 37 | nvcc = pjoin(home, 'bin', 'nvcc') 38 | else: 39 | # otherwise, search the PATH for NVCC 40 | default_path = pjoin(os.sep, 'usr', 'local', 'cuda', 'bin') 41 | nvcc = find_in_path('nvcc', os.environ['PATH'] + os.pathsep + default_path) 42 | if nvcc is None: 43 | raise EnvironmentError('The nvcc binary could not be ' 44 | 'located in your $PATH. Either add it to your path, or set $CUDAHOME') 45 | home = os.path.dirname(os.path.dirname(nvcc)) 46 | 47 | cudaconfig = {'home':home, 'nvcc':nvcc, 48 | 'include': pjoin(home, 'include'), 49 | 'lib64': pjoin(home, 'lib64')} 50 | for k, v in cudaconfig.items(): 51 | if not os.path.exists(v): 52 | raise EnvironmentError('The CUDA %s path could not be located in %s' % (k, v)) 53 | 54 | return cudaconfig 55 | CUDA = locate_cuda() 56 | 57 | # Obtain the numpy include directory. This logic works across numpy versions. 58 | try: 59 | numpy_include = np.get_include() 60 | except AttributeError: 61 | numpy_include = np.get_numpy_include() 62 | 63 | def customize_compiler_for_nvcc(self): 64 | """inject deep into distutils to customize how the dispatch 65 | to gcc/nvcc works. 66 | 67 | If you subclass UnixCCompiler, it's not trivial to get your subclass 68 | injected in, and still have the right customizations (i.e. 69 | distutils.sysconfig.customize_compiler) run on it. So instead of going 70 | the OO route, I have this. Note, it's kind of like a weird functional 71 | subclassing going on.""" 72 | 73 | # tell the compiler it can process .cu files 74 | self.src_extensions.append('.cu') 75 | 76 | # save references to the default compiler_so and _compile methods 77 | default_compiler_so = self.compiler_so 78 | super = self._compile 79 | 80 | # now redefine the _compile method. This gets executed for each 81 | # object but distutils doesn't have the ability to change compilers 82 | # based on source extension: we add it.
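# In the override below, .cu sources are routed to nvcc (using the 'nvcc'
# entry of extra_postargs), while every other source keeps the default
# compiler and the 'gcc' entry; compiler_so is restored after each file so
# subsequent objects build normally.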
83 | def _compile(obj, src, ext, cc_args, extra_postargs, pp_opts): 84 | print(extra_postargs) 85 | if os.path.splitext(src)[1] == '.cu': 86 | # use the cuda for .cu files 87 | self.set_executable('compiler_so', CUDA['nvcc']) 88 | # use only a subset of the extra_postargs, which are 1-1 translated 89 | # from the extra_compile_args in the Extension class 90 | postargs = extra_postargs['nvcc'] 91 | else: 92 | postargs = extra_postargs['gcc'] 93 | 94 | super(obj, src, ext, cc_args, postargs, pp_opts) 95 | # reset the default compiler_so, which we might have changed for cuda 96 | self.compiler_so = default_compiler_so 97 | 98 | # inject our redefined _compile method into the class 99 | self._compile = _compile 100 | 101 | # run the customize_compiler 102 | class custom_build_ext(build_ext): 103 | def build_extensions(self): 104 | customize_compiler_for_nvcc(self.compiler) 105 | build_ext.build_extensions(self) 106 | 107 | ext_modules = [ 108 | Extension( 109 | "utils.cython_bbox", 110 | ["utils/bbox.pyx"], 111 | extra_compile_args={'gcc': ["-Wno-cpp", "-Wno-unused-function"]}, 112 | include_dirs = [numpy_include] 113 | ), 114 | Extension( 115 | "utils.cython_nms", 116 | ["utils/nms.pyx"], 117 | extra_compile_args={'gcc': ["-Wno-cpp", "-Wno-unused-function"]}, 118 | include_dirs = [numpy_include] 119 | ), 120 | Extension( 121 | "nms.cpu_nms", 122 | ["nms/cpu_nms.pyx"], 123 | extra_compile_args={'gcc': ["-Wno-cpp", "-Wno-unused-function"]}, 124 | include_dirs = [numpy_include] 125 | ), 126 | Extension('nms.gpu_nms', 127 | ['nms/nms_kernel.cu', 'nms/gpu_nms.pyx'], 128 | library_dirs=[CUDA['lib64']], 129 | libraries=['cudart'], 130 | language='c++', 131 | runtime_library_dirs=[CUDA['lib64']], 132 | # this syntax is specific to this build system 133 | # we're only going to use certain compiler args with nvcc and not with gcc 134 | # the implementation of this trick is in customize_compiler() below 135 | extra_compile_args={'gcc': ["-Wno-unused-function"], 136 | 'nvcc': ['-arch=sm_52', 137 | '--ptxas-options=-v', 138 | '-c', 139 | '--compiler-options', 140 | "'-fPIC'"]}, 141 | include_dirs = [numpy_include, CUDA['include']] 142 | ) 143 | ] 144 | 145 | setup( 146 | name='tf_faster_rcnn', 147 | ext_modules=ext_modules, 148 | # inject our custom trigger 149 | cmdclass={'build_ext': custom_build_ext}, 150 | ) 151 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/utils/.gitignore: -------------------------------------------------------------------------------- 1 | *.c 2 | *.cpp 3 | *.h 4 | *.hpp 5 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/utils/__init__.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/utils/__pycache__/__init__.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/utils/__pycache__/__init__.cpython-36.pyc 
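The extensions declared in setup.py above must be compiled (for example with `python setup.py build_ext --inplace`, which the lib/ Makefile presumably wraps) before `nms.cpu_nms`, `nms.gpu_nms`, and `utils.cython_bbox` can be imported by the rest of lib/. A minimal sanity check, assuming the build succeeded, is to compare the compiled CPU path against the pure-Python fallback shipped in nms/py_cpu_nms.py:

import numpy as np
from nms.py_cpu_nms import py_cpu_nms
from nms.cpu_nms import cpu_nms  # built by setup.py / the Makefile

# Two heavily overlapping boxes: IoU = 81/121 ~ 0.67, so the lower-scoring
# one should be suppressed at a 0.5 threshold by both implementations.
dets = np.array([[0, 0, 10, 10, 0.9],
                 [1, 1,  9,  9, 0.8]], dtype=np.float32)
assert list(cpu_nms(dets, 0.5)) == list(py_cpu_nms(dets, 0.5)) == [0]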
-------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/utils/__pycache__/blob.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/utils/__pycache__/blob.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/utils/__pycache__/boxes_grid.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/utils/__pycache__/boxes_grid.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/utils/__pycache__/timer.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/lib/utils/__pycache__/timer.cpython-36.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/utils/bbox.pyx: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Sergey Karayev 6 | # -------------------------------------------------------- 7 | 8 | cimport cython 9 | import numpy as np 10 | cimport numpy as np 11 | 12 | DTYPE = np.float 13 | ctypedef np.float_t DTYPE_t 14 | 15 | def bbox_overlaps( 16 | np.ndarray[DTYPE_t, ndim=2] boxes, 17 | np.ndarray[DTYPE_t, ndim=2] query_boxes): 18 | """ 19 | Parameters 20 | ---------- 21 | boxes: (N, 4) ndarray of float 22 | query_boxes: (K, 4) ndarray of float 23 | Returns 24 | ------- 25 | overlaps: (N, K) ndarray of overlap between boxes and query_boxes 26 | """ 27 | cdef unsigned int N = boxes.shape[0] 28 | cdef unsigned int K = query_boxes.shape[0] 29 | cdef np.ndarray[DTYPE_t, ndim=2] overlaps = np.zeros((N, K), dtype=DTYPE) 30 | cdef DTYPE_t iw, ih, box_area 31 | cdef DTYPE_t ua 32 | cdef unsigned int k, n 33 | for k in range(K): 34 | box_area = ( 35 | (query_boxes[k, 2] - query_boxes[k, 0] + 1) * 36 | (query_boxes[k, 3] - query_boxes[k, 1] + 1) 37 | ) 38 | for n in range(N): 39 | iw = ( 40 | min(boxes[n, 2], query_boxes[k, 2]) - 41 | max(boxes[n, 0], query_boxes[k, 0]) + 1 42 | ) 43 | if iw > 0: 44 | ih = ( 45 | min(boxes[n, 3], query_boxes[k, 3]) - 46 | max(boxes[n, 1], query_boxes[k, 1]) + 1 47 | ) 48 | if ih > 0: 49 | ua = float( 50 | (boxes[n, 2] - boxes[n, 0] + 1) * 51 | (boxes[n, 3] - boxes[n, 1] + 1) + 52 | box_area - iw * ih 53 | ) 54 | overlaps[n, k] = iw * ih / ua 55 | return overlaps 56 | 57 | def bbox_overlaps_self( 58 | np.ndarray[DTYPE_t, ndim=2] boxes, 59 | np.ndarray[DTYPE_t, ndim=2] query_boxes): 60 | """ 61 | Parameters 62 | ---------- 63 | boxes: (N, 4) ndarray of float 64 | query_boxes: (K, 4) ndarray of float 65 | Returns 66 | ------- 67 | overlaps: (N, K) ndarray of overlap between boxes and query_boxes 68 | """ 69 | cdef unsigned int N = boxes.shape[0] 70 | cdef unsigned int K = 
query_boxes.shape[0] 71 | cdef np.ndarray[DTYPE_t, ndim=2] overlaps = np.zeros((N, K), dtype=DTYPE) 72 | cdef DTYPE_t iw, ih, box_area 73 | cdef DTYPE_t ua 74 | cdef unsigned int k, n 75 | for k in range(K): 76 | box_area = ( 77 | (query_boxes[k, 2] - query_boxes[k, 0] + 1) * 78 | (query_boxes[k, 3] - query_boxes[k, 1] + 1) 79 | ) 80 | for n in range(N): 81 | iw = ( 82 | min(boxes[n, 2], query_boxes[k, 2]) - 83 | max(boxes[n, 0], query_boxes[k, 0]) + 1 84 | ) 85 | if iw > 0: 86 | ih = ( 87 | min(boxes[n, 3], query_boxes[k, 3]) - 88 | max(boxes[n, 1], query_boxes[k, 1]) + 1 89 | ) 90 | if ih > 0: 91 | ua = float(box_area) 92 | overlaps[n, k] = iw * ih / ua 93 | return overlaps -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/utils/blob.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | 8 | """Blob helper functions.""" 9 | from __future__ import absolute_import 10 | from __future__ import division 11 | from __future__ import print_function 12 | 13 | import numpy as np 14 | import cv2 15 | 16 | 17 | def im_list_to_blob(ims): 18 | """Convert a list of images into a network input. 19 | 20 | Assumes images are already prepared (means subtracted, BGR order, ...). 21 | """ 22 | max_shape = np.array([im.shape for im in ims]).max(axis=0) 23 | num_images = len(ims) 24 | blob = np.zeros((num_images, max_shape[0], max_shape[1], 3), 25 | dtype=np.float32) 26 | for i in range(num_images): 27 | im = ims[i] 28 | blob[i, 0:im.shape[0], 0:im.shape[1], :] = im 29 | 30 | return blob 31 | 32 | 33 | def prep_im_for_blob(im, pixel_means, target_size, max_size): 34 | """Mean subtract and scale an image for use in a blob.""" 35 | im = im.astype(np.float32, copy=False) 36 | im -= pixel_means 37 | im_shape = im.shape 38 | im_size_min = np.min(im_shape[0:2]) 39 | im_size_max = np.max(im_shape[0:2]) 40 | im_scale = float(target_size) / float(im_size_min) 41 | # Prevent the biggest axis from being more than MAX_SIZE 42 | if np.round(im_scale * im_size_max) > max_size: 43 | im_scale = float(max_size) / float(im_size_max) 44 | im = cv2.resize(im, None, None, fx=im_scale, fy=im_scale, 45 | interpolation=cv2.INTER_LINEAR) 46 | 47 | return im, im_scale 48 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/utils/boxes_grid.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Subcategory CNN 3 | # Copyright (c) 2015 CVGL Stanford 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Yu Xiang 6 | # -------------------------------------------------------- 7 | from __future__ import absolute_import 8 | from __future__ import division 9 | from __future__ import print_function 10 | 11 | import numpy as np 12 | import math 13 | from model.config import cfg 14 | 15 | 16 | def get_boxes_grid(image_height, image_width): 17 | """ 18 | Return the boxes on image grid. 
19 | """ 20 | 21 | # height and width of the heatmap 22 | if cfg.NET_NAME == 'CaffeNet': 23 | height = np.floor((image_height * max(cfg.TRAIN.SCALES) - 1) / 4.0 + 1) 24 | height = np.floor((height - 1) / 2.0 + 1 + 0.5) 25 | height = np.floor((height - 1) / 2.0 + 1 + 0.5) 26 | 27 | width = np.floor((image_width * max(cfg.TRAIN.SCALES) - 1) / 4.0 + 1) 28 | width = np.floor((width - 1) / 2.0 + 1 + 0.5) 29 | width = np.floor((width - 1) / 2.0 + 1 + 0.5) 30 | elif cfg.NET_NAME == 'VGGnet': 31 | height = np.floor(image_height * max(cfg.TRAIN.SCALES) / 2.0 + 0.5) 32 | height = np.floor(height / 2.0 + 0.5) 33 | height = np.floor(height / 2.0 + 0.5) 34 | height = np.floor(height / 2.0 + 0.5) 35 | 36 | width = np.floor(image_width * max(cfg.TRAIN.SCALES) / 2.0 + 0.5) 37 | width = np.floor(width / 2.0 + 0.5) 38 | width = np.floor(width / 2.0 + 0.5) 39 | width = np.floor(width / 2.0 + 0.5) 40 | else: 41 | assert (1), 'The network architecture is not supported in utils.get_boxes_grid!' 42 | 43 | # compute the grid box centers 44 | h = np.arange(height) 45 | w = np.arange(width) 46 | y, x = np.meshgrid(h, w, indexing='ij') 47 | centers = np.dstack((x, y)) 48 | centers = np.reshape(centers, (-1, 2)) 49 | num = centers.shape[0] 50 | 51 | # compute width and height of grid box 52 | area = cfg.TRAIN.KERNEL_SIZE * cfg.TRAIN.KERNEL_SIZE 53 | aspect = cfg.TRAIN.ASPECTS # height / width 54 | num_aspect = len(aspect) 55 | widths = np.zeros((1, num_aspect), dtype=np.float32) 56 | heights = np.zeros((1, num_aspect), dtype=np.float32) 57 | for i in range(num_aspect): 58 | widths[0, i] = math.sqrt(area / aspect[i]) 59 | heights[0, i] = widths[0, i] * aspect[i] 60 | 61 | # construct grid boxes 62 | centers = np.repeat(centers, num_aspect, axis=0) 63 | widths = np.tile(widths, num).transpose() 64 | heights = np.tile(heights, num).transpose() 65 | 66 | x1 = np.reshape(centers[:, 0], (-1, 1)) - widths * 0.5 67 | x2 = np.reshape(centers[:, 0], (-1, 1)) + widths * 0.5 68 | y1 = np.reshape(centers[:, 1], (-1, 1)) - heights * 0.5 69 | y2 = np.reshape(centers[:, 1], (-1, 1)) + heights * 0.5 70 | 71 | boxes_grid = np.hstack((x1, y1, x2, y2)) / cfg.TRAIN.SPATIAL_SCALE 72 | 73 | return boxes_grid, centers[:, 0], centers[:, 1] 74 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/utils/nms.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | 8 | import numpy as np 9 | 10 | def nms(dets, thresh): 11 | x1 = dets[:, 0] 12 | y1 = dets[:, 1] 13 | x2 = dets[:, 2] 14 | y2 = dets[:, 3] 15 | scores = dets[:, 4] 16 | 17 | areas = (x2 - x1 + 1) * (y2 - y1 + 1) 18 | order = scores.argsort()[::-1] 19 | 20 | keep = [] 21 | while order.size > 0: 22 | i = order[0] 23 | keep.append(i) 24 | xx1 = np.maximum(x1[i], x1[order[1:]]) 25 | yy1 = np.maximum(y1[i], y1[order[1:]]) 26 | xx2 = np.minimum(x2[i], x2[order[1:]]) 27 | yy2 = np.minimum(y2[i], y2[order[1:]]) 28 | 29 | w = np.maximum(0.0, xx2 - xx1 + 1) 30 | h = np.maximum(0.0, yy2 - yy1 + 1) 31 | inter = w * h 32 | ovr = inter / (areas[i] + areas[order[1:]] - inter) 33 | 34 | inds = np.where(ovr <= thresh)[0] 35 | order = order[inds + 1] 36 | 37 | return keep 38 | 
-------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/lib/utils/nms.pyx: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Fast R-CNN 3 | # Copyright (c) 2015 Microsoft 4 | # Licensed under The MIT License [see LICENSE for details] 5 | # Written by Ross Girshick 6 | # -------------------------------------------------------- 7 | 8 | import numpy as np 9 | cimport numpy as np 10 | 11 | cdef inline np.float32_t max(np.float32_t a, np.float32_t b): 12 | return a if a >= b else b 13 | 14 | cdef inline np.float32_t min(np.float32_t a, np.float32_t b): 15 | return a if a <= b else b 16 | 17 | def nms(np.ndarray[np.float32_t, ndim=2] dets, np.float thresh): 18 | cdef np.ndarray[np.float32_t, ndim=1] x1 = dets[:, 0] 19 | cdef np.ndarray[np.float32_t, ndim=1] y1 = dets[:, 1] 20 | cdef np.ndarray[np.float32_t, ndim=1] x2 = dets[:, 2] 21 | cdef np.ndarray[np.float32_t, ndim=1] y2 = dets[:, 3] 22 | cdef np.ndarray[np.float32_t, ndim=1] scores = dets[:, 4] 23 | 24 | cdef np.ndarray[np.float32_t, ndim=1] areas = (x2 - x1 + 1) * (y2 - y1 + 1) 25 | cdef np.ndarray[np.int_t, ndim=1] order = scores.argsort()[::-1] 26 | 27 | cdef int ndets = dets.shape[0] 28 | cdef np.ndarray[np.int_t, ndim=1] suppressed = \ 29 | np.zeros((ndets), dtype=np.int) 30 | 31 | # nominal indices 32 | cdef int _i, _j 33 | # sorted indices 34 | cdef int i, j 35 | # temp variables for box i's (the box currently under consideration) 36 | cdef np.float32_t ix1, iy1, ix2, iy2, iarea 37 | # variables for computing overlap with box j (lower scoring box) 38 | cdef np.float32_t xx1, yy1, xx2, yy2 39 | cdef np.float32_t w, h 40 | cdef np.float32_t inter, ovr 41 | 42 | keep = [] 43 | for _i in range(ndets): 44 | i = order[_i] 45 | if suppressed[i] == 1: 46 | continue 47 | keep.append(i) 48 | ix1 = x1[i] 49 | iy1 = y1[i] 50 | ix2 = x2[i] 51 | iy2 = y2[i] 52 | iarea = areas[i] 53 | for _j in range(_i + 1, ndets): 54 | j = order[_j] 55 | if suppressed[j] == 1: 56 | continue 57 | xx1 = max(ix1, x1[j]) 58 | yy1 = max(iy1, y1[j]) 59 | xx2 = min(ix2, x2[j]) 60 | yy2 = min(iy2, y2[j]) 61 | w = max(0.0, xx2 - xx1 + 1) 62 | h = max(0.0, yy2 - yy1 + 1) 63 | inter = w * h 64 | ovr = inter / (iarea + areas[j] - inter) 65 | if ovr >= thresh: 66 | suppressed[j] = 1 67 | 68 | return keep 69 | 70 | def nms_new(np.ndarray[np.float32_t, ndim=2] dets, np.float thresh): 71 | cdef np.ndarray[np.float32_t, ndim=1] x1 = dets[:, 0] 72 | cdef np.ndarray[np.float32_t, ndim=1] y1 = dets[:, 1] 73 | cdef np.ndarray[np.float32_t, ndim=1] x2 = dets[:, 2] 74 | cdef np.ndarray[np.float32_t, ndim=1] y2 = dets[:, 3] 75 | cdef np.ndarray[np.float32_t, ndim=1] scores = dets[:, 4] 76 | 77 | cdef np.ndarray[np.float32_t, ndim=1] areas = (x2 - x1 + 1) * (y2 - y1 + 1) 78 | cdef np.ndarray[np.int_t, ndim=1] order = scores.argsort()[::-1] 79 | 80 | cdef int ndets = dets.shape[0] 81 | cdef np.ndarray[np.int_t, ndim=1] suppressed = \ 82 | np.zeros((ndets), dtype=np.int) 83 | 84 | # nominal indices 85 | cdef int _i, _j 86 | # sorted indices 87 | cdef int i, j 88 | # temp variables for box i's (the box currently under consideration) 89 | cdef np.float32_t ix1, iy1, ix2, iy2, iarea 90 | # variables for computing overlap with box j (lower scoring box) 91 | cdef np.float32_t xx1, yy1, xx2, yy2 92 | cdef np.float32_t w, h 93 | cdef np.float32_t inter, ovr 94 | 95 | keep = [] 96 | for _i in range(ndets): 97 | i = order[_i] 98 | if 
suppressed[i] == 1:
99 |             continue
100 |         keep.append(i)
101 |         ix1 = x1[i]
102 |         iy1 = y1[i]
103 |         ix2 = x2[i]
104 |         iy2 = y2[i]
105 |         iarea = areas[i]
106 |         for _j in range(_i + 1, ndets):
107 |             j = order[_j]
108 |             if suppressed[j] == 1:
109 |                 continue
110 |             xx1 = max(ix1, x1[j])
111 |             yy1 = max(iy1, y1[j])
112 |             xx2 = min(ix2, x2[j])
113 |             yy2 = min(iy2, y2[j])
114 |             w = max(0.0, xx2 - xx1 + 1)
115 |             h = max(0.0, yy2 - yy1 + 1)
116 |             inter = w * h
117 |             ovr = inter / (iarea + areas[j] - inter)
118 |             ovr1 = inter / iarea
119 |             ovr2 = inter / areas[j]
120 |             if ovr >= thresh or ovr1 > 0.95 or ovr2 > 0.95:
121 |                 suppressed[j] = 1
122 | 
123 |     return keep
124 | 
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/lib/utils/timer.py:
--------------------------------------------------------------------------------
1 | # --------------------------------------------------------
2 | # Fast R-CNN
3 | # Copyright (c) 2015 Microsoft
4 | # Licensed under The MIT License [see LICENSE for details]
5 | # Written by Ross Girshick
6 | # --------------------------------------------------------
7 | 
8 | import time
9 | 
10 | class Timer(object):
11 |   """A simple timer."""
12 |   def __init__(self):
13 |     self.total_time = 0.
14 |     self.calls = 0
15 |     self.start_time = 0.
16 |     self.diff = 0.
17 |     self.average_time = 0.
18 | 
19 |   def tic(self):
20 |     # using time.time instead of time.clock because time.clock
21 |     # does not normalize for multithreading
22 |     self.start_time = time.time()
23 | 
24 |   def toc(self, average=True):
25 |     self.diff = time.time() - self.start_time
26 |     self.total_time += self.diff
27 |     self.calls += 1
28 |     self.average_time = self.total_time / self.calls
29 |     if average:
30 |       return self.average_time
31 |     else:
32 |       return self.diff
33 | 
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/__pycache__/_init_paths.cpython-36.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/tools/__pycache__/_init_paths.cpython-36.pyc
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/__pycache__/_init_paths.cpython-37.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/tools/__pycache__/_init_paths.cpython-37.pyc
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/_init_paths.py:
--------------------------------------------------------------------------------
1 | import os.path as osp
2 | import sys
3 | 
4 | def add_path(path):
5 |   if path not in sys.path:
6 |     sys.path.insert(0, path)
7 | 
8 | this_dir = osp.dirname(__file__)
9 | 
10 | # Add lib to PYTHONPATH
11 | lib_path = osp.join(this_dir, '..', 'lib')
12 | add_path(lib_path)
13 | 
14 | coco_path = osp.join(this_dir, '..', 'data', 'coco', 'PythonAPI')
15 | add_path(coco_path)
16 | 
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/_init_paths.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/tools/_init_paths.pyc -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/tools/demo_graspRGD.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python 2 | 3 | # -------------------------------------------------------- 4 | # Tensorflow Faster R-CNN 5 | # Licensed under The MIT License [see LICENSE for details] 6 | # Written by Xinlei Chen, based on code from Ross Girshick 7 | # -------------------------------------------------------- 8 | 9 | """ 10 | Demo script showing detections in sample images. 11 | 12 | See README.md for installation instructions before running. 13 | """ 14 | from __future__ import absolute_import 15 | from __future__ import division 16 | from __future__ import print_function 17 | 18 | import _init_paths 19 | from model.config import cfg 20 | from model.test import im_detect 21 | from model.nms_wrapper import nms 22 | 23 | from utils.timer import Timer 24 | import tensorflow as tf 25 | import matplotlib.pyplot as plt 26 | import numpy as np 27 | import os, cv2 28 | import argparse 29 | 30 | from nets.vgg16 import vgg16 31 | from nets.resnet_v1 import resnetv1 32 | import scipy 33 | from shapely.geometry import Polygon 34 | 35 | import graspnet_config 36 | 37 | pi = scipy.pi 38 | dot = scipy.dot 39 | sin = scipy.sin 40 | cos = scipy.cos 41 | ar = scipy.array 42 | 43 | CLASSES = ('__background__', 44 | 'angle_01', 'angle_02', 'angle_03', 'angle_04', 'angle_05', 45 | 'angle_06', 'angle_07', 'angle_08', 'angle_09', 'angle_10', 46 | 'angle_11', 'angle_12', 'angle_13', 'angle_14', 'angle_15', 47 | 'angle_16', 'angle_17', 'angle_18', 'angle_19') 48 | 49 | NETS = {'vgg16': ('vgg16_faster_rcnn_iter_70000.ckpt',),'res101': ('res101_faster_rcnn_iter_110000.ckpt',),'res50': ('res50_faster_rcnn_iter_240000.ckpt',)} 50 | DATASETS= {'pascal_voc': ('voc_2007_trainval',),'pascal_voc_0712': ('voc_2007_trainval+voc_2012_trainval',),'grasp': ('train',)} 51 | 52 | def Rotate2D(pts,cnt,ang=scipy.pi/4): 53 | '''pts = {} Rotates points(nx2) about center cnt(2) by angle ang(1) in radian''' 54 | return dot(pts-cnt,ar([[cos(ang),sin(ang)],[-sin(ang),cos(ang)]]))+cnt 55 | 56 | def vis_detections(ax, image_name, im, class_name, dets, thresh=0.5): 57 | """Draw detected bounding boxes.""" 58 | inds = np.where(dets[:, -1] >= thresh)[0] 59 | if len(inds) == 0: 60 | return 61 | 62 | im = im[:, :, (2, 1, 0)] 63 | #fig, ax = plt.subplots(figsize=(12, 12)) 64 | ax.imshow(im, aspect='equal') 65 | for i in inds: 66 | bbox = dets[i, :4] 67 | score = dets[i, -1] 68 | 69 | # plot rotated rectangles 70 | pts = ar([[bbox[0],bbox[1]], [bbox[2], bbox[1]], [bbox[2], bbox[3]], [bbox[0], bbox[3]]]) 71 | cnt = ar([(bbox[0] + bbox[2])/2, (bbox[1] + bbox[3])/2]) 72 | angle = int(class_name[6:]) 73 | r_bbox = Rotate2D(pts, cnt, -pi/2-pi/20*(angle-1)) # maybe -pi/2-pi/18*(angle-1) 74 | pred_label_polygon = Polygon([(r_bbox[0,0],r_bbox[0,1]), (r_bbox[1,0], r_bbox[1,1]), (r_bbox[2,0], r_bbox[2,1]), (r_bbox[3,0], r_bbox[3,1])]) 75 | pred_x, pred_y = pred_label_polygon.exterior.xy 76 | 77 | plt.plot(pred_x[0:2],pred_y[0:2], color='k', alpha = 0.7, linewidth=1, solid_capstyle='round', zorder=2) 78 | plt.plot(pred_x[1:3],pred_y[1:3], color='r', alpha = 0.7, linewidth=3, solid_capstyle='round', zorder=2) 79 | plt.plot(pred_x[2:4],pred_y[2:4], color='k', alpha = 0.7, 
linewidth=1, solid_capstyle='round', zorder=2) 80 | plt.plot(pred_x[3:5],pred_y[3:5], color='r', alpha = 0.7, linewidth=3, solid_capstyle='round', zorder=2) 81 | 82 | def demo(sess, net, image_name): 83 | """Detect object classes in an image using pre-computed object proposals.""" 84 | 85 | # Load the demo image 86 | im_file = os.path.join(cfg.DATA_DIR, 'demo', image_name) 87 | im = cv2.imread(im_file, cv2.IMREAD_UNCHANGED) 88 | im_rgb_file = os.path.join(graspnet_config.GRASPNET_ROOT, 'scenes', image_name[:10], graspnet_config.CAMERA_NAME, 'rgb', image_name[11:15] + '.png') 89 | # im_rgb_file = '/DATA2/Benchmark/graspnet/scenes/' + image_name[:10] + '/kinect/rgb/' + image_name[11:15] + '.png' 90 | im_rgb = cv2.imread(im_rgb_file, cv2.IMREAD_UNCHANGED) 91 | 92 | # Detect all object classes and regress object bounds 93 | timer = Timer() 94 | timer.tic() 95 | scores, boxes = im_detect(sess, net, im) 96 | 97 | timer.toc() 98 | print('Detection took {:.3f}s for {:d} object proposals'.format(timer.total_time, boxes.shape[0])) 99 | 100 | fig, ax = plt.subplots(figsize=(12, 12)) 101 | # Visualize detections for each class 102 | CONF_THRESH = 0.1 103 | NMS_THRESH = 0.3 104 | for cls_ind, cls in enumerate(CLASSES[1:]): 105 | cls_ind += 1 # because we skipped background 106 | cls_boxes = boxes[:, 4*cls_ind:4*(cls_ind + 1)] 107 | cls_scores = scores[:, cls_ind] 108 | dets = np.hstack((cls_boxes, 109 | cls_scores[:, np.newaxis])).astype(np.float32) 110 | keep = nms(dets, NMS_THRESH) 111 | dets = dets[keep, :] 112 | vis_detections(ax, image_name, im_rgb, cls, dets, thresh=CONF_THRESH) 113 | 114 | plt.axis('off') 115 | plt.tight_layout() 116 | 117 | #save result 118 | savepath = os.path.join('..', 'data', 'demo', 'results_all_cls', str(image_name)[:-4]) 119 | # savepath = '../data/demo/results_all_cls/' + str(image_name)[:-4] 120 | plt.savefig(savepath) 121 | 122 | plt.draw() 123 | 124 | def parse_args(): 125 | """Parse input arguments.""" 126 | parser = argparse.ArgumentParser(description='Tensorflow Faster R-CNN demo') 127 | parser.add_argument('--net', dest='demo_net', help='Network to use [vgg16 res101]', 128 | choices=NETS.keys(), default='res101') 129 | parser.add_argument('--dataset', dest='dataset', help='Trained dataset [pascal_voc pascal_voc_0712]', 130 | choices=DATASETS.keys(), default='pascal_voc_0712') 131 | args = parser.parse_args() 132 | 133 | return args 134 | 135 | if __name__ == '__main__': 136 | cfg.TEST.HAS_RPN = True # Use RPN for proposals 137 | args = parse_args() 138 | 139 | # model path 140 | demonet = args.demo_net 141 | dataset = args.dataset 142 | tfmodel = os.path.join('..', 'output', demonet, DATASETS[dataset][0], 'default', 143 | NETS[demonet][0]) 144 | 145 | 146 | if not os.path.isfile(tfmodel + '.meta'): 147 | raise IOError(('{:s} not found.\nDid you download the proper networks from ' 148 | 'our server and place them properly?').format(tfmodel + '.meta')) 149 | 150 | # set config 151 | tfconfig = tf.ConfigProto(allow_soft_placement=True) 152 | tfconfig.gpu_options.allow_growth=True 153 | 154 | # init session 155 | sess = tf.Session(config=tfconfig) 156 | # load network 157 | if demonet == 'vgg16': 158 | net = vgg16(batch_size=1) 159 | elif demonet == 'res101': 160 | net = resnetv1(batch_size=1, num_layers=101) 161 | elif demonet == 'res50': 162 | net = resnetv1(batch_size=1, num_layers=50) 163 | else: 164 | raise NotImplementedError 165 | net.create_architecture(sess, "TEST", 20, 166 | tag='default', anchor_scales=[8, 16, 32]) 167 | saver = tf.train.Saver() 168 | 
saver.restore(sess, tfmodel) 169 | 170 | print('Loaded network {:s}'.format(tfmodel)) 171 | 172 | im_names = ['scene_0108+0036.png','scene_0129+0058.png','scene_0156+0010.png','scene_0174+0092.png'] 173 | for im_name in im_names: 174 | print('~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~') 175 | print('Demo for data/demo/{}'.format(im_name)) 176 | demo(sess, net, im_name) 177 | 178 | plt.show() 179 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/tools/demo_graspRGD_vis_mask.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python 2 | 3 | # -------------------------------------------------------- 4 | # Tensorflow Faster R-CNN 5 | # Licensed under The MIT License [see LICENSE for details] 6 | # Written by Xinlei Chen, based on code from Ross Girshick 7 | # -------------------------------------------------------- 8 | 9 | """ 10 | Demo script showing detections in sample images. 11 | 12 | See README.md for installation instructions before running. 13 | """ 14 | from __future__ import absolute_import 15 | from __future__ import division 16 | from __future__ import print_function 17 | 18 | import _init_paths 19 | from model.config import cfg 20 | from model.test import im_detect 21 | from model.nms_wrapper import nms 22 | 23 | from utils.timer import Timer 24 | import tensorflow as tf 25 | import matplotlib.pyplot as plt 26 | import numpy as np 27 | import os, cv2 28 | import argparse 29 | 30 | from nets.vgg16 import vgg16 31 | from nets.resnet_v1 import resnetv1 32 | import scipy 33 | from shapely.geometry import Polygon 34 | 35 | pi = scipy.pi 36 | dot = scipy.dot 37 | sin = scipy.sin 38 | cos = scipy.cos 39 | ar = scipy.array 40 | 41 | CLASSES = ('__background__', 42 | 'angle_01', 'angle_02', 'angle_03', 'angle_04', 'angle_05', 43 | 'angle_06', 'angle_07', 'angle_08', 'angle_09', 'angle_10', 44 | 'angle_11', 'angle_12', 'angle_13', 'angle_14', 'angle_15', 45 | 'angle_16', 'angle_17', 'angle_18', 'angle_19') 46 | 47 | NETS = {'vgg16': ('vgg16_faster_rcnn_iter_70000.ckpt',),'res101': ('res101_faster_rcnn_iter_110000.ckpt',),'res50': ('res50_faster_rcnn_iter_240000.ckpt',)} 48 | DATASETS= {'pascal_voc': ('voc_2007_trainval',),'pascal_voc_0712': ('voc_2007_trainval+voc_2012_trainval',),'grasp': ('train',)} 49 | 50 | def Rotate2D(pts,cnt,ang=scipy.pi/4): 51 | '''pts = {} Rotates points(nx2) about center cnt(2) by angle ang(1) in radian''' 52 | return dot(pts-cnt,ar([[cos(ang),sin(ang)],[-sin(ang),cos(ang)]]))+cnt 53 | 54 | def vis_detections(ax, image_name, im, class_name, dets, thresh=0.5): 55 | """Draw detected bounding boxes.""" 56 | inds = np.where(dets[:, -1] >= thresh)[0] 57 | if len(inds) == 0: 58 | return 59 | 60 | im = im[:, :, (2, 1, 0)] 61 | #fig, ax = plt.subplots(figsize=(12, 12)) 62 | ax.imshow(im, aspect='equal') 63 | 64 | for i in inds: 65 | bbox = dets[i, :4] 66 | score = dets[i, -1] 67 | 68 | #ax.add_patch( 69 | # plt.Rectangle((bbox[0], bbox[1]), 70 | # bbox[2] - bbox[0], 71 | # bbox[3] - bbox[1], fill=False, 72 | # edgecolor='red', linewidth=3.5) 73 | # ) 74 | 75 | # plot rotated rectangles 76 | pts = ar([[bbox[0],bbox[1]], [bbox[2], bbox[1]], [bbox[2], bbox[3]], [bbox[0], bbox[3]]]) 77 | cnt = ar([(bbox[0] + bbox[2])/2, (bbox[1] + bbox[3])/2]) 78 | angle = int(class_name[6:]) 79 | r_bbox = Rotate2D(pts, cnt, -pi/2-pi/20*(angle-1)) 80 | pred_label_polygon = Polygon([(r_bbox[0,0],r_bbox[0,1]), (r_bbox[1,0], r_bbox[1,1]), (r_bbox[2,0], r_bbox[2,1]), (r_bbox[3,0], 
r_bbox[3,1])]) 81 | pred_x, pred_y = pred_label_polygon.exterior.xy 82 | 83 | plt.plot(pred_x[0:2],pred_y[0:2], color='k', alpha = 0.7, linewidth=1, solid_capstyle='round', zorder=2) 84 | plt.plot(pred_x[1:3],pred_y[1:3], color='r', alpha = 0.7, linewidth=3, solid_capstyle='round', zorder=2) 85 | plt.plot(pred_x[2:4],pred_y[2:4], color='k', alpha = 0.7, linewidth=1, solid_capstyle='round', zorder=2) 86 | plt.plot(pred_x[3:5],pred_y[3:5], color='r', alpha = 0.7, linewidth=3, solid_capstyle='round', zorder=2) 87 | 88 | #ax.text(bbox[0], bbox[1] - 2, 89 | # '{:s} {:.3f}'.format(class_name, score), 90 | # bbox=dict(facecolor='blue', alpha=0.5), 91 | # fontsize=14, color='white') 92 | 93 | #ax.set_title(('{} detections with ' 94 | # 'p({} | box) >= {:.1f}').format(class_name, class_name, 95 | # thresh), 96 | # fontsize=14) 97 | #plt.axis('off') 98 | #plt.tight_layout() 99 | 100 | #save result 101 | #savepath = './data/demo/results/' + str(image_name) + str(class_name) + '.png' 102 | #plt.savefig(savepath) 103 | 104 | #plt.draw() 105 | 106 | def demo(sess, net, image_name, mask_name): 107 | """Detect object classes in an image using pre-computed object proposals.""" 108 | 109 | # Load the demo image 110 | im_file = os.path.join(cfg.DATA_DIR, 'demo', image_name) 111 | mask_file = os.path.join(cfg.DATA_DIR, 'demo', mask_name) 112 | im = cv2.imread(im_file, cv2.IMREAD_UNCHANGED) 113 | mask = cv2.imread(mask_file,0) 114 | #im = im*np.stack([mask,mask,mask], axis=2) 115 | im = cv2.bitwise_and(im,im,mask = mask) 116 | 117 | 118 | # Detect all object classes and regress object bounds 119 | timer = Timer() 120 | timer.tic() 121 | scores, boxes = im_detect(sess, net, im) 122 | 123 | #scores_max = scores[:,1:-1].max(axis=1) 124 | #scores_max_idx = np.argmax(scores_max) 125 | #scores = scores[scores_max_idx:scores_max_idx+1,:] 126 | #boxes = boxes[scores_max_idx:scores_max_idx+1, :] 127 | 128 | #im = cv2.imread('/home/fujenchu/projects/deepLearning/tensorflow-finetune-flickr-style-master/data/grasps_ivalab/rgb_cropped320/rgb_0076Cropped320.png') 129 | timer.toc() 130 | print('Detection took {:.3f}s for {:d} object proposals'.format(timer.total_time, boxes.shape[0])) 131 | 132 | fig, ax = plt.subplots(figsize=(12, 12)) 133 | # Visualize detections for each class 134 | CONF_THRESH = 0.1 135 | NMS_THRESH = 0.3 136 | for cls_ind, cls in enumerate(CLASSES[1:]): 137 | cls_ind += 1 # because we skipped background 138 | cls_boxes = boxes[:, 4*cls_ind:4*(cls_ind + 1)] 139 | cls_scores = scores[:, cls_ind] 140 | dets = np.hstack((cls_boxes, 141 | cls_scores[:, np.newaxis])).astype(np.float32) 142 | keep = nms(dets, NMS_THRESH) 143 | dets = dets[keep, :] 144 | vis_detections(ax, image_name, im, cls, dets, thresh=CONF_THRESH) 145 | #tmp = max(cls_scores) 146 | 147 | plt.axis('off') 148 | plt.tight_layout() 149 | 150 | #cv2.imshow('deepGrasp_top_score', im) 151 | #choice = cv2.waitKey(100) 152 | 153 | #save result 154 | savepath = './data/demo/results_all_cls/' + str(image_name) + '.png' 155 | plt.savefig(savepath) 156 | 157 | plt.draw() 158 | 159 | def parse_args(): 160 | """Parse input arguments.""" 161 | parser = argparse.ArgumentParser(description='Tensorflow Faster R-CNN demo') 162 | parser.add_argument('--net', dest='demo_net', help='Network to use [vgg16 res101]', 163 | choices=NETS.keys(), default='res101') 164 | parser.add_argument('--dataset', dest='dataset', help='Trained dataset [pascal_voc pascal_voc_0712]', 165 | choices=DATASETS.keys(), default='pascal_voc_0712') 166 | args = parser.parse_args() 167 | 
168 | return args 169 | 170 | if __name__ == '__main__': 171 | cfg.TEST.HAS_RPN = True # Use RPN for proposals 172 | args = parse_args() 173 | 174 | # model path 175 | demonet = args.demo_net 176 | dataset = args.dataset 177 | tfmodel = os.path.join('output', demonet, DATASETS[dataset][0], 'default', 178 | NETS[demonet][0]) 179 | 180 | 181 | if not os.path.isfile(tfmodel + '.meta'): 182 | raise IOError(('{:s} not found.\nDid you download the proper networks from ' 183 | 'our server and place them properly?').format(tfmodel + '.meta')) 184 | 185 | # set config 186 | tfconfig = tf.ConfigProto(allow_soft_placement=True) 187 | tfconfig.gpu_options.allow_growth=True 188 | 189 | # init session 190 | sess = tf.Session(config=tfconfig) 191 | # load network 192 | if demonet == 'vgg16': 193 | net = vgg16(batch_size=1) 194 | elif demonet == 'res101': 195 | net = resnetv1(batch_size=1, num_layers=101) 196 | elif demonet == 'res50': 197 | net = resnetv1(batch_size=1, num_layers=50) 198 | else: 199 | raise NotImplementedError 200 | net.create_architecture(sess, "TEST", 20, 201 | tag='default', anchor_scales=[8, 16, 32]) 202 | saver = tf.train.Saver() 203 | saver.restore(sess, tfmodel) 204 | 205 | print('Loaded network {:s}'.format(tfmodel)) 206 | 207 | #im_names = ['rgd_0076Cropped320.png','rgd_0095.png','pcd0122r_rgd_preprocessed_1.png','pcd0875r_rgd_preprocessed_1.png','resized_0875_2.png'] 208 | im_names = ['rgd_0000Cropped320.png'] 209 | mask_name = 'mask.jpg' 210 | 211 | for im_name in im_names: 212 | print('~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~') 213 | print('Demo for data/demo/{}'.format(im_name)) 214 | demo(sess, net, im_name, mask_name) 215 | 216 | plt.show() 217 | -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/tools/demo_graspRGD_vis_select.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python 2 | 3 | # -------------------------------------------------------- 4 | # Tensorflow Faster R-CNN 5 | # Licensed under The MIT License [see LICENSE for details] 6 | # Written by Xinlei Chen, based on code from Ross Girshick 7 | # -------------------------------------------------------- 8 | 9 | """ 10 | Demo script showing detections in sample images. 11 | 12 | See README.md for installation instructions before running. 
13 | """ 14 | from __future__ import absolute_import 15 | from __future__ import division 16 | from __future__ import print_function 17 | 18 | import _init_paths 19 | from model.config import cfg 20 | from model.test import im_detect 21 | from model.nms_wrapper import nms 22 | 23 | from utils.timer import Timer 24 | import tensorflow as tf 25 | import matplotlib.pyplot as plt 26 | import numpy as np 27 | import os, cv2 28 | import argparse 29 | 30 | from nets.vgg16 import vgg16 31 | from nets.resnet_v1 import resnetv1 32 | import scipy 33 | from shapely.geometry import Polygon 34 | 35 | pi = scipy.pi 36 | dot = scipy.dot 37 | sin = scipy.sin 38 | cos = scipy.cos 39 | ar = scipy.array 40 | 41 | CLASSES = ('__background__', 42 | 'angle_01', 'angle_02', 'angle_03', 'angle_04', 'angle_05', 43 | 'angle_06', 'angle_07', 'angle_08', 'angle_09', 'angle_10', 44 | 'angle_11', 'angle_12', 'angle_13', 'angle_14', 'angle_15', 45 | 'angle_16', 'angle_17', 'angle_18', 'angle_19') 46 | 47 | global SELECTION_COUNT 48 | SELECTION_COUNT = 0 49 | NETS = {'vgg16': ('vgg16_faster_rcnn_iter_70000.ckpt',),'res101': ('res101_faster_rcnn_iter_110000.ckpt',),'res50': ('res50_faster_rcnn_iter_240000.ckpt',)} 50 | DATASETS= {'pascal_voc': ('voc_2007_trainval',),'pascal_voc_0712': ('voc_2007_trainval+voc_2012_trainval',),'grasp': ('train',)} 51 | 52 | 53 | def Rotate2D(pts,cnt,ang=scipy.pi/4): 54 | '''pts = {} Rotates points(nx2) about center cnt(2) by angle ang(1) in radian''' 55 | return dot(pts-cnt,ar([[cos(ang),sin(ang)],[-sin(ang),cos(ang)]]))+cnt 56 | 57 | def vis_detections(ax, image_name, im, class_name, dets, thresh=0.5): 58 | """Draw detected bounding boxes.""" 59 | inds = np.where(dets[:, -1] >= thresh)[0] 60 | if len(inds) == 0: 61 | return 62 | 63 | im = im[:, :, (2, 1, 0)] 64 | #fig, ax = plt.subplots(figsize=(12, 12)) 65 | ax.imshow(im, aspect='equal') 66 | for i in inds: 67 | bbox = dets[i, :4] 68 | score = dets[i, -1] 69 | 70 | #ax.add_patch( 71 | # plt.Rectangle((bbox[0], bbox[1]), 72 | # bbox[2] - bbox[0], 73 | # bbox[3] - bbox[1], fill=False, 74 | # edgecolor='red', linewidth=3.5) 75 | # ) 76 | 77 | # plot rotated rectangles 78 | pts = ar([[bbox[0],bbox[1]], [bbox[2], bbox[1]], [bbox[2], bbox[3]], [bbox[0], bbox[3]]]) 79 | cnt = ar([(bbox[0] + bbox[2])/2, (bbox[1] + bbox[3])/2]) 80 | angle = int(class_name[6:]) 81 | r_bbox = Rotate2D(pts, cnt, -pi/2-pi/20*(angle-1)) 82 | pred_label_polygon = Polygon([(r_bbox[0,0],r_bbox[0,1]), (r_bbox[1,0], r_bbox[1,1]), (r_bbox[2,0], r_bbox[2,1]), (r_bbox[3,0], r_bbox[3,1])]) 83 | pred_x, pred_y = pred_label_polygon.exterior.xy 84 | 85 | plt.plot(pred_x[0:2],pred_y[0:2], color='k', alpha = 0.7, linewidth=1, solid_capstyle='round', zorder=2) 86 | plt.plot(pred_x[1:3],pred_y[1:3], color='r', alpha = 0.7, linewidth=3, solid_capstyle='round', zorder=2) 87 | plt.plot(pred_x[2:4],pred_y[2:4], color='k', alpha = 0.7, linewidth=1, solid_capstyle='round', zorder=2) 88 | plt.plot(pred_x[3:5],pred_y[3:5], color='r', alpha = 0.7, linewidth=3, solid_capstyle='round', zorder=2) 89 | 90 | #ax.text(bbox[0], bbox[1] - 2, 91 | # '{:s} {:.3f}'.format(class_name, score), 92 | # bbox=dict(facecolor='blue', alpha=0.5), 93 | # fontsize=14, color='white') 94 | global SELECTION_COUNT 95 | ax.text(bbox[0], bbox[1] - 2, 96 | '{:s} {:.3f}'.format(str(SELECTION_COUNT), score), 97 | bbox=dict(facecolor='blue', alpha=0.5), 98 | fontsize=14, color='white') 99 | SELECTION_COUNT = SELECTION_COUNT + 1 100 | 101 | #ax.set_title(('{} detections with ' 102 | # 'p({} | box) >= 
{:.1f}').format(class_name, class_name, 103 | # thresh), 104 | # fontsize=14) 105 | #plt.axis('off') 106 | #plt.tight_layout() 107 | 108 | #save result 109 | #savepath = './data/demo/results/' + str(image_name) + str(class_name) + '.png' 110 | #plt.savefig(savepath) 111 | 112 | #plt.draw() 113 | 114 | def demo(sess, net, image_name): 115 | """Detect object classes in an image using pre-computed object proposals.""" 116 | 117 | # Load the demo image 118 | im_file = os.path.join(cfg.DATA_DIR, 'demo', image_name) 119 | im = cv2.imread(im_file, cv2.IMREAD_UNCHANGED) 120 | #print(im) 121 | 122 | # Detect all object classes and regress object bounds 123 | timer = Timer() 124 | timer.tic() 125 | scores, boxes = im_detect(sess, net, im) 126 | 127 | #scores_max = scores[:,1:-1].max(axis=1) 128 | #scores_max_idx = np.argmax(scores_max) 129 | #scores = scores[scores_max_idx:scores_max_idx+1,:] 130 | #boxes = boxes[scores_max_idx:scores_max_idx+1, :] 131 | 132 | #im = cv2.imread('/home/fujenchu/projects/deepLearning/tensorflow-finetune-flickr-style-master/data/grasps_ivalab/rgb_cropped320/rgb_0076Cropped320.png') 133 | timer.toc() 134 | print('Detection took {:.3f}s for {:d} object proposals'.format(timer.total_time, boxes.shape[0])) 135 | 136 | fig, ax = plt.subplots(figsize=(12, 12)) 137 | # Visualize detections for each class 138 | CONF_THRESH = 0.1 139 | NMS_THRESH = 0.3 140 | global SELECTION_COUNT 141 | SELECTION_COUNT = 0 142 | for cls_ind, cls in enumerate(CLASSES[1:]): 143 | cls_ind += 1 # because we skipped background 144 | cls_boxes = boxes[:, 4*cls_ind:4*(cls_ind + 1)] 145 | cls_scores = scores[:, cls_ind] 146 | dets = np.hstack((cls_boxes, 147 | cls_scores[:, np.newaxis])).astype(np.float32) 148 | keep = nms(dets, NMS_THRESH) 149 | dets = dets[keep, :] 150 | vis_detections(ax, image_name, im, cls, dets, thresh=CONF_THRESH) 151 | #tmp = max(cls_scores) 152 | 153 | plt.axis('off') 154 | plt.tight_layout() 155 | 156 | #cv2.imshow('deepGrasp_top_score', im) 157 | #choice = cv2.waitKey(100) 158 | 159 | #save result 160 | savepath = './data/demo/results_all_cls/' + str(image_name) + '.png' 161 | plt.savefig(savepath) 162 | 163 | plt.draw() 164 | 165 | def parse_args(): 166 | """Parse input arguments.""" 167 | parser = argparse.ArgumentParser(description='Tensorflow Faster R-CNN demo') 168 | parser.add_argument('--net', dest='demo_net', help='Network to use [vgg16 res101]', 169 | choices=NETS.keys(), default='res101') 170 | parser.add_argument('--dataset', dest='dataset', help='Trained dataset [pascal_voc pascal_voc_0712]', 171 | choices=DATASETS.keys(), default='pascal_voc_0712') 172 | args = parser.parse_args() 173 | 174 | return args 175 | 176 | if __name__ == '__main__': 177 | cfg.TEST.HAS_RPN = True # Use RPN for proposals 178 | args = parse_args() 179 | 180 | # model path 181 | demonet = args.demo_net 182 | dataset = args.dataset 183 | tfmodel = os.path.join('output', demonet, DATASETS[dataset][0], 'default', 184 | NETS[demonet][0]) 185 | 186 | 187 | if not os.path.isfile(tfmodel + '.meta'): 188 | raise IOError(('{:s} not found.\nDid you download the proper networks from ' 189 | 'our server and place them properly?').format(tfmodel + '.meta')) 190 | 191 | # set config 192 | tfconfig = tf.ConfigProto(allow_soft_placement=True) 193 | tfconfig.gpu_options.allow_growth=True 194 | 195 | # init session 196 | sess = tf.Session(config=tfconfig) 197 | # load network 198 | if demonet == 'vgg16': 199 | net = vgg16(batch_size=1) 200 | elif demonet == 'res101': 201 | net = resnetv1(batch_size=1, 
num_layers=101)
202 |     elif demonet == 'res50':
203 |         net = resnetv1(batch_size=1, num_layers=50)
204 |     else:
205 |         raise NotImplementedError
206 |     net.create_architecture(sess, "TEST", 20,
207 |                             tag='default', anchor_scales=[8, 16, 32])
208 |     saver = tf.train.Saver()
209 |     saver.restore(sess, tfmodel)
210 | 
211 |     print('Loaded network {:s}'.format(tfmodel))
212 | 
213 |     #im_names = ['rgd_0076Cropped320.png','rgd_0095.png','pcd0122r_rgd_preprocessed_1.png','pcd0875r_rgd_preprocessed_1.png','resized_0875_2.png']
214 |     im_names = ['pcd0100r_rgd_preprocessed_1.png','pcd0266r_rgd_preprocessed_1.png','pcd0882r_rgd_preprocessed_1.png','rgd_0000Cropped320.png']
215 |     for im_name in im_names:
216 |         print('~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~')
217 |         print('Demo for data/demo/{}'.format(im_name))
218 |         demo(sess, net, im_name)
219 | 
220 |     plt.show()
221 | 
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/graspnet_config.py:
--------------------------------------------------------------------------------
1 | import os
2 | 
3 | GRASPNET_ROOT = os.path.abspath(os.path.join(os.path.split(os.path.abspath(__file__))[0], '..', '..', 'graspnet_dataset'))
4 | CAMERA_NAME = 'kinect'
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/mask_gen.py:
--------------------------------------------------------------------------------
1 | import numpy as np
2 | import cv2
3 | 
4 | mask = np.zeros((227,227))
5 | mask[70:120,90:150] = 1
6 | # The original `scipy.misc.imsave` was removed in SciPy >= 1.2; write the
7 | # binary mask with OpenCV (already a project dependency) instead.
8 | cv2.imwrite('mask.jpg', (mask * 255).astype(np.uint8))
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/predict_graspRGD.py:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env python
2 | 
3 | from __future__ import absolute_import
4 | from __future__ import division
5 | from __future__ import print_function
6 | 
7 | import _init_paths
8 | from model.config import cfg
9 | from model.test import im_detect
10 | from model.nms_wrapper import nms
11 | 
12 | from utils.timer import Timer
13 | import tensorflow as tf
14 | import numpy as np
15 | import os, cv2
16 | import argparse
17 | 
18 | from nets.vgg16 import vgg16
19 | from nets.resnet_v1 import resnetv1
20 | import scipy
21 | 
22 | import graspnet_config
23 | 
24 | pi = scipy.pi
25 | dot = scipy.dot
26 | sin = scipy.sin
27 | cos = scipy.cos
28 | ar = scipy.array
29 | 
30 | os.environ['CUDA_VISIBLE_DEVICES'] = '1'  # Choose GPU
31 | 
32 | CLASSES = ('__background__',
33 |            'angle_01', 'angle_02', 'angle_03', 'angle_04', 'angle_05',
34 |            'angle_06', 'angle_07', 'angle_08', 'angle_09', 'angle_10',
35 |            'angle_11', 'angle_12', 'angle_13', 'angle_14', 'angle_15',
36 |            'angle_16', 'angle_17', 'angle_18', 'angle_19')
37 | 
38 | NETS = {'vgg16': ('vgg16_faster_rcnn_iter_70000.ckpt',),'res101': ('res101_faster_rcnn_iter_110000.ckpt',),'res50': ('res50_faster_rcnn_iter_240000.ckpt',)}
39 | DATASETS= {'pascal_voc': ('voc_2007_trainval',),'pascal_voc_0712': ('voc_2007_trainval+voc_2012_trainval',),'grasp': ('train',)}
40 | 
41 | def Rotate2D(pts, cnt, ang=scipy.pi/4):
42 |     '''Rotates points (n x 2) about center cnt (2) by angle ang in radians'''
43 |     return dot(pts-cnt, ar([[cos(ang), sin(ang)], [-sin(ang), cos(ang)]])) + cnt
44 | 
45 | def add_predicted_grasps(class_name, dets, image_grasps, thresh=0.5):
46 |     """Collect detections above the threshold as grasp records."""
47 |     inds = np.where(dets[:, -1] >= thresh)[0]
48 |     if len(inds) == 0:
49 |         return 0, 0
50 | 
51 |     angle_class = int(class_name[6:])
52 | 
53 |     for i in inds:
54 |         bbox = dets[i, :4]
55 |         score = dets[i, -1]
56 |         # plot rotated rectangles
57 |         height = bbox[3] - bbox[1]
58 |         cnt = ar([(bbox[0] + bbox[2])/2, (bbox[1] + bbox[3])/2])
59 |         open_point = ar([bbox[2], (bbox[1] + bbox[3])/2])
60 |         rotated_open_point = Rotate2D(open_point, cnt, -pi/2-pi/18*(angle_class-1)) # rotated rectangle (e.g. class 2: -100 degrees, which corresponds to 100 degrees in a y-up coordinate frame, i.e. -80 degrees)
61 |         this_grasp = list(cnt) + list(rotated_open_point)
62 |         this_grasp.append(height)
63 |         this_grasp.append(score)
64 |         this_grasp.append(-1)
65 |         image_grasps.append(this_grasp)
66 | 
67 | def demo(sess, net, image_name, CONF_THRESH):
68 |     """Detect object classes in an image using pre-computed object proposals."""
69 | 
70 |     # Load the demo image
71 |     im_file = os.path.join(cfg.DATA_DIR, 'demo', 'Images', image_name)
72 |     im = cv2.imread(im_file, cv2.IMREAD_UNCHANGED)
73 | 
74 |     scene_name = image_name[:10] # 'scene_0021'
75 |     image_index = image_name[11:15] # '0003'
76 | 
77 |     # Detect all object classes and regress object bounds
78 |     timer = Timer()
79 |     timer.tic()
80 |     scores, boxes = im_detect(sess, net, im)
81 | 
82 |     timer.toc()
83 | 
84 |     NMS_THRESH = 0.3
85 | 
86 |     image_grasps = []
87 | 
88 |     for cls_ind, cls in enumerate(CLASSES[1:]):
89 |         cls_ind += 1 # because we skipped background
90 |         cls_boxes = boxes[:, 4*cls_ind:4*(cls_ind + 1)]
91 |         cls_scores = scores[:, cls_ind]
92 |         dets = np.hstack((cls_boxes,
93 |                           cls_scores[:, np.newaxis])).astype(np.float32)
94 |         keep = nms(dets, NMS_THRESH)
95 |         dets = dets[keep, :]
96 |         add_predicted_grasps(cls, dets, image_grasps, thresh=CONF_THRESH)
97 | 
98 |     image_grasps = np.array(image_grasps)
99 |     np.save(os.path.join('..', 'predicted_rectangle_grasp', scene_name, graspnet_config.CAMERA_NAME, image_index), image_grasps)
100 | 
101 | 
102 | def parse_args():
103 |     """Parse input arguments."""
104 |     parser = argparse.ArgumentParser(description='Tensorflow Faster R-CNN demo')
105 |     parser.add_argument('--net', dest='demo_net', help='Network to use [vgg16 res101]',
106 |                         choices=NETS.keys(), default='res101')
107 |     parser.add_argument('--dataset', dest='dataset', help='Trained dataset [pascal_voc pascal_voc_0712]',
108 |                         choices=DATASETS.keys(), default='pascal_voc_0712')
109 |     args = parser.parse_args()
110 | 
111 |     return args
112 | 
113 | if __name__ == '__main__':
114 |     cfg.TEST.HAS_RPN = True  # Use RPN for proposals
115 |     args = parse_args()
116 | 
117 |     # model path
118 |     demonet = args.demo_net
119 |     dataset = args.dataset
120 |     tfmodel = os.path.join('..', 'output', demonet, DATASETS[dataset][0], 'default',
121 |                            NETS[demonet][0])
122 | 
123 | 
124 |     if not os.path.isfile(tfmodel + '.meta'):
125 |         raise IOError(('{:s} not found.\nDid you download the proper networks from '
126 |                        'our server and place them properly?').format(tfmodel + '.meta'))
127 | 
128 |     # set config
129 |     tfconfig = tf.ConfigProto(allow_soft_placement=True)
130 |     tfconfig.gpu_options.allow_growth=True
131 | 
132 |     # init session
133 |     sess = tf.Session(config=tfconfig)
134 |     # load network
135 |     if demonet == 'vgg16':
136 |         net = vgg16(batch_size=1)
137 |     elif demonet == 'res101':
138 |         net = resnetv1(batch_size=1, num_layers=101)
139 |     elif demonet == 'res50':
140 |         net = resnetv1(batch_size=1, num_layers=50)
141 |     else:
142 |         raise NotImplementedError
143 |     net.create_architecture(sess, "TEST", 20,
144 |                             tag='default', anchor_scales=[8, 16, 32])
145 |     saver = tf.train.Saver()
146 |     saver.restore(sess, tfmodel)
147 | 
148 |     print('Loaded network {:s}'.format(tfmodel))
149 | 
150 | 
151 |     CONF_THRESH = 0.0
152 | 
153 |     for scene_index in range(100, 190):
154 |         scene_name = 'scene_{}'.format(str(scene_index).zfill(4)) # 'scene_0012'
155 |         if not os.path.exists(os.path.join('..', 'predicted_rectangle_grasp', scene_name)):
156 |             os.mkdir(os.path.join('..', 'predicted_rectangle_grasp', scene_name))
157 |         if not os.path.exists(os.path.join('..', 'predicted_rectangle_grasp', scene_name, graspnet_config.CAMERA_NAME)):
158 |             os.mkdir(os.path.join('..', 'predicted_rectangle_grasp', scene_name, graspnet_config.CAMERA_NAME))
159 |         print(scene_name)
160 |         for img_index in range(256):
161 |             im_name = '{}+{}.png'.format(scene_name, str(img_index).zfill(4))
162 |             demo(sess, net, im_name, CONF_THRESH)
163 | 
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/result/FPPI.npy:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/tools/result/FPPI.npy
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/result/analysis.py:
--------------------------------------------------------------------------------
1 | import numpy as np
2 | 
3 | # FPPI.npy miss_rate.npy total_false_positive_num.npy total_gt_num.npy total_missed_gt_grasp_num.npy total_proposed_num.npy
4 | 
5 | FPPI = np.load('FPPI.npy')
6 | miss_rate = np.load('miss_rate.npy')
7 | total_false_positive_num = np.load('total_false_positive_num.npy')
8 | total_gt_num = np.load('total_gt_num.npy')
9 | total_missed_gt_grasp_num = np.load('total_missed_gt_grasp_num.npy')
10 | total_proposed_num = np.load('total_proposed_num.npy')
11 | 
12 | total_true_positive_num = total_proposed_num - total_false_positive_num
13 | # fraction of proposed grasps that are true positives (i.e. detection precision)
14 | accuracy = total_true_positive_num / total_proposed_num
15 | 
16 | print('FPPI: {}'.format(FPPI))
17 | print('miss rate: {}'.format(miss_rate))
18 | print('accuracy: {}'.format(accuracy))
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/result/miss_rate.npy:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/tools/result/miss_rate.npy
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/result/total_false_positive_num.npy:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/tools/result/total_false_positive_num.npy
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/result/total_gt_num.npy:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/tools/result/total_gt_num.npy
--------------------------------------------------------------------------------
/grasp_multiObject_multiGrasp/tools/result/total_missed_gt_grasp_num.npy:
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/tools/result/total_missed_gt_grasp_num.npy -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/tools/result/total_proposed_num.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/graspnet/rectangle-graspnet-multiObject-multiGrasp/672ee86a1d49c455b7da77237b57976ea11465fd/grasp_multiObject_multiGrasp/tools/result/total_proposed_num.npy -------------------------------------------------------------------------------- /grasp_multiObject_multiGrasp/tools/trainval_net.py: -------------------------------------------------------------------------------- 1 | # -------------------------------------------------------- 2 | # Tensorflow Faster R-CNN 3 | # Licensed under The MIT License [see LICENSE for details] 4 | # Written by Zheqi He, Xinlei Chen, based on code from Ross Girshick 5 | # -------------------------------------------------------- 6 | from __future__ import absolute_import 7 | from __future__ import division 8 | from __future__ import print_function 9 | 10 | import _init_paths 11 | from model.train_val import get_training_roidb, train_net 12 | from model.config import cfg, cfg_from_file, cfg_from_list, get_output_dir, get_output_tb_dir 13 | from datasets.factory import get_imdb 14 | import datasets.imdb 15 | import argparse 16 | import pprint 17 | import numpy as np 18 | import sys 19 | 20 | import tensorflow as tf 21 | from nets.vgg16 import vgg16 22 | from nets.resnet_v1 import resnetv1 23 | 24 | def parse_args(): 25 | """ 26 | Parse input arguments 27 | """ 28 | parser = argparse.ArgumentParser(description='Train a Fast R-CNN network') 29 | parser.add_argument('--cfg', dest='cfg_file', 30 | help='optional config file', 31 | default=None, type=str) 32 | parser.add_argument('--weight', dest='weight', 33 | help='initialize with pretrained model weights', 34 | type=str) 35 | parser.add_argument('--imdb', dest='imdb_name', 36 | help='dataset to train on', 37 | default='voc_2007_trainval', type=str) 38 | parser.add_argument('--imdbval', dest='imdbval_name', 39 | help='dataset to validate on', 40 | default='voc_2007_test', type=str) 41 | parser.add_argument('--iters', dest='max_iters', 42 | help='number of iterations to train', 43 | default=70000, type=int) 44 | parser.add_argument('--tag', dest='tag', 45 | help='tag of the model', 46 | default=None, type=str) 47 | parser.add_argument('--net', dest='net', 48 | help='vgg16, res50, res101, res152', 49 | default='res50', type=str) 50 | parser.add_argument('--set', dest='set_cfgs', 51 | help='set config keys', default=None, 52 | nargs=argparse.REMAINDER) 53 | 54 | if len(sys.argv) == 1: 55 | parser.print_help() 56 | sys.exit(1) 57 | 58 | args = parser.parse_args() 59 | return args 60 | 61 | 62 | def combined_roidb(imdb_names): 63 | """ 64 | Combine multiple roidbs 65 | """ 66 | 67 | def get_roidb(imdb_name): 68 | imdb = get_imdb(imdb_name) 69 | print('Loaded dataset `{:s}` for training'.format(imdb.name)) 70 | imdb.set_proposal_method(cfg.TRAIN.PROPOSAL_METHOD) 71 | print('Set proposal method: {:s}'.format(cfg.TRAIN.PROPOSAL_METHOD)) 72 | roidb = get_training_roidb(imdb) 73 | return roidb 74 | 75 | roidbs = [get_roidb(s) for s in imdb_names.split('+')] 76 | roidb = roidbs[0] 77 | if 
len(roidbs) > 1: 78 | for r in roidbs[1:]: 79 | roidb.extend(r) 80 | tmp = get_imdb(imdb_names.split('+')[1]) 81 | imdb = datasets.imdb.imdb(imdb_names, tmp.classes) 82 | else: 83 | imdb = get_imdb(imdb_names) 84 | return imdb, roidb 85 | 86 | 87 | if __name__ == '__main__': 88 | args = parse_args() 89 | 90 | print('Called with args:') 91 | print(args) 92 | 93 | if args.cfg_file is not None: 94 | cfg_from_file(args.cfg_file) 95 | if args.set_cfgs is not None: 96 | cfg_from_list(args.set_cfgs) 97 | 98 | print('Using config:') 99 | pprint.pprint(cfg) 100 | 101 | np.random.seed(cfg.RNG_SEED) 102 | 103 | # train set 104 | imdb, roidb = combined_roidb(args.imdb_name) 105 | print('{:d} roidb entries'.format(len(roidb))) 106 | 107 | # output directory where the models are saved 108 | output_dir = get_output_dir(imdb, args.tag) 109 | print('Output will be saved to `{:s}`'.format(output_dir)) 110 | 111 | # tensorboard directory where the summaries are saved during training 112 | tb_dir = get_output_tb_dir(imdb, args.tag) 113 | print('TensorFlow summaries will be saved to `{:s}`'.format(tb_dir)) 114 | 115 | # also add the validation set, but with no flipping images 116 | orgflip = cfg.TRAIN.USE_FLIPPED 117 | cfg.TRAIN.USE_FLIPPED = False 118 | _, valroidb = combined_roidb(args.imdbval_name) 119 | print('{:d} validation roidb entries'.format(len(valroidb))) 120 | cfg.TRAIN.USE_FLIPPED = orgflip 121 | 122 | # load network 123 | if args.net == 'vgg16': 124 | net = vgg16(batch_size=cfg.TRAIN.IMS_PER_BATCH) 125 | elif args.net == 'res50': 126 | net = resnetv1(batch_size=cfg.TRAIN.IMS_PER_BATCH, num_layers=50) 127 | elif args.net == 'res101': 128 | net = resnetv1(batch_size=cfg.TRAIN.IMS_PER_BATCH, num_layers=101) 129 | elif args.net == 'res152': 130 | net = resnetv1(batch_size=cfg.TRAIN.IMS_PER_BATCH, num_layers=152) 131 | else: 132 | raise NotImplementedError 133 | 134 | train_net(net, imdb, roidb, valroidb, output_dir, tb_dir, 135 | pretrained_model=args.weight, 136 | max_iters=args.max_iters) 137 | -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | absl-py==0.9.0 2 | astor==0.8.1 3 | certifi==2020.6.20 4 | cycler==0.10.0 5 | Cython @ file:///tmp/build/80754af9/cython_1594831565616/work 6 | easydict==1.9 7 | gast @ file:///tmp/build/80754af9/gast_1597433534803/work 8 | google-pasta==0.2.0 9 | grpcio @ file:///tmp/build/80754af9/grpcio_1597424460877/work 10 | h5py @ file:///tmp/build/80754af9/h5py_1593454121459/work 11 | importlib-metadata @ file:///tmp/build/80754af9/importlib-metadata_1593446433964/work 12 | Keras-Applications @ file:///tmp/build/80754af9/keras-applications_1594366238411/work 13 | Keras-Preprocessing==1.1.0 14 | kiwisolver==1.2.0 15 | Markdown @ file:///tmp/build/80754af9/markdown_1597433258348/work 16 | matplotlib @ file:///tmp/build/80754af9/matplotlib-base_1592846044287/work 17 | mkl-fft==1.1.0 18 | mkl-random==1.1.1 19 | mkl-service==2.3.0 20 | numpy==1.16.0 21 | olefile==0.46 22 | opencv-python==4.3.0.36 23 | Pillow @ file:///tmp/build/80754af9/pillow_1594307298074/work 24 | protobuf==3.12.4 25 | pyparsing==2.4.7 26 | python-dateutil==2.8.1 27 | PyYAML==5.3.1 28 | scipy @ file:///tmp/build/80754af9/scipy_1597686625380/work 29 | Shapely==1.7.0 30 | six==1.15.0 31 | tensorboard==1.14.0 32 | tensorflow==1.14.0 33 | tensorflow-estimator==1.14.0 34 | termcolor==1.1.0 35 | tornado==6.0.4 36 | Werkzeug==1.0.1 37 | wrapt==1.12.1 38 | zipp==3.1.0 39 | 
--------------------------------------------------------------------------------
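For reference, a minimal sketch of the angle-class convention shared by the demo and prediction scripts above: each detection is an axis-aligned box whose class `angle_k` encodes an in-plane rotation, and the oriented grasp rectangle is recovered by rotating the box corners about its center. Note the scripts differ on the angular step (`pi/20` in `demo_graspRGD.py`, `pi/18` in `predict_graspRGD.py`); the sketch below follows the demo scripts, and its box coordinates are illustrative values, not repository data.

import numpy as np

def rotate2d(pts, cnt, ang):
    # Same rotation as Rotate2D in the scripts above: rotate points (n x 2) about cnt by ang radians.
    rot = np.array([[np.cos(ang), np.sin(ang)],
                    [-np.sin(ang), np.cos(ang)]])
    return (pts - cnt) @ rot + cnt

bbox = np.array([40.0, 60.0, 120.0, 100.0])      # x1, y1, x2, y2 from the detector
angle_class = 5                                  # parsed from the class name 'angle_05'
pts = np.array([[bbox[0], bbox[1]], [bbox[2], bbox[1]],
                [bbox[2], bbox[3]], [bbox[0], bbox[3]]])
cnt = np.array([(bbox[0] + bbox[2]) / 2, (bbox[1] + bbox[3]) / 2])
r_bbox = rotate2d(pts, cnt, -np.pi/2 - np.pi/20 * (angle_class - 1))
print(r_bbox)  # four corners of the oriented grasp rectangle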