├── umd1.jpg ├── umd2.jpg ├── folder.jpg ├── images.zip ├── dataset.zip ├── fine_search.jpg ├── babysitting1.jpg ├── babysitting2.jpg ├── babysitting3.jpg ├── coarse_search.jpg ├── keras-tensorflow-logo.jpg ├── 1_reg_10minus6_lr_10minus4.png ├── 2_reg_10minus6_lr_10power4.png ├── README.txt ├── README.md ├── cnn_code.py └── UMD.py /umd1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/umd1.jpg -------------------------------------------------------------------------------- /umd2.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/umd2.jpg -------------------------------------------------------------------------------- /folder.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/folder.jpg -------------------------------------------------------------------------------- /images.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/images.zip -------------------------------------------------------------------------------- /dataset.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/dataset.zip -------------------------------------------------------------------------------- /fine_search.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/fine_search.jpg -------------------------------------------------------------------------------- /babysitting1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/babysitting1.jpg -------------------------------------------------------------------------------- /babysitting2.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/babysitting2.jpg -------------------------------------------------------------------------------- /babysitting3.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/babysitting3.jpg -------------------------------------------------------------------------------- /coarse_search.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/coarse_search.jpg -------------------------------------------------------------------------------- /keras-tensorflow-logo.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/keras-tensorflow-logo.jpg -------------------------------------------------------------------------------- /1_reg_10minus6_lr_10minus4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/1_reg_10minus6_lr_10minus4.png 
-------------------------------------------------------------------------------- /2_reg_10minus6_lr_10power4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kalyanghosh/Face-Detection-using-CNN/HEAD/2_reg_10minus6_lr_10power4.png -------------------------------------------------------------------------------- /README.txt: -------------------------------------------------------------------------------- 1 | ########################################################################################################### 2 | DATA PREPROCESSING IO CODE (UMD.py) 3 | ########################################################################################################### 4 | #Instructions to run the code UMD.py inside the dataset subfolder of the Project2 folder 5 | 6 | #1. Download the data (Batch 3, 12GB version) from http://www.umdfaces.io/ 7 | #2. Create a folder named data_UMD inside the dataset folder. Inside the data_UMD folder, 8 | # create two dirs named Annotation and original_pics 9 | #3. Extract the dataset inside the original_pics folder and copy the umdfaces_batch3_ultraface.csv annotation 10 | # file to the Annotation folder. 11 | #4. Run the code UMD.py inside the dataset folder by specifying the following parameters. 12 | 13 | # INPUT PARAMETERS 14 | # image_dir = .\data_UMD\original_pics 15 | # anno_dir = .\data_UMD\Annotation 16 | # save_dir = .\data_UMD\cache 17 | # use_Color = True for color images, False for gray 18 | # patch_size = 60, you are free to give your own size 19 | # train_size = 10000, number of training images 20 | # test_size = 1000, number of testing images 21 | 22 | # OUTPUT 23 | # After running the code UMD.py, the folder structure that will be generated is as follows: 24 | # 1. Inside the data_UMD folder, a folder 'cache' will be created 25 | # 2. Inside the data_UMD folder, a folder 'color' (if use_Color=True) else 'gray' will be created 26 | # 3. Inside the 'color'/'gray' folder, two folders named 'train' and 'test' will be created 27 | # 4. Inside each of the 'train' and 'test' folders, 28 | # a 'neg' folder for negative images and a 'pos' folder for positive images will be created 29 | ########################################################################################################### 30 | 31 | NEURAL NETWORK CODE (cnn_code.py) 32 | ########################################################################################################### 33 | 34 | #Instructions to run the code cnn_code.py inside the code folder 35 | 36 | #1. Navigate to the code folder inside the Project_2 folder 37 | #2. Give the path of train_dir = '/home/kghosh/dataset/data_UMD/cache1/color/train/' 38 | # Give the path to test_dir = '/home/kghosh/dataset/data_UMD/cache1/color/test/' 39 | #3. Run the python file cnn_code.py in the terminal using the below command: 40 | # ($python cnn_code.py) 41 | #4. After the code has run and all the epochs complete, the model will be saved in 42 | # face_vs_nonface.h5 43 | 44 | 45 | 46 | ############################################################################################################# -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | 2 | 3 | # PROJECT TITLE: FACE DETECTION USING CNN aka ConvNets 4 | 5 | ## DESCRIPTION: 6 |
This repository gives budding Deep Learning enthusiasts a gentle introduction to the topic of Deep Learning.
7 |
In this repository, I list all the steps needed to get started with your first Deep Learning project.
8 |
So go ahead, fork this repo and get started with Deep Learning.
9 | 10 | ## CONTENTS: 11 | 1. Dataset download 12 | 2. Tools & Libraries 13 | 3. Code 14 | 4. Instructions to run the code 15 | 5. Future improvements 16 | 17 | ## EXPLANATIONS & STEPS: 18 | 1. Dataset download: 19 |
For this project we will be using the UMDFaces dataset, which can be downloaded from: [UMD Dataset](http://www.umdfaces.io/)
20 |
![UMD Face Dataset](https://github.com/kalyanghosh/Face-Detection-using-CNN/blob/master/umd1.jpg)
21 |
Go ahead and download the Batch 3 dataset, which contains face images of personalities and a .csv file with the annotations 22 | needed to crop the face out of each image:
23 | ![Batch 3](https://github.com/kalyanghosh/Face-Detection-using-CNN/blob/master/umd2.jpg)
24 | 25 | 1.1. Data Preprocessing Input/Output Code-UMD.py: 26 |
In the next step, we need to write code that reads the annotations from the .csv file, crops out the faces to create the 27 | positive dataset, and crops out background regions to create the negative dataset. The code should be self-sufficient and modular, so that given parameters such as "dataset path", "# of train images", "# of test images", and "color/gray", it performs all the tasks and divides the dataset into the folder structure below (a rough sketch of the cropping logic follows the folder-structure figure):
28 |
![Train/Test Folder Structure](https://github.com/kalyanghosh/Face-Detection-using-CNN/blob/master/folder.jpg)
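The actual preprocessing logic lives in UMD.py (not reproduced in this dump). The snippet below is only a minimal sketch of the idea; the annotation column names (`FILE`, `FACE_X`, `FACE_Y`, `FACE_WIDTH`, `FACE_HEIGHT`) and the background-crop strategy are assumptions for illustration, so check the header of umdfaces_batch3_ultraface.csv before relying on them.

```python
# Illustrative sketch only -- the real implementation is UMD.py.
# Column names are assumed; verify them against umdfaces_batch3_ultraface.csv.
import os
import cv2
import pandas as pd

def make_patches(image_dir, anno_csv, save_dir, patch_size=60):
    os.makedirs(os.path.join(save_dir, 'pos'), exist_ok=True)
    os.makedirs(os.path.join(save_dir, 'neg'), exist_ok=True)
    df = pd.read_csv(anno_csv)
    for _, row in df.iterrows():
        img = cv2.imread(os.path.join(image_dir, row['FILE']))
        if img is None:
            continue
        x, y = max(int(row['FACE_X']), 0), max(int(row['FACE_Y']), 0)
        w, h = int(row['FACE_WIDTH']), int(row['FACE_HEIGHT'])
        name = os.path.basename(row['FILE'])
        # Positive patch: the annotated face box, resized to patch_size x patch_size
        if w > 0 and h > 0:
            face = cv2.resize(img[y:y + h, x:x + w], (patch_size, patch_size))
            cv2.imwrite(os.path.join(save_dir, 'pos', name), face)
        # Negative patch: a background crop that cannot overlap the face box
        if x > patch_size and y > patch_size:
            cv2.imwrite(os.path.join(save_dir, 'neg', name), img[:patch_size, :patch_size])
```

Splitting the resulting `pos`/`neg` patches between `train` and `test` folders then yields the structure shown above.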
29 | 30 | 2. Tools & Libraries: 31 |
2.1 In this project we will be using the Keras deep learning library, running on top of the TensorFlow backend.
![Keras & Tensorflow](https://github.com/kalyanghosh/Face-Detection-using-CNN/blob/master/keras-tensorflow-logo.jpg)
33 |
Instructions on how to install Keras & TensorFlow on an Ubuntu machine are available online.
34 | 2.2 The code editors we will be using are Anaconda with OpenCV,Numpy,Scipy support. 35 | 36 | 3. Code-CNN_code.py: 37 |
The Python file cnn_code.py is the main script; it encapsulates the CNN architecture used for this project.
38 |
The steps performed by the code are as follows:
39 |
3.1: In this code, I have used a simple CNN architecture, shown below (followed by a short Keras sketch):
40 |
2D CONVOLUTION LAYER->2D MAX POOLING->2D CONVOLUTION LAYER->2D MAX POOLING->2D CONVOLUTION LAYER->2D MAX POOLING->2D CONVOLUTION LAYER->2D MAX POOLING->FULLY CONNECTED->FULLY CONNECTED
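For reference, a minimal Keras sketch of this stack; the layer widths and the 60x60x3 input size are taken from cnn_code.py further down in this repo:

```python
from keras import layers, models

model = models.Sequential()
model.add(layers.Conv2D(32, (3, 3), activation='relu', input_shape=(60, 60, 3)))
model.add(layers.MaxPooling2D((2, 2)))
model.add(layers.Conv2D(64, (3, 3), activation='relu'))
model.add(layers.MaxPooling2D((2, 2)))
model.add(layers.Conv2D(128, (3, 3), activation='relu'))
model.add(layers.MaxPooling2D((2, 2)))
model.add(layers.Conv2D(128, (3, 3), activation='relu'))
model.add(layers.MaxPooling2D((2, 2)))
model.add(layers.Flatten())
model.add(layers.Dense(512, activation='relu'))   # fully connected
model.add(layers.Dense(1, activation='sigmoid'))  # fully connected: face vs. non-face
```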
41 |
3.2: In this code, I have used Binary Cross-Entropy as the loss function and RMSProp as the gradient descent (optimization) algorithm.
42 |
3.3 The hyperparameters used are as follows (a sketch of the compile/fit call with these values follows the list):
43 |
LEARNING RATE =1e-4
44 |
STEPS PER EPOCH =100
45 |
EPOCHS =30
46 |
VALIDATION STEPS =50
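Continuing from the model sketch in 3.1, here is a sketch of the compile/fit step with the values listed above; the directory paths and generator settings mirror cnn_code.py (note that inside its hyperparameter-search loop the script itself trains each trial for fewer epochs):

```python
from keras import optimizers
from keras.preprocessing.image import ImageDataGenerator

train_dir = '/home/kghosh/dataset/data_UMD/cache1/color/train/'
test_dir = '/home/kghosh/dataset/data_UMD/cache1/color/test/'

model.compile(loss='binary_crossentropy',
              optimizer=optimizers.RMSprop(lr=1e-4),  # LEARNING RATE = 1e-4
              metrics=['acc'])

# Read the 60x60 face/non-face patches straight from the train/test folders
train_gen = ImageDataGenerator(rescale=1./255).flow_from_directory(
    train_dir, target_size=(60, 60), batch_size=20, class_mode='binary')
test_gen = ImageDataGenerator(rescale=1./255).flow_from_directory(
    test_dir, target_size=(60, 60), batch_size=20, class_mode='binary')

history = model.fit_generator(train_gen,
                              steps_per_epoch=100,      # STEPS PER EPOCH = 100
                              epochs=30,                # EPOCHS = 30
                              validation_data=test_gen,
                              validation_steps=50)      # VALIDATION STEPS = 50
```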
47 | 48 | 4. HYPER PARAMETER OPTIMIZATION: 49 |
To tune the hyperparameters, we run a random search over the hyperparameter space, sampling the learning rate and the regularization strength log-uniformly (10 raised to a uniformly sampled exponent), as in the sketch below.
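A sketch of how one search trial draws its candidate values, mirroring the sampling in cnn_code.py (the exponent is drawn uniformly, so the value itself is log-uniform):

```python
import numpy as np

# Draw one candidate hyperparameter pair for a random-search trial
reg = 10 ** np.random.uniform(-4, 0)   # L2 regularization strength in [1e-4, 1]
lr = 10 ** np.random.uniform(-4, -3)   # learning rate in [1e-4, 1e-3]
# Each trial then rebuilds, compiles and trains the model with (reg, lr)
# and records the validation accuracy/loss from history.history.
```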
50 |
The optimal hyperparameters found after running a coarse search followed by a fine search are listed below (a short sketch of how the best trial is read off the recorded results follows the fine-search numbers):
51 |
COARSE SEARCH:
52 |
Maximum Testing Accuracy=96.89%
53 |
Minimum Testing Loss=0.094
54 |
Value of optimum Learning Rate=4.48e-4
55 |
Value of optimum Regularization=2.27e-5
56 | 57 | 58 |
FINE SEARCH:
59 |
Maximum Testing Accuracy=97.79%
60 |
Minimum Testing Loss=0.1034
61 |
Value of optimum Learning Rate=8.29e-4
62 |
Value of optimum Regularization=3.91e-3
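A sketch of how the best trial can be read off the recorded search results; the variable names follow cnn_code.py, where test_acc and test_loss hold each trial's validation history and lr_val/reg_val hold the sampled values:

```python
import numpy as np

# Pick the trial whose best epoch reached the highest validation accuracy
best = int(np.argmax([max(trial) for trial in test_acc]))
print('best lr  =', lr_val[best])
print('best reg =', reg_val[best])
print('best acc =', max(test_acc[best]))
```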
63 | 64 |
The plots of TRAINING VS TESTING ACCURACY and TRAINING VS TESTING LOSS are shown below, followed by a sketch of the plotting code:
65 |
![TRAINING VS TESTING LOSS](https://github.com/kalyanghosh/Face-Detection-using-CNN/blob/master/1_reg_10minus6_lr_10minus4.png)
66 |
![TRAINING VS TESTING ACCURACY](https://github.com/kalyanghosh/Face-Detection-using-CNN/blob/master/2_reg_10minus6_lr_10power4.png)
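These plots can be reproduced from the Keras History object returned by fit_generator; the sketch below follows the (commented-out) plotting block in cnn_code.py:

```python
import matplotlib.pyplot as plt

acc, val_acc = history.history['acc'], history.history['val_acc']
loss, val_loss = history.history['loss'], history.history['val_loss']
epochs = range(1, len(acc) + 1)

plt.plot(epochs, acc, 'bo', label='TRAINING ACCURACY')
plt.plot(epochs, val_acc, 'b', label='TEST ACCURACY')
plt.title('TRAINING AND TEST ACCURACY')
plt.legend()

plt.figure()
plt.plot(epochs, loss, 'bo', label='TRAINING LOSS')
plt.plot(epochs, val_loss, 'b', label='TEST LOSS')
plt.title('TRAINING AND TEST LOSS')
plt.legend()
plt.show()
```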
67 | 5. SETUP INSTRUCTIONS: 68 |
The complete setup instructions for running the code can be found in README.txt.
69 | -------------------------------------------------------------------------------- /cnn_code.py: -------------------------------------------------------------------------------- 1 | 2 | # coding: utf-8 3 | 4 | # In[7]: 5 | 6 | #Instructions to run the code cnn_code.py inside the code folder 7 | 8 | #1. Navigate to the code folder inside the Project_2 folder 9 | #2. Give the path of train_dir = '/home/kghosh/dataset/data_UMD/cache1/color/train/' 10 | # Give the path to test_dir = '/home/kghosh/dataset/data_UMD/cache1/color/test/' 11 | #3. Run the python file cnn_code.py in the terminal using the below command: 12 | # ($python cnn_code.py) 13 | #4. After the code has run and all the epochs complete, the model will be saved in 14 | # face_vs_nonface.h5 15 | 16 | 17 | 18 | 19 | 20 | 21 | #*******************************************# 22 | #Importing the libraries 23 | import numpy as np 24 | from keras import layers 25 | from keras import models 26 | from keras import regularizers 27 | from keras import optimizers 28 | from keras.preprocessing.image import ImageDataGenerator 29 | import matplotlib.pyplot as plt 30 | 31 | train_dir='/home/kghosh/dataset/data_UMD/cache1/color/train/' 32 | test_dir='/home/kghosh/dataset/data_UMD/cache1/color/test/' 33 | #*******************************************# 34 | 35 | 36 | max_count=100 37 | reg_val=[] 38 | lr_val=[] 39 | test_loss=[] 40 | test_acc=[] 41 | 42 | for i in range(max_count): 43 | 44 | print ("*"*30) 45 | print (str(i+1)+"/"+str(max_count)) 46 | print ("*"*30) 47 | # Sampling the learning rate and regularization strength log-uniformly 48 | 49 | reg=10**(np.random.uniform(-4,0)) 50 | lr=10**(np.random.uniform(-4,-3)) 51 | 52 | 53 | 54 | #*******************************************# 55 | #Defining the architecture 56 | 57 | model=models.Sequential() 58 | 59 | model.add(layers.Conv2D(32,(3,3),activation='relu',input_shape=(60,60,3))) 60 | 61 | model.add(layers.MaxPooling2D((2,2))) 62 | 63 | model.add(layers.Conv2D(64,(3,3),activation='relu')) 64 | 65 | model.add(layers.MaxPooling2D((2,2))) 66 | 67 | model.add(layers.Conv2D(128,(3,3),activation='relu')) 68 | 69 | model.add(layers.MaxPooling2D((2,2))) 70 | 71 | model.add(layers.Conv2D(128,(3,3),activation='relu')) 72 | 73 | model.add(layers.MaxPooling2D((2,2))) 74 | 75 | model.add(layers.Flatten()) 76 | 77 | model.add(layers.Dense(512,activation='relu',kernel_regularizer=regularizers.l2(reg))) 78 | 79 | model.add(layers.Dense(1,activation='sigmoid',kernel_regularizer=regularizers.l2(reg))) 80 | 81 | #**********************************************# 82 | # Summarizing the model 83 | 84 | #model.summary() 85 | 86 | #**********************************************# 87 | # Configuring the model for training 88 | 89 | 90 | 91 | model.compile(loss='binary_crossentropy', 92 | optimizer=optimizers.RMSprop(lr=lr), 93 | metrics=['acc']) 94 | 95 | #***********************************************# 96 | # Using the ImageDataGenerator class to read the..
97 | # images from the directories 98 | 99 | 100 | 101 | #Rescale all the images by 1/255 102 | train_datagen=ImageDataGenerator(rescale=1./255) 103 | test_datagen=ImageDataGenerator(rescale=1./255) 104 | 105 | train_generator=train_datagen.flow_from_directory( 106 | train_dir, 107 | target_size=(60,60), 108 | batch_size=20, 109 | class_mode='binary') 110 | test_generator=test_datagen.flow_from_directory( 111 | test_dir, 112 | target_size=(60,60), 113 | batch_size=20, 114 | class_mode='binary' 115 | ) 116 | #Fit the model using batch generator 117 | history=model.fit_generator( 118 | train_generator, 119 | steps_per_epoch=100, 120 | epochs=5, 121 | validation_data=test_generator, 122 | validation_steps=50) 123 | 124 | reg_val.append(reg) 125 | lr_val.append(lr) 126 | test_loss.append(history.history['val_loss']) 127 | test_acc.append(history.history['val_acc']) 128 | 129 | #Save the model 130 | #model.save('face_vs_nonface.h5') 131 | 132 | #Plotting accuracy and loss 133 | ''' 134 | acc=history.history['acc'] 135 | test_acc=history.history['val_acc'] 136 | loss=history.history['loss'] 137 | test_loss=history.history['val_loss'] 138 | epochs=range(1,len(acc)+1) 139 | 140 | plt.plot(epochs,acc,'bo',label='TRAINING ACCURACY') 141 | plt.plot(epochs,test_acc,'b',label='TEST ACCURACY') 142 | plt.title('TRAINING AND TEST ACCURACY') 143 | plt.xlabel('Epochs') 144 | plt.ylabel('Accuracy') 145 | plt.legend() 146 | 147 | plt.figure() 148 | 149 | plt.plot(epochs,loss,'bo',label='TRAINING LOSS') 150 | plt.plot(epochs,test_loss,'b',label='TEST LOSS') 151 | plt.title('TRAINING AND TESTING LOSS') 152 | plt.xlabel('Epochs') 153 | plt.ylabel('Loss') 154 | plt.legend() 155 | 156 | plt.show() 157 | ''' 158 | 159 | print ("*"*30) 160 | print ("Finding the highest Test Accuracy and lowest Test Loss...") 161 | 162 | index1=0 163 | index2=0 164 | max_test_acc=max(test_acc[0]) 165 | min_test_loss=min(test_loss[0]) 166 | for i in range(max_count): 167 | temp1=max(test_acc[i]) 168 | if(temp1>=max_test_acc): 169 | max_test_acc=temp1 170 | index1=i 171 | temp2=min(test_loss[i]) 172 | if(temp2
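# NOTE: the dump appears to be cut off here, mid-way through the final comparison.
# A plausible completion of the selection loop (an assumption, not the original code)
# would mirror the accuracy branch above:
#
#         if(temp2<=min_test_loss):
#             min_test_loss=temp2
#             index2=i
#
# print ("Best test accuracy = "+str(max_test_acc)+" with lr = "+str(lr_val[index1])+", reg = "+str(reg_val[index1]))
# print ("Lowest test loss = "+str(min_test_loss)+" with lr = "+str(lr_val[index2])+", reg = "+str(reg_val[index2]))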