├── README.md
├── data_extraction
    ├── pickle_kitti_dataset.py
    ├── pickle_nyu_dataset.py
    └── save_to_file_nyu.m
├── depth_estimate.PNG
├── depth_estimation_nunet.py
├── inference_timer.py
├── kitti.gif
├── models
    ├── losses.py
    └── models.py
├── prediction_comparison.py
├── requirements.txt
└── utils
    ├── augmented_data_generator.py
    ├── deep_utils.py
    ├── fill_depth_colorization.py
    ├── image_utils.py
    ├── images_to_video.py
    ├── rgb2depth.py
    ├── rgb2depth_stream.py
    └── stack_videos.py


/README.md:
--------------------------------------------------------------------------------
  1 | # depth-estimation
  2 | Practical Depth Estimation with Image Segmentation and Serial U-Nets
  3 | 
  4 | ![Depth Estimate](depth_estimate.PNG)
  5 | 
  6 | ![Car Depth Estimate](kitti.gif)
  7 | 
  8 | **Depth Estimates on KITTI Validation Data**
  9 | 
 10 | ```
 11 | depth-estimation
 12 | |   depth_estimation_nunet.py <--- main file
 13 | |   depth_estimate.PNG
 14 | |   inference_timer.py
 15 | |   kitti.gif
 16 | |   prediction_comparison.py
 17 | |   README.md
 18 | |   requirements.txt
 19 | |
 20 | +---data_extraction
 21 | |       pickle_kitti_dataset.py
 22 | |       pickle_nyu_dataset.py
 23 | |       save_to_file_nyu.m
 24 | |
 25 | +---models
 26 | |       losses.py
 27 | |       models.py
 28 | |
 29 | \---utils
 30 |         augmented_data_generator.py
 31 |         deep_utils.py
 32 |         fill_depth_colorization.py
 33 |         image_utils.py
 34 |         images_to_video.py
 35 |         rgb2depth.py
 36 |         rgb2depth_stream.py
 37 |         stack_videos.py
 38 | 
 39 | ```
 40 | 
 41 | ### Initial Setup
 42 | ```
 43 | git clone https://github.com/mech0ctopus/depth-estimation.git
 44 | cd depth-estimation
 45 | pip install -r requirements.txt
 46 | ```
 47 | 
 48 | ### Use Pre-Trained Network on Webcam
 49 | 1. Download & extract pre-trained weights from link below. Place in depth-estimation folder.
 50 | 2. Run rgb2depth_stream.
 51 | ```
 52 | cd depth-estimation
 53 | python utils\rgb2depth_stream.py
 54 | ```
 55 | 
 56 | ### Use Pre-Trained Network on RGB Video
 57 | 1. Download & extract pre-trained weights from link below. Place in depth-estimation folder.
 58 | 2. Run video_depth_writer.
 59 | ```
 60 | cd depth-estimation
 61 | python utils\video_depth_writer.py
 62 | ```
 63 | 
 64 | ###  Train Depth Estimation Network
 65 | 1. Download NYU Depth V2 or KITTI images from link below
 66 | 2. (Optional, for NYU Depth V2) Colorize depth images
 67 | ```
 68 | python utils\fill_depth_colorization.py
 69 | ```
 70 | 3. Update training & validation folderpaths
 71 | 4. Verify input shapes are correct (NYU: 480x640, Re-sized KITTI: 192x640), then start training
 72 | ```
 73 | python depth_estimation_nunet.py
 74 | ```
 75 | 5. View Results in Tensorboard.
 76 | ```
 77 | cd depth-estimation
 78 | tensorboard --logdir logs
 79 | ```
 80 | 
 81 | ### Pre-trained Weights
 82 | - [Download Pre-trained Weights (NYU Depth V2, ResNet34 Backbones, 480x640 Images)](https://mega.nz/#!y9E1lC7S!UATGE-izPvmzfm_bWeGTkPb9tmoAS8pP4P72iyTQ2pQ)
 83 | 
 84 | - [Download Pre-trained Weights (KITTI, ResNet50 Backbones, 192x640 Images)](https://mega.nz/file/L8kHRZSQ#sbZyujgm9CUJL1vdw9D4L6JtTLfS7IzoLtT7mDzI63I)
 85 | 
 86 | ### Download Pre-processed KITTI Dataset
 87 | [Download Pre-processed KITTI RGB and Depth Images (Re-sized and colorized) Training Images (5.5GB)](https://mega.nz/file/O1sn3TQQ#fbXlhG5T8Ad30CTtfwvKyKfgDyH3Aa2tq_fSoYhTA0U)
 88 | 
 89 | **Note:** Raw image data is from the [KITTI Raw Dataset (synced and rectified)](http://www.cvlibs.net/datasets/kitti/raw_data.php) and the [KITTI Depth Prediction Dataset (annotated depth maps)](http://www.cvlibs.net/datasets/kitti/eval_depth.php?benchmark=depth_prediction).
 90 | 
 91 | ### Datasets
 92 | - [FieldSAFE](https://vision.eng.au.dk/fieldsafe/)
 93 | - [KITTI](http://www.cvlibs.net/datasets/kitti/eval_depth.php?benchmark=depth_prediction)
 94 | - [NYU Depth Dataset V2](https://cs.nyu.edu/~silberman/datasets/nyu_depth_v2.html)
 95 | 
 96 | ### Citation
 97 | ```
 98 | @conference{vehits20,
 99 | author={Kyle J. Cantrell. and Craig D. Miller. and Carlos W. Morato.},
100 | title={Practical Depth Estimation with Image Segmentation and Serial U-Nets},
101 | booktitle={Proceedings of the 6th International Conference on Vehicle Technology and Intelligent Transport Systems - Volume 1: VEHITS,},
102 | year={2020},
103 | pages={406-414},
104 | publisher={SciTePress},
105 | organization={INSTICC},
106 | doi={10.5220/0009781804060414},
107 | isbn={978-989-758-419-0},
108 | }
109 | ```


--------------------------------------------------------------------------------
/data_extraction/pickle_kitti_dataset.py:
--------------------------------------------------------------------------------
  1 | # -*- coding: utf-8 -*-
  2 | """
  3 | Reads and pickles KITTI dataset into multiple files.
  4 | 
  5 | Expects dataset structured as follows:
  6 |     dataset
  7 |         X_rgb
  8 |             2011_09_26_drive_0002_sync (default KITTI subtree)
  9 |             2011_09_26_drive_0009_sync
 10 |             ...
 11 |         y_depth
 12 |             2011_09_26_drive_0002_sync
 13 |             2011_09_26_drive_0009_sync
 14 |             ...
 15 | 
 16 | Usage:
 17 | pickle_dataset(dataset,output_folderpath)
 18 | 
 19 | """
 20 | import numpy as np
 21 | from glob import glob
 22 | from utils.image_utils import depth_read, rgb_read
 23 | import pickle
 24 | from math import ceil
 25 | 
 26 | def append_folderpath(folderpath):
 27 |     '''Adds '\\' to folderpath end if needed'''
 28 |     if folderpath.endswith('\\')==False:
 29 |         folderpath=str(folderpath)+ '\\'
 30 |         
 31 |     return folderpath
 32 |         
 33 | def get_X_y_paths(data_folderpath,subfolder):
 34 |     '''Builds X & y subfolderpaths.'''
 35 |     #Append folder paths if necessary
 36 |     data_folderpath=append_folderpath(data_folderpath)
 37 |     subfolder=append_folderpath(subfolder)
 38 |     #Establish X and y subfolder paths
 39 |     X_rgb_subpath=data_folderpath+'X_rgb'+'\\'+subfolder
 40 |     y_depth_subpath=data_folderpath+'y_depth'+'\\'+subfolder
 41 |     
 42 |     return X_rgb_subpath, y_depth_subpath
 43 | 
 44 | def get_depth_paths(y_depth_subpath):
 45 |     '''Build lists of filepaths for left & right image depths .'''
 46 |     y_depth_subpath=append_folderpath(y_depth_subpath)
 47 |     #Point to correct location
 48 |     left_depth=y_depth_subpath+'proj_depth\groundtruth\image_02\\'
 49 |     right_depth=y_depth_subpath+'proj_depth\groundtruth\image_03\\' 
 50 |     #Get all image filenames
 51 |     left_depth_paths=glob(left_depth+'*.PNG')           
 52 |     right_depth_paths=glob(right_depth+'*.PNG')
 53 |     
 54 |     return left_depth_paths, right_depth_paths
 55 |     
 56 | def pickle_depth_images(subfolder,depth_paths,output_folderpath,max_array_len=200):
 57 |     '''Generates pickle file of y_depth data'''
 58 |     #Read depth images and update np.array
 59 |     num_images=len(depth_paths)
 60 |     y=np.zeros((num_images,375,1242),dtype=np.uint8)
 61 |     for idx, depth_path in enumerate(depth_paths):
 62 |         y[idx]=depth_read(depth_path)
 63 |     
 64 |     #Split data into smaller pickle files if necessary
 65 |     num_intervals=ceil(num_images/max_array_len)
 66 |     if num_intervals>1:
 67 |         y_splits=np.array_split(y,num_intervals)
 68 |         #Clear y variable
 69 |         y=None
 70 |         for idx, y_split in enumerate(y_splits):
 71 |             #Save to pickle file
 72 |             pickle.dump(y_split, open(output_folderpath+r"y_"+str(subfolder)+f"_{idx}.p", "wb"), protocol=4)
 73 |             #Clear y_split variable
 74 |         y_splits=None
 75 |     else:
 76 |         #Save to pickle file
 77 |         pickle.dump(y, open(output_folderpath+r"y_"+str(subfolder)+".p", "wb"), protocol=4)
 78 |         #Clear y variable
 79 |         y=None
 80 |     
 81 | def get_rgb_paths(X_rgb_subpath,left_depth_paths, right_depth_paths):
 82 |     '''Create list of RGB paths corresponding to input depth paths'''
 83 |     #Point to correct location
 84 |     left_rgb=X_rgb_subpath+'image_02\data\\'
 85 |     right_rgb=X_rgb_subpath+'image_03\data\\'
 86 |     #Build list of image names in left and right depth paths
 87 |     left_depth_image_names=[filepath.split('\\')[-1] for filepath in left_depth_paths]
 88 |     right_depth_image_names=[filepath.split('\\')[-1] for filepath in right_depth_paths]
 89 |     #Build list of left and right RGB paths corrseponding to depth images
 90 |     left_rgb_paths,right_rgb_paths=[],[]
 91 |     for left_depth_image_name in left_depth_image_names:
 92 |         left_rgb_paths.append(left_rgb+left_depth_image_name)
 93 |     for right_depth_image_name in right_depth_image_names:
 94 |         right_rgb_paths.append(right_rgb+right_depth_image_name)    
 95 |     rgb_paths=left_rgb_paths+right_rgb_paths
 96 |     
 97 |     return rgb_paths
 98 |  
 99 | def pickle_rgb_images(subfolder,rgb_paths,output_folderpath,max_array_len=200):
100 |     '''Generates pickle file of X_rgb data'''
101 |     #Read RGB images and update np.array
102 |     num_images=len(rgb_paths)
103 |     X=np.zeros((num_images,375,1242,3),dtype=np.uint8)
104 |     for idx, rgb_path in enumerate(rgb_paths):
105 |         X[idx]=rgb_read(rgb_path)
106 |         
107 |     #Split data into smaller pickle files if necessary
108 |     num_intervals=ceil(num_images/max_array_len)
109 |     if num_intervals>1:
110 |         X_splits=np.array_split(X,num_intervals)
111 |         #Clear X variable
112 |         X=None
113 |         for idx, X_split in enumerate(X_splits):
114 |             #Save to pickle file
115 |             pickle.dump(X_split, open(output_folderpath+r"X_"+str(subfolder)+f"_{idx}.p", "wb"), protocol=4)
116 |             #Clear X_split variable
117 |         X_splits=None
118 |     else:
119 |         #Save to pickle file
120 |         pickle.dump(X, open(output_folderpath+r"X_"+str(subfolder)+".p", "wb"), protocol=4)
121 |         #Clear X variable
122 |         X=None
123 |         
def pickle_folder(data_folderpath,subfolder,output_folderpath):
    """Pickle the depth (y) and matching RGB (X) images of one KITTI subfolder.

    Depth images are located first; the RGB list is then derived from the
    depth file names so both pickles cover the same frames, left camera
    first and right camera second.
    """
    rgb_root, depth_root = get_X_y_paths(data_folderpath, subfolder)
    left_paths, right_paths = get_depth_paths(depth_root)

    # y data: every depth image found for this drive
    pickle_depth_images(subfolder, left_paths + right_paths, output_folderpath)

    # X data: RGB frames corresponding to those depth images
    pickle_rgb_images(
        subfolder,
        get_rgb_paths(rgb_root, left_paths, right_paths),
        output_folderpath,
    )
138 | 
def pickle_dataset(data_folderpath,output_folderpath):
    """Pickle every subfolder found under <data_folderpath>y_depth.

    Subfolder names are taken from the glob matches of 'y_depth\\*\\' and each
    one is handed to pickle_folder in turn.
    """
    output_folderpath = append_folderpath(output_folderpath)
    data_folderpath = append_folderpath(data_folderpath)

    # Each match ends with a backslash, so the folder name is the
    # second-to-last component after splitting.
    matches = glob(data_folderpath + 'y_depth' + '\\*\\')
    names = [match.split('\\')[-2] for match in matches]

    for name in names:
        print(f'Pickling {name}')
        pickle_folder(data_folderpath, name, output_folderpath)
152 |     
if __name__ == '__main__':
    # Example run: pickle the validation sandbox into the validation output folder.
    dataset, output_folderpath = (
        r"G:\Documents\KITTI\sandbox_val",
        r"G:\Documents\KITTI\pickled_KITTI\validation",
    )
    pickle_dataset(dataset, output_folderpath)


--------------------------------------------------------------------------------
/data_extraction/pickle_nyu_dataset.py:
--------------------------------------------------------------------------------
 1 | # -*- coding: utf-8 -*-
 2 | """
 3 | Pickles thin NYU Depth dataset
 4 | """
 5 | import numpy as np
 6 | from glob import glob
 7 | from PIL import Image
 8 | import pickle
 9 | from utils.image_utils import depth_read
10 | 
def generate_pickle_files(X,y):
    """Pickle X to 'X.p' and y to 'y.p' in the current working directory.

    Args:
        X: Object to store in 'X.p'.
        y: Object to store in 'y.p'.

    Both files use pickle protocol 4 and are closed before returning.
    """
    for filename, data in ((r"X.p", X), (r"y.p", y)):
        with open(filename, "wb") as pickle_file:
            pickle.dump(data, pickle_file, protocol=4)
15 | 
def load_pickle_files(X_file, y_file):
    """Load and return the objects stored in two pickle files.

    Args:
        X_file: Path of the pickle file holding X.
        y_file: Path of the pickle file holding y.

    Returns:
        Tuple (X, y) of the unpickled objects.
    """
    # SECURITY: pickle.load can execute arbitrary code; only use this on
    # files produced by a trusted source.
    with open(X_file, 'rb') as X_handle:
        X = pickle.load(X_handle)
    with open(y_file, 'rb') as y_handle:
        y = pickle.load(y_handle)
    return X, y
21 | 
def read_data(data_folderpath,output_folderpath,num_intervals=35,
              num_images=7392,image_shape=(480,640)):
    """Read an RGB/depth PNG dataset and pickle it in num_intervals chunks.

    Expects '<data_folderpath>X_rgb' and '<data_folderpath>y_depth' to hold
    '*.png' files. Files are paired by position after sorting both lists on
    the integer formed by all digits in each path.

    Args:
        data_folderpath: Dataset root; a trailing backslash is added if missing.
        output_folderpath: Destination folder; a trailing backslash is added
            if missing.
        num_intervals: Number of chunks (and X_/y_ pickle file pairs) written.
        num_images: Number of slots allocated in the X and y arrays. Slots
            beyond the number of files found stay zero-filled; more files
            than slots raises IndexError.
        image_shape: (height, width) of every image; images are assumed to
            be already resized to this shape.

    Writes 'y_<idx>.p' and 'X_<idx>.p' into output_folderpath.
    """
    print('Initializing Matrices')
    height, width = image_shape
    X = np.zeros((num_images, height, width, 3), dtype=np.uint8)
    y = np.zeros((num_images, height, width), dtype=np.uint8)

    #Append folderpaths if needed
    if not data_folderpath.endswith('\\'):
        data_folderpath = str(data_folderpath) + '\\'
    if not output_folderpath.endswith('\\'):
        output_folderpath = str(output_folderpath) + '\\'
    X_folderpath = data_folderpath + 'X_rgb\\'
    y_folderpath = data_folderpath + 'y_depth\\'

    def _digits_key(path):
        # NOTE(review): digits anywhere in the path take part in the key;
        # this orders files correctly only when the folder part is identical
        # for all of them.
        return int(''.join(filter(str.isdigit, path)))

    #Build sorted lists of filenames
    X_filelist = sorted(glob(X_folderpath + '*.png'), key=_digits_key)
    y_filelist = sorted(glob(y_folderpath + '*.png'), key=_digits_key)

    for idx, rgb_path in enumerate(X_filelist):
        print(f'Reading file #{idx}')
        # Context manager closes the image even if the array copy fails
        with Image.open(rgb_path) as rgb_image:
            X[idx] = np.array(rgb_image)
        y[idx] = depth_read(y_filelist[idx])

    print('Splitting Data')
    y_splits = np.array_split(y, num_intervals)
    X_splits = np.array_split(X, num_intervals)

    print('Pickling')
    for idx, (y_split, X_split) in enumerate(zip(y_splits, X_splits)):
        with open(output_folderpath + f"y_{idx}.p", "wb") as y_file:
            pickle.dump(y_split, y_file, protocol=4)
        with open(output_folderpath + f"X_{idx}.p", "wb") as X_file:
            pickle.dump(X_split, X_file, protocol=4)
74 |     
if __name__ == '__main__':
    # Example run: pickle the colorized NYU images from the author's local folders.
    dataset, output_folderpath = (
        r"E:\NYU\nyud_raw_data\nyuv2-python-toolbox-master\colorized",
        r"G:\Documents\NYU Depth Dataset\nyu_data\pickled_colorized",
    )
    read_data(dataset, output_folderpath)


--------------------------------------------------------------------------------
/data_extraction/save_to_file_nyu.m:
--------------------------------------------------------------------------------
 1 | %Saves RGB and depth images from nyu_depth_v2_labeled.mat to PNG files
 2 | %Assumes depths and images variables have been loaded
 3 | 
 4 | size_rgb_images=size(images);
 5 | num_rgb_images=size_rgb_images(4);
 6 | 
 7 | for i=1:num_rgb_images
 8 |     disp(strcat(num2str(i),'/',num2str(num_rgb_images)));
 9 |     rgb_filename=strcat('nyu_data/X_rgb/rgb_',num2str(i),'.png');
10 |     imwrite(uint8(images(:,:,:,i)),rgb_filename);
11 |     
12 |     d_filename=strcat('nyu_data/y_depth/d_',num2str(i),'.png');
13 |     imwrite(mat2gray(depths(:,:,i)),d_filename);
14 | end


--------------------------------------------------------------------------------
/depth_estimate.PNG:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mech0ctopus/depth-estimation/89d0a3f2efcb16a85530694b476d9868b374a5e8/depth_estimate.PNG


--------------------------------------------------------------------------------
/depth_estimation_nunet.py:
--------------------------------------------------------------------------------
  1 | # Kyle J. Cantrell & Craig D. Miller
  2 | # kjcantrell@wpi.edu & cdmiller@wpi.edu
  3 | # Deep Learning for Advanced Robot Perception
  4 | #
  5 | # Depth Estimation from RGB Images
  6 | 
  7 | import numpy as np
  8 | from glob import glob
  9 | from utils import deep_utils
 10 | from utils.image_utils import depth_read, rgb_read, depth_read_kitti
 11 | from models import models
 12 | from tensorflow.keras.callbacks import TensorBoard, ModelCheckpoint
 13 | from tensorflow.keras.optimizers import Adam
 14 | import datetime
 15 | from tensorflow.compat.v1 import ConfigProto
 16 | from tensorflow.compat.v1 import InteractiveSession
 17 | import segmentation_models
 18 | 
 19 | config = ConfigProto()
 20 | config.gpu_options.per_process_gpu_memory_fraction = 0.9
 21 | config.gpu_options.allow_growth = True
 22 | session = InteractiveSession(config=config)
 23 | 
 24 | def _batchGenerator(X_filelist,y_filelist,batchSize):
 25 |     """
 26 |     Yield X and Y data when the batch is filled.
 27 |     """
 28 |     #Sort filelists to confirm they are same order
 29 |     X_filelist.sort(key=lambda f: int(''.join(filter(str.isdigit, f))))
 30 |     y_filelist.sort(key=lambda f: int(''.join(filter(str.isdigit, f))))
 31 |     #Shuffle order of filenames
 32 |     X_filelist,y_filelist=deep_utils.simul_shuffle(X_filelist,y_filelist)
 33 | 
 34 |     while True:
 35 |         idx=0
 36 |         
 37 |         while idx<len(X_filelist):
 38 |             X_train=np.zeros((batchSize,192,640,3),dtype=np.uint8)
 39 |             y_train=np.zeros((batchSize,192,640),dtype=np.uint8)
 40 |             
 41 |             for i in range(batchSize):
 42 |                 #Load images
 43 |                 X_train[i]=rgb_read(X_filelist[idx+i])
 44 |                 #y_train[i]=depth_read(y_filelist[idx+i])
 45 |                 y_train[i]=depth_read_kitti(y_filelist[idx+i])
 46 |                 
 47 |             #Reshape [samples][width][height][pixels]
 48 |             X_train = X_train.reshape(X_train.shape[0], X_train.shape[1], 
 49 |                                       X_train.shape[2], X_train.shape[3]).astype(np.uint8)
 50 | 
 51 |             y_train = y_train.reshape((y_train.shape[0],1,-1)).astype(np.uint8)
 52 |             y_train = y_train.squeeze()
 53 |                  
 54 |             # normalize inputs and outputs from 0-255 to 0-1
 55 |             X_train=np.divide(X_train,255).astype(np.float16)   
 56 |             y_train=np.divide(y_train,255).astype(np.float16)
 57 |             
 58 |             if (idx % 1024)==0:
 59 |                 print(str(idx)+'/'+str(len(X_filelist)))
 60 |                 
 61 |             idx+=batchSize
 62 |             
 63 |             yield X_train, y_train
 64 |             
 65 | def _valBatchGenerator(X_val_filelist,y_val_filelist,batchSize):
 66 |     """
 67 |     Yield X and Y data when the batch is filled.
 68 |     """
 69 |     #Sort filelists to confirm they are same order
 70 |     X_val_filelist.sort(key=lambda f: int(''.join(filter(str.isdigit, f))))
 71 |     y_val_filelist.sort(key=lambda f: int(''.join(filter(str.isdigit, f))))
 72 |     #Shuffle order of filenames
 73 |     X_val_filelist,y_val_filelist=deep_utils.simul_shuffle(X_val_filelist,y_val_filelist)
 74 | 
 75 |     while True:
 76 |         idx=0
 77 |         
 78 |         while idx<len(X_val_filelist):
 79 |             X_val=np.zeros((batchSize,192,640,3),dtype=np.uint8)
 80 |             y_val=np.zeros((batchSize,192,640),dtype=np.uint8)
 81 |             
 82 |             for i in range(batchSize):
 83 |                 #Load images
 84 |                 X_val[i]=rgb_read(X_val_filelist[idx+i])
 85 |                 #y_val[i]=depth_read(y_val_filelist[idx+i])
 86 |                 y_val[i]=depth_read_kitti(y_val_filelist[idx+i])
 87 |     
 88 |             #Reshape [samples][width][height][pixels]
 89 |             X_val = X_val.reshape(X_val.shape[0], X_val.shape[1], 
 90 |                                   X_val.shape[2], X_val.shape[3]).astype(np.uint8)
 91 | 
 92 |             y_val = y_val.reshape((y_val.shape[0],1,-1)).astype(np.uint8)
 93 |             y_val = y_val.squeeze()
 94 |                  
 95 |             # normalize inputs and outputs from 0-255 to 0-1
 96 |             X_val=np.divide(X_val,255).astype(np.float16)   
 97 |             y_val=np.divide(y_val,255).astype(np.float16)
 98 |             
 99 |             if (idx % 1024)==0:
100 |                 print(str(idx)+'/'+str(len(X_val_filelist)))
101 |                 
102 |             idx+=batchSize
103 |             
104 |             yield X_val, y_val
105 |             
def main(model_name, model=models.wnet_connected,num_epochs=5,batch_size=2):
    '''Trains depth estimation model.

    Args:
        model_name: Label used in the checkpoint file name and the
            TensorBoard log folder.
        model: Zero-argument callable that returns an uncompiled Keras model.
        num_epochs: Number of training epochs.
        batch_size: Number of images per training/validation batch.

    Returns:
        The trained model. The weights with the lowest validation loss are
        also written to "<model_name>_weights_best.hdf5".
    '''

    segmentation_models.set_framework('tf.keras')
    print(segmentation_models.framework())

    #Build list of training filenames
    X_folderpath=r"G:\Documents\KITTI\data\train\X\\"
    y_folderpath=r"G:\Documents\KITTI\data\train\y\\"
    X_filelist=glob(X_folderpath+'*.png')
    y_filelist=glob(y_folderpath+'*.png')

    #Build list of validation filenames
    X_val_folderpath=r"G:\Documents\KITTI\data\val\X\\"
    y_val_folderpath=r"G:\Documents\KITTI\data\val\y\\"
    X_val_filelist=glob(X_val_folderpath+'*.png')
    y_val_filelist=glob(y_val_folderpath+'*.png')

    model=model()
    # 'learning_rate' is the supported keyword; 'lr' is a deprecated alias
    model.compile(loss='mean_squared_error',optimizer=Adam(learning_rate=1e-4))

    #Save best model weights checkpoint
    filepath=f"{model_name}_weights_best.hdf5"
    checkpoint = ModelCheckpoint(filepath, monitor='val_loss', verbose=1,
                                 save_best_only=True, mode='min')

    #Tensorboard setup: one timestamped log folder per run
    log_dir = f"logs\\{model_name}\\" + datetime.datetime.now().strftime("%Y%m%d-%H%M%S")
    tensorboard_callback = TensorBoard(log_dir=log_dir)

    callbacks_list = [checkpoint, tensorboard_callback]

    # Step counts use floor division, so a trailing partial batch is not
    # requested within an epoch.
    model.fit_generator(_batchGenerator(X_filelist,y_filelist,batch_size),
                        epochs=num_epochs,
                        steps_per_epoch=len(X_filelist)//batch_size,
                        validation_data=_valBatchGenerator(X_val_filelist,y_val_filelist,batch_size),
                        validation_steps=len(X_val_filelist)//batch_size,
                        max_queue_size=1,
                        callbacks=callbacks_list,
                        verbose=2)

    return model
149 |     
if __name__=='__main__':
    # (model builder, display name) pairs; test_id below indexes into them
    candidates=[(models.cnn,'CNN'),
                (models.pretrained_unet_cnn,'U-Net_CNN'),
                (models.rcnn_640_480,'RCNN'),
                (models.pretrained_unet_rcnn,'U-Net_RCNN'),
                (models.pretrained_unet,'U-Net'),
                (models.wnet,'W-Net'),
                (models.wnet_connected,'W-Net_Connected')]
    training_models=[builder for builder,_ in candidates]
    model_names=[label for _,label in candidates]

    #Specify test_id argument to main()
    test_id=6

    model=main(model_name=model_names[test_id],
               model=training_models[test_id],
               num_epochs=35,
               batch_size=2)

    #Save model architecture (without weights) as YAML, then as JSON
    for serialize_type in ('yaml','json'):
        deep_utils.save_model(model,serialize_type=serialize_type,
                              model_name=f'{model_names[test_id]}_nyu_model',
                              save_weights=False)


--------------------------------------------------------------------------------
/inference_timer.py:
--------------------------------------------------------------------------------
 1 | # -*- coding: utf-8 -*-
 2 | """
 3 | Times repeated single-image inference for a model whose weights are loaded from file.
 4 | """
 5 | from timeit import default_timer as timer
 6 | from models import models
 7 | from tensorflow.keras.optimizers import Adam
 8 | from utils import image_utils
 9 | import numpy as np
10 | 
#Load weights (h5)
weights={'unet':r"G:\WPI\Courses\2019\Deep Learning for Advanced Robot Perception, RBE595\Project\VEHITS\Weights & Models\20Epochs_NoAugment_LowerLR\20200213-065621\U-Net_weights_best.hdf5",
        'wnet':r"G:\WPI\Courses\2019\Deep Learning for Advanced Robot Perception, RBE595\Project\VEHITS\Weights & Models\20Epochs_NoAugment_LowerLR\20200213-082137\W-Net_weights_best.hdf5",
        'wnet_c':r"G:\WPI\Courses\2019\Deep Learning for Advanced Robot Perception, RBE595\Project\VEHITS\Weights & Models\20Epochs_NoAugment_LowerLR\20200212-205108\W-Net_Connected_weights_best.hdf5"
         }

#Build the network and load its trained weights
model=models.pretrained_unet()
model.compile(loss='mean_squared_error',optimizer=Adam(),metrics=['mse'])
model.load_weights(weights['unet'])

#Per-inference wall-clock durations, in milliseconds
times=[]

#Read test image and shape it as a single-image batch scaled to 0-1
test_image=r"G:\WPI\Courses\2019\Deep Learning for Advanced Robot Perception, RBE595\Project\VEHITS\Graphs & Pictures\LR_0.0001\CityImages\1.jpg"
test_image=image_utils.rgb_read(test_image) #640x480
test_image=test_image.reshape(1,480,640,3)
test_image=np.divide(test_image,255)

for i in range(101):
    start_time = timer()
    y_est=model.predict(test_image)
    end_time = timer()
    #default_timer reports seconds; convert so values match the "(ms)" labels
    elapsed_ms=(end_time-start_time)*1000.0
    #The first run is excluded from the statistics (presumably warm-up cost)
    if i!=0:
        times.append(elapsed_ms)
        print(elapsed_ms)

print('Average (ms): '+str(sum(times)/len(times)))
print('Max. (ms): '+str(max(times)))
print('Min. (ms): '+str(min(times)))


--------------------------------------------------------------------------------
/kitti.gif:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mech0ctopus/depth-estimation/89d0a3f2efcb16a85530694b476d9868b374a5e8/kitti.gif


--------------------------------------------------------------------------------
/models/losses.py:
--------------------------------------------------------------------------------
 1 | # -*- coding: utf-8 -*-
 2 | """
 3 | Created on Sun Dec  1 17:46:34 2019
 4 | Loss Functions 
 5 | @author: kjcantrell99
 6 | """
 7 | import keras.backend as K
 8 | 
 9 | def sil(yTrue,yPred):
10 |     """
11 |     Scale-Invariant Loss
12 |     usage: model.compile(loss=sil,...)
13 |     """
14 |     n = 480*640
15 |     yTrue = K.cast(yTrue, yPred.dtype)
16 |     first_log = K.log(K.clip(yPred, K.epsilon(), None) + 1.)
17 |     second_log = K.log(K.clip(yTrue, K.epsilon(), None) + 1.)
18 |     di = first_log - second_log
19 |     term1 = K.sum(K.square(di))
20 |     term2 = K.square(K.sum(di))
21 |     return (1/n)*(term1) - (0.5/(n*n))*term2
22 | 
def root_mean_squared_error(yTrue, yPred):
    """
    Root-Mean Square Error Loss: sqrt of the mean squared difference
    between prediction and target, taken over all elements.
    usage: model.compile(loss=root_mean_squared_error,...)
    https://stackoverflow.com/questions/43855162/rmse-rmsle-loss-function-in-keras/43863854
    """
    residual = yPred - yTrue
    mean_square = K.mean(K.square(residual))
    return K.sqrt(mean_square)
30 | 
31 | 


--------------------------------------------------------------------------------
/models/models.py:
--------------------------------------------------------------------------------
  1 | # -*- coding: utf-8 -*-
  2 | """
  3 | Final Models.
  4 | """
  5 | from tensorflow.keras.models import Sequential, Model
  6 | from tensorflow.keras.layers import Dense
  7 | from tensorflow.keras.layers import Dropout, LSTM, Input
  8 | from tensorflow.keras.layers import Flatten, Reshape, Concatenate
  9 | from tensorflow.keras.layers import Convolution2D
 10 | from tensorflow.keras.layers import MaxPooling2D
 11 | import segmentation_models
 12 | 
 13 | # from models.losses import sil
 14 | # from models.test_loss import depth_loss_function
 15 | 
 16 | segmentation_models.set_framework('tf.keras')
 17 | 
 18 | def cnn(input_shape=(480,640,3)):
 19 | 	'''Define CNN model'''
 20 | 	model = Sequential()
 21 | 	model.add(Convolution2D(30, 5, 5, border_mode='valid',input_shape=input_shape, activation='relu'))
 22 | 	model.add(MaxPooling2D(pool_size=(2, 2)))
 23 | 	model.add(Convolution2D(15, 3, 3, activation='relu'))
 24 | 	model.add(MaxPooling2D(pool_size=(2, 2)))
 25 | 	model.add(Dropout(0.5))
 26 | 	model.add(Flatten())
 27 | 	model.add(Dense(128, activation='relu'))
 28 | 	model.add(Dropout(0.5))
 29 | 	model.add(Dense(128, activation='relu'))
 30 | 	model.add(Dropout(0.5))
 31 | 	model.add(Dense(128, activation='relu'))
 32 | 	model.add(Dropout(0.5))
 33 | 	model.add(Dense(64, activation='relu'))
 34 | 	model.add(Dropout(0.5))
 35 | 	model.add(Dense(64, activation='relu'))
 36 | 	model.add(Dropout(0.5))
 37 | 	#model.add(Flatten())	
 38 | 	model.add(Dense(480*640,activation='linear'))
 39 | 	#model.compile(loss='mean_squared_error', optimizer=Adam(),metrics=['mse','msle']) 
 40 | 	return model
 41 | 
 42 | def pretrained_unet():
 43 |     '''Define pretrained U-Net model.'''
 44 |     #Load unet with resnet34 backbone.  Freeze imagenet weights for encoder
 45 |     premodel = segmentation_models.Unet('resnet34', input_shape=(480, 640, 3), encoder_weights='imagenet',encoder_freeze = True)
 46 |     #Get final conv. output and skip sigmoid activation layer
 47 |     x=premodel.layers[-2].output 
 48 |     reshape=Reshape((307200,))(x)
 49 |     model = Model(inputs=premodel.input, outputs=reshape)
 50 |     #model.compile(loss='mean_squared_error', optimizer=Adam(),metrics=['mse','msle']) #lr=1e-5, lr=5e-3
 51 |     #model.compile(loss=depth_loss_function, optimizer=Adam(),metrics=['mse','msle'])
 52 |     return model
 53 | 
 54 | def pretrained_unet_cnn():
 55 |     '''Define pretrained U-Net with CNN model.'''
 56 |     unet_cnn=Sequential()
 57 |     #Load unet with resnet34 backbone.  Freeze imagenet weights for encoder
 58 |     premodel = segmentation_models.Unet('resnet34', input_shape=(480, 640, 3), encoder_weights='imagenet',encoder_freeze = True)
 59 |     #Get final conv. output and keep sigmoid activation layer
 60 |     premodel=Model(inputs=premodel.input,outputs=premodel.layers[-1].output)  
 61 |     unet_cnn.add(premodel)
 62 |     unet_cnn.add(cnn(input_shape=(480,640,1)))
 63 | 
 64 |     #unet_cnn.compile(loss='mean_squared_error', optimizer=Adam()) 
 65 |     return unet_cnn
 66 | 
 67 | def wnet():
 68 |     #Load unet with resnet34 backbone.
 69 |     wnet=Sequential()
 70 |     firstU = segmentation_models.Unet('resnet34', input_shape=(480, 640, 3), encoder_weights='imagenet',encoder_freeze = True)
 71 |     secondU = segmentation_models.Unet('resnet34', input_shape=(480, 640, 1), encoder_weights=None)
 72 |     #Get final conv. output and keep sigmoid activation layer
 73 |     firstU = Model(inputs=firstU.input, outputs=firstU.layers[-1].output)
 74 |     #Get final conv. output and skip sigmoid activation layer
 75 |     secondU=Model(inputs=secondU.input, outputs=secondU.layers[-2].output)
 76 | #    for layer in firstU.layers:
 77 | #        layer.trainable = False
 78 |     for layer in secondU.layers:
 79 |         layer.trainable = True
 80 |         
 81 |     wnet.add(firstU)
 82 |     wnet.add(secondU)
 83 |     wnet.add(Reshape((307200,)))
 84 |     
 85 |     # Make sure that the pre-trained firstU layers are not trainable
 86 | #    wnet.layers[0].trainable=False
 87 | #    wnet.layers[1].trainable=True
 88 | #    wnet.layers[2].trainable=True
 89 |     #wnet.compile(loss='mean_squared_error', optimizer=Adam())
 90 |     #wnet.summary()
 91 |     return wnet
 92 | 
 93 | def wnet_connected():   
 94 |     #Load unet with resnet34 backbone. (densenet201,resnet34,vgg16,resnet18,resnet152)
 95 |     firstU = segmentation_models.Unet('resnet50', input_shape=(192, 640, 3), encoder_weights='imagenet',encoder_freeze = True)
 96 |     secondU = segmentation_models.Unet('resnet50', input_shape=(192, 640, 4), encoder_weights=None)
 97 |     #Get final conv. output and keep sigmoid activation layer
 98 |     firstU = Model(inputs=firstU.input, outputs=firstU.layers[-1].output)
 99 |     #Get final conv. output and skip sigmoid activation layer
100 |     secondU=Model(inputs=secondU.input, outputs=secondU.layers[-2].output) 
101 | #    for layer in firstU.layers:
102 | #        layer.trainable = False
103 |     for layer in secondU.layers:
104 |         layer.trainable = True
105 |     
106 |     inputs = Input((192, 640, 3))
107 |     m1=firstU(inputs)
108 |     merged=Concatenate()([inputs,m1])
109 |     reshape1=Reshape((192, 640, 4))(merged)
110 |     m2=secondU(reshape1)
111 |     reshape2=Reshape((192*640,))(m2)
112 |     
113 |     wnet_c=Model(inputs=inputs,outputs=reshape2)
114 |     
115 |     # Make sure that the pre-trained firstU layers are not trainable
116 | #    for layer in wnet_c.layers:
117 | #        print(layer)
118 | #    wnet_c.layers[0].trainable=False #Input
119 | #    wnet_c.layers[1].trainable=False #First U
120 |     wnet_c.layers[2].trainable=True #Concat
121 |     wnet_c.layers[3].trainable=True #Reshape
122 |     wnet_c.layers[4].trainable=True #Second U
123 |     wnet_c.layers[5].trainable=True #Reshape
124 |     #wnet_c.compile(loss='mean_squared_error', optimizer=Adam(),metrics=['mse','msle']) #lr=1e-5, lr=0.00001
125 |     #wnet_c.summary()
126 | 
127 |     return wnet_c
128 | 
def rcnn_640_480(input_shape=(480,640,3)):
    '''RCNN (CNN first, then LSTMs) producing a flat 640*480 output.

    Two conv/max-pool/dropout stages are followed by a Flatten and a
    Reshape to (28, 38*15), which is then processed by two LSTM layers
    with Dense layers in between.  The Reshape size is hard-coded, so it
    only matches inputs whose feature map flattens to 28*38*15 values.
    The returned Sequential model is NOT compiled.
    '''
    layer_stack = [
        #Convolutional feature extractor
        Convolution2D(30, (10, 10), strides=(1,1), padding='valid',
                      input_shape=input_shape, activation='relu'),
        MaxPooling2D(pool_size=(4, 4)),
        Dropout(0.5),
        Convolution2D(15, (6, 6), activation='relu', strides=(1,1)),
        MaxPooling2D(pool_size=(4, 4)),
        Dropout(0.5),
        #Turn the feature map into a sequence of 28 steps
        Flatten(),
        Reshape((28, 38*15)),
        #Recurrent part
        LSTM(512, input_shape=(28,38*15), return_sequences=True),
        Dense(512, activation='relu'),
        LSTM(512),
        Dense(128, activation='relu'),
        #One linear output per pixel
        Dense(640*480, activation='linear'),
    ]
    rcnn = Sequential()
    for layer in layer_stack:
        rcnn.add(layer)
    return rcnn
147 | 
def pretrained_unet_rcnn():
    '''Stack a pretrained ResNet-34 U-Net in front of the rcnn_640_480 model.

    The U-Net (480x640 RGB input, ImageNet encoder weights, frozen encoder)
    keeps its final activation layer; its output is fed to rcnn_640_480()
    built for a (480, 640, 1) input.  The returned Sequential model is NOT
    compiled.
    '''
    stacked = Sequential()
    base_unet = segmentation_models.Unet(
        'resnet34',
        input_shape=(480, 640, 3),
        encoder_weights='imagenet',
        encoder_freeze=True,
    )
    #Re-wrap the U-Net up to and including its last layer
    first_stage = Model(inputs=base_unet.input, outputs=base_unet.layers[-1].output)
    stacked.add(first_stage)
    stacked.add(rcnn_640_480(input_shape=(480, 640, 1)))
    return stacked


--------------------------------------------------------------------------------
/prediction_comparison.py:
--------------------------------------------------------------------------------
 1 | # -*- coding: utf-8 -*-
 2 | """
 3 | Script for creating depth prediction images from multiple models for comparison
 4 | """
 5 | from utils import deep_utils
 6 | from utils import image_utils
 7 | import numpy as np
 8 | from os.path import basename
 9 | from models import models
10 | from tensorflow.keras.optimizers import Adam
11 | 
#Weight files (h5) for each architecture, keyed by the name used in output files
weights={'unet':r"G:\WPI\Courses\2019\Deep Learning for Advanced Robot Perception, RBE595\Project\VEHITS\Weights & Models\20Epochs_NoAugment_LowerLR\20200213-065621\U-Net_weights_best.hdf5",
        'wnet':r"G:\WPI\Courses\2019\Deep Learning for Advanced Robot Perception, RBE595\Project\VEHITS\Weights & Models\20Epochs_NoAugment_LowerLR\20200213-082137\W-Net_weights_best.hdf5",
        'wnet_c':r"G:\WPI\Courses\2019\Deep Learning for Advanced Robot Perception, RBE595\Project\VEHITS\Weights & Models\20Epochs_NoAugment_LowerLR\20200212-205108\W-Net_Connected_weights_best.hdf5"
         }

#Images to run through the selected model
images=[r"G:\WPI\Courses\2019\Deep Learning for Advanced Robot Perception, RBE595\Project\VEHITS\Graphs & Pictures\LR_0.0001\MoreCars\5.jpg"]

#Architecture under test.  model_name must be a key of `weights` and must
#match the constructor called on the next line.
model_name='wnet'
model=models.wnet()

model.compile(loss='mean_squared_error',optimizer=Adam(),metrics=['mse']) 
#Look the weights up through model_name so the label written into the output
#file names can never disagree with the weights that were actually loaded.
model.load_weights(weights[model_name])


for image_path in images:
    #Read test image
    image=image_utils.rgb_read(image_path) #640x480
    image=image.reshape(1,480,640,3)
    #Scale pixel values by 1/255 before prediction
    image=np.divide(image,255).astype(np.float16)
    image_name=basename(image_path).split('.')[0]
    #Predict depth
    y_est=model.predict(image)
    y_est=y_est.reshape((480,640))*255 #De-normalize for depth viewing
    #Save results
    image_utils.heatmap(y_est,save=True,name=f'{image_name}_{model_name}_plasma',cmap='plasma')
39 | 


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
  1 | # packages in environment at C:\Users\Craig\Anaconda3\envs\tf2_depth:
  2 | #
  3 | # Name                    Version                   Build  Channel
  4 | _tflow_select             2.1.0                       gpu  
  5 | absl-py                   0.8.1                    py37_0  
  6 | alabaster                 0.7.12                   py37_0  
  7 | argh                      0.26.2                   py37_0  
  8 | asn1crypto                1.3.0                    py37_0  
  9 | astor                     0.8.0                    py37_0  
 10 | astroid                   2.3.3                    py37_0  
 11 | atomicwrites              1.3.0                    py37_1  
 12 | attrs                     19.3.0                     py_0  
 13 | autopep8                  1.4.4                      py_0  
 14 | babel                     2.8.0                      py_0  
 15 | backcall                  0.1.0                    py37_0  
 16 | bcrypt                    3.1.7            py37he774522_0  
 17 | blas                      1.0                         mkl  
 18 | bleach                    3.1.0                    py37_0  
 19 | ca-certificates           2020.1.1                      0  
 20 | certifi                   2019.11.28               py37_0  
 21 | cffi                      1.13.2           py37h7a1dbc1_0  
 22 | chardet                   3.0.4                 py37_1003  
 23 | cloudpickle               1.2.2                      py_0  
 24 | colorama                  0.4.3                      py_0  
 25 | cryptography              2.8              py37h7a1dbc1_0  
 26 | cudatoolkit               10.0.130                      0  
 27 | cudnn                     7.6.5                cuda10.0_0  
 28 | cycler                    0.10.0                   py37_0  
 29 | decorator                 4.4.1                      py_0  
 30 | defusedxml                0.6.0                      py_0  
 31 | diff-match-patch          20181111                   py_0  
 32 | docutils                  0.16                     py37_0  
 33 | efficientnet              1.0.0                    pypi_0    pypi
 34 | entrypoints               0.3                      py37_0  
 35 | flake8                    3.7.9                    py37_0  
 36 | freetype                  2.9.1                ha9979f8_1  
 37 | future                    0.18.2                   py37_0  
 38 | gast                      0.2.2                    py37_0  
 39 | google-pasta              0.1.8                      py_0  
 40 | grpcio                    1.16.1           py37h351948d_1  
 41 | h5py                      2.10.0           py37h5e291fa_0  
 42 | hdf5                      1.10.4               h7ebc959_0  
 43 | icc_rt                    2019.0.0             h0cc432a_1  
 44 | icu                       58.2                 ha66f8fd_1  
 45 | idna                      2.8                      py37_0  
 46 | image-classifiers         1.0.0                    pypi_0    pypi
 47 | imageio                   2.6.1                    pypi_0    pypi
 48 | imagesize                 1.2.0                      py_0  
 49 | importlib_metadata        1.5.0                    py37_0  
 50 | inflect                   4.1.0                    py37_0  
 51 | intel-openmp              2020.0                      166  
 52 | intervaltree              3.0.2                      py_0  
 53 | ipykernel                 5.1.4            py37h39e3cac_0  
 54 | ipython                   7.12.0           py37h5ca1d4c_0  
 55 | ipython_genutils          0.2.0                    py37_0  
 56 | isort                     4.3.21                   py37_0  
 57 | jaraco.itertools          5.0.0                      py_0  
 58 | jedi                      0.14.1                   py37_0  
 59 | jinja2                    2.11.1                     py_0  
 60 | jpeg                      9b                   hb83a4c4_2  
 61 | jsonschema                3.2.0                    py37_0  
 62 | jupyter_client            5.3.4                    py37_0  
 63 | jupyter_core              4.6.1                    py37_0  
 64 | keras                     2.3.1                    pypi_0    pypi
 65 | keras-applications        1.0.8                      py_0  
 66 | keras-preprocessing       1.1.0                      py_1  
 67 | keyring                   21.1.0                   py37_0  
 68 | kiwisolver                1.1.0            py37ha925a31_0  
 69 | lazy-object-proxy         1.4.3            py37he774522_0  
 70 | libpng                    1.6.37               h2a8f88b_0  
 71 | libprotobuf               3.11.2               h7bd577a_0  
 72 | libsodium                 1.0.16               h9d3ae62_0  
 73 | libspatialindex           1.9.3                h33f27b4_0  
 74 | markdown                  3.1.1                    py37_0  
 75 | markupsafe                1.1.1            py37he774522_0  
 76 | matplotlib                3.1.3                    py37_0  
 77 | matplotlib-base           3.1.3            py37h64f37c6_0  
 78 | mccabe                    0.6.1                    py37_1  
 79 | mistune                   0.8.4            py37he774522_0  
 80 | mkl                       2020.0                      166  
 81 | mkl-service               2.3.0            py37hb782905_0  
 82 | mkl_fft                   1.0.15           py37h14836fe_0  
 83 | mkl_random                1.1.0            py37h675688f_0  
 84 | more-itertools            8.2.0                      py_0  
 85 | nbconvert                 5.6.1                    py37_0  
 86 | nbformat                  5.0.4                      py_0  
 87 | networkx                  2.4                      pypi_0    pypi
 88 | numpy                     1.18.1           py37h93ca92e_0  
 89 | numpy-base                1.18.1           py37hc3f5095_1  
 90 | numpydoc                  0.9.2                      py_0  
 91 | opencv-python             4.2.0.32                 pypi_0    pypi
 92 | openssl                   1.1.1d               he774522_3  
 93 | opt_einsum                3.1.0                      py_0  
 94 | packaging                 20.1                       py_0  
 95 | pandoc                    2.2.3.2                       0  
 96 | pandocfilters             1.4.2                    py37_1  
 97 | paramiko                  2.6.0                    py37_0  
 98 | parso                     0.6.0                      py_0  
 99 | pathtools                 0.1.2                      py_1  
100 | pexpect                   4.8.0                    py37_0  
101 | pickleshare               0.7.5                    py37_0  
102 | pillow                    7.0.0                    pypi_0    pypi
103 | pip                       20.0.2                   py37_1  
104 | pluggy                    0.13.1                   py37_0  
105 | prompt_toolkit            3.0.3                      py_0  
106 | protobuf                  3.11.2           py37h33f27b4_0  
107 | psutil                    5.6.7            py37he774522_0  
108 | pycodestyle               2.5.0                    py37_0  
109 | pycparser                 2.19                     py37_0  
110 | pydocstyle                4.0.1                      py_0  
111 | pyflakes                  2.1.1                    py37_0  
112 | pygments                  2.5.2                      py_0  
113 | pylint                    2.4.4                    py37_0  
114 | pynacl                    1.3.0            py37h62dcd97_0  
115 | pyopenssl                 19.1.0                   py37_0  
116 | pyparsing                 2.4.6                      py_0  
117 | pyqt                      5.9.2            py37h6538335_2  
118 | pyreadline                2.1                      py37_1  
119 | pyrsistent                0.15.7           py37he774522_0  
120 | pysocks                   1.7.1                    py37_0  
121 | python                    3.7.6                h60c2a47_2  
122 | python-dateutil           2.8.1                      py_0  
123 | python-jsonrpc-server     0.3.4                      py_0  
124 | python-language-server    0.31.7                   py37_0  
125 | pytz                      2019.3                     py_0  
126 | pywavelets                1.1.1                    pypi_0    pypi
127 | pywin32                   227              py37he774522_1  
128 | pywin32-ctypes            0.2.0                 py37_1000  
129 | pyyaml                    5.3                      pypi_0    pypi
130 | pyzmq                     18.1.1           py37ha925a31_0  
131 | qdarkstyle                2.8                        py_0  
132 | qt                        5.9.7            vc14h73c81de_0  
133 | qtawesome                 0.6.1                      py_0  
134 | qtconsole                 4.6.0                      py_1  
135 | qtpy                      1.9.0                      py_0  
136 | requests                  2.22.0                   py37_1  
137 | rope                      0.16.0                     py_0  
138 | rtree                     0.9.3            py37h21ff451_0  
139 | scikit-image              0.16.2                   pypi_0    pypi
140 | scipy                     1.4.1            py37h9439919_0  
141 | segmentation-models       1.0.1                    pypi_0    pypi
142 | setuptools                45.1.0                   py37_0  
143 | sip                       4.19.8           py37h6538335_0  
144 | six                       1.14.0                   py37_0  
145 | snowballstemmer           2.0.0                      py_0  
146 | sortedcontainers          2.1.0                    py37_0  
147 | sphinx                    2.3.1                      py_0  
148 | sphinxcontrib-applehelp   1.0.1                      py_0  
149 | sphinxcontrib-devhelp     1.0.1                      py_0  
150 | sphinxcontrib-htmlhelp    1.0.2                      py_0  
151 | sphinxcontrib-jsmath      1.0.1                      py_0  
152 | sphinxcontrib-qthelp      1.0.2                      py_0  
153 | sphinxcontrib-serializinghtml 1.1.3                      py_0  
154 | spyder                    4.0.1                    py37_0  
155 | spyder-kernels            1.8.1                    py37_0  
156 | sqlite                    3.31.1               he774522_0  
157 | tensorboard               2.0.0              pyhb38c66f_1  
158 | tensorflow                2.0.0           gpu_py37h57d29ca_0  
159 | tensorflow-base           2.0.0           gpu_py37h390e234_0  
160 | tensorflow-estimator      2.0.0              pyh2649769_0  
161 | tensorflow-gpu            2.0.0                h0d30ee6_0  
162 | termcolor                 1.1.0                    py37_1  
163 | testpath                  0.4.4                      py_0  
164 | tornado                   6.0.3            py37he774522_1  
165 | traitlets                 4.3.3                    py37_0  
166 | ujson                     1.35             py37hfa6e2cd_0  
167 | urllib3                   1.25.8                   py37_0  
168 | vc                        14.1                 h0510ff6_4  
169 | vs2015_runtime            14.16.27012          hf0eaf9b_1  
170 | watchdog                  0.10.1                   py37_0  
171 | wcwidth                   0.1.8                      py_0  
172 | webencodings              0.5.1                    py37_1  
173 | werkzeug                  0.16.1                     py_0  
174 | wheel                     0.34.2                   py37_0  
175 | win_inet_pton             1.1.0                    py37_0  
176 | wincertstore              0.2                      py37_0  
177 | wrapt                     1.11.2           py37he774522_0  
178 | yaml                      0.1.7                hc54c509_2  
179 | yapf                      0.28.0                     py_0  
180 | zeromq                    4.3.1                h33f27b4_3  
181 | zipp                      2.1.0                      py_0  
182 | zlib                      1.2.11               h62dcd97_3  
183 | 


--------------------------------------------------------------------------------
/utils/augmented_data_generator.py:
--------------------------------------------------------------------------------
 1 | # -*- coding: utf-8 -*-
 2 | """
 3 | Image data generator
 4 | 
 5 | https://stackoverflow.com/questions/47826730/how-to-save-resized-images-using-imagedatagenerator-and-flow-from-directory-in-k
 6 | """
 7 | from keras.preprocessing.image import ImageDataGenerator
 8 | import numpy as np
 9 | from glob import glob
10 | from os.path import basename
11 | import cv2
12 | 
#Generator configuration: every option is left at a neutral value except
#brightness_range, so random brightness is the only augmentation applied.
datagen = ImageDataGenerator(featurewise_center=False, 
                             samplewise_center=False, 
                             featurewise_std_normalization=False,
                             samplewise_std_normalization=False,
                             zca_whitening=False, 
                             zca_epsilon=1e-06, 
                             rotation_range=0, 
                             width_shift_range=0.0, 
                             height_shift_range=0.0, 
                             brightness_range=(0.3,1), #The one augmentation in use
                             shear_range=0.0, 
                             zoom_range=0.0, 
                             channel_shift_range=0.0, 
                             fill_mode='nearest', 
                             cval=0.0, 
                             horizontal_flip=False, 
                             vertical_flip=False, 
                             rescale=None, 
                             preprocessing_function=None, 
                             data_format='channels_last', 
                             validation_split=0.0, 
                             interpolation_order=1)

#Source RGB images (*.png) and the folder that receives their augmented copies
folderpath=r"C:\Users\Craig\Desktop\test_rgb_folder\\"
filelist=glob(folderpath+'*.png')
save_here = r'C:\Users\Craig\Desktop\test_rgb_folder\augmented'

for filepath in filelist:
    #Add a leading batch axis so the single image forms a batch of one
    image = np.expand_dims(cv2.imread(filepath), 0)
    #NOTE(review): fit() is presumably a no-op here because all featurewise/ZCA
    #options above are disabled - confirm before removing.
    datagen.fit(image)
    
    #Image index = text after the last '_' in the file name, extension removed
    idx=basename(filepath).split('.')[0]
    idx=idx.split('_')[-1]
    
    #Depth image paired with this RGB image
    #NOTE(review): cv2.imread's result is not checked; behaviour when the depth
    #file is missing is not handled here.
    depth_file=r"C:\Users\Craig\Desktop\test_depth_folder\\"+f"d_{idx}.PNG"
    im=cv2.imread(depth_file)
    
    #Brightness changes do not alter depth, so the depth image is copied
    #unchanged; this first copy uses the fixed suffix 000000.
    cv2.imwrite(r"C:\Users\Craig\Desktop\test_depth_folder\augmented\\"+f"z_aug_d_{idx}_000000.PNG",im)
    
    #flow() yields batches indefinitely and writes each augmented RGB image to
    #save_here as a side effect; range(10) bounds the loop.
    #NOTE(review): the generator is the FIRST zip argument, so it is advanced
    #once more before range(10) is found exhausted - presumably an 11th
    #augmented RGB image is written, which would match the 11 depth copies
    #(000000 plus 0..9).  Confirm before reordering the zip arguments.
    for x, val in zip(datagen.flow(image,                    #batch holding the single source image
            save_to_dir=save_here,     #folder for the augmented RGB files
             save_prefix=f'z_aug_rgb_{idx}',        #file name prefix of each augmented RGB image
            save_format='png'),range(10)) :     #counter used as the depth-copy suffix
        #One unchanged depth copy per augmented RGB image
        cv2.imwrite(r"C:\Users\Craig\Desktop\test_depth_folder\augmented\\"+f"z_aug_d_{idx}_{val}.PNG",im)
57 |         
58 | 


--------------------------------------------------------------------------------
/utils/deep_utils.py:
--------------------------------------------------------------------------------
  1 | # -*- coding: utf-8 -*-
  2 | """
  3 | Utility functions for working with neural networks.
  4 | """
  5 | from keras.models import model_from_json, model_from_yaml
  6 | import numpy as np
  7 | import pickle
  8 | import matplotlib.pyplot as plt
  9 | import random
 10 | from tensorflow.keras.optimizers import Adam
 11 | 
 12 | def save_model(model,serialize_type,model_name='model',save_weights=False):
 13 |     '''Saves model and weights to file.'''
 14 |     serialize_type=serialize_type.lower()
 15 |     
 16 |     if serialize_type=='yaml':
 17 |         model_yaml = model.to_yaml()
 18 |         with open(model_name+".yaml", "w") as yaml_file:
 19 |             yaml_file.write(model_yaml)
 20 |     elif serialize_type=='json':
 21 |         model_json = model.to_json()
 22 |         with open(model_name+".json", "w") as json_file:
 23 |             json_file.write(model_json)
 24 |     if save_weights:
 25 |         model.save_weights(model_name+".h5")
 26 |         print(model_name+' & weights saved to disk.')
 27 |     else:
 28 |         print(model_name+' saved to disk.')
 29 | 
 30 |     
 31 | def load_model_weights(model, weights):
 32 |     '''Loads pretrained and compiled model.'''
 33 |     model.compile(loss='mean_squared_error',optimizer=Adam(),metrics=['mse']) 
 34 |     model.load_weights(weights)
 35 |     return model
 36 | 
 37 | def load_model(model_filepath,weights_filepath):
 38 |     '''Loads model and weights to file.'''
 39 |     
 40 |     serialize_type=model_filepath.split('.')[-1]
 41 |     serialize_type=serialize_type.lower()
 42 |     
 43 |     file = open(model_filepath, 'r')
 44 |     loaded_model = file.read()
 45 |     file.close()
 46 |     
 47 |     if serialize_type=='yaml':
 48 |         loaded_model = model_from_yaml(loaded_model)
 49 |     elif serialize_type=='json':
 50 |         loaded_model=model_from_json(loaded_model)
 51 | 
 52 |     loaded_model.load_weights(weights_filepath)
 53 |     print("Loaded model from disk")
 54 |     return loaded_model
 55 | 
 56 | def get_layer_names(model):
 57 |     '''Returns list of layer names.'''
 58 |     layer_names=[]
 59 |     for layer in model.layers:
 60 |         layer_names.append(layer.name)
 61 |     return layer_names
 62 | 
 63 | def generate_pickle_files(X,y):
 64 |     '''Generates pickle file to compress whole dataset.'''
 65 |     pickle.dump(X, open(r"X.p", "wb"), protocol=4)
 66 |     pickle.dump(y, open(r"y.p", "wb"), protocol=4)
 67 | 
 68 | def load_pickle_files(X_file, y_file):
 69 |     '''Reads data from pickle files'''
 70 |     X=pickle.load(open(X_file,'rb'))
 71 |     y=pickle.load(open(y_file,'rb'))
 72 |     return X, y
 73 | 
 74 | def simul_shuffle(mat1, mat2):
 75 |     '''Shuffles two matrices in the same order'''
 76 |     
 77 |     if type(mat1)==list:
 78 |         temp = list(zip(mat1, mat2)) 
 79 |         random.shuffle(temp) 
 80 |         mat1, mat2 = zip(*temp)
 81 |     else:
 82 |         idx=np.arange(0,mat1.shape[0])   
 83 |         random.shuffle(idx)
 84 |         mat1=mat1[idx]
 85 |         mat2=mat2[idx]
 86 |     return mat1, mat2
 87 |     
 88 | def plot_accuracy(history):
 89 |     '''Summarize history for accuracy'''
 90 |     plt.plot(history.history['acc'])
 91 |     plt.plot(history.history['val_acc'])
 92 |     plt.title('model accuracy')
 93 |     plt.ylabel('accuracy')
 94 |     plt.xlabel('epoch')
 95 |     plt.legend(['train', 'test'], loc='upper left')
 96 |     plt.show()
 97 | 
 98 | def plot_mse(history):
 99 |     '''Summarize history for mean-squared error (MSE)'''
100 |     plt.plot(history.history['mean_squared_error'])
101 |     plt.plot(history.history['val_mean_squared_error'])
102 |     plt.title('model MSE')
103 |     plt.ylabel('MSE')
104 |     plt.xlabel('epoch')
105 |     plt.legend(['train', 'test'], loc='upper left')
106 |     plt.show()
107 |     
def plot_loss(history):
    '''Plot training and validation loss per epoch from a single history.'''
    #Training curve first, then validation, matching the legend order below
    for series in ('loss', 'val_loss'):
        plt.plot(history.history[series])
    plt.title('model loss')
    plt.xlabel('epoch')
    plt.ylabel('loss')
    plt.legend(['train', 'test'], loc='upper left')
    plt.show()
117 | 
def plot_full_val_loss(history):
    '''Plot loss and validation loss concatenated over several histories.

    `history` is an iterable of objects that each carry a .history dict
    with 'loss' and 'val_loss' lists; the lists are joined in iteration
    order into one training curve and one validation curve.
    '''
    train_curve=[]
    val_curve=[]
    for run in history:
        train_curve.extend(run.history['loss'])
        val_curve.extend(run.history['val_loss'])
    plt.plot(train_curve)
    plt.plot(val_curve)
    plt.title('Validation Loss')
    plt.xlabel('epoch')
    plt.ylabel('loss')
    plt.legend(['train', 'test'], loc='upper left')
    plt.show()
134 | 
if __name__ == '__main__':   
    #Scratch entry point: only assigns a local dataset path; nothing in this
    #guard reads the variable afterwards.
    dataset=r"G:\Documents\KITTI\sandbox"


--------------------------------------------------------------------------------
/utils/fill_depth_colorization.py:
--------------------------------------------------------------------------------
  1 | # -*- coding: utf-8 -*-
  2 | 
  3 | # Original Matlab code https://cs.nyu.edu/~silberman/datasets/nyu_depth_v2.html
  4 | #
  5 | #
  6 | # Python port of depth filling code from NYU toolbox
  7 | # Speed needs to be improved
  8 | #
  9 | # Uses 'pypardiso' solver 
 10 | #
 11 | import scipy
 12 | import skimage
 13 | import skimage.color
 14 | import numpy as np
 15 | from pypardiso import spsolve
 16 | from PIL import Image
 17 | import image_utils
 18 | from glob import glob
 19 | from timeit import default_timer as timer
 20 | 
 21 | # fill_depth_colorization.m
 22 | # Preprocesses the kinect depth image using a gray scale version of the
 23 | # RGB image as a weighting for the smoothing. This code is a slight
 24 | # adaptation of Anat Levin's colorization code:
 25 | #
 26 | # See: www.cs.huji.ac.il/~yweiss/Colorization/
 27 | #
 28 | # Args:
 29 | #  imgRgb - HxWx3 matrix, the rgb image for the current frame. This must
 30 | #      be between 0 and 1.
 31 | #  imgDepth - HxW matrix, the depth image for the current frame in
 32 | #       absolute (meters) space.
 33 | #  alpha - a penalty value between 0 and 1 for the current depth values.
 34 | 
def fill_depth_colorization(imgRgb=None, imgDepthInput=None, alpha=1):
	'''Fill missing (zero) depth pixels using the RGB image as a smoothness guide.

	A sparse linear system is assembled in which every pixel is tied to the
	pixels of its 3x3 neighbourhood, weighted by grayscale similarity, and
	known depth values are tied to their measurement with weight alpha.
	The solved depth is used for pixels whose input depth was 0; all other
	pixels keep their input value.

	Args:
		imgRgb: HxWx3 RGB image, converted to grayscale with skimage.
		imgDepthInput: HxW depth image; entries equal to 0 are treated as missing.
		alpha: weight applied to the known depth values.

	Returns:
		HxW array: solved depth at missing pixels plus the input depth.

	NOTE(review): an all-zero depth image gives maxImgAbsDepth == 0 and a
	division by zero below - confirm callers never pass one.
	'''
	# Pixels with no measurement
	imgIsNoise = imgDepthInput == 0
	# Normalize depth by its maximum; the clamp to 1 is purely defensive
	maxImgAbsDepth = np.max(imgDepthInput)
	imgDepth = imgDepthInput / maxImgAbsDepth
	imgDepth[imgDepth > 1] = 1
	(H, W) = imgDepth.shape
	numPix = H * W
	# Column-major linear index of every pixel: indsM[i, j] == j*H + i
	indsM = np.arange(numPix).reshape((W, H)).transpose()
	# 1 where depth is known, 0 where it is missing
	knownValMask = (imgIsNoise == False).astype(int)
	grayImg = skimage.color.rgb2gray(imgRgb)
	winRad = 1
	# len_ counts the sparse entries written so far; absImgNdx is the linear
	# index of the current pixel (advances in the same column-major order)
	len_ = 0
	absImgNdx = 0
	len_window = (2 * winRad + 1) ** 2
	len_zeros = numPix * len_window

	# Pre-allocated triplet buffers (filled with -1) for the sparse matrix,
	# plus a scratch buffer for the gray values of one window
	cols = np.zeros(len_zeros) - 1
	rows = np.zeros(len_zeros) - 1
	vals = np.zeros(len_zeros) - 1
	gvals = np.zeros(len_window) - 1

	# Columns in the outer loop and rows in the inner loop, so the visiting
	# order matches the column-major numbering of indsM
	for j in range(W):
		for i in range(H):
			nWin = 0
			# Collect the neighbours inside the window, clipped at the borders
			for ii in range(max(0, i - winRad), min(i + winRad + 1, H)):
				for jj in range(max(0, j - winRad), min(j + winRad + 1, W)):
					if ii == i and jj == j:
						continue

					rows[len_] = absImgNdx
					cols[len_] = indsM[ii, jj]
					gvals[nWin] = grayImg[ii, jj]

					len_ = len_ + 1
					nWin = nWin + 1

			# Variance of the window's gray values, centre pixel included
			curVal = grayImg[i, j]
			gvals[nWin] = curVal
			c_var = np.mean((gvals[:nWin + 1] - np.mean(gvals[:nWin+ 1])) ** 2)

			# Gaussian width: 0.6 * variance, with two lower bounds applied
			csig = c_var * 0.6
			mgv = np.min((gvals[:nWin] - curVal) ** 2)
			if csig < -mgv / np.log(0.01):
				csig = -mgv / np.log(0.01)

			if csig < 2e-06:
				csig = 2e-06

			# Similarity weights normalized to sum to 1, stored negated as the
			# off-diagonal entries of this pixel's row
			gvals[:nWin] = np.exp(-(gvals[:nWin] - curVal) ** 2 / csig)
			gvals[:nWin] = gvals[:nWin] / sum(gvals[:nWin])
			vals[len_ - nWin:len_] = -gvals[:nWin]

			# Now the self-reference (along the diagonal).
			rows[len_] = absImgNdx
			cols[len_] = absImgNdx
			vals[len_] = 1  # sum(gvals(1:nWin))

			len_ = len_ + 1
			absImgNdx = absImgNdx + 1

	# Keep only the entries that were actually written
	vals = vals[:len_]
	cols = cols[:len_]
	rows = rows[:len_]
	A = scipy.sparse.csr_matrix((vals, (rows, cols)), (numPix, numPix))

	# Diagonal data term: alpha at known pixels, 0 elsewhere (column-major order)
	rows = np.arange(0, numPix)
	cols = np.arange(0, numPix)
	vals = (knownValMask * alpha).transpose().reshape(numPix)
	G = scipy.sparse.csr_matrix((vals, (rows, cols)), (numPix, numPix))

	A = A + G
	# Right-hand side: weighted normalized depth, flattened column-major
	b = np.multiply(vals.reshape(numPix), imgDepth.flatten('F'))

	#print ('Solving system..')

	new_vals = spsolve(A, b)
	new_vals = np.reshape(new_vals, (H, W), 'F')

	#print ('Done.')

	# Undo the normalization
	denoisedDepthImg = new_vals * maxImgAbsDepth

	output = denoisedDepthImg.reshape((H, W)).astype('float32')

	# Solved values only where depth was missing (input is 0 there); known
	# pixels keep their original input value
	output = np.multiply(output, (1-knownValMask)) + imgDepthInput

	return output
122 | 
if __name__=="__main__":
    #Order both file lists by the number formed from all digits in each path
    X_files=sorted(glob(r"E:\NYU\nyud_raw_data\nyuv2-python-toolbox-master\X_rgb\\"+'*'),
                   key=lambda f: int(''.join(filter(str.isdigit, f))))
    y_files=sorted(glob(r"E:\NYU\nyud_raw_data\nyuv2-python-toolbox-master\y_depth\\"+'*'),
                   key=lambda f: int(''.join(filter(str.isdigit, f))))

    len_files=len(X_files)

    #Index of the last image already processed; work resumes right after it
    last_image=7171

    for idx in range(last_image+1, len_files):
        start=timer()
        #Read the RGB image and its depth map
        imgRgb=image_utils.rgb_read(X_files[idx])
        imgDepthInput=image_utils.depth_read(y_files[idx])
        #Fill the missing depth values
        denoised_depth_img=fill_depth_colorization(imgRgb=imgRgb,
                                                   imgDepthInput=imgDepthInput,
                                                   alpha=0.8)
        #Save the filled depth image
        image_utils.heatmap(denoised_depth_img,save=True,
                            name=r'E:\NYU\nyud_raw_data\nyuv2-python-toolbox-master\colorized\y_depth\\'+f'c_depth_{idx}')
        end=timer()
        dt=end-start
        print(f'Saving {idx}/{len_files} in {dt} sec')


--------------------------------------------------------------------------------
/utils/image_utils.py:
--------------------------------------------------------------------------------
  1 | # -*- coding: utf-8 -*-
  2 | """
  3 | Image Utility functions.
  4 | """
  5 | import numpy as np
  6 | from PIL import Image
  7 | import matplotlib.pyplot as plt
  8 | import cv2
  9 | 
 10 | def crop_image(img,x=640,y=192,mode='middle'):
 11 |     '''Crops images starting at 'top', 'middle', or 'bottom'.'''
 12 |    
 13 |     if img.shape[0] != y:
 14 |         #Crop vertically
 15 |         if mode=='top':
 16 |             y_top, y_bottom = 0, y
 17 |             img=img[y_top:y_bottom,:]
 18 |         elif mode=='middle':
 19 |             y_mid=img.shape[0]/2
 20 |             y_top, y_bottom = int(y_mid-y/2), int(y_mid+y/2)
 21 |             img=img[y_top:y_bottom,:]
 22 |         elif mode=='bottom':
 23 |             y_top, y_bottom = img.shape[0]-y, img.shape[0]
 24 |             img=img[y_top:y_bottom,:]
 25 |         else:
 26 |             print('Unknown crop mode.')
 27 |             img=None
 28 |     
 29 |     if img.shape[1] != x:
 30 |         #Crop horizontally in the middle of image
 31 |         x_mid=img.shape[1]/2
 32 |         x_left, x_right = int(x_mid-x/2), int(x_mid+x/2)
 33 |         img=img[:,x_left:x_right]
 34 |         
 35 |     return img
 36 | 
 37 | def image_from_np(image_array,save=False,rgb=True):
 38 |     '''Plots RGB or grayscale image from numpy array'''
 39 |     if rgb==True:
 40 |         img = Image.fromarray(image_array, 'RGB')
 41 |         img.show()
 42 |     else:
 43 |         #img = Image.fromarray(image_array, '1')
 44 |         img=cv2.imshow('image_from_np',image_array)
 45 |         cv2.waitKey(0)
 46 |     return img
 47 | 
 48 | def add_blur(im_array,ksize=12,sigmaColor=400,sigmaMax=700):
 49 |     """
 50 |     Adds bilateral filtering to blur objects but preserve edges
 51 |     """
 52 |     return cv2.bilateralFiltering(im_array,ksize,sigmaColor,sigmaMax)
 53 | 
 54 | def rgb_read(filename):
 55 |     '''Reads RGB image from png file and returns it as a numpy array'''
 56 |     #Load image
 57 |     image=Image.open(filename)
 58 |     #store as np.array
 59 |     rgb=np.array(image)
 60 |     image.close()
 61 |     return rgb
 62 | 
 63 | def depth_read(filename):
 64 |     '''Loads depth map D from png file and returns it as a numpy array'''
 65 |     #Lower is closer
 66 |     # From KITTI devkit
 67 |     
 68 |     image=Image.open(filename)
 69 |     depth_png = np.array(image, dtype=int)
 70 |     # make sure we have a proper 16bit depth map here.. not 8bit!
 71 | 
 72 |     if depth_png.shape==(480,640,3):
 73 |         depth_png=(depth_png[:,:,0]+depth_png[:,:,1]+depth_png[:,:,2])/3
 74 |     
 75 |     #depth_png=depth_png[:,:,3]
 76 |     assert(np.max(depth_png) <= 255)
 77 |     depth=depth_png.astype(np.float)
 78 |     #depth = depth_png.astype(np.float) / 256.
 79 |     #depth[depth_png == 0] = -1.
 80 |     image.close()
 81 | 
 82 |     return depth
 83 | 
 84 | def depth_read_kitti(filename):
 85 |     '''Loads depth map D from png file and returns it as a numpy array'''
 86 |     #Lower is closer
 87 |     # From KITTI devkit
 88 |     
 89 |     image=Image.open(filename)
 90 |     depth_png = np.array(image, dtype=int)
 91 |     
 92 |     #TODO: Determine if this if legitimate for getting depth values
 93 |     if depth_png.shape==(192,640,4):
 94 |         # print('it is')
 95 |         depth_png=(depth_png[:,:,0]+depth_png[:,:,1]+depth_png[:,:,2])/3
 96 |     
 97 |     assert(np.max(depth_png) <= 255)
 98 |     depth=depth_png.astype('int8') #np.float
 99 |  
100 |     image.close()
101 | 
102 |     return depth
def heatmap(image,save=False,name='heatmap',cmap='gray'):
    '''Plots heatmap of depth data from an image file or np.ndarray.

    Args:
        image: np.ndarray of pixel values, or anything PIL.Image.open
            accepts (e.g. a file path).
        save: When truthy, also write the array to name + '.png'.
        name: Output path without the '.png' extension.
        cmap: Matplotlib colormap name (e.g. 'binary', 'plasma', 'gray').

    Returns:
        None. The array shape is printed and the plot is shown with
        plt.show().
    '''
    if isinstance(image, np.ndarray):
        pic_array=image
    else:
        #Convert to np.ndarray, closing the file once the pixels are copied
        with Image.open(image) as pic:
            pic_array=np.array(pic)
    #Plot heatmap
    print(pic_array.shape)
    plt.imshow(pic_array, cmap=cmap, interpolation='nearest')
    plt.show()
    if save:
        plt.imsave(name+'.png',pic_array, cmap=cmap)
117 |     
if __name__=='__main__':
    #Manual check: plot one ground-truth depth image, then load it as an array
    sample_png=r"G:\Documents\KITTI\sandbox\y_depth\2011_09_26_drive_0002_sync\proj_depth\groundtruth\image_02\0000000005.png"
    heatmap(sample_png)
    sample_depth=depth_read(sample_png)
122 | 


--------------------------------------------------------------------------------
/utils/images_to_video.py:
--------------------------------------------------------------------------------
 1 | # -*- coding: utf-8 -*-
 2 | """
 3 | Build video from image sequence.
 4 | """
 5 | import cv2
 6 | from glob import glob
 7 |   
 8 | def images_to_video(folderpath,output_filename=r'output_video.avi',out_FPS=10,width=640,height=480):
 9 |     '''Converts all images in a folder into video.'''
10 | 
11 |     images=glob(folderpath+'*.jpg')
12 |     
13 |     # Define the codec and create VideoWriter object.
14 |     out = cv2.VideoWriter(output_filename,cv2.VideoWriter_fourcc('M','J','P','G'), 
15 |                            out_FPS, (int(width),int(height)))
16 |     
17 |     for image in images:
18 |         img=cv2.imread(image)
19 |         out.write(img)
20 | 
21 |     cv2.destroyAllWindows()
22 |     
if __name__=='__main__':
    #Build a 10 FPS, 640x480 video from the images under the folder prefix
    video_options=dict(output_filename=r'camera_cal.avi',out_FPS=10,width=640,height=480)
    images_to_video(r"D:\rpi_cal_files\\",**video_options)


--------------------------------------------------------------------------------
/utils/rgb2depth.py:
--------------------------------------------------------------------------------
 1 | # -*- coding: utf-8 -*-
 2 | """
 3 | Tool for creating a depth prediction video from an input RGB video.
 4 | """
 5 | import cv2
 6 | import numpy as np
 7 | from models import models
 8 | import image_utils
 9 | import deep_utils
10 |   
def rgb2depth_video(filename, model, out_FPS=10, width=640, height=192,
                    output_filename=r'depth_output.avi', gamma=1,
                    mirror=False, crop_mode='middle'):
    '''Create depth prediction video from input RGB video. Adjust
    brightness (gamma) for viewing purposes only. Anything other than
    gamma=1 is distorting the numerical depth prediction.

    Args:
        filename: Input video passed to cv2.VideoCapture.
        model: Object with a predict() method; it is called with an array
            of shape (1, height, width, 3) scaled to [0, 1], and its output
            is reshaped to (height, width).
        out_FPS: Frame rate of the output video.
        width: Frame width fed to the model and written to the output.
        height: Frame height fed to the model and written to the output.
        output_filename: Path of the MJPG video to write.
        gamma: Display scaling; the prediction is multiplied by 255/gamma.
        mirror: Flip each frame horizontally before prediction.
        crop_mode: Vertical anchor passed to image_utils.crop_image.

    Processing stops at the end of the input, or at the first frame that
    fails to process (the error is printed). The reader and writer are
    always released.
    '''
    cam = cv2.VideoCapture(filename)

    # Define the codec and create VideoWriter object.
    out = cv2.VideoWriter(output_filename,cv2.VideoWriter_fourcc('M','J','P','G'),
                          out_FPS, (int(width),int(height)))

    try:
        while cam.isOpened():
            ret_val, img = cam.read()
            if not ret_val:
                #No more frames to read
                break

            try:
                if mirror:
                    img = cv2.flip(img, 1)

                #If img doesn't match output height & width
                if (img.shape[0] != height) or (img.shape[1] != width):
                    #Crop image
                    img=image_utils.crop_image(img,width,height,mode=crop_mode)

                #Predict depth
                img=img.reshape(1,height,width,3)
                img=np.divide(img,255).astype(np.float16) #Normalize input
                y_est=model.predict(img)
                y_est=y_est.reshape((height,width))

                #Scale to 8-bit; clip so gamma<1 saturates instead of
                #overflowing the uint8 cast
                gray=np.clip(y_est*255*(1/gamma),0,255).astype(np.uint8)
                #Map grayscale to Rainbow (applyColorMap takes the
                #single-channel image directly)
                vis=cv2.applyColorMap(gray,cv2.COLORMAP_RAINBOW)

                #Write prediction to video
                out.write(vis)
            except Exception as err:
                #Keep the original stop-on-failure behaviour, but say why
                print(f'Stopping depth video early: {err}')
                break
    finally:
        cam.release()
        #Release the writer so the output file is closed
        out.release()
        cv2.destroyAllWindows()
55 | 
if __name__=='__main__':
    #Build the network, then load the pretrained weights into it
    weights=r"E:\W-Net_Connected_weights_best_KITTI_35Epochs.hdf5"
    model=deep_utils.load_model_weights(models.wnet_connected(),weights)
    #Define input RGB video (tested with .mp4, .mov, and .avi)
    rgb_video=r"G:\Program Files\MATLAB\R2018b\toolbox\vision\visiondata\atrium.mp4"
    #Create depth video
    video_options=dict(out_FPS=30, width=640, height=192,
                       output_filename=r'depth_output.avi', gamma=0.6,
                       mirror=False, crop_mode='middle')
    rgb2depth_video(rgb_video,model,**video_options)


--------------------------------------------------------------------------------
/utils/rgb2depth_stream.py:
--------------------------------------------------------------------------------
 1 | # -*- coding: utf-8 -*-
 2 | """
 3 | Tool for testing depth estimation models on live video stream.
 4 | """
 5 | import cv2
 6 | import numpy as np
 7 | import image_utils
 8 | import deep_utils
 9 | import time
10 | from models import models
11 |   
def rgb2depth_stream(model,method='cv2',mirror=True,width=640,height=192,
                 gamma=1,crop_mode='middle'):
    '''Runs depth estimation on live webcam video stream.  Adjust
    brightness (gamma) for viewing purposes only. Anything other than
    gamma=1 is distorting the numerical depth prediction.

    Args:
        model: Object with a predict() method; it is called with an array
            of shape (1, height, width, 3) scaled to [0, 1], and its output
            is reshaped to (height, width).
        method: 'cv2' shows a rainbow colour map in an OpenCV window;
            'heatmap' plots via image_utils.heatmap.
        mirror: Flip each frame horizontally before prediction.
        width: Frame width fed to the model.
        height: Frame height fed to the model.
        gamma: Display scaling; the prediction is multiplied by 255/gamma.
        crop_mode: Vertical anchor passed to image_utils.crop_image.

    Raises:
        ValueError: If method is not 'cv2' or 'heatmap'.

    The loop ends when ESC is pressed or a frame cannot be read. The
    camera is always released.
    '''
    if method not in ('cv2','heatmap'):
        #Reject up front rather than printing a warning on every frame
        raise ValueError(f'Unknown display method: {method!r}')

    cam = cv2.VideoCapture(0)

    try:
        while True:
            start=time.perf_counter()

            ret_val, img = cam.read()
            if not ret_val:
                #img is not usable when the grab fails
                print('Could not read a frame from the webcam.')
                break
            if mirror:
                img = cv2.flip(img, 1)

            #If img doesn't match output height & width
            if (img.shape[0] != height) or (img.shape[1] != width):
                #Crop image
                img=image_utils.crop_image(img,width,height,mode=crop_mode)

            img=img.reshape(1,height,width,3)
            img=np.divide(img,255).astype(np.float16)
            #Predict depth
            y_est=model.predict(img)
            y_est=y_est.reshape((height,width))

            #Show depth prediction results
            if method=='cv2':
                #Scale to 8-bit; clip so gamma<1 saturates instead of
                #overflowing the uint8 cast
                gray=np.clip(y_est*255*(1/gamma),0,255).astype(np.uint8)
                #Map grayscale to Rainbow
                vis=cv2.applyColorMap(gray,cv2.COLORMAP_RAINBOW)

                cv2.imshow('Depth Estimate', vis)
            else:
                image_utils.heatmap(y_est,cmap='plasma')

            #Estimate instantaneous frames per second
            elapsed=time.perf_counter()-start
            if elapsed>0:
                fps=round(1/elapsed,2)
                print(f'FPS: {fps}')

            if cv2.waitKey(1) == 27:
                break  # esc to quit
    finally:
        #Free the webcam for other programs
        cam.release()
        cv2.destroyAllWindows()
59 | 
if __name__=='__main__':
    #Build the network, then load the pretrained weights into it
    weights=r"E:\W-Net_Connected_weights_best_KITTI_35Epochs.hdf5"
    model=deep_utils.load_model_weights(models.wnet_connected(),weights)

    #Available display back-ends; the first one is used below
    display_methods=['cv2','heatmap']
    chosen_method=display_methods[0]

    rgb2depth_stream(model,method=chosen_method,mirror=True,
                     width=640,height=192,gamma=0.3,crop_mode='middle')


--------------------------------------------------------------------------------
/utils/stack_videos.py:
--------------------------------------------------------------------------------
 1 | # -*- coding: utf-8 -*-
 2 | """
 3 | Stacks videos vertically or horizontally.
 4 | """
 5 | import cv2
 6 | import numpy as np
 7 |   
 8 | def stack_videos(filename1,filename2, out_FPS=10, output_filename=r'output_stack.avi',
 9 |                  stack_direction='vertical'):
10 |     '''Stacks videos vertically or horizontally.'''
11 | 
12 |     cam1 = cv2.VideoCapture(filename1)
13 |     cam2 = cv2.VideoCapture(filename2)
14 |     
15 |     if stack_direction=='vertical':
16 |         vert_mul=2
17 |         hor_mul=1
18 |         axis=0
19 |     else:
20 |         vert_mul=1
21 |         hor_mul=2
22 |         axis=1
23 |         
24 |     # Define the codec and create VideoWriter object.
25 |     out = cv2.VideoWriter(output_filename,cv2.VideoWriter_fourcc('M','J','P','G'), 
26 |                           out_FPS, (int(hor_mul*cam1.get(3)),int(vert_mul*cam1.get(4))))
27 |     
28 |     while(cam1.isOpened()):
29 |         ret_val1, img1 = cam1.read()
30 |         ret_val2, img2 = cam2.read()
31 |         
32 |         axis
33 |         if ret_val1 == True:
34 |             # Write the frame into the file 'output.avi'
35 |             vis=np.concatenate((img1, img2), axis=axis) #0:vertical, 1:horizontal
36 |             out.write(vis)
37 |             
38 |         else:
39 |             break
40 |         
41 |     cam1.release()
42 |     cam2.release()
43 |     cv2.destroyAllWindows()
44 |     
if __name__=='__main__':
    #Place the two clips side by side
    video_pair=(
        r"C:\Users\Craig\Documents\GitHub\depth-estimation\models\output_2011_09_26_drive_0009_unseen_10FPS.avi",
        r"C:\Users\Craig\Documents\GitHub\depth-estimation\models\2011_09_26_drive_0009_unseen_depth_10FPS.avi",
    )
    stack_videos(*video_pair,stack_direction='horizontal')


--------------------------------------------------------------------------------