├── CMakeLists.txt ├── DL_Scripts ├── MNIST.py ├── basic.py ├── checkpoint ├── detect_ros.py ├── export_inference_graph.py ├── fusion.py ├── generate_tfrecord.py ├── image_recognition.py ├── lidar_image_pub.py ├── multi_sensor_fusion.py ├── object_detection.py ├── pointcloud.py ├── radar_publisher _segment.py ├── radar_publisher.py ├── ros_fusion.py ├── ros_multi_sensor_fusion.py ├── save_model.py ├── test.py ├── train.py └── xml_to_csv.py ├── README.md ├── Results ├── Screenshot from 2020-06-04 12-10-31.png ├── Screenshot from 2020-06-22 15-14-01.png ├── VID-20200623-WA0008.mp4 └── output.gif ├── bag └── loop_bag.launch ├── include └── nuscenes2bag │ ├── DatasetTypes.hpp │ ├── EgoPoseConverter.hpp │ ├── FileProgress.hpp │ ├── Filesystem.hpp │ ├── ImageDirectoryConverter.hpp │ ├── LidarDirectoryConverter.hpp │ ├── LidarDirectoryConverterXYZIR.hpp │ ├── MetaDataProvider.hpp │ ├── MetaDataReader.hpp │ ├── MetaDataTypes.hpp │ ├── NuScenes2Bag.hpp │ ├── PclRadarObject.hpp │ ├── RadarDirectoryConverter.hpp │ ├── RunEvery.hpp │ ├── SceneConverter.hpp │ ├── ToDebugString.hpp │ ├── thread_pool.hpp │ └── utils.hpp ├── msg ├── RadarObject.msg └── RadarObjects.msg ├── output_inference_graph_v2 ├── checkpoint ├── frozen_inference_graph.pb ├── model.ckpt.data-00000-of-00001 ├── model.ckpt.index ├── model.ckpt.meta ├── pipeline.config ├── saved_model │ └── saved_model.pb └── v1.config ├── package.xml ├── src ├── EgoPoseConverter.cpp ├── FileProgress.cpp ├── ImageDirectoryConverter.cpp ├── LidarDirectoryConverter.cpp ├── LidarDirectoryConverterXYZIR.cpp ├── MetaData.cpp ├── MetaDataReader.cpp ├── NuScenes2Bag.cpp ├── RadarDirectoryConverter.cpp ├── SceneConverter.cpp ├── main.cpp ├── pcd_to_image.cpp ├── pointcloud_im.cpp └── utils.cpp └── thirdparty └── json └── nlohmann └── json.hpp /CMakeLists.txt: -------------------------------------------------------------------------------- 1 | 2 | cmake_minimum_required(VERSION 3.8) # C++17 support was added in CMake 3.8 3 | 4 | project(nuscenes2bag) 5 | 6 | #set(CMAKE_CXX_STANDARD 11) 7 | set(CMAKE_CXX_STANDARD 14) 8 | 9 | set(CMAKE_BUILD_TYPE Release) # Debug, Release, RelWithDebInfo 10 | 11 | find_package(Boost 1.58.0 COMPONENTS filesystem thread REQUIRED) # Ubuntu 16.04 12 | #find_package(Boost 1.65.0 COMPONENTS filesystem thread REQUIRED) # Ubuntu 18.04 13 | 14 | find_package(catkin 15 | REQUIRED 16 | rosbag 17 | sensor_msgs 18 | cv_bridge 19 | pcl_conversions 20 | pcl_msgs 21 | message_generation 22 | geometry_msgs 23 | std_msgs 24 | nav_msgs 25 | tf) 26 | 27 | find_package(OpenCV REQUIRED core) 28 | 29 | add_message_files(FILES RadarObjects.msg RadarObject.msg) 30 | 31 | generate_messages(DEPENDENCIES 32 | std_msgs 33 | geometry_msgs 34 | tf 35 | nav_msgs) 36 | 37 | catkin_package(INCLUDE_DIRS 38 | include 39 | thirdparty/json/ 40 | DEPENDS 41 | OpenCV) 42 | 43 | include_directories(SYSTEM 44 | thirdparty/json/ 45 | ${catkin_INCLUDE_DIRS} 46 | ${Boost_INCLUDE_DIRS} 47 | ${OpenCV_INCLUDE_DIRS}) 48 | include_directories(include) 49 | 50 | find_package(PCL REQUIRED COMPONENTS common io) 51 | 52 | set(SRCS 53 | src/EgoPoseConverter.cpp 54 | src/ImageDirectoryConverter.cpp 55 | src/LidarDirectoryConverter.cpp 56 | src/LidarDirectoryConverterXYZIR.cpp 57 | src/RadarDirectoryConverter.cpp 58 | src/NuScenes2Bag.cpp 59 | src/FileProgress.cpp 60 | src/MetaDataReader.cpp 61 | src/MetaData.cpp 62 | src/SceneConverter.cpp 63 | src/utils.cpp) 64 | 65 | add_executable(${PROJECT_NAME} ${SRCS} src/main.cpp) 66 | 67 | target_compile_options(${PROJECT_NAME} 68 | PRIVATE 69 | 
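# (Editor's note, assumption: standard catkin workflow, not stated in the repo.)
# A typical build of this package from the root of a catkin workspace would be:
#   catkin_make
#   source devel/setup.bash
# The warning flags below apply only to this target (PRIVATE).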
-Wall 70 | -Wextra 71 | -pedantic 72 | ) 73 | 74 | target_compile_definitions(${PROJECT_NAME} PRIVATE "-DCMAKE_CXX_STANDARD=${CMAKE_CXX_STANDARD}") 75 | 76 | add_dependencies(${PROJECT_NAME} ${${PROJECT_NAME}_EXPORTED_TARGETS} 77 | ${catkin_EXPORTED_TARGETS}) 78 | 79 | target_link_libraries(${PROJECT_NAME} 80 | ${OpenCV_LIBRARIES} 81 | ${PCL_COMMON_LIBRARY} 82 | ${PCL_IO_LIBRARY} 83 | ${catkin_LIBRARIES}) 84 | 85 | install(DIRECTORY include/${PROJECT_NAME}/ thirdparty/json/ 86 | DESTINATION ${CATKIN_PACKAGE_INCLUDE_DESTINATION} 87 | FILES_MATCHING 88 | PATTERN "*.h" 89 | PATTERN ".svn" EXCLUDE) 90 | -------------------------------------------------------------------------------- /DL_Scripts/MNIST.py: -------------------------------------------------------------------------------- 1 | import tensorflow as tf 2 | 3 | tf.compat.v1.enable_eager_execution( 4 | config=None, device_policy=None, execution_mode=None 5 | ) 6 | mnist = tf.keras.datasets.mnist 7 | 8 | (x_train, y_train), (x_test, y_test) = mnist.load_data() 9 | x_train, x_test = x_train / 255.0, x_test / 255.0 10 | model = tf.keras.models.Sequential([ 11 | tf.keras.layers.Flatten(input_shape=(28, 28)), 12 | tf.keras.layers.Dense(128, activation='relu'), 13 | tf.keras.layers.Dropout(0.2), 14 | tf.keras.layers.Dense(10) 15 | ]) 16 | 17 | predictions = model(x_train[:1]).numpy() 18 | predictions 19 | 20 | tf.nn.softmax(predictions).numpy() 21 | 22 | loss_fn = tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True) 23 | loss_fn(y_train[:1], predictions).numpy() 24 | model.compile(optimizer='adam', 25 | loss=loss_fn, 26 | metrics=['accuracy']) 27 | 28 | model.fit(x_train, y_train, epochs=5) 29 | model.evaluate(x_test, y_test, verbose=2) 30 | 31 | probability_model = tf.keras.Sequential([model,tf.keras.layers.Softmax()]) 32 | probability_model(x_test[:5]) 33 | -------------------------------------------------------------------------------- /DL_Scripts/basic.py: -------------------------------------------------------------------------------- 1 | #The most basic DL model ever 2 | import tensorflow as tf 3 | import numpy as np 4 | from tensorflow import keras 5 | 6 | model = tf.keras.Sequential([keras.layers.Dense(units=1, input_shape=[1])]) 7 | 8 | model.compile(optimizer='sgd', loss='mean_squared_error') 9 | 10 | xs = np.array([-1.0, 0.0, 1.0, 2.0, 3.0, 4.0], dtype=float) 11 | ys = np.array([-3.0, -1.0, 1.0, 3.0, 5.0, 7.0], dtype=float) 12 | 13 | model.fit(xs, ys, epochs=500) 14 | print(model.predict([10.0])) 15 | 16 | -------------------------------------------------------------------------------- /DL_Scripts/checkpoint: -------------------------------------------------------------------------------- 1 | model_checkpoint_path: "model.ckpt-10696" 2 | all_model_checkpoint_paths: "model.ckpt-10517" 3 | all_model_checkpoint_paths: "model.ckpt-10562" 4 | all_model_checkpoint_paths: "model.ckpt-10606" 5 | all_model_checkpoint_paths: "model.ckpt-10651" 6 | all_model_checkpoint_paths: "model.ckpt-10696" 7 | -------------------------------------------------------------------------------- /DL_Scripts/detect_ros.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python 2 | 3 | import os 4 | import sys 5 | import cv2 6 | import cv_bridge 7 | import numpy as np 8 | import time 9 | try: 10 | import tensorflow as tf 11 | except ImportError: 12 | print("unable to import TensorFlow. 
Is it installed?") 13 | sys.exit(1) 14 | 15 | # ROS related imports 16 | import rospy 17 | from std_msgs.msg import String , Header 18 | from sensor_msgs.msg import Image 19 | from cv_bridge import CvBridge, CvBridgeError 20 | from vision_msgs.msg import Detection2D, Detection2DArray, ObjectHypothesisWithPose 21 | from PIL import Image as img 22 | 23 | # Object detection module imports 24 | import object_detection 25 | from object_detection.utils import label_map_util 26 | from object_detection.utils import visualization_utils as vis_util 27 | from collections import defaultdict 28 | from io import StringIO 29 | from matplotlib import pyplot as plt 30 | import cv2 31 | from IPython.display import display 32 | # SET FRACTION OF GPU YOU WANT TO USE HERE 33 | GPU_FRACTION = 0.4 34 | 35 | ######### Set model here ############ 36 | MODEL_NAME = 'output_inference_graph_v2' 37 | # Path to frozen detection graph. This is the actual model that is used for the object detection. 38 | PATH_TO_CKPT = MODEL_NAME + '/frozen_inference_graph.pb' 39 | # List of the strings that is used to add correct label for each box. 40 | PATH_TO_LABELS = os.path.join('annotations','label_map.pbtxt') 41 | NUM_CLASSES = 2 42 | 43 | detection_graph = tf.Graph() 44 | with detection_graph.as_default(): 45 | od_graph_def = tf.GraphDef() 46 | with tf.gfile.GFile(PATH_TO_CKPT, 'rb') as fid: 47 | serialized_graph = fid.read() 48 | od_graph_def.ParseFromString(serialized_graph) 49 | tf.import_graph_def(od_graph_def, name='') 50 | 51 | ## Loading label map 52 | # Label maps map indices to category names, so that when our convolution network predicts `5`, 53 | # we know that this corresponds to `airplane`. Here we use internal utility functions, 54 | # but anything that returns a dictionary mapping integers to appropriate string labels would be fine 55 | label_map = label_map_util.load_labelmap(PATH_TO_LABELS) 56 | categories = label_map_util.convert_label_map_to_categories(label_map, max_num_classes=NUM_CLASSES, use_display_name=True) 57 | category_index = label_map_util.create_category_index(categories) 58 | 59 | # Setting the GPU options to use fraction of gpu that has been set 60 | config = tf.ConfigProto() 61 | config.gpu_options.per_process_gpu_memory_fraction = GPU_FRACTION 62 | 63 | # Detection 64 | 65 | class Detector: 66 | 67 | def __init__(self): 68 | self.object_pub = rospy.Publisher("objects", Detection2DArray, queue_size=1) 69 | self.bridge = CvBridge() 70 | self.image_sub = rospy.Subscriber("image_lidar", Image, self.image_cb) 71 | self.sess = tf.Session(graph=detection_graph,config=config) 72 | #self.front_image_sub=rospy.Subscriber("cam_front/raw",Image,self.front_image_cb) 73 | #self.img_array=np.zeros((450,300)) 74 | self.front_image_sub=rospy.Subscriber("debug_image",Image,self.front_image_cb) 75 | self.img_array=np.zeros((640,480)) 76 | 77 | def front_image_cb(self,data): 78 | self.img_array=cv2.resize(self.bridge.imgmsg_to_cv2(data),(640,480)) 79 | #self.img_array=cv2.resize(self.bridge.imgmsg_to_cv2(data),(450,300)) 80 | time.sleep(0.2) 81 | #cv2.imshow("window",self.img_array) 82 | #cv2.waitKey(1) 83 | 84 | def drawBoundingBox(self,imgcv,array): 85 | cv2.rectangle(imgcv,(int(array[1]),250),(int(array[0]),320),(0,255,0),1) 86 | #cv2.rectangle(imgcv,(_x1,_y1),(_x2,_y2),(0,255,0),cv2.FILLED) 87 | #cv2.putText(imgcv,label,(x1,y1),cv2.FONT_HERSHEY_COMPLEX,0.5,(0,0,0),1) 88 | #cv2.imshow("window",imgcv) 89 | #cv2.waitKey(1) 90 | 91 | def image_cb(self, data): 92 | objArray = Detection2DArray() 93 | try: 94 | 
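# Convert the incoming ROS Image message (the lidar-derived image published on the
# "image_lidar" topic) into an OpenCV/NumPy array before running it through the
# detection graph.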
cv_image = self.bridge.imgmsg_to_cv2(data) 95 | except CvBridgeError as e: 96 | print(e) 97 | # the array based representation of the image will be used later in order to prepare the 98 | # result image with boxes and labels on it. 99 | image=cv_image[:,:,0] 100 | mod_image=np.zeros((600,600,3)) 101 | mod_image[:, :, 0]=image 102 | mod_image[:, :, 1]=image 103 | mod_image[:, :, 2]=image 104 | image_np = mod_image.astype(np.uint8) 105 | # Expand dimensions since the model expects images to have shape: [1, None, None, 3] 106 | image_np_expanded = np.expand_dims(image_np, axis=0) 107 | image_tensor = detection_graph.get_tensor_by_name('image_tensor:0') 108 | # Each box represents a part of the image where a particular object was detected. 109 | boxes = detection_graph.get_tensor_by_name('detection_boxes:0') 110 | # Each score represent how level of confidence for each of the objects. 111 | # Score is shown on the result image, together with the class label. 112 | scores = detection_graph.get_tensor_by_name('detection_scores:0') 113 | classes = detection_graph.get_tensor_by_name('detection_classes:0') 114 | num_detections = detection_graph.get_tensor_by_name('num_detections:0') 115 | (boxes, scores, classes, num_detections) = self.sess.run([boxes, scores, classes, num_detections], 116 | feed_dict={image_tensor: image_np_expanded}) 117 | objects,array=vis_util.visualize_boxes_and_labels_on_image_array( 118 | image_np, 119 | np.squeeze(boxes), 120 | np.squeeze(classes).astype(np.int32), 121 | np.squeeze(scores), 122 | category_index, 123 | use_normalized_coordinates=True, 124 | line_thickness=2) 125 | if(array!=None): 126 | array[0]=array[0]*640#450 127 | array[1]=array[1]*640#450 128 | array[2]=array[2]*480#300 129 | array[3]=array[3]*480#300 130 | print(array) 131 | self.drawBoundingBox(self.img_array,array) 132 | #display(img.fromarray(image_np)) 133 | #cv2.imshow("window",image_np)) 134 | h1, w1 = image_np.shape[:2] 135 | h2, w2 = self.img_array.shape[:2] 136 | #create empty matrix 137 | vis = np.zeros((max(h1, h2), w1+w2,3), np.uint8) 138 | #combine 2 images 139 | vis[:h1,:w1,:3] = image_np 140 | vis[:h2,w1:w1+w2,:3] =self.img_array 141 | cv2.imshow("window",vis) 142 | cv2.waitKey(1) 143 | 144 | if __name__=='__main__': 145 | rospy.init_node('detector_node') 146 | obj=Detector() 147 | try: 148 | rospy.spin() 149 | except KeyboardInterrupt: 150 | print("ShutDown") 151 | cv2.destroyAllWindows() 152 | -------------------------------------------------------------------------------- /DL_Scripts/export_inference_graph.py: -------------------------------------------------------------------------------- 1 | # Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 | # 3 | # Licensed under the Apache License, Version 2.0 (the "License"); 4 | # you may not use this file except in compliance with the License. 5 | # You may obtain a copy of the License at 6 | # 7 | # http://www.apache.org/licenses/LICENSE-2.0 8 | # 9 | # Unless required by applicable law or agreed to in writing, software 10 | # distributed under the License is distributed on an "AS IS" BASIS, 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 | # See the License for the specific language governing permissions and 13 | # limitations under the License. 14 | # ============================================================================== 15 | 16 | r"""Tool to export an object detection model for inference. 
17 | Prepares an object detection tensorflow graph for inference using model 18 | configuration and a trained checkpoint. Outputs inference 19 | graph, associated checkpoint files, a frozen inference graph and a 20 | SavedModel (https://tensorflow.github.io/serving/serving_basic.html). 21 | The inference graph contains one of three input nodes depending on the user 22 | specified option. 23 | * `image_tensor`: Accepts a uint8 4-D tensor of shape [None, None, None, 3] 24 | * `encoded_image_string_tensor`: Accepts a 1-D string tensor of shape [None] 25 | containing encoded PNG or JPEG images. Image resolutions are expected to be 26 | the same if more than 1 image is provided. 27 | * `tf_example`: Accepts a 1-D string tensor of shape [None] containing 28 | serialized TFExample protos. Image resolutions are expected to be the same 29 | if more than 1 image is provided. 30 | and the following output nodes returned by the model.postprocess(..): 31 | * `num_detections`: Outputs float32 tensors of the form [batch] 32 | that specifies the number of valid boxes per image in the batch. 33 | * `detection_boxes`: Outputs float32 tensors of the form 34 | [batch, num_boxes, 4] containing detected boxes. 35 | * `detection_scores`: Outputs float32 tensors of the form 36 | [batch, num_boxes] containing class scores for the detections. 37 | * `detection_classes`: Outputs float32 tensors of the form 38 | [batch, num_boxes] containing classes for the detections. 39 | * `raw_detection_boxes`: Outputs float32 tensors of the form 40 | [batch, raw_num_boxes, 4] containing detection boxes without 41 | post-processing. 42 | * `raw_detection_scores`: Outputs float32 tensors of the form 43 | [batch, raw_num_boxes, num_classes_with_background] containing class score 44 | logits for raw detection boxes. 45 | * `detection_masks`: Outputs float32 tensors of the form 46 | [batch, num_boxes, mask_height, mask_width] containing predicted instance 47 | masks for each box if its present in the dictionary of postprocessed 48 | tensors returned by the model. 49 | Notes: 50 | * This tool uses `use_moving_averages` from eval_config to decide which 51 | weights to freeze. 52 | Example Usage: 53 | -------------- 54 | python export_inference_graph \ 55 | --input_type image_tensor \ 56 | --pipeline_config_path path/to/ssd_inception_v2.config \ 57 | --trained_checkpoint_prefix path/to/model.ckpt \ 58 | --output_directory path/to/exported_model_directory 59 | The expected output would be in the directory 60 | path/to/exported_model_directory (which is created if it does not exist) 61 | with contents: 62 | - inference_graph.pbtxt 63 | - model.ckpt.data-00000-of-00001 64 | - model.ckpt.info 65 | - model.ckpt.meta 66 | - frozen_inference_graph.pb 67 | + saved_model (a directory) 68 | Config overrides (see the `config_override` flag) are text protobufs 69 | (also of type pipeline_pb2.TrainEvalPipelineConfig) which are used to override 70 | certain fields in the provided pipeline_config_path. These are useful for 71 | making small changes to the inference graph that differ from the training or 72 | eval config. 
73 | Example Usage (in which we change the second stage post-processing score 74 | threshold to be 0.5): 75 | python export_inference_graph \ 76 | --input_type image_tensor \ 77 | --pipeline_config_path path/to/ssd_inception_v2.config \ 78 | --trained_checkpoint_prefix path/to/model.ckpt \ 79 | --output_directory path/to/exported_model_directory \ 80 | --config_override " \ 81 | model{ \ 82 | faster_rcnn { \ 83 | second_stage_post_processing { \ 84 | batch_non_max_suppression { \ 85 | score_threshold: 0.5 \ 86 | } \ 87 | } \ 88 | } \ 89 | }" 90 | """ 91 | import tensorflow as tf 92 | from google.protobuf import text_format 93 | from object_detection import exporter 94 | from object_detection.protos import pipeline_pb2 95 | 96 | slim = tf.contrib.slim 97 | flags = tf.app.flags 98 | 99 | flags.DEFINE_string('input_type', 'image_tensor', 'Type of input node. Can be ' 100 | 'one of [`image_tensor`, `encoded_image_string_tensor`, ' 101 | '`tf_example`]') 102 | flags.DEFINE_string('input_shape', None, 103 | 'If input_type is `image_tensor`, this can explicitly set ' 104 | 'the shape of this input tensor to a fixed size. The ' 105 | 'dimensions are to be provided as a comma-separated list ' 106 | 'of integers. A value of -1 can be used for unknown ' 107 | 'dimensions. If not specified, for an `image_tensor, the ' 108 | 'default shape will be partially specified as ' 109 | '`[None, None, None, 3]`.') 110 | flags.DEFINE_string('pipeline_config_path', None, 111 | 'Path to a pipeline_pb2.TrainEvalPipelineConfig config ' 112 | 'file.') 113 | flags.DEFINE_string('trained_checkpoint_prefix', None, 114 | 'Path to trained checkpoint, typically of the form ' 115 | 'path/to/model.ckpt') 116 | flags.DEFINE_string('output_directory', None, 'Path to write outputs.') 117 | flags.DEFINE_string('config_override', '', 118 | 'pipeline_pb2.TrainEvalPipelineConfig ' 119 | 'text proto to override pipeline_config_path.') 120 | flags.DEFINE_boolean('write_inference_graph', False, 121 | 'If true, writes inference graph to disk.') 122 | tf.app.flags.mark_flag_as_required('pipeline_config_path') 123 | tf.app.flags.mark_flag_as_required('trained_checkpoint_prefix') 124 | tf.app.flags.mark_flag_as_required('output_directory') 125 | FLAGS = flags.FLAGS 126 | 127 | 128 | def main(_): 129 | pipeline_config = pipeline_pb2.TrainEvalPipelineConfig() 130 | with tf.gfile.GFile(FLAGS.pipeline_config_path, 'r') as f: 131 | text_format.Merge(f.read(), pipeline_config) 132 | text_format.Merge(FLAGS.config_override, pipeline_config) 133 | if FLAGS.input_shape: 134 | input_shape = [ 135 | int(dim) if dim != '-1' else None 136 | for dim in FLAGS.input_shape.split(',') 137 | ] 138 | else: 139 | input_shape = None 140 | exporter.export_inference_graph( 141 | FLAGS.input_type, pipeline_config, FLAGS.trained_checkpoint_prefix, 142 | FLAGS.output_directory, input_shape=input_shape, 143 | write_inference_graph=FLAGS.write_inference_graph) 144 | 145 | 146 | if __name__ == '__main__': 147 | tf.app.run() 148 | -------------------------------------------------------------------------------- /DL_Scripts/fusion.py: -------------------------------------------------------------------------------- 1 | import numpy as np 2 | import tensorflow as tf 3 | from tensorflow import keras 4 | from tensorflow.keras import layers 5 | print(tf.__version__) 6 | from tensorflow.keras.models import Sequential,Model 7 | from tensorflow.keras.layers import Dense,Conv2D, Flatten, Dropout, MaxPooling2D,concatenate 8 | from tensorflow.keras.preprocessing.image import 
ImageDataGenerator 9 | import cv2 10 | import os 11 | import matplotlib.pyplot as plt 12 | import datetime 13 | 14 | tf.keras.backend.clear_session() 15 | 16 | IMG_HEIGHT=150 17 | IMG_WIDTH=150 18 | input_image=keras.Input(shape=(IMG_HEIGHT,IMG_WIDTH,3)) 19 | input_lidar=keras.Input(shape=(IMG_HEIGHT,IMG_WIDTH,3)) 20 | 21 | class JoinedGenerator(keras.utils.Sequence): 22 | def __init__(self, generator1, generator2): 23 | self.generator1 = generator1 24 | self.generator2 = generator2 25 | 26 | def __len__(self): 27 | return len(self.generator1) 28 | 29 | def __getitem__(self, i): 30 | x1, y1 = self.generator1[i] 31 | x2, y2 = self.generator2[i] 32 | return [x1, x2], y1 33 | 34 | def on_epoch_end(self): 35 | self.generator1.on_epoch_end() 36 | self.generator2.on_epoch_end() 37 | 38 | datagen_lidar = ImageDataGenerator() 39 | # load and iterate training dataset 40 | train_lidar = datagen_lidar.flow_from_directory('data_lidar/train/', target_size=(IMG_HEIGHT, IMG_WIDTH),class_mode='binary', batch_size=2) 41 | # load and iterate validation dataset 42 | val_lidar = datagen_lidar.flow_from_directory('data_lidar/validation/', target_size=(IMG_HEIGHT, IMG_WIDTH),class_mode='binary', batch_size=2) 43 | # load and iterate test dataset 44 | test_lidar = datagen_lidar.flow_from_directory('data_lidar/test/', target_size=(IMG_HEIGHT, IMG_WIDTH),class_mode='binary', batch_size=2) 45 | 46 | datagen = ImageDataGenerator() 47 | # load and iterate training dataset 48 | train_it = datagen.flow_from_directory('data/train/', target_size=(IMG_HEIGHT, IMG_WIDTH),class_mode='binary', batch_size=2) 49 | # load and iterate validation dataset 50 | val_it = datagen.flow_from_directory('data/validation/', target_size=(IMG_HEIGHT, IMG_WIDTH),class_mode='binary', batch_size=2) 51 | # load and iterate test dataset 52 | test_it = datagen.flow_from_directory('data/test/', target_size=(IMG_HEIGHT, IMG_WIDTH),class_mode='binary', batch_size=2) 53 | 54 | x=Conv2D(16, 3, padding='same', activation='relu')(input_image) 55 | output_image=MaxPooling2D()(x) 56 | 57 | model_image = keras.Model(inputs=input_image,outputs=output_image, name='image_input') 58 | model_image.summary() 59 | 60 | y=Conv2D(16, 3, padding='same', activation='relu')(input_lidar) 61 | output_lidar=MaxPooling2D()(y) 62 | 63 | model_lidar = keras.Model(inputs=input_lidar,outputs=output_lidar, name='lidar_input') 64 | model_lidar.summary() 65 | 66 | combined = concatenate([model_image.output, model_lidar.output]) 67 | 68 | z=Conv2D(32, 3, padding='same', activation='relu')(combined) 69 | z=MaxPooling2D()(z) 70 | z=Conv2D(64, 3, padding='same', activation='relu')(z) 71 | z=MaxPooling2D()(z) 72 | z=Conv2D(16, 3, padding='same', activation='relu')(z) 73 | z=MaxPooling2D()(z) 74 | z=Flatten()(z) 75 | z=Dense(512, activation='relu')(z) 76 | z=Dense(128, activation='relu')(z) 77 | z = Dense(1, activation="linear")(z) 78 | fusion = Model(inputs=[model_lidar.input, model_image.input], outputs=z) 79 | #keras.utils.plot_model(fusion, 'fusion.png', show_shapes=True) 80 | 81 | fusion.compile(optimizer='adam',loss=tf.keras.losses.BinaryCrossentropy(from_logits=True),metrics=['accuracy']) 82 | 83 | checkpoint_path = "training_1/cp_fusion.ckpt" 84 | checkpoint_dir = os.path.dirname(checkpoint_path) 85 | 86 | # # Create a callback that saves the model's weights 87 | cp_callback = tf.keras.callbacks.ModelCheckpoint(filepath=checkpoint_path, 88 | save_weights_only=True, 89 | verbose=1) 90 | 91 | log_dir = "logs/fit/" + datetime.datetime.now().strftime("%Y%m%d-%H%M%S") 92 | 
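# TensorBoard callback for this run; note it is currently commented out of the
# callbacks list passed to fit_generator below. If enabled, training curves can be
# inspected with: tensorboard --logdir logs/fit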
tensorboard_callback = tf.keras.callbacks.TensorBoard(log_dir=log_dir, histogram_freq=1) 93 | 94 | training_generator = JoinedGenerator(train_it, train_lidar) 95 | validation_generator = JoinedGenerator(val_it, val_lidar) 96 | test_generator = JoinedGenerator(test_it, test_lidar) 97 | history = fusion.fit_generator( 98 | training_generator, 99 | steps_per_epoch=40, 100 | epochs=10, 101 | validation_data=validation_generator, 102 | validation_steps=10, 103 | callbacks=[cp_callback]#tensorboard_callback] 104 | ) 105 | loss= fusion.evaluate_generator(test_generator, steps=4) 106 | fusion.save_weights('./checkpoints/my_checkpoint') 107 | 108 | image_mod=cv2.imread("1.jpg") 109 | image_mod=cv2.resize(image_mod,(150,150)) 110 | 111 | image_mod_lidar=cv2.imread("3.jpg") 112 | image_mod_lidar=cv2.resize(image_mod_lidar,(150,150)) 113 | val=fusion.predict([image_mod.reshape(-1,150,150,3),image_mod_lidar.reshape(-1,150,150,3)]) 114 | print(val) 115 | if(val[0][0]<0): 116 | print("car") 117 | else: 118 | print("pedestrian") 119 | 120 | image_mod=cv2.imread("2.jpg") 121 | image_mod=cv2.resize(image_mod,(150,150)) 122 | 123 | image_mod_lidar=cv2.imread("5.jpg") 124 | image_mod_lidar=cv2.resize(image_mod_lidar,(150,150)) 125 | val=fusion.predict([image_mod.reshape(-1,150,150,3),image_mod_lidar.reshape(-1,150,150,3)]) 126 | print(val) 127 | if(val[0][0]<0): 128 | print("car") 129 | else: 130 | print("pedestrian") 131 | -------------------------------------------------------------------------------- /DL_Scripts/generate_tfrecord.py: -------------------------------------------------------------------------------- 1 | 2 | """ 3 | Usage: 4 | # Create train data: 5 | python generate_tfrecord.py --label=