osrf · vinay0410 · Oct 13, 2018 · Oct 14, 2018 · Oct 17, 2018
diff --git a/README.md b/README.md
@@ -12,9 +12,20 @@ To run Default SSD (Single Shot Detection) algorithm:
 
 1. Install ROS: http://wiki.ros.org/kinetic/Installation/Ubuntu
 
-2. Install camera dependencies
+2. Install vision_msgs Dependency
+    `sudo apt install ros-kinetic-vision-msgs`
 
-    `sudo apt-get install ros-kinetic-usb_cam ros-kinetic-openni2-launch`
+3. Install any one of the following camera dependencies
+
+    `sudo apt install ros-kinetic-openni2-launch` (for openni2 supported camera)
+
+                OR
+
+    `sudo apt install ros-kinetic-usb-cam`  (usb camera / webcam)
+
+                OR
+
+    `sudo apt install ros-kinetic-cv-camera`  (usb camera / webcam)
 
 3. Install tensorflow into python virtualenv: https://www.tensorflow.org/install/install_linux
 
@@ -34,11 +45,9 @@ To run Default SSD (Single Shot Detection) algorithm:
 
     `cd ~/catkin_ws/src`
 
-    `git clone https://github.com/Kukanani/vision_msgs.git`
-
     `git clone https://github.com/osrf/tensorflow_object_detector.git`
 
-6. Build tensorflow_object_detector and Vision message 
+6. Build tensorflow_object_detector
 
     `cd ~/catkin_ws && catkin_make`
 
@@ -54,11 +63,12 @@ To run Default SSD (Single Shot Detection) algorithm:
 
     `roslaunch tensorflow_object_detector usb_cam_detector.launch`
 
+    OR
 
+    `roslaunch tensorflow_object_detector cv_camera_detector.launch`
 
 If you want to try any other ML model:
 
-1. Download any Object Detection Models from the Tensorflow Object detection API and place it in `data/models/`. You can find the models in tensorflow Object Detection Model Zoo: https://github.com/tensorflow/models/blob/master/object_detection/g3doc/detection_model_zoo.md. Extract the `tar.gz` file.
-
-2. Edit the MODEL_NAME and LABEL_NAME in detect_ros.py. By default it is `ssd_mobilenet_v1_coco_11_06_2017` with `mscoco_label_map.pbtxt` respectively. 
+1. Download any object detection model from the TensorFlow Object Detection API. You can find the models in the TensorFlow Object Detection Model Zoo: https://github.com/tensorflow/models/blob/master/object_detection/g3doc/detection_model_zoo.md. Extract the `tar.gz` file.
 
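+2. Edit the `model_path`, `labels_path` and `num_classes` parameters in any of the launch files. `model_path` is the extracted directory containing `frozen_inference_graph.pb`; use absolute paths. If `model_path` and `labels_path` are left empty, `ssd_mobilenet_v1_coco_2018_01_28` is downloaded and stored in `~/data/models`.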
diff --git a/CMakeLists.txt → detector/CMakeLists.txt b/CMakeLists.txt → detector/CMakeLists.txt
@@ -17,27 +17,7 @@ find_package(catkin REQUIRED COMPONENTS
 )
 
 ##set the URL to download
-set(URL "http://download.tensorflow.org/models/object_detection/ssd_mobilenet_v1_coco_11_06_2017.tar.gz")
-set(DOWNLOAD_PATH ${CMAKE_CURRENT_SOURCE_DIR}/data/models/ssd_mobilenet_v1_coco_11_06_2017.tar.gz)
-set(EXTRACTED_PATH ${CMAKE_CURRENT_SOURCE_DIR}/data/models)
-
-if (NOT EXISTS "${EXTRACTED_PATH}/ssd_mobilenet_v1_coco_11_06_2017")
-  if (NOT EXISTS "${DOWNLOAD_PATH}")
-  message(STATUS "Downloading SSD model ....")
-  file(
-    DOWNLOAD "${URL}" "${DOWNLOAD_PATH}"
-    SHOW_PROGRESS
-  )
-  endif()
-  message(STATUS "Extracting...")
-  execute_process(
-    COMMAND cmake -E tar xzf ${DOWNLOAD_PATH}
-    WORKING_DIRECTORY ${EXTRACTED_PATH}
-  )
-endif()
-
-file(REMOVE ${DOWNLOAD_PATH})
-
+
 ## System dependencies are found with CMake's conventions
 # find_package(Boost REQUIRED COMPONENTS system)
 
@@ -133,7 +113,7 @@ catkin_package(
 #  DEPENDS system_lib
 )
 
-catkin_install_python(PROGRAMS scripts/detect_ros.py 
+catkin_install_python(PROGRAMS scripts/detect_ros.py
 			DESTINATION ${CATKIN_PACKAGE_BIN_DESTINATION})
 ###########
 ## Build ##

diff --git a/config/display.rviz → detector/config/display.rviz b/config/display.rviz → detector/config/display.rviz
diff --git a/data/.gitignore → detector/data/.gitignore b/data/.gitignore → detector/data/.gitignore
diff --git a/data/labels/mscoco_label_map.pbtxt → detector/data/labels/mscoco_label_map.pbtxt b/data/labels/mscoco_label_map.pbtxt → detector/data/labels/mscoco_label_map.pbtxt
diff --git a/data/labels/pascal_label_map.pbtxt → detector/data/labels/pascal_label_map.pbtxt b/data/labels/pascal_label_map.pbtxt → detector/data/labels/pascal_label_map.pbtxt
diff --git a/data/labels/pet_label_map.pbtxt → detector/data/labels/pet_label_map.pbtxt b/data/labels/pet_label_map.pbtxt → detector/data/labels/pet_label_map.pbtxt
diff --git a/data/models/readme.md → detector/data/models/readme.md b/data/models/readme.md → detector/data/models/readme.md
diff --git a/detector/launch/cv_camera_detector.launch b/detector/launch/cv_camera_detector.launch
@@ -0,0 +1,17 @@
+<launch>
+  <!-- Detector node. Empty model_path and labels_path make detect_ros.py fall back to its default model. -->
+  <node pkg="tensorflow_object_detector" type="detect_ros.py" name="detect_ros" output="screen">
+    <remap from="image" to="/cv_camera_node/image_raw"/>
+
+    <param name="model_path" value=""/>
+    <param name="labels_path" value=""/>
+    <param name="num_classes" value="90"/>
+  </node>
+
+  <!-- Camera driver; the detector's "image" topic is remapped to this node's image_raw topic. -->
+  <node pkg="cv_camera" type="cv_camera_node" name="cv_camera_node" output="screen">
+    <param name="device_id" value="0"/>
+  </node>
+
+  <!-- Viewer for the detector's debug_image topic. -->
+  <node pkg="image_view" type="image_view" name="image_view">
+    <remap from="image" to="debug_image"/>
+  </node>
+</launch>
diff --git a/launch/object_detect.launch → detector/launch/object_detect.launch b/launch/object_detect.launch → detector/launch/object_detect.launch
@@ -1,6 +1,10 @@
 <launch>
-	<node pkg= "tensorflow_object_detector" name="detect_ros" type="detect_ros.py"  output="screen"> 
+	<node pkg= "tensorflow_object_detector" name="detect_ros" type="detect_ros.py"  output="screen">
     <remap from='image' to='/camera/rgb/image_raw'/>
+
+		<param name="model_path" value=""/>
+		<param name="labels_path" value=""/>
+		<param name="num_classes" value="90"/>
 	</node>
 	<!-- rviz -->
   <arg name ="rviz" default="true" />

diff --git a/launch/usb_cam_detector.launch → detector/launch/usb_cam_detector.launch b/launch/usb_cam_detector.launch → detector/launch/usb_cam_detector.launch
@@ -1,6 +1,10 @@
 <launch>
-	<node pkg= "tensorflow_object_detector" name="detect_ros" type="detect_ros.py"  output="screen"> 
+	<node pkg= "tensorflow_object_detector" name="detect_ros" type="detect_ros.py"  output="screen">
     <remap from="image" to="/usb_cam_node/image_raw"/>
+
+		<param name="model_path" value=""/>
+		<param name="labels_path" value=""/>
+		<param name="num_classes" value="90"/>
 	</node>
 
   <node pkg="usb_cam" type="usb_cam_node" name="usb_cam_node" output="screen">

diff --git a/package.xml → detector/package.xml b/package.xml → detector/package.xml
diff --git a/detector/scripts/detect_ros.py b/detector/scripts/detect_ros.py
@@ -0,0 +1,225 @@
+#!/usr/bin/env python
+## Author: Rohit
+## Date: July, 25, 2017
+# Purpose: Ros node to detect objects using tensorflow
+
+import os
+import sys
+import cv2
+import tarfile
+import numpy as np
+try:
+    import tensorflow as tf
+except ImportError:
+    print("unable to import TensorFlow. Is it installed?")
+    print("  sudo apt install python-pip")
+    print("  sudo pip install tensorflow")
+    sys.exit(1)
+
+# ROS related imports
+import rospy
+from std_msgs.msg import String , Header
+from sensor_msgs.msg import Image
+from cv_bridge import CvBridge, CvBridgeError
+from vision_msgs.msg import Detection2D, Detection2DArray, ObjectHypothesisWithPose
+
+# Object detection module imports
+import object_detection
+from object_detection.utils import label_map_util
+from object_detection.utils import visualization_utils as vis_util
+import urllib2
+
+DEFAULT_MODEL = os.path.join(os.path.expanduser("~"), "data", "models", "ssd_mobilenet_v1_coco_2018_01_28", "frozen_inference_graph.pb")
+DEFAULT_LABELS = os.path.join(os.path.dirname(sys.path[0]), "data", "labels", "mscoco_label_map.pbtxt")
+
+def download_model(url, location):
+    """Download the file at `url` into the directory `location`.
+
+    The directory is created when it does not exist. The response is streamed
+    to disk in 8192-byte blocks while a progress line is printed to stdout.
+
+    Args:
+        url: Address of the file to fetch; its last path component is used
+            as the local file name.
+        location: Directory in which the downloaded file is stored.
+
+    Returns:
+        Path of the downloaded file inside `location`.
+    """
+    file_name = url.split('/')[-1]
+    u = urllib2.urlopen(url)
+    try:
+        if not os.path.exists(location):
+            os.makedirs(location)
+        file_path = os.path.join(location, file_name)
+
+        # Content-Length is optional in HTTP responses. Without it only the
+        # running byte count is shown instead of failing with an IndexError.
+        length_headers = u.info().getheaders("Content-Length")
+        file_size = int(length_headers[0]) if length_headers else 0
+        print "Downloading: %s Bytes: %s" % (file_name, file_size if file_size else "unknown")
+
+        file_size_dl = 0
+        block_sz = 8192
+        # `with` closes the output file even when the transfer fails part-way.
+        with open(file_path, 'wb') as f:
+            while True:
+                buffer = u.read(block_sz)
+                if not buffer:
+                    break
+
+                file_size_dl += len(buffer)
+                f.write(buffer)
+                if file_size:
+                    status = r"%10d  [%3.2f%%]" % (file_size_dl, file_size_dl * 100. / file_size)
+                else:
+                    # Unknown or zero total size: a percentage cannot be computed.
+                    status = r"%10d" % file_size_dl
+                # Trailing backspaces move the cursor back so the next status
+                # overwrites this one on the same terminal line.
+                status = status + chr(8)*(len(status)+1)
+                print status,
+    finally:
+        # Release the HTTP connection on success and on failure alike.
+        u.close()
+
+    return file_path
+
+def download_data():
+    """Fetch and unpack the default COCO-trained SSD model if it is missing.
+
+    Does nothing when `DEFAULT_MODEL` already exists. Otherwise the model
+    archive is downloaded with `download_model` into `~/data/models` and
+    extracted into the directory that holds the downloaded archive.
+    """
+    if os.path.exists(DEFAULT_MODEL):
+        return
+
+    model_path = os.path.join(os.path.expanduser("~"), "data", "models")
+    final_path = download_model("http://download.tensorflow.org/models/object_detection/ssd_mobilenet_v1_coco_2018_01_28.tar.gz", model_path)
+    print final_path
+    # NOTE(review): the archive is fetched over plain HTTP and unpacked with
+    # extractall(), which trusts the member paths stored in the archive.
+    # Consider verifying a checksum before extracting.
+    tar = tarfile.open(final_path)
+    try:
+        tar.extractall(path=os.path.dirname(final_path))
+    finally:
+        # Release the archive handle even if extraction fails.
+        tar.close()
+
+def get_model_params():
+    """Resolve the frozen graph and label map paths from the node's private params.
+
+    Reads `~model_path` (a directory expected to contain
+    `frozen_inference_graph.pb`) and `~labels_path`. When both are empty or
+    unset, the default model is downloaded if needed and the default paths
+    are returned.
+
+    Returns:
+        Tuple `(graph_path, labels_path)`.
+
+    Raises:
+        Exception: If only one of the two params is given, or a given path
+            does not exist.
+    """
+    # Default to "" so that omitting the params behaves exactly like passing
+    # empty values, instead of raising KeyError from rospy.get_param.
+    model_path = rospy.get_param("~model_path", "")
+    labels_path = rospy.get_param("~labels_path", "")
+
+    if (not model_path and not labels_path):
+        rospy.logwarn("No params passed, using default model")
+        download_data()
+        return (DEFAULT_MODEL, DEFAULT_LABELS)
+
+    graph_path = os.path.join(model_path, "frozen_inference_graph.pb")
+    if (os.path.exists(graph_path) and os.path.exists(labels_path)):
+        rospy.loginfo("Using Passed parameters")
+        return (graph_path, labels_path)
+
+    raise Exception("Either Incomplete arguments were passed or the paths do not exist. To use the default model do not pass any parameters. NOTE: Please use absolute paths in params")
+
+# Detection
+
+class Detector:
+    """ROS wrapper around a frozen TensorFlow object-detection graph.
+
+    Subscribes to the `image` topic, runs the graph on every received frame,
+    publishes the detections on `objects` (Detection2DArray) and publishes
+    the frame handed to the visualization utility on `debug_image`.
+    """
+
+    def __init__(self):
+        """Load the graph and label map, warm up the session and set up ROS I/O."""
+        path_to_ckpt, path_to_labels = get_model_params()
+
+        # Fall back to 90, the value the bundled launch files pass, so that a
+        # launch file omitting the parameter does not raise KeyError.
+        num_classes = rospy.get_param("~num_classes", 90)
+
+        detection_graph = tf.Graph()
+        with detection_graph.as_default():
+            od_graph_def = tf.GraphDef()
+            with tf.gfile.GFile(path_to_ckpt, 'rb') as fid:
+                serialized_graph = fid.read()
+                od_graph_def.ParseFromString(serialized_graph)
+                tf.import_graph_def(od_graph_def, name='')
+
+        ## Loading label map
+        # Label maps map indices to category names, so that when our convolution network predicts `5`,
+        # we know that this corresponds to `airplane`.  Here we use internal utility functions,
+        # but anything that returns a dictionary mapping integers to appropriate string labels would be fine
+        label_map = label_map_util.load_labelmap(path_to_labels)
+        categories = label_map_util.convert_label_map_to_categories(label_map, max_num_classes=num_classes, use_display_name=True)
+        self.category_index = label_map_util.create_category_index(categories)
+
+        # Collect only the output tensors that this particular graph provides;
+        # keys whose tensor is absent from the graph are simply left out.
+        ops = detection_graph.get_operations()
+        all_tensor_names = {output.name for op in ops for output in op.outputs}
+        self.tensor_dict = {}
+        for key in [
+            'num_detections', 'detection_boxes', 'detection_scores',
+            'detection_classes', 'detection_masks'
+        ]:
+            tensor_name = key + ':0'
+            if tensor_name in all_tensor_names:
+                self.tensor_dict[key] = detection_graph.get_tensor_by_name(
+                    tensor_name)
+
+        self.image_tensor = detection_graph.get_tensor_by_name('image_tensor:0')
+
+        self.sess = tf.Session(graph=detection_graph)
+
+        rospy.loginfo("Initializing")
+
+        # Run one inference on a dummy 1x1 image before subscribing --
+        # presumably so start-up cost is not paid on the first real frame.
+        dummy_tensor = np.zeros((1,1,1,3), dtype=np.int32)
+        self.sess.run(self.tensor_dict,
+                      feed_dict={self.image_tensor: dummy_tensor})
+
+        self.image_pub = rospy.Publisher("debug_image",Image, queue_size=1)
+        self.object_pub = rospy.Publisher("objects", Detection2DArray, queue_size=1)
+        self.bridge = CvBridge()
+        # Subscribe last: the callback uses the session and publishers created above.
+        self.image_sub = rospy.Subscriber("image", Image, self.image_cb, queue_size=1, buff_size=2**24)
+
+
+    def image_cb(self, data):
+        """Run detection on one incoming frame and publish the results.
+
+        Args:
+            data: sensor_msgs/Image message received on the `image` topic.
+        """
+        try:
+            cv_image = self.bridge.imgmsg_to_cv2(data, "bgr8")
+        except CvBridgeError as e:
+            # Without a decoded frame there is nothing to detect on; carrying
+            # on would fail with a NameError on `cv_image`.
+            rospy.logerr(e)
+            return
+        image = cv2.cvtColor(cv_image, cv2.COLOR_BGR2RGB)
+
+        # np.asarray does not copy an ndarray, so image_np refers to the same
+        # pixels as `image` that are handed to the visualization utility below.
+        image_np = np.asarray(image)
+        # Expand dimensions since the model expects images to have shape: [1, None, None, 3]
+        image_np_expanded = np.expand_dims(image_np, axis=0)
+
+        output_dict = self.sess.run(self.tensor_dict,
+                                    feed_dict={self.image_tensor: image_np_expanded})
+
+        # NOTE(review): assumes this package's visualization utility returns one
+        # (id, score, box) entry per drawn detection -- confirm against vis_util.
+        objects = vis_util.visualize_boxes_and_labels_on_image_array(
+            image,
+            np.squeeze(output_dict["detection_boxes"]),
+            np.squeeze(output_dict["detection_classes"]).astype(np.int32),
+            np.squeeze(output_dict["detection_scores"]),
+            self.category_index,
+            use_normalized_coordinates=True,
+            line_thickness=2)
+
+        objArray = Detection2DArray()
+        objArray.header = data.header
+        objArray.detections = [
+            self.object_predict(detected, data.header, image_np, cv_image)
+            for detected in objects
+        ]
+        self.object_pub.publish(objArray)
+
+        # image_np is in RGB order; swapping R and B again yields BGR for publishing.
+        img = cv2.cvtColor(image_np, cv2.COLOR_BGR2RGB)
+        try:
+            image_out = self.bridge.cv2_to_imgmsg(img, "bgr8")
+        except CvBridgeError as e:
+            # Skip the debug image rather than publishing an empty message.
+            rospy.logerr(e)
+            return
+        image_out.header = data.header
+        self.image_pub.publish(image_out)
+
+    def object_predict(self,object_data, header, image_np,image):
+        """Convert one detection entry into a Detection2D message.
+
+        Args:
+            object_data: Indexable detection entry; [0] is used as the class id,
+                [1] as the score and [2] as the box. The box is read as
+                (ymin, xmin, ymax, xmax) and scaled by the image size.
+            header: Header copied into the resulting message.
+            image_np: Unused; kept so existing callers keep working.
+            image: Array whose first two shape entries give image height and width.
+
+        Returns:
+            Detection2D with one hypothesis and a bounding box in pixel units.
+        """
+        image_height, image_width = image.shape[:2]
+        obj=Detection2D()
+        obj_hypothesis= ObjectHypothesisWithPose()
+
+        object_id=object_data[0]
+        object_score=object_data[1]
+        dimensions=object_data[2]
+
+        obj.header=header
+        obj_hypothesis.id = object_id
+        obj_hypothesis.score = object_score
+        obj.results.append(obj_hypothesis)
+        obj.bbox.size_y = int((dimensions[2]-dimensions[0])*image_height)
+        obj.bbox.size_x = int((dimensions[3]-dimensions[1] )*image_width)
+        obj.bbox.center.x = int((dimensions[1] + dimensions [3])*image_width/2)
+        obj.bbox.center.y = int((dimensions[0] + dimensions[2])*image_height/2)
+
+        return obj
+
+def main(args):
+    """Start the detector node and block until ROS shuts down.
+
+    Args:
+        args: Command-line arguments; accepted from the caller but not used.
+    """
+    rospy.init_node('detector_node')
+    # Held in a local so the instance stays referenced while the node spins.
+    detector = Detector()
+    try:
+        rospy.spin()
+    except KeyboardInterrupt:
+        print("ShutDown")
+    cv2.destroyAllWindows()
+
+
+if __name__ == '__main__':
+    main(sys.argv)
diff --git a/setup.py → detector/setup.py b/setup.py → detector/setup.py
diff --git a/src/object_detection/__init__.py → detector/src/object_detection/__init__.py b/src/object_detection/__init__.py → detector/src/object_detection/__init__.py
diff --git a/...t_detection/anchor_generators/__init__.py → ...r/src/object_detection/protos/__init__.py b/...t_detection/anchor_generators/__init__.py → ...r/src/object_detection/protos/__init__.py
diff --git a/...tection/protos/string_int_label_map.proto → ...tection/protos/string_int_label_map.proto b/...tection/protos/string_int_label_map.proto → ...tection/protos/string_int_label_map.proto
diff --git a/...ection/protos/string_int_label_map_pb2.py → ...ection/protos/string_int_label_map_pb2.py b/...ection/protos/string_int_label_map_pb2.py → ...ection/protos/string_int_label_map_pb2.py
diff --git a/src/object_detection/box_coders/__init__.py → ...or/src/object_detection/utils/__init__.py b/src/object_detection/box_coders/__init__.py → ...or/src/object_detection/utils/__init__.py
diff --git a/src/object_detection/utils/label_map_util.py → .../object_detection/utils/label_map_util.py b/src/object_detection/utils/label_map_util.py → .../object_detection/utils/label_map_util.py
diff --git a/...ct_detection/utils/visualization_utils.py → ...ct_detection/utils/visualization_utils.py b/...ct_detection/utils/visualization_utils.py → ...ct_detection/utils/visualization_utils.py