improve default and readme

Signed-off-by: Owen-Liuyuxuan <[email protected]>
Owen-Liuyuxuan · Nov 6, 2023 · f90eaba · f90eaba
1 parent 39da711
commit f90eaba
Show file tree

Hide file tree

Showing 3 changed files with 73 additions and 18 deletions.
diff --git a/docs/ros2_vision_inference.gif b/docs/ros2_vision_inference.gif
diff --git a/readme.md b/readme.md
@@ -0,0 +1,68 @@
+# ROS2 Vision Inference
+
+This repo contains a unified inference multi-threading nodes for monocular 3D object detection, depth prediction and semantic segmentation.
+
+![RVIZ Example](docs/ros2_vision_inference.gif)
+
+You could checkout the ROS1 version of each inference package:
+
+- [Monodepth ROS1](https://github.com/Owen-Liuyuxuan/monodepth_ros)
+- [Mono3D ROS1](https://github.com/Owen-Liuyuxuan/visualDet3D_ros)
+
+In this repo, we fully re-structure the code and messages formats for ROS2 (humble), and integrate multi-thread inferencing for three vision tasks.
+
+- Currently all pretrained models are trained using the [visionfactory](https://github.com/Owen-Liuyuxuan/visionfactory) repo. Thus focusing on out-door autonomous driving scenarios. But it is ok to plugin ONNX models that satisfiy the [interface](#onnx-model-interface).
+
+
+## Getting Started
+
+This repo relies on [ROS2](https://docs.ros.org/en/humble/Installation.html) and onnxruntime:
+
+```bash
+pip3 install onnxruntime-gpu
+```
+
+For Orin, find the pip wheel in https://elinux.org/Jetson_Zoo with version number > 1.3 is ok
+
+Under the workspace directory, find the [launch file](./launch/detect_seg_depth.launch.xml) and change topic names and onnx checkpoint paths then build the workspace (you can choose to either launch any of the three tasks in the launch file)
+
+```bash
+colcon build --synlink-install
+source install/setup.bash
+ros2 launch ros2_vision_inference detect_seg_depth.launch.xml
+```
+
+Notice that as a known issue from [ros2 python package](https://github.com/ros2/launch/issues/187). The launch/rviz files are copied but not symlinked when we run "colcon build",
+so **whenever we modify the launch file, we need to rebuild the package**; whenever we want to modify the rviz file, we need to save it explicitly in the src folder.
+
+```bash
+colcon build --symlink-install --packages-select=ros2_vision_inference # rebuilding only ros2_vision_inference
+```
+
+## Interface
+
+### Subscribed Topics
+
+/image_raw ([sensor_msgs/Image](https://docs.ros2.org/latest/api/sensor_msgs/msg/Image.html))
+
+/camera_info ([sensor_msgs/CameraInfo](https://docs.ros2.org/latest/api/sensor_msgs/msg/CameraInfo.html))
+
+### Publishing Topics
+
+/depth_image ([sensor_msgs/Image](https://docs.ros2.org/latest/api/sensor_msgs/msg/Image.html)): Depth image of float type.
+
+/seg_image ([sensor_msgs/Image](https://docs.ros2.org/latest/api/sensor_msgs/msg/Image.html)): RGB-colorized segmentation images.
+
+/mono3d/bbox ([visualization_msgs/MarkerArray](https://docs.ros2.org/foxy/api/visualization_msgs/msg/MarkerArray.html)): 3D bounding boxes outputs.
+
+/point_cloud ([sensor_msgs/PointCloud2](https://docs.ros2.org/latest/api/sensor_msgs/msg/PointCloud2.html)): projecting /seg_image with /depth_image into a point cloud.
+
+## ONNX Model Interface
+
+MonoDepth ONNX: `def forward(self, normalized_images[1, 3, H, W], P[1, 3, 4]):->float[1, 1, H, W]`
+
+Segmentation ONNX `def forward(self, normalized_images[1, 3, H, W]):->long[1, H, W]`
+
+Mono3D ONNX: `def forward(self, normalized_images[1, 3, H, W], P[1, 3, 4]):->scores[N], bboxes[N,12], cls_indexes[N]`
+
+Classes definitions are from the [visionfactory](https://github.com/Owen-Liuyuxuan/visionfactory) repo.
diff --git a/ros2_vision_inference/ros2_vision_inference.py b/ros2_vision_inference/ros2_vision_inference.py
@@ -1,12 +1,10 @@
-import os
+import onnxruntime as ort
 import numpy as np
 import rclpy
 import cv2
-import torch
 from .utils.ros_util import ROSInterface
 from sensor_msgs.msg import CameraInfo, Image, PointCloud2
-from visualization_msgs.msg import Marker, MarkerArray
-from std_msgs.msg import String, Int32, Bool, Float32
+from visualization_msgs.msg import MarkerArray
 import threading
 from numba import jit
 from .seg_labels import PALETTE
@@ -52,7 +50,6 @@ def __init__(self, *args, **kwargs):
  self.build_model(*args, **kwargs)
 
  def build_model(self, onnx_path):
- import onnxruntime as ort
  self.ort_session = ort.InferenceSession(onnx_path, providers=['CUDAExecutionProvider'])
  input_shape = self.ort_session.get_inputs()[0].shape # [1, 3, h, w]
  self.inference_h = input_shape[2]
@@ -61,16 +58,6 @@ def build_model(self, onnx_path):
  def set_inputs(self, image, P=None):
  self.image = image
  self.P = P
-
- def collate_fn(self, batch):
- collated_data = {}
- for key in batch[0]:
- if isinstance(batch[0][key], torch.Tensor):
- collated_data[key] = torch.stack([item[key] for item in batch], dim=0)
- elif isinstance(batch[0][key], np.ndarray):
- collated_data[key] = torch.stack([torch.from_numpy(item[key]) for item in batch], dim=0)
-
- return collated_data
 
  def resize(self, image, P=None):
  self.h0, self.w0 = image.shape[0:2]
@@ -173,15 +160,15 @@ def _read_params(self):
 
  if self.mono3d_flag:
  self.mono3d_weight_path = self.ros_interface.read_one_parameters("MONO3D_CKPT_FILE",
- "/home/yliuhb/vision_factory/weights/mono3d.pth")
+ "/home/yliuhb/vision_factory/weights/mono3d.onnx")
 
  if self.seg_flag:
  self.seg_weight_path = self.ros_interface.read_one_parameters("SEG_CKPT_FILE",
- "/home/yliuhb/vision_factory/weights/seg.pth")
+ "/home/yliuhb/vision_factory/weights/seg.onnx")
 
  if self.monodepth_flag:
  self.monodepth_weight_path = self.ros_interface.read_one_parameters("MONODEPTH_CKPT_FILE",
- "/home/yliuhb/vision_factory/weights/monodepth.pth")
+ "/home/yliuhb/vision_factory/weights/monodepth.onnx")
 
  self.gpu_index = int(self.ros_interface.read_one_parameters("GPU", 0))
  self.seg_opacity = float(self.ros_interface.read_one_parameters("opacity", 0.9))