
Comments (4)

saching13 commented on July 29, 2024

Can you share your code?


anujchadha284 commented on July 29, 2024

#!/usr/bin/env python3
'''

Blob taken from the great PINTO zoo

git clone git@github.com:PINTO0309/PINTO_model_zoo.git
cd PINTO_model_zoo/026_mobile-deeplabv3-plus/01_float32/
./download.sh
source /opt/intel/openvino/bin/setupvars.sh
python3 /opt/intel/openvino/deployment_tools/model_optimizer/mo_tf.py --input_model deeplab_v3_plus_mnv2_decoder_256.pb --model_name deeplab_v3_plus_mnv2_decoder_256 --input_shape [1,256,256,3] --data_type FP16 --output_dir openvino/256x256/FP16 --mean_values [127.5,127.5,127.5] --scale_values [127.5,127.5,127.5]
/opt/intel/openvino/deployment_tools/inference_engine/lib/intel64/myriad_compile -ip U8 -VPU_NUMBER_OF_SHAVES 6 -VPU_NUMBER_OF_CMX_SLICES 6 -m openvino/256x256/FP16/deeplab_v3_plus_mnv2_decoder_256.xml -o deeplabv3p_person_6_shaves.blob
'''

import cv2
import depthai as dai
import numpy as np
import argparse
import time
from datetime import datetime, timedelta

# ROS imports
import rospy
from cv_bridge import CvBridge, CvBridgeError
from sensor_msgs.msg import Image

TARGET_SHAPE = (400,400)
class FPSHandler:
    def __init__(self, cap=None):
        self.timestamp = time.time()
        self.start = time.time()
        self.frame_cnt = 0
    def next_iter(self):
        self.timestamp = time.time()
        self.frame_cnt += 1
    def fps(self):
        return self.frame_cnt / (self.timestamp - self.start)

class HostSync:
    def __init__(self):
        self.arrays = {}
    def add_msg(self, name, msg):
        if name not in self.arrays:
            self.arrays[name] = []
        self.arrays[name].append(msg)
    def get_msgs(self, timestamp):
        ret = {}
        for name, arr in self.arrays.items():
            for i, msg in enumerate(arr):
                time_diff = abs(msg.getTimestamp() - timestamp)
                # RGB/depth frames arrive at 30 FPS (~33 ms apart), so a
                # time difference below 20 ms is treated as synced
                if time_diff < timedelta(milliseconds=20):
                    ret[name] = msg
                    self.arrays[name] = arr[i:]
                    break
        return ret

class stereoCam:
    def __init__(self):
        parser = argparse.ArgumentParser()
        preamble_string = "/home/anuj.chadha/workspace/stereo-ws/src/luxonis/depthai-ros-examples/depthai_examples/scripts/gen2-deeplabv3_depth/"
        parser.add_argument("-shape", "--nn_shape", help="select NN model shape", default=256, type=int)
        parser.add_argument("-nn", "--nn_path", help="select model path for inference", default='models/deeplab_v3_plus_mvn2_decoder_256_openvino_2021.2_6shave.blob', type=str)
        args = parser.parse_args()

        # Custom JET colormap with 0 mapped to `black` - better disparity visualization
        self.jet_custom = cv2.applyColorMap(np.arange(256, dtype=np.uint8), cv2.COLORMAP_JET)
        self.jet_custom[0] = [0, 0, 0]

        self.nn_shape = args.nn_shape
        nn_path = preamble_string + args.nn_path


        self.colorBackground = cv2.resize(self.crop_to_square(cv2.imread("/home/anuj.chadha/workspace/stereo-ws/src/luxonis/depthai-ros-examples/depthai_examples/scripts/gen2-deeplabv3_depth/background.jpeg")), (400,400))

        # Start defining a pipeline

        self.pipeline = dai.Pipeline()

        self.pipeline.setOpenVINOVersion(version=dai.OpenVINO.Version.VERSION_2021_2)

        cam = self.pipeline.createColorCamera()
        cam.setResolution(dai.ColorCameraProperties.SensorResolution.THE_1080_P)
        # Color cam: 1920x1080
        # Mono cam: 640x400
        cam.setIspScale(2,3) # To match 400P mono cameras
        cam.setBoardSocket(dai.CameraBoardSocket.RGB)
        cam.initialControl.setManualFocus(130)

        # For deeplabv3
        cam.setColorOrder(dai.ColorCameraProperties.ColorOrder.BGR)
        cam.setPreviewSize(self.nn_shape, self.nn_shape)
        cam.setInterleaved(False)

        # NN output linked to XLinkOut
        isp_xout = self.pipeline.createXLinkOut()
        isp_xout.setStreamName("cam")
        cam.isp.link(isp_xout.input)

        # Define a neural network that will make predictions based on the source frames
        detection_nn = self.pipeline.createNeuralNetwork()
        detection_nn.setBlobPath(nn_path)
        detection_nn.input.setBlocking(False)
        detection_nn.setNumInferenceThreads(2)
        cam.preview.link(detection_nn.input)

        # NN output linked to XLinkOut
        xout_nn = self.pipeline.createXLinkOut()
        xout_nn.setStreamName("nn")
        detection_nn.out.link(xout_nn.input)

        xout_passthrough = self.pipeline.createXLinkOut()
        xout_passthrough.setStreamName("pass")
        # Only send metadata; we are only interested in the timestamp, so we
        # can sync depth frames with the NN output
        xout_passthrough.setMetadataOnly(True)
        detection_nn.passthrough.link(xout_passthrough.input)

        # Left mono camera
        left = self.pipeline.createMonoCamera()
        left.setResolution(dai.MonoCameraProperties.SensorResolution.THE_400_P)
        left.setBoardSocket(dai.CameraBoardSocket.LEFT)
        # Right mono camera
        right = self.pipeline.createMonoCamera()
        right.setResolution(dai.MonoCameraProperties.SensorResolution.THE_400_P)
        right.setBoardSocket(dai.CameraBoardSocket.RIGHT)

        # Create a node that will produce the depth map (using disparity output as it's easier to visualize depth this way)
        self.stereo = self.pipeline.createStereoDepth()
        self.stereo.initialConfig.setConfidenceThreshold(245)
        self.stereo.initialConfig.setMedianFilter(dai.StereoDepthProperties.MedianFilter.KERNEL_7x7)
        # stereo.initialConfig.setBilateralFilterSigma(64000)
        self.stereo.setLeftRightCheck(True)
        self.stereo.setDepthAlign(dai.CameraBoardSocket.RGB)
        left.out.link(self.stereo.left)
        right.out.link(self.stereo.right)

        # Create depth output
        xout_disp = self.pipeline.createXLinkOut()
        xout_disp.setStreamName("disparity")
        self.stereo.disparity.link(xout_disp.input)

        self.image_pub = rospy.Publisher("image_topic_2",Image, queue_size=10)

        self.bridge = CvBridge()

        self.image_message = None

    def webcam_pub(self):
        print("-------- Pipeline Setup! -------- ")
        with dai.Device(self.pipeline.getOpenVINOVersion()) as device:
            print("-------- Camera Started --------")
            cams = device.getConnectedCameras()
            depth_enabled = dai.CameraBoardSocket.LEFT in cams and dai.CameraBoardSocket.RIGHT in cams
            if not depth_enabled:
                raise RuntimeError("Unable to run this experiment on device without depth capabilities! (Available cameras: {})".format(cams))
            device.startPipeline(self.pipeline)
            # Output queues will be used to get the outputs from the device
            q_color = device.getOutputQueue(name="cam", maxSize=4, blocking=False)
            q_disp = device.getOutputQueue(name="disparity", maxSize=4, blocking=False)
            q_nn = device.getOutputQueue(name="nn", maxSize=4, blocking=False)
            q_pass = device.getOutputQueue(name="pass", maxSize=4, blocking=False)

            fps = FPSHandler()
            sync = HostSync()
            disp_frame = None
            disp_multiplier = 255 / self.stereo.getMaxDisparity()

            frame = None
            frame_back = None
            depth = None
            depth_weighted = None
            frames = {}
            while not rospy.is_shutdown():
                sync.add_msg("color", q_color.get())

                in_depth = q_disp.tryGet()
                if in_depth is not None:
                    sync.add_msg("depth", in_depth)

                in_nn = q_nn.tryGet()
                if in_nn is not None:
                    fps.next_iter()
                    # Get NN output timestamp from the passthrough
                    timestamp = q_pass.get().getTimestamp()
                    msgs = sync.get_msgs(timestamp)

                    # get layer1 data
                    layer1 = in_nn.getFirstLayerInt32()
                    # reshape to numpy array
                    lay1 = np.asarray(layer1, dtype=np.int32).reshape((self.nn_shape, self.nn_shape))
                    output_colors = self.decode_deeplabv3p(lay1)

                    # To match depth frames
                    output_colors = cv2.resize(output_colors, TARGET_SHAPE)

                    if "color" in msgs:
                        frame = msgs["color"].getCvFrame()
                        frame = self.crop_to_square(frame)
                        frame = cv2.resize(frame, TARGET_SHAPE)
                        frames['frame'] = frame
                        frame = cv2.addWeighted(frame, 1, output_colors,0.5,0)
                        cv2.putText(frame, "Fps: {:.2f}".format(fps.fps()), (2, frame.shape[0] - 4), cv2.FONT_HERSHEY_TRIPLEX, 0.4, color=(255, 255, 255))
                        frames['colored_frame'] = frame

                    if "depth" in msgs:
                        disp_frame = msgs["depth"].getFrame()
                        disp_frame = (disp_frame * disp_multiplier).astype(np.uint8)
                        disp_frame = self.crop_to_square(disp_frame)
                        disp_frame = cv2.resize(disp_frame, TARGET_SHAPE)

                        # Colorize the disparity
                        frames['depth'] = cv2.applyColorMap(disp_frame, self.jet_custom)

                        multiplier = self.get_multiplier(lay1)
                        multiplier = cv2.resize(multiplier, TARGET_SHAPE)
                        depth_overlay = disp_frame * multiplier
                        frames['cutout'] = cv2.applyColorMap(depth_overlay, self.jet_custom)

                        if 'frame' in frames:
                            # shape (400,400) multipliers -> shape (400,400,3)
                            multiplier = np.repeat(multiplier[:, :, np.newaxis], 3, axis=2)
                            rgb_cutout = frames['frame'] * multiplier
                            multiplier[multiplier == 0] = 255
                            multiplier[multiplier == 1] = 0
                            multiplier[multiplier == 255] = 1
                            frames['background'] = self.colorBackground * multiplier
                            frames['background'] += rgb_cutout
                        # You can add custom code here, for example depth averaging
                if len(frames) == 5:
                    row1 = np.concatenate((frames['colored_frame'], frames['background']), axis=1)
                    row2 = np.concatenate((frames['depth'], frames['cutout']), axis=1)
                    # print(row1)
                    cv2.imshow("Combined frame", np.concatenate((row1,row2), axis=0))
                    # cv2.imshow(np.concatenate((frames['colored_frame'], frames['background']), axis=1))
                    self.image_message = self.bridge.cv2_to_imgmsg(frames['depth'], encoding="passthrough")
                    self.image_pub.publish(self.image_message)
                if cv2.waitKey(1) == ord('q'):
                    break

    def decode_deeplabv3p(self, output_tensor):
        class_colors = [[0,0,0],  [0,255,0]]
        class_colors = np.asarray(class_colors, dtype=np.uint8)

        output = output_tensor.reshape(self.nn_shape,self.nn_shape)
        output_colors = np.take(class_colors, output, axis=0)
        return output_colors

    def get_multiplier(self, output_tensor):
        class_binary = [[0], [1]]
        class_binary = np.asarray(class_binary, dtype=np.uint8)
        output = output_tensor.reshape(self.nn_shape,self.nn_shape)
        output_colors = np.take(class_binary, output, axis=0)
        return output_colors

    def crop_to_square(self, frame):
        height = frame.shape[0]
        width  = frame.shape[1]
        delta = int((width-height) / 2)
        # print(height, width, delta)
        # print(frame[0:height, delta:width-delta])
        return frame[0:height, delta:width-delta]

if __name__ == '__main__':
    rospy.init_node('stereoimage', anonymous=True)
    try:
        stereocam = stereoCam()
        stereocam.webcam_pub()
    except rospy.ROSInterruptException:
        pass
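
As a quick sanity check that the node is actually publishing (the image_topic_2 topic name comes from the script above), you can run the following with a roscore and the node running:

rostopic hz /image_topic_2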


saching13 commented on July 29, 2024

Thanks. Can you check the depthai version, and if it is < 2.11.1.0, update it and give it another shot?
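
For reference, one quick way to print the installed version (assuming the depthai Python package is the one the script imports) is:

python3 -c "import depthai; print(depthai.__version__)"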


Serafadam commented on July 29, 2024

Closing due to inactivity. If you think this should remain open, please tag me in a comment here.
