oak-d-w-97: align RGB with the depth frame using alpha=1 (alpha scaling)
#!/usr/bin/env python3

import cv2
import numpy as np
import depthai as dai
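
# Note: StereoDepth.setAlphaScaling (used below) is a relatively recent depthai
# API; if the call fails, upgrading the depthai package should resolve it.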

# Weights used when blending the depth/rgb images (should sum to 1.0)
rgbWeight = 0.4
depthWeight = 0.6

def updateBlendWeights(percent_rgb):
    """
    Update the rgb and depth weights used to blend the depth/rgb image.

    @param[in] percent_rgb The rgb weight expressed as a percentage (0..100)
    """
    global depthWeight
    global rgbWeight
    rgbWeight = float(percent_rgb) / 100.0
    depthWeight = 1.0 - rgbWeight
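
# OpenCV invokes updateBlendWeights() with the slider position (0..100) whenever
# the 'RGB Weight %' trackbar created below is moved.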

# Optional. If set (True), the ColorCamera output is downscaled with a 2/3 ISP
# scale. Left False here, so the RGB stream stays at 720p and the aligned depth
# is upscaled to match it.
downscaleColor = False
fps = 30
# The disparity is computed at the mono resolution, then upscaled to the RGB resolution
monoResolution = dai.MonoCameraProperties.SensorResolution.THE_720_P

# Create pipeline
pipeline = dai.Pipeline()
device = dai.Device()
queueNames = []

# Define sources and outputs
camRgb = pipeline.create(dai.node.ColorCamera)
left = pipeline.create(dai.node.MonoCamera)
right = pipeline.create(dai.node.MonoCamera)
stereo = pipeline.create(dai.node.StereoDepth)

rgbOut = pipeline.create(dai.node.XLinkOut)
disparityOut = pipeline.create(dai.node.XLinkOut)

rgbOut.setStreamName("rgb")
queueNames.append("rgb")
disparityOut.setStreamName("disp")
queueNames.append("disp")

# Properties
rgbCamSocket = dai.CameraBoardSocket.CAM_A

camRgb.setBoardSocket(rgbCamSocket)
camRgb.setResolution(dai.ColorCameraProperties.SensorResolution.THE_720_P)
camRgb.setFps(fps)
if downscaleColor:
    camRgb.setIspScale(2, 3)

# For now, RGB needs fixed focus to properly align with depth.
# This value was used during calibration
calibData = device.readCalibration2()
lensPosition = calibData.getLensPosition(rgbCamSocket)
if lensPosition:
    camRgb.initialControl.setManualFocus(lensPosition)

left.setResolution(monoResolution)
left.setCamera("left")
left.setFps(fps)
right.setResolution(monoResolution)
right.setCamera("right")
right.setFps(fps)

stereo.setDefaultProfilePreset(dai.node.StereoDepth.PresetMode.HIGH_DENSITY)
# LR-check is required for depth alignment
stereo.setLeftRightCheck(True)
stereo.setDepthAlign(rgbCamSocket)
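# Depth alignment makes the device warp the disparity map into the RGB camera's
# viewpoint and resolution, so each disparity pixel lines up with an RGB pixel.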

# Linking
camRgb.isp.link(rgbOut.input)
left.out.link(stereo.left)
right.out.link(stereo.right)
stereo.disparity.link(disparityOut.input)

alpha = 1
stereo.setAlphaScaling(alpha)
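# Same semantics as OpenCV's free scaling parameter: alpha=0 crops the aligned
# output to valid pixels only, while alpha=1 keeps all source pixels, leaving
# black borders but preserving the full field of view.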

rgb_w = camRgb.getResolutionWidth()
rgb_h = camRgb.getResolutionHeight()
rgbIntrinsics = np.array(calibData.getCameraIntrinsics(rgbCamSocket, rgb_w, rgb_h))
rgb_d = np.array(calibData.getDistortionCoefficients(rgbCamSocket))
rgb_new_cam_matrix, _ = cv2.getOptimalNewCameraMatrix(rgbIntrinsics, rgb_d, (rgb_w, rgb_h), alpha)
map_x, map_y = cv2.initUndistortRectifyMap(rgbIntrinsics, rgb_d, None, rgb_new_cam_matrix, (rgb_w, rgb_h), cv2.CV_32FC1)
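# The depth stream is aligned on-device with this same alpha, so remapping the
# RGB frames with map_x/map_y (in the loop below) should make the two streams
# overlap pixel-for-pixel.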

# Connect to device and start pipeline
with device:
    device.startPipeline(pipeline)

    frameRgb = None
    frameDisp = None

    # Configure windows; trackbar adjusts blending ratio of rgb/depth
    rgbWindowName = "rgb"
    depthWindowName = "depth"
    blendedWindowName = "rgb-depth"
    cv2.namedWindow(rgbWindowName)
    cv2.namedWindow(depthWindowName)
    cv2.namedWindow(blendedWindowName)
    cv2.createTrackbar('RGB Weight %', blendedWindowName, int(rgbWeight * 100), 100, updateBlendWeights)

    while True:
        latestPacket = {}
        latestPacket["rgb"] = None
        latestPacket["disp"] = None
        queueEvents = device.getQueueEvents(("rgb", "disp"))
        for queueName in queueEvents:
            packets = device.getOutputQueue(queueName).tryGetAll()
            if len(packets) > 0:
                latestPacket[queueName] = packets[-1]
if latestPacket["rgb"] is not None: | |
frameRgb = latestPacket["rgb"].getCvFrame() | |
frameRgb = cv2.remap(frameRgb, map_x, map_y, cv2.INTER_LINEAR) | |
cv2.imshow(rgbWindowName, frameRgb) | |
if latestPacket["disp"] is not None: | |
frameDisp = latestPacket["disp"].getFrame() | |
maxDisparity = stereo.initialConfig.getMaxDisparity() | |
# Optional, extend range 0..95 -> 0..255, for a better visualisation | |
if 1: frameDisp = (frameDisp * 255. / maxDisparity).astype(np.uint8) | |
# Optional, apply false colorization | |
if 1: frameDisp = cv2.applyColorMap(frameDisp, cv2.COLORMAP_HOT) | |
frameDisp = np.ascontiguousarray(frameDisp) | |
cv2.imshow(depthWindowName, frameDisp) | |

        # Blend when both received
        if frameRgb is not None and frameDisp is not None:
            # Need to have both frames in BGR format before blending
            if len(frameDisp.shape) < 3:
                frameDisp = cv2.cvtColor(frameDisp, cv2.COLOR_GRAY2BGR)
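            # Weighted sum: blended = rgbWeight*frameRgb + depthWeight*frameDisp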
            blended = cv2.addWeighted(frameRgb, rgbWeight, frameDisp, depthWeight, 0)
            cv2.imshow(blendedWindowName, blended)
            frameRgb = None
            frameDisp = None

        if cv2.waitKey(1) == ord('q'):
            break