-
Notifications
You must be signed in to change notification settings - Fork 0
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Mp Hands nodes & segmentation msg creation #2
Changes from 15 commits
38be7e8
c7a566f
e7dc367
eac159c
65c8b75
869b607
3434ca3
d796a21
26a53e4
5437ca8
9a486bc
c084392
b1a5ce0
d7171e8
df7a38b
8d6f6b6
3e90e4b
bf463a2
26381fa
2deaeee
293ce23
45131f7
827d5c8
25ce9cc
47b8dd7
847165f
e2d0534
f8a48f1
14a9e4c
7d9f6d4
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1 +1,2 @@ | ||
from .img_detections import ImgDetectionsWithKeypoints | ||
from .img_detections import ImgDetectionsWithKeypoints | ||
from .hand_keypoints import HandKeypoints |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,21 @@ | ||
import depthai as dai | ||
from typing import List | ||
|
||
class HandKeypoints(dai.Buffer):
    """Message carrying MediaPipe hand-landmark results.

    Holds the hand-presence confidence, the handedness score, and a list
    of 3D keypoints (dai.Point3f). The ``handdedness`` attribute name is
    kept with its original spelling for backward compatibility.
    """

    def __init__(self):
        """Initialize an empty message with zeroed scores and no keypoints."""
        dai.Buffer.__init__(self)
        self.confidence: float = 0.0   # hand-presence confidence score
        self.handdedness: float = 0.0  # left/right-hand score (spelling kept for API compatibility)
        self._keypoints: List[dai.Point3f] = []

    @property
    def keypoints(self) -> List[dai.Point3f]:
        """Return the stored list of 3D keypoints."""
        return self._keypoints

    @keypoints.setter
    def keypoints(self, value: List[dai.Point3f]):
        """Validate and store the keypoints list.

        Raises:
            TypeError: If ``value`` is not a list, or any element is not a
                ``dai.Point3f``.
        """
        if not isinstance(value, list):
            raise TypeError("keypoints must be a list.")
        for item in value:
            if not isinstance(item, dai.Point3f):
                raise TypeError("All items in keypoints must be of type dai.Point3f.")
        # BUG FIX: the original setter validated the value but never stored it,
        # so assignments to .keypoints were silently dropped.
        self._keypoints = value
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,89 @@ | ||
import depthai as dai | ||
import numpy as np | ||
import cv2 | ||
|
||
from .utils.medipipe import generate_handtracker_anchors, decode_bboxes, rect_transformation, detections_to_rect | ||
|
||
class MPHandDetectionParser(dai.node.ThreadedHostNode):
    """Host node that decodes MediaPipe hand detection model output.

    Dequantizes the raw NN tensors, decodes anchor-based bounding boxes,
    applies non-maximum suppression, and emits ``dai.ImgDetections``.
    """

    def __init__(
        self,
        score_threshold=0.5,
        nms_threshold=0.5,
        top_k=100
    ):
        """
        Args:
            score_threshold: Minimum confidence for a detection to be kept.
            nms_threshold: IoU threshold used by non-maximum suppression.
            top_k: Maximum number of detections kept after NMS.
        """
        dai.node.ThreadedHostNode.__init__(self)
        self.input = dai.Node.Input(self)
        self.out = dai.Node.Output(self)

        self.score_threshold = score_threshold
        self.nms_threshold = nms_threshold
        self.top_k = top_k

    def setConfidenceThreshold(self, threshold):
        """Set the minimum confidence for detections."""
        self.score_threshold = threshold

    def setNMSThreshold(self, threshold):
        """Set the IoU threshold for non-maximum suppression."""
        self.nms_threshold = threshold

    def setTopK(self, top_k):
        """Set the maximum number of detections kept after NMS."""
        self.top_k = top_k

    def run(self):
        """
        Postprocessing logic for MediaPipe Hand detection model.

        Returns:
            dai.ImgDetections containing bounding boxes, labels, and confidence scores of detected hands.
        """
        while self.isRunning():
            try:
                output: dai.NNData = self.input.get()
            except dai.MessageQueue.QueueException:
                break  # Pipeline was stopped

            # Dequantize the raw model outputs: (value - zero_point) * scale.
            tensorInfo = output.getTensorInfo("Identity")
            bboxes = output.getTensor("Identity").reshape(2016, 18).astype(np.float32)
            bboxes = (bboxes - tensorInfo.qpZp) * tensorInfo.qpScale
            tensorInfo = output.getTensorInfo("Identity_1")
            scores = output.getTensor("Identity_1").reshape(2016).astype(np.float32)
            scores = (scores - tensorInfo.qpZp) * tensorInfo.qpScale

            # 192x192 is the hand detector's input resolution (2016 anchors).
            anchors = generate_handtracker_anchors(192, 192)
            # BUG FIX: pass the configured score threshold instead of a
            # hard-coded 0.5, so setConfidenceThreshold() actually takes effect.
            decoded_bboxes = decode_bboxes(self.score_threshold, scores, bboxes, anchors, scale=192)
            detections_to_rect(decoded_bboxes)
            rect_transformation(decoded_bboxes, 192, 192)

            bboxes = []
            scores = []
            for hand in decoded_bboxes:
                # rect_points are the 4 corners of the (rotated) hand rectangle;
                # collapse them into an axis-aligned box for NMS.
                extended_points = hand.rect_points
                xmin = int(min(extended_points[0][0], extended_points[1][0]))
                ymin = int(min(extended_points[0][1], extended_points[1][1]))
                xmax = int(max(extended_points[2][0], extended_points[3][0]))
                ymax = int(max(extended_points[2][1], extended_points[3][1]))

                bboxes.append([xmin, ymin, xmax, ymax])
                scores.append(hand.pd_score)

            indices = cv2.dnn.NMSBoxes(bboxes, scores, self.score_threshold, self.nms_threshold, top_k=self.top_k)
            bboxes = np.array(bboxes)[indices]
            scores = np.array(scores)[indices]

            detections = []
            for bbox, score in zip(bboxes, scores):
                detection = dai.ImgDetection()
                detection.confidence = score
                detection.label = 0  # single-class model: every detection is a hand
                detection.xmin = bbox[0]
                detection.ymin = bbox[1]
                detection.xmax = bbox[2]
                detection.ymax = bbox[3]
                detections.append(detection)

            detections_msg = dai.ImgDetections()
            detections_msg.detections = detections

            self.out.send(detections_msg)
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,68 @@ | ||
import depthai as dai | ||
import numpy as np | ||
import cv2 | ||
|
||
from ..messages import HandKeypoints | ||
|
||
class MPHandLandmarkParser(dai.node.ThreadedHostNode):
    """Host node that decodes MediaPipe hand landmark model output.

    Dequantizes the landmark, score, and handedness tensors, normalizes the
    21 landmarks by the model input size, and emits a ``HandKeypoints``
    message.
    """

    def __init__(
        self,
        score_threshold=0.5,
        scale_factor=224
    ):
        """
        Args:
            score_threshold: Minimum hand-presence score required to emit
                landmarks (below it, an empty keypoints list is sent).
            scale_factor: Model input size used to normalize landmark
                coordinates (default 224 for the landmark model).
        """
        dai.node.ThreadedHostNode.__init__(self)
        self.input = dai.Node.Input(self)
        self.out = dai.Node.Output(self)

        self.score_threshold = score_threshold
        self.scale_factor = scale_factor

    def setScoreThreshold(self, threshold):
        """Set the minimum hand-presence score for emitting landmarks."""
        self.score_threshold = threshold

    def setScaleFactor(self, scale_factor):
        """Set the model input size used to normalize landmark coordinates."""
        self.scale_factor = scale_factor

    def run(self):
        """
        Postprocessing logic for MediaPipe Hand landmark model.

        Returns:
            HandKeypoints containing normalized 21 landmarks, confidence score, and handedness score (right or left hand).
        """
        while self.isRunning():
            try:
                output: dai.NNData = self.input.get()
            except dai.MessageQueue.QueueException:
                break  # Pipeline was stopped

            # Dequantize the raw model outputs: (value - zero_point) * scale.
            tensorInfo = output.getTensorInfo("Identity")
            landmarks = output.getTensor("Identity").reshape(21, 3).astype(np.float32)
            landmarks = (landmarks - tensorInfo.qpZp) * tensorInfo.qpScale
            tensorInfo = output.getTensorInfo("Identity_1")
            hand_score = output.getTensor("Identity_1").reshape(-1).astype(np.float32)
            hand_score = (hand_score - tensorInfo.qpZp) * tensorInfo.qpScale
            hand_score = hand_score[0]
            tensorInfo = output.getTensorInfo("Identity_2")
            handdedness = output.getTensor("Identity_2").reshape(-1).astype(np.float32)
            handdedness = (handdedness - tensorInfo.qpZp) * tensorInfo.qpScale
            handdedness = handdedness[0]

            # Normalize landmarks to [0, 1] relative to the model input size.
            landmarks /= self.scale_factor

            hand_landmarks_msg = HandKeypoints()
            hand_landmarks_msg.handdedness = handdedness
            hand_landmarks_msg.confidence = hand_score
            hand_landmarks = []
            if hand_score >= self.score_threshold:
                for i in range(21):
                    pt = dai.Point3f()
                    pt.x = landmarks[i][0]
                    pt.y = landmarks[i][1]
                    pt.z = landmarks[i][2]
                    hand_landmarks.append(pt)
            # BUG FIX: the original assigned `hand_landmarks_msg.landmarks`,
            # but HandKeypoints exposes a `keypoints` property — the keypoints
            # were never stored on the message (and validation was bypassed).
            hand_landmarks_msg.keypoints = hand_landmarks
            self.out.send(hand_landmarks_msg)
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,41 @@ | ||
import depthai as dai | ||
import numpy as np | ||
import cv2 | ||
from .utils.message_creation import create_segmentation_message | ||
|
||
class MPSeflieSegParser(dai.node.ThreadedHostNode):
    """Host node that decodes MediaPipe Selfie Segmentation model output.

    Thresholds the model's confidence map into a binary person/background
    mask and emits it as a segmentation ImgFrame message.

    NOTE(review): the class name misspells "Selfie" ("Seflie"); it is kept
    unchanged here because renaming would break existing callers.
    """

    def __init__(
        self,
        threshold=0.5,
    ):
        """
        Args:
            threshold: Confidence above which a pixel is labeled as person.
        """
        dai.node.ThreadedHostNode.__init__(self)
        self.input = dai.Node.Input(self)
        self.out = dai.Node.Output(self)

        self.threshold = threshold

    def setConfidenceThreshold(self, threshold):
        """Set the per-pixel confidence threshold for the person class."""
        self.threshold = threshold

    def run(self):
        """
        Postprocessing logic for MediaPipe Selfie Segmentation model.

        Returns:
            Segmentation mask with two classes: 1 - person, 0 - background.
        """
        while self.isRunning():
            try:
                output: dai.NNData = self.input.get()
            except dai.MessageQueue.QueueException:
                break  # Pipeline was stopped

            # Binarize the confidence map: True where the pixel is person.
            segmentation_mask = output.getTensor("output")
            segmentation_mask = segmentation_mask[0].squeeze() > self.threshold
            # Single-channel uint8 mask: 1 = person, 0 = background.
            overlay_image = np.zeros((segmentation_mask.shape[0], segmentation_mask.shape[1], 1), dtype=np.uint8)
            overlay_image[segmentation_mask] = 1

            imgFrame = create_segmentation_message(overlay_image)
            self.out.send(imgFrame)
|
This file was deleted.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Shouldn't this be in a create function?
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Function added here.