2 долоо хоног өмнө · 8de31378a0
--- a/brain/PlannerNode2/Skill/person_approach_skill/config/person_approach.yaml
+++ b/brain/PlannerNode2/Skill/person_approach_skill/config/person_approach.yaml
@@ -0,0 +1,38 @@
 
				+person_approach_node:
			
 
				+  ros__parameters:
			
 
				+    # RTSP 地址
			
 
				+    rtsp_url: "rtsp://admin:hhzx2025@192.168.0.36:554/Streaming/Channels/201"
			
 
				+
			
 
				+    # HBM 模型
			
 
				+    model_path: "/opt/hobot/model/s100/basic/yolov5x_672x672_nv12.hbm"
			
 
				+
			
 
				+    # COCO 标签
			
 
				+    label_file: "/app/res/labels/coco_classes.names"
			
 
				+
			
 
				+    # pydev_demo 的 utils 路径
			
 
				+    # 因为 preprocess_utils/postprocess_utils/common_utils 还在 /app/pydev_demo/utils
			
 
				+    pydev_demo_path: "/app/pydev_demo"
			
 
				+
			
 
				+    # BPU 调度
			
 
				+    priority: 0
			
 
				+    bpu_cores: [0]
			
 
				+
			
 
				+    # YOLO 后处理
			
 
				+    score_thres: 0.25
			
 
				+    nms_thres: 0.45
			
 
				+
			
 
				+    # 人物靠近判断
			
 
				+    person_score_thres: 0.45
			
 
				+    area_ratio_thres: 0.15
			
 
				+    center_offset_thres: 0.25
			
 
				+    stable_frames: 5
			
 
				+    cooldown_sec: 8.0
			
 
				+
			
 
				+    # 循环间隔
			
 
				+    loop_sleep_sec: 0.01
			
 
				+
			
 
				+    # 调试日志
			
 
				+    debug: true
			
 
				+
			
 
				+    # 事件 Topic
			
 
				+    event_topic: "/skill/person_approach/event"
			
--- a/brain/PlannerNode2/Skill/person_approach_skill/launch/person_approach_node.launch.py
+++ b/brain/PlannerNode2/Skill/person_approach_skill/launch/person_approach_node.launch.py
@@ -0,0 +1,25 @@
 
				+#!/usr/bin/env python3
			
 
				+# -*- coding: utf-8 -*-
			
 
				+
			
 
				+import os
			
 
				+
			
 
				+from launch import LaunchDescription
			
 
				+from launch_ros.actions import Node
			
 
				+from ament_index_python.packages import get_package_share_directory
			
 
				+
			
 
				+
			
 
				+def generate_launch_description():
			
 
				+    pkg_share = get_package_share_directory("person_approach_skill")
			
 
				+    config_file = os.path.join(pkg_share, "config", "person_approach.yaml")
			
 
				+
			
 
				+    person_approach_node = Node(
			
 
				+        package="person_approach_skill",
			
 
				+        executable="person_approach_node",
			
 
				+        name="person_approach_node",
			
 
				+        output="screen",
			
 
				+        parameters=[config_file],
			
 
				+    )
			
 
				+
			
 
				+    return LaunchDescription([
			
 
				+        person_approach_node,
			
 
				+    ])
			
--- a/brain/PlannerNode2/Skill/person_approach_skill/package.xml
+++ b/brain/PlannerNode2/Skill/person_approach_skill/package.xml
@@ -0,0 +1,25 @@
 
				+<?xml version="1.0"?>
			
 
				+<package format="3">
			
 
				+  <name>person_approach_skill</name>
			
 
				+  <version>0.0.0</version>
			
 
				+  <description>Greeting vision skill for AI Agent</description>
			
 
				+  <maintainer email="sunrise@example.com">sunrise</maintainer>
			
 
				+  <license>Apache-2.0</license>
			
 
				+
			
 
				+  <buildtool_depend>ament_python</buildtool_depend>
			
 
				+
			
 
				+  <depend>rclpy</depend>
			
 
				+  <depend>std_msgs</depend>
			
 
				+
			
 
				+  <exec_depend>launch</exec_depend>
			
 
				+  <exec_depend>launch_ros</exec_depend>
			
 
				+
			
 
				+  <test_depend>ament_copyright</test_depend>
			
 
				+  <test_depend>ament_flake8</test_depend>
			
 
				+  <test_depend>ament_pep257</test_depend>
			
 
				+  <test_depend>python3-pytest</test_depend>
			
 
				+
			
 
				+  <export>
			
 
				+    <build_type>ament_python</build_type>
			
 
				+  </export>
			
 
				+</package>
			
--- a/brain/PlannerNode2/Skill/person_approach_skill/person_approach_skill/__init__.py
+++ b/brain/PlannerNode2/Skill/person_approach_skill/person_approach_skill/__init__.py
--- a/brain/PlannerNode2/Skill/person_approach_skill/person_approach_skill/person_approach_node.py
+++ b/brain/PlannerNode2/Skill/person_approach_skill/person_approach_skill/person_approach_node.py
@@ -0,0 +1,777 @@
 
				+#!/usr/bin/env python3
			
 
				+# -*- coding: utf-8 -*-
			
 
				+
			
 
				+import os
			
 
				+
			
 
				+# 必须放在 import cv2 前，强制 RTSP 使用 TCP
			
 
				+os.environ["OPENCV_FFMPEG_CAPTURE_OPTIONS"] = "rtsp_transport;tcp"
			
 
				+
			
 
				+import cv2
			
 
				+import sys
			
 
				+import json
			
 
				+import time
			
 
				+import signal
			
 
				+import numpy as np
			
 
				+import hbm_runtime
			
 
				+import rclpy
			
 
				+
			
 
				+from rclpy.node import Node
			
 
				+from std_msgs.msg import String
			
 
				+from typing import Optional, Dict, Tuple
			
 
				+from hobot_vio import libsrcampy as srcampy
			
 
				+
			
 
				+
			
 
				+STRIDES = np.array([8, 16, 32], dtype=np.int32)
			
 
				+
			
 
				+ANCHORS = np.array([
			
 
				+    [10, 13], [16, 30], [33, 23],
			
 
				+    [30, 61], [62, 45], [59, 119],
			
 
				+    [116, 90], [156, 198], [373, 326]
			
 
				+], dtype=np.float32).reshape(3, 3, 2)
			
 
				+
			
 
				+
			
 
				+def ret_ok(ret):
			
 
				+    if isinstance(ret, (list, tuple)):
			
 
				+        return len(ret) > 0 and ret[0] == 0
			
 
				+    return ret == 0
			
 
				+
			
 
				+
			
 
				+def get_nalu_pos(byte_stream: bytes):
			
 
				+    size = len(byte_stream)
			
 
				+    nals = []
			
 
				+    retnals = []
			
 
				+
			
 
				+    start_code = b"\x00\x00\x01"
			
 
				+    pos = 0
			
 
				+
			
 
				+    while pos < size:
			
 
				+        is4bytes = False
			
 
				+        retpos = byte_stream.find(start_code, pos)
			
 
				+
			
 
				+        if retpos == -1:
			
 
				+            break
			
 
				+
			
 
				+        if retpos > 0 and byte_stream[retpos - 1] == 0:
			
 
				+            retpos -= 1
			
 
				+            is4bytes = True
			
 
				+
			
 
				+        pos = retpos + (4 if is4bytes else 3)
			
 
				+
			
 
				+        if pos >= size:
			
 
				+            break
			
 
				+
			
 
				+        val = int(byte_stream[pos])
			
 
				+        fb = (val >> 7) & 0x1
			
 
				+        nri = (val >> 5) & 0x3
			
 
				+        nalu_type = val & 0x1F
			
 
				+
			
 
				+        nals.append((pos, is4bytes, fb, nri, nalu_type))
			
 
				+
			
 
				+    if not nals:
			
 
				+        return []
			
 
				+
			
 
				+    for i in range(0, len(nals) - 1):
			
 
				+        start = nals[i][0]
			
 
				+        end = nals[i + 1][0] - (5 if nals[i + 1][1] else 4)
			
 
				+        retnals.append((
			
 
				+            start,
			
 
				+            end,
			
 
				+            nals[i][1],
			
 
				+            nals[i][2],
			
 
				+            nals[i][3],
			
 
				+            nals[i][4],
			
 
				+        ))
			
 
				+
			
 
				+    start = nals[-1][0]
			
 
				+    end = size - 1
			
 
				+    retnals.append((
			
 
				+        start,
			
 
				+        end,
			
 
				+        nals[-1][1],
			
 
				+        nals[-1][2],
			
 
				+        nals[-1][3],
			
 
				+        nals[-1][4],
			
 
				+    ))
			
 
				+
			
 
				+    return retnals
			
 
				+
			
 
				+
			
 
				+def get_h264_nalu_type(byte_stream: bytes):
			
 
				+    nalu_types = []
			
 
				+    nalu_pos = get_nalu_pos(byte_stream)
			
 
				+
			
 
				+    for _, _, _, _, _, nalu_type in nalu_pos:
			
 
				+        nalu_types.append(nalu_type)
			
 
				+
			
 
				+    return nalu_types
			
 
				+
			
 
				+
			
 
				+class YoloV5X:
			
 
				+    def __init__(
			
 
				+        self,
			
 
				+        model_path: str,
			
 
				+        score_thres: float,
			
 
				+        nms_thres: float,
			
 
				+        pre_utils,
			
 
				+        post_utils,
			
 
				+    ):
			
 
				+        self.pre_utils = pre_utils
			
 
				+        self.post_utils = post_utils
			
 
				+
			
 
				+        self.model = hbm_runtime.HB_HBMRuntime(model_path)
			
 
				+
			
 
				+        self.model_name = self.model.model_names[0]
			
 
				+        self.input_names = self.model.input_names[self.model_name]
			
 
				+        self.output_names = self.model.output_names[self.model_name]
			
 
				+        self.input_shapes = self.model.input_shapes[self.model_name]
			
 
				+        self.output_quants = self.model.output_quants[self.model_name]
			
 
				+
			
 
				+        self.input_H = self.input_shapes[self.input_names[0]][1]
			
 
				+        self.input_W = self.input_shapes[self.input_names[0]][2]
			
 
				+
			
 
				+        self.score_thres = score_thres
			
 
				+        self.nms_thres = nms_thres
			
 
				+
			
 
				+        self.resize_type = 1
			
 
				+        self.classes_num = 80
			
 
				+
			
 
				+    def set_scheduling_params(
			
 
				+        self,
			
 
				+        priority: Optional[int] = None,
			
 
				+        bpu_cores: Optional[list] = None,
			
 
				+    ):
			
 
				+        kwargs = {}
			
 
				+
			
 
				+        if priority is not None:
			
 
				+            kwargs["priority"] = {self.model_name: priority}
			
 
				+
			
 
				+        if bpu_cores is not None:
			
 
				+            kwargs["bpu_cores"] = {self.model_name: bpu_cores}
			
 
				+
			
 
				+        if kwargs:
			
 
				+            self.model.set_scheduling_params(**kwargs)
			
 
				+
			
 
				+    def pre_process(
			
 
				+        self,
			
 
				+        img: np.ndarray,
			
 
				+        width: int,
			
 
				+        height: int,
			
 
				+    ) -> Dict[str, Dict[str, np.ndarray]]:
			
 
				+        y, uv = self.pre_utils.split_nv12_bytes(img, width, height)
			
 
				+
			
 
				+        y_resized, uv_resized = self.pre_utils.resize_nv12_yuv(
			
 
				+            y,
			
 
				+            uv,
			
 
				+            self.input_W,
			
 
				+            self.input_H,
			
 
				+        )
			
 
				+
			
 
				+        y_input = y_resized[..., None][None, ...]
			
 
				+        uv_input = uv_resized[None, ...]
			
 
				+
			
 
				+        return {
			
 
				+            self.model_name: {
			
 
				+                self.input_names[0]: y_input,
			
 
				+                self.input_names[1]: uv_input,
			
 
				+            }
			
 
				+        }
			
 
				+
			
 
				+    def forward(
			
 
				+        self,
			
 
				+        input_tensor: Dict[str, Dict[str, np.ndarray]],
			
 
				+    ) -> Dict[str, np.ndarray]:
			
 
				+        outputs = self.model.run(input_tensor)
			
 
				+        return outputs[self.model_name]
			
 
				+
			
 
				+    def post_process(
			
 
				+        self,
			
 
				+        outputs: Dict[str, np.ndarray],
			
 
				+        img_w: int,
			
 
				+        img_h: int,
			
 
				+    ) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
			
 
				+        fp32_outputs = self.post_utils.dequantize_outputs(
			
 
				+            outputs,
			
 
				+            self.output_quants,
			
 
				+        )
			
 
				+
			
 
				+        pred = self.post_utils.decode_outputs(
			
 
				+            self.output_names,
			
 
				+            fp32_outputs,
			
 
				+            STRIDES,
			
 
				+            ANCHORS,
			
 
				+            self.classes_num,
			
 
				+        )
			
 
				+
			
 
				+        xyxy_boxes, score, cls = self.post_utils.filter_predictions(
			
 
				+            pred,
			
 
				+            self.score_thres,
			
 
				+        )
			
 
				+
			
 
				+        keep = self.post_utils.NMS(
			
 
				+            xyxy_boxes,
			
 
				+            score,
			
 
				+            cls,
			
 
				+            self.nms_thres,
			
 
				+        )
			
 
				+
			
 
				+        xyxy = self.post_utils.scale_coords_back(
			
 
				+            xyxy_boxes[keep],
			
 
				+            img_w,
			
 
				+            img_h,
			
 
				+            self.input_W,
			
 
				+            self.input_H,
			
 
				+            self.resize_type,
			
 
				+        )
			
 
				+
			
 
				+        return xyxy, cls[keep], score[keep]
			
 
				+
			
 
				+
			
 
				+class RtspH264Decoder:
			
 
				+    def __init__(self, rtsp_url: str, logger=None):
			
 
				+        self.rtsp_url = rtsp_url
			
 
				+        self.logger = logger
			
 
				+
			
 
				+        self.cap = None
			
 
				+        self.dec = None
			
 
				+
			
 
				+        self.width = 0
			
 
				+        self.height = 0
			
 
				+        self.fps = 0.0
			
 
				+
			
 
				+        self.dec_chn = 0
			
 
				+        self.dec_type = 1
			
 
				+
			
 
				+        self.find_pps_sps = 0
			
 
				+        self.skip_count = 0
			
 
				+
			
 
				+    def log_info(self, text):
			
 
				+        if self.logger:
			
 
				+            self.logger.info(text)
			
 
				+        else:
			
 
				+            print(text)
			
 
				+
			
 
				+    def log_warn(self, text):
			
 
				+        if self.logger:
			
 
				+            self.logger.warn(text)
			
 
				+        else:
			
 
				+            print("[WARN]", text)
			
 
				+
			
 
				+    def log_error(self, text):
			
 
				+        if self.logger:
			
 
				+            self.logger.error(text)
			
 
				+        else:
			
 
				+            print("[ERROR]", text)
			
 
				+
			
 
				+    def open(self, dec_chn=0, dec_type=1):
			
 
				+        self.dec_chn = dec_chn
			
 
				+        self.dec_type = dec_type
			
 
				+
			
 
				+        self.cap = cv2.VideoCapture(self.rtsp_url, cv2.CAP_FFMPEG)
			
 
				+        self.cap.set(cv2.CAP_PROP_FORMAT, -1)
			
 
				+
			
 
				+        if not self.cap.isOpened():
			
 
				+            self.log_error(f"[RTSP] 打开失败: {self.rtsp_url}")
			
 
				+            return False
			
 
				+
			
 
				+        self.width = int(self.cap.get(cv2.CAP_PROP_FRAME_WIDTH))
			
 
				+        self.height = int(self.cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
			
 
				+        self.fps = self.cap.get(cv2.CAP_PROP_FPS)
			
 
				+
			
 
				+        self.log_info(
			
 
				+            f"[RTSP] open success, width={self.width}, height={self.height}, fps={self.fps}"
			
 
				+        )
			
 
				+
			
 
				+        if self.width <= 0 or self.height <= 0:
			
 
				+            self.log_error("[RTSP] width/height 无效")
			
 
				+            self.close()
			
 
				+            return False
			
 
				+
			
 
				+        self.dec = srcampy.Decoder()
			
 
				+        ret = self.dec.decode(
			
 
				+            "",
			
 
				+            self.dec_chn,
			
 
				+            self.dec_type,
			
 
				+            self.width,
			
 
				+            self.height,
			
 
				+        )
			
 
				+
			
 
				+        self.log_info(f"[DEC] decode ret={ret}")
			
 
				+
			
 
				+        if not ret_ok(ret):
			
 
				+            self.log_error("[DEC] 初始化失败")
			
 
				+            self.close()
			
 
				+            return False
			
 
				+
			
 
				+        self.find_pps_sps = 0
			
 
				+        self.skip_count = 0
			
 
				+
			
 
				+        return True
			
 
				+
			
 
				+    def close(self):
			
 
				+        try:
			
 
				+            if self.dec is not None:
			
 
				+                self.dec.close()
			
 
				+        except Exception as e:
			
 
				+            self.log_warn(f"[DEC] close 异常: {e}")
			
 
				+
			
 
				+        try:
			
 
				+            if self.cap is not None:
			
 
				+                self.cap.release()
			
 
				+        except Exception as e:
			
 
				+            self.log_warn(f"[RTSP] release 异常: {e}")
			
 
				+
			
 
				+        self.cap = None
			
 
				+        self.dec = None
			
 
				+
			
 
				+    def reopen(self):
			
 
				+        self.log_warn("[RTSP] 准备重连")
			
 
				+        self.close()
			
 
				+        time.sleep(0.5)
			
 
				+        return self.open(self.dec_chn, self.dec_type)
			
 
				+
			
 
				+    def read_frame(self):
			
 
				+        if self.cap is None or self.dec is None:
			
 
				+            return None
			
 
				+
			
 
				+        ret, stream_frame = self.cap.read()
			
 
				+
			
 
				+        if not ret or stream_frame is None:
			
 
				+            self.log_warn("[RTSP] read failed")
			
 
				+            if not self.reopen():
			
 
				+                time.sleep(1.0)
			
 
				+            return None
			
 
				+
			
 
				+        stream_bytes = stream_frame.tobytes()
			
 
				+
			
 
				+        try:
			
 
				+            nalu_types = get_h264_nalu_type(stream_bytes)
			
 
				+        except Exception as e:
			
 
				+            self.log_warn(f"[RTSP] parse nalu failed: {e}")
			
 
				+            return None
			
 
				+
			
 
				+        if not nalu_types:
			
 
				+            return None
			
 
				+
			
 
				+        if (nalu_types[0] in [1, 5]) and self.find_pps_sps == 0:
			
 
				+            return None
			
 
				+
			
 
				+        self.find_pps_sps = 1
			
 
				+
			
 
				+        ret = self.dec.set_img(stream_bytes, self.dec_chn)
			
 
				+        if ret != 0:
			
 
				+            self.log_warn(f"[DEC] set_img failed ret={ret}")
			
 
				+            return None
			
 
				+
			
 
				+        if self.skip_count < 8:
			
 
				+            self.skip_count += 1
			
 
				+            return None
			
 
				+
			
 
				+        frame = self.dec.get_img()
			
 
				+        return frame
			
 
				+
			
 
				+
			
 
				+class PersonApproachNode(Node):
			
 
				+    def __init__(self):
			
 
				+        super().__init__("person_approach_node")
			
 
				+
			
 
				+        self.declare_params()
			
 
				+        self.load_params()
			
 
				+
			
 
				+        self.load_pydev_utils()
			
 
				+
			
 
				+        self.event_pub = self.create_publisher(
			
 
				+            String,
			
 
				+            self.event_topic,
			
 
				+            10,
			
 
				+        )
			
 
				+
			
 
				+        self.running = True
			
 
				+        self.decoder = None
			
 
				+        self.yolo = None
			
 
				+        self.class_names = []
			
 
				+
			
 
				+        self.stable_count = 0
			
 
				+        self.last_event_time = 0.0
			
 
				+        self.frame_count = 0
			
 
				+        self.fps_start_time = time.time()
			
 
				+
			
 
				+        self.get_logger().info("[人物靠近] 节点初始化完成")
			
 
				+
			
 
				+    def declare_params(self):
			
 
				+        self.declare_parameter(
			
 
				+            "rtsp_url",
			
 
				+            "rtsp://admin:hhzx2025@192.168.0.36:554/Streaming/Channels/201",
			
 
				+        )
			
 
				+        self.declare_parameter(
			
 
				+            "model_path",
			
 
				+            "/opt/hobot/model/s100/basic/yolov5x_672x672_nv12.hbm",
			
 
				+        )
			
 
				+        self.declare_parameter(
			
 
				+            "label_file",
			
 
				+            "/app/res/labels/coco_classes.names",
			
 
				+        )
			
 
				+        self.declare_parameter(
			
 
				+            "pydev_demo_path",
			
 
				+            "/app/pydev_demo",
			
 
				+        )
			
 
				+
			
 
				+        self.declare_parameter("priority", 0)
			
 
				+        self.declare_parameter("bpu_cores", [0])
			
 
				+
			
 
				+        self.declare_parameter("score_thres", 0.25)
			
 
				+        self.declare_parameter("nms_thres", 0.45)
			
 
				+
			
 
				+        self.declare_parameter("person_score_thres", 0.45)
			
 
				+        self.declare_parameter("area_ratio_thres", 0.15)
			
 
				+        self.declare_parameter("center_offset_thres", 0.25)
			
 
				+        self.declare_parameter("stable_frames", 5)
			
 
				+        self.declare_parameter("cooldown_sec", 8.0)
			
 
				+        self.declare_parameter("loop_sleep_sec", 0.01)
			
 
				+
			
 
				+        self.declare_parameter("debug", True)
			
 
				+        self.declare_parameter("event_topic", "/greeting/person_approach")
			
 
				+
			
 
				+    def load_params(self):
			
 
				+        self.rtsp_url = self.get_parameter("rtsp_url").value
			
 
				+        self.model_path = self.get_parameter("model_path").value
			
 
				+        self.label_file = self.get_parameter("label_file").value
			
 
				+        self.pydev_demo_path = self.get_parameter("pydev_demo_path").value
			
 
				+
			
 
				+        self.priority = int(self.get_parameter("priority").value)
			
 
				+        self.bpu_cores = list(self.get_parameter("bpu_cores").value)
			
 
				+
			
 
				+        self.score_thres = float(self.get_parameter("score_thres").value)
			
 
				+        self.nms_thres = float(self.get_parameter("nms_thres").value)
			
 
				+
			
 
				+        self.person_score_thres = float(
			
 
				+            self.get_parameter("person_score_thres").value
			
 
				+        )
			
 
				+        self.area_ratio_thres = float(
			
 
				+            self.get_parameter("area_ratio_thres").value
			
 
				+        )
			
 
				+        self.center_offset_thres = float(
			
 
				+            self.get_parameter("center_offset_thres").value
			
 
				+        )
			
 
				+        self.stable_frames = int(
			
 
				+            self.get_parameter("stable_frames").value
			
 
				+        )
			
 
				+        self.cooldown_sec = float(
			
 
				+            self.get_parameter("cooldown_sec").value
			
 
				+        )
			
 
				+        self.loop_sleep_sec = float(
			
 
				+            self.get_parameter("loop_sleep_sec").value
			
 
				+        )
			
 
				+
			
 
				+        self.debug = bool(self.get_parameter("debug").value)
			
 
				+        self.event_topic = self.get_parameter("event_topic").value
			
 
				+
			
 
				+    def load_pydev_utils(self):
			
 
				+        """
			
 
				+        加载 YOLO demo 的 utils。
			
 
				+        优先使用 person_approach_skill 包内置 utils。
			
 
				+        """
			
 
				+        try:
			
 
				+            from person_approach_skill.utils import preprocess_utils as pre_utils
			
 
				+            from person_approach_skill.utils import postprocess_utils as post_utils
			
 
				+            from person_approach_skill.utils import common_utils as common
			
 
				+
			
 
				+            self.pre_utils = pre_utils
			
 
				+            self.post_utils = post_utils
			
 
				+            self.common = common
			
 
				+
			
 
				+            self.get_logger().info("[人物靠近] 使用 person_approach_skill 内置 utils")
			
 
				+            return
			
 
				+
			
 
				+        except Exception as e:
			
 
				+            self.get_logger().warn(f"[人物靠近] 内置 utils 加载失败，尝试外部 utils: {e}")
			
 
				+
			
 
				+        candidate_paths = [
			
 
				+            self.pydev_demo_path,
			
 
				+            "/app/pydev_demo",
			
 
				+            "/app/pydev_demo/12_rtsp_yolov5x_display_sample/..",
			
 
				+        ]
			
 
				+
			
 
				+        for path in candidate_paths:
			
 
				+            path = os.path.abspath(path)
			
 
				+            if path not in sys.path:
			
 
				+                sys.path.insert(0, path)
			
 
				+
			
 
				+        try:
			
 
				+            import skill_utils.preprocess_utils as pre_utils
			
 
				+            import skill_utils.postprocess_utils as post_utils
			
 
				+            import skill_utils.common_utils as common
			
 
				+
			
 
				+            self.pre_utils = pre_utils
			
 
				+            self.post_utils = post_utils
			
 
				+            self.common = common
			
 
				+
			
 
				+            self.get_logger().info("[人物靠近] 使用外部 /app/pydev_demo/utils")
			
 
				+
			
 
				+        except Exception as e:
			
 
				+            self.get_logger().error(
			
 
				+                f"[人物靠近] utils 加载失败: {e}，请检查 pydev_demo_path={self.pydev_demo_path}"
			
 
				+            )
			
 
				+            raise
			
 
				+
			
 
				+    def init_detector(self):
			
 
				+        if not os.path.exists(self.model_path):
			
 
				+            self.get_logger().error(f"[人物靠近] 模型不存在: {self.model_path}")
			
 
				+            return False
			
 
				+
			
 
				+        if not os.path.exists(self.label_file):
			
 
				+            self.get_logger().error(f"[人物靠近] label 文件不存在: {self.label_file}")
			
 
				+            return False
			
 
				+
			
 
				+        self.class_names = self.common.load_class_names(self.label_file)
			
 
				+
			
 
				+        self.yolo = YoloV5X(
			
 
				+            model_path=self.model_path,
			
 
				+            score_thres=self.score_thres,
			
 
				+            nms_thres=self.nms_thres,
			
 
				+            pre_utils=self.pre_utils,
			
 
				+            post_utils=self.post_utils,
			
 
				+        )
			
 
				+
			
 
				+        self.yolo.set_scheduling_params(
			
 
				+            priority=self.priority,
			
 
				+            bpu_cores=self.bpu_cores,
			
 
				+        )
			
 
				+
			
 
				+        self.get_logger().info(
			
 
				+            f"[人物靠近] 模型加载完成: {self.model_path}"
			
 
				+        )
			
 
				+
			
 
				+        self.decoder = RtspH264Decoder(
			
 
				+            rtsp_url=self.rtsp_url,
			
 
				+            logger=self.get_logger(),
			
 
				+        )
			
 
				+
			
 
				+        if not self.decoder.open(dec_chn=0, dec_type=1):
			
 
				+            self.get_logger().error("[人物靠近] RTSP/Decoder 初始化失败")
			
 
				+            return False
			
 
				+
			
 
				+        self.get_logger().info(
			
 
				+            f"[人物靠近] RTSP 初始化完成: {self.decoder.width}x{self.decoder.height}"
			
 
				+        )
			
 
				+
			
 
				+        return True
			
 
				+
			
 
				+    def get_person_class_id(self):
			
 
				+        for idx, name in enumerate(self.class_names):
			
 
				+            if name.strip().lower() == "person":
			
 
				+                return idx
			
 
				+        return 0
			
 
				+
			
 
				+    def detect_person_close(self, boxes, cls_ids, scores, width, height):
			
 
				+        person_cls_id = self.get_person_class_id()
			
 
				+
			
 
				+        image_area = float(width * height)
			
 
				+        img_cx = width / 2.0
			
 
				+
			
 
				+        best = None
			
 
				+
			
 
				+        for box, cls_id, score in zip(boxes, cls_ids, scores):
			
 
				+            cls_id = int(cls_id)
			
 
				+            score = float(score)
			
 
				+
			
 
				+            if cls_id != person_cls_id:
			
 
				+                continue
			
 
				+
			
 
				+            if score < self.person_score_thres:
			
 
				+                continue
			
 
				+
			
 
				+            x1, y1, x2, y2 = box.astype(float)
			
 
				+
			
 
				+            x1 = max(0.0, min(float(width - 1), x1))
			
 
				+            y1 = max(0.0, min(float(height - 1), y1))
			
 
				+            x2 = max(0.0, min(float(width - 1), x2))
			
 
				+            y2 = max(0.0, min(float(height - 1), y2))
			
 
				+
			
 
				+            box_w = max(0.0, x2 - x1)
			
 
				+            box_h = max(0.0, y2 - y1)
			
 
				+
			
 
				+            if box_w <= 0 or box_h <= 0:
			
 
				+                continue
			
 
				+
			
 
				+            area_ratio = (box_w * box_h) / image_area
			
 
				+            cx = (x1 + x2) / 2.0
			
 
				+            center_offset = abs(cx - img_cx) / float(width)
			
 
				+
			
 
				+            is_close = (
			
 
				+                area_ratio >= self.area_ratio_thres
			
 
				+                and center_offset <= self.center_offset_thres
			
 
				+            )
			
 
				+
			
 
				+            candidate = {
			
 
				+                "is_close": is_close,
			
 
				+                "score": score,
			
 
				+                "bbox": [
			
 
				+                    int(x1),
			
 
				+                    int(y1),
			
 
				+                    int(x2),
			
 
				+                    int(y2),
			
 
				+                ],
			
 
				+                "area_ratio": float(area_ratio),
			
 
				+                "center_offset": float(center_offset),
			
 
				+                "class_id": int(cls_id),
			
 
				+                "class_name": "person",
			
 
				+            }
			
 
				+
			
 
				+            if best is None:
			
 
				+                best = candidate
			
 
				+            elif candidate["area_ratio"] > best["area_ratio"]:
			
 
				+                best = candidate
			
 
				+
			
 
				+        return best
			
 
				+
			
 
				+    def publish_person_approach(self, result):
			
 
				+        now = time.time()
			
 
				+
			
 
				+        if now - self.last_event_time < self.cooldown_sec:
			
 
				+            return
			
 
				+
			
 
				+        self.last_event_time = now
			
 
				+
			
 
				+        event = {
			
 
				+            "event": "person_approach",
			
 
				+            "score": float(result["score"]),
			
 
				+            "bbox": result["bbox"],
			
 
				+            "area_ratio": float(result["area_ratio"]),
			
 
				+            "center_offset": float(result["center_offset"]),
			
 
				+            "timestamp": now,
			
 
				+            "source": "person_approach_node",
			
 
				+        }
			
 
				+
			
 
				+        self.event_pub.publish(
			
 
				+            String(data=json.dumps(event, ensure_ascii=False))
			
 
				+        )
			
 
				+
			
 
				+        self.get_logger().info(
			
 
				+            f"[人物靠近] 发布人员靠近事件: {event}"
			
 
				+        )
			
 
				+
			
 
				+    def process_once(self):
			
 
				+        frame = self.decoder.read_frame()
			
 
				+
			
 
				+        if frame is None:
			
 
				+            return
			
 
				+
			
 
				+        width = self.decoder.width
			
 
				+        height = self.decoder.height
			
 
				+
			
 
				+        expected_len = width * height * 3 // 2
			
 
				+        if len(frame) != expected_len:
			
 
				+            self.get_logger().warn(
			
 
				+                f"[人物靠近] NV12 长度不匹配 len={len(frame)}, expected={expected_len}"
			
 
				+            )
			
 
				+            return
			
 
				+
			
 
				+        img_np = np.frombuffer(frame, dtype=np.uint8)
			
 
				+
			
 
				+        input_tensor = self.yolo.pre_process(
			
 
				+            img_np,
			
 
				+            width,
			
 
				+            height,
			
 
				+        )
			
 
				+
			
 
				+        outputs = self.yolo.forward(input_tensor)
			
 
				+
			
 
				+        boxes, cls_ids, scores = self.yolo.post_process(
			
 
				+            outputs,
			
 
				+            width,
			
 
				+            height,
			
 
				+        )
			
 
				+
			
 
				+        result = self.detect_person_close(
			
 
				+            boxes,
			
 
				+            cls_ids,
			
 
				+            scores,
			
 
				+            width,
			
 
				+            height,
			
 
				+        )
			
 
				+
			
 
				+        if result and result["is_close"]:
			
 
				+            self.stable_count += 1
			
 
				+
			
 
				+            if self.debug:
			
 
				+                self.get_logger().info(
			
 
				+                    "[人物靠近] person close candidate "
			
 
				+                    f"stable={self.stable_count}/{self.stable_frames}, "
			
 
				+                    f"score={result['score']:.2f}, "
			
 
				+                    f"area={result['area_ratio']:.3f}, "
			
 
				+                    f"center_offset={result['center_offset']:.3f}, "
			
 
				+                    f"bbox={result['bbox']}"
			
 
				+                )
			
 
				+
			
 
				+            if self.stable_count >= self.stable_frames:
			
 
				+                self.publish_person_approach(result)
			
 
				+                self.stable_count = 0
			
 
				+        else:
			
 
				+            self.stable_count = 0
			
 
				+
			
 
				+        self.frame_count += 1
			
 
				+        now = time.time()
			
 
				+
			
 
				+        if now - self.fps_start_time > 3.0:
			
 
				+            fps = self.frame_count / (now - self.fps_start_time)
			
 
				+            self.get_logger().info(f"[人物靠近] FPS: {fps:.2f}")
			
 
				+            self.frame_count = 0
			
 
				+            self.fps_start_time = now
			
 
				+
			
 
				+    def run_loop(self):
			
 
				+        self.get_logger().info("[人物靠近] 开始检测循环")
			
 
				+
			
 
				+        if not self.init_detector():
			
 
				+            self.get_logger().error("[人物靠近] 初始化失败，节点退出")
			
 
				+            return
			
 
				+
			
 
				+        while rclpy.ok() and self.running:
			
 
				+            rclpy.spin_once(self, timeout_sec=0.0)
			
 
				+
			
 
				+            try:
			
 
				+                self.process_once()
			
 
				+            except Exception as e:
			
 
				+                self.get_logger().error(f"[人物靠近] process_once 异常: {e}")
			
 
				+                time.sleep(0.1)
			
 
				+
			
 
				+            if self.loop_sleep_sec > 0:
			
 
				+                time.sleep(self.loop_sleep_sec)
			
 
				+
			
 
				+        self.close()
			
 
				+
			
 
				+    def close(self):
			
 
				+        self.get_logger().info("[人物靠近] 正在释放资源")
			
 
				+
			
 
				+        try:
			
 
				+            if self.decoder is not None:
			
 
				+                self.decoder.close()
			
 
				+        except Exception as e:
			
 
				+            self.get_logger().warn(f"[人物靠近] decoder close 异常: {e}")
			
 
				+
			
 
				+        self.get_logger().info("[人物靠近] 节点退出")
			
 
				+
			
 
				+
			
 
				+def main(args=None):
			
 
				+    rclpy.init(args=args)
			
 
				+
			
 
				+    node = PersonApproachNode()
			
 
				+
			
 
				+    def _signal_handler(sig, frame):
			
 
				+        node.get_logger().info("[人物靠近] 收到退出信号")
			
 
				+        node.running = False
			
 
				+
			
 
				+    signal.signal(signal.SIGINT, _signal_handler)
			
 
				+    signal.signal(signal.SIGTERM, _signal_handler)
			
 
				+
			
 
				+    try:
			
 
				+        node.run_loop()
			
 
				+    except KeyboardInterrupt:
			
 
				+        node.get_logger().info("[人物靠近] KeyboardInterrupt")
			
 
				+    finally:
			
 
				+        node.close()
			
 
				+        node.destroy_node()
			
 
				+        rclpy.shutdown()
			
 
				+
			
 
				+
			
 
				+if __name__ == "__main__":
			
 
				+    main()
			
--- a/brain/PlannerNode2/Skill/person_approach_skill/resource/person_approach_skill
+++ b/brain/PlannerNode2/Skill/person_approach_skill/resource/person_approach_skill
--- a/brain/PlannerNode2/Skill/person_approach_skill/setup.cfg
+++ b/brain/PlannerNode2/Skill/person_approach_skill/setup.cfg
@@ -0,0 +1,4 @@
 
				+[develop]
			
 
				+script_dir=$base/lib/person_approach_skill
			
 
				+[install]
			
 
				+install_scripts=$base/lib/person_approach_skill
			
--- a/brain/PlannerNode2/Skill/person_approach_skill/setup.py
+++ b/brain/PlannerNode2/Skill/person_approach_skill/setup.py
@@ -0,0 +1,41 @@
 
				+from setuptools import setup, find_packages
			
 
				+import os
			
 
				+from glob import glob
			
 
				+
			
 
				+package_name = 'person_approach_skill'
			
 
				+
			
 
				+setup(
			
 
				+    name=package_name,
			
 
				+    version='0.0.0',
			
 
				+    packages=find_packages(),
			
 
				+    data_files=[
			
 
				+        (
			
 
				+            'share/ament_index/resource_index/packages',
			
 
				+            ['resource/' + package_name]
			
 
				+        ),
			
 
				+        (
			
 
				+            'share/' + package_name,
			
 
				+            ['package.xml']
			
 
				+        ),
			
 
				+        (
			
 
				+            os.path.join('share', package_name, 'config'),
			
 
				+            glob('config/*.yaml')
			
 
				+        ),
			
 
				+        (
			
 
				+            os.path.join('share', package_name, 'launch'),
			
 
				+            glob('launch/*.py')
			
 
				+        ),
			
 
				+    ],
			
 
				+    install_requires=['setuptools'],
			
 
				+    zip_safe=True,
			
 
				+    maintainer='sunrise',
			
 
				+    maintainer_email='sunrise@example.com',
			
 
				+    description='Greeting vision skill for AI Agent',
			
 
				+    license='Apache-2.0',
			
 
				+    tests_require=['pytest'],
			
 
				+    entry_points={
			
 
				+        'console_scripts': [
			
 
				+            'person_approach_node = person_approach_skill.person_approach_node:main',
			
 
				+        ],
			
 
				+    },
			
 
				+)
			
--- a/brain/PlannerNode2/Skill/person_approach_skill/skill_utils/__init__.py
+++ b/brain/PlannerNode2/Skill/person_approach_skill/skill_utils/__init__.py
@@ -0,0 +1,7 @@
 
				+# flake8: noqa: F401
			
 
				+# flake8: noqa: F403
			
 
				+
			
 
				+from .preprocess_utils import *
			
 
				+from .postprocess_utils import *
			
 
				+from .draw_utils import *
			
 
				+from .common_utils import *
			
--- a/brain/PlannerNode2/Skill/person_approach_skill/skill_utils/common_utils.py
+++ b/brain/PlannerNode2/Skill/person_approach_skill/skill_utils/common_utils.py
@@ -0,0 +1,213 @@
 
				+# Copyright (c) 2025 D-Robotics Corporation
			
 
				+#
			
 
				+# Licensed under the Apache License, Version 2.0 (the "License");
			
 
				+# you may not use this file except in compliance with the License.
			
 
				+# You may obtain a copy of the License at
			
 
				+#
			
 
				+#     http://www.apache.org/licenses/LICENSE-2.0
			
 
				+#
			
 
				+# Unless required by applicable law or agreed to in writing, software
			
 
				+# distributed under the License is distributed on an "AS IS" BASIS,
			
 
				+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
			
 
				+# See the License for the specific language governing permissions and
			
 
				+# limitations under the License.
			
 
				+
			
 
				+# flake8: noqa: E501
			
 
				+
			
 
				+import cv2
			
 
				+import numpy as np
			
 
				+
			
 
				+# List of predefined RGB color tuples used for bounding box visualization.
			
 
				+rdk_colors = [
			
 
				+    (56, 56, 255), (151, 157, 255), (31, 112, 255), (29, 178, 255),
			
 
				+    (49, 210, 207), (10, 249, 72), (23, 204, 146), (134, 219, 61),
			
 
				+    (52, 147, 26), (187, 212, 0), (168, 153, 44), (255, 194, 0),
			
 
				+    (147, 69, 52), (255, 115, 100), (236, 24, 0), (255, 56, 132),
			
 
				+    (133, 0, 82), (255, 56, 203), (200, 149, 255), (199, 55, 255)]
			
 
				+
			
 
				+
			
 
				+def load_image(img_path: str) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Load an image from file path using OpenCV.
			
 
				+    @param img_path Path to the image file.
			
 
				+    @return Image as a NumPy ndarray in BGR format.
			
 
				+    @throws FileNotFoundError if the image cannot be loaded.
			
 
				+    """
			
 
				+    img = cv2.imread(img_path)
			
 
				+    if img is None:
			
 
				+        raise FileNotFoundError(f"Image file '{img_path}' not found.")
			
 
				+    return img
			
 
				+
			
 
				+
			
 
				+def load_class_names(path: str) -> list:
			
 
				+    """
			
 
				+    @brief Load class names from a file.
			
 
				+    @param path Path to the label file, each line contains a class name.
			
 
				+    @return List of class name strings.
			
 
				+    """
			
 
				+    with open(path, 'r') as f:
			
 
				+        # Strip whitespace and filter out empty lines
			
 
				+        class_names = [line.strip() for line in f.readlines() if line.strip()]
			
 
				+    return class_names
			
 
				+
			
 
				+
			
 
				+def zscore_normalize_lastdim(x: np.ndarray) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Normalize input array along the last dimension.
			
 
				+    @details This function performs standard score normalization (z-score).
			
 
				+    @param x Input NumPy array of shape (..., channels).
			
 
				+    @return Normalized array with mean 0 and variance 1 per vector.
			
 
				+    """
			
 
				+    mean = np.mean(x, axis=-1, keepdims=True)        # Compute mean per sample
			
 
				+    var = np.var(x, axis=-1, keepdims=True)          # Compute variance per sample
			
 
				+    return np.squeeze((x - mean) / np.sqrt(var + 1e-5))  # Z-score normalization
			
 
				+
			
 
				+
			
 
				+def print_model_info(models: object) -> None:
			
 
				+    """Print detailed information about input and \
			
 
				+        output tensors of all models in the system."""
			
 
				+
			
 
				+    # 1. Model Name List
			
 
				+    print("=== Model Name List ===")
			
 
				+    model_names = models.model_names
			
 
				+    print(model_names)
			
 
				+
			
 
				+    # 2. Total Number of Models
			
 
				+    print("\n=== Model Count ===")
			
 
				+    print(models.model_count)
			
 
				+
			
 
				+    # 3. Input Count per Model
			
 
				+    print("\n=== Input Counts ===")
			
 
				+    input_counts = models.input_counts
			
 
				+    for model, count in input_counts.items():
			
 
				+        print(f"{model}: {count}")
			
 
				+
			
 
				+    # 4. Input Names per Model
			
 
				+    print("\n=== Input Names ===")
			
 
				+    input_names = models.input_names
			
 
				+    for model, inputs in input_names.items():
			
 
				+        print(f"{model}:")
			
 
				+        for name in inputs:
			
 
				+            print(f"  - {name}")
			
 
				+
			
 
				+    # 5. Input Tensor Shapes
			
 
				+    print("\n=== Input Tensor Shapes ===")
			
 
				+    input_shapes = models.input_shapes
			
 
				+    for model, inputs in input_shapes.items():
			
 
				+        print(f"{model}:")
			
 
				+        for name, shape in inputs.items():
			
 
				+            print(f"  {name} -> shape: {shape}")
			
 
				+
			
 
				+    # 6. Input Tensor Data Types
			
 
				+    print("\n=== Input Tensor Types ===")
			
 
				+    input_types = models.input_dtypes
			
 
				+    for model, inputs in input_types.items():
			
 
				+        print(f"{model}:")
			
 
				+        for name, dtype in inputs.items():
			
 
				+            print(f"  {name} -> dtype: {dtype.name}")
			
 
				+
			
 
				+    # 7. Input Quantization Information
			
 
				+    print("\n=== Input Quantization Info ===")
			
 
				+    input_quanti_info = models.input_quants
			
 
				+    for model, inputs in input_quanti_info.items():
			
 
				+        print(f"{model}:")
			
 
				+        for name, info in inputs.items():
			
 
				+            print(f"  {name}:")
			
 
				+            print(f"    quanti_type: {info.quant_type.name}")
			
 
				+            print(f"    quantize_axis: {info.axis}")
			
 
				+            print(f"    scale_data: {info.scale.tolist()}")
			
 
				+            print(f"    zero_point_data: {info.zero_point.tolist()}")
			
 
				+
			
 
				+    # 8. Input Tensor Stride
			
 
				+    print("\n=== Input Tensor Stride ===")
			
 
				+    input_strides = models.input_strides
			
 
				+    for model, inputs in input_strides.items():
			
 
				+        print(f"{model}:")
			
 
				+        for name, stride in inputs.items():
			
 
				+            print(f"  {name} -> stride: {stride}")
			
 
				+
			
 
				+    # 9. Input Descriptions
			
 
				+    input_descs = models.input_descs
			
 
				+    for model, inputs in input_descs.items():
			
 
				+        for name, desc in inputs.items():
			
 
				+            print(f"[Input] {model}.{name} desc: {desc}")
			
 
				+
			
 
				+    print("\n================ OUTPUT TESTS ================\n")
			
 
				+
			
 
				+    # 1. Output Count per Model
			
 
				+    print("=== Output Counts ===")
			
 
				+    output_counts = models.output_counts
			
 
				+    for model, count in output_counts.items():
			
 
				+        print(f"{model}: {count}")
			
 
				+
			
 
				+    # 2. Output Names per Model
			
 
				+    print("\n=== Output Names ===")
			
 
				+    output_names = models.output_names
			
 
				+    for model, outputs in output_names.items():
			
 
				+        print(f"{model}:")
			
 
				+        for name in outputs:
			
 
				+            print(f"  - {name}")
			
 
				+
			
 
				+    # 3. Output Tensor Shapes
			
 
				+    print("\n=== Output Tensor Shapes ===")
			
 
				+    output_shapes = models.output_shapes
			
 
				+    for model, outputs in output_shapes.items():
			
 
				+        print(f"{model}:")
			
 
				+        for name, shape in outputs.items():
			
 
				+            print(f"  {name} -> shape: {shape}")
			
 
				+
			
 
				+    # 4. Output Tensor Data Types
			
 
				+    print("\n=== Output Tensor Types ===")
			
 
				+    output_types = models.output_dtypes
			
 
				+    for model, outputs in output_types.items():
			
 
				+        print(f"{model}:")
			
 
				+        for name, dtype in outputs.items():
			
 
				+            print(f"  {name} -> dtype: {dtype.name}")
			
 
				+
			
 
				+    # 5. Output Quantization Information
			
 
				+    print("\n=== Output Quantization Info ===")
			
 
				+    output_quanti = models.output_quants
			
 
				+    for model, outputs in output_quanti.items():
			
 
				+        print(f"{model}:")
			
 
				+        for name, info in outputs.items():
			
 
				+            print(f"  {name}:")
			
 
				+            print(f"    quanti_type: {info.quant_type.name}")
			
 
				+            print(f"    quantize_axis: {info.axis}")
			
 
				+            print(f"    scale_data: {info.scale}")
			
 
				+            print(f"    zero_point_data: {info.zero_point}")
			
 
				+
			
 
				+    # 6. Output Tensor Stride
			
 
				+    print("\n=== Output Tensor Stride ===")
			
 
				+    output_stride = models.output_strides
			
 
				+    for model, outputs in output_stride.items():
			
 
				+        print(f"{model}:")
			
 
				+        for name, stride in outputs.items():
			
 
				+            print(f"  {name} -> stride: {stride}")
			
 
				+
			
 
				+    # 7. Output Descriptions
			
 
				+    output_descs = models.output_descs
			
 
				+    for model, outputs in output_descs.items():
			
 
				+        for name, desc in outputs.items():
			
 
				+            print(f"[Output] {model}.{name} desc: {desc}")
			
 
				+
			
 
				+    # Get and Print Model Description Info
			
 
				+    print("\nModel Description:")
			
 
				+    model_desc = models.model_descs
			
 
				+    for model_name, desc in model_desc.items():
			
 
				+        print(f" - {model_name}: {desc}")
			
 
				+
			
 
				+    # Get and Print HBM Description Info
			
 
				+    print("\nHBM Description:")
			
 
				+    hbm_desc = models.hbm_descs
			
 
				+    for file_name, desc in hbm_desc.items():
			
 
				+        print(f" - {file_name}: {desc}")
			
 
				+
			
 
				+        # Get and PrintScheduling Params
			
 
				+    print("\n=== Scheduling Parameters ===")
			
 
				+    sched_params = models.sched_params
			
 
				+    for model_name, sched in sched_params.items():
			
 
				+        print(f"{model_name}:")
			
 
				+        print(f"  priority    : {sched.priority}")
			
 
				+        print(f"  customId    : {sched.customId}")
			
 
				+        print(f"  bpu_cores   : {sched.bpu_cores}")
			
 
				+        print(f"  deviceId    : {sched.deviceId}")
			
--- a/brain/PlannerNode2/Skill/person_approach_skill/skill_utils/draw_utils.py
+++ b/brain/PlannerNode2/Skill/person_approach_skill/skill_utils/draw_utils.py
@@ -0,0 +1,207 @@
 
				+# Copyright (c) 2025 D-Robotics Corporation
			
 
				+#
			
 
				+# Licensed under the Apache License, Version 2.0 (the "License");
			
 
				+# you may not use this file except in compliance with the License.
			
 
				+# You may obtain a copy of the License at
			
 
				+#
			
 
				+#     http://www.apache.org/licenses/LICENSE-2.0
			
 
				+#
			
 
				+# Unless required by applicable law or agreed to in writing, software
			
 
				+# distributed under the License is distributed on an "AS IS" BASIS,
			
 
				+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
			
 
				+# See the License for the specific language governing permissions and
			
 
				+# limitations under the License.
			
 
				+
			
 
				+# flake8: noqa: E501
			
 
				+
			
 
				+import cv2
			
 
				+import numpy as np
			
 
				+
			
 
				+
			
 
				+def draw_boxes(image: np.ndarray, boxes: np.ndarray, cls_ids: np.ndarray,
			
 
				+               scores: np.ndarray, class_names: list, colors: list) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Draw bounding boxes with class names and scores on the image.
			
 
				+    @param image Input image as a NumPy array.
			
 
				+    @param boxes Bounding boxes as a NumPy array of shape (N, 4), format: [x1, y1, x2, y2].
			
 
				+    @param cls_ids List or array of class indices corresponding to boxes.
			
 
				+    @param scores List or array of confidence scores for each detection.
			
 
				+    @param class_names List of class name strings.
			
 
				+    @param colors List of RGB color tuples for each class.
			
 
				+    @return Image with drawn boxes and labels.
			
 
				+    """
			
 
				+    for box, cls_id, score in zip(boxes, cls_ids, scores):
			
 
				+        x1, y1, x2, y2 = map(int, box)
			
 
				+        color = colors[cls_id % len(colors)]
			
 
				+        label = f"{class_names[cls_id]} {score:.2f}"
			
 
				+
			
 
				+        # Draw bounding box
			
 
				+        cv2.rectangle(image, (x1, y1), (x2, y2), color, thickness=2)
			
 
				+
			
 
				+        # Draw class label and score
			
 
				+        cv2.putText(image, label, (x1, max(y1 - 5, 0)),
			
 
				+                    fontFace=cv2.FONT_HERSHEY_SIMPLEX,
			
 
				+                    fontScale=0.5, color=color, thickness=1)
			
 
				+
			
 
				+    return image
			
 
				+
			
 
				+
			
 
				+def draw_masks(image: np.ndarray, boxes: np.ndarray, masks: list,
			
 
				+               cls_ids: list, colors: list, alpha: float = 0.3) -> None:
			
 
				+    """
			
 
				+    @brief Overlay semi-transparent instance masks on the image.
			
 
				+    @param image Input image to draw on (modified in-place).
			
 
				+    @param boxes Bounding boxes corresponding to masks, shape: (N, 4).
			
 
				+    @param masks List of binary masks, each with shape matching box region.
			
 
				+    @param cls_ids List of class indices for each instance.
			
 
				+    @param colors List of RGB color tuples for each class.
			
 
				+    @param alpha Transparency level for the masks (0: transparent, 1: opaque).
			
 
				+    @return None
			
 
				+    """
			
 
				+    for class_id, box, mask in zip(cls_ids, boxes, masks):
			
 
				+        x1, y1, x2, y2 = map(int, box)
			
 
				+        if mask.size == 0 or x2 <= x1 or y2 <= y1:
			
 
				+            continue
			
 
				+
			
 
				+        region = image[y1:y2, x1:x2]  # Crop region from image
			
 
				+        mask_area = mask.astype(bool)  # Convert to boolean mask
			
 
				+
			
 
				+        if not np.any(mask_area):
			
 
				+            continue
			
 
				+
			
 
				+        # Generate a solid color patch
			
 
				+        color = colors[(class_id - 1) % len(colors)]
			
 
				+        color_patch = np.empty(region.shape, dtype=np.uint8)
			
 
				+        color_patch[:, :] = color
			
 
				+
			
 
				+        # Blend mask with image
			
 
				+        region[mask_area] = (
			
 
				+            (1 - alpha) * region[mask_area] + alpha * color_patch[mask_area]
			
 
				+        ).astype(np.uint8)
			
 
				+
			
 
				+
			
 
				+def draw_contours(img: np.ndarray, boxes: np.ndarray, masks: list,
			
 
				+                  cls_ids: list, colors: list, thickness: int = 2) -> None:
			
 
				+    """
			
 
				+    @brief Draw contour outlines of instance masks on the image.
			
 
				+    @param img Input image to draw on (modified in-place).
			
 
				+    @param boxes Bounding boxes for each mask, shape: (N, 4).
			
 
				+    @param masks List of binary masks for each instance.
			
 
				+    @param cls_ids List of class indices for each instance.
			
 
				+    @param colors List of RGB color tuples.
			
 
				+    @param thickness Thickness of contour lines.
			
 
				+    @return None
			
 
				+    """
			
 
				+    for class_id, box, mask in zip(cls_ids, boxes, masks):
			
 
				+        x1, y1, x2, y2 = map(int, box)
			
 
				+        if mask.size == 0:
			
 
				+            continue
			
 
				+
			
 
				+        # Extract external contours from mask
			
 
				+        contours, _ = cv2.findContours(mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
			
 
				+        if not contours:
			
 
				+            continue
			
 
				+
			
 
				+        # Merge all contours and shift to global coordinates
			
 
				+        merged_points = np.vstack([c for c in contours])
			
 
				+        merged_points[:, 0, 0] += x1
			
 
				+        merged_points[:, 0, 1] += y1
			
 
				+
			
 
				+        # Draw the contour line on the image
			
 
				+        cv2.polylines(img, [merged_points], isClosed=True,
			
 
				+                      color=colors[(class_id - 1) % len(colors)],
			
 
				+                      thickness=thickness)
			
 
				+
			
 
				+
			
 
				+def rgb_to_disp_color(rgb_tuple: tuple) -> int:
			
 
				+    """
			
 
				+    @brief Convert RGB tuple to 32-bit ARGB display color format.
			
 
				+    @details Format is ARGB: alpha in high 8 bits, followed by R, G, B.
			
 
				+    @param rgb_tuple Tuple of (R, G, B) values.
			
 
				+    @return 32-bit ARGB integer color value.
			
 
				+    """
			
 
				+    r, g, b = rgb_tuple
			
 
				+    alpha = 255
			
 
				+    return (alpha << 24) | (r << 16) | (g << 8) | b
			
 
				+
			
 
				+
			
 
				+def draw_detections_on_disp(disp, boxes: np.ndarray, cls_ids: list,
			
 
				+                            scores: list, class_names: list,
			
 
				+                            colors: list, chn: int = 2) -> None:
			
 
				+    """
			
 
				+    @brief Draw detection boxes and labels on a hardware display.
			
 
				+    @param disp Display device object with `set_graph_rect` and `set_graph_word` methods.
			
 
				+    @param boxes Array of bounding boxes (N, 4).
			
 
				+    @param cls_ids List of class indices.
			
 
				+    @param scores List of detection confidence scores.
			
 
				+    @param class_names List of class name strings.
			
 
				+    @param colors List of RGB color tuples.
			
 
				+    @param chn Display channel index.
			
 
				+    @return None
			
 
				+    """
			
 
				+    # Clear canvas
			
 
				+    disp.set_graph_rect(0, 0, 0, 0, 2, 1, 0, 3)
			
 
				+    disp.set_graph_word(0, 0, "", chn, 1, 0, 16)
			
 
				+
			
 
				+    for box, cls_id, score in zip(boxes, cls_ids, scores):
			
 
				+        x1, y1, x2, y2 = map(int, box)
			
 
				+        label = f"{class_names[cls_id]} {score:.2f}"
			
 
				+        color = rgb_to_disp_color(colors[cls_id % len(colors)])
			
 
				+
			
 
				+        # Draw bounding box on display
			
 
				+        disp.set_graph_rect(x1, y1, x2, y2, 2, 0, color, 3)
			
 
				+        # Draw class name and confidence
			
 
				+        disp.set_graph_word(x1, max(y1 - 20, 0), label, chn, 0, color, 16)
			
 
				+
			
 
				+
			
 
				+def draw_keypoints(image: np.ndarray, kpts_xy: np.ndarray,
			
 
				+                   kpts_score: np.ndarray, kpt_conf_thresh: float = 0.5,
			
 
				+                   radius_outer: int = 5, radius_inner: int = 2) -> None:
			
 
				+    """
			
 
				+    @brief Draw keypoints with confidence scores on an image.
			
 
				+    @param image Input/output image in-place modification.
			
 
				+    @param kpts_xy Keypoints coordinates, shape (N, K, 2).
			
 
				+    @param kpts_score Keypoints confidence scores, shape (N, K, 1).
			
 
				+    @param kpt_conf_thresh Confidence threshold to show keypoints.
			
 
				+    @param radius_outer Outer circle radius.
			
 
				+    @param radius_inner Inner circle radius.
			
 
				+    @return None
			
 
				+    """
			
 
				+    # Convert threshold to logit space (same as sigmoid(score) > threshold)
			
 
				+    kpt_conf_inverse = -np.log(1 / kpt_conf_thresh - 1)
			
 
				+
			
 
				+    for instance_xy, instance_score in zip(kpts_xy, kpts_score):
			
 
				+        for j in range(instance_xy.shape[0]):
			
 
				+            if instance_score[j, 0] < kpt_conf_inverse:
			
 
				+                continue
			
 
				+
			
 
				+            x, y = int(instance_xy[j, 0]), int(instance_xy[j, 1])
			
 
				+
			
 
				+            # Draw outer and inner circles
			
 
				+            cv2.circle(image, (x, y), radius_outer, (0, 0, 255), -1)
			
 
				+            cv2.circle(image, (x, y), radius_inner, (0, 255, 255), -1)
			
 
				+
			
 
				+            # Draw index number twice for bold outline effect
			
 
				+            cv2.putText(image, f"{j}", (x, y), cv2.FONT_HERSHEY_SIMPLEX,
			
 
				+                        0.5, (0, 0, 255), 3, cv2.LINE_AA)
			
 
				+            cv2.putText(image, f"{j}", (x, y), cv2.FONT_HERSHEY_SIMPLEX,
			
 
				+                        0.5, (0, 255, 255), 1, cv2.LINE_AA)
			
 
				+
			
 
				+
			
 
				+def draw_polygon_boxes(img: np.ndarray, bboxes: list,
			
 
				+                       color: tuple = (128, 240, 128),
			
 
				+                       thickness: int = 3) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Draw polygon-style bounding boxes on a copy of the image.
			
 
				+    @param img Input image (BGR format).
			
 
				+    @param bboxes List of polygon boxes, each is an ndarray of shape (N, 2).
			
 
				+    @param color Polygon color (B, G, R).
			
 
				+    @param thickness Line thickness.
			
 
				+    @return Image with drawn polygons.
			
 
				+    """
			
 
				+    img_copy = img.copy()
			
 
				+    for bbox in bboxes:
			
 
				+        bbox = bbox.astype(int)
			
 
				+        # Draw closed polygon on image
			
 
				+        cv2.polylines(img_copy, [bbox], isClosed=True, color=color, thickness=thickness)
			
 
				+    return img_copy
			
--- a/brain/PlannerNode2/Skill/person_approach_skill/skill_utils/postprocess_utils.py
+++ b/brain/PlannerNode2/Skill/person_approach_skill/skill_utils/postprocess_utils.py
@@ -0,0 +1,576 @@
 
				+# Copyright (c) 2025 D-Robotics Corporation
			
 
				+#
			
 
				+# Licensed under the Apache License, Version 2.0 (the "License");
			
 
				+# you may not use this file except in compliance with the License.
			
 
				+# You may obtain a copy of the License at
			
 
				+#
			
 
				+#     http://www.apache.org/licenses/LICENSE-2.0
			
 
				+#
			
 
				+# Unless required by applicable law or agreed to in writing, software
			
 
				+# distributed under the License is distributed on an "AS IS" BASIS,
			
 
				+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
			
 
				+# See the License for the specific language governing permissions and
			
 
				+# limitations under the License.
			
 
				+
			
 
				+# flake8: noqa: E501
			
 
				+
			
 
				+import cv2
			
 
				+import numpy as np
			
 
				+from hbm_runtime import QuantParams
			
 
				+from scipy.special import softmax
			
 
				+
			
 
				+
			
 
				+def sigmoid(x: np.ndarray) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Compute the sigmoid activation function.
			
 
				+    @param x Input NumPy array.
			
 
				+    @return NumPy array after applying sigmoid function element-wise.
			
 
				+    """
			
 
				+    return 1.0 / (1.0 + cv2.exp(-x))
			
 
				+
			
 
				+
			
 
				+def recover_to_original_size(img: np.ndarray,
			
 
				+                             orig_w: int,
			
 
				+                             orig_h: int,
			
 
				+                             resize_type: int = 1) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Restore resized image back to original size.
			
 
				+    @details Supports direct resize or reverse letterbox removal.
			
 
				+    @param img Input image of shape (H, W, C).
			
 
				+    @param orig_w Original image width.
			
 
				+    @param orig_h Original image height.
			
 
				+    @param resize_type Resize type used before: 0 (direct) or 1 (letterbox).
			
 
				+    @return Resized image of shape (orig_h, orig_w, C).
			
 
				+    """
			
 
				+    h, w = img.shape[:2]  # current size after preprocess
			
 
				+
			
 
				+    if resize_type == 0:
			
 
				+        # Resize directly to original dimensions
			
 
				+        img_resized = cv2.resize(img, (orig_w, orig_h),
			
 
				+                                 interpolation=cv2.INTER_NEAREST)
			
 
				+    elif resize_type == 1:
			
 
				+        # Remove padding and resize back from letterbox
			
 
				+        scale = min(h / orig_h, w / orig_w)
			
 
				+        new_w, new_h = int(orig_w * scale), int(orig_h * scale)
			
 
				+
			
 
				+        pad_w = w - new_w
			
 
				+        pad_h = h - new_h
			
 
				+        left = pad_w // 2
			
 
				+        top = pad_h // 2
			
 
				+
			
 
				+        # Crop out the letterbox padding
			
 
				+        cropped = img[top:top + new_h, left:left + new_w]
			
 
				+
			
 
				+        # Resize cropped region to original size
			
 
				+        img_resized = cv2.resize(cropped, (orig_w, orig_h),
			
 
				+                                 interpolation=cv2.INTER_NEAREST)
			
 
				+    else:
			
 
				+        raise ValueError(f"Invalid resize_type: {resize_type}, must be 0 or 1")
			
 
				+
			
 
				+    return img_resized
			
 
				+
			
 
				+
			
 
				+def print_topk_predictions(output: np.ndarray,
			
 
				+                           idx2label: dict,
			
 
				+                           topk: int = 5) -> None:
			
 
				+    """
			
 
				+    @brief Print top-k classification predictions.
			
 
				+    @details Uses softmax to compute probability and selects top-k.
			
 
				+    @param output Raw logits as NumPy array (shape: [num_classes]).
			
 
				+    @param idx2label Dictionary mapping class indices to labels.
			
 
				+    @param topk Number of top predictions to display.
			
 
				+    @return None
			
 
				+    """
			
 
				+    # Softmax with stability adjustment
			
 
				+    exp_logits = np.exp(output - np.max(output))
			
 
				+    probabilities = exp_logits / np.sum(exp_logits)
			
 
				+
			
 
				+    # Top-k indices
			
 
				+    topk_idx = np.argsort(probabilities)[-topk:][::-1]
			
 
				+    topk_prob = probabilities[topk_idx]
			
 
				+
			
 
				+    print(f"Top-{topk} Predictions:")
			
 
				+    for i in range(topk):
			
 
				+        idx = topk_idx[i]
			
 
				+        prob = topk_prob[i]
			
 
				+        label = idx2label[idx] if idx2label and idx in idx2label else f"Class {idx}"
			
 
				+        print(f"{label}: {prob:.4f}")
			
 
				+
			
 
				+
			
 
				+def dequantize_tensor(q_tensor: np.ndarray, quant_info: QuantParams) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Dequantize a quantized tensor to floating-point values.
			
 
				+    @details Supports both per-tensor and per-channel dequantization based on quant_info.
			
 
				+    @param q_tensor Quantized tensor (e.g., int8 or uint8).
			
 
				+    @param quant_info Quantization parameters (scale, zero_point, axis, type).
			
 
				+    @return Dequantized tensor (float32).
			
 
				+    """
			
 
				+    if quant_info.quant_type != 1:  # 1 indicates linear scale quantization
			
 
				+        return q_tensor
			
 
				+
			
 
				+    if quant_info.scale.ndim == 0 or q_tensor.ndim == 1 or quant_info.scale.size == 1:
			
 
				+        # Per-tensor dequantization
			
 
				+        return (q_tensor.astype(np.float32) - quant_info.zero_point.astype(np.float32)) * quant_info.scale
			
 
				+    else:
			
 
				+        # Per-channel dequantization
			
 
				+        shape = [1] * q_tensor.ndim
			
 
				+        shape[quant_info.axis] = -1
			
 
				+        scale = quant_info.scale.reshape(shape)
			
 
				+        zero_point = quant_info.zero_point.reshape(shape)
			
 
				+        return (q_tensor.astype(np.float32) - zero_point.astype(np.float32)) * scale
			
 
				+
			
 
				+
			
 
				+def dequantize_outputs(outputs: dict, quan_infos: dict) -> dict:
			
 
				+    """
			
 
				+    @brief Dequantize a dictionary of quantized model outputs.
			
 
				+    @param outputs Dictionary of quantized output tensors.
			
 
				+    @param quan_infos Dictionary of quantization parameters per output.
			
 
				+    @return Dictionary of dequantized float32 outputs.
			
 
				+    """
			
 
				+    fp32_outputs = {}
			
 
				+    for name, output in outputs.items():
			
 
				+        quant_info = quan_infos[name]
			
 
				+        fp32_outputs[name] = dequantize_tensor(output, quant_info)
			
 
				+    return fp32_outputs
			
 
				+
			
 
				+
			
 
				+def scale_coords_back(xyxy: np.ndarray,
			
 
				+                      img_w: int,
			
 
				+                      img_h: int,
			
 
				+                      input_w: int,
			
 
				+                      input_h: int,
			
 
				+                      resize_type: int = 1) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Map coordinates from resized image back to original image scale.
			
 
				+    @param xyxy Bounding boxes (N, 4) in resized image.
			
 
				+    @param img_w Original image width.
			
 
				+    @param img_h Original image height.
			
 
				+    @param input_w Network input width.
			
 
				+    @param input_h Network input height.
			
 
				+    @param resize_type Resize strategy: 0 (resize), 1 (letterbox).
			
 
				+    @return Bounding boxes rescaled to original image dimensions.
			
 
				+    """
			
 
				+    if resize_type == 0:
			
 
				+        # Direct resize
			
 
				+        scale_x = img_w / input_w
			
 
				+        scale_y = img_h / input_h
			
 
				+        xyxy[:, [0, 2]] *= scale_x
			
 
				+        xyxy[:, [1, 3]] *= scale_y
			
 
				+    elif resize_type == 1:
			
 
				+        # Letterbox resize
			
 
				+        scale = min(input_w / img_w, input_h / img_h)
			
 
				+        pad_w = (input_w - img_w * scale) / 2
			
 
				+        pad_h = (input_h - img_h * scale) / 2
			
 
				+        xyxy[:, [0, 2]] = (xyxy[:, [0, 2]] - pad_w) / scale
			
 
				+        xyxy[:, [1, 3]] = (xyxy[:, [1, 3]] - pad_h) / scale
			
 
				+    else:
			
 
				+        raise ValueError("resize_type must be 0 (resize) or 1 (letterbox)")
			
 
				+
			
 
				+    # Clamp coordinates within valid image bounds
			
 
				+    xyxy[:, [0, 2]] = np.clip(xyxy[:, [0, 2]], 0, img_w)
			
 
				+    xyxy[:, [1, 3]] = np.clip(xyxy[:, [1, 3]], 0, img_h)
			
 
				+
			
 
				+    return xyxy
			
 
				+
			
 
				+
			
 
				+def NMS(xyxy: np.ndarray,
			
 
				+        score: np.ndarray,
			
 
				+        cls: np.ndarray,
			
 
				+        iou_thresh: float = 0.45) -> list:
			
 
				+    """
			
 
				+    @brief Perform class-wise Non-Maximum Suppression (NMS).
			
 
				+    @details Keeps boxes with highest scores and removes overlaps above IoU threshold.
			
 
				+    @param xyxy Bounding boxes (N, 4).
			
 
				+    @param score Confidence scores (N,).
			
 
				+    @param cls Class IDs for each box (N,).
			
 
				+    @param iou_thresh IoU threshold for suppression.
			
 
				+    @return List of indices to keep.
			
 
				+    """
			
 
				+    keep = []
			
 
				+    for c in np.unique(cls):
			
 
				+        idx = np.where(cls == c)[0]
			
 
				+        x1, y1, x2, y2 = xyxy[idx].T
			
 
				+        area = (x2 - x1) * (y2 - y1)
			
 
				+        order = score[idx].argsort()[::-1]  # Sort by descending score
			
 
				+
			
 
				+        while order.size > 0:
			
 
				+            i = order[0]
			
 
				+            keep.append(idx[i])
			
 
				+            # Compute IoU with remaining boxes
			
 
				+            xx1 = np.maximum(x1[i], x1[order[1:]])
			
 
				+            yy1 = np.maximum(y1[i], y1[order[1:]])
			
 
				+            xx2 = np.minimum(x2[i], x2[order[1:]])
			
 
				+            yy2 = np.minimum(y2[i], y2[order[1:]])
			
 
				+            inter = np.clip(xx2 - xx1, 0, None) * np.clip(yy2 - yy1, 0, None)
			
 
				+            iou = inter / (area[i] + area[order[1:]] - inter + 1e-9)
			
 
				+
			
 
				+            # Keep boxes with IoU below threshold
			
 
				+            order = order[1:][iou < iou_thresh]
			
 
				+
			
 
				+    return keep
			
 
				+
			
 
				+
			
 
				+def xywh_to_xyxy(xywh: np.ndarray) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Convert bounding boxes from (x_center, y_center, w, h) to (x1, y1, x2, y2).
			
 
				+    @param xywh (N, 4) array in [center_x, center_y, width, height] format.
			
 
				+    @return (N, 4) array in [x1, y1, x2, y2] format.
			
 
				+    """
			
 
				+    x1y1 = xywh[:, :2] - xywh[:, 2:] / 2
			
 
				+    x2y2 = xywh[:, :2] + xywh[:, 2:] / 2
			
 
				+    return np.hstack([x1y1, x2y2])
			
 
				+
			
 
				+
			
 
				+def filter_classification(cls_output: np.ndarray, conf_thres_raw: float) -> tuple[np.ndarray, np.ndarray, np.ndarray]:
			
 
				+    """
			
 
				+    @brief Filter classification outputs using raw confidence threshold.
			
 
				+    @param cls_output Classification logits of shape (N, C).
			
 
				+    @param conf_thres_raw Threshold applied to max logit (before sigmoid).
			
 
				+    @return Tuple of:
			
 
				+        - scores: Sigmoid confidence scores of selected predictions
			
 
				+        - ids: Class indices of selected predictions
			
 
				+        - valid_indices: Original indices of selected predictions
			
 
				+    """
			
 
				+    cls_output = cls_output.reshape(-1, cls_output.shape[-1])
			
 
				+    max_scores = np.max(cls_output, axis=1)
			
 
				+    valid_indices = np.flatnonzero(max_scores >= conf_thres_raw)
			
 
				+    ids = np.argmax(cls_output[valid_indices], axis=1)
			
 
				+    # Apply sigmoid
			
 
				+    scores = 1 / (1 + np.exp(-max_scores[valid_indices]))
			
 
				+    return scores, ids, valid_indices
			
 
				+
			
 
				+
			
 
				+def filter_mces(mces_output: np.ndarray, valid_indices: np.ndarray) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Extract MCES features from selected predictions.
			
 
				+    @param mces_output.
			
 
				+    @param valid_indices Indices of valid predictions.
			
 
				+    @return Filtered MCES tensor of shape (K, D), K = len(valid_indices).
			
 
				+    """
			
 
				+    mces_output = mces_output.reshape(-1, mces_output.shape[-1])
			
 
				+    mces = mces_output[valid_indices, :]
			
 
				+    return mces
			
 
				+
			
 
				+
			
 
				+def filter_predictions(pred: np.ndarray, score_thres: float) -> tuple[np.ndarray, np.ndarray, np.ndarray]:
			
 
				+    """
			
 
				+    @brief Filter detection predictions by confidence threshold.
			
 
				+    @param pred Tensor of shape (N, 5 + C): [x, y, w, h, obj_conf, class_probs...].
			
 
				+    @param score_thres Threshold on (obj_conf * class_conf).
			
 
				+    @return Tuple of:
			
 
				+        - xyxy: Filtered bounding boxes (Nf, 4)
			
 
				+        - score: Filtered scores (Nf,)
			
 
				+        - cls: Class indices (Nf,)
			
 
				+    """
			
 
				+    xywh = pred[:, :4]
			
 
				+
			
 
				+    # Combine objectness and class scores
			
 
				+    conf_all = pred[:, 4:5] * pred[:, 5:]
			
 
				+    cls = conf_all.argmax(axis=1)
			
 
				+    score = conf_all[np.arange(len(pred)), cls]
			
 
				+    mask = score > score_thres
			
 
				+    xyxy = xywh_to_xyxy(xywh[mask])
			
 
				+    return xyxy, score[mask], cls[mask]
			
 
				+
			
 
				+
			
 
				+def gen_anchor(grid_size: int) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Generate anchor center positions on a square grid.
			
 
				+    @param grid_size Size of the square grid (e.g., 80 for 80x80).
			
 
				+    @return (N, 2) array of anchor coordinates [x, y].
			
 
				+    """
			
 
				+    x = np.tile(np.linspace(0.5, grid_size - 0.5, grid_size), reps=grid_size)
			
 
				+    y = np.repeat(np.linspace(0.5, grid_size - 0.5, grid_size), grid_size)
			
 
				+    return np.stack([x, y], axis=1)
			
 
				+
			
 
				+
			
 
				+def decode_boxes(boxes_output: np.ndarray,
			
 
				+                 valid_indices: np.ndarray,
			
 
				+                 grid_size: int,
			
 
				+                 stride: int,
			
 
				+                 weights_static: np.ndarray) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Decode bounding boxes from distributional predictions.
			
 
				+    @param boxes_output Tensor of shape (N, 4 * 16).
			
 
				+    @param valid_indices Indices of valid predictions.
			
 
				+    @param grid_size Feature map grid size.
			
 
				+    @param stride Downsampling factor.
			
 
				+    @param weights_static Discrete location weights (e.g., 0~15).
			
 
				+    @return Decoded bounding boxes in xyxy format (M, 4).
			
 
				+    """
			
 
				+    bboxes = boxes_output.reshape(-1, boxes_output.shape[-1])
			
 
				+    bboxes_float32 = bboxes[valid_indices]
			
 
				+    # Softmax over 16 bins per LTRB side and apply expectation
			
 
				+    ltrb = np.sum(softmax(bboxes_float32.reshape(-1, 4, 16), axis=2) *
			
 
				+                  weights_static, axis=2)
			
 
				+    anchor = gen_anchor(grid_size)[valid_indices]
			
 
				+    x1y1 = anchor - ltrb[:, 0:2]
			
 
				+    x2y2 = anchor + ltrb[:, 2:4]
			
 
				+    return np.hstack([x1y1, x2y2]) * stride
			
 
				+
			
 
				+
			
 
				+def decode_masks(mces: np.ndarray,
			
 
				+                 boxes: np.ndarray,
			
 
				+                 protos: np.ndarray,
			
 
				+                 input_w: int,
			
 
				+                 input_h: int,
			
 
				+                 mask_w: int,
			
 
				+                 mask_h: int,
			
 
				+                 mask_thresh: float = 0.5) -> list[np.ndarray]:
			
 
				+    """
			
 
				+    @brief Decode instance segmentation masks.
			
 
				+    @param mces Mask coefficients for each detection (M, C).
			
 
				+    @param boxes Bounding boxes (M, 4).
			
 
				+    @param protos Mask prototype feature map (H, W, C).
			
 
				+    @param input_w Width of the input image.
			
 
				+    @param input_h Height of the input image.
			
 
				+    @param mask_w Width of the mask proto.
			
 
				+    @param mask_h Height of the mask proto.
			
 
				+    @param mask_thresh Threshold to binarize masks.
			
 
				+    @return List of (H, W) binary mask arrays.
			
 
				+    """
			
 
				+    masks = []
			
 
				+    x_scale = mask_w / input_w
			
 
				+    y_scale = mask_h / input_h
			
 
				+
			
 
				+    for i, (x1, y1, x2, y2) in enumerate(boxes):
			
 
				+        # Crop proto features using scaled coordinates
			
 
				+        x1_corp = int(x1 * x_scale)
			
 
				+        y1_corp = int(y1 * y_scale)
			
 
				+        x2_corp = int(x2 * x_scale)
			
 
				+        y2_corp = int(y2 * y_scale)
			
 
				+
			
 
				+        proto_crop = protos[y1_corp:y2_corp, x1_corp:x2_corp, :]  # (H, W, C)
			
 
				+        mc = mces[i]
			
 
				+        # Linear combination and thresholding
			
 
				+        mask = (np.sum(proto_crop * mc[np.newaxis, np.newaxis, :], axis=2)
			
 
				+                > mask_thresh).astype(np.uint8)
			
 
				+        masks.append(mask)
			
 
				+
			
 
				+    return masks
			
 
				+
			
 
				+
			
 
				+def decode_kpts(kpts_output: np.ndarray,
			
 
				+                valid_indices: np.ndarray,
			
 
				+                grid_size: int,
			
 
				+                stride: int,
			
 
				+                anchor: np.ndarray = None) -> tuple[np.ndarray, np.ndarray]:
			
 
				+    """
			
 
				+    @brief Decode keypoint coordinates from model output.
			
 
				+    @param kpts_output Keypoint tensor of shape (N, 17*3).
			
 
				+    @param valid_indices Indices of valid predictions.
			
 
				+    @param grid_size Size of feature map grid.
			
 
				+    @param stride Downsampling factor (e.g., 8, 16, 32).
			
 
				+    @param anchor Optional anchor points. If None, generated automatically.
			
 
				+    @return Tuple:
			
 
				+            - kpts_xy: (M, 17, 2) pixel coordinates of keypoints.
			
 
				+            - kpts_score: (M, 17, 1) keypoint confidence scores.
			
 
				+    """
			
 
				+    kpts_output = kpts_output.reshape(-1, kpts_output.shape[-1])
			
 
				+    kpts = kpts_output[valid_indices].reshape(-1, 17, 3)  # (M, 17, 3)
			
 
				+
			
 
				+    if anchor is None:
			
 
				+        anchor = gen_anchor(grid_size)[valid_indices]  # (M, 2)
			
 
				+
			
 
				+    # Decode x, y using anchor and stride
			
 
				+    kpts_xy = (kpts[:, :, :2] * 2.0 + (anchor[:, None, :] - 0.5)) * stride
			
 
				+
			
 
				+    # Extract score without activation (or apply sigmoid optionally)
			
 
				+    kpts_score = kpts[:, :, 2:3]
			
 
				+
			
 
				+    return kpts_xy, kpts_score
			
 
				+
			
 
				+
			
 
				+def decode_layer(feat: np.ndarray,
			
 
				+                 stride: int,
			
 
				+                 anchor: np.ndarray,
			
 
				+                 classes_num: int = 80) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Decode a single feature layer from detection head.
			
 
				+    @param feat Raw model output tensor of shape (1, na, h, w, c).
			
 
				+    @param stride Stride of the feature layer.
			
 
				+    @param anchor Anchor sizes for this layer (na, 2).
			
 
				+    @param classes_num Number of output classes.
			
 
				+    @return Decoded prediction array of shape (N, 5 + num_classes).
			
 
				+    """
			
 
				+    _, _, h, w, _ = feat.shape  #  h/w: feature map size
			
 
				+
			
 
				+    # Create coordinate grid of shape (1, 1, h, w, 2)
			
 
				+    grid_y, grid_x = np.mgrid[0:h, 0:w]
			
 
				+    grid = np.stack((grid_x, grid_y), axis=-1)[None, None]
			
 
				+
			
 
				+    # batch sigmoid
			
 
				+    feat_sig = sigmoid(feat[..., :5 + classes_num])
			
 
				+
			
 
				+    # Decode center offsets (dx, dy) and size (dw, dh)
			
 
				+    dxdy = feat_sig[..., :2]
			
 
				+    dwdh = feat_sig[..., 2:4]
			
 
				+    obj  = feat_sig[..., 4:5]
			
 
				+    cls  = feat_sig[..., 5:]
			
 
				+
			
 
				+    # Compute center coordinates in original image scale
			
 
				+    xy = (dxdy * 2. - 0.5 + grid) * stride
			
 
				+
			
 
				+    # Compute width/height from anchor sizes
			
 
				+    wh = (dwdh * 2.) ** 2 * anchor[:, None, None, :]
			
 
				+
			
 
				+    # Construct final output tensor (xywh + obj + class scores)
			
 
				+    out = np.empty((*xy.shape[:-1], 5 + classes_num), dtype=np.float32)
			
 
				+    out[..., 0:2] = xy
			
 
				+    out[..., 2:4] = wh
			
 
				+    out[..., 4:5] = obj
			
 
				+    out[..., 5:]  = cls
			
 
				+
			
 
				+    return out.reshape(-1, 5 + classes_num)
			
 
				+
			
 
				+
			
 
				+def decode_outputs(output_names: list[str],
			
 
				+                   fp32_outputs: dict[str, np.ndarray],
			
 
				+                   strides: list[int],
			
 
				+                   anchors: list[np.ndarray],
			
 
				+                   classes_num: int = 80) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Decode all feature maps from model output.
			
 
				+    @param output_names List of output tensor names.
			
 
				+    @param fp32_outputs Dict of decoded tensors from model.
			
 
				+    @param strides Stride values for each output head.
			
 
				+    @param anchors Anchor arrays for each head.
			
 
				+    @param classes_num Number of output classes.
			
 
				+    @return Concatenated prediction tensor of shape (N, 5 + classes).
			
 
				+    """
			
 
				+    decoded = []
			
 
				+    for i, key in enumerate(output_names):
			
 
				+        out = fp32_outputs[key]
			
 
				+        h, w = out.shape[1:3]
			
 
				+        # Reshape and transpose to (1, na, h, w, c)
			
 
				+        feat = out.reshape(1, h, w, 3, 5 + classes_num).transpose(0, 3, 1, 2, 4)
			
 
				+        decoded.append(decode_layer(feat, strides[i], anchors[i], classes_num))
			
 
				+    return np.concatenate(decoded, axis=0)
			
 
				+
			
 
				+
			
 
				+def get_bounding_boxes(dilated_polys: list[np.ndarray], min_area: float) -> list[np.ndarray]:
			
 
				+    """
			
 
				+    @brief Extract minimum area bounding boxes from polygon contours.
			
 
				+    @param dilated_polys List of polygon contours. Each element is a NumPy array of shape (N, 1, 2).
			
 
				+    @param min_area Minimum area threshold to filter small boxes.
			
 
				+    @return List of bounding boxes. Each is a NumPy array of shape (4, 2), type int.
			
 
				+    """
			
 
				+    boxes_list = []
			
 
				+    for cnt in dilated_polys:
			
 
				+        if cv2.contourArea(cnt) < min_area:
			
 
				+            continue  # Skip small contours
			
 
				+        rect = cv2.minAreaRect(cnt)
			
 
				+        box = cv2.boxPoints(rect).astype(np.int_)
			
 
				+        boxes_list.append(box)
			
 
				+    return boxes_list
			
 
				+
			
 
				+
			
 
				+def resize_masks_to_boxes(masks: list[np.ndarray],
			
 
				+                          boxes: list[tuple[float, float, float, float]],
			
 
				+                          img_w: int, img_h: int,
			
 
				+                          interpolation: int = cv2.INTER_LANCZOS4,
			
 
				+                          do_morph: bool = True) -> list[np.ndarray]:
			
 
				+    """
			
 
				+    @brief Resize binary masks to fit inside their corresponding bounding boxes.
			
 
				+    @param masks List of binary mask arrays of shape (H, W), dtype=uint8.
			
 
				+    @param boxes List of bounding boxes in (x1, y1, x2, y2) format.
			
 
				+    @param img_w Width of the original image.
			
 
				+    @param img_h Height of the original image.
			
 
				+    @param interpolation OpenCV interpolation method used for resizing.
			
 
				+    @param do_morph Whether to apply morphological open to smooth the mask.
			
 
				+    @return List of resized binary masks cropped to box size.
			
 
				+    """
			
 
				+    resized_masks = []
			
 
				+    for mask, (x1, y1, x2, y2) in zip(masks, boxes):
			
 
				+        # Clamp coordinates to image bounds
			
 
				+        x1, y1 = max(int(x1), 0), max(int(y1), 0)
			
 
				+        x2, y2 = min(int(x2), img_w), min(int(y2), img_h)
			
 
				+
			
 
				+        target_w = max(x2 - x1, 1)
			
 
				+        target_h = max(y2 - y1, 1)
			
 
				+
			
 
				+        resized = cv2.resize(mask, (target_w, target_h), interpolation=interpolation)
			
 
				+
			
 
				+        if do_morph:
			
 
				+            # Apply morphological filtering
			
 
				+            resized = cv2.morphologyEx(resized, cv2.MORPH_OPEN, np.ones((5, 5), np.uint8))
			
 
				+
			
 
				+        resized_masks.append(resized)
			
 
				+
			
 
				+    return resized_masks
			
 
				+
			
 
				+
			
 
				+def scale_keypoints_to_original_image(kpts_xy: np.ndarray,
			
 
				+                                      kpts_score: np.ndarray,
			
 
				+                                      boxes: list[tuple[float, float, float, float]],
			
 
				+                                      img_w: int, img_h: int,
			
 
				+                                      input_w: int, input_h: int,
			
 
				+                                      resize_type: int = 1) -> tuple[np.ndarray, np.ndarray]:
			
 
				+    """
			
 
				+    @brief Scale keypoints back to original image coordinates.
			
 
				+    @param kpts_xy Keypoint coordinates of shape (M, 17, 2), float32.
			
 
				+    @param kpts_score Keypoint scores of shape (M, 17, 1), float32.
			
 
				+    @param boxes List of bounding boxes, not used here.
			
 
				+    @param img_w Width of the original image.
			
 
				+    @param img_h Height of the original image.
			
 
				+    @param input_w Width of model input.
			
 
				+    @param input_h Height of model input.
			
 
				+    @param resize_type 0 = direct resize, 1 = letterbox resize.
			
 
				+    @return Tuple of (scaled keypoints, scores), both NumPy arrays.
			
 
				+    """
			
 
				+    scaled_kpts = kpts_xy.copy()
			
 
				+
			
 
				+    if resize_type == 0:
			
 
				+        scale_x = img_w / input_w
			
 
				+        scale_y = img_h / input_h
			
 
				+        scaled_kpts[..., 0] *= scale_x
			
 
				+        scaled_kpts[..., 1] *= scale_y
			
 
				+
			
 
				+    elif resize_type == 1:
			
 
				+        scale = min(input_w / img_w, input_h / img_h)
			
 
				+        pad_w = (input_w - img_w * scale) / 2
			
 
				+        pad_h = (input_h - img_h * scale) / 2
			
 
				+        scaled_kpts[..., 0] = (scaled_kpts[..., 0] - pad_w) / scale
			
 
				+        scaled_kpts[..., 1] = (scaled_kpts[..., 1] - pad_h) / scale
			
 
				+
			
 
				+    else:
			
 
				+        raise ValueError("resize_type must be 0 or 1")
			
 
				+
			
 
				+    # Clip to image bounds
			
 
				+    scaled_kpts[..., 0] = np.clip(scaled_kpts[..., 0], 0, img_w)
			
 
				+    scaled_kpts[..., 1] = np.clip(scaled_kpts[..., 1], 0, img_h)
			
 
				+
			
 
				+    return scaled_kpts, kpts_score
			
 
				+
			
 
				+
			
 
				+def crop_and_rotate_image(img: np.ndarray, box: np.ndarray) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Crop and rotate a region from the image using a rotated bounding box.
			
 
				+    @param img Input image array of shape (H, W, C), dtype=uint8.
			
 
				+    @param box Bounding box as 4-point array of shape (4, 2).
			
 
				+    @return Cropped and rotated region image as a NumPy array.
			
 
				+    """
			
 
				+    rect = cv2.minAreaRect(box)
			
 
				+    box = cv2.boxPoints(rect).astype(np.intp)
			
 
				+    width = int(rect[1][0])
			
 
				+    height = int(rect[1][1])
			
 
				+    angle = rect[2]
			
 
				+
			
 
				+    src_pts = box.astype("float32")
			
 
				+    dst_pts = np.array([[0, height - 1],
			
 
				+                        [0, 0],
			
 
				+                        [width - 1, 0],
			
 
				+                        [width - 1, height - 1]], dtype="float32")
			
 
				+
			
 
				+    # Apply perspective transform
			
 
				+    M = cv2.getPerspectiveTransform(src_pts, dst_pts)
			
 
				+    warped = cv2.warpPerspective(img, M, (width, height))
			
 
				+
			
 
				+    # Rotate if angle is large
			
 
				+    if angle >= 45:
			
 
				+        rotated = cv2.rotate(warped, cv2.ROTATE_90_CLOCKWISE)
			
 
				+    else:
			
 
				+        rotated = warped
			
 
				+
			
 
				+    print("width:", rotated.shape[1], "height:", rotated.shape[0])
			
 
				+    return rotated
			
--- a/brain/PlannerNode2/Skill/person_approach_skill/skill_utils/preprocess_utils.py
+++ b/brain/PlannerNode2/Skill/person_approach_skill/skill_utils/preprocess_utils.py
@@ -0,0 +1,166 @@
 
				+# Copyright (c) 2025 D-Robotics Corporation
			
 
				+#
			
 
				+# Licensed under the Apache License, Version 2.0 (the "License");
			
 
				+# you may not use this file except in compliance with the License.
			
 
				+# You may obtain a copy of the License at
			
 
				+#
			
 
				+#     http://www.apache.org/licenses/LICENSE-2.0
			
 
				+#
			
 
				+# Unless required by applicable law or agreed to in writing, software
			
 
				+# distributed under the License is distributed on an "AS IS" BASIS,
			
 
				+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
			
 
				+# See the License for the specific language governing permissions and
			
 
				+# limitations under the License.
			
 
				+
			
 
				+# flake8: noqa: E501
			
 
				+
			
 
				+import cv2
			
 
				+import numpy as np
			
 
				+
			
 
				+
			
 
				+def bgr_to_nv12_planes(image: np.ndarray) -> tuple:
			
 
				+    """
			
 
				+    @brief Convert a BGR image to NV12 format (Y and UV planes).
			
 
				+    @param image Input BGR image as a NumPy array of shape (H, W, 3).
			
 
				+    @return A tuple of:
			
 
				+        - y: Y plane with shape (1, H, W, 1)
			
 
				+        - uv: UV plane with shape (1, H/2, W/2, 2)
			
 
				+    """
			
 
				+    height, width = image.shape[:2]
			
 
				+    area = height * width
			
 
				+
			
 
				+    # Convert to planar YUV I420 format
			
 
				+    yuv420p = cv2.cvtColor(image, cv2.COLOR_BGR2YUV_I420)
			
 
				+    yuv420p = yuv420p.reshape((area * 3 // 2,))
			
 
				+
			
 
				+    # Extract Y, U, V planes
			
 
				+    y = yuv420p[:area].reshape((height, width))
			
 
				+    u = yuv420p[area:area + area // 4].reshape((height // 2, width // 2))
			
 
				+    v = yuv420p[area + area // 4:].reshape((height // 2, width // 2))
			
 
				+
			
 
				+    # Interleave U and V to form UV plane
			
 
				+    uv = np.stack((u, v), axis=-1)
			
 
				+
			
 
				+    # Add batch and channel dimensions
			
 
				+    y = y[np.newaxis, :, :, np.newaxis]
			
 
				+    uv = uv[np.newaxis, :, :, :]
			
 
				+
			
 
				+    return y, uv
			
 
				+
			
 
				+
			
 
				+def resized_image(img: np.ndarray, input_W: int, input_H: int,
			
 
				+                  resize_type: int = 1,
			
 
				+                  interpolation=cv2.INTER_NEAREST) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Resize image with either direct resize or letterbox strategy.
			
 
				+    @param img Input image (H, W, 3).
			
 
				+    @param input_W Target width.
			
 
				+    @param input_H Target height.
			
 
				+    @param resize_type Resize method: 0 for direct resize, 1 for letterbox padding.
			
 
				+    @param interpolation Interpolation method (default: nearest).
			
 
				+    @return Resized image with shape (input_H, input_W, 3).
			
 
				+    """
			
 
				+    img_h, img_w = img.shape[:2]
			
 
				+
			
 
				+    if resize_type == 0:  # Direct resize
			
 
				+        resized = cv2.resize(img, (input_W, input_H), interpolation=interpolation)
			
 
				+    elif resize_type == 1:  # Letterbox resize (preserve aspect ratio)
			
 
				+        scale = min(input_H / img_h, input_W / img_w)
			
 
				+        new_w, new_h = int(img_w * scale), int(img_h * scale)
			
 
				+        resized = cv2.resize(img, (new_w, new_h))
			
 
				+
			
 
				+        pad_w = input_W - new_w
			
 
				+        pad_h = input_H - new_h
			
 
				+        left, right = pad_w // 2, pad_w - pad_w // 2
			
 
				+        top, bottom = pad_h // 2, pad_h - pad_h // 2
			
 
				+
			
 
				+        # Pad image with gray (127,127,127)
			
 
				+        resized = cv2.copyMakeBorder(resized, top, bottom, left, right,
			
 
				+                                     borderType=cv2.BORDER_CONSTANT,
			
 
				+                                     value=(127, 127, 127))
			
 
				+    else:
			
 
				+        raise ValueError(f"Invalid resize_type: {resize_type}, must be 0 or 1")
			
 
				+
			
 
				+    return resized
			
 
				+
			
 
				+
			
 
				+def split_nv12_bytes(nv12_bytes: bytes, width: int, height: int) -> tuple:
			
 
				+    """
			
 
				+    @brief Split raw NV12 bytes into Y and UV planes.
			
 
				+    @param nv12_bytes Input NV12-encoded byte stream.
			
 
				+    @param width Width of the image.
			
 
				+    @param height Height of the image.
			
 
				+    @return Tuple (y, uv), where:
			
 
				+        - y: shape (H, W), dtype uint8
			
 
				+        - uv: shape (H/2, W), dtype uint8 (interleaved UV)
			
 
				+    """
			
 
				+    y_size = width * height
			
 
				+    uv_size = y_size // 2
			
 
				+    nv12_array = np.frombuffer(nv12_bytes, dtype=np.uint8)
			
 
				+
			
 
				+    y = nv12_array[:y_size].reshape((height, width))
			
 
				+    uv = nv12_array[y_size:y_size + uv_size].reshape((height // 2, width))
			
 
				+
			
 
				+    return y, uv
			
 
				+
			
 
				+
			
 
				+def letterbox_resize_gray(gray_img: np.ndarray, target_w: int, target_h: int) -> np.ndarray:
			
 
				+    """
			
 
				+    @brief Resize a grayscale image using letterbox (aspect ratio preserving) strategy.
			
 
				+    @param gray_img Input grayscale image of shape (H, W).
			
 
				+    @param target_w Target width.
			
 
				+    @param target_h Target height.
			
 
				+    @return Resized and padded grayscale image of shape (target_h, target_w).
			
 
				+    """
			
 
				+    h, w = gray_img.shape
			
 
				+    scale = min(target_w / w, target_h / h)
			
 
				+    new_w, new_h = int(w * scale), int(h * scale)
			
 
				+    resized = cv2.resize(gray_img, (new_w, new_h))
			
 
				+
			
 
				+    pad_w = target_w - new_w
			
 
				+    pad_h = target_h - new_h
			
 
				+    top, bottom = pad_h // 2, pad_h - pad_h // 2
			
 
				+    left, right = pad_w // 2, pad_w - pad_w // 2
			
 
				+
			
 
				+    # Pad with value 127 (gray)
			
 
				+    padded = cv2.copyMakeBorder(resized, top, bottom, left, right,
			
 
				+                                borderType=cv2.BORDER_CONSTANT, value=127)
			
 
				+    return padded
			
 
				+
			
 
				+
			
 
				+def resize_nv12_yuv(y: np.ndarray, uv: np.ndarray,
			
 
				+                    target_h: int = 672, target_w: int = 672,
			
 
				+                    keep_ratio: bool = True) -> tuple:
			
 
				+    """
			
 
				+    @brief Resize Y and UV planes of an NV12 image to target resolution.
			
 
				+    @param y Y plane of shape (H, W).
			
 
				+    @param uv Interleaved UV plane of shape (H/2, W).
			
 
				+    @param target_h Target height.
			
 
				+    @param target_w Target width.
			
 
				+    @param keep_ratio Whether to preserve aspect ratio (uses letterbox if True).
			
 
				+    @return Tuple of resized:
			
 
				+        - y_resized: shape (target_h, target_w)
			
 
				+        - uv_resized: shape (target_h/2, target_w/2, 2)
			
 
				+    """
			
 
				+    # Resize Y
			
 
				+    if keep_ratio:
			
 
				+        y_resized = letterbox_resize_gray(y, target_w, target_h)
			
 
				+    else:
			
 
				+        y_resized = cv2.resize(y, (target_w, target_h))
			
 
				+
			
 
				+    # Split UV into U and V components
			
 
				+    u = uv[:, 0::2]
			
 
				+    v = uv[:, 1::2]
			
 
				+
			
 
				+    # Resize U and V separately
			
 
				+    if keep_ratio:
			
 
				+        u_resized = letterbox_resize_gray(u, target_w // 2, target_h // 2)
			
 
				+        v_resized = letterbox_resize_gray(v, target_w // 2, target_h // 2)
			
 
				+    else:
			
 
				+        u_resized = cv2.resize(u, (target_w // 2, target_h // 2))
			
 
				+        v_resized = cv2.resize(v, (target_w // 2, target_h // 2))
			
 
				+
			
 
				+    # Re-stack into UV plane
			
 
				+    uv_resized = np.stack((u_resized, v_resized), axis=-1)
			
 
				+
			
 
				+    return y_resized, uv_resized
			
--- a/brain/PlannerNode2/largemodel/largemodel/action_service.py
+++ b/brain/PlannerNode2/largemodel/largemodel/action_service.py
@@ -99,6 +99,10 @@ class CustomActionServer(Node):
 
				         self.first_record = True  # 首次记录位置 / First record
			
 
				         self.is_recording = False  # 录音状态 / Recording status
			
 
				         self.IS_SAVING = False #是否正在保存图像
			
 
				+        self.welcome_mode = False  # 迎宾模式标志 / Welcome mode flag
			
 
				+        self.process_map = {
			
 
				+            'person_approach': {'pid': None, 'sub': None, 'running': False}
			
 
				+        }  # 进程管理字典 / Process management map
			
 
				         self.joint6 = (
			
 
				             140  # 默认机械臂六轴的初始角度 / Default angle of the six-axis arm
			
 
				         )
			
@@ -497,10 +501,28 @@ class CustomActionServer(Node):
 
				         """
			
 
				 
			
 
				         if msg.data:
			
 
				-            if (
			
 
				+            self.get_logger().info(f"wakeup_callback: welcome_mode={self.welcome_mode}, action_runing={self.action_runing}")
			
 
				+            # 迎宾模式打断处理
			
 
				+            if self.welcome_mode:
			
 
				+                ##self.stop_event.set()  # 停止 TTS 播放
			
 
				+                # 杀掉所有管理的进程
			
 
				+                for process_name, process_info in self.process_map.items():
			
 
				+                    if process_info['pid'] is not None:
			
 
				+                        self.kill_process_tree(process_info['pid'])
			
 
				+                        process_info['pid'] = None
			
 
				+                    if process_info['sub'] is not None:
			
 
				+                        self.destroy_subscription(process_info['sub'])
			
 
				+                        process_info['sub'] = None
			
 
				+                    process_info['running'] = False
			
 
				+                self.welcome_mode = False
			
 
				+                self.stop_event.clear()  # 清除停止事件，避免影响后续播放
			
 
				+                self.get_logger().info("Welcome mode interrupted by wakeup")
			
 
				+
			
 
				+            elif (
			
 
				                 pygame.mixer.music.get_busy()  # 如果音乐正在播放/If the music is playing
			
 
				             ):
			
 
				                 self.stop_event.set()  # 停止正在播放的音乐/Stop the music currently playing
			
 
				+                self.stop_event.clear()  # 清除事件，避免影响后续播放
			
 
				             if (
			
 
				                 self.action_runing  # 如果当前有动作正在执行/If there is an action currently being
			
 
				             ):
			
@@ -508,6 +530,65 @@ class CustomActionServer(Node):
 
				                 self.stop()
			
 
				         # self.check_all_process()
			
 
				 
			
 
				+    def welcome(self):
			
 
				+        """
			
 
				+        迎宾模式函数 / Welcome mode function
			
 
				+        启动人物靠近检测节点，订阅检测事件，收到事件后播放欢迎语
			
 
				+        """
			
 
				+        if self.welcome_mode:
			
 
				+            self.get_logger().warn("Welcome mode already running")
			
 
				+            return
			
 
				+
			
 
				+        self.welcome_mode = True
			
 
				+
			
 
				+        # 启动 person_approach 节点
			
 
				+        process = subprocess.Popen(
			
 
				+            ["ros2", "launch", "person_approach_skill", "person_approach_node.launch.py"]
			
 
				+        )
			
 
				+        self.process_map['person_approach']['pid'] = process.pid
			
 
				+        self.process_map['person_approach']['running'] = True
			
 
				+        self.get_logger().info(f"Started person_approach node, PID: {process.pid}")
			
 
				+
			
 
				+        # 创建事件订阅
			
 
				+        self.process_map['person_approach']['sub'] = self.create_subscription(
			
 
				+            String, "/skill/person_approach/event",
			
 
				+            self.person_approach_event_callback, 10
			
 
				+        )
			
 
				+        self.get_logger().info("Subscribed to /skill/person_approach/event")
			
 
				+
			
 
				+    def person_approach_event_callback(self, msg):
			
 
				+        """
			
 
				+        人物靠近事件回调函数 / Person approach event callback
			
 
				+        收到事件后播放欢迎语
			
 
				+        """
			
 
				+        if not self.welcome_mode:
			
 
				+            return
			
 
				+
			
 
				+        try:
			
 
				+            data = json.loads(msg.data)
			
 
				+            if data.get('event') == 'person_approach':
			
 
				+                self.get_logger().info(f"Person approach detected: {data}")
			
 
				+
			
 
				+                # 停止上一个 TTS 播放
			
 
				+                self.stop_event.set()
			
 
				+                time.sleep(0.1)
			
 
				+
			
 
				+                # 欢迎语内容（后续可修改）
			
 
				+                welcome_text = "欢迎光临"
			
 
				+
			
 
				+                # TTS 合成
			
 
				+                self.model_client.voice_synthesis(
			
 
				+                    welcome_text, self.tts_out_path
			
 
				+                )
			
 
				+                # 异步播放
			
 
				+                self.play_audio_async(self.tts_out_path)
			
 
				+                self.get_logger().info(f"Playing welcome TTS: {welcome_text}")
			
 
				+
			
 
				+        except json.JSONDecodeError:
			
 
				+            self.get_logger().error("Failed to parse person_approach event data")
			
 
				+        except Exception as e:
			
 
				+            self.get_logger().error(f"Error in person_approach_event_callback: {e}")
			
 
				+
			
 
				     def get_current_pose(self):
			
 
				         """
			
 
				         获取当前在全局地图坐标系下的位置 /Get the current position in the global map coordinate system
			
@@ -556,6 +637,7 @@ class CustomActionServer(Node):
 
				         """
			
 
				         从navpose_dict字典中获取目标点坐标.并导航到目标点
			
 
				         """
			
 
				+        self.get_logger().info(f"navigation called with point_name: {point_name}")
			
 
				         self.navigation_finish_flag = False
			
 
				         self.goal_handle = None
			
 
				         self.result = None
			
@@ -1307,6 +1389,7 @@ class CustomActionServer(Node):
 
				             else:
			
 
				                 action_name, args_str = match.groups()
			
 
				                 args = [arg.strip() for arg in args_str.split(",")] if args_str else []
			
 
				+                self.get_logger().info(f"Executing action: {action_name} with args: {args}")
			
 
				                 method = getattr(self, action_name)
			
 
				                 method(*args)
			
 
				 
			
@@ -1370,6 +1453,7 @@ class CustomActionServer(Node):
 
				         """
			
 
				         return
			
 
				 
			
 
				+    @staticmethod
			
 
				     def kill_process_tree(pid):
			
 
				         try:
			
 
				             parent = psutil.Process(pid)
			
@@ -1408,16 +1492,24 @@ class CustomActionServer(Node):
 
				         """
			
 
				         同步方式播放音频函数The function for playing audio in synchronous mode
			
 
				         """
			
 
				+        self.get_logger().info(f"play_audio called: file={file_path}, is_recording={self.is_recording}")
			
 
				         if self.is_recording:
			
 
				+            self.get_logger().warn("play_audio: is_recording=True, skip")
			
 
				             return
			
 
				+        if pygame.mixer.music.get_busy():
			
 
				+            pygame.mixer.music.stop()
			
 
				+        self.stop_event.clear()
			
 
				         pygame.mixer.music.load(file_path)
			
 
				         pygame.mixer.music.play()
			
 
				+        self.get_logger().info(f"play_audio: started playing {file_path}")
			
 
				         while pygame.mixer.music.get_busy():
			
 
				             if self.stop_event.is_set() or self.is_recording:
			
 
				                 pygame.mixer.music.stop()
			
 
				-                self.stop_event.clear()  # 清除事件
			
 
				+                self.stop_event.clear()
			
 
				+                self.get_logger().info("play_audio: stopped by event")
			
 
				                 return
			
 
				             pygame.time.Clock().tick(10)
			
 
				+        self.get_logger().info("play_audio: playback finished")
			
 
				         if feedback:
			
 
				             self.action_status_pub("response_done")
			
 
				 
			
@@ -1426,19 +1518,29 @@ class CustomActionServer(Node):
 
				         异步方式播放音频函数The function for playing audio in asynchronous mode
			
 
				         """
			
 
				         if self.is_recording:
			
 
				+            self.get_logger().warn("play_audio_async: is_recording=True, skip")
			
 
				             return
			
 
				 
			
 
				         def target():
			
 
				-            pygame.mixer.music.load(file_path)
			
 
				-            pygame.mixer.music.play()
			
 
				-            while pygame.mixer.music.get_busy():
			
 
				-                if self.stop_event.is_set() or self.is_recording:
			
 
				-                    pygame.mixer.music.stop()
			
 
				-                    self.stop_event.clear()  # 清除事件
			
 
				-                    return
			
 
				-                pygame.time.Clock().tick(5)
			
 
				-            if feedback:
			
 
				-                self.action_status_pub("response_done")
			
 
				+            try:
			
 
				+                if pygame.mixer.music.get_busy():
			
 
				+                    pygame.mixer.music.stop()  # 只在播放中才停止
			
 
				+                pygame.mixer.music.load(file_path)
			
 
				+                self.stop_event.clear()  # 清除停止事件，在播放前清除
			
 
				+                pygame.mixer.music.play()
			
 
				+                self.get_logger().info(f"play_audio_async: started playing {file_path}")
			
 
				+                while pygame.mixer.music.get_busy():
			
 
				+                    if self.stop_event.is_set() or self.is_recording:
			
 
				+                        pygame.mixer.music.stop()
			
 
				+                        self.stop_event.clear()
			
 
				+                        self.get_logger().info("play_audio_async: stopped by event")
			
 
				+                        return
			
 
				+                    pygame.time.Clock().tick(5)
			
 
				+                self.get_logger().info("play_audio_async: playback finished")
			
 
				+                if feedback:
			
 
				+                    self.action_status_pub("response_done")
			
 
				+            except Exception as e:
			
 
				+                self.get_logger().error(f"play_audio_async error: {e}")
			
 
				 
			
 
				         thread = threading.Thread(target=target)
			
 
				         thread.daemon = True
			
--- a/brain/PlannerNode2/largemodel/utils/promot.py
+++ b/brain/PlannerNode2/largemodel/utils/promot.py
@@ -208,6 +208,9 @@ action_function_library='''
 
				 - **获取当前视角图像**:`seewhat()`  
			
 
				   - 说明:调用后机器人上传一张`640×480`像素的俯视图像,用于物体定位。  
			
 
				 ## 其他函数   
			
 
				+- **迎宾模式**:`welcome()`
			
 
				+  - 说明:启动迎宾模式,机器人会检测人员靠近并播放欢迎语"欢迎光临"。
			
 
				+
			
 
				 - **结束当前任务周期**:`finish_dialogue()`  
			
 
				   - 说明:清空上下文,结束任务（如用户指令“退下”“休息”）。  
			
 
				 - **等待一段时间**:`wait(x)`