smartpi 0.1.34__py3-none-any.whl → 0.1.36__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
smartpi/__init__.py CHANGED
@@ -4,5 +4,5 @@ from .base_driver import P1, P2, P3, P4, P5, P6, M1, M2, M3, M4, M5, M6
4
4
  __all__ = ["base_driver","gui","ultrasonic","touch_sensor","temperature","humidity","light_sensor","color_sensor","motor","servo","led","flash",
5
5
  "P1", "P2", "P3", "P4", "P5", "P6", "M1", "M2", "M3", "M4", "M5", "M6"]
6
6
 
7
- __version__ = "0.1.34"
7
+ __version__ = "0.1.36"
8
8
 
smartpi/base_driver.py CHANGED
@@ -415,6 +415,7 @@ def single_operate_sensor(op_struct: bytes, block_time: float) -> Optional[bytes
415
415
  def P_port_init(port:bytes) -> Optional[bytes]:
416
416
  servo_str=[0xA0, 0x0F, 0x00, 0xBE]
417
417
  servo_str[0]=0XA0+port
418
+ time.sleep(0.005)
418
419
  response = single_operate_sensor(servo_str,0)
419
420
  if response:
420
421
  return 0
smartpi/camera.py ADDED
@@ -0,0 +1,84 @@
1
+ # coding: utf-8
2
+ import cv2
3
+ import os
4
+ import time
5
+ import platform
6
+
7
class Camera:
    """Thin wrapper around ``cv2.VideoCapture``.

    Probes a sequence of device indexes, prefers the V4L2 backend (with
    optional hardware acceleration) on Linux, and serves frames resized to a
    fixed target resolution.
    """

    def __init__(self, indexes=(0, 1, 2, 3), target_width=640, target_height=480):
        """Create the camera and immediately try to open a device.

        indexes: candidate device indexes to probe, in order.
            (Default is a tuple, not a list, so the default cannot be
            mutated and shared across instances.)
        target_width / target_height: resolution every returned frame is
            resized to.
        """
        self.cap = None
        self.indexes = indexes
        self.target_width = target_width
        self.target_height = target_height
        self.open_camera()

    def open_camera(self):
        """Open the first working camera index.

        On Linux uses the V4L2 backend and tries to enable hardware
        acceleration when the OpenCV build exposes the constants.
        Returns True on success (``self.cap`` is set), False otherwise.
        """
        for idx in self.indexes:
            try:
                if platform.system() == "Linux":
                    cap = cv2.VideoCapture(idx, cv2.CAP_V4L2)
                    # Enable HW acceleration where supported (newer OpenCV).
                    try:
                        if hasattr(cv2, 'CAP_PROP_HW_ACCELERATION') and hasattr(cv2, 'VIDEO_ACCELERATION_ANY'):
                            cap.set(cv2.CAP_PROP_HW_ACCELERATION, cv2.VIDEO_ACCELERATION_ANY)
                    except AttributeError as ae:
                        print(f"硬件加速设置不支持,使用默认配置: {ae}")
                else:
                    cap = cv2.VideoCapture(idx)

                if cap.isOpened():
                    # Request the target resolution, then read back what the
                    # driver actually granted (may differ).
                    cap.set(cv2.CAP_PROP_FRAME_WIDTH, self.target_width)
                    cap.set(cv2.CAP_PROP_FRAME_HEIGHT, self.target_height)
                    actual_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
                    actual_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
                    print(f"摄像头 {idx} 已打开, 分辨率: {actual_width}x{actual_height}")
                    self.cap = cap
                    return True
                # FIX: release the handle of a device that failed to open;
                # the original leaked one VideoCapture per bad index.
                cap.release()
            except Exception as e:
                print(f"尝试打开摄像头 {idx} 失败: {e}")
                continue

        print("无法打开任何摄像头")
        return False

    def read_frame(self):
        """Read one frame, reopening the camera once on read failure.

        Returns (True, frame) on success, (False, None) otherwise.  The frame
        is resized to the target resolution when needed.
        """
        if not self.cap or not self.cap.isOpened():
            return False, None

        ret, frame = self.cap.read()
        if not ret:
            print("读取帧失败,尝试重新打开摄像头...")
            self.release()
            time.sleep(1)
            # FIX: retry at most once instead of recursing; the original
            # recursed without bound if the device reopened but every
            # subsequent read still failed.
            if not self.open_camera():
                return False, None
            ret, frame = self.cap.read()
            if not ret:
                return False, None

        # Normalize to the target resolution.
        if frame.shape[1] != self.target_width or frame.shape[0] != self.target_height:
            frame = cv2.resize(frame, (self.target_width, self.target_height))

        return True, frame

    def get_resolution(self):
        """Return the current (width, height).

        Reads the live values from the device when it is open; otherwise
        falls back to the configured target resolution.
        """
        if self.cap and self.cap.isOpened():
            return (
                int(self.cap.get(cv2.CAP_PROP_FRAME_WIDTH)),
                int(self.cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
            )
        return self.target_width, self.target_height

    def release(self):
        """Release the camera resource (safe to call repeatedly)."""
        if self.cap and self.cap.isOpened():
            self.cap.release()
        self.cap = None
smartpi/color_sensor.py CHANGED
@@ -8,6 +8,7 @@ def get_value(port:bytes) -> Optional[bytes]:
8
8
  color_str=[0xA0, 0x04, 0x00, 0xBE]
9
9
  color_str[0]=0XA0+port
10
10
  color_str[2]=1
11
+ time.sleep(0.005)
11
12
  response = base_driver.single_operate_sensor(color_str,0)
12
13
  if response == None:
13
14
  return None
smartpi/humidity.py CHANGED
@@ -9,6 +9,7 @@ def get_value(port:bytes) -> Optional[bytes]:
9
9
  humi_str=[0XA0, 0X0C, 0X01, 0X71, 0X00, 0XBE]
10
10
  humi_str[0]=0XA0+port
11
11
  humi_str[4]=0X01
12
+ time.sleep(0.005)
12
13
  response = base_driver.single_operate_sensor(humi_str,0)
13
14
  if response == None:
14
15
  return None
smartpi/led.py CHANGED
@@ -10,6 +10,7 @@ def set_color(port:bytes,command:bytes) -> Optional[bytes]:
10
10
  color_lamp_str[0]=0XA0+port
11
11
  color_lamp_str[2]=command
12
12
  # response = base_driver.single_operate_sensor(color_lamp_str,0)
13
+ time.sleep(0.005)
13
14
  base_driver.write_data(0X01, 0X02, color_lamp_str)
14
15
  # if response == None:
15
16
  # return None
smartpi/light_sensor.py CHANGED
@@ -9,7 +9,7 @@ def turn_off(port:bytes) -> Optional[bytes]:
9
9
  light_str[0]=0XA0+port
10
10
  light_str[2]=0x03
11
11
  # response = base_driver.single_operate_sensor(light_str,0)
12
- # base_driver.write_data(0X01, 0X02, light_str)
12
+ base_driver.write_data(0X01, 0X02, light_str)
13
13
  # if response == None:
14
14
  # return None
15
15
  # else:
@@ -20,6 +20,7 @@ def get_value(port:bytes) -> Optional[bytes]:
20
20
  light_str=[0xA0, 0x02, 0x00, 0xBE]
21
21
  light_str[0]=0XA0+port
22
22
  light_str[2]=0x01
23
+ time.sleep(0.005)
23
24
  response = base_driver.single_operate_sensor(light_str,0)
24
25
  if response == None:
25
26
  return None
@@ -35,17 +36,20 @@ def set_threshold(port:bytes,threshold:int) -> Optional[bytes]:
35
36
  light_str[2]=0x04
36
37
  light_str[4]=threshold//256
37
38
  light_str[5]=threshold%256
38
- response = base_driver.single_operate_sensor(light_str,0)
39
- if response == None:
40
- return None
41
- else:
42
- return 0
39
+ time.sleep(0.005)
40
+ base_driver.write_data(0X01, 0X02, light_str)
41
+ # response = base_driver.single_operate_sensor(light_str,0)
42
+ # if response == None:
43
+ # return None
44
+ # else:
45
+ return 0
43
46
 
44
47
  # Read light threshold (port: connected P port)  [reconstructed from mojibake comment]
45
48
  def get_threshold(port:bytes) -> Optional[bytes]:
46
49
  light_str=[0xA0, 0x02, 0x00, 0xBE]
47
50
  light_str[0]=0XA0+port
48
51
  light_str[2]=0x05
52
+ time.sleep(0.005)
49
53
  response = base_driver.single_operate_sensor(light_str,0)
50
54
  if response == None:
51
55
  return None
@@ -59,6 +63,7 @@ def get_bool_data(port:bytes) -> Optional[bytes]:
59
63
  light_str=[0xA0, 0x02, 0x00, 0xBE]
60
64
  light_str[0]=0XA0+port
61
65
  light_str[2]=0x06
66
+ time.sleep(0.005)
62
67
  response = base_driver.single_operate_sensor(light_str,0)
63
68
  if response == None:
64
69
  return None
smartpi/motor.py CHANGED
@@ -8,7 +8,8 @@ from smartpi import base_driver
8
8
  # Read motor encoder (port: connected M port)  [reconstructed from mojibake comment]
9
9
  def get_motor_encoder(port:bytes) -> Optional[bytes]:
10
10
  motor_str=[0xA0, 0x01, 0x01, 0xBE]
11
- motor_str[0]=0XA0+port
11
+ motor_str[0]=0XA0+port
12
+ time.sleep(0.005)
12
13
  response = base_driver.single_operate_sensor(motor_str,0)
13
14
  if response == None:
14
15
  return None
@@ -22,6 +23,7 @@ def reset_motor_encoder(port:bytes) -> Optional[bytes]:
22
23
  motor_str=[0xA0, 0x01, 0x03, 0xBE]
23
24
  motor_str[0]=0XA0+port
24
25
  # response = base_driver.single_operate_sensor(motor_str,0)
26
+ time.sleep(0.005)
25
27
  base_driver.write_data(0X01, 0X02, motor_str)
26
28
  # if response == None:
27
29
  # return None
@@ -34,6 +36,7 @@ def set_motor_direction(port:bytes,direc:bytes) -> Optional[bytes]:
34
36
  motor_str[0]=0XA0+port
35
37
  motor_str[4]=direc
36
38
  # response = base_driver.single_operate_sensor(motor_str,0)
39
+ time.sleep(0.005)
37
40
  base_driver.write_data(0X01, 0X02, motor_str)
38
41
  # if response == None:
39
42
  # return None
@@ -56,6 +59,7 @@ def set_motor(port:bytes,speed:int) -> Optional[bytes]:
56
59
  motor_str[4]=m_par
57
60
 
58
61
  # response = base_driver.single_operate_sensor(motor_str,0)
62
+ time.sleep(0.005)
59
63
  base_driver.write_data(0X01, 0X02, motor_str)
60
64
  # if response == None:
61
65
  # return None
@@ -67,6 +71,7 @@ def set_motor_stop(port:bytes) -> Optional[bytes]:
67
71
  motor_str=[0xA0, 0x01, 0x0B, 0xBE]
68
72
  motor_str[0]=0XA0+port
69
73
  # response = base_driver.single_operate_sensor(motor_str,0)
74
+ time.sleep(0.005)
70
75
  base_driver.write_data(0X01, 0X02, motor_str)
71
76
  # if response == None:
72
77
  # return None
@@ -91,6 +96,7 @@ def set_motor_angle(port:bytes,speed:int,degree:int) -> Optional[bytes]:
91
96
  motor_str[6]=degree//256
92
97
  motor_str[7]=degree%256
93
98
  # response = base_driver.single_operate_sensor(motor_str,0)
99
+ time.sleep(0.005)
94
100
  base_driver.write_data(0X01, 0X02, motor_str)
95
101
  # if response == None:
96
102
  # return None
@@ -122,6 +128,7 @@ def set_motor_second(port:bytes,speed:int,second:float) -> Optional[bytes]:
122
128
  motor_str[9]=byte_array[3]
123
129
 
124
130
  # response = base_driver.single_operate_sensor(motor_str,0)
131
+ time.sleep(0.005)
125
132
  base_driver.write_data(0X01, 0X02, motor_str)
126
133
  # if response == None:
127
134
  # return None
@@ -145,6 +152,7 @@ def set_motor_constspeed(port:bytes,speed:int) -> Optional[bytes]:
145
152
  motor_str[4]=m_par
146
153
 
147
154
  # response = base_driver.single_operate_sensor(motor_str,0)
155
+ time.sleep(0.005)
148
156
  base_driver.write_data(0X01, 0X02, motor_str)
149
157
  # if response == None:
150
158
  # return None
@@ -154,7 +162,8 @@ def set_motor_constspeed(port:bytes,speed:int) -> Optional[bytes]:
154
162
  # Read motor speed (port: connected M port)  [reconstructed from mojibake comment]
155
163
  def get_motor_speed(port:bytes) -> Optional[bytes]:
156
164
  motor_str=[0xA0, 0x01, 0x10, 0xBE]
157
- motor_str[0]=0XA0+port
165
+ motor_str[0]=0XA0+port
166
+ time.sleep(0.005)
158
167
  response = base_driver.single_operate_sensor(motor_str,0)
159
168
  if response == None:
160
169
  return None
smartpi/move.py CHANGED
@@ -19,12 +19,13 @@ def run_second(dir:bytes,speed:bytes,second:bytes) -> Optional[bytes]:
19
19
 
20
20
  move_str[6]=speed
21
21
  move_str[8]=second
22
-
23
- response = base_driver.single_operate_sensor(move_str,0)
24
- if response == None:
25
- return None
26
- else:
27
- return 0
22
+ time.sleep(0.005)
23
+ base_driver.write_data(0X01, 0X02, move_str)
24
+ # response = base_driver.single_operate_sensor(move_str,0)
25
+ # if response == None:
26
+ # return None
27
+ # else:
28
+ return 0
28
29
 
29
30
  #以速度移动x度:dir:方向forward、backward、turnright、turnleft:speed:0~100:angle:65535
30
31
  def run_angle(dir:bytes,speed:bytes,angle:int) -> Optional[bytes]:
@@ -43,11 +44,13 @@ def run_angle(dir:bytes,speed:bytes,angle:int) -> Optional[bytes]:
43
44
  move_str[8]=angle//256
44
45
  move_str[9]=angle%256
45
46
 
46
- response = base_driver.single_operate_sensor(move_str,0)
47
- if response == None:
48
- return None
49
- else:
50
- return 0
47
+ time.sleep(0.005)
48
+ base_driver.write_data(0X01, 0X02, move_str)
49
+ # response = base_driver.single_operate_sensor(move_str,0)
50
+ # if response == None:
51
+ # return None
52
+ # else:
53
+ return 0
51
54
 
52
55
  #以速度移动:dir:方向forward、backward、turnright、turnleft;speed:0~100;
53
56
  def run(dir:bytes,speed:bytes) -> Optional[bytes]:
@@ -64,11 +67,13 @@ def run(dir:bytes,speed:bytes) -> Optional[bytes]:
64
67
 
65
68
  move_str[6]=speed
66
69
 
67
- response = base_driver.single_operate_sensor(move_str,0)
68
- if response == None:
69
- return None
70
- else:
71
- return 0
70
+ time.sleep(0.005)
71
+ base_driver.write_data(0X01, 0X02, move_str)
72
+ # response = base_driver.single_operate_sensor(move_str,0)
73
+ # if response == None:
74
+ # return None
75
+ # else:
76
+ return 0
72
77
 
73
78
  #设置左右轮速度移动x秒:Lspeed:-100~100;Rspeed:-100~100;second:1~255
74
79
  def run_speed_second(Lspeed:int,Rspeed:int,second:bytes) -> Optional[bytes]:
@@ -98,11 +103,13 @@ def run_speed_second(Lspeed:int,Rspeed:int,second:bytes) -> Optional[bytes]:
98
103
 
99
104
  move_str[8]=second
100
105
 
101
- response = base_driver.single_operate_sensor(move_str,0)
102
- if response == None:
103
- return None
104
- else:
105
- return 0
106
+ time.sleep(0.005)
107
+ base_driver.write_data(0X01, 0X02, move_str)
108
+ # response = base_driver.single_operate_sensor(move_str,0)
109
+ # if response == None:
110
+ # return None
111
+ # else:
112
+ return 0
106
113
 
107
114
  #设置左右轮速度移动:Lspeed:-100~100;Rspeed:-100~100;
108
115
  def run_speed(Lspeed:int,Rspeed:int) -> Optional[bytes]:
@@ -130,11 +137,13 @@ def run_speed(Lspeed:int,Rspeed:int) -> Optional[bytes]:
130
137
 
131
138
  move_str[4]=m_par
132
139
 
133
- response = base_driver.single_operate_sensor(move_str,0)
134
- if response == None:
135
- return None
136
- else:
137
- return 0
140
+ time.sleep(0.005)
141
+ base_driver.write_data(0X01, 0X02, move_str)
142
+ # response = base_driver.single_operate_sensor(move_str,0)
143
+ # if response == None:
144
+ # return None
145
+ # else:
146
+ return 0
138
147
 
139
148
  #设置左右轮功率移动:Lpower:0~100;Rpower:0~100;
140
149
  def run_power(Lpower:bytes,Rpower:bytes) -> Optional[bytes]:
@@ -143,11 +152,13 @@ def run_power(Lpower:bytes,Rpower:bytes) -> Optional[bytes]:
143
152
  move_str[4]=Rpower
144
153
  move_str[6]=Lpower
145
154
 
146
- response = base_driver.single_operate_sensor(move_str,0)
147
- if response == None:
148
- return None
149
- else:
150
- return 0
155
+ time.sleep(0.005)
156
+ base_driver.write_data(0X01, 0X02, move_str)
157
+ # response = base_driver.single_operate_sensor(move_str,0)
158
+ # if response == None:
159
+ # return None
160
+ # else:
161
+ return 0
151
162
 
152
163
  #设置最大功率:M1:0~100;M2:0~100;M3:0~100;M4:0~100;M5:0~100;M6:0~100;
153
164
  def set_maxpower(M1:bytes,M2:bytes,M3:bytes,M4:bytes,M5:bytes,M6:bytes) -> Optional[bytes]:
@@ -160,21 +171,25 @@ def set_maxpower(M1:bytes,M2:bytes,M3:bytes,M4:bytes,M5:bytes,M6:bytes) -> Optio
160
171
  move_str[12]=M5
161
172
  move_str[14]=M6
162
173
 
163
- response = base_driver.single_operate_sensor(move_str,0)
164
- if response == None:
165
- return None
166
- else:
167
- return 0
174
+ time.sleep(0.005)
175
+ base_driver.write_data(0X01, 0X02, move_str)
176
+ # response = base_driver.single_operate_sensor(move_str,0)
177
+ # if response == None:
178
+ # return None
179
+ # else:
180
+ return 0
168
181
 
169
182
  #马达停止
170
183
  def stop() -> Optional[bytes]:
171
184
  move_str=[0xA0, 0x01, 0x0A, 0xBE]
172
185
 
173
- response = base_driver.single_operate_sensor(move_str,0)
174
- if response == None:
175
- return None
176
- else:
177
- return 0
186
+ time.sleep(0.005)
187
+ base_driver.write_data(0X01, 0X02, move_str)
188
+ # response = base_driver.single_operate_sensor(move_str,0)
189
+ # if response == None:
190
+ # return None
191
+ # else:
192
+ return 0
178
193
 
179
194
  #设置左右轮方向:Lmotor:1~6;Rmotor:1~6;state: no_reversal、all_reversal、left_reversal、right_reversal
180
195
  def set_move_init(Lmotor:bytes,Rmotor:bytes,state:bytes) -> Optional[bytes]:
@@ -192,10 +207,12 @@ def set_move_init(Lmotor:bytes,Rmotor:bytes,state:bytes) -> Optional[bytes]:
192
207
  move_str[6]=Rmotor
193
208
  move_str[8]=Lmotor
194
209
 
195
- response = base_driver.single_operate_sensor(move_str,0)
196
- if response == None:
197
- return None
198
- else:
199
- return 0
210
+ time.sleep(0.005)
211
+ base_driver.write_data(0X01, 0X02, move_str)
212
+ # response = base_driver.single_operate_sensor(move_str,0)
213
+ # if response == None:
214
+ # return None
215
+ # else:
216
+ return 0
200
217
 
201
218
 
@@ -0,0 +1,201 @@
1
+ import cv2
2
+ import numpy as np
3
+ import onnxruntime as ort
4
+ import mediapipe as mp
5
+ import json
6
+ from PIL import Image
7
+ import time # 用于时间测量
8
+
9
class GestureWorkflow:
    """Hand-gesture classification pipeline.

    MediaPipe Hands extracts 21 hand keypoints, the keypoints are min/max
    normalized with parameters stored in the ONNX model's metadata, and an
    ONNX Runtime session runs the classifier.
    """

    def __init__(self, model_path):
        """Build the MediaPipe detector and load the ONNX model.

        model_path: path to the ONNX classifier file.
        """
        # Video-stream mode; set static_image_mode=True when classifying
        # single still images.  max_num_hands=2 would track both hands.
        self.mp_hands = mp.solutions.hands
        self.hands = self.mp_hands.Hands(
            static_image_mode=False,
            max_num_hands=1,
            min_detection_confidence=0.5,   # keypoint detection threshold
            model_complexity=0,             # lightest model; raise to 1 if accuracy is poor
        )

        # Normalization parameters and class labels, filled from metadata.
        self.min_vals = None
        self.max_vals = None
        self.class_labels = None

        self.load_model(model_path)

    def load_model(self, model_path):
        """Create the ONNX Runtime session and parse its metadata."""
        self.session = ort.InferenceSession(model_path)
        self._load_metadata()

    def _load_metadata(self):
        """Load normalization ranges and class labels from ONNX model metadata.

        Supports both the modern ``custom_metadata_map`` attribute and the
        older ``metadata_props`` list.
        """
        model_meta = self.session.get_modelmeta()

        if hasattr(model_meta, 'custom_metadata_map'):
            metadata = model_meta.custom_metadata_map
            if 'minMaxValues' in metadata:
                min_max_data = json.loads(metadata['minMaxValues'])
                self.min_vals = min_max_data.get('min')
                self.max_vals = min_max_data.get('max')

            if 'classes' in metadata:
                class_labels = json.loads(metadata['classes'])
                self.class_labels = list(class_labels.values()) if isinstance(class_labels, dict) else class_labels
        else:
            # Older ONNX Runtime versions expose metadata_props instead.
            for prop in model_meta.metadata_props:
                if prop.key == 'minMaxValues':
                    min_max_data = json.loads(prop.value)
                    self.min_vals = min_max_data.get('min')
                    self.max_vals = min_max_data.get('max')
                elif prop.key == 'classes':
                    class_labels = json.loads(prop.value)
                    self.class_labels = list(class_labels.values()) if isinstance(class_labels, dict) else class_labels

        # Fall back to the default label set when the model carries none.
        if self.class_labels is None:
            self.class_labels = ["点赞", "点踩", "胜利", "拳头", "我爱你", "手掌"]

    def preprocess_image(self, image, target_width=224, target_height=224):
        """Letterbox *image* onto a white target-size canvas.

        Scales preserving aspect ratio, centers on a white background, and
        returns the result as an OpenCV BGR image.
        """
        # OpenCV BGR -> PIL RGB
        image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
        pil_image = Image.fromarray(image_rgb)

        # Uniform scale that fits inside the target box.
        width, height = pil_image.size
        scale = min(target_width / width, target_height / height)

        new_width = int(width * scale)
        new_height = int(height * scale)
        x = (target_width - new_width) // 2
        y = (target_height - new_height) // 2

        # White canvas with the resized image pasted centered.
        canvas = Image.new('RGB', (target_width, target_height), (255, 255, 255))
        resized_image = pil_image.resize((new_width, new_height), Image.Resampling.LANCZOS)
        canvas.paste(resized_image, (x, y))

        # Back to OpenCV BGR.
        processed_image = np.array(canvas)
        return cv2.cvtColor(processed_image, cv2.COLOR_RGB2BGR)

    def extract_hand_keypoints(self, image):
        """Extract 21 hand keypoints (x, y, z flattened) or None if no hand."""
        image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
        results = self.hands.process(image_rgb)

        if results.multi_hand_landmarks:
            # Use only the first detected hand.
            # NOTE(review): presence is checked on multi_hand_landmarks but
            # the world-coordinate list is indexed — presumably MediaPipe
            # fills both together; confirm against the mediapipe version used.
            landmarks = results.multi_hand_world_landmarks[0]

            keypoints = []
            for landmark in landmarks.landmark:
                keypoints.extend([landmark.x, landmark.y, landmark.z])

            return np.array(keypoints, dtype=np.float32)
        return None

    def normalize_keypoints(self, keypoints):
        """Min/max-normalize keypoints with the model's stored ranges.

        Values beyond the stored range length, or axes with a degenerate
        (zero-width) range, are passed through as-is / zeroed respectively.
        Returns the input unchanged when no ranges were loaded.
        """
        if self.min_vals is None or self.max_vals is None:
            return keypoints

        normalized = []
        for i, value in enumerate(keypoints):
            if i < len(self.min_vals) and i < len(self.max_vals):
                min_val = self.min_vals[i]
                max_val = self.max_vals[i]
                if max_val - min_val > 0:
                    normalized.append((value - min_val) / (max_val - min_val))
                else:
                    # FIX: 0.0 (float) instead of int 0 to keep dtype uniform.
                    normalized.append(0.0)
            else:
                normalized.append(value)

        return np.array(normalized, dtype=np.float32)

    def predict_frame(self, frame):
        """Classify the gesture in an image frame.

        Returns (raw_probabilities, formatted_result_dict); when no hand is
        detected, returns (None, {"error": ...}).
        """
        start_time = time.time()
        processed_image = self.preprocess_image(frame, 224, 224)

        keypoints = self.extract_hand_keypoints(processed_image)
        min_time = time.time()
        hand_time = min_time - start_time
        # print(f"keypoint extraction took: {hand_time:.4f}s")
        if keypoints is None:
            return None, {"error": "未检测到手部"}

        normalized_kps = self.normalize_keypoints(keypoints)

        # ONNX expects a (1, N) float32 batch.
        input_data = normalized_kps.reshape(1, -1).astype(np.float32)

        input_name = self.session.get_inputs()[0].name
        outputs = self.session.run(None, {input_name: input_data})
        predictions = outputs[0][0]

        # FIX: cast the NumPy scalar from argmax to a plain int so the
        # result dict is JSON-serializable and behaves as expected.
        class_id = int(np.argmax(predictions))
        confidence = float(predictions[class_id])

        label = self.class_labels[class_id] if class_id < len(self.class_labels) else f"未知类别 {class_id}"
        end_time = time.time()
        all_time = end_time - start_time
        onnx_time = end_time - min_time
        print(f"onnx耗时: {onnx_time:.4f}秒")
        print(f"总耗时: {all_time:.4f}秒")

        raw_result = predictions.tolist()
        formatted_result = {
            'class': label,
            'confidence': confidence,
            'class_id': class_id,
            'probabilities': raw_result
        }

        return raw_result, formatted_result

    # Kept for backward compatibility with older callers.
    def predict(self, image_path):
        """Classify a gesture from an image file path."""
        try:
            # Read via PIL to sidestep libpng version issues.
            pil_image = Image.open(image_path)
            rgb_image = pil_image.convert('RGB')
            image_array = np.array(rgb_image)
            # Convert to BGR (OpenCV's native channel order).
            image = cv2.cvtColor(image_array, cv2.COLOR_RGB2BGR)

            if image is None:
                raise ValueError(f"无法读取图像: {image_path}")

            return self.predict_frame(image)
        except Exception as e:
            # Fall back to cv2 when PIL fails.
            image = cv2.imread(image_path)
            if image is None:
                raise ValueError(f"无法读取图像: {image_path}")
            return self.predict_frame(image)