smartpi 1.1.5__py3-none-any.whl → 1.1.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (68) hide show
  1. smartpi/__init__.py +1 -1
  2. smartpi/onnx_text_workflow.pyc +0 -0
  3. smartpi/posenet_utils.pyc +0 -0
  4. smartpi/rknn_text_workflow.pyc +0 -0
  5. {smartpi-1.1.5.dist-info → smartpi-1.1.6.dist-info}/METADATA +2 -3
  6. {smartpi-1.1.5.dist-info → smartpi-1.1.6.dist-info}/RECORD +8 -68
  7. smartpi/__init__.pyc +0 -0
  8. smartpi/_gui.py +0 -66
  9. smartpi/ai_asr.py +0 -1037
  10. smartpi/ai_llm.py +0 -934
  11. smartpi/ai_tts.py +0 -938
  12. smartpi/ai_vad.py +0 -83
  13. smartpi/audio.py +0 -125
  14. smartpi/base_driver.py +0 -618
  15. smartpi/camera.py +0 -84
  16. smartpi/color_sensor.py +0 -18
  17. smartpi/cw2015.py +0 -179
  18. smartpi/flash.py +0 -130
  19. smartpi/humidity.py +0 -20
  20. smartpi/led.py +0 -19
  21. smartpi/light_sensor.py +0 -72
  22. smartpi/local_model.py +0 -432
  23. smartpi/mcp_client.py +0 -100
  24. smartpi/mcp_fastmcp.py +0 -322
  25. smartpi/mcp_intent_recognizer.py +0 -408
  26. smartpi/models/__init__.pyc +0 -0
  27. smartpi/models/snakers4_silero-vad/__init__.pyc +0 -0
  28. smartpi/models/snakers4_silero-vad/hubconf.pyc +0 -0
  29. smartpi/motor.py +0 -177
  30. smartpi/move.py +0 -218
  31. smartpi/onnx_hand_workflow.py +0 -201
  32. smartpi/onnx_image_workflow.py +0 -176
  33. smartpi/onnx_pose_workflow.py +0 -482
  34. smartpi/onnx_text_workflow.py +0 -173
  35. smartpi/onnx_voice_workflow.py +0 -437
  36. smartpi/posemodel/__init__.pyc +0 -0
  37. smartpi/posenet_utils.py +0 -222
  38. smartpi/rknn_hand_workflow.py +0 -245
  39. smartpi/rknn_image_workflow.py +0 -405
  40. smartpi/rknn_pose_workflow.py +0 -592
  41. smartpi/rknn_text_workflow.py +0 -240
  42. smartpi/rknn_voice_workflow.py +0 -394
  43. smartpi/servo.py +0 -178
  44. smartpi/temperature.py +0 -18
  45. smartpi/tencentcloud-speech-sdk-python/__init__.pyc +0 -0
  46. smartpi/tencentcloud-speech-sdk-python/asr/__init__.pyc +0 -0
  47. smartpi/tencentcloud-speech-sdk-python/asr/flash_recognizer.pyc +0 -0
  48. smartpi/tencentcloud-speech-sdk-python/asr/speech_recognizer.pyc +0 -0
  49. smartpi/tencentcloud-speech-sdk-python/common/__init__.pyc +0 -0
  50. smartpi/tencentcloud-speech-sdk-python/common/credential.pyc +0 -0
  51. smartpi/tencentcloud-speech-sdk-python/common/log.pyc +0 -0
  52. smartpi/tencentcloud-speech-sdk-python/common/utils.pyc +0 -0
  53. smartpi/tencentcloud-speech-sdk-python/soe/__init__.pyc +0 -0
  54. smartpi/tencentcloud-speech-sdk-python/soe/speaking_assessment.pyc +0 -0
  55. smartpi/tencentcloud-speech-sdk-python/tts/__init__.pyc +0 -0
  56. smartpi/tencentcloud-speech-sdk-python/tts/flowing_speech_synthesizer.pyc +0 -0
  57. smartpi/tencentcloud-speech-sdk-python/tts/speech_synthesizer.pyc +0 -0
  58. smartpi/tencentcloud-speech-sdk-python/tts/speech_synthesizer_ws.pyc +0 -0
  59. smartpi/tencentcloud-speech-sdk-python/vc/__init__.pyc +0 -0
  60. smartpi/tencentcloud-speech-sdk-python/vc/speech_convertor_ws.pyc +0 -0
  61. smartpi/text_gte_model/__init__.pyc +0 -0
  62. smartpi/text_gte_model/config/__init__.pyc +0 -0
  63. smartpi/text_gte_model/gte/__init__.pyc +0 -0
  64. smartpi/touch_sensor.py +0 -16
  65. smartpi/trace.py +0 -120
  66. smartpi/ultrasonic.py +0 -20
  67. {smartpi-1.1.5.dist-info → smartpi-1.1.6.dist-info}/WHEEL +0 -0
  68. {smartpi-1.1.5.dist-info → smartpi-1.1.6.dist-info}/top_level.txt +0 -0
@@ -1,240 +0,0 @@
1
- import numpy as np
2
- import onnxruntime as ort
3
- import onnx
4
- import json
5
- import os
6
- import time
7
- from transformers import AutoTokenizer
8
- from rknnlite.api import RKNNLite
9
-
10
# Absolute directory containing this file; used to resolve the bundled assets.
current_dir = os.path.dirname(os.path.abspath(__file__))
# Default paths for the bundled GTE feature model (ONNX) and its tokenizer config.
default_feature_model = os.path.join(current_dir, 'text_gte_model', 'gte', 'gte_model.onnx')
default_tokenizer_path = os.path.join(current_dir, 'text_gte_model', 'config')
15
-
16
-
17
class TextClassificationWorkflow:
    """Text classification pipeline: ONNX GTE embeddings + RKNN classifier head.

    The GTE feature extractor runs on CPU through onnxruntime; the
    classification head runs on the NPU through RKNNLite. ``predict`` returns
    both the raw probability vectors and per-text formatted result dicts
    (including timing information).
    """

    def __init__(self, class_model_path, feature_model_path=None, tokenizer_path=None):
        """
        Args:
            class_model_path: path to the RKNN classification model (.rknn).
            feature_model_path: optional ONNX GTE model path; the bundled
                default is used when None.
            tokenizer_path: optional tokenizer config directory; the bundled
                default is used when None.
        """
        # Fall back to the bundled defaults when explicit paths are not given.
        self.feature_model_path = feature_model_path or default_feature_model
        self.tokenizer_path = tokenizer_path or default_tokenizer_path
        self.class_model_path = class_model_path
        # Load the tokenizer strictly from local files (no network access).
        self.tokenizer = AutoTokenizer.from_pretrained(
            self.tokenizer_path,
            local_files_only=True
        )

        # Feature-extraction model (kept as ONNX).
        self.feature_session = ort.InferenceSession(self.feature_model_path)
        # FIX: loop variable renamed from `input` so the builtin is not shadowed.
        self.feature_input_names = [inp.name for inp in self.feature_session.get_inputs()]

        # Classification model (RKNN on the NPU).
        self.class_rknn = RKNNLite()
        self._load_rknn_class_model(class_model_path)

        # Class labels from metadata.
        self.label_names = self._load_metadata(class_model_path)
        print(f"分类模型加载成功,共 {len(self.label_names)} 个类别: {self.label_names}")

    def _load_rknn_class_model(self, model_path):
        """Load the RKNN classification model and initialise its NPU runtime.

        Raises:
            RuntimeError: when loading the model or initialising the runtime fails.
        """
        try:
            ret = self.class_rknn.load_rknn(model_path)
            if ret != 0:
                raise RuntimeError(f'加载分类RKNN模型失败 ({model_path}), 错误码: {ret}')

            ret = self.class_rknn.init_runtime()
            if ret != 0:
                raise RuntimeError(f'初始化分类模型NPU运行时失败, 错误码: {ret}')

            print(f"分类RKNN模型加载成功: {os.path.basename(model_path)}")

        except Exception as e:
            print(f"分类模型加载失败: {e}")
            raise

    def _get_metadata_path(self, model_path):
        """Return '<model>_metadata.json' next to the model, falling back to 'rknn_metadata.json'."""
        base_dir = os.path.dirname(model_path)
        base_name = os.path.basename(model_path)
        metadata_name = os.path.splitext(base_name)[0] + '_metadata.json'
        metadata_path = os.path.join(base_dir, metadata_name)

        if not os.path.exists(metadata_path):
            metadata_path = os.path.join(base_dir, 'rknn_metadata.json')

        return metadata_path

    def _load_metadata(self, model_path):
        """Load class labels for the classifier.

        Lookup order: metadata JSON file next to the model, then a sibling ONNX
        model's embedded metadata, then auto-generated ``Class_<i>`` names.
        """
        try:
            metadata_path = self._get_metadata_path(model_path)
            if os.path.exists(metadata_path):
                with open(metadata_path, 'r', encoding='utf-8') as f:
                    metadata = json.load(f)
                    if 'classes' in metadata:
                        return metadata['classes']
                    else:
                        print(f"元数据文件中未找到类别信息")

            # Fall back to metadata embedded in a sibling ONNX model, if any.
            onnx_model_path = os.path.splitext(model_path)[0] + '.onnx'
            if os.path.exists(onnx_model_path):
                onnx_model = onnx.load(onnx_model_path)
                if onnx_model.metadata_props:
                    for prop in onnx_model.metadata_props:
                        if prop.key == 'classes':
                            try:
                                return json.loads(prop.value)
                            except json.JSONDecodeError:
                                # Not JSON — treat as a comma-separated list.
                                return prop.value.split(',')

        except Exception as e:
            print(f"元数据读取错误: {e}")

        # Last resort: derive the class count from the model's output shape.
        num_classes = 10
        try:
            output_shapes = self.class_rknn.get_output_shape()
            if output_shapes and len(output_shapes) > 0:
                num_classes = output_shapes[0][-1]
        except Exception:
            # FIX: was a bare `except:`, which would also swallow
            # KeyboardInterrupt/SystemExit; shape probing is best-effort only.
            pass

        label_names = [f"Class_{i}" for i in range(num_classes)]
        print(f"警告: 未找到类别信息,使用自动生成的名称: {label_names}")
        return label_names

    def _extract_features(self, texts):
        """Tokenize `texts` and run the ONNX GTE model.

        Returns:
            float32 array of first-token embeddings, one row per input text.
        """
        inputs = self.tokenizer(
            texts,
            padding=True,
            truncation=True,
            max_length=512,
            return_tensors="np"
        )

        onnx_inputs = {name: inputs[name].astype(np.int64) for name in self.feature_input_names}
        onnx_outputs = self.feature_session.run(None, onnx_inputs)
        last_hidden_state = onnx_outputs[0]
        # Use the first ([CLS]-position) token embedding as the sentence feature.
        return last_hidden_state[:, 0, :].astype(np.float32)

    def _classify(self, embeddings):
        """Run the RKNN classifier on a batch of embeddings.

        Uses one batched inference when the model's input shape allows it;
        otherwise falls back to a per-sample loop.
        """
        embeddings = embeddings.astype(np.float32)
        batch_size = embeddings.shape[0]
        all_results = []

        # Probe the model input shape: a first dim of -1 (dynamic) or one that
        # matches the batch size means the whole batch can go in at once.
        try:
            input_shapes = self.class_rknn.get_input_shape()
            if input_shapes and len(input_shapes) > 0:
                if input_shapes[0][0] in (-1, batch_size):
                    class_results = self.class_rknn.inference(inputs=[embeddings])[0]
                    return class_results
        except Exception:
            # FIX: was a bare `except:`; shape probing is best-effort only.
            pass

        # Batch input unsupported: run one sample at a time.
        for i in range(batch_size):
            single_embedding = embeddings[i:i+1]  # keep shape [1, feature_dim]
            result = self.class_rknn.inference(inputs=[single_embedding])[0]
            all_results.append(result[0])  # unwrap the single-sample result

        return np.array(all_results)  # merge back into a batched result

    def predict(self, texts):
        """Classify a list of texts, measuring per-stage timings.

        Returns:
            (raw_results, formatted_results): raw per-text probability lists and
            per-text result dicts with class, confidence and timing fields.
            Both empty when `texts` is empty.
        """
        if not texts:
            return [], []

        total_start_time = time.time()

        # Feature-extraction timing.
        feature_start_time = time.time()
        embeddings = self._extract_features(texts)
        feature_time = time.time() - feature_start_time

        # Classification timing.
        classify_start_time = time.time()
        probs = self._classify(embeddings)
        classify_time = time.time() - classify_start_time

        total_time = time.time() - total_start_time

        predicted_indices = np.argmax(probs, axis=1)

        # Debug: confirm prediction count matches the input batch size.
        print(f"处理文本数量: {len(texts)}, 预测结果数量: {len(predicted_indices)}")

        raw_results = []
        formatted_results = []

        for i, (text, idx, prob_vec) in enumerate(zip(texts, predicted_indices, probs)):
            label = self.label_names[idx] if idx < len(self.label_names) else f"未知类别 {idx}"
            confidence = float(prob_vec[idx])

            raw_results.append(prob_vec.tolist())
            formatted_results.append({
                'text': text,
                'class': label,
                'confidence': confidence,
                'class_id': int(idx),
                'probabilities': prob_vec.tolist(),
                # Timing info; text has no image-style preprocessing step.
                'preprocess_time': 0.0,
                'feature_extract_time': feature_time / len(texts),  # averaged per text
                'inference_time': classify_time / len(texts),  # averaged per text
                'total_time': total_time / len(texts)  # averaged per text
            })

        return raw_results, formatted_results

    def release(self):
        """Release the RKNN NPU resources held by the classifier."""
        if hasattr(self, 'class_rknn') and self.class_rknn:
            self.class_rknn.release()
            print("RKNN分类模型资源已释放")

    def __del__(self):
        # Best-effort cleanup; release() guards against a partially built instance.
        self.release()
207
-
208
-
209
# Usage example
if __name__ == "__main__":
    # Only the classifier path is required; the GTE model and tokenizer
    # fall back to the bundled defaults. Replace with a real model path.
    classifier = TextClassificationWorkflow(class_model_path="./model.rknn")

    # Two sample texts to classify.
    sample_texts = ["强大", "再见"]

    raw_results, predictions = classifier.predict(sample_texts)

    # Report every prediction.
    print("\n所有预测结果:")
    for i, result in enumerate(predictions):
        print(f"样本 {i+1}:")
        print(f"  文本: {result['text']}")
        print(f"  分类: {result['class']}")
        print(f"  置信度: {result['confidence']:.4f}")
        print(f"  类别ID: {result['class_id']}")
        print(f"  概率分布: {result['probabilities']}")
        print("---")

    # Free the NPU resources.
    classifier.release()
@@ -1,394 +0,0 @@
1
- import numpy as np
2
- import librosa
3
- import os
4
- import json
5
- import time
6
- from rknnlite.api import RKNNLite
7
-
8
-
9
class Workflow:
    """Audio classification workflow running a .rknn model on the NPU.

    Audio is converted to a log-magnitude STFT spectrogram, split into
    [232 features x 43 frames] blocks, normalised per block, classified block
    by block, and the per-block results are aggregated into one final label.
    """

    def __init__(self, model_path=None, smoothing_time_constant=0, step_size=43):
        """
        Args:
            model_path: optional path to the .rknn model; loaded immediately
                when given.
            smoothing_time_constant: exponential smoothing factor used by
                _apply_temporal_smoothing (0 disables smoothing).
            step_size: hop, in frames, between consecutive analysis blocks.
        """
        self.rknn_lite = None
        self.classes = []  # class labels only
        self.metadata = {}
        self.model_params = {
            'fft_size': 2048,
            'sample_rate': 44100,
            'num_frames': 43,  # frames per block
            'spec_features': 232  # number of spectral features
        }
        self.smoothing_time_constant = smoothing_time_constant
        self.step_size = step_size
        self.frame_duration = None
        self.hop_length = 735  # 44100/60=735 (frame duration ~16.67ms)
        self.previous_spec = None
        self.input_shape = [1, 232, 1, 43]  # RKNN model input shape

        if model_path:
            self.load_model(model_path)

        # Derived frame/block timing information.
        self.frame_duration = self.hop_length / self.model_params['sample_rate']
        self.block_duration = self.model_params['num_frames'] * self.frame_duration

    def load_model(self, model_path):
        """Load the RKNN model and parse only the `classes` metadata.

        NOTE(review): failures are printed, not re-raised — callers must check
        ``self.rknn_lite`` before running inference.
        """
        try:
            self.rknn_lite = RKNNLite()

            # Load the RKNN model.
            ret = self.rknn_lite.load_rknn(model_path)
            if ret != 0:
                raise RuntimeError(f'加载RKNN模型失败, 错误码: {ret}')

            # Initialise the NPU runtime.
            ret = self.rknn_lite.init_runtime()
            if ret != 0:
                raise RuntimeError(f'初始化NPU运行时失败, 错误码: {ret}')

            # Load metadata (classes only).
            metadata_path = self._get_metadata_path(model_path)
            self._load_metadata(metadata_path)

            print(f"使用指定输入形状: {self.input_shape}")

        except Exception as e:
            print(f"模型加载失败: {e}")

    def _get_metadata_path(self, model_path):
        """Return '<model>_metadata.json' next to the model, else 'rknn_metadata.json'."""
        base_dir = os.path.dirname(model_path)
        base_name = os.path.basename(model_path)
        metadata_name = os.path.splitext(base_name)[0] + '_metadata.json'
        metadata_path = os.path.join(base_dir, metadata_name)

        if not os.path.exists(metadata_path):
            metadata_path = os.path.join(base_dir, 'rknn_metadata.json')

        return metadata_path

    def _load_metadata(self, metadata_path):
        """Load only the `classes` list from the metadata JSON file."""
        self.classes = []  # start from an empty label list
        try:
            if os.path.exists(metadata_path):
                with open(metadata_path, 'r', encoding='utf-8') as f:
                    metadata = json.load(f)
                    # Extract classes only; ignore any other metadata.
                    self.classes = metadata.get('classes', [])
                    print(f"从 {metadata_path} 加载类别标签成功,共 {len(self.classes)} 个类别")
            else:
                print(f"元数据文件 {metadata_path} 不存在,将使用空类别标签")
        except Exception as e:
            print(f"加载元数据失败: {e},将使用空类别标签")

    def _apply_hann_window(self, frame):
        """Apply a Hann window to one analysis frame."""
        return frame * np.hanning(len(frame))

    def _apply_temporal_smoothing(self, current_spec):
        """Exponentially smooth the spectrum over time using `smoothing_time_constant`."""
        if self.previous_spec is None:
            self.previous_spec = current_spec
            return current_spec

        smoothed = (self.smoothing_time_constant * self.previous_spec
                    + (1 - self.smoothing_time_constant) * current_spec)

        self.previous_spec = smoothed.copy()
        return smoothed

    def _load_audio(self, audio_path):
        """Load an audio file (.wav or .webm) as mono samples at the model sample rate.

        Returns:
            (samples, sample_rate) with samples as float values in roughly [-1, 1].

        Raises:
            ImportError: webm requested but pydub is not installed.
            ValueError: unsupported file extension.
        """
        ext = os.path.splitext(audio_path)[1].lower()

        if ext == '.wav':
            audio, sr = librosa.load(audio_path, sr=self.model_params['sample_rate'])
            return audio, sr

        elif ext == '.webm':
            try:
                from pydub import AudioSegment
            except ImportError:
                raise ImportError("处理webm格式需要pydub库,请先安装:pip install pydub")

            try:
                audio_segment = AudioSegment.from_file(audio_path, format='webm')
                audio_segment = audio_segment.set_channels(1).set_frame_rate(self.model_params['sample_rate'])
                samples = np.array(audio_segment.get_array_of_samples(), dtype=np.float32)
                return samples / 32768.0, self.model_params['sample_rate']  # normalise to [-1, 1]
            except FileNotFoundError as e:
                # pydub raises FileNotFoundError when ffmpeg/avconv is missing.
                if 'ffmpeg' in str(e).lower() or 'avconv' in str(e).lower():
                    print("\n" + "="*60)
                    print("检测到错误:缺少ffmpeg支持,无法处理webm格式音频")
                    print("="*60)
                    print("请安装ffmpeg后重试(参考之前的安装指南)")
                    print("="*60 + "\n")
                    raise
                else:
                    raise
            except Exception as e:
                print(f"处理webm音频时发生错误:{str(e)}")
                raise

        else:
            raise ValueError(f"不支持的音频格式: {ext},目前支持 .wav 和 .webm")

    def _preprocess_audio(self, audio_path):
        """Preprocess an audio file into a [232, time_frames] decibel spectrogram."""
        audio, sr = self._load_audio(audio_path)
        assert sr == self.model_params['sample_rate'], f"采样率不匹配,需要 {self.model_params['sample_rate']}Hz"

        # STFT parameters.
        hop_length = self.hop_length
        win_length = self.model_params['fft_size']
        n_fft = self.model_params['fft_size']

        # Frame the signal and apply the Hann window frame by frame.
        frames = librosa.util.frame(audio, frame_length=win_length, hop_length=hop_length)
        windowed_frames = np.zeros_like(frames)
        for i in range(frames.shape[1]):
            windowed_frames[:, i] = self._apply_hann_window(frames[:, i])

        # FFT -> magnitude -> decibels.
        D = np.fft.rfft(windowed_frames, n=n_fft, axis=0)
        magnitude = np.abs(D)
        db = 20 * np.log10(np.maximum(1e-5, magnitude))  # avoid log(0)

        # Keep only the first `spec_features` bins: [232, time_frames].
        return db[:self.model_params['spec_features'], :]

    def preprocess_audio_segment(self, audio_segment):
        """Preprocess an in-memory audio segment into a [232, time_frames] dB spectrogram."""
        # Same STFT logic as _preprocess_audio.
        hop_length = self.hop_length
        win_length = self.model_params['fft_size']
        n_fft = self.model_params['fft_size']

        frames = librosa.util.frame(audio_segment, frame_length=win_length, hop_length=hop_length)
        windowed_frames = np.zeros_like(frames)
        for i in range(frames.shape[1]):
            windowed_frames[:, i] = self._apply_hann_window(frames[:, i])

        D = np.fft.rfft(windowed_frames, n=n_fft, axis=0)
        magnitude = np.abs(D)
        db = 20 * np.log10(np.maximum(1e-5, magnitude))

        return db[:self.model_params['spec_features'], :]

    def _extract_blocks(self, full_spec):
        """Slice the full spectrogram into [232, 43] blocks every `step_size` frames.

        Returns:
            (blocks, start_indices): block arrays and their starting frame indices.
        """
        total_time_frames = full_spec.shape[1]
        blocks = []
        start_indices = []

        num_blocks = (total_time_frames - self.model_params['num_frames']) // self.step_size + 1

        for i in range(num_blocks):
            start = i * self.step_size
            end = start + self.model_params['num_frames']
            block = full_spec[:, start:end]  # [232, 43] slice

            # Zero-pad blocks shorter than 43 frames.
            if block.shape[1] < self.model_params['num_frames']:
                padded = np.zeros((self.model_params['spec_features'], self.model_params['num_frames']))
                padded[:, :block.shape[1]] = block
                block = padded

            blocks.append(block)
            start_indices.append(start)

        return blocks, start_indices

    def _normalize(self, spec):
        """Normalise a block using only its own mean and standard deviation."""
        epsilon = 1e-8
        mean = np.mean(spec)
        variance = np.var(spec)
        std = np.sqrt(variance)
        return ((spec - mean) / (std + epsilon)).astype(np.float32)

    def inference(self, audio_path, model_path=None):
        """Classify an audio file block by block.

        Returns:
            (block_results, final_result): per-block dicts and the aggregated result.
        """
        if model_path and not self.rknn_lite:
            self.load_model(model_path)

        full_spec = self._preprocess_audio(audio_path)  # shape [232, total_frames]
        blocks, start_indices = self._extract_blocks(full_spec)

        block_results = []

        print(f"开始处理音频: {audio_path}")
        print(f"总帧数: {full_spec.shape[1]}, 总时长: {full_spec.shape[1] * self.frame_duration:.2f}秒")
        print(f"将处理 {len(blocks)} 个块 (每块 {self.model_params['num_frames']}帧 = {self.block_duration:.3f}秒)")
        print("=" * 60)

        for i, block in enumerate(blocks):
            start_time = time.time()

            # Normalise and reshape to the model input [1, 232, 1, 43].
            normalized_block = self._normalize(block)
            input_tensor = normalized_block[:, np.newaxis, :]  # [232, 1, 43]
            input_tensor = input_tensor[np.newaxis, ...]  # [1, 232, 1, 43]

            # RKNN inference.
            outputs = self.rknn_lite.inference(inputs=[input_tensor])
            raw_output = outputs[0][0]
            result = self._format_output(raw_output)

            # Record the per-block result and timing.
            process_time = time.time() - start_time
            start_frame = start_indices[i]
            end_frame = start_frame + self.model_params['num_frames']
            start_time_sec = start_frame * self.frame_duration
            end_time_sec = end_frame * self.frame_duration

            block_results.append({
                'block_index': i,
                'start_time': start_time_sec,
                'end_time': end_time_sec,
                'process_time': process_time,
                'result': result,
                'raw_output': raw_output
            })

            print(f"块 #{i+1} [时间: {start_time_sec:.2f}-{end_time_sec:.2f}s]")
            print(f"  分类: {result['class']}, 置信度: {result['confidence']}%")
            print(f"  处理时间: {process_time * 1000:.2f}ms")
            print("-" * 50)

        final_result = self._aggregate_results(block_results)
        return block_results, final_result

    def process_audio_segment(self, audio_segment):
        """Process an in-memory audio segment (real-time path) with timing measurement.

        Returns:
            (block_results, final_result); timing fields are attached to the
            final result when one exists.

        Raises:
            ValueError: no model has been loaded yet.
        """
        if not self.rknn_lite:
            raise ValueError("请先加载模型")

        total_start_time = time.time()

        # Preprocessing timing.
        preprocess_start_time = time.time()
        full_spec = self.preprocess_audio_segment(audio_segment)
        blocks, start_indices = self._extract_blocks(full_spec)
        preprocess_time = time.time() - preprocess_start_time

        block_results = []
        inference_time = 0.0

        for i, block in enumerate(blocks):
            # Normalisation timing.
            normalize_start_time = time.time()
            normalized_block = self._normalize(block)
            input_tensor = normalized_block[:, np.newaxis, :][np.newaxis, ...]  # [1, 232, 1, 43]
            normalize_time = time.time() - normalize_start_time

            # Inference timing.
            inference_start_time = time.time()
            outputs = self.rknn_lite.inference(inputs=[input_tensor])
            block_inference_time = time.time() - inference_start_time
            inference_time += block_inference_time

            raw_output = outputs[0][0]
            result = self._format_output(raw_output)

            start_frame = start_indices[i]
            end_frame = start_frame + self.model_params['num_frames']
            start_time_sec = start_frame * self.frame_duration
            end_time_sec = end_frame * self.frame_duration

            block_results.append({
                'block_index': i,
                'start_time': start_time_sec,
                'end_time': end_time_sec,
                'result': result,
                'raw_output': raw_output,
                'normalize_time': normalize_time,
                'inference_time': block_inference_time
            })

        final_result = self._aggregate_results(block_results)

        # Total wall-clock time.
        total_time = time.time() - total_start_time

        # Attach timing info when a final result exists.
        if final_result:
            final_result['preprocess_time'] = preprocess_time
            final_result['inference_time'] = inference_time
            final_result['total_time'] = total_time

        return block_results, final_result

    def _format_output(self, predictions):
        """Format a raw prediction vector into {class, confidence, probabilities}."""
        class_idx = np.argmax(predictions)
        confidence = int(predictions[class_idx] * 100)
        # Fall back to the class index when no label list is available.
        label = self.classes[class_idx] if (self.classes and class_idx < len(self.classes)) else f"类别{class_idx}"
        return {
            'class': label,
            'confidence': confidence,
            'probabilities': predictions.tolist()
        }

    def _aggregate_results(self, block_results):
        """Aggregate per-block results into a single final classification.

        Exactly two blocks: highest confidence wins; otherwise majority vote.
        Returns None when there are no results.
        """
        if len(block_results) == 2:
            # With exactly two blocks, take the higher-confidence one.
            best_result = max(block_results, key=lambda x: x['result']['confidence'])
            return {
                'class': best_result['result']['class'],
                'confidence': best_result['result']['confidence'],
                'occurrence_percentage': 100.0,
                'total_blocks': len(block_results),
                'class_distribution': {best_result['result']['class']: 1},
                'aggregation_method': 'highest_confidence'
            }

        # Count occurrences and track the max confidence per class.
        class_counts = {}
        max_confidence = {}
        for result in block_results:
            cls = result['result']['class']
            conf = result['result']['confidence']
            class_counts[cls] = class_counts.get(cls, 0) + 1
            if cls not in max_confidence or conf > max_confidence[cls]:
                max_confidence[cls] = conf

        if not class_counts:
            return None

        # Majority vote decides the final class.
        most_common_cls = max(class_counts.items(), key=lambda x: x[1])[0]
        count = class_counts[most_common_cls]
        return {
            'class': most_common_cls,
            'confidence': max_confidence[most_common_cls],
            'occurrence_percentage': (count / len(block_results)) * 100,
            'total_blocks': len(block_results),
            'class_distribution': class_counts,
            'aggregation_method': 'majority_vote'
        }

    def release(self):
        """Release RKNN NPU resources."""
        if hasattr(self, 'rknn_lite') and self.rknn_lite:
            self.rknn_lite.release()
            print("RKNN资源已释放")

    def __del__(self):
        """Destructor: release resources automatically."""
        self.release()
- self.release()
383
-
384
-
385
# Usage example
if __name__ == "__main__":
    # Build the workflow from a .rknn model (replace with a real path).
    audio_workflow = Workflow("audio_model.rknn")

    # Run inference on an audio file (replace with a real path).
    block_results, result = audio_workflow.inference("test_audio.wav")

    # Report the aggregated classification.
    print("\n最终结果:")
    print(f"分类: {result['class']}, 置信度: {result['confidence']}%")
    print(f"在 {result['total_blocks']} 个块中出现比例: {result['occurrence_percentage']:.2f}%")