PyPI - vision-agents-plugins-wizper - Versions diffs - 0.1.11__py3-none-any.whl → 0.1.12__py3-none-any.whl - Mend

vision-agents-plugins-wizper 0.1.11__py3-none-any.whl → 0.1.12__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of vision-agents-plugins-wizper might be problematic. Click here for more details.

Files changed (7)

.gitignore CHANGED Viewed

@@ -84,3 +84,4 @@ stream-py/
 # Artifacts / assets
 *.pt
 *.kef
+*.onnx

PKG-INFO CHANGED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: vision-agents-plugins-wizper
-Version: 0.1.11
+Version: 0.1.12
 Summary: Wizper plugin for Vision Agents
 Project-URL: Documentation, https://visionagents.ai/
 Project-URL: Website, https://visionagents.ai/

vision_agents/plugins/wizper/stt.py CHANGED Viewed

@@ -4,32 +4,13 @@ Fal Wizper STT Plugin for Stream
 Provides real-time audio transcription and translation using fal-ai/wizper (Whisper v3).
 This plugin integrates with Stream's audio processing pipeline to provide high-quality
 speech-to-text capabilities.
-Example usage:
-    from vision_agents.plugins import fal
-    # For transcription
-    stt = fal.STT(task="transcribe")
-    # For translation to Portuguese
-    stt = fal.STT(task="translate", target_language="pt")
-    @stt.on("transcript")
-    async def on_transcript(text: str, user: Any, metadata: dict):
-        print(f"Transcript: {text}")
-    @stt.on("error")
-    async def on_error(error: str):
-        print(f"Error: {error}")
 """
-import io
 import logging
 import os
 import tempfile
 from pathlib import Path
 from typing import TYPE_CHECKING, Optional
-import wave
 import fal_client
 from getstream.video.rtc.track_util import PcmData
@@ -76,27 +57,6 @@ class STT(stt.STT):
         self.target_language = target_language
         self._fal_client = client if client is not None else fal_client.AsyncClient()
-    def _pcm_to_wav_bytes(self, pcm_data: PcmData) -> bytes:
-        """
-        Convert PCM data to WAV format bytes.
-        Args:
-            pcm_data: PCM audio data from Stream's audio pipeline
-        Returns:
-            WAV format audio data as bytes
-        """
-        wav_buffer = io.BytesIO()
-        with wave.open(wav_buffer, "wb") as wav_file:
-            wav_file.setnchannels(1)  # Mono
-            wav_file.setsampwidth(2)  # 16-bit
-            wav_file.setframerate(self.sample_rate)
-            wav_file.writeframes(pcm_data.samples.tobytes())
-        wav_buffer.seek(0)
-        return wav_buffer.read()
     async def process_audio(
         self,
         pcm_data: PcmData,
@@ -122,8 +82,8 @@ class STT(stt.STT):
                 "Sending speech audio to fal-ai/wizper",
                 extra={"audio_bytes": pcm_data.samples.nbytes},
             )
-            # Convert PCM to WAV format for upload
-            wav_data = self._pcm_to_wav_bytes(pcm_data)
+            # Convert PCM to WAV format for upload using shared PcmData method
+            wav_data = pcm_data.to_wav_bytes()
             # Create temporary file for upload
             with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as temp_file:
@@ -151,7 +111,7 @@ class STT(stt.STT):
                 )
                 if "text" in result:
                     text = result["text"].strip()
-                    if text:
+                    if text and participant is not None:
                         response_metadata = TranscriptResponse()
                         self._emit_transcript_event(
                             text, participant, response_metadata

{vision_agents_plugins_wizper-0.1.11.dist-info → vision_agents_plugins_wizper-0.1.12.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: vision-agents-plugins-wizper
-Version: 0.1.11
+Version: 0.1.12
 Summary: Wizper plugin for Vision Agents
 Project-URL: Documentation, https://visionagents.ai/
 Project-URL: Website, https://visionagents.ai/

vision_agents_plugins_wizper-0.1.12.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,9 @@
+./.gitignore,sha256=ye7v72rmcYcz93U_u9IyYUvYJKEXGElBsTevPVyASo0,923
+./PKG-INFO,sha256=eBdcwmO3PZHGtalyBIPFycUERCl28ZBjYB97saPWLWw,505
+./README.md,sha256=7MDH68Ywzj2WKm3QAFCUvupBHxrTdjtAL0WqrqaCHFc,24
+./pyproject.toml,sha256=eSC8A7YqeCWd9_VfDiwOc9z3KPGzSPbf9IIqk_aWES0,959
+./vision_agents/plugins/wizper/__init__.py,sha256=aRLgDFc3zq4tNj3G9kmM4zJzSpO7hYqGujz3zTTPsMk,93
+./vision_agents/plugins/wizper/stt.py,sha256=d2XLQQufSL4qruSumff1gj2aA_dssbA0DUN4RZNNIwA,4778
+vision_agents_plugins_wizper-0.1.12.dist-info/METADATA,sha256=eBdcwmO3PZHGtalyBIPFycUERCl28ZBjYB97saPWLWw,505
+vision_agents_plugins_wizper-0.1.12.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+vision_agents_plugins_wizper-0.1.12.dist-info/RECORD,,

vision_agents_plugins_wizper-0.1.11.dist-info/RECORD DELETED Viewed

@@ -1,9 +0,0 @@
-./.gitignore,sha256=S6wPCu4rBDB_yyTYoXbMIR-pn4OPv6b3Ulnx1n5RWvo,916
-./PKG-INFO,sha256=TwinEYIZ4okitRugRaXwoXs71LAPmO7kZSCCKW8U7l8,505
-./README.md,sha256=7MDH68Ywzj2WKm3QAFCUvupBHxrTdjtAL0WqrqaCHFc,24
-./pyproject.toml,sha256=eSC8A7YqeCWd9_VfDiwOc9z3KPGzSPbf9IIqk_aWES0,959
-./vision_agents/plugins/wizper/__init__.py,sha256=aRLgDFc3zq4tNj3G9kmM4zJzSpO7hYqGujz3zTTPsMk,93
-./vision_agents/plugins/wizper/stt.py,sha256=bHEGG8aeN9NBZjtiWhZ8GvK5aszmAebGbXU4pqYisa4,5819
-vision_agents_plugins_wizper-0.1.11.dist-info/METADATA,sha256=TwinEYIZ4okitRugRaXwoXs71LAPmO7kZSCCKW8U7l8,505
-vision_agents_plugins_wizper-0.1.11.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-vision_agents_plugins_wizper-0.1.11.dist-info/RECORD,,

{vision_agents_plugins_wizper-0.1.11.dist-info → vision_agents_plugins_wizper-0.1.12.dist-info}/WHEEL RENAMED Viewed

File without changes

vision-agents-plugins-wizper 0.1.11__py3-none-any.whl → 0.1.12__py3-none-any.whl

Potentially problematic release.

vision-agents-plugins-wizper 0.1.11__py3-none-any.whl → 0.1.12__py3-none-any.whl