PyPI - videosdk-plugins-openai - Versions diffs - 0.0.37__tar.gz → 0.0.38__tar.gz - Mend

videosdk-plugins-openai 0.0.37.tar.gz → 0.0.38.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of videosdk-plugins-openai might be problematic. Click here for more details.

Files changed (11)

{videosdk_plugins_openai-0.0.37 → videosdk_plugins_openai-0.0.38}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: videosdk-plugins-openai
-Version: 0.0.37
+Version: 0.0.38
 Summary: VideoSDK Agent Framework plugin for OpenAI services
 Author: videosdk
 License-Expression: Apache-2.0
@@ -13,7 +13,7 @@ Classifier: Topic :: Multimedia :: Video
 Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
 Requires-Python: >=3.11
 Requires-Dist: openai[realtime]>=1.68.2
-Requires-Dist: videosdk-agents>=0.0.37
+Requires-Dist: videosdk-agents>=0.0.38
 Description-Content-Type: text/markdown
 # VideoSDK OpenAI Plugin

{videosdk_plugins_openai-0.0.37 → videosdk_plugins_openai-0.0.38}/pyproject.toml RENAMED Viewed

@@ -20,7 +20,7 @@ classifiers = [
     "Topic :: Multimedia :: Video",
     "Topic :: Scientific/Engineering :: Artificial Intelligence",
 ]
-dependencies = ["videosdk-agents>=0.0.37", "openai[realtime]>=1.68.2"]
+dependencies = ["videosdk-agents>=0.0.38", "openai[realtime]>=1.68.2"]
 [tool.hatch.version]
 path = "videosdk/plugins/openai/version.py"

{videosdk_plugins_openai-0.0.37 → videosdk_plugins_openai-0.0.38}/videosdk/plugins/openai/realtime_api.py RENAMED Viewed

@@ -351,6 +351,7 @@ class OpenAIRealtime(RealtimeBaseModel[OpenAIEventTypes]):
     async def _handle_speech_stopped(self, data: dict) -> None:
         """Handle speech detection end"""
         await realtime_metrics_collector.set_user_speech_end()
+        self.emit("user_speech_ended", {})
     async def _handle_response_created(self, data: dict) -> None:
         """Handle initial response creation"""
@@ -425,6 +426,7 @@ class OpenAIRealtime(RealtimeBaseModel[OpenAIEventTypes]):
             if not self._agent_speaking:
                 await realtime_metrics_collector.set_agent_speech_start()
                 self._agent_speaking = True
+                self.emit("agent_speech_started", {})
             base64_audio_data = base64.b64decode(data.get("delta"))
             if base64_audio_data:
                 if self.audio_track and self.loop:
@@ -444,6 +446,7 @@ class OpenAIRealtime(RealtimeBaseModel[OpenAIEventTypes]):
         if self.audio_track:
             self.audio_track.interrupt()
         if self._agent_speaking:
+            self.emit("agent_speech_ended", {})
             await realtime_metrics_collector.set_agent_speech_end(timeout=1.0)
             self._agent_speaking = False
@@ -492,6 +495,7 @@ class OpenAIRealtime(RealtimeBaseModel[OpenAIEventTypes]):
             except Exception:
                 pass
             self._current_audio_transcript = ""
+        self.emit("agent_speech_ended", {})
         await realtime_metrics_collector.set_agent_speech_end(timeout=1.0)
         self._agent_speaking = False
         pass