PyPI - livekit-plugins-google - Versions diffs - 1.2.14__py3-none-any.whl → 1.2.16__py3-none-any.whl - Mend

livekit-plugins-google 1.2.14__py3-none-any.whl → 1.2.16__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of livekit-plugins-google might be problematic. Click here for more details.

Files changed (13) hide show

livekit/plugins/google/__init__.py CHANGED Viewed

@@ -19,14 +19,14 @@ Supports Gemini, Cloud Speech-to-Text, and Cloud Text-to-Speech.
 See https://docs.livekit.io/agents/integrations/stt/google/ for more information.
 """
-from . import beta
+from . import beta, realtime
 from .llm import LLM
 from .stt import STT, SpeechStream
 from .tools import _LLMTool
 from .tts import TTS
 from .version import __version__
-__all__ = ["STT", "TTS", "SpeechStream", "__version__", "beta", "LLM", "_LLMTool"]
+__all__ = ["STT", "TTS", "realtime", "SpeechStream", "__version__", "beta", "LLM", "_LLMTool"]
 from livekit.agents import Plugin
 from .log import logger

livekit/plugins/google/beta/__init__.py CHANGED Viewed

@@ -1,7 +1,7 @@
-from . import realtime
+from .. import realtime
 from .gemini_tts import TTS as GeminiTTS
-__all__ = ["realtime", "GeminiTTS"]
+__all__ = ["GeminiTTS", "realtime"]
 # Cleanup docs of unexported modules
 _module = dir()

livekit/plugins/google/llm.py CHANGED Viewed

@@ -136,6 +136,10 @@ class LLM(llm.LLM):
                 _, gcp_project = default_async(  # type: ignore
                     scopes=["https://www.googleapis.com/auth/cloud-platform"]
                 )
+            if not gcp_project or not gcp_location:
+                raise ValueError(
+                    "Project is required for VertexAI via project kwarg or GOOGLE_CLOUD_PROJECT environment variable"  # noqa: E501
+                )
             gemini_api_key = None  # VertexAI does not require an API key
         else:

livekit/plugins/google/models.py CHANGED Viewed

@@ -10,6 +10,7 @@ SpeechModels = Literal[
     "medical_conversation",
     "chirp",
     "chirp_2",
+    "chirp_3",
     "latest_long",
     "latest_short",
 ]

livekit/plugins/google/{beta/realtime → realtime}/api_proto.py RENAMED Viewed

@@ -10,11 +10,43 @@ LiveAPIModels = Literal[
     # models supported on Gemini API
     "gemini-2.0-flash-live-001",
     "gemini-live-2.5-flash-preview",
+    "gemini-2.5-flash-native-audio-preview-09-2025",
     "gemini-2.5-flash-preview-native-audio-dialog",
     "gemini-2.5-flash-exp-native-audio-thinking-dialog",
 ]
-Voice = Literal["Puck", "Charon", "Kore", "Fenrir", "Aoede", "Leda", "Orus", "Zephyr"]
+Voice = Literal[
+    "Achernar",
+    "Achird",
+    "Algenib",
+    "Algieba",
+    "Alnilam",
+    "Aoede",
+    "Autonoe",
+    "Callirrhoe",
+    "Charon",
+    "Despina",
+    "Enceladus",
+    "Erinome",
+    "Fenrir",
+    "Gacrux",
+    "Iapetus",
+    "Kore",
+    "Laomedeia",
+    "Leda",
+    "Orus",
+    "Pulcherrima",
+    "Puck",
+    "Rasalgethi",
+    "Sadachbia",
+    "Sadaltager",
+    "Schedar",
+    "Sulafat",
+    "Umbriel",
+    "Vindemiatrix",
+    "Zephyr",
+    "Zubenelgenubi",
+]
 ClientEvents = Union[

livekit/plugins/google/{beta/realtime → realtime}/realtime_api.py RENAMED Viewed

@@ -10,6 +10,7 @@ from collections.abc import Iterator
 from dataclasses import dataclass, field
 from typing import Literal
+from google.auth._default_async import default_async
 from google.genai import Client as GenAIClient, types
 from google.genai.live import AsyncSession
 from livekit import rtc
@@ -23,11 +24,11 @@ from livekit.agents.types import (
     NotGivenOr,
 )
 from livekit.agents.utils import audio as audio_utils, images, is_given
-from livekit.plugins.google.beta.realtime.api_proto import ClientEvents, LiveAPIModels, Voice
+from livekit.plugins.google.realtime.api_proto import ClientEvents, LiveAPIModels, Voice
-from ...log import logger
-from ...tools import _LLMTool
-from ...utils import create_tools_config, get_tool_results_for_realtime, to_fnc_ctx
+from ..log import logger
+from ..tools import _LLMTool
+from ..utils import create_tools_config, get_tool_results_for_realtime, to_fnc_ctx
 INPUT_AUDIO_SAMPLE_RATE = 16000
 INPUT_AUDIO_CHANNELS = 1
@@ -78,6 +79,7 @@ class _RealtimeOptions:
     gemini_tools: NotGivenOr[list[_LLMTool]] = NOT_GIVEN
     tool_behavior: NotGivenOr[types.Behavior] = NOT_GIVEN
     tool_response_scheduling: NotGivenOr[types.FunctionResponseScheduling] = NOT_GIVEN
+    thinking_config: NotGivenOr[types.ThinkingConfig] = NOT_GIVEN
 @dataclass
@@ -144,6 +146,7 @@ class RealtimeModel(llm.RealtimeModel):
         conn_options: APIConnectOptions = DEFAULT_API_CONNECT_OPTIONS,
         http_options: NotGivenOr[types.HttpOptions] = NOT_GIVEN,
         _gemini_tools: NotGivenOr[list[_LLMTool]] = NOT_GIVEN,
+        thinking_config: NotGivenOr[types.ThinkingConfig] = NOT_GIVEN,
     ) -> None:
         """
         Initializes a RealtimeModel instance for interacting with Google's Realtime API.
@@ -180,6 +183,7 @@ class RealtimeModel(llm.RealtimeModel):
             context_window_compression (ContextWindowCompressionConfig, optional): The configuration for context window compression. Defaults to None.
             tool_behavior (Behavior, optional): The behavior for tool call. Default behavior is BLOCK in Gemini Realtime API.
             tool_response_scheduling (FunctionResponseScheduling, optional): The scheduling for tool response. Default scheduling is WHEN_IDLE.
+            thinking_config (ThinkingConfig, optional): Native audio thinking configuration.
             conn_options (APIConnectOptions, optional): The configuration for the API connection. Defaults to DEFAULT_API_CONNECT_OPTIONS.
             _gemini_tools (list[LLMTool], optional): Gemini-specific tools to use for the session. This parameter is experimental and may change.
@@ -232,6 +236,10 @@ class RealtimeModel(llm.RealtimeModel):
         )
         if use_vertexai:
+            if not gcp_project:
+                _, gcp_project = default_async(  # type: ignore
+                    scopes=["https://www.googleapis.com/auth/cloud-platform"]
+                )
             if not gcp_project or not gcp_location:
                 raise ValueError(
                     "Project is required for VertexAI via project kwarg or GOOGLE_CLOUD_PROJECT environment variable"  # noqa: E501
@@ -274,6 +282,7 @@ class RealtimeModel(llm.RealtimeModel):
             tool_behavior=tool_behavior,
             conn_options=conn_options,
             http_options=http_options,
+            thinking_config=thinking_config,
         )
         self._sessions = weakref.WeakSet[RealtimeSession]()
@@ -510,7 +519,12 @@ class RealtimeSession(llm.RealtimeSession):
         for f in self._resample_audio(frame):
             for nf in self._bstream.write(f.data.tobytes()):
                 realtime_input = types.LiveClientRealtimeInput(
-                    media_chunks=[types.Blob(data=nf.data.tobytes(), mime_type="audio/pcm")]
+                    media_chunks=[
+                        types.Blob(
+                            data=nf.data.tobytes(),
+                            mime_type=f"audio/pcm;rate={INPUT_AUDIO_SAMPLE_RATE}",
+                        )
+                    ]
                 )
                 self._send_client_event(realtime_input)
@@ -814,6 +828,9 @@ class RealtimeSession(llm.RealtimeSession):
                 frequency_penalty=self._opts.frequency_penalty
                 if is_given(self._opts.frequency_penalty)
                 else None,
+                thinking_config=self._opts.thinking_config
+                if is_given(self._opts.thinking_config)
+                else None,
             ),
             system_instruction=types.Content(parts=[types.Part(text=self._opts.instructions)])
             if is_given(self._opts.instructions)

livekit/plugins/google/stt.py CHANGED Viewed

@@ -618,17 +618,28 @@ def _streaming_recognize_response_to_speech_data(
 ) -> stt.SpeechData | None:
     text = ""
     confidence = 0.0
+    final_result = None
     for result in resp.results:
         if len(result.alternatives) == 0:
             continue
-        text += result.alternatives[0].transcript
-        confidence += result.alternatives[0].confidence
-    confidence /= len(resp.results)
-    lg = resp.results[0].language_code
+        else:
+            if result.is_final:
+                final_result = result
+                break
+            else:
+                text += result.alternatives[0].transcript
+                confidence += result.alternatives[0].confidence
+    if final_result is not None:
+        text = final_result.alternatives[0].transcript
+        confidence = final_result.alternatives[0].confidence
+        lg = final_result.language_code
+    else:
+        confidence /= len(resp.results)
+        if confidence < min_confidence_threshold:
+            return None
+        lg = resp.results[0].language_code
-    if confidence < min_confidence_threshold:
-        return None
     if text == "":
         return None

livekit/plugins/google/version.py CHANGED Viewed

@@ -12,4 +12,4 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
-__version__ = "1.2.14"
+__version__ = "1.2.16"

{livekit_plugins_google-1.2.14.dist-info → livekit_plugins_google-1.2.16.dist-info}/METADATA RENAMED Viewed

@@ -1,13 +1,13 @@
 Metadata-Version: 2.4
 Name: livekit-plugins-google
-Version: 1.2.14
+Version: 1.2.16
 Summary: Agent Framework plugin for services from Google Cloud
 Project-URL: Documentation, https://docs.livekit.io
 Project-URL: Website, https://livekit.io/
 Project-URL: Source, https://github.com/livekit/agents
 Author: LiveKit
 License-Expression: Apache-2.0
-Keywords: audio,livekit,realtime,video,webrtc
+Keywords: ai,audio,gemini,google,livekit,realtime,video,voice
 Classifier: Intended Audience :: Developers
 Classifier: License :: OSI Approved :: Apache Software License
 Classifier: Programming Language :: Python :: 3
@@ -22,7 +22,7 @@ Requires-Dist: google-auth<3,>=2
 Requires-Dist: google-cloud-speech<3,>=2
 Requires-Dist: google-cloud-texttospeech<3,>=2.27
 Requires-Dist: google-genai>=v1.23.0
-Requires-Dist: livekit-agents>=1.2.14
+Requires-Dist: livekit-agents>=1.2.16
 Description-Content-Type: text/markdown
 # Google AI plugin for LiveKit Agents

livekit_plugins_google-1.2.16.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,18 @@
+livekit/plugins/google/__init__.py,sha256=bYHN04-Ttynj09POAnFP3mln-wrEc1vanUD_YpoWOE4,1434
+livekit/plugins/google/llm.py,sha256=M2v1sUJVVNtmOOJvuWhHsGygQlCJo73pSyrwVxdjzcA,19198
+livekit/plugins/google/log.py,sha256=GI3YWN5YzrafnUccljzPRS_ZALkMNk1i21IRnTl2vNA,69
+livekit/plugins/google/models.py,sha256=jsXHLSCDw-T5dZXeDE2nMT2lr0GooCYO4y4aW7Htps4,2816
+livekit/plugins/google/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+livekit/plugins/google/stt.py,sha256=fsWoNnpjgLxqY43cx6GbRI-_QLvXmMvD4WczJFjnoOA,26846
+livekit/plugins/google/tools.py,sha256=tD5HVDHO5JfUF029Cx3axHMJec0Gxalkl7s1FDgxLzI,259
+livekit/plugins/google/tts.py,sha256=2Ba4HjAc9RWYL3W4Z2586Ir3bYQGdSH2gfxSR7VsyY4,17454
+livekit/plugins/google/utils.py,sha256=tFByjJ357A1WdCPwBQC4JABR9G5kxX0g7_FuWAIxix4,10002
+livekit/plugins/google/version.py,sha256=6RxW2Q7KoSNRlDtulIUp5F0_o0atksX-Xpp45NaSCaI,601
+livekit/plugins/google/beta/__init__.py,sha256=4q5dx-Y6o9peCDziB03Skf5ngH4PTBsZC86ZawWrgnk,271
+livekit/plugins/google/beta/gemini_tts.py,sha256=SpKorOteQ7GYoGWsxV5YPuGeMexoosmtDXQVz_1ZeLA,8743
+livekit/plugins/google/realtime/__init__.py,sha256=_fW2NMN22F-hnQ4xAJ_g5lPbR7CvM_xXzSWlUQY-E-U,188
+livekit/plugins/google/realtime/api_proto.py,sha256=oXKKlf0soMK_MA4LcqP8R5iPgpZvmqjb9KxHJFaBpgk,1261
+livekit/plugins/google/realtime/realtime_api.py,sha256=mePWYDAdb3i9l5a-m7JwmTuU_mbtYngR-XRvOYrqxe4,51109
+livekit_plugins_google-1.2.16.dist-info/METADATA,sha256=bBUYb-Z4kIrrK1s3ThbGr-PCt09zTkXuseOQhMjw3eA,1925
+livekit_plugins_google-1.2.16.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+livekit_plugins_google-1.2.16.dist-info/RECORD,,

livekit_plugins_google-1.2.14.dist-info/RECORD DELETED Viewed

@@ -1,18 +0,0 @@
-livekit/plugins/google/__init__.py,sha256=XIyZ-iFnRBpaLtOJgVwojlB-a8GjdDugVFcjBpMEww8,1412
-livekit/plugins/google/llm.py,sha256=u9ZSSkdouPk0018UdiLfgthgTjjLLrXgseX1zrkeg64,18962
-livekit/plugins/google/log.py,sha256=GI3YWN5YzrafnUccljzPRS_ZALkMNk1i21IRnTl2vNA,69
-livekit/plugins/google/models.py,sha256=poOvUBvgpqmmQV5EUQsq0RgNIRAq7nH-_IZIcIfPSBI,2801
-livekit/plugins/google/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-livekit/plugins/google/stt.py,sha256=i99gqXAvYeuhdJ8wh6UlOqLXj6f5_cIni71EwSR4FGw,26467
-livekit/plugins/google/tools.py,sha256=tD5HVDHO5JfUF029Cx3axHMJec0Gxalkl7s1FDgxLzI,259
-livekit/plugins/google/tts.py,sha256=2Ba4HjAc9RWYL3W4Z2586Ir3bYQGdSH2gfxSR7VsyY4,17454
-livekit/plugins/google/utils.py,sha256=tFByjJ357A1WdCPwBQC4JABR9G5kxX0g7_FuWAIxix4,10002
-livekit/plugins/google/version.py,sha256=3ilX8YY1RDy023FFuAB6eNeNvQ8-OJdFmtdMR-6h7Y8,601
-livekit/plugins/google/beta/__init__.py,sha256=RvAUdvEiRN-fe4JrgPcN0Jkw1kZR9wPerGMFVjS1Cc0,270
-livekit/plugins/google/beta/gemini_tts.py,sha256=SpKorOteQ7GYoGWsxV5YPuGeMexoosmtDXQVz_1ZeLA,8743
-livekit/plugins/google/beta/realtime/__init__.py,sha256=_fW2NMN22F-hnQ4xAJ_g5lPbR7CvM_xXzSWlUQY-E-U,188
-livekit/plugins/google/beta/realtime/api_proto.py,sha256=nb_QkVQDEH7h0SKA9vdS3JaL12a6t2Z1ja4SdnxE6a8,814
-livekit/plugins/google/beta/realtime/realtime_api.py,sha256=bvGLk75j6mO870PYLTZh2W3xY5IxuFkjGevltY2BhQA,50294
-livekit_plugins_google-1.2.14.dist-info/METADATA,sha256=BNs2mhT68ao86W-TD9s67SXy-T7sWrLDT-FAOr5TC2o,1909
-livekit_plugins_google-1.2.14.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-livekit_plugins_google-1.2.14.dist-info/RECORD,,

/livekit/plugins/google/{beta/realtime → realtime}/__init__.py RENAMED Viewed

File without changes

{livekit_plugins_google-1.2.14.dist-info → livekit_plugins_google-1.2.16.dist-info}/WHEEL RENAMED Viewed

File without changes

livekit-plugins-google 1.2.14__py3-none-any.whl → 1.2.16__py3-none-any.whl

Potentially problematic release.

livekit-plugins-google 1.2.14__py3-none-any.whl → 1.2.16__py3-none-any.whl