PyPI - livekit-plugins-google - Versions diffs - 0.10.0__py3-none-any.whl → 0.10.2__py3-none-any.whl - Mend

livekit-plugins-google 0.10.0__py3-none-any.whl → 0.10.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

livekit/plugins/google/beta/realtime/realtime_api.py CHANGED Viewed

@@ -75,6 +75,7 @@ class InputTranscription:
 @dataclass
 class Capabilities:
     supports_truncate: bool
+    input_audio_sample_rate: int | None = None
 @dataclass
@@ -156,6 +157,7 @@ class RealtimeModel:
         super().__init__()
         self._capabilities = Capabilities(
             supports_truncate=False,
+            input_audio_sample_rate=16000,
         )
         self._model = model
         self._loop = loop or asyncio.get_event_loop()
@@ -307,8 +309,6 @@ class GeminiRealtimeSession(utils.EventEmitter[EventTypes]):
         self._init_sync_task = asyncio.create_task(asyncio.sleep(0))
         self._send_ch = utils.aio.Chan[ClientEvents]()
         self._active_response_id = None
-        if chat_ctx:
-            self.generate_reply(chat_ctx)
     async def aclose(self) -> None:
         if self._send_ch.closed:
@@ -336,25 +336,6 @@ class GeminiRealtimeSession(utils.EventEmitter[EventTypes]):
     def _queue_msg(self, msg: ClientEvents) -> None:
         self._send_ch.send_nowait(msg)
-    def generate_reply(
-        self,
-        ctx: llm.ChatContext | llm.ChatMessage,
-        turn_complete: bool = True,
-    ) -> None:
-        if isinstance(ctx, llm.ChatMessage) and isinstance(ctx.content, str):
-            new_chat_ctx = llm.ChatContext()
-            new_chat_ctx.append(text=ctx.content, role=ctx.role)
-        elif isinstance(ctx, llm.ChatContext):
-            new_chat_ctx = ctx
-        else:
-            raise ValueError("Invalid chat context")
-        turns, _ = _build_gemini_ctx(new_chat_ctx, id(self))
-        client_content = LiveClientContent(
-            turn_complete=turn_complete,
-            turns=turns,
-        )
-        self._queue_msg(client_content)
     def chat_ctx_copy(self) -> llm.ChatContext:
         return self._chat_ctx.copy()
@@ -370,7 +351,16 @@ class GeminiRealtimeSession(utils.EventEmitter[EventTypes]):
             "cancel_existing", "cancel_new", "keep_both"
         ] = "keep_both",
     ) -> None:
-        raise NotImplementedError("create_response is not supported yet")
+        turns, _ = _build_gemini_ctx(self._chat_ctx, id(self))
+        ctx = [self._opts.instructions] + turns if self._opts.instructions else turns
+        if not ctx:
+            logger.warning(
+                "gemini-realtime-session: No chat context to send, sending dummy content."
+            )
+            ctx = [Content(parts=[Part(text=".")])]
+        self._queue_msg(LiveClientContent(turns=ctx, turn_complete=True))
     def commit_audio_buffer(self) -> None:
         raise NotImplementedError("commit_audio_buffer is not supported yet")

livekit/plugins/google/beta/realtime/transcriber.py CHANGED Viewed

@@ -56,6 +56,7 @@ class TranscriberSession(utils.EventEmitter[EventTypes]):
         super().__init__()
         self._client = client
         self._model = model
+        self._needed_sr = 16000
         self._closed = False
         system_instructions = types.Content(
             parts=[types.Part(text=SYSTEM_INSTRUCTIONS)]
@@ -72,18 +73,37 @@ class TranscriberSession(utils.EventEmitter[EventTypes]):
             self._main_task(), name="gemini-realtime-transcriber"
         )
         self._send_ch = utils.aio.Chan[ClientEvents]()
+        self._resampler: rtc.AudioResampler | None = None
         self._active_response_id = None
     def _push_audio(self, frame: rtc.AudioFrame) -> None:
         if self._closed:
             return
-        self._queue_msg(
-            types.LiveClientRealtimeInput(
-                media_chunks=[
-                    types.Blob(data=frame.data.tobytes(), mime_type="audio/pcm")
-                ]
+        if frame.sample_rate != self._needed_sr:
+            if not self._resampler:
+                self._resampler = rtc.AudioResampler(
+                    frame.sample_rate,
+                    self._needed_sr,
+                    quality=rtc.AudioResamplerQuality.HIGH,
+                )
+        if self._resampler:
+            for f in self._resampler.push(frame):
+                self._queue_msg(
+                    types.LiveClientRealtimeInput(
+                        media_chunks=[
+                            types.Blob(data=f.data.tobytes(), mime_type="audio/pcm")
+                        ]
+                    )
+                )
+        else:
+            self._queue_msg(
+                types.LiveClientRealtimeInput(
+                    media_chunks=[
+                        types.Blob(data=frame.data.tobytes(), mime_type="audio/pcm")
+                    ]
+                )
             )
-        )
     def _queue_msg(self, msg: ClientEvents) -> None:
         if not self._closed:

livekit/plugins/google/llm.py CHANGED Viewed

@@ -108,8 +108,8 @@ class LLM(llm.LLM):
         self._api_key = api_key or os.environ.get("GOOGLE_API_KEY", None)
         _gac = os.environ.get("GOOGLE_APPLICATION_CREDENTIALS")
         if _gac is None:
-            raise ValueError(
-                "`GOOGLE_APPLICATION_CREDENTIALS` environment variable is not set. please set it to the path of the service account key file."
+            logger.warning(
+                "`GOOGLE_APPLICATION_CREDENTIALS` environment variable is not set. please set it to the path of the service account key file. Otherwise, use any of the other Google Cloud auth methods."
             )
         if vertexai:

livekit/plugins/google/stt.py CHANGED Viewed

@@ -89,9 +89,9 @@ class STT(stt.STT):
         detect_language: bool = True,
         interim_results: bool = True,
         punctuate: bool = True,
-        spoken_punctuation: bool = True,
-        model: SpeechModels = "long",
-        location: str = "global",
+        spoken_punctuation: bool = False,
+        model: SpeechModels = "chirp_2",
+        location: str = "us-central1",
         sample_rate: int = 16000,
         credentials_info: dict | None = None,
         credentials_file: str | None = None,

livekit/plugins/google/version.py CHANGED Viewed

@@ -12,4 +12,4 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
-__version__ = "0.10.0"
+__version__ = "0.10.2"

{livekit_plugins_google-0.10.0.dist-info → livekit_plugins_google-0.10.2.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.2
 Name: livekit-plugins-google
-Version: 0.10.0
+Version: 0.10.2
 Summary: Agent Framework plugin for services from Google Cloud
 Home-page: https://github.com/livekit/agents
 License: Apache-2.0
@@ -23,7 +23,7 @@ Requires-Dist: google-auth<3,>=2
 Requires-Dist: google-cloud-speech<3,>=2
 Requires-Dist: google-cloud-texttospeech<3,>=2
 Requires-Dist: google-genai==0.5.0
-Requires-Dist: livekit-agents>=0.12.3
+Requires-Dist: livekit-agents>=0.12.11
 Dynamic: classifier
 Dynamic: description
 Dynamic: description-content-type

{livekit_plugins_google-0.10.0.dist-info → livekit_plugins_google-0.10.2.dist-info}/RECORD RENAMED Viewed

@@ -1,18 +1,18 @@
 livekit/plugins/google/__init__.py,sha256=e_kSlFNmKhyyeliz7f4WOKc_Y0-y39QjO5nCWuguhss,1171
 livekit/plugins/google/_utils.py,sha256=mjsqblhGMgAZ2MNPisAVkNsqq4gfO6vvprEKzAGoVwE,7248
-livekit/plugins/google/llm.py,sha256=vL8iyRqWVPT0wCDeXTlybytlyJ-J-VolVQYqP-ZVlb0,16388
+livekit/plugins/google/llm.py,sha256=o9EJBv3rS5vKRq7m5YjSSqOxtH6pPekxRS_lra35hzk,16445
 livekit/plugins/google/log.py,sha256=GI3YWN5YzrafnUccljzPRS_ZALkMNk1i21IRnTl2vNA,69
 livekit/plugins/google/models.py,sha256=w_qmOk5y86vjtszDiGpP9p0ctjQeaB8-UzqprxgpvCY,1407
 livekit/plugins/google/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-livekit/plugins/google/stt.py,sha256=E5kXPbicH4FEXBjyBzfqQWA-nPhKkojzcc-cbtWdmNs,21088
+livekit/plugins/google/stt.py,sha256=FA6Lpeb8QvRXLzkQ7cjsoMxHdtEGwHWkpN_TKqAdKAQ,21097
 livekit/plugins/google/tts.py,sha256=95qXCigVQYWNbcN3pIKBpIah4b31U_MWtXv5Ji0AMc4,9229
-livekit/plugins/google/version.py,sha256=sAL7xgP18DEksjwYUwabcCgRgKAAGXSWs6xp7NgcxoU,601
+livekit/plugins/google/version.py,sha256=jklx55q_NtxoIUiYD5AFOO11S_Jij8P491Y8nkw-VZk,601
 livekit/plugins/google/beta/__init__.py,sha256=AxRYc7NGG62Tv1MmcZVCDHNvlhbC86hM-_yP01Qb28k,47
 livekit/plugins/google/beta/realtime/__init__.py,sha256=sGTn6JFNyA30QUXBZ_BV3l2eHpGAzR35ByXxg77vWNU,205
 livekit/plugins/google/beta/realtime/api_proto.py,sha256=9EhmwgeIgKDqdSijv5Q9pgx7UhAakK02ZDwbnUsra_o,657
-livekit/plugins/google/beta/realtime/realtime_api.py,sha256=vCjDQZvHS749Gf-QOLo-RaW4HlQHlzuArd3IlN5xMmY,21459
-livekit/plugins/google/beta/realtime/transcriber.py,sha256=3TaYbtvPWHkxKlDSZSMLWBbR7KewBRg3HcdIxuGhl9c,5880
-livekit_plugins_google-0.10.0.dist-info/METADATA,sha256=lsA9pwlWHE-q-9x3HKn2EeJ7ZdcpjxzEtYs1wRH5axE,2057
-livekit_plugins_google-0.10.0.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
-livekit_plugins_google-0.10.0.dist-info/top_level.txt,sha256=OoDok3xUmXbZRvOrfvvXB-Juu4DX79dlq188E19YHoo,8
-livekit_plugins_google-0.10.0.dist-info/RECORD,,
+livekit/plugins/google/beta/realtime/realtime_api.py,sha256=OwNoPmmomMtRkmYw-g2u7hIYpeIrSSNky7FlcHBVyFQ,21150
+livekit/plugins/google/beta/realtime/transcriber.py,sha256=JnZ75NyiOLkpvQ5N2nDniumDKcrjiq_tlryiLbuBoDM,6658
+livekit_plugins_google-0.10.2.dist-info/METADATA,sha256=dTBdAuYpGyCFVJNw0c8upUEdaFgdodWwrm1bB3a4Xp4,2058
+livekit_plugins_google-0.10.2.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
+livekit_plugins_google-0.10.2.dist-info/top_level.txt,sha256=OoDok3xUmXbZRvOrfvvXB-Juu4DX79dlq188E19YHoo,8
+livekit_plugins_google-0.10.2.dist-info/RECORD,,

{livekit_plugins_google-0.10.0.dist-info → livekit_plugins_google-0.10.2.dist-info}/WHEEL RENAMED Viewed

File without changes

{livekit_plugins_google-0.10.0.dist-info → livekit_plugins_google-0.10.2.dist-info}/top_level.txt RENAMED Viewed

File without changes

livekit-plugins-google 0.10.0__py3-none-any.whl → 0.10.2__py3-none-any.whl

livekit-plugins-google 0.10.0__py3-none-any.whl → 0.10.2__py3-none-any.whl