PyPI - livekit-plugins-deepgram - Versions diffs - 1.0.23__tar.gz → 1.1.0__tar.gz - Mend

livekit-plugins-deepgram 1.0.23__tar.gz → 1.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13)

{livekit_plugins_deepgram-1.0.23 → livekit_plugins_deepgram-1.1.0}/.gitignore RENAMED Viewed

@@ -146,6 +146,9 @@ venv.bak/
 .dmypy.json
 dmypy.json
+# trunk
+.trunk/
 # Pyre type checker
 .pyre/

{livekit_plugins_deepgram-1.0.23 → livekit_plugins_deepgram-1.1.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: livekit-plugins-deepgram
-Version: 1.0.23
+Version: 1.1.0
 Summary: Agent Framework plugin for services using Deepgram's API.
 Project-URL: Documentation, https://docs.livekit.io
 Project-URL: Website, https://livekit.io/
@@ -18,7 +18,7 @@ Classifier: Topic :: Multimedia :: Sound/Audio
 Classifier: Topic :: Multimedia :: Video
 Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
 Requires-Python: >=3.9.0
-Requires-Dist: livekit-agents[codecs]>=1.0.23
+Requires-Dist: livekit-agents[codecs]>=1.1.0
 Requires-Dist: numpy>=1.26
 Description-Content-Type: text/markdown

{livekit_plugins_deepgram-1.0.23 → livekit_plugins_deepgram-1.1.0}/livekit/plugins/deepgram/__init__.py RENAMED Viewed

@@ -32,7 +32,7 @@ from .log import logger
 class DeepgramPlugin(Plugin):
-    def __init__(self):
+    def __init__(self) -> None:
         super().__init__(__name__, __version__, __package__, logger)

{livekit_plugins_deepgram-1.0.23 → livekit_plugins_deepgram-1.1.0}/livekit/plugins/deepgram/stt.py RENAMED Viewed

@@ -94,7 +94,7 @@ class AudioEnergyFilter:
 @dataclass
 class STTOptions:
-    language: DeepgramLanguages | str
+    language: DeepgramLanguages | str | None
     detect_language: bool
     interim_results: bool
     punctuate: bool
@@ -181,9 +181,10 @@ class STT(stt.STT):
         )
         self._base_url = base_url
-        self._api_key = api_key if is_given(api_key) else os.environ.get("DEEPGRAM_API_KEY")
-        if not self._api_key:
+        deepgram_api_key = api_key if is_given(api_key) else os.environ.get("DEEPGRAM_API_KEY")
+        if not deepgram_api_key:
             raise ValueError("Deepgram API key is required")
+        self._api_key = deepgram_api_key
         model = _validate_model(model, language)
         _validate_keyterms(model, language, keyterms, keywords)
@@ -305,7 +306,7 @@ class STT(stt.STT):
         numerals: NotGivenOr[bool] = NOT_GIVEN,
         mip_opt_out: NotGivenOr[bool] = NOT_GIVEN,
         tags: NotGivenOr[list[str]] = NOT_GIVEN,
-    ):
+    ) -> None:
         if is_given(language):
             self._opts.language = language
         if is_given(model):
@@ -383,14 +384,13 @@ class SpeechStream(stt.SpeechStream):
         http_session: aiohttp.ClientSession,
         base_url: str,
     ) -> None:
-        super().__init__(stt=stt, conn_options=conn_options, sample_rate=opts.sample_rate)
         if opts.detect_language or opts.language is None:
             raise ValueError(
                 "language detection is not supported in streaming mode, "
                 "please disable it and specify a language"
             )
+        super().__init__(stt=stt, conn_options=conn_options, sample_rate=opts.sample_rate)
         self._opts = opts
         self._api_key = api_key
         self._session = http_session
@@ -429,7 +429,7 @@ class SpeechStream(stt.SpeechStream):
         numerals: NotGivenOr[bool] = NOT_GIVEN,
         mip_opt_out: NotGivenOr[bool] = NOT_GIVEN,
         tags: NotGivenOr[list[str]] = NOT_GIVEN,
-    ):
+    ) -> None:
         if is_given(language):
             self._opts.language = language
         if is_given(model):
@@ -466,7 +466,7 @@ class SpeechStream(stt.SpeechStream):
     async def _run(self) -> None:
         closing_ws = False
-        async def keepalive_task(ws: aiohttp.ClientWebSocketResponse):
+        async def keepalive_task(ws: aiohttp.ClientWebSocketResponse) -> None:
             # if we want to keep the connection alive even if no audio is sent,
             # Deepgram expects a keepalive message.
             # https://developers.deepgram.com/reference/listen-live#stream-keepalive
@@ -478,7 +478,7 @@ class SpeechStream(stt.SpeechStream):
                 return
         @utils.log_exceptions(logger=logger)
-        async def send_task(ws: aiohttp.ClientWebSocketResponse):
+        async def send_task(ws: aiohttp.ClientWebSocketResponse) -> None:
             nonlocal closing_ws
             # forward audio to deepgram in chunks of 50ms
@@ -529,7 +529,7 @@ class SpeechStream(stt.SpeechStream):
             await ws.send_str(SpeechStream._CLOSE_MSG)
         @utils.log_exceptions(logger=logger)
-        async def recv_task(ws: aiohttp.ClientWebSocketResponse):
+        async def recv_task(ws: aiohttp.ClientWebSocketResponse) -> None:
             nonlocal closing_ws
             while True:
                 msg = await ws.receive()
@@ -569,9 +569,9 @@ class SpeechStream(stt.SpeechStream):
                 wait_reconnect_task = asyncio.create_task(self._reconnect_event.wait())
                 try:
                     done, _ = await asyncio.wait(
-                        [tasks_group, wait_reconnect_task],
+                        (tasks_group, wait_reconnect_task),
                         return_when=asyncio.FIRST_COMPLETED,
-                    )  # type: ignore
+                    )
                     # propagate exceptions from completed tasks
                     for task in done:

livekit_plugins_deepgram-1.1.0/livekit/plugins/deepgram/tts.py ADDED Viewed

@@ -0,0 +1,318 @@
+from __future__ import annotations
+import asyncio
+import json
+import os
+import weakref
+from dataclasses import dataclass, replace
+import aiohttp
+from livekit.agents import (
+    APIConnectionError,
+    APIConnectOptions,
+    APIStatusError,
+    APITimeoutError,
+    tokenize,
+    tts,
+    utils,
+)
+from livekit.agents.types import (
+    DEFAULT_API_CONNECT_OPTIONS,
+    NOT_GIVEN,
+    NotGivenOr,
+)
+from livekit.agents.utils import is_given
+from ._utils import _to_deepgram_url
+from .log import logger
+BASE_URL = "https://api.deepgram.com/v1/speak"
+NUM_CHANNELS = 1
+@dataclass
+class _TTSOptions:
+    model: str
+    encoding: str
+    sample_rate: int
+    word_tokenizer: tokenize.WordTokenizer
+    base_url: str
+    api_key: str
+    mip_opt_out: bool = False
+class TTS(tts.TTS):
+    def __init__(
+        self,
+        *,
+        model: str = "aura-2-andromeda-en",
+        encoding: str = "linear16",
+        sample_rate: int = 24000,
+        api_key: str | None = None,
+        base_url: str = BASE_URL,
+        word_tokenizer: NotGivenOr[tokenize.WordTokenizer] = NOT_GIVEN,
+        http_session: aiohttp.ClientSession | None = None,
+        mip_opt_out: bool = False,
+    ) -> None:
+        """
+        Create a new instance of Deepgram TTS.
+        Args:
+            model (str): TTS model to use. Defaults to "aura-2-andromeda-en".
+            encoding (str): Audio encoding to use. Defaults to "linear16".
+            sample_rate (int): Sample rate of audio. Defaults to 24000.
+            api_key (str): Deepgram API key. If not provided, will look for DEEPGRAM_API_KEY in environment.
+            base_url (str): Base URL for Deepgram TTS API. Defaults to "https://api.deepgram.com/v1/speak"
+            word_tokenizer (tokenize.WordTokenizer): Tokenizer for processing text. Defaults to basic WordTokenizer.
+            http_session (aiohttp.ClientSession): Optional aiohttp session to use for requests.
+        """  # noqa: E501
+        super().__init__(
+            capabilities=tts.TTSCapabilities(streaming=True),
+            sample_rate=sample_rate,
+            num_channels=NUM_CHANNELS,
+        )
+        api_key = api_key or os.environ.get("DEEPGRAM_API_KEY")
+        if not api_key:
+            raise ValueError("Deepgram API key required. Set DEEPGRAM_API_KEY or provide api_key.")
+        if not is_given(word_tokenizer):
+            word_tokenizer = tokenize.basic.WordTokenizer(ignore_punctuation=False)
+        self._opts = _TTSOptions(
+            model=model,
+            encoding=encoding,
+            sample_rate=sample_rate,
+            word_tokenizer=word_tokenizer,
+            base_url=base_url,
+            api_key=api_key,
+            mip_opt_out=mip_opt_out,
+        )
+        self._session = http_session
+        self._streams = weakref.WeakSet[SynthesizeStream]()
+        self._pool = utils.ConnectionPool[aiohttp.ClientWebSocketResponse](
+            connect_cb=self._connect_ws,
+            close_cb=self._close_ws,
+            max_session_duration=3600,  # 1 hour
+            mark_refreshed_on_get=False,
+        )
+    async def _connect_ws(self, timeout: float) -> aiohttp.ClientWebSocketResponse:
+        session = self._ensure_session()
+        config = {
+            "encoding": self._opts.encoding,
+            "model": self._opts.model,
+            "sample_rate": self._opts.sample_rate,
+            "mip_opt_out": self._opts.mip_opt_out,
+        }
+        return await asyncio.wait_for(
+            session.ws_connect(
+                _to_deepgram_url(config, self._opts.base_url, websocket=True),
+                headers={"Authorization": f"Token {self._opts.api_key}"},
+            ),
+            timeout,
+        )
+    async def _close_ws(self, ws: aiohttp.ClientWebSocketResponse) -> None:
+        await ws.close()
+    def _ensure_session(self) -> aiohttp.ClientSession:
+        if not self._session:
+            self._session = utils.http_context.http_session()
+        return self._session
+    def update_options(
+        self,
+        *,
+        model: NotGivenOr[str] = NOT_GIVEN,
+    ) -> None:
+        """
+        Args:
+            model (str): TTS model to use.
+        """
+        if is_given(model):
+            self._opts.model = model
+    def synthesize(
+        self, text: str, *, conn_options: APIConnectOptions = DEFAULT_API_CONNECT_OPTIONS
+    ) -> ChunkedStream:
+        return ChunkedStream(tts=self, input_text=text, conn_options=conn_options)
+    def stream(
+        self, *, conn_options: APIConnectOptions = DEFAULT_API_CONNECT_OPTIONS
+    ) -> SynthesizeStream:
+        stream = SynthesizeStream(tts=self, conn_options=conn_options)
+        self._streams.add(stream)
+        return stream
+    def prewarm(self) -> None:
+        self._pool.prewarm()
+    async def aclose(self) -> None:
+        for stream in list(self._streams):
+            await stream.aclose()
+        self._streams.clear()
+        await self._pool.aclose()
+class ChunkedStream(tts.ChunkedStream):
+    def __init__(self, *, tts: TTS, input_text: str, conn_options: APIConnectOptions) -> None:
+        super().__init__(tts=tts, input_text=input_text, conn_options=conn_options)
+        self._tts: TTS = tts
+        self._opts = replace(tts._opts)
+    async def _run(self, output_emitter: tts.AudioEmitter) -> None:
+        try:
+            async with self._tts._ensure_session().post(
+                _to_deepgram_url(
+                    {
+                        "encoding": self._opts.encoding,
+                        "container": "none",
+                        "model": self._opts.model,
+                        "sample_rate": self._opts.sample_rate,
+                        "mip_opt_out": self._opts.mip_opt_out,
+                    },
+                    self._opts.base_url,
+                    websocket=False,
+                ),
+                headers={
+                    "Authorization": f"Token {self._opts.api_key}",
+                    "Content-Type": "application/json",
+                },
+                json={"text": self._input_text},
+                timeout=aiohttp.ClientTimeout(total=30, sock_connect=self._conn_options.timeout),
+            ) as resp:
+                resp.raise_for_status()
+                output_emitter.initialize(
+                    request_id=utils.shortuuid(),
+                    sample_rate=self._opts.sample_rate,
+                    num_channels=NUM_CHANNELS,
+                    mime_type="audio/pcm",
+                )
+                async for data, _ in resp.content.iter_chunks():
+                    output_emitter.push(data)
+                output_emitter.flush()
+        except asyncio.TimeoutError:
+            raise APITimeoutError() from None
+        except aiohttp.ClientResponseError as e:
+            raise APIStatusError(
+                message=e.message, status_code=e.status, request_id=None, body=None
+            ) from None
+        except Exception as e:
+            raise APIConnectionError() from e
+class SynthesizeStream(tts.SynthesizeStream):
+    def __init__(self, *, tts: TTS, conn_options: APIConnectOptions):
+        super().__init__(tts=tts, conn_options=conn_options)
+        self._tts: TTS = tts
+        self._opts = replace(tts._opts)
+        self._segments_ch = utils.aio.Chan[tokenize.WordStream]()
+    async def _run(self, output_emitter: tts.AudioEmitter) -> None:
+        request_id = utils.shortuuid()
+        output_emitter.initialize(
+            request_id=request_id,
+            sample_rate=self._opts.sample_rate,
+            num_channels=1,
+            mime_type="audio/pcm",
+            stream=True,
+        )
+        async def _tokenize_input() -> None:
+            # Converts incoming text into WordStreams and sends them into _segments_ch
+            word_stream = None
+            async for input in self._input_ch:
+                if isinstance(input, str):
+                    if word_stream is None:
+                        word_stream = self._opts.word_tokenizer.stream()
+                        self._segments_ch.send_nowait(word_stream)
+                    word_stream.push_text(input)
+                elif isinstance(input, self._FlushSentinel):
+                    if word_stream:
+                        word_stream.end_input()
+                    word_stream = None
+            self._segments_ch.close()
+        async def _run_segments() -> None:
+            async for word_stream in self._segments_ch:
+                await self._run_ws(word_stream, output_emitter)
+        tasks = [
+            asyncio.create_task(_tokenize_input()),
+            asyncio.create_task(_run_segments()),
+        ]
+        try:
+            await asyncio.gather(*tasks)
+        except asyncio.TimeoutError:
+            raise APITimeoutError() from None
+        except aiohttp.ClientResponseError as e:
+            raise APIStatusError(
+                message=e.message, status_code=e.status, request_id=request_id, body=None
+            ) from None
+        except Exception as e:
+            raise APIConnectionError() from e
+        finally:
+            await utils.aio.gracefully_cancel(*tasks)
+    async def _run_ws(
+        self, word_stream: tokenize.WordStream, output_emitter: tts.AudioEmitter
+    ) -> None:
+        segment_id = utils.shortuuid()
+        output_emitter.start_segment(segment_id=segment_id)
+        async def send_task(ws: aiohttp.ClientWebSocketResponse) -> None:
+            async for word in word_stream:
+                speak_msg = {"type": "Speak", "text": f"{word.token} "}
+                self._mark_started()
+                await ws.send_str(json.dumps(speak_msg))
+            # Always flush after a segment
+            flush_msg = {"type": "Flush"}
+            await ws.send_str(json.dumps(flush_msg))
+        async def recv_task(ws: aiohttp.ClientWebSocketResponse) -> None:
+            while True:
+                msg = await ws.receive()
+                if msg.type in (
+                    aiohttp.WSMsgType.CLOSE,
+                    aiohttp.WSMsgType.CLOSED,
+                    aiohttp.WSMsgType.CLOSING,
+                ):
+                    raise APIStatusError("Deepgram websocket connection closed unexpectedly")
+                if msg.type == aiohttp.WSMsgType.BINARY:
+                    output_emitter.push(msg.data)
+                elif msg.type == aiohttp.WSMsgType.TEXT:
+                    resp = json.loads(msg.data)
+                    mtype = resp.get("type")
+                    if mtype == "Flushed":
+                        output_emitter.end_segment()
+                        break
+                    elif mtype == "Warning":
+                        logger.warning("Deepgram warning: %s", resp.get("warn_msg"))
+                    elif mtype == "Metadata":
+                        pass
+                    else:
+                        logger.debug("Unknown message type: %s", resp)
+        async with self._tts._pool.connection(timeout=self._conn_options.timeout) as ws:
+            tasks = [
+                asyncio.create_task(send_task(ws)),
+                asyncio.create_task(recv_task(ws)),
+            ]
+            try:
+                await asyncio.gather(*tasks)
+            finally:
+                await utils.aio.gracefully_cancel(*tasks)

{livekit_plugins_deepgram-1.0.23 → livekit_plugins_deepgram-1.1.0}/livekit/plugins/deepgram/version.py RENAMED Viewed

@@ -12,4 +12,4 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
-__version__ = "1.0.23"
+__version__ = "1.1.0"

{livekit_plugins_deepgram-1.0.23 → livekit_plugins_deepgram-1.1.0}/pyproject.toml RENAMED Viewed

@@ -22,7 +22,7 @@ classifiers = [
     "Programming Language :: Python :: 3.10",
     "Programming Language :: Python :: 3 :: Only",
 ]
-dependencies = ["livekit-agents[codecs]>=1.0.23", "numpy>=1.26"]
+dependencies = ["livekit-agents[codecs]>=1.1.0", "numpy>=1.26"]
 [project.urls]
 Documentation = "https://docs.livekit.io"

livekit_plugins_deepgram-1.0.23/livekit/plugins/deepgram/tts.py DELETED Viewed

@@ -1,438 +0,0 @@
-from __future__ import annotations
-import asyncio
-import json
-import os
-import weakref
-from dataclasses import dataclass
-import aiohttp
-from livekit.agents import (
-    APIConnectionError,
-    APIConnectOptions,
-    APIStatusError,
-    APITimeoutError,
-    tokenize,
-    tts,
-    utils,
-)
-from livekit.agents.types import (
-    DEFAULT_API_CONNECT_OPTIONS,
-    NOT_GIVEN,
-    NotGivenOr,
-)
-from livekit.agents.utils import is_given
-from ._utils import _to_deepgram_url
-from .log import logger
-BASE_URL = "https://api.deepgram.com/v1/speak"
-NUM_CHANNELS = 1
-@dataclass
-class _TTSOptions:
-    model: str
-    encoding: str
-    sample_rate: int
-    word_tokenizer: tokenize.WordTokenizer
-    mip_opt_out: bool = False
-class TTS(tts.TTS):
-    def __init__(
-        self,
-        *,
-        model: str = "aura-2-andromeda-en",
-        encoding: str = "linear16",
-        sample_rate: int = 24000,
-        api_key: NotGivenOr[str] = NOT_GIVEN,
-        base_url: str = BASE_URL,
-        word_tokenizer: NotGivenOr[tokenize.WordTokenizer] = NOT_GIVEN,
-        http_session: aiohttp.ClientSession | None = None,
-        mip_opt_out: bool = False,
-    ) -> None:
-        """
-        Create a new instance of Deepgram TTS.
-        Args:
-            model (str): TTS model to use. Defaults to "aura-2-andromeda-en".
-            encoding (str): Audio encoding to use. Defaults to "linear16".
-            sample_rate (int): Sample rate of audio. Defaults to 24000.
-            api_key (str): Deepgram API key. If not provided, will look for DEEPGRAM_API_KEY in environment.
-            base_url (str): Base URL for Deepgram TTS API. Defaults to "https://api.deepgram.com/v1/speak"
-            word_tokenizer (tokenize.WordTokenizer): Tokenizer for processing text. Defaults to basic WordTokenizer.
-            http_session (aiohttp.ClientSession): Optional aiohttp session to use for requests.
-        """  # noqa: E501
-        super().__init__(
-            capabilities=tts.TTSCapabilities(streaming=True),
-            sample_rate=sample_rate,
-            num_channels=NUM_CHANNELS,
-        )
-        self._api_key = api_key if is_given(api_key) else os.environ.get("DEEPGRAM_API_KEY")
-        if not self._api_key:
-            raise ValueError("Deepgram API key required. Set DEEPGRAM_API_KEY or provide api_key.")
-        if not is_given(word_tokenizer):
-            word_tokenizer = tokenize.basic.WordTokenizer(ignore_punctuation=False)
-        self._opts = _TTSOptions(
-            model=model,
-            encoding=encoding,
-            sample_rate=sample_rate,
-            word_tokenizer=word_tokenizer,
-            mip_opt_out=mip_opt_out,
-        )
-        self._session = http_session
-        self._base_url = base_url
-        self._streams = weakref.WeakSet[SynthesizeStream]()
-        self._pool = utils.ConnectionPool[aiohttp.ClientWebSocketResponse](
-            connect_cb=self._connect_ws,
-            close_cb=self._close_ws,
-            max_session_duration=3600,  # 1 hour
-            mark_refreshed_on_get=False,
-        )
-    async def _connect_ws(self) -> aiohttp.ClientWebSocketResponse:
-        session = self._ensure_session()
-        config = {
-            "encoding": self._opts.encoding,
-            "model": self._opts.model,
-            "sample_rate": self._opts.sample_rate,
-            "mip_opt_out": self._opts.mip_opt_out,
-        }
-        return await asyncio.wait_for(
-            session.ws_connect(
-                _to_deepgram_url(config, self._base_url, websocket=True),
-                headers={"Authorization": f"Token {self._api_key}"},
-            ),
-            self._conn_options.timeout,
-        )
-    async def _close_ws(self, ws: aiohttp.ClientWebSocketResponse):
-        await ws.close()
-    def _ensure_session(self) -> aiohttp.ClientSession:
-        if not self._session:
-            self._session = utils.http_context.http_session()
-        return self._session
-    def update_options(
-        self,
-        *,
-        model: NotGivenOr[str] = NOT_GIVEN,
-        sample_rate: NotGivenOr[int] = NOT_GIVEN,
-    ) -> None:
-        """
-        args:
-            model (str): TTS model to use.
-            sample_rate (int): Sample rate of audio.
-        """
-        if is_given(model):
-            self._opts.model = model
-        if is_given(sample_rate):
-            self._opts.sample_rate = sample_rate
-        for stream in self._streams:
-            stream.update_options(
-                model=model,
-                sample_rate=sample_rate,
-            )
-    def synthesize(
-        self,
-        text: str,
-        *,
-        conn_options: APIConnectOptions = DEFAULT_API_CONNECT_OPTIONS,
-    ) -> ChunkedStream:
-        return ChunkedStream(
-            tts=self,
-            input_text=text,
-            base_url=self._base_url,
-            api_key=self._api_key,
-            conn_options=conn_options,
-            opts=self._opts,
-            session=self._ensure_session(),
-        )
-    def stream(
-        self, *, conn_options: APIConnectOptions = DEFAULT_API_CONNECT_OPTIONS
-    ) -> SynthesizeStream:
-        stream = SynthesizeStream(
-            tts=self,
-            conn_options=conn_options,
-            base_url=self._base_url,
-            api_key=self._api_key,
-            opts=self._opts,
-            session=self._ensure_session(),
-        )
-        self._streams.add(stream)
-        return stream
-    def prewarm(self) -> None:
-        self._pool.prewarm()
-    async def aclose(self) -> None:
-        for stream in list(self._streams):
-            await stream.aclose()
-        self._streams.clear()
-        await self._pool.aclose()
-        await super().aclose()
-class ChunkedStream(tts.ChunkedStream):
-    def __init__(
-        self,
-        *,
-        tts: TTS,
-        base_url: str,
-        api_key: str,
-        input_text: str,
-        opts: _TTSOptions,
-        session: aiohttp.ClientSession,
-        conn_options: APIConnectOptions,
-    ) -> None:
-        super().__init__(tts=tts, input_text=input_text, conn_options=conn_options)
-        self._opts = opts
-        self._session = session
-        self._base_url = base_url
-        self._api_key = api_key
-    async def _run(self) -> None:
-        request_id = utils.shortuuid()
-        audio_bstream = utils.audio.AudioByteStream(
-            sample_rate=self._opts.sample_rate,
-            num_channels=NUM_CHANNELS,
-        )
-        try:
-            config = {
-                "encoding": self._opts.encoding,
-                "model": self._opts.model,
-                "sample_rate": self._opts.sample_rate,
-                "mip_opt_out": self._opts.mip_opt_out,
-            }
-            async with self._session.post(
-                _to_deepgram_url(config, self._base_url, websocket=False),
-                headers={
-                    "Authorization": f"Token {self._api_key}",
-                    "Content-Type": "application/json",
-                },
-                json={"text": self._input_text},
-                timeout=aiohttp.ClientTimeout(connect=self._conn_options.timeout, total=30),
-            ) as res:
-                if res.status != 200:
-                    raise APIStatusError(
-                        message=res.reason or "Unknown error occurred.",
-                        status_code=res.status,
-                        request_id=request_id,
-                        body=await res.json(),
-                    )
-                async for bytes_data, _ in res.content.iter_chunks():
-                    for frame in audio_bstream.write(bytes_data):
-                        self._event_ch.send_nowait(
-                            tts.SynthesizedAudio(
-                                request_id=request_id,
-                                frame=frame,
-                            )
-                        )
-                for frame in audio_bstream.flush():
-                    self._event_ch.send_nowait(
-                        tts.SynthesizedAudio(request_id=request_id, frame=frame)
-                    )
-        except asyncio.TimeoutError as e:
-            raise APITimeoutError() from e
-        except aiohttp.ClientResponseError as e:
-            raise APIStatusError(
-                message=e.message,
-                status_code=e.status,
-                request_id=request_id,
-                body=None,
-            ) from e
-        except Exception as e:
-            raise APIConnectionError() from e
-class SynthesizeStream(tts.SynthesizeStream):
-    def __init__(
-        self,
-        *,
-        tts: TTS,
-        base_url: str,
-        api_key: str,
-        opts: _TTSOptions,
-        session: aiohttp.ClientSession,
-        conn_options: APIConnectOptions,
-    ):
-        super().__init__(tts=tts, conn_options=conn_options)
-        self._opts = opts
-        self._session = session
-        self._base_url = base_url
-        self._api_key = api_key
-        self._segments_ch = utils.aio.Chan[tokenize.WordStream]()
-        self._reconnect_event = asyncio.Event()
-    def update_options(
-        self,
-        *,
-        model: NotGivenOr[str] = NOT_GIVEN,
-        sample_rate: NotGivenOr[int] = NOT_GIVEN,
-    ) -> None:
-        if is_given(model):
-            self._opts.model = model
-        if is_given(sample_rate):
-            self._opts.sample_rate = sample_rate
-        self._reconnect_event.set()
-    async def _run(self) -> None:
-        closing_ws = False
-        request_id = utils.shortuuid()
-        segment_id = utils.shortuuid()
-        audio_bstream = utils.audio.AudioByteStream(
-            sample_rate=self._opts.sample_rate,
-            num_channels=NUM_CHANNELS,
-        )
-        @utils.log_exceptions(logger=logger)
-        async def _tokenize_input():
-            # Converts incoming text into WordStreams and sends them into _segments_ch
-            word_stream = None
-            async for input in self._input_ch:
-                if isinstance(input, str):
-                    if word_stream is None:
-                        word_stream = self._opts.word_tokenizer.stream()
-                        self._segments_ch.send_nowait(word_stream)
-                    word_stream.push_text(input)
-                elif isinstance(input, self._FlushSentinel):
-                    if word_stream:
-                        word_stream.end_input()
-                    word_stream = None
-            self._segments_ch.close()
-        @utils.log_exceptions(logger=logger)
-        async def _run_segments(ws: aiohttp.ClientWebSocketResponse):
-            nonlocal closing_ws
-            async for word_stream in self._segments_ch:
-                async for word in word_stream:
-                    speak_msg = {"type": "Speak", "text": f"{word.token} "}
-                    self._mark_started()
-                    await ws.send_str(json.dumps(speak_msg))
-                # Always flush after a segment
-                flush_msg = {"type": "Flush"}
-                await ws.send_str(json.dumps(flush_msg))
-            # after all segments, close
-            close_msg = {"type": "Close"}
-            closing_ws = True
-            await ws.send_str(json.dumps(close_msg))
-        async def recv_task(ws: aiohttp.ClientWebSocketResponse):
-            emitter = tts.SynthesizedAudioEmitter(
-                event_ch=self._event_ch,
-                request_id=request_id,
-                segment_id=segment_id,
-            )
-            while True:
-                msg = await ws.receive()
-                if msg.type in (
-                    aiohttp.WSMsgType.CLOSE,
-                    aiohttp.WSMsgType.CLOSED,
-                    aiohttp.WSMsgType.CLOSING,
-                ):
-                    if not closing_ws:
-                        raise APIStatusError(
-                            "Deepgram websocket connection closed unexpectedly",
-                            request_id=request_id,
-                        )
-                    return
-                if msg.type == aiohttp.WSMsgType.BINARY:
-                    data = msg.data
-                    for frame in audio_bstream.write(data):
-                        emitter.push(frame)
-                elif msg.type == aiohttp.WSMsgType.TEXT:
-                    resp = json.loads(msg.data)
-                    mtype = resp.get("type")
-                    if mtype == "Flushed":
-                        for frame in audio_bstream.flush():
-                            emitter.push(frame)
-                        emitter.flush()
-                        break
-                    elif mtype == "Warning":
-                        logger.warning("Deepgram warning: %s", resp.get("warn_msg"))
-                    elif mtype == "Metadata":
-                        pass
-                    else:
-                        logger.debug("Unknown message type: %s", resp)
-        async def _connection_timeout():
-            # Deepgram has a 60-minute timeout period for websocket connections
-            await asyncio.sleep(3300)
-            logger.warning("Deepgram TTS maximum connection time reached. Reconnecting...")
-            self._reconnect_event.set()
-        ws: aiohttp.ClientWebSocketResponse | None = None
-        while True:
-            try:
-                config = {
-                    "encoding": self._opts.encoding,
-                    "model": self._opts.model,
-                    "sample_rate": self._opts.sample_rate,
-                    "mip_opt_out": self._opts.mip_opt_out,
-                }
-                ws = await asyncio.wait_for(
-                    self._session.ws_connect(
-                        _to_deepgram_url(config, self._base_url, websocket=True),
-                        headers={"Authorization": f"Token {self._api_key}"},
-                    ),
-                    self._conn_options.timeout,
-                )
-                closing_ws = False
-                tasks = [
-                    asyncio.create_task(_tokenize_input()),
-                    asyncio.create_task(_run_segments(ws)),
-                    asyncio.create_task(recv_task(ws)),
-                ]
-                wait_reconnect_task = asyncio.create_task(self._reconnect_event.wait())
-                connection_timeout_task = asyncio.create_task(_connection_timeout())
-                try:
-                    done, _ = await asyncio.wait(
-                        [
-                            asyncio.gather(*tasks),
-                            wait_reconnect_task,
-                            connection_timeout_task,
-                        ],
-                        return_when=asyncio.FIRST_COMPLETED,
-                    )  # type: ignore
-                    if wait_reconnect_task not in done:
-                        break
-                    self._reconnect_event.clear()
-                finally:
-                    await utils.aio.gracefully_cancel(
-                        *tasks, wait_reconnect_task, connection_timeout_task
-                    )
-            except asyncio.TimeoutError as e:
-                raise APITimeoutError() from e
-            except aiohttp.ClientResponseError as e:
-                raise APIStatusError(
-                    message=e.message,
-                    status_code=e.status,
-                    request_id=request_id,
-                    body=None,
-                ) from e
-            except Exception as e:
-                raise APIConnectionError() from e
-            finally:
-                if ws is not None and not ws.closed:
-                    await ws.close()

{livekit_plugins_deepgram-1.0.23 → livekit_plugins_deepgram-1.1.0}/README.md RENAMED Viewed

File without changes

{livekit_plugins_deepgram-1.0.23 → livekit_plugins_deepgram-1.1.0}/livekit/plugins/deepgram/_utils.py RENAMED Viewed

File without changes

{livekit_plugins_deepgram-1.0.23 → livekit_plugins_deepgram-1.1.0}/livekit/plugins/deepgram/log.py RENAMED Viewed

File without changes

{livekit_plugins_deepgram-1.0.23 → livekit_plugins_deepgram-1.1.0}/livekit/plugins/deepgram/models.py RENAMED Viewed

File without changes

{livekit_plugins_deepgram-1.0.23 → livekit_plugins_deepgram-1.1.0}/livekit/plugins/deepgram/py.typed RENAMED Viewed

File without changes

livekit-plugins-deepgram 1.0.23__tar.gz → 1.1.0__tar.gz

livekit-plugins-deepgram 1.0.23__tar.gz → 1.1.0__tar.gz