PyPI - sarvamai - Versions diffs - 0.1.7__py3-none-any.whl → 0.1.8__py3-none-any.whl - Mend

sarvamai 0.1.7__py3-none-any.whl → 0.1.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (35) hide show

sarvamai/__init__.py +56 -1
sarvamai/client.py +3 -0
sarvamai/core/client_wrapper.py +2 -2
sarvamai/requests/__init__.py +20 -0
sarvamai/requests/audio_output.py +11 -0
sarvamai/requests/audio_output_data.py +15 -0
sarvamai/requests/configure_connection.py +18 -0
sarvamai/requests/configure_connection_data.py +83 -0
sarvamai/requests/error_response.py +11 -0
sarvamai/requests/error_response_data.py +18 -0
sarvamai/requests/flush_signal.py +14 -0
sarvamai/requests/ping_signal.py +14 -0
sarvamai/requests/send_text.py +11 -0
sarvamai/requests/send_text_data.py +7 -0
sarvamai/text_to_speech_streaming/__init__.py +4 -0
sarvamai/text_to_speech_streaming/client.py +153 -0
sarvamai/text_to_speech_streaming/raw_client.py +130 -0
sarvamai/text_to_speech_streaming/socket_client.py +309 -0
sarvamai/types/__init__.py +26 -0
sarvamai/types/audio_output.py +21 -0
sarvamai/types/audio_output_data.py +27 -0
sarvamai/types/configure_connection.py +28 -0
sarvamai/types/configure_connection_data.py +93 -0
sarvamai/types/configure_connection_data_output_audio_bitrate.py +7 -0
sarvamai/types/configure_connection_data_speaker.py +7 -0
sarvamai/types/configure_connection_data_target_language_code.py +8 -0
sarvamai/types/error_response.py +21 -0
sarvamai/types/error_response_data.py +28 -0
sarvamai/types/flush_signal.py +24 -0
sarvamai/types/ping_signal.py +24 -0
sarvamai/types/send_text.py +21 -0
sarvamai/types/send_text_data.py +19 -0
{sarvamai-0.1.7.dist-info → sarvamai-0.1.8.dist-info}/METADATA +2 -2
{sarvamai-0.1.7.dist-info → sarvamai-0.1.8.dist-info}/RECORD +35 -8
{sarvamai-0.1.7.dist-info → sarvamai-0.1.8.dist-info}/WHEEL +0 -0

sarvamai/text_to_speech_streaming/raw_client.py ADDED Viewed

@@ -0,0 +1,130 @@
+# This file was auto-generated by Fern from our API Definition.
+import typing
+from contextlib import asynccontextmanager, contextmanager
+import httpx
+import websockets
+import websockets.sync.client as websockets_sync_client
+from ..core.api_error import ApiError
+from ..core.client_wrapper import AsyncClientWrapper, SyncClientWrapper
+from ..core.request_options import RequestOptions
+from .socket_client import AsyncTextToSpeechStreamingSocketClient, TextToSpeechStreamingSocketClient
+class RawTextToSpeechStreamingClient:
+    def __init__(self, *, client_wrapper: SyncClientWrapper):
+        self._client_wrapper = client_wrapper
+    @contextmanager
+    def connect(
+        self,
+        *,
+        model: typing.Optional[typing.Literal["bulbul:v2"]] = None,
+        api_subscription_key: typing.Optional[str] = None,
+        request_options: typing.Optional[RequestOptions] = None,
+    ) -> typing.Iterator[TextToSpeechStreamingSocketClient]:
+        """
+        Bidirectional WebSocket channel for real-time TTS synthesis.
+        Supports streaming, flushing, config updates, and audio playback.
+        Parameters
+        ----------
+        model : typing.Optional[typing.Literal["bulbul:v2"]]
+            Text to speech model to use
+        api_subscription_key : typing.Optional[str]
+            API subscription key for authentication
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        TextToSpeechStreamingSocketClient
+        """
+        ws_url = self._client_wrapper.get_environment().production + "/text-to-speech/ws"
+        query_params = httpx.QueryParams()
+        if model is not None:
+            query_params = query_params.add("model", model)
+        ws_url = ws_url + f"?{query_params}"
+        headers = self._client_wrapper.get_headers()
+        if api_subscription_key is not None:
+            headers["Api-Subscription-Key"] = str(api_subscription_key)
+        if request_options and "additional_headers" in request_options:
+            headers.update(request_options["additional_headers"])
+        try:
+            with websockets_sync_client.connect(ws_url, additional_headers=headers) as protocol:
+                yield TextToSpeechStreamingSocketClient(websocket=protocol)
+        except websockets.exceptions.InvalidStatusCode as exc:
+            status_code: int = exc.status_code
+            if status_code == 401:
+                raise ApiError(
+                    status_code=status_code,
+                    headers=dict(headers),
+                    body="Websocket initialized with invalid credentials.",
+                )
+            raise ApiError(
+                status_code=status_code,
+                headers=dict(headers),
+                body="Unexpected error when initializing websocket connection.",
+            )
+class AsyncRawTextToSpeechStreamingClient:
+    def __init__(self, *, client_wrapper: AsyncClientWrapper):
+        self._client_wrapper = client_wrapper
+    @asynccontextmanager
+    async def connect(
+        self,
+        *,
+        model: typing.Optional[typing.Literal["bulbul:v2"]] = None,
+        api_subscription_key: typing.Optional[str] = None,
+        request_options: typing.Optional[RequestOptions] = None,
+    ) -> typing.AsyncIterator[AsyncTextToSpeechStreamingSocketClient]:
+        """
+        Bidirectional WebSocket channel for real-time TTS synthesis.
+        Supports streaming, flushing, config updates, and audio playback.
+        Parameters
+        ----------
+        model : typing.Optional[typing.Literal["bulbul:v2"]]
+            Text to speech model to use
+        api_subscription_key : typing.Optional[str]
+            API subscription key for authentication
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        AsyncTextToSpeechStreamingSocketClient
+        """
+        ws_url = self._client_wrapper.get_environment().production + "/text-to-speech/ws"
+        query_params = httpx.QueryParams()
+        if model is not None:
+            query_params = query_params.add("model", model)
+        ws_url = ws_url + f"?{query_params}"
+        headers = self._client_wrapper.get_headers()
+        if api_subscription_key is not None:
+            headers["Api-Subscription-Key"] = str(api_subscription_key)
+        if request_options and "additional_headers" in request_options:
+            headers.update(request_options["additional_headers"])
+        try:
+            async with websockets.connect(ws_url, extra_headers=headers) as protocol:
+                yield AsyncTextToSpeechStreamingSocketClient(websocket=protocol)
+        except websockets.exceptions.InvalidStatusCode as exc:
+            status_code: int = exc.status_code
+            if status_code == 401:
+                raise ApiError(
+                    status_code=status_code,
+                    headers=dict(headers),
+                    body="Websocket initialized with invalid credentials.",
+                )
+            raise ApiError(
+                status_code=status_code,
+                headers=dict(headers),
+                body="Unexpected error when initializing websocket connection.",
+            )

sarvamai/text_to_speech_streaming/socket_client.py ADDED Viewed

@@ -0,0 +1,309 @@
+# This file was auto-generated by Fern from our API Definition.
+import json
+import typing
+import websockets
+import websockets.sync.connection as websockets_sync_connection
+from ..core.events import EventEmitterMixin, EventType
+from ..core.pydantic_utilities import parse_obj_as
+from ..types.audio_output import AudioOutput
+from ..types.flush_signal import FlushSignal
+from ..types.error_response import ErrorResponse
+from ..types.configure_connection import ConfigureConnection
+from ..types.configure_connection_data import ConfigureConnectionData
+from ..types.ping_signal import PingSignal
+from ..types.send_text import SendText
+from ..types.send_text_data import SendTextData
+# Union of the message models that an incoming WebSocket frame is parsed into.
+TextToSpeechStreamingSocketClientResponse = typing.Union[AudioOutput, ErrorResponse]
+class AsyncTextToSpeechStreamingSocketClient(EventEmitterMixin):
+    def __init__(self, *, websocket: websockets.WebSocketClientProtocol):
+        super().__init__()
+        self._websocket = websocket
+    async def __aiter__(self):
+        async for message in self._websocket:
+            message = json.loads(message) if isinstance(message, str) else message
+            yield parse_obj_as(TextToSpeechStreamingSocketClientResponse, message)  # type: ignore
+    async def start_listening(self):
+        """
+        Start listening for messages on the websocket connection.
+        Emits events in the following order:
+        - EventType.OPEN when connection is established
+        - EventType.MESSAGE for each message received
+        - EventType.ERROR if an error occurs
+        - EventType.CLOSE when connection is closed
+        """
+        self._emit(EventType.OPEN, None)
+        try:
+            async for raw_message in self._websocket:
+                raw_message = (
+                    json.loads(raw_message)
+                    if isinstance(raw_message, str)
+                    else raw_message
+                )
+                parsed = parse_obj_as(TextToSpeechStreamingSocketClientResponse, raw_message)  # type: ignore
+                self._emit(EventType.MESSAGE, parsed)
+        except websockets.WebSocketException as exc:
+            self._emit(EventType.ERROR, exc)
+        finally:
+            self._emit(EventType.CLOSE, None)
+    async def configure(
+        self,
+        target_language_code: str,
+        speaker: str = "anushka",
+        pitch: float = 0.0,
+        pace: float = 1.0,
+        loudness: float = 1.0,
+        speech_sample_rate: int = 22050,
+        enable_preprocessing: bool = False,
+        output_audio_codec: str = "mp3",
+        output_audio_bitrate: str = "128k",
+        min_buffer_size: int = 50,
+        max_chunk_length: int = 150,
+    ) -> None:
+        """
+        Configuration message required as the first message after establishing the WebSocket connection.
+        This initializes TTS parameters and can be updated at any time during the WebSocket lifecycle
+        by sending a new config message. When a config update is sent, any text currently in the buffer
+        will be automatically flushed and processed before applying the new configuration.
+        :param target_language_code: The language of the text is BCP-47 format
+        :param speaker: The speaker voice to be used for the output audio. Default: Anushka.
+            Model Compatibility (bulbul:v2): Female: Anushka, Manisha, Vidya, Arya;
+            Male: Abhilash, Karun, Hitesh
+        :param pitch: Controls the pitch of the audio. Lower values result in a deeper voice,
+            while higher values make it sharper. The suitable range is between -0.75
+            and 0.75. Default is 0.0.
+        :param pace: Controls the speed of the audio. Lower values result in slower speech,
+            while higher values make it faster. The suitable range is between 0.5
+            and 2.0. Default is 1.0.
+        :param loudness: Controls the loudness of the audio. Lower values result in quieter audio,
+            while higher values make it louder. The suitable range is between 0.3
+            and 3.0. Default is 1.0.
+        :param speech_sample_rate: Specifies the sample rate of the output audio. Supported values are
+            8000, 16000, 22050, 24000 Hz. If not provided, the default is 22050 Hz.
+        :param enable_preprocessing: Controls whether normalization of English words and numeric entities
+            (e.g., numbers, dates) is performed. Set to true for better handling
+            of mixed-language text. Default is false.
+        :param output_audio_codec: Audio codec (currently supports MP3 only, optimized for real-time playback)
+        :param output_audio_bitrate: Audio bitrate (choose from 5 supported bitrate options)
+        :param min_buffer_size: Minimum character length that triggers buffer flushing for TTS model processing
+        :param max_chunk_length: Maximum length for sentence splitting (adjust based on content length)
+        """
+        data = ConfigureConnectionData(
+            target_language_code=target_language_code,
+            speaker=speaker,
+            pitch=pitch,
+            pace=pace,
+            loudness=loudness,
+            speech_sample_rate=speech_sample_rate,
+            enable_preprocessing=enable_preprocessing,
+            output_audio_codec=output_audio_codec,
+            output_audio_bitrate=output_audio_bitrate,
+            min_buffer_size=min_buffer_size,
+            max_chunk_length=max_chunk_length,
+        )
+        message = ConfigureConnection(data=data)
+        await self._send_model(message)
+    async def convert(self, text: str) -> None:
+        """
+        Send text to be converted to speech. Text length should be 1-2500 characters.
+        Recommended: <500 characters for optimal streaming performance.
+        Real-time endpoints perform better with longer character counts.
+        :param text: Text to be synthesized (1-2500 characters, recommended <500)
+        """
+        data = SendTextData(text=text)
+        message = SendText(data=data)
+        await self._send_model(message)
+    async def flush(self) -> None:
+        """
+        Forces the text buffer to process immediately, regardless of the min_buffer_size threshold.
+        Use this when you need to process remaining text that hasn't reached the minimum buffer size.
+        """
+        message = FlushSignal()
+        await self._send_model(message)
+    async def ping(self) -> None:
+        """
+        Send ping signal to keep the WebSocket connection alive. The connection automatically
+        closes after one minute of inactivity.
+        """
+        message = PingSignal()
+        await self._send_model(message)
+    async def recv(self) -> TextToSpeechStreamingSocketClientResponse:
+        """
+        Receive a message from the websocket connection.
+        """
+        data = await self._websocket.recv()
+        data = json.loads(data) if isinstance(data, str) else data
+        return parse_obj_as(TextToSpeechStreamingSocketClientResponse, data)  # type: ignore
+    async def _send(self, data: typing.Any) -> None:
+        """
+        Send a message to the websocket connection.
+        """
+        if isinstance(data, dict):
+            data = json.dumps(data)
+        await self._websocket.send(data)
+    async def _send_model(self, data: typing.Any) -> None:
+        """
+        Send a Pydantic model to the websocket connection.
+        """
+        await self._send(data.dict())
+class TextToSpeechStreamingSocketClient(EventEmitterMixin):
+    def __init__(self, *, websocket: websockets_sync_connection.Connection):
+        super().__init__()
+        self._websocket = websocket
+    def __iter__(self):
+        for message in self._websocket:
+            message = json.loads(message) if isinstance(message, str) else message
+            yield parse_obj_as(TextToSpeechStreamingSocketClientResponse, message)  # type: ignore
+    def start_listening(self):
+        """
+        Start listening for messages on the websocket connection.
+        Emits events in the following order:
+        - EventType.OPEN when connection is established
+        - EventType.MESSAGE for each message received
+        - EventType.ERROR if an error occurs
+        - EventType.CLOSE when connection is closed
+        """
+        self._emit(EventType.OPEN, None)
+        try:
+            for raw_message in self._websocket:
+                raw_message = (
+                    json.loads(raw_message)
+                    if isinstance(raw_message, str)
+                    else raw_message
+                )
+                parsed = parse_obj_as(TextToSpeechStreamingSocketClientResponse, raw_message)  # type: ignore
+                self._emit(EventType.MESSAGE, parsed)
+        except websockets.WebSocketException as exc:
+            self._emit(EventType.ERROR, exc)
+        finally:
+            self._emit(EventType.CLOSE, None)
+    def configure(
+        self,
+        target_language_code: str,
+        speaker: str = "anushka",
+        pitch: float = 0.0,
+        pace: float = 1.0,
+        loudness: float = 1.0,
+        speech_sample_rate: int = 22050,
+        enable_preprocessing: bool = False,
+        output_audio_codec: str = "mp3",
+        output_audio_bitrate: str = "128k",
+        min_buffer_size: int = 50,
+        max_chunk_length: int = 150,
+    ) -> None:
+        """
+        Configuration message required as the first message after establishing the WebSocket connection.
+        This initializes TTS parameters and can be updated at any time during the WebSocket lifecycle
+        by sending a new config message. When a config update is sent, any text currently in the buffer
+        will be automatically flushed and processed before applying the new configuration.
+        :param target_language_code: The language of the text is BCP-47 format
+        :param speaker: The speaker voice to be used for the output audio. Default: Anushka.
+            Model Compatibility (bulbul:v2): Female: Anushka, Manisha, Vidya, Arya;
+            Male: Abhilash, Karun, Hitesh
+        :param pitch: Controls the pitch of the audio. Lower values result in a deeper voice,
+            while higher values make it sharper. The suitable range is between -0.75
+            and 0.75. Default is 0.0.
+        :param pace: Controls the speed of the audio. Lower values result in slower speech,
+            while higher values make it faster. The suitable range is between 0.5
+            and 2.0. Default is 1.0.
+        :param loudness: Controls the loudness of the audio. Lower values result in quieter audio,
+            while higher values make it louder. The suitable range is between 0.3
+            and 3.0. Default is 1.0.
+        :param speech_sample_rate: Specifies the sample rate of the output audio. Supported values are
+            8000, 16000, 22050, 24000 Hz. If not provided, the default is 22050 Hz.
+        :param enable_preprocessing: Controls whether normalization of English words and numeric entities
+            (e.g., numbers, dates) is performed. Set to true for better handling
+            of mixed-language text. Default is false.
+        :param output_audio_codec: Audio codec (currently supports MP3 only, optimized for real-time playback)
+        :param output_audio_bitrate: Audio bitrate (choose from 5 supported bitrate options)
+        :param min_buffer_size: Minimum character length that triggers buffer flushing for TTS model processing
+        :param max_chunk_length: Maximum length for sentence splitting (adjust based on content length)
+        """
+        data = ConfigureConnectionData(
+            target_language_code=target_language_code,
+            speaker=speaker,
+            pitch=pitch,
+            pace=pace,
+            loudness=loudness,
+            speech_sample_rate=speech_sample_rate,
+            enable_preprocessing=enable_preprocessing,
+            output_audio_codec=output_audio_codec,
+            output_audio_bitrate=output_audio_bitrate,
+            min_buffer_size=min_buffer_size,
+            max_chunk_length=max_chunk_length,
+        )
+        message = ConfigureConnection(data=data)
+        self._send_model(message)
+    def convert(self, text: str) -> None:
+        """
+        Send text to be converted to speech. Text length should be 1-2500 characters.
+        Recommended: <500 characters for optimal streaming performance.
+        Real-time endpoints perform better with longer character counts.
+        :param text: Text to be synthesized (1-2500 characters, recommended <500)
+        """
+        data = SendTextData(text=text)
+        message = SendText(data=data)
+        self._send_model(message)
+    def flush(self) -> None:
+        """
+        Forces the text buffer to process immediately, regardless of the min_buffer_size threshold.
+        Use this when you need to process remaining text that hasn't reached the minimum buffer size.
+        """
+        message = FlushSignal()
+        self._send_model(message)
+    def ping(self) -> None:
+        """
+        Send ping signal to keep the WebSocket connection alive. The connection automatically
+        closes after one minute of inactivity.
+        """
+        message = PingSignal()
+        self._send_model(message)
+    def recv(self) -> TextToSpeechStreamingSocketClientResponse:
+        """
+        Receive a message from the websocket connection.
+        """
+        data = self._websocket.recv()
+        data = json.loads(data) if isinstance(data, str) else data
+        return parse_obj_as(TextToSpeechStreamingSocketClientResponse, data)  # type: ignore
+    def _send(self, data: typing.Any) -> None:
+        """
+        Send a message to the websocket connection.
+        """
+        if isinstance(data, dict):
+            data = json.dumps(data)
+        self._websocket.send(data)
+    def _send_model(self, data: typing.Any) -> None:
+        """
+        Send a Pydantic model to the websocket connection.
+        """
+        self._send(data.dict())

sarvamai/types/__init__.py CHANGED Viewed

@@ -4,6 +4,8 @@
 from .audio_data import AudioData
 from .audio_message import AudioMessage
+from .audio_output import AudioOutput
+from .audio_output_data import AudioOutputData
 from .chat_completion_request_assistant_message import ChatCompletionRequestAssistantMessage
 from .chat_completion_request_message import (
     ChatCompletionRequestMessage,
@@ -17,6 +19,11 @@ from .chat_completion_response_message import ChatCompletionResponseMessage
 from .choice import Choice
 from .completion_usage import CompletionUsage
 from .config_message import ConfigMessage
+from .configure_connection import ConfigureConnection
+from .configure_connection_data import ConfigureConnectionData
+from .configure_connection_data_output_audio_bitrate import ConfigureConnectionDataOutputAudioBitrate
+from .configure_connection_data_speaker import ConfigureConnectionDataSpeaker
+from .configure_connection_data_target_language_code import ConfigureConnectionDataTargetLanguageCode
 from .create_chat_completion_response import CreateChatCompletionResponse
 from .diarized_entry import DiarizedEntry
 from .diarized_transcript import DiarizedTranscript
@@ -24,15 +31,21 @@ from .error_code import ErrorCode
 from .error_data import ErrorData
 from .error_details import ErrorDetails
 from .error_message import ErrorMessage
+from .error_response import ErrorResponse
+from .error_response_data import ErrorResponseData
 from .events_data import EventsData
 from .finish_reason import FinishReason
+from .flush_signal import FlushSignal
 from .format import Format
 from .language_identification_response import LanguageIdentificationResponse
 from .numerals_format import NumeralsFormat
+from .ping_signal import PingSignal
 from .reasoning_effort import ReasoningEffort
 from .response_type import ResponseType
 from .role import Role
 from .sarvam_model_ids import SarvamModelIds
+from .send_text import SendText
+from .send_text_data import SendTextData
 from .speech_sample_rate import SpeechSampleRate
 from .speech_to_text_language import SpeechToTextLanguage
 from .speech_to_text_model import SpeechToTextModel
@@ -68,6 +81,8 @@ from .transliteration_response import TransliterationResponse
 __all__ = [
     "AudioData",
     "AudioMessage",
+    "AudioOutput",
+    "AudioOutputData",
     "ChatCompletionRequestAssistantMessage",
     "ChatCompletionRequestMessage",
     "ChatCompletionRequestMessage_Assistant",
@@ -79,6 +94,11 @@ __all__ = [
     "Choice",
     "CompletionUsage",
     "ConfigMessage",
+    "ConfigureConnection",
+    "ConfigureConnectionData",
+    "ConfigureConnectionDataOutputAudioBitrate",
+    "ConfigureConnectionDataSpeaker",
+    "ConfigureConnectionDataTargetLanguageCode",
     "CreateChatCompletionResponse",
     "DiarizedEntry",
     "DiarizedTranscript",
@@ -86,15 +106,21 @@ __all__ = [
     "ErrorData",
     "ErrorDetails",
     "ErrorMessage",
+    "ErrorResponse",
+    "ErrorResponseData",
     "EventsData",
     "FinishReason",
+    "FlushSignal",
     "Format",
     "LanguageIdentificationResponse",
     "NumeralsFormat",
+    "PingSignal",
     "ReasoningEffort",
     "ResponseType",
     "Role",
     "SarvamModelIds",
+    "SendText",
+    "SendTextData",
     "SpeechSampleRate",
     "SpeechToTextLanguage",
     "SpeechToTextModel",

sarvamai/types/audio_output.py ADDED Viewed

@@ -0,0 +1,21 @@
+# This file was auto-generated by Fern from our API Definition.
+import typing
+import pydantic
+from ..core.pydantic_utilities import IS_PYDANTIC_V2, UniversalBaseModel
+from .audio_output_data import AudioOutputData
+class AudioOutput(UniversalBaseModel):
+    """
+    Message model tagged ``type="audio"`` that wraps an AudioOutputData payload.
+    """
+    # Message type tag; the only accepted value (and the default) is "audio".
+    type: typing.Literal["audio"] = "audio"
+    # Payload of the message.
+    data: AudioOutputData
+    # Same settings under both Pydantic major versions: frozen instances, extra fields allowed.
+    if IS_PYDANTIC_V2:
+        model_config: typing.ClassVar[pydantic.ConfigDict] = pydantic.ConfigDict(extra="allow", frozen=True)  # type: ignore # Pydantic v2
+    else:
+        class Config:
+            frozen = True
+            smart_union = True
+            extra = pydantic.Extra.allow

sarvamai/types/audio_output_data.py ADDED Viewed

@@ -0,0 +1,27 @@
+# This file was auto-generated by Fern from our API Definition.
+import typing
+import pydantic
+from ..core.pydantic_utilities import IS_PYDANTIC_V2, UniversalBaseModel
+class AudioOutputData(UniversalBaseModel):
+    """
+    Payload model holding a MIME content type and a Base64-encoded audio string.
+    """
+    content_type: str = pydantic.Field()
+    """
+    MIME type of the audio content (e.g., 'audio/mp3', 'audio/wav')
+    """
+    audio: str = pydantic.Field()
+    """
+    Base64-encoded audio data ready for playback or download
+    """
+    # Same settings under both Pydantic major versions: frozen instances, extra fields allowed.
+    if IS_PYDANTIC_V2:
+        model_config: typing.ClassVar[pydantic.ConfigDict] = pydantic.ConfigDict(extra="allow", frozen=True)  # type: ignore # Pydantic v2
+    else:
+        class Config:
+            frozen = True
+            smart_union = True
+            extra = pydantic.Extra.allow

sarvamai/types/configure_connection.py ADDED Viewed

@@ -0,0 +1,28 @@
+# This file was auto-generated by Fern from our API Definition.
+import typing
+import pydantic
+from ..core.pydantic_utilities import IS_PYDANTIC_V2, UniversalBaseModel
+from .configure_connection_data import ConfigureConnectionData
+class ConfigureConnection(UniversalBaseModel):
+    """
+    Configuration message required as the first message after establishing the WebSocket connection.
+    This initializes TTS parameters and can be updated at any time during the WebSocket lifecycle
+    by sending a new config message. When a config update is sent, any text currently in the buffer
+    will be automatically flushed and processed before applying the new configuration.
+    """
+    # Message type tag; the only accepted value (and the default) is "config".
+    type: typing.Literal["config"] = "config"
+    # TTS parameters carried by the message.
+    data: ConfigureConnectionData
+    # Same settings under both Pydantic major versions: frozen instances, extra fields allowed.
+    if IS_PYDANTIC_V2:
+        model_config: typing.ClassVar[pydantic.ConfigDict] = pydantic.ConfigDict(extra="allow", frozen=True)  # type: ignore # Pydantic v2
+    else:
+        class Config:
+            frozen = True
+            smart_union = True
+            extra = pydantic.Extra.allow

sarvamai 0.1.7__py3-none-any.whl → 0.1.8__py3-none-any.whl

sarvamai 0.1.7__py3-none-any.whl → 0.1.8__py3-none-any.whl