PyPI - sarvamai - Versions diffs - 0.1.22a3__py3-none-any.whl → 0.1.23a1__py3-none-any.whl - Mend

sarvamai 0.1.22a3__py3-none-any.whl → 0.1.23a1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (64) hide show

sarvamai/__init__.py +405 -206
sarvamai/chat/raw_client.py +20 -20
sarvamai/client.py +186 -34
sarvamai/core/__init__.py +76 -21
sarvamai/core/client_wrapper.py +19 -3
sarvamai/core/force_multipart.py +4 -2
sarvamai/core/http_client.py +217 -97
sarvamai/core/http_response.py +1 -1
sarvamai/core/http_sse/__init__.py +42 -0
sarvamai/core/http_sse/_api.py +112 -0
sarvamai/core/http_sse/_decoders.py +61 -0
sarvamai/core/http_sse/_exceptions.py +7 -0
sarvamai/core/http_sse/_models.py +17 -0
sarvamai/core/jsonable_encoder.py +8 -0
sarvamai/core/pydantic_utilities.py +110 -4
sarvamai/errors/__init__.py +40 -6
sarvamai/errors/bad_request_error.py +1 -1
sarvamai/errors/forbidden_error.py +1 -1
sarvamai/errors/internal_server_error.py +1 -1
sarvamai/errors/service_unavailable_error.py +1 -1
sarvamai/errors/too_many_requests_error.py +1 -1
sarvamai/errors/unprocessable_entity_error.py +1 -1
sarvamai/requests/__init__.py +150 -62
sarvamai/requests/audio_data.py +0 -6
sarvamai/requests/error_response_data.py +1 -1
sarvamai/requests/file_signed_url_details.py +1 -1
sarvamai/requests/speech_to_text_transcription_data.py +2 -8
sarvamai/requests/speech_to_text_translate_transcription_data.py +0 -6
sarvamai/speech_to_text/raw_client.py +54 -52
sarvamai/speech_to_text_job/job.py +100 -2
sarvamai/speech_to_text_job/raw_client.py +134 -130
sarvamai/speech_to_text_streaming/__init__.py +38 -10
sarvamai/speech_to_text_streaming/client.py +0 -44
sarvamai/speech_to_text_streaming/raw_client.py +0 -44
sarvamai/speech_to_text_streaming/types/__init__.py +36 -8
sarvamai/speech_to_text_translate_job/job.py +100 -2
sarvamai/speech_to_text_translate_job/raw_client.py +134 -130
sarvamai/speech_to_text_translate_streaming/__init__.py +36 -9
sarvamai/speech_to_text_translate_streaming/client.py +0 -44
sarvamai/speech_to_text_translate_streaming/raw_client.py +0 -44
sarvamai/speech_to_text_translate_streaming/types/__init__.py +36 -9
sarvamai/text/client.py +0 -12
sarvamai/text/raw_client.py +60 -72
sarvamai/text_to_speech/client.py +18 -0
sarvamai/text_to_speech/raw_client.py +38 -20
sarvamai/text_to_speech_streaming/__init__.py +28 -1
sarvamai/text_to_speech_streaming/types/__init__.py +30 -1
sarvamai/types/__init__.py +222 -102
sarvamai/types/audio_data.py +0 -6
sarvamai/types/chat_completion_request_message.py +6 -2
sarvamai/types/completion_event_flag.py +3 -1
sarvamai/types/error_response_data.py +1 -1
sarvamai/types/file_signed_url_details.py +1 -1
sarvamai/types/speech_to_text_transcription_data.py +2 -8
sarvamai/types/speech_to_text_translate_transcription_data.py +0 -6
{sarvamai-0.1.22a3.dist-info → sarvamai-0.1.23a1.dist-info}/METADATA +2 -1
{sarvamai-0.1.22a3.dist-info → sarvamai-0.1.23a1.dist-info}/RECORD +58 -59
sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_input_audio_codec.py +0 -33
sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_stream_ongoing_speech_results.py +0 -5
sarvamai/speech_to_text_translate_streaming/types/speech_to_text_translate_streaming_input_audio_codec.py +0 -33
sarvamai/speech_to_text_translate_streaming/types/speech_to_text_translate_streaming_stream_ongoing_speech_results.py +0 -5
sarvamai/types/audio_data_input_audio_codec.py +0 -33
sarvamai/types/response_speech_state.py +0 -7
{sarvamai-0.1.22a3.dist-info → sarvamai-0.1.23a1.dist-info}/WHEEL +0 -0

sarvamai/speech_to_text_streaming/__init__.py CHANGED Viewed

@@ -2,20 +2,48 @@
 # isort: skip_file
-from .types import (
-    SpeechToTextStreamingFlushSignal,
-    SpeechToTextStreamingHighVadSensitivity,
-    SpeechToTextStreamingInputAudioCodec,
-    SpeechToTextStreamingLanguageCode,
-    SpeechToTextStreamingStreamOngoingSpeechResults,
-    SpeechToTextStreamingVadSignals,
-)
+import typing
+from importlib import import_module
+if typing.TYPE_CHECKING:
+    from .types import (
+        SpeechToTextStreamingFlushSignal,
+        SpeechToTextStreamingHighVadSensitivity,
+        SpeechToTextStreamingLanguageCode,
+        SpeechToTextStreamingVadSignals,
+    )
+_dynamic_imports: typing.Dict[str, str] = {
+    "SpeechToTextStreamingFlushSignal": ".types",
+    "SpeechToTextStreamingHighVadSensitivity": ".types",
+    "SpeechToTextStreamingLanguageCode": ".types",
+    "SpeechToTextStreamingVadSignals": ".types",
+}
+def __getattr__(attr_name: str) -> typing.Any:
+    module_name = _dynamic_imports.get(attr_name)
+    if module_name is None:
+        raise AttributeError(f"No {attr_name} found in _dynamic_imports for module name -> {__name__}")
+    try:
+        module = import_module(module_name, __package__)
+        if module_name == f".{attr_name}":
+            return module
+        else:
+            return getattr(module, attr_name)
+    except ImportError as e:
+        raise ImportError(f"Failed to import {attr_name} from {module_name}: {e}") from e
+    except AttributeError as e:
+        raise AttributeError(f"Failed to get {attr_name} from {module_name}: {e}") from e
+def __dir__():
+    lazy_attrs = list(_dynamic_imports.keys())
+    return sorted(lazy_attrs)
 __all__ = [
     "SpeechToTextStreamingFlushSignal",
     "SpeechToTextStreamingHighVadSensitivity",
-    "SpeechToTextStreamingInputAudioCodec",
     "SpeechToTextStreamingLanguageCode",
-    "SpeechToTextStreamingStreamOngoingSpeechResults",
     "SpeechToTextStreamingVadSignals",
 ]

sarvamai/speech_to_text_streaming/client.py CHANGED Viewed

@@ -13,11 +13,7 @@ from .raw_client import AsyncRawSpeechToTextStreamingClient, RawSpeechToTextStre
 from .socket_client import AsyncSpeechToTextStreamingSocketClient, SpeechToTextStreamingSocketClient
 from .types.speech_to_text_streaming_flush_signal import SpeechToTextStreamingFlushSignal
 from .types.speech_to_text_streaming_high_vad_sensitivity import SpeechToTextStreamingHighVadSensitivity
-from .types.speech_to_text_streaming_input_audio_codec import SpeechToTextStreamingInputAudioCodec
 from .types.speech_to_text_streaming_language_code import SpeechToTextStreamingLanguageCode
-from .types.speech_to_text_streaming_stream_ongoing_speech_results import (
-    SpeechToTextStreamingStreamOngoingSpeechResults,
-)
 from .types.speech_to_text_streaming_vad_signals import SpeechToTextStreamingVadSignals
 try:
@@ -47,13 +43,10 @@ class SpeechToTextStreamingClient:
         *,
         language_code: SpeechToTextStreamingLanguageCode,
         model: typing.Optional[typing.Literal["saarika:v2.5"]] = None,
-        input_audio_codec: typing.Optional[SpeechToTextStreamingInputAudioCodec] = None,
         sample_rate: typing.Optional[str] = None,
         high_vad_sensitivity: typing.Optional[SpeechToTextStreamingHighVadSensitivity] = None,
         vad_signals: typing.Optional[SpeechToTextStreamingVadSignals] = None,
         flush_signal: typing.Optional[SpeechToTextStreamingFlushSignal] = None,
-        stream_ongoing_speech_results: typing.Optional[SpeechToTextStreamingStreamOngoingSpeechResults] = None,
-        streaming_ongoing_requests_frame_size: typing.Optional[str] = None,
         api_subscription_key: typing.Optional[str] = None,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> typing.Iterator[SpeechToTextStreamingSocketClient]:
@@ -72,9 +65,6 @@ class SpeechToTextStreamingClient:
         model : typing.Optional[typing.Literal["saarika:v2.5"]]
             Speech to text model to use
-        input_audio_codec : typing.Optional[SpeechToTextStreamingInputAudioCodec]
-            Audio codec/format of the input file. Our API automatically detects all codec formats, but for PCM files specifically (pcm_s16le, pcm_l16, pcm_raw), you must pass this parameter. PCM files supports sample rate 16000 and 8000.
         sample_rate : typing.Optional[str]
             Audio sample rate for the WebSocket connection. When specified as a connection parameter, only 16kHz and 8kHz are supported. 8kHz is only available via this connection parameter. If not specified, defaults to 16kHz.
@@ -87,12 +77,6 @@ class SpeechToTextStreamingClient:
         flush_signal : typing.Optional[SpeechToTextStreamingFlushSignal]
             Signal to flush the audio buffer and finalize transcription
-        stream_ongoing_speech_results : typing.Optional[SpeechToTextStreamingStreamOngoingSpeechResults]
-            Enable streaming of ongoing speech results during active speech
-        streaming_ongoing_requests_frame_size : typing.Optional[str]
-            Frame size for streaming ongoing speech results (1-100)
         api_subscription_key : typing.Optional[str]
             API subscription key for authentication
@@ -109,8 +93,6 @@ class SpeechToTextStreamingClient:
             query_params = query_params.add("language-code", language_code)
         if model is not None:
             query_params = query_params.add("model", model)
-        if input_audio_codec is not None:
-            query_params = query_params.add("input_audio_codec", input_audio_codec)
         if sample_rate is not None:
             query_params = query_params.add("sample_rate", sample_rate)
         if high_vad_sensitivity is not None:
@@ -119,12 +101,6 @@ class SpeechToTextStreamingClient:
             query_params = query_params.add("vad_signals", vad_signals)
         if flush_signal is not None:
             query_params = query_params.add("flush_signal", flush_signal)
-        if stream_ongoing_speech_results is not None:
-            query_params = query_params.add("stream_ongoing_speech_results", stream_ongoing_speech_results)
-        if streaming_ongoing_requests_frame_size is not None:
-            query_params = query_params.add(
-                "streaming_ongoing_requests_frame_size", streaming_ongoing_requests_frame_size
-            )
         ws_url = ws_url + f"?{query_params}"
         headers = self._raw_client._client_wrapper.get_headers()
         if api_subscription_key is not None:
@@ -170,13 +146,10 @@ class AsyncSpeechToTextStreamingClient:
         *,
         language_code: SpeechToTextStreamingLanguageCode,
         model: typing.Optional[typing.Literal["saarika:v2.5"]] = None,
-        input_audio_codec: typing.Optional[SpeechToTextStreamingInputAudioCodec] = None,
         sample_rate: typing.Optional[str] = None,
         high_vad_sensitivity: typing.Optional[SpeechToTextStreamingHighVadSensitivity] = None,
         vad_signals: typing.Optional[SpeechToTextStreamingVadSignals] = None,
         flush_signal: typing.Optional[SpeechToTextStreamingFlushSignal] = None,
-        stream_ongoing_speech_results: typing.Optional[SpeechToTextStreamingStreamOngoingSpeechResults] = None,
-        streaming_ongoing_requests_frame_size: typing.Optional[str] = None,
         api_subscription_key: typing.Optional[str] = None,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> typing.AsyncIterator[AsyncSpeechToTextStreamingSocketClient]:
@@ -195,9 +168,6 @@ class AsyncSpeechToTextStreamingClient:
         model : typing.Optional[typing.Literal["saarika:v2.5"]]
             Speech to text model to use
-        input_audio_codec : typing.Optional[SpeechToTextStreamingInputAudioCodec]
-            Audio codec/format of the input file. Our API automatically detects all codec formats, but for PCM files specifically (pcm_s16le, pcm_l16, pcm_raw), you must pass this parameter. PCM files supports sample rate 16000 and 8000.
         sample_rate : typing.Optional[str]
             Audio sample rate for the WebSocket connection. When specified as a connection parameter, only 16kHz and 8kHz are supported. 8kHz is only available via this connection parameter. If not specified, defaults to 16kHz.
@@ -210,12 +180,6 @@ class AsyncSpeechToTextStreamingClient:
         flush_signal : typing.Optional[SpeechToTextStreamingFlushSignal]
             Signal to flush the audio buffer and finalize transcription
-        stream_ongoing_speech_results : typing.Optional[SpeechToTextStreamingStreamOngoingSpeechResults]
-            Enable streaming of ongoing speech results during active speech
-        streaming_ongoing_requests_frame_size : typing.Optional[str]
-            Frame size for streaming ongoing speech results (1-100)
         api_subscription_key : typing.Optional[str]
             API subscription key for authentication
@@ -232,8 +196,6 @@ class AsyncSpeechToTextStreamingClient:
             query_params = query_params.add("language-code", language_code)
         if model is not None:
             query_params = query_params.add("model", model)
-        if input_audio_codec is not None:
-            query_params = query_params.add("input_audio_codec", input_audio_codec)
         if sample_rate is not None:
             query_params = query_params.add("sample_rate", sample_rate)
         if high_vad_sensitivity is not None:
@@ -242,12 +204,6 @@ class AsyncSpeechToTextStreamingClient:
             query_params = query_params.add("vad_signals", vad_signals)
         if flush_signal is not None:
             query_params = query_params.add("flush_signal", flush_signal)
-        if stream_ongoing_speech_results is not None:
-            query_params = query_params.add("stream_ongoing_speech_results", stream_ongoing_speech_results)
-        if streaming_ongoing_requests_frame_size is not None:
-            query_params = query_params.add(
-                "streaming_ongoing_requests_frame_size", streaming_ongoing_requests_frame_size
-            )
         ws_url = ws_url + f"?{query_params}"
         headers = self._raw_client._client_wrapper.get_headers()
         if api_subscription_key is not None:

sarvamai/speech_to_text_streaming/raw_client.py CHANGED Viewed

@@ -12,11 +12,7 @@ from ..core.request_options import RequestOptions
 from .socket_client import AsyncSpeechToTextStreamingSocketClient, SpeechToTextStreamingSocketClient
 from .types.speech_to_text_streaming_flush_signal import SpeechToTextStreamingFlushSignal
 from .types.speech_to_text_streaming_high_vad_sensitivity import SpeechToTextStreamingHighVadSensitivity
-from .types.speech_to_text_streaming_input_audio_codec import SpeechToTextStreamingInputAudioCodec
 from .types.speech_to_text_streaming_language_code import SpeechToTextStreamingLanguageCode
-from .types.speech_to_text_streaming_stream_ongoing_speech_results import (
-    SpeechToTextStreamingStreamOngoingSpeechResults,
-)
 from .types.speech_to_text_streaming_vad_signals import SpeechToTextStreamingVadSignals
 try:
@@ -35,13 +31,10 @@ class RawSpeechToTextStreamingClient:
         *,
         language_code: SpeechToTextStreamingLanguageCode,
         model: typing.Optional[typing.Literal["saarika:v2.5"]] = None,
-        input_audio_codec: typing.Optional[SpeechToTextStreamingInputAudioCodec] = None,
         sample_rate: typing.Optional[str] = None,
         high_vad_sensitivity: typing.Optional[SpeechToTextStreamingHighVadSensitivity] = None,
         vad_signals: typing.Optional[SpeechToTextStreamingVadSignals] = None,
         flush_signal: typing.Optional[SpeechToTextStreamingFlushSignal] = None,
-        stream_ongoing_speech_results: typing.Optional[SpeechToTextStreamingStreamOngoingSpeechResults] = None,
-        streaming_ongoing_requests_frame_size: typing.Optional[str] = None,
         api_subscription_key: typing.Optional[str] = None,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> typing.Iterator[SpeechToTextStreamingSocketClient]:
@@ -60,9 +53,6 @@ class RawSpeechToTextStreamingClient:
         model : typing.Optional[typing.Literal["saarika:v2.5"]]
             Speech to text model to use
-        input_audio_codec : typing.Optional[SpeechToTextStreamingInputAudioCodec]
-            Audio codec/format of the input file. Our API automatically detects all codec formats, but for PCM files specifically (pcm_s16le, pcm_l16, pcm_raw), you must pass this parameter. PCM files supports sample rate 16000 and 8000.
         sample_rate : typing.Optional[str]
             Audio sample rate for the WebSocket connection. When specified as a connection parameter, only 16kHz and 8kHz are supported. 8kHz is only available via this connection parameter. If not specified, defaults to 16kHz.
@@ -75,12 +65,6 @@ class RawSpeechToTextStreamingClient:
         flush_signal : typing.Optional[SpeechToTextStreamingFlushSignal]
             Signal to flush the audio buffer and finalize transcription
-        stream_ongoing_speech_results : typing.Optional[SpeechToTextStreamingStreamOngoingSpeechResults]
-            Enable streaming of ongoing speech results during active speech
-        streaming_ongoing_requests_frame_size : typing.Optional[str]
-            Frame size for streaming ongoing speech results (1-100)
         api_subscription_key : typing.Optional[str]
             API subscription key for authentication
@@ -97,8 +81,6 @@ class RawSpeechToTextStreamingClient:
             query_params = query_params.add("language-code", language_code)
         if model is not None:
             query_params = query_params.add("model", model)
-        if input_audio_codec is not None:
-            query_params = query_params.add("input_audio_codec", input_audio_codec)
         if sample_rate is not None:
             query_params = query_params.add("sample_rate", sample_rate)
         if high_vad_sensitivity is not None:
@@ -107,12 +89,6 @@ class RawSpeechToTextStreamingClient:
             query_params = query_params.add("vad_signals", vad_signals)
         if flush_signal is not None:
             query_params = query_params.add("flush_signal", flush_signal)
-        if stream_ongoing_speech_results is not None:
-            query_params = query_params.add("stream_ongoing_speech_results", stream_ongoing_speech_results)
-        if streaming_ongoing_requests_frame_size is not None:
-            query_params = query_params.add(
-                "streaming_ongoing_requests_frame_size", streaming_ongoing_requests_frame_size
-            )
         ws_url = ws_url + f"?{query_params}"
         headers = self._client_wrapper.get_headers()
         if api_subscription_key is not None:
@@ -147,13 +123,10 @@ class AsyncRawSpeechToTextStreamingClient:
         *,
         language_code: SpeechToTextStreamingLanguageCode,
         model: typing.Optional[typing.Literal["saarika:v2.5"]] = None,
-        input_audio_codec: typing.Optional[SpeechToTextStreamingInputAudioCodec] = None,
         sample_rate: typing.Optional[str] = None,
         high_vad_sensitivity: typing.Optional[SpeechToTextStreamingHighVadSensitivity] = None,
         vad_signals: typing.Optional[SpeechToTextStreamingVadSignals] = None,
         flush_signal: typing.Optional[SpeechToTextStreamingFlushSignal] = None,
-        stream_ongoing_speech_results: typing.Optional[SpeechToTextStreamingStreamOngoingSpeechResults] = None,
-        streaming_ongoing_requests_frame_size: typing.Optional[str] = None,
         api_subscription_key: typing.Optional[str] = None,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> typing.AsyncIterator[AsyncSpeechToTextStreamingSocketClient]:
@@ -172,9 +145,6 @@ class AsyncRawSpeechToTextStreamingClient:
         model : typing.Optional[typing.Literal["saarika:v2.5"]]
             Speech to text model to use
-        input_audio_codec : typing.Optional[SpeechToTextStreamingInputAudioCodec]
-            Audio codec/format of the input file. Our API automatically detects all codec formats, but for PCM files specifically (pcm_s16le, pcm_l16, pcm_raw), you must pass this parameter. PCM files supports sample rate 16000 and 8000.
         sample_rate : typing.Optional[str]
             Audio sample rate for the WebSocket connection. When specified as a connection parameter, only 16kHz and 8kHz are supported. 8kHz is only available via this connection parameter. If not specified, defaults to 16kHz.
@@ -187,12 +157,6 @@ class AsyncRawSpeechToTextStreamingClient:
         flush_signal : typing.Optional[SpeechToTextStreamingFlushSignal]
             Signal to flush the audio buffer and finalize transcription
-        stream_ongoing_speech_results : typing.Optional[SpeechToTextStreamingStreamOngoingSpeechResults]
-            Enable streaming of ongoing speech results during active speech
-        streaming_ongoing_requests_frame_size : typing.Optional[str]
-            Frame size for streaming ongoing speech results (1-100)
         api_subscription_key : typing.Optional[str]
             API subscription key for authentication
@@ -209,8 +173,6 @@ class AsyncRawSpeechToTextStreamingClient:
             query_params = query_params.add("language-code", language_code)
         if model is not None:
             query_params = query_params.add("model", model)
-        if input_audio_codec is not None:
-            query_params = query_params.add("input_audio_codec", input_audio_codec)
         if sample_rate is not None:
             query_params = query_params.add("sample_rate", sample_rate)
         if high_vad_sensitivity is not None:
@@ -219,12 +181,6 @@ class AsyncRawSpeechToTextStreamingClient:
             query_params = query_params.add("vad_signals", vad_signals)
         if flush_signal is not None:
             query_params = query_params.add("flush_signal", flush_signal)
-        if stream_ongoing_speech_results is not None:
-            query_params = query_params.add("stream_ongoing_speech_results", stream_ongoing_speech_results)
-        if streaming_ongoing_requests_frame_size is not None:
-            query_params = query_params.add(
-                "streaming_ongoing_requests_frame_size", streaming_ongoing_requests_frame_size
-            )
         ws_url = ws_url + f"?{query_params}"
         headers = self._client_wrapper.get_headers()
         if api_subscription_key is not None:

sarvamai/speech_to_text_streaming/types/__init__.py CHANGED Viewed

@@ -2,18 +2,46 @@
 # isort: skip_file
-from .speech_to_text_streaming_flush_signal import SpeechToTextStreamingFlushSignal
-from .speech_to_text_streaming_high_vad_sensitivity import SpeechToTextStreamingHighVadSensitivity
-from .speech_to_text_streaming_input_audio_codec import SpeechToTextStreamingInputAudioCodec
-from .speech_to_text_streaming_language_code import SpeechToTextStreamingLanguageCode
-from .speech_to_text_streaming_stream_ongoing_speech_results import SpeechToTextStreamingStreamOngoingSpeechResults
-from .speech_to_text_streaming_vad_signals import SpeechToTextStreamingVadSignals
+import typing
+from importlib import import_module
+if typing.TYPE_CHECKING:
+    from .speech_to_text_streaming_flush_signal import SpeechToTextStreamingFlushSignal
+    from .speech_to_text_streaming_high_vad_sensitivity import SpeechToTextStreamingHighVadSensitivity
+    from .speech_to_text_streaming_language_code import SpeechToTextStreamingLanguageCode
+    from .speech_to_text_streaming_vad_signals import SpeechToTextStreamingVadSignals
+_dynamic_imports: typing.Dict[str, str] = {
+    "SpeechToTextStreamingFlushSignal": ".speech_to_text_streaming_flush_signal",
+    "SpeechToTextStreamingHighVadSensitivity": ".speech_to_text_streaming_high_vad_sensitivity",
+    "SpeechToTextStreamingLanguageCode": ".speech_to_text_streaming_language_code",
+    "SpeechToTextStreamingVadSignals": ".speech_to_text_streaming_vad_signals",
+}
+def __getattr__(attr_name: str) -> typing.Any:
+    module_name = _dynamic_imports.get(attr_name)
+    if module_name is None:
+        raise AttributeError(f"No {attr_name} found in _dynamic_imports for module name -> {__name__}")
+    try:
+        module = import_module(module_name, __package__)
+        if module_name == f".{attr_name}":
+            return module
+        else:
+            return getattr(module, attr_name)
+    except ImportError as e:
+        raise ImportError(f"Failed to import {attr_name} from {module_name}: {e}") from e
+    except AttributeError as e:
+        raise AttributeError(f"Failed to get {attr_name} from {module_name}: {e}") from e
+def __dir__():
+    lazy_attrs = list(_dynamic_imports.keys())
+    return sorted(lazy_attrs)
 __all__ = [
     "SpeechToTextStreamingFlushSignal",
     "SpeechToTextStreamingHighVadSensitivity",
-    "SpeechToTextStreamingInputAudioCodec",
     "SpeechToTextStreamingLanguageCode",
-    "SpeechToTextStreamingStreamOngoingSpeechResults",
     "SpeechToTextStreamingVadSignals",
 ]

sarvamai/speech_to_text_translate_job/job.py CHANGED Viewed

@@ -150,9 +150,58 @@ class AsyncSpeechToTextTranslateJob:
                 "output_file": detail.outputs[0].file_name,
             }
             for detail in (job_status.job_details or [])
-            if detail.inputs and detail.outputs
+            if detail.inputs and detail.outputs and detail.state == "Success"
         ]
+    async def get_file_results(
+        self,
+    ) -> typing.Dict[str, typing.List[typing.Dict[str, typing.Any]]]:
+        """
+        Get detailed results for each file in the batch job.
+        Returns
+        -------
+        Dict[str, List[Dict[str, Any]]]
+            Dictionary with 'successful' and 'failed' keys, each containing a list of file details.
+            Each file detail includes:
+            - 'file_name': Name of the input file
+            - 'status': Status of processing ('Success' or 'Failed')
+            - 'error_message': Error message if failed (None if successful)
+            - 'output_file': Name of output file if successful (None if failed)
+        """
+        job_status = await self.get_status()
+        results: typing.Dict[str, typing.List[typing.Dict[str, typing.Any]]] = {
+            "successful": [],
+            "failed": [],
+        }
+        for detail in job_status.job_details or []:
+            # Check for empty lists explicitly
+            if not detail.inputs or len(detail.inputs) == 0:
+                continue
+            try:
+                file_info = {
+                    "file_name": detail.inputs[0].file_name,
+                    "status": detail.state,
+                    "error_message": detail.error_message,
+                    "output_file": (
+                        detail.outputs[0].file_name
+                        if detail.outputs and len(detail.outputs) > 0
+                        else None
+                    ),
+                }
+                if detail.state == "Success":
+                    results["successful"].append(file_info)
+                else:
+                    results["failed"].append(file_info)
+            except (IndexError, AttributeError):
+                # Skip malformed job details
+                continue
+        return results
     async def download_outputs(self, output_dir: str) -> bool:
         """
         Download output files to the specified directory.
@@ -395,9 +444,58 @@ class SpeechToTextTranslateJob:
                 "output_file": detail.outputs[0].file_name,
             }
             for detail in (job_status.job_details or [])
-            if detail.inputs and detail.outputs
+            if detail.inputs and detail.outputs and detail.state == "Success"
         ]
+    def get_file_results(
+        self,
+    ) -> typing.Dict[str, typing.List[typing.Dict[str, typing.Any]]]:
+        """
+        Get detailed results for each file in the batch job.
+        Returns
+        -------
+        Dict[str, List[Dict[str, Any]]]
+            Dictionary with 'successful' and 'failed' keys, each containing a list of file details.
+            Each file detail includes:
+            - 'file_name': Name of the input file
+            - 'status': Status of processing ('Success' or 'Failed')
+            - 'error_message': Error message if failed (None if successful)
+            - 'output_file': Name of output file if successful (None if failed)
+        """
+        job_status = self.get_status()
+        results: typing.Dict[str, typing.List[typing.Dict[str, typing.Any]]] = {
+            "successful": [],
+            "failed": [],
+        }
+        for detail in job_status.job_details or []:
+            # Check for empty lists explicitly
+            if not detail.inputs or len(detail.inputs) == 0:
+                continue
+            try:
+                file_info = {
+                    "file_name": detail.inputs[0].file_name,
+                    "status": detail.state,
+                    "error_message": detail.error_message,
+                    "output_file": (
+                        detail.outputs[0].file_name
+                        if detail.outputs and len(detail.outputs) > 0
+                        else None
+                    ),
+                }
+                if detail.state == "Success":
+                    results["successful"].append(file_info)
+                else:
+                    results["failed"].append(file_info)
+            except (IndexError, AttributeError):
+                # Skip malformed job details
+                continue
+        return results
     def download_outputs(self, output_dir: str) -> bool:
         """
         Download output files to the specified directory.

sarvamai 0.1.22a3__py3-none-any.whl → 0.1.23a1__py3-none-any.whl

sarvamai 0.1.22a3__py3-none-any.whl → 0.1.23a1__py3-none-any.whl