sarvamai 0.1.23a6__py3-none-any.whl → 0.1.23a8__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- sarvamai/__init__.py +52 -0
- sarvamai/client.py +3 -0
- sarvamai/core/client_wrapper.py +2 -2
- sarvamai/doc_digitization_job/__init__.py +4 -0
- sarvamai/doc_digitization_job/client.py +776 -0
- sarvamai/doc_digitization_job/job.py +496 -0
- sarvamai/doc_digitization_job/raw_client.py +1176 -0
- sarvamai/requests/__init__.py +20 -0
- sarvamai/requests/doc_digitization_create_job_response.py +25 -0
- sarvamai/requests/doc_digitization_download_files_response.py +37 -0
- sarvamai/requests/doc_digitization_error_details.py +21 -0
- sarvamai/requests/doc_digitization_error_message.py +11 -0
- sarvamai/requests/doc_digitization_job_detail.py +64 -0
- sarvamai/requests/doc_digitization_job_parameters.py +21 -0
- sarvamai/requests/doc_digitization_job_status_response.py +65 -0
- sarvamai/requests/doc_digitization_page_error.py +24 -0
- sarvamai/requests/doc_digitization_upload_files_response.py +34 -0
- sarvamai/requests/doc_digitization_webhook_callback.py +19 -0
- sarvamai/requests/speech_to_text_response.py +14 -6
- sarvamai/requests/speech_to_text_transcription_data.py +0 -14
- sarvamai/requests/speech_to_text_translate_response.py +9 -6
- sarvamai/requests/speech_to_text_translate_transcription_data.py +0 -13
- sarvamai/speech_to_text_streaming/client.py +2 -30
- sarvamai/speech_to_text_streaming/raw_client.py +2 -30
- sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_language_code.py +1 -25
- sarvamai/types/__init__.py +30 -0
- sarvamai/types/doc_digitization_create_job_response.py +37 -0
- sarvamai/types/doc_digitization_download_files_response.py +47 -0
- sarvamai/types/doc_digitization_error_code.py +15 -0
- sarvamai/types/doc_digitization_error_details.py +33 -0
- sarvamai/types/doc_digitization_error_message.py +23 -0
- sarvamai/types/doc_digitization_job_detail.py +74 -0
- sarvamai/types/doc_digitization_job_detail_state.py +7 -0
- sarvamai/types/doc_digitization_job_parameters.py +33 -0
- sarvamai/types/doc_digitization_job_state.py +7 -0
- sarvamai/types/doc_digitization_job_status_response.py +75 -0
- sarvamai/types/doc_digitization_output_format.py +5 -0
- sarvamai/types/doc_digitization_page_error.py +36 -0
- sarvamai/types/doc_digitization_supported_language.py +32 -0
- sarvamai/types/doc_digitization_upload_files_response.py +44 -0
- sarvamai/types/doc_digitization_webhook_callback.py +31 -0
- sarvamai/types/speech_to_text_language.py +1 -24
- sarvamai/types/speech_to_text_response.py +14 -6
- sarvamai/types/speech_to_text_transcription_data.py +0 -14
- sarvamai/types/speech_to_text_translate_language.py +1 -25
- sarvamai/types/speech_to_text_translate_response.py +9 -6
- sarvamai/types/speech_to_text_translate_transcription_data.py +0 -13
- {sarvamai-0.1.23a6.dist-info → sarvamai-0.1.23a8.dist-info}/METADATA +1 -1
- {sarvamai-0.1.23a6.dist-info → sarvamai-0.1.23a8.dist-info}/RECORD +50 -21
- {sarvamai-0.1.23a6.dist-info → sarvamai-0.1.23a8.dist-info}/WHEEL +0 -0
sarvamai/requests/__init__.py
CHANGED
|
@@ -27,6 +27,16 @@ from .configure_connection_data import ConfigureConnectionDataParams
|
|
|
27
27
|
from .create_chat_completion_response import CreateChatCompletionResponseParams
|
|
28
28
|
from .diarized_entry import DiarizedEntryParams
|
|
29
29
|
from .diarized_transcript import DiarizedTranscriptParams
|
|
30
|
+
from .doc_digitization_create_job_response import DocDigitizationCreateJobResponseParams
|
|
31
|
+
from .doc_digitization_download_files_response import DocDigitizationDownloadFilesResponseParams
|
|
32
|
+
from .doc_digitization_error_details import DocDigitizationErrorDetailsParams
|
|
33
|
+
from .doc_digitization_error_message import DocDigitizationErrorMessageParams
|
|
34
|
+
from .doc_digitization_job_detail import DocDigitizationJobDetailParams
|
|
35
|
+
from .doc_digitization_job_parameters import DocDigitizationJobParametersParams
|
|
36
|
+
from .doc_digitization_job_status_response import DocDigitizationJobStatusResponseParams
|
|
37
|
+
from .doc_digitization_page_error import DocDigitizationPageErrorParams
|
|
38
|
+
from .doc_digitization_upload_files_response import DocDigitizationUploadFilesResponseParams
|
|
39
|
+
from .doc_digitization_webhook_callback import DocDigitizationWebhookCallbackParams
|
|
30
40
|
from .error_data import ErrorDataParams
|
|
31
41
|
from .error_details import ErrorDetailsParams
|
|
32
42
|
from .error_message import ErrorMessageParams
|
|
@@ -89,6 +99,16 @@ __all__ = [
|
|
|
89
99
|
"CreateChatCompletionResponseParams",
|
|
90
100
|
"DiarizedEntryParams",
|
|
91
101
|
"DiarizedTranscriptParams",
|
|
102
|
+
"DocDigitizationCreateJobResponseParams",
|
|
103
|
+
"DocDigitizationDownloadFilesResponseParams",
|
|
104
|
+
"DocDigitizationErrorDetailsParams",
|
|
105
|
+
"DocDigitizationErrorMessageParams",
|
|
106
|
+
"DocDigitizationJobDetailParams",
|
|
107
|
+
"DocDigitizationJobParametersParams",
|
|
108
|
+
"DocDigitizationJobStatusResponseParams",
|
|
109
|
+
"DocDigitizationPageErrorParams",
|
|
110
|
+
"DocDigitizationUploadFilesResponseParams",
|
|
111
|
+
"DocDigitizationWebhookCallbackParams",
|
|
92
112
|
"ErrorDataParams",
|
|
93
113
|
"ErrorDetailsParams",
|
|
94
114
|
"ErrorMessageParams",
|
|
@@ -0,0 +1,25 @@
|
|
|
1
|
+
# This file was auto-generated by Fern from our API Definition.
|
|
2
|
+
|
|
3
|
+
import typing_extensions
|
|
4
|
+
from ..types.doc_digitization_job_state import DocDigitizationJobState
|
|
5
|
+
from ..types.storage_container_type import StorageContainerType
|
|
6
|
+
from .doc_digitization_job_parameters import DocDigitizationJobParametersParams
|
|
7
|
+
|
|
8
|
+
|
|
9
|
+
class DocDigitizationCreateJobResponseParams(typing_extensions.TypedDict):
|
|
10
|
+
job_id: str
|
|
11
|
+
"""
|
|
12
|
+
Unique job identifier (UUID)
|
|
13
|
+
"""
|
|
14
|
+
|
|
15
|
+
storage_container_type: StorageContainerType
|
|
16
|
+
"""
|
|
17
|
+
Storage Container Type
|
|
18
|
+
"""
|
|
19
|
+
|
|
20
|
+
job_parameters: DocDigitizationJobParametersParams
|
|
21
|
+
"""
|
|
22
|
+
Job configuration parameters
|
|
23
|
+
"""
|
|
24
|
+
|
|
25
|
+
job_state: DocDigitizationJobState
|
|
@@ -0,0 +1,37 @@
|
|
|
1
|
+
# This file was auto-generated by Fern from our API Definition.
|
|
2
|
+
|
|
3
|
+
import typing
|
|
4
|
+
|
|
5
|
+
import typing_extensions
|
|
6
|
+
from ..types.doc_digitization_job_state import DocDigitizationJobState
|
|
7
|
+
from ..types.storage_container_type import StorageContainerType
|
|
8
|
+
from .file_signed_url_details import FileSignedUrlDetailsParams
|
|
9
|
+
|
|
10
|
+
|
|
11
|
+
class DocDigitizationDownloadFilesResponseParams(typing_extensions.TypedDict):
|
|
12
|
+
"""
|
|
13
|
+
Response for download-files endpoint.
|
|
14
|
+
"""
|
|
15
|
+
|
|
16
|
+
job_id: str
|
|
17
|
+
"""
|
|
18
|
+
Job identifier (UUID)
|
|
19
|
+
"""
|
|
20
|
+
|
|
21
|
+
job_state: DocDigitizationJobState
|
|
22
|
+
"""
|
|
23
|
+
Current job state
|
|
24
|
+
"""
|
|
25
|
+
|
|
26
|
+
storage_container_type: StorageContainerType
|
|
27
|
+
"""
|
|
28
|
+
Storage backend type
|
|
29
|
+
"""
|
|
30
|
+
|
|
31
|
+
download_urls: typing.Dict[str, FileSignedUrlDetailsParams]
|
|
32
|
+
"""
|
|
33
|
+
Map of filename to presigned download URL details
|
|
34
|
+
"""
|
|
35
|
+
|
|
36
|
+
error_code: typing_extensions.NotRequired[str]
|
|
37
|
+
error_message: typing_extensions.NotRequired[str]
|
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
# This file was auto-generated by Fern from our API Definition.
|
|
2
|
+
|
|
3
|
+
import typing_extensions
|
|
4
|
+
from ..types.doc_digitization_error_code import DocDigitizationErrorCode
|
|
5
|
+
|
|
6
|
+
|
|
7
|
+
class DocDigitizationErrorDetailsParams(typing_extensions.TypedDict):
|
|
8
|
+
message: str
|
|
9
|
+
"""
|
|
10
|
+
Message describing the error
|
|
11
|
+
"""
|
|
12
|
+
|
|
13
|
+
code: DocDigitizationErrorCode
|
|
14
|
+
"""
|
|
15
|
+
Error code for the specific error that has occurred.
|
|
16
|
+
"""
|
|
17
|
+
|
|
18
|
+
request_id: typing_extensions.NotRequired[str]
|
|
19
|
+
"""
|
|
20
|
+
Unique identifier for the request. Format: date_UUID4
|
|
21
|
+
"""
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
# This file was auto-generated by Fern from our API Definition.
|
|
2
|
+
|
|
3
|
+
import typing_extensions
|
|
4
|
+
from .doc_digitization_error_details import DocDigitizationErrorDetailsParams
|
|
5
|
+
|
|
6
|
+
|
|
7
|
+
class DocDigitizationErrorMessageParams(typing_extensions.TypedDict):
|
|
8
|
+
error: DocDigitizationErrorDetailsParams
|
|
9
|
+
"""
|
|
10
|
+
Error details
|
|
11
|
+
"""
|
|
@@ -0,0 +1,64 @@
|
|
|
1
|
+
# This file was auto-generated by Fern from our API Definition.
|
|
2
|
+
|
|
3
|
+
import typing
|
|
4
|
+
|
|
5
|
+
import typing_extensions
|
|
6
|
+
from ..types.doc_digitization_job_detail_state import DocDigitizationJobDetailState
|
|
7
|
+
from .doc_digitization_page_error import DocDigitizationPageErrorParams
|
|
8
|
+
from .task_file_details import TaskFileDetailsParams
|
|
9
|
+
|
|
10
|
+
|
|
11
|
+
class DocDigitizationJobDetailParams(typing_extensions.TypedDict):
|
|
12
|
+
"""
|
|
13
|
+
Processing details for a single input file with page-level metrics.
|
|
14
|
+
"""
|
|
15
|
+
|
|
16
|
+
inputs: typing.Sequence[TaskFileDetailsParams]
|
|
17
|
+
"""
|
|
18
|
+
Input file(s) for this task
|
|
19
|
+
"""
|
|
20
|
+
|
|
21
|
+
outputs: typing.Sequence[TaskFileDetailsParams]
|
|
22
|
+
"""
|
|
23
|
+
Output file(s) produced
|
|
24
|
+
"""
|
|
25
|
+
|
|
26
|
+
state: DocDigitizationJobDetailState
|
|
27
|
+
"""
|
|
28
|
+
Processing state for this file
|
|
29
|
+
"""
|
|
30
|
+
|
|
31
|
+
total_pages: typing_extensions.NotRequired[int]
|
|
32
|
+
"""
|
|
33
|
+
Total pages/images in the input file
|
|
34
|
+
"""
|
|
35
|
+
|
|
36
|
+
pages_processed: typing_extensions.NotRequired[int]
|
|
37
|
+
"""
|
|
38
|
+
Number of pages processed so far
|
|
39
|
+
"""
|
|
40
|
+
|
|
41
|
+
pages_succeeded: typing_extensions.NotRequired[int]
|
|
42
|
+
"""
|
|
43
|
+
Number of pages successfully processed
|
|
44
|
+
"""
|
|
45
|
+
|
|
46
|
+
pages_failed: typing_extensions.NotRequired[int]
|
|
47
|
+
"""
|
|
48
|
+
Number of pages that failed processing
|
|
49
|
+
"""
|
|
50
|
+
|
|
51
|
+
error_message: typing_extensions.NotRequired[str]
|
|
52
|
+
"""
|
|
53
|
+
Error message if processing failed
|
|
54
|
+
"""
|
|
55
|
+
|
|
56
|
+
error_code: typing_extensions.NotRequired[str]
|
|
57
|
+
"""
|
|
58
|
+
Standardized error code if failed
|
|
59
|
+
"""
|
|
60
|
+
|
|
61
|
+
page_errors: typing_extensions.NotRequired[typing.Sequence[DocDigitizationPageErrorParams]]
|
|
62
|
+
"""
|
|
63
|
+
Detailed errors for each failed page
|
|
64
|
+
"""
|
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
# This file was auto-generated by Fern from our API Definition.
|
|
2
|
+
|
|
3
|
+
import typing_extensions
|
|
4
|
+
from ..types.doc_digitization_output_format import DocDigitizationOutputFormat
|
|
5
|
+
from ..types.doc_digitization_supported_language import DocDigitizationSupportedLanguage
|
|
6
|
+
|
|
7
|
+
|
|
8
|
+
class DocDigitizationJobParametersParams(typing_extensions.TypedDict):
|
|
9
|
+
"""
|
|
10
|
+
Job parameters for document digitization.
|
|
11
|
+
"""
|
|
12
|
+
|
|
13
|
+
language: typing_extensions.NotRequired[DocDigitizationSupportedLanguage]
|
|
14
|
+
"""
|
|
15
|
+
ISO language code for the document
|
|
16
|
+
"""
|
|
17
|
+
|
|
18
|
+
output_format: typing_extensions.NotRequired[DocDigitizationOutputFormat]
|
|
19
|
+
"""
|
|
20
|
+
Output format: html or md
|
|
21
|
+
"""
|
|
@@ -0,0 +1,65 @@
|
|
|
1
|
+
# This file was auto-generated by Fern from our API Definition.
|
|
2
|
+
|
|
3
|
+
import datetime as dt
|
|
4
|
+
import typing
|
|
5
|
+
|
|
6
|
+
import typing_extensions
|
|
7
|
+
from ..types.doc_digitization_job_state import DocDigitizationJobState
|
|
8
|
+
from ..types.storage_container_type import StorageContainerType
|
|
9
|
+
from .doc_digitization_job_detail import DocDigitizationJobDetailParams
|
|
10
|
+
|
|
11
|
+
|
|
12
|
+
class DocDigitizationJobStatusResponseParams(typing_extensions.TypedDict):
|
|
13
|
+
"""
|
|
14
|
+
Response model for job status endpoint.
|
|
15
|
+
"""
|
|
16
|
+
|
|
17
|
+
job_id: str
|
|
18
|
+
"""
|
|
19
|
+
Job identifier (UUID)
|
|
20
|
+
"""
|
|
21
|
+
|
|
22
|
+
job_state: DocDigitizationJobState
|
|
23
|
+
"""
|
|
24
|
+
Current job state
|
|
25
|
+
"""
|
|
26
|
+
|
|
27
|
+
created_at: dt.datetime
|
|
28
|
+
"""
|
|
29
|
+
Job creation timestamp (ISO 8601)
|
|
30
|
+
"""
|
|
31
|
+
|
|
32
|
+
updated_at: dt.datetime
|
|
33
|
+
"""
|
|
34
|
+
Last update timestamp (ISO 8601)
|
|
35
|
+
"""
|
|
36
|
+
|
|
37
|
+
storage_container_type: StorageContainerType
|
|
38
|
+
"""
|
|
39
|
+
Storage backend type
|
|
40
|
+
"""
|
|
41
|
+
|
|
42
|
+
total_files: typing_extensions.NotRequired[int]
|
|
43
|
+
"""
|
|
44
|
+
Total input files (always 1)
|
|
45
|
+
"""
|
|
46
|
+
|
|
47
|
+
successful_files_count: typing_extensions.NotRequired[int]
|
|
48
|
+
"""
|
|
49
|
+
Files that completed successfully
|
|
50
|
+
"""
|
|
51
|
+
|
|
52
|
+
failed_files_count: typing_extensions.NotRequired[int]
|
|
53
|
+
"""
|
|
54
|
+
Files that failed
|
|
55
|
+
"""
|
|
56
|
+
|
|
57
|
+
error_message: typing_extensions.NotRequired[str]
|
|
58
|
+
"""
|
|
59
|
+
Job-level error message
|
|
60
|
+
"""
|
|
61
|
+
|
|
62
|
+
job_details: typing_extensions.NotRequired[typing.Sequence[DocDigitizationJobDetailParams]]
|
|
63
|
+
"""
|
|
64
|
+
Per-file processing details with page metrics
|
|
65
|
+
"""
|
|
@@ -0,0 +1,24 @@
|
|
|
1
|
+
# This file was auto-generated by Fern from our API Definition.
|
|
2
|
+
|
|
3
|
+
import typing_extensions
|
|
4
|
+
|
|
5
|
+
|
|
6
|
+
class DocDigitizationPageErrorParams(typing_extensions.TypedDict):
|
|
7
|
+
"""
|
|
8
|
+
Error details for a specific page.
|
|
9
|
+
"""
|
|
10
|
+
|
|
11
|
+
page_number: int
|
|
12
|
+
"""
|
|
13
|
+
Page number that failed
|
|
14
|
+
"""
|
|
15
|
+
|
|
16
|
+
error_code: str
|
|
17
|
+
"""
|
|
18
|
+
Standardized error code
|
|
19
|
+
"""
|
|
20
|
+
|
|
21
|
+
error_message: str
|
|
22
|
+
"""
|
|
23
|
+
Human-readable error description
|
|
24
|
+
"""
|
|
@@ -0,0 +1,34 @@
|
|
|
1
|
+
# This file was auto-generated by Fern from our API Definition.
|
|
2
|
+
|
|
3
|
+
import typing
|
|
4
|
+
|
|
5
|
+
import typing_extensions
|
|
6
|
+
from ..types.doc_digitization_job_state import DocDigitizationJobState
|
|
7
|
+
from ..types.storage_container_type import StorageContainerType
|
|
8
|
+
from .file_signed_url_details import FileSignedUrlDetailsParams
|
|
9
|
+
|
|
10
|
+
|
|
11
|
+
class DocDigitizationUploadFilesResponseParams(typing_extensions.TypedDict):
|
|
12
|
+
"""
|
|
13
|
+
Response with presigned upload URLs
|
|
14
|
+
"""
|
|
15
|
+
|
|
16
|
+
job_id: str
|
|
17
|
+
"""
|
|
18
|
+
Job identifier
|
|
19
|
+
"""
|
|
20
|
+
|
|
21
|
+
job_state: DocDigitizationJobState
|
|
22
|
+
"""
|
|
23
|
+
Current job state
|
|
24
|
+
"""
|
|
25
|
+
|
|
26
|
+
upload_urls: typing.Dict[str, FileSignedUrlDetailsParams]
|
|
27
|
+
"""
|
|
28
|
+
Map of filename to presigned upload URL details
|
|
29
|
+
"""
|
|
30
|
+
|
|
31
|
+
storage_container_type: StorageContainerType
|
|
32
|
+
"""
|
|
33
|
+
Storage backend type
|
|
34
|
+
"""
|
|
@@ -0,0 +1,19 @@
|
|
|
1
|
+
# This file was auto-generated by Fern from our API Definition.
|
|
2
|
+
|
|
3
|
+
import typing_extensions
|
|
4
|
+
|
|
5
|
+
|
|
6
|
+
class DocDigitizationWebhookCallbackParams(typing_extensions.TypedDict):
|
|
7
|
+
"""
|
|
8
|
+
Webhook configuration for job completion notification
|
|
9
|
+
"""
|
|
10
|
+
|
|
11
|
+
url: str
|
|
12
|
+
"""
|
|
13
|
+
HTTPS webhook URL to call upon job completion (HTTP not allowed)
|
|
14
|
+
"""
|
|
15
|
+
|
|
16
|
+
auth_token: typing_extensions.NotRequired[str]
|
|
17
|
+
"""
|
|
18
|
+
Authorization token sent as X-SARVAM-JOB-CALLBACK-TOKEN header
|
|
19
|
+
"""
|
|
@@ -1,20 +1,28 @@
|
|
|
1
1
|
# This file was auto-generated by Fern from our API Definition.
|
|
2
2
|
|
|
3
3
|
import typing_extensions
|
|
4
|
+
from .diarized_transcript import DiarizedTranscriptParams
|
|
5
|
+
from .timestamps_model import TimestampsModelParams
|
|
4
6
|
|
|
5
7
|
|
|
6
8
|
class SpeechToTextResponseParams(typing_extensions.TypedDict):
|
|
7
|
-
request_id: str
|
|
9
|
+
request_id: typing_extensions.NotRequired[str]
|
|
10
|
+
transcript: str
|
|
8
11
|
"""
|
|
9
|
-
|
|
12
|
+
The transcribed text from the provided audio file.
|
|
10
13
|
"""
|
|
11
14
|
|
|
12
|
-
|
|
15
|
+
timestamps: typing_extensions.NotRequired[TimestampsModelParams]
|
|
13
16
|
"""
|
|
14
|
-
|
|
17
|
+
Contains timestamps for the transcribed text. This field is included only if with_timestamps is set to true
|
|
18
|
+
"""
|
|
19
|
+
|
|
20
|
+
diarized_transcript: typing_extensions.NotRequired[DiarizedTranscriptParams]
|
|
21
|
+
"""
|
|
22
|
+
Diarized transcript of the provided speech
|
|
15
23
|
"""
|
|
16
24
|
|
|
17
|
-
language_code: str
|
|
25
|
+
language_code: typing_extensions.NotRequired[str]
|
|
18
26
|
"""
|
|
19
|
-
|
|
27
|
+
This will return the BCP-47 code of language spoken in the input. If multiple languages are detected, this will return language code of most predominant spoken language. If no language is detected, this will be null
|
|
20
28
|
"""
|
|
@@ -32,18 +32,4 @@ class SpeechToTextTranscriptionDataParams(typing_extensions.TypedDict):
|
|
|
32
32
|
BCP-47 code of detected language
|
|
33
33
|
"""
|
|
34
34
|
|
|
35
|
-
language_probability: typing_extensions.NotRequired[float]
|
|
36
|
-
"""
|
|
37
|
-
Float value (0.0 to 1.0) indicating the probability of the detected language being correct. Higher values indicate higher confidence.
|
|
38
|
-
|
|
39
|
-
**When it returns a value:**
|
|
40
|
-
- When `language_code` is not provided in the request
|
|
41
|
-
- When `language_code` is set to `unknown`
|
|
42
|
-
|
|
43
|
-
**When it returns null:**
|
|
44
|
-
- When a specific `language_code` is provided (language detection is skipped)
|
|
45
|
-
|
|
46
|
-
The parameter is always present in the response.
|
|
47
|
-
"""
|
|
48
|
-
|
|
49
35
|
metrics: TranscriptionMetricsParams
|
|
@@ -1,20 +1,23 @@
|
|
|
1
1
|
# This file was auto-generated by Fern from our API Definition.
|
|
2
2
|
|
|
3
3
|
import typing_extensions
|
|
4
|
+
from ..types.speech_to_text_translate_language import SpeechToTextTranslateLanguage
|
|
5
|
+
from .diarized_transcript import DiarizedTranscriptParams
|
|
4
6
|
|
|
5
7
|
|
|
6
8
|
class SpeechToTextTranslateResponseParams(typing_extensions.TypedDict):
|
|
7
|
-
request_id: str
|
|
9
|
+
request_id: typing_extensions.NotRequired[str]
|
|
10
|
+
transcript: str
|
|
8
11
|
"""
|
|
9
|
-
|
|
12
|
+
Transcript of the provided speech
|
|
10
13
|
"""
|
|
11
14
|
|
|
12
|
-
|
|
15
|
+
language_code: typing_extensions.NotRequired[SpeechToTextTranslateLanguage]
|
|
13
16
|
"""
|
|
14
|
-
|
|
17
|
+
This will return the BCP-47 code of language spoken in the input. If multiple languages are detected, this will return language code of most predominant spoken language. If no language is detected, this will be null
|
|
15
18
|
"""
|
|
16
19
|
|
|
17
|
-
|
|
20
|
+
diarized_transcript: typing_extensions.NotRequired[DiarizedTranscriptParams]
|
|
18
21
|
"""
|
|
19
|
-
|
|
22
|
+
Diarized transcript of the provided speech
|
|
20
23
|
"""
|
|
@@ -20,17 +20,4 @@ class SpeechToTextTranslateTranscriptionDataParams(typing_extensions.TypedDict):
|
|
|
20
20
|
BCP-47 code of detected source language (null when language detection is in progress)
|
|
21
21
|
"""
|
|
22
22
|
|
|
23
|
-
language_probability: typing_extensions.NotRequired[float]
|
|
24
|
-
"""
|
|
25
|
-
Float value (0.0 to 1.0) indicating the probability of the detected source language being correct. Higher values indicate higher confidence.
|
|
26
|
-
|
|
27
|
-
**When it returns a value:**
|
|
28
|
-
- Always returns a value as source language is auto-detected for translation
|
|
29
|
-
|
|
30
|
-
**When it returns null:**
|
|
31
|
-
- When language detection confidence is unavailable
|
|
32
|
-
|
|
33
|
-
The parameter is always present in the response.
|
|
34
|
-
"""
|
|
35
|
-
|
|
36
23
|
metrics: TranscriptionMetricsParams
|
|
@@ -67,7 +67,7 @@ class SpeechToTextStreamingClient:
|
|
|
67
67
|
language_code : SpeechToTextStreamingLanguageCode
|
|
68
68
|
Specifies the language of the input audio in BCP-47 format.
|
|
69
69
|
|
|
70
|
-
**Available Options
|
|
70
|
+
**Available Options:**
|
|
71
71
|
- `hi-IN`: Hindi
|
|
72
72
|
- `bn-IN`: Bengali
|
|
73
73
|
- `gu-IN`: Gujarati
|
|
@@ -80,20 +80,6 @@ class SpeechToTextStreamingClient:
|
|
|
80
80
|
- `te-IN`: Telugu
|
|
81
81
|
- `en-IN`: English
|
|
82
82
|
|
|
83
|
-
**Additional Options (saaras:v3 only):**
|
|
84
|
-
- `as-IN`: Assamese
|
|
85
|
-
- `ur-IN`: Urdu
|
|
86
|
-
- `ne-IN`: Nepali
|
|
87
|
-
- `kok-IN`: Konkani
|
|
88
|
-
- `ks-IN`: Kashmiri
|
|
89
|
-
- `sd-IN`: Sindhi
|
|
90
|
-
- `sa-IN`: Sanskrit
|
|
91
|
-
- `sat-IN`: Santali
|
|
92
|
-
- `mni-IN`: Manipuri
|
|
93
|
-
- `brx-IN`: Bodo
|
|
94
|
-
- `mai-IN`: Maithili
|
|
95
|
-
- `doi-IN`: Dogri
|
|
96
|
-
|
|
97
83
|
model : typing.Optional[SpeechToTextStreamingModel]
|
|
98
84
|
Specifies the model to use for speech-to-text conversion.
|
|
99
85
|
|
|
@@ -231,7 +217,7 @@ class AsyncSpeechToTextStreamingClient:
|
|
|
231
217
|
language_code : SpeechToTextStreamingLanguageCode
|
|
232
218
|
Specifies the language of the input audio in BCP-47 format.
|
|
233
219
|
|
|
234
|
-
**Available Options
|
|
220
|
+
**Available Options:**
|
|
235
221
|
- `hi-IN`: Hindi
|
|
236
222
|
- `bn-IN`: Bengali
|
|
237
223
|
- `gu-IN`: Gujarati
|
|
@@ -244,20 +230,6 @@ class AsyncSpeechToTextStreamingClient:
|
|
|
244
230
|
- `te-IN`: Telugu
|
|
245
231
|
- `en-IN`: English
|
|
246
232
|
|
|
247
|
-
**Additional Options (saaras:v3 only):**
|
|
248
|
-
- `as-IN`: Assamese
|
|
249
|
-
- `ur-IN`: Urdu
|
|
250
|
-
- `ne-IN`: Nepali
|
|
251
|
-
- `kok-IN`: Konkani
|
|
252
|
-
- `ks-IN`: Kashmiri
|
|
253
|
-
- `sd-IN`: Sindhi
|
|
254
|
-
- `sa-IN`: Sanskrit
|
|
255
|
-
- `sat-IN`: Santali
|
|
256
|
-
- `mni-IN`: Manipuri
|
|
257
|
-
- `brx-IN`: Bodo
|
|
258
|
-
- `mai-IN`: Maithili
|
|
259
|
-
- `doi-IN`: Dogri
|
|
260
|
-
|
|
261
233
|
model : typing.Optional[SpeechToTextStreamingModel]
|
|
262
234
|
Specifies the model to use for speech-to-text conversion.
|
|
263
235
|
|
|
@@ -55,7 +55,7 @@ class RawSpeechToTextStreamingClient:
|
|
|
55
55
|
language_code : SpeechToTextStreamingLanguageCode
|
|
56
56
|
Specifies the language of the input audio in BCP-47 format.
|
|
57
57
|
|
|
58
|
-
**Available Options
|
|
58
|
+
**Available Options:**
|
|
59
59
|
- `hi-IN`: Hindi
|
|
60
60
|
- `bn-IN`: Bengali
|
|
61
61
|
- `gu-IN`: Gujarati
|
|
@@ -68,20 +68,6 @@ class RawSpeechToTextStreamingClient:
|
|
|
68
68
|
- `te-IN`: Telugu
|
|
69
69
|
- `en-IN`: English
|
|
70
70
|
|
|
71
|
-
**Additional Options (saaras:v3 only):**
|
|
72
|
-
- `as-IN`: Assamese
|
|
73
|
-
- `ur-IN`: Urdu
|
|
74
|
-
- `ne-IN`: Nepali
|
|
75
|
-
- `kok-IN`: Konkani
|
|
76
|
-
- `ks-IN`: Kashmiri
|
|
77
|
-
- `sd-IN`: Sindhi
|
|
78
|
-
- `sa-IN`: Sanskrit
|
|
79
|
-
- `sat-IN`: Santali
|
|
80
|
-
- `mni-IN`: Manipuri
|
|
81
|
-
- `brx-IN`: Bodo
|
|
82
|
-
- `mai-IN`: Maithili
|
|
83
|
-
- `doi-IN`: Dogri
|
|
84
|
-
|
|
85
71
|
model : typing.Optional[SpeechToTextStreamingModel]
|
|
86
72
|
Specifies the model to use for speech-to-text conversion.
|
|
87
73
|
|
|
@@ -208,7 +194,7 @@ class AsyncRawSpeechToTextStreamingClient:
|
|
|
208
194
|
language_code : SpeechToTextStreamingLanguageCode
|
|
209
195
|
Specifies the language of the input audio in BCP-47 format.
|
|
210
196
|
|
|
211
|
-
**Available Options
|
|
197
|
+
**Available Options:**
|
|
212
198
|
- `hi-IN`: Hindi
|
|
213
199
|
- `bn-IN`: Bengali
|
|
214
200
|
- `gu-IN`: Gujarati
|
|
@@ -221,20 +207,6 @@ class AsyncRawSpeechToTextStreamingClient:
|
|
|
221
207
|
- `te-IN`: Telugu
|
|
222
208
|
- `en-IN`: English
|
|
223
209
|
|
|
224
|
-
**Additional Options (saaras:v3 only):**
|
|
225
|
-
- `as-IN`: Assamese
|
|
226
|
-
- `ur-IN`: Urdu
|
|
227
|
-
- `ne-IN`: Nepali
|
|
228
|
-
- `kok-IN`: Konkani
|
|
229
|
-
- `ks-IN`: Kashmiri
|
|
230
|
-
- `sd-IN`: Sindhi
|
|
231
|
-
- `sa-IN`: Sanskrit
|
|
232
|
-
- `sat-IN`: Santali
|
|
233
|
-
- `mni-IN`: Manipuri
|
|
234
|
-
- `brx-IN`: Bodo
|
|
235
|
-
- `mai-IN`: Maithili
|
|
236
|
-
- `doi-IN`: Dogri
|
|
237
|
-
|
|
238
210
|
model : typing.Optional[SpeechToTextStreamingModel]
|
|
239
211
|
Specifies the model to use for speech-to-text conversion.
|
|
240
212
|
|
|
@@ -3,30 +3,6 @@
|
|
|
3
3
|
import typing
|
|
4
4
|
|
|
5
5
|
SpeechToTextStreamingLanguageCode = typing.Union[
|
|
6
|
-
typing.Literal[
|
|
7
|
-
"en-IN",
|
|
8
|
-
"hi-IN",
|
|
9
|
-
"bn-IN",
|
|
10
|
-
"gu-IN",
|
|
11
|
-
"kn-IN",
|
|
12
|
-
"ml-IN",
|
|
13
|
-
"mr-IN",
|
|
14
|
-
"od-IN",
|
|
15
|
-
"pa-IN",
|
|
16
|
-
"ta-IN",
|
|
17
|
-
"te-IN",
|
|
18
|
-
"as-IN",
|
|
19
|
-
"ur-IN",
|
|
20
|
-
"ne-IN",
|
|
21
|
-
"kok-IN",
|
|
22
|
-
"ks-IN",
|
|
23
|
-
"sd-IN",
|
|
24
|
-
"sa-IN",
|
|
25
|
-
"sat-IN",
|
|
26
|
-
"mni-IN",
|
|
27
|
-
"brx-IN",
|
|
28
|
-
"mai-IN",
|
|
29
|
-
"doi-IN",
|
|
30
|
-
],
|
|
6
|
+
typing.Literal["en-IN", "hi-IN", "bn-IN", "gu-IN", "kn-IN", "ml-IN", "mr-IN", "od-IN", "pa-IN", "ta-IN", "te-IN"],
|
|
31
7
|
typing.Any,
|
|
32
8
|
]
|
sarvamai/types/__init__.py
CHANGED
|
@@ -34,6 +34,21 @@ from .connection_sample_rate import ConnectionSampleRate
|
|
|
34
34
|
from .create_chat_completion_response import CreateChatCompletionResponse
|
|
35
35
|
from .diarized_entry import DiarizedEntry
|
|
36
36
|
from .diarized_transcript import DiarizedTranscript
|
|
37
|
+
from .doc_digitization_create_job_response import DocDigitizationCreateJobResponse
|
|
38
|
+
from .doc_digitization_download_files_response import DocDigitizationDownloadFilesResponse
|
|
39
|
+
from .doc_digitization_error_code import DocDigitizationErrorCode
|
|
40
|
+
from .doc_digitization_error_details import DocDigitizationErrorDetails
|
|
41
|
+
from .doc_digitization_error_message import DocDigitizationErrorMessage
|
|
42
|
+
from .doc_digitization_job_detail import DocDigitizationJobDetail
|
|
43
|
+
from .doc_digitization_job_detail_state import DocDigitizationJobDetailState
|
|
44
|
+
from .doc_digitization_job_parameters import DocDigitizationJobParameters
|
|
45
|
+
from .doc_digitization_job_state import DocDigitizationJobState
|
|
46
|
+
from .doc_digitization_job_status_response import DocDigitizationJobStatusResponse
|
|
47
|
+
from .doc_digitization_output_format import DocDigitizationOutputFormat
|
|
48
|
+
from .doc_digitization_page_error import DocDigitizationPageError
|
|
49
|
+
from .doc_digitization_supported_language import DocDigitizationSupportedLanguage
|
|
50
|
+
from .doc_digitization_upload_files_response import DocDigitizationUploadFilesResponse
|
|
51
|
+
from .doc_digitization_webhook_callback import DocDigitizationWebhookCallback
|
|
37
52
|
from .error_code import ErrorCode
|
|
38
53
|
from .error_data import ErrorData
|
|
39
54
|
from .error_details import ErrorDetails
|
|
@@ -134,6 +149,21 @@ __all__ = [
|
|
|
134
149
|
"CreateChatCompletionResponse",
|
|
135
150
|
"DiarizedEntry",
|
|
136
151
|
"DiarizedTranscript",
|
|
152
|
+
"DocDigitizationCreateJobResponse",
|
|
153
|
+
"DocDigitizationDownloadFilesResponse",
|
|
154
|
+
"DocDigitizationErrorCode",
|
|
155
|
+
"DocDigitizationErrorDetails",
|
|
156
|
+
"DocDigitizationErrorMessage",
|
|
157
|
+
"DocDigitizationJobDetail",
|
|
158
|
+
"DocDigitizationJobDetailState",
|
|
159
|
+
"DocDigitizationJobParameters",
|
|
160
|
+
"DocDigitizationJobState",
|
|
161
|
+
"DocDigitizationJobStatusResponse",
|
|
162
|
+
"DocDigitizationOutputFormat",
|
|
163
|
+
"DocDigitizationPageError",
|
|
164
|
+
"DocDigitizationSupportedLanguage",
|
|
165
|
+
"DocDigitizationUploadFilesResponse",
|
|
166
|
+
"DocDigitizationWebhookCallback",
|
|
137
167
|
"ErrorCode",
|
|
138
168
|
"ErrorData",
|
|
139
169
|
"ErrorDetails",
|