sarvamai 0.1.23a4__tar.gz → 0.1.23a6__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (245)
  1. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/PKG-INFO +1 -1
  2. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/pyproject.toml +1 -1
  3. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/__init__.py +4 -0
  4. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/client_wrapper.py +2 -2
  5. sarvamai-0.1.23a6/src/sarvamai/requests/speech_to_text_job_parameters.py +73 -0
  6. sarvamai-0.1.23a6/src/sarvamai/requests/speech_to_text_response.py +20 -0
  7. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/speech_to_text_transcription_data.py +14 -0
  8. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/speech_to_text_translate_job_parameters.py +4 -1
  9. sarvamai-0.1.23a6/src/sarvamai/requests/speech_to_text_translate_response.py +20 -0
  10. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/speech_to_text_translate_transcription_data.py +13 -0
  11. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text/client.py +84 -26
  12. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text/raw_client.py +84 -26
  13. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_streaming/__init__.py +2 -0
  14. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_streaming/client.py +117 -18
  15. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_streaming/raw_client.py +117 -18
  16. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_streaming/types/__init__.py +2 -0
  17. sarvamai-0.1.23a6/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_input_audio_codec.py +7 -0
  18. sarvamai-0.1.23a6/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_language_code.py +32 -0
  19. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_mode.py +1 -1
  20. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_translate_streaming/__init__.py +2 -0
  21. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_translate_streaming/client.py +23 -2
  22. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_translate_streaming/raw_client.py +23 -2
  23. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_translate_streaming/types/__init__.py +2 -0
  24. sarvamai-0.1.23a6/src/sarvamai/speech_to_text_translate_streaming/types/speech_to_text_translate_streaming_input_audio_codec.py +7 -0
  25. sarvamai-0.1.23a6/src/sarvamai/types/mode.py +5 -0
  26. sarvamai-0.1.23a6/src/sarvamai/types/speech_to_text_job_parameters.py +85 -0
  27. sarvamai-0.1.23a6/src/sarvamai/types/speech_to_text_language.py +33 -0
  28. sarvamai-0.1.23a6/src/sarvamai/types/speech_to_text_model.py +5 -0
  29. sarvamai-0.1.23a6/src/sarvamai/types/speech_to_text_response.py +32 -0
  30. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/speech_to_text_transcription_data.py +14 -0
  31. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/speech_to_text_translate_job_parameters.py +4 -1
  32. sarvamai-0.1.23a6/src/sarvamai/types/speech_to_text_translate_language.py +32 -0
  33. sarvamai-0.1.23a6/src/sarvamai/types/speech_to_text_translate_model.py +5 -0
  34. sarvamai-0.1.23a4/src/sarvamai/types/speech_to_text_translate_transcription_data.py → sarvamai-0.1.23a6/src/sarvamai/types/speech_to_text_translate_response.py +3 -6
  35. sarvamai-0.1.23a6/src/sarvamai/types/speech_to_text_translate_transcription_data.py +48 -0
  36. sarvamai-0.1.23a4/src/sarvamai/requests/speech_to_text_job_parameters.py +0 -41
  37. sarvamai-0.1.23a4/src/sarvamai/requests/speech_to_text_response.py +0 -28
  38. sarvamai-0.1.23a4/src/sarvamai/requests/speech_to_text_translate_response.py +0 -23
  39. sarvamai-0.1.23a4/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_language_code.py +0 -8
  40. sarvamai-0.1.23a4/src/sarvamai/types/mode.py +0 -7
  41. sarvamai-0.1.23a4/src/sarvamai/types/speech_to_text_job_parameters.py +0 -53
  42. sarvamai-0.1.23a4/src/sarvamai/types/speech_to_text_language.py +0 -10
  43. sarvamai-0.1.23a4/src/sarvamai/types/speech_to_text_model.py +0 -7
  44. sarvamai-0.1.23a4/src/sarvamai/types/speech_to_text_response.py +0 -40
  45. sarvamai-0.1.23a4/src/sarvamai/types/speech_to_text_translate_language.py +0 -8
  46. sarvamai-0.1.23a4/src/sarvamai/types/speech_to_text_translate_model.py +0 -5
  47. sarvamai-0.1.23a4/src/sarvamai/types/speech_to_text_translate_response.py +0 -35
  48. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/README.md +0 -0
  49. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/chat/__init__.py +0 -0
  50. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/chat/client.py +0 -0
  51. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/chat/raw_client.py +0 -0
  52. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/client.py +0 -0
  53. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/__init__.py +0 -0
  54. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/api_error.py +0 -0
  55. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/datetime_utils.py +0 -0
  56. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/events.py +0 -0
  57. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/file.py +0 -0
  58. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/force_multipart.py +0 -0
  59. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/http_client.py +0 -0
  60. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/http_response.py +0 -0
  61. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/jsonable_encoder.py +0 -0
  62. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/pydantic_utilities.py +0 -0
  63. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/query_encoder.py +0 -0
  64. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/remove_none_from_dict.py +0 -0
  65. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/request_options.py +0 -0
  66. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/core/serialization.py +0 -0
  67. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/environment.py +0 -0
  68. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/errors/__init__.py +0 -0
  69. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/errors/bad_request_error.py +0 -0
  70. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/errors/forbidden_error.py +0 -0
  71. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/errors/internal_server_error.py +0 -0
  72. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/errors/service_unavailable_error.py +0 -0
  73. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/errors/too_many_requests_error.py +0 -0
  74. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/errors/unprocessable_entity_error.py +0 -0
  75. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/play.py +0 -0
  76. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/py.typed +0 -0
  77. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/__init__.py +0 -0
  78. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/audio_data.py +0 -0
  79. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/audio_message.py +0 -0
  80. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/audio_output.py +0 -0
  81. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/audio_output_data.py +0 -0
  82. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/base_job_parameters.py +0 -0
  83. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/bulk_job_callback.py +0 -0
  84. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/bulk_job_init_response_v_1.py +0 -0
  85. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/chat_completion_request_assistant_message.py +0 -0
  86. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/chat_completion_request_message.py +0 -0
  87. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/chat_completion_request_system_message.py +0 -0
  88. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/chat_completion_request_user_message.py +0 -0
  89. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/chat_completion_response_message.py +0 -0
  90. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/choice.py +0 -0
  91. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/completion_usage.py +0 -0
  92. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/config_message.py +0 -0
  93. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/configure_connection.py +0 -0
  94. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/configure_connection_data.py +0 -0
  95. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/create_chat_completion_response.py +0 -0
  96. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/diarized_entry.py +0 -0
  97. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/diarized_transcript.py +0 -0
  98. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/error_data.py +0 -0
  99. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/error_details.py +0 -0
  100. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/error_message.py +0 -0
  101. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/error_response.py +0 -0
  102. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/error_response_data.py +0 -0
  103. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/event_response.py +0 -0
  104. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/event_response_data.py +0 -0
  105. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/events_data.py +0 -0
  106. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/file_signed_url_details.py +0 -0
  107. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/files_download_response.py +0 -0
  108. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/files_request.py +0 -0
  109. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/files_upload_response.py +0 -0
  110. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/flush_signal.py +0 -0
  111. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/job_status_v_1_response.py +0 -0
  112. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/language_identification_response.py +0 -0
  113. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/ping_signal.py +0 -0
  114. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/send_text.py +0 -0
  115. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/send_text_data.py +0 -0
  116. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/speech_to_text_response_data.py +0 -0
  117. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/speech_to_text_streaming_response.py +0 -0
  118. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/speech_to_text_translate_response_data.py +0 -0
  119. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/speech_to_text_translate_streaming_response.py +0 -0
  120. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/stop_configuration.py +0 -0
  121. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/stt_flush_signal.py +0 -0
  122. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/task_detail_v_1.py +0 -0
  123. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/task_file_details.py +0 -0
  124. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/text_to_speech_response.py +0 -0
  125. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/timestamps_model.py +0 -0
  126. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/transcription_metrics.py +0 -0
  127. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/translation_response.py +0 -0
  128. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/requests/transliteration_response.py +0 -0
  129. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text/__init__.py +0 -0
  130. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_job/__init__.py +0 -0
  131. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_job/client.py +0 -0
  132. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_job/job.py +0 -0
  133. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_job/raw_client.py +0 -0
  134. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_streaming/socket_client.py +0 -0
  135. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_flush_signal.py +0 -0
  136. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_high_vad_sensitivity.py +0 -0
  137. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_model.py +0 -0
  138. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_vad_signals.py +0 -0
  139. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_translate_job/__init__.py +0 -0
  140. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_translate_job/client.py +0 -0
  141. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_translate_job/job.py +0 -0
  142. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_translate_job/raw_client.py +0 -0
  143. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_translate_streaming/socket_client.py +0 -0
  144. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_translate_streaming/types/speech_to_text_translate_streaming_flush_signal.py +0 -0
  145. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_translate_streaming/types/speech_to_text_translate_streaming_high_vad_sensitivity.py +0 -0
  146. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/speech_to_text_translate_streaming/types/speech_to_text_translate_streaming_vad_signals.py +0 -0
  147. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text/__init__.py +0 -0
  148. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text/client.py +0 -0
  149. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text/raw_client.py +0 -0
  150. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text_to_speech/__init__.py +0 -0
  151. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text_to_speech/client.py +0 -0
  152. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text_to_speech/raw_client.py +0 -0
  153. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text_to_speech_streaming/__init__.py +0 -0
  154. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text_to_speech_streaming/client.py +0 -0
  155. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text_to_speech_streaming/raw_client.py +0 -0
  156. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text_to_speech_streaming/socket_client.py +0 -0
  157. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text_to_speech_streaming/types/__init__.py +0 -0
  158. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text_to_speech_streaming/types/text_to_speech_streaming_model.py +0 -0
  159. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/text_to_speech_streaming/types/text_to_speech_streaming_send_completion_event.py +0 -0
  160. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/__init__.py +0 -0
  161. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/audio_data.py +0 -0
  162. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/audio_message.py +0 -0
  163. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/audio_output.py +0 -0
  164. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/audio_output_data.py +0 -0
  165. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/base_job_parameters.py +0 -0
  166. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/bulk_job_callback.py +0 -0
  167. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/bulk_job_init_response_v_1.py +0 -0
  168. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/chat_completion_request_assistant_message.py +0 -0
  169. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/chat_completion_request_message.py +0 -0
  170. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/chat_completion_request_system_message.py +0 -0
  171. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/chat_completion_request_user_message.py +0 -0
  172. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/chat_completion_response_message.py +0 -0
  173. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/choice.py +0 -0
  174. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/completion_event_flag.py +0 -0
  175. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/completion_usage.py +0 -0
  176. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/config_message.py +0 -0
  177. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/configure_connection.py +0 -0
  178. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/configure_connection_data.py +0 -0
  179. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/configure_connection_data_model.py +0 -0
  180. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/configure_connection_data_output_audio_bitrate.py +0 -0
  181. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/configure_connection_data_output_audio_codec.py +0 -0
  182. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/configure_connection_data_speaker.py +0 -0
  183. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/configure_connection_data_target_language_code.py +0 -0
  184. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/connection_sample_rate.py +0 -0
  185. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/create_chat_completion_response.py +0 -0
  186. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/diarized_entry.py +0 -0
  187. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/diarized_transcript.py +0 -0
  188. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/error_code.py +0 -0
  189. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/error_data.py +0 -0
  190. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/error_details.py +0 -0
  191. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/error_message.py +0 -0
  192. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/error_response.py +0 -0
  193. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/error_response_data.py +0 -0
  194. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/event_response.py +0 -0
  195. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/event_response_data.py +0 -0
  196. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/events_data.py +0 -0
  197. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/events_data_signal_type.py +0 -0
  198. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/file_signed_url_details.py +0 -0
  199. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/files_download_response.py +0 -0
  200. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/files_request.py +0 -0
  201. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/files_upload_response.py +0 -0
  202. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/finish_reason.py +0 -0
  203. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/flush_signal.py +0 -0
  204. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/input_audio_codec.py +0 -0
  205. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/job_state.py +0 -0
  206. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/job_status_v_1_response.py +0 -0
  207. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/language_identification_response.py +0 -0
  208. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/numerals_format.py +0 -0
  209. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/ping_signal.py +0 -0
  210. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/reasoning_effort.py +0 -0
  211. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/response_type.py +0 -0
  212. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/role.py +0 -0
  213. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/sarvam_model_ids.py +0 -0
  214. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/send_text.py +0 -0
  215. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/send_text_data.py +0 -0
  216. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/speech_sample_rate.py +0 -0
  217. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/speech_to_text_response_data.py +0 -0
  218. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/speech_to_text_streaming_response.py +0 -0
  219. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/speech_to_text_translate_response_data.py +0 -0
  220. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/speech_to_text_translate_streaming_response.py +0 -0
  221. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/spoken_form_numerals_format.py +0 -0
  222. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/stop_configuration.py +0 -0
  223. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/storage_container_type.py +0 -0
  224. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/stt_flush_signal.py +0 -0
  225. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/task_detail_v_1.py +0 -0
  226. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/task_file_details.py +0 -0
  227. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/task_state.py +0 -0
  228. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/text_to_speech_language.py +0 -0
  229. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/text_to_speech_model.py +0 -0
  230. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/text_to_speech_output_audio_codec.py +0 -0
  231. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/text_to_speech_response.py +0 -0
  232. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/text_to_speech_speaker.py +0 -0
  233. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/timestamps_model.py +0 -0
  234. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/transcription_metrics.py +0 -0
  235. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/translate_mode.py +0 -0
  236. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/translate_model.py +0 -0
  237. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/translate_source_language.py +0 -0
  238. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/translate_speaker_gender.py +0 -0
  239. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/translate_target_language.py +0 -0
  240. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/translation_response.py +0 -0
  241. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/translatiterate_target_language.py +0 -0
  242. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/transliterate_mode.py +0 -0
  243. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/transliterate_source_language.py +0 -0
  244. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/types/transliteration_response.py +0 -0
  245. {sarvamai-0.1.23a4 → sarvamai-0.1.23a6}/src/sarvamai/version.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: sarvamai
3
- Version: 0.1.23a4
3
+ Version: 0.1.23a6
4
4
  Summary:
5
5
  Requires-Python: >=3.8,<4.0
6
6
  Classifier: Intended Audience :: Developers
@@ -3,7 +3,7 @@ name = "sarvamai"
3
3
 
4
4
  [tool.poetry]
5
5
  name = "sarvamai"
6
- version = "0.1.23a4"
6
+ version = "0.1.23a6"
7
7
  description = ""
8
8
  readme = "README.md"
9
9
  authors = []
@@ -188,6 +188,7 @@ from .requests import (
188
188
  from .speech_to_text_streaming import (
189
189
  SpeechToTextStreamingFlushSignal,
190
190
  SpeechToTextStreamingHighVadSensitivity,
191
+ SpeechToTextStreamingInputAudioCodec,
191
192
  SpeechToTextStreamingLanguageCode,
192
193
  SpeechToTextStreamingMode,
193
194
  SpeechToTextStreamingModel,
@@ -196,6 +197,7 @@ from .speech_to_text_streaming import (
196
197
  from .speech_to_text_translate_streaming import (
197
198
  SpeechToTextTranslateStreamingFlushSignal,
198
199
  SpeechToTextTranslateStreamingHighVadSensitivity,
200
+ SpeechToTextTranslateStreamingInputAudioCodec,
199
201
  SpeechToTextTranslateStreamingVadSignals,
200
202
  )
201
203
  from .text_to_speech_streaming import TextToSpeechStreamingModel, TextToSpeechStreamingSendCompletionEvent
@@ -320,6 +322,7 @@ __all__ = [
320
322
  "SpeechToTextResponseParams",
321
323
  "SpeechToTextStreamingFlushSignal",
322
324
  "SpeechToTextStreamingHighVadSensitivity",
325
+ "SpeechToTextStreamingInputAudioCodec",
323
326
  "SpeechToTextStreamingLanguageCode",
324
327
  "SpeechToTextStreamingMode",
325
328
  "SpeechToTextStreamingModel",
@@ -338,6 +341,7 @@ __all__ = [
338
341
  "SpeechToTextTranslateResponseParams",
339
342
  "SpeechToTextTranslateStreamingFlushSignal",
340
343
  "SpeechToTextTranslateStreamingHighVadSensitivity",
344
+ "SpeechToTextTranslateStreamingInputAudioCodec",
341
345
  "SpeechToTextTranslateStreamingResponse",
342
346
  "SpeechToTextTranslateStreamingResponseParams",
343
347
  "SpeechToTextTranslateStreamingVadSignals",
@@ -23,10 +23,10 @@ class BaseClientWrapper:
23
23
 
24
24
  def get_headers(self) -> typing.Dict[str, str]:
25
25
  headers: typing.Dict[str, str] = {
26
- "User-Agent": "sarvamai/0.1.23a4",
26
+ "User-Agent": "sarvamai/0.1.23a6",
27
27
  "X-Fern-Language": "Python",
28
28
  "X-Fern-SDK-Name": "sarvamai",
29
- "X-Fern-SDK-Version": "0.1.23a4",
29
+ "X-Fern-SDK-Version": "0.1.23a6",
30
30
  **(self.get_custom_headers() or {}),
31
31
  }
32
32
  headers["api-subscription-key"] = self.api_subscription_key
@@ -0,0 +1,73 @@
1
+ # This file was auto-generated by Fern from our API Definition.
2
+
3
+ import typing_extensions
4
+ from ..types.mode import Mode
5
+ from ..types.speech_to_text_model import SpeechToTextModel
6
+ from ..types.speech_to_text_translate_language import SpeechToTextTranslateLanguage
7
+
8
+
9
+ class SpeechToTextJobParametersParams(typing_extensions.TypedDict):
10
+ language_code: typing_extensions.NotRequired[SpeechToTextTranslateLanguage]
11
+ """
12
+ Specifies the language of the input audio in BCP-47 format.
13
+
14
+ **Available Options:**
15
+ - `unknown` (default): Use when the language is not known; the API will auto-detect.
16
+ - `hi-IN`: Hindi
17
+ - `bn-IN`: Bengali
18
+ - `kn-IN`: Kannada
19
+ - `ml-IN`: Malayalam
20
+ - `mr-IN`: Marathi
21
+ - `od-IN`: Odia
22
+ - `pa-IN`: Punjabi
23
+ - `ta-IN`: Tamil
24
+ - `te-IN`: Telugu
25
+ - `en-IN`: English
26
+ - `gu-IN`: Gujarati
27
+ """
28
+
29
+ model: typing_extensions.NotRequired[SpeechToTextModel]
30
+ """
31
+ Model to be used for speech to text.
32
+
33
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
34
+
35
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
36
+ """
37
+
38
+ mode: typing_extensions.NotRequired[Mode]
39
+ """
40
+ Mode of operation. **Only applicable when using saaras:v3 model.**
41
+
42
+ Example audio: 'मेरा फोन नंबर है 9840950950'
43
+
44
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
45
+ - Output: `मेरा फोन नंबर है 9840950950`
46
+
47
+ - **translate**: Translates speech from any supported Indic language to English.
48
+ - Output: `My phone number is 9840950950`
49
+
50
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
51
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
52
+
53
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
54
+ - Output: `mera phone number hai 9840950950`
55
+
56
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
57
+ - Output: `मेरा phone number है 9840950950`
58
+ """
59
+
60
+ with_timestamps: typing_extensions.NotRequired[bool]
61
+ """
62
+ Whether to include timestamps in the response
63
+ """
64
+
65
+ with_diarization: typing_extensions.NotRequired[bool]
66
+ """
67
+ Enables speaker diarization, which identifies and separates different speakers in the audio. In beta mode
68
+ """
69
+
70
+ num_speakers: typing_extensions.NotRequired[int]
71
+ """
72
+ Number of speakers to be detected in the audio. This is used when with_diarization is true.
73
+ """
@@ -0,0 +1,20 @@
1
+ # This file was auto-generated by Fern from our API Definition.
2
+
3
+ import typing_extensions
4
+
5
+
6
+ class SpeechToTextResponseParams(typing_extensions.TypedDict):
7
+ request_id: str
8
+ """
9
+ Unique identifier for the request
10
+ """
11
+
12
+ transcript: str
13
+ """
14
+ The transcribed text from the provided audio file.
15
+ """
16
+
17
+ language_code: str
18
+ """
19
+ The BCP-47 code of language spoken in the input (e.g., hi-IN, en-IN). If multiple languages are detected, returns the most predominant spoken language.
20
+ """
@@ -32,4 +32,18 @@ class SpeechToTextTranscriptionDataParams(typing_extensions.TypedDict):
32
32
  BCP-47 code of detected language
33
33
  """
34
34
 
35
+ language_probability: typing_extensions.NotRequired[float]
36
+ """
37
+ Float value (0.0 to 1.0) indicating the probability of the detected language being correct. Higher values indicate higher confidence.
38
+
39
+ **When it returns a value:**
40
+ - When `language_code` is not provided in the request
41
+ - When `language_code` is set to `unknown`
42
+
43
+ **When it returns null:**
44
+ - When a specific `language_code` is provided (language detection is skipped)
45
+
46
+ The parameter is always present in the response.
47
+ """
48
+
35
49
  metrics: TranscriptionMetricsParams
@@ -12,7 +12,10 @@ class SpeechToTextTranslateJobParametersParams(typing_extensions.TypedDict):
12
12
 
13
13
  model: typing_extensions.NotRequired[SpeechToTextTranslateModel]
14
14
  """
15
- Model to be used for converting speech to text in target language
15
+ Model to be used for speech to text translation.
16
+
17
+ - **saaras:v2.5** (default): Translation model that translates audio from any spoken Indic language to English.
18
+ - Example: Hindi audio → English text output
16
19
  """
17
20
 
18
21
  with_diarization: typing_extensions.NotRequired[bool]
@@ -0,0 +1,20 @@
1
+ # This file was auto-generated by Fern from our API Definition.
2
+
3
+ import typing_extensions
4
+
5
+
6
+ class SpeechToTextTranslateResponseParams(typing_extensions.TypedDict):
7
+ request_id: str
8
+ """
9
+ Unique identifier for the request
10
+ """
11
+
12
+ transcript: str
13
+ """
14
+ English translation of the provided speech
15
+ """
16
+
17
+ language_code: str
18
+ """
19
+ The BCP-47 code of the detected source language spoken in the input (e.g., hi-IN, kn-IN).
20
+ """
@@ -20,4 +20,17 @@ class SpeechToTextTranslateTranscriptionDataParams(typing_extensions.TypedDict):
20
20
  BCP-47 code of detected source language (null when language detection is in progress)
21
21
  """
22
22
 
23
+ language_probability: typing_extensions.NotRequired[float]
24
+ """
25
+ Float value (0.0 to 1.0) indicating the probability of the detected source language being correct. Higher values indicate higher confidence.
26
+
27
+ **When it returns a value:**
28
+ - Whenever a detection confidence is available (the source language is always auto-detected for translation)
29
+
30
+ **When it returns null:**
31
+ - When language detection confidence is unavailable
32
+
33
+ The parameter is always present in the response.
34
+ """
35
+
23
36
  metrics: TranscriptionMetricsParams
@@ -65,23 +65,49 @@ class SpeechToTextClient:
65
65
 
66
66
  model : typing.Optional[SpeechToTextModel]
67
67
  Specifies the model to use for speech-to-text conversion.
68
- - **saarika:v2.5** (default): Standard transcription model
69
- - **saarika:v3**: Advanced transcription model
70
- - **saaras:v3**: Advanced model with multiple output modes
68
+
69
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
70
+
71
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
71
72
 
72
73
  mode : typing.Optional[Mode]
73
74
  Mode of operation. **Only applicable when using saaras:v3 model.**
74
- - **transcribe** (default): Standard transcription
75
- - **translate**: Translation to English
76
- - **indic-en**: Indic to English translation
77
- - **verbatim**: Exact transcription
78
- - **translit**: Transliteration to Latin script
79
- - **codemix**: Code-mixed output
75
+
76
+ Example audio: 'मेरा फोन नंबर है 9840950950'
77
+
78
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
79
+ - Output: `मेरा फोन नंबर है 9840950950`
80
+
81
+ - **translate**: Translates speech from any supported Indic language to English.
82
+ - Output: `My phone number is 9840950950`
83
+
84
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
85
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
86
+
87
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
88
+ - Output: `mera phone number hai 9840950950`
89
+
90
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
91
+ - Output: `मेरा phone number है 9840950950`
80
92
 
81
93
  language_code : typing.Optional[SpeechToTextLanguage]
82
- Specifies the language of the input audio.
83
- For the `saarika:v2.5` model, it is optional.
84
- `unknown`: Use this when the language is not known; the API will detect it automatically.
94
+ Specifies the language of the input audio in BCP-47 format.
95
+
96
+ **Note:** This parameter is optional for the `saarika:v2.5` model.
97
+
98
+ **Available Options:**
99
+ - `unknown`: Use when the language is not known; the API will auto-detect.
100
+ - `hi-IN`: Hindi
101
+ - `bn-IN`: Bengali
102
+ - `kn-IN`: Kannada
103
+ - `ml-IN`: Malayalam
104
+ - `mr-IN`: Marathi
105
+ - `od-IN`: Odia
106
+ - `pa-IN`: Punjabi
107
+ - `ta-IN`: Tamil
108
+ - `te-IN`: Telugu
109
+ - `en-IN`: English
110
+ - `gu-IN`: Gujarati
85
111
 
86
112
  input_audio_codec : typing.Optional[InputAudioCodec]
87
113
  Input Audio codec/format of the input file. PCM files are supported only at 16kHz sample rate.
@@ -146,7 +172,10 @@ class SpeechToTextClient:
146
172
  Conversation context can be passed as a prompt to boost model accuracy. However, the current system is at an experimentation stage and doesn't match the prompt performance of large language models.
147
173
 
148
174
  model : typing.Optional[SpeechToTextTranslateModel]
149
- Model to be used for converting speech to text in target language
175
+ Model to be used for speech to text translation.
176
+
177
+ - **saaras:v2.5** (default): Translation model that translates audio from any spoken Indic language to English.
178
+ - Example: Hindi audio → English text output
150
179
 
151
180
  input_audio_codec : typing.Optional[InputAudioCodec]
152
181
  Audio codec/format of the input file. Our API automatically detects all codec formats, but for PCM files specifically (pcm_s16le, pcm_l16, pcm_raw), you must pass this parameter. PCM files are supported only at 16kHz sample rate.
@@ -221,23 +250,49 @@ class AsyncSpeechToTextClient:
221
250
 
222
251
  model : typing.Optional[SpeechToTextModel]
223
252
  Specifies the model to use for speech-to-text conversion.
224
- - **saarika:v2.5** (default): Standard transcription model
225
- - **saarika:v3**: Advanced transcription model
226
- - **saaras:v3**: Advanced model with multiple output modes
253
+
254
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
255
+
256
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
227
257
 
228
258
  mode : typing.Optional[Mode]
229
259
  Mode of operation. **Only applicable when using saaras:v3 model.**
230
- - **transcribe** (default): Standard transcription
231
- - **translate**: Translation to English
232
- - **indic-en**: Indic to English translation
233
- - **verbatim**: Exact transcription
234
- - **translit**: Transliteration to Latin script
235
- - **codemix**: Code-mixed output
260
+
261
+ Example audio: 'मेरा फोन नंबर है 9840950950'
262
+
263
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
264
+ - Output: `मेरा फोन नंबर है 9840950950`
265
+
266
+ - **translate**: Translates speech from any supported Indic language to English.
267
+ - Output: `My phone number is 9840950950`
268
+
269
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
270
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
271
+
272
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
273
+ - Output: `mera phone number hai 9840950950`
274
+
275
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
276
+ - Output: `मेरा phone number है 9840950950`
236
277
 
237
278
  language_code : typing.Optional[SpeechToTextLanguage]
238
- Specifies the language of the input audio.
239
- For the `saarika:v2.5` model, it is optional.
240
- `unknown`: Use this when the language is not known; the API will detect it automatically.
279
+ Specifies the language of the input audio in BCP-47 format.
280
+
281
+ **Note:** This parameter is optional for the `saarika:v2.5` model.
282
+
283
+ **Available Options:**
284
+ - `unknown`: Use when the language is not known; the API will auto-detect.
285
+ - `hi-IN`: Hindi
286
+ - `bn-IN`: Bengali
287
+ - `kn-IN`: Kannada
288
+ - `ml-IN`: Malayalam
289
+ - `mr-IN`: Marathi
290
+ - `od-IN`: Odia
291
+ - `pa-IN`: Punjabi
292
+ - `ta-IN`: Tamil
293
+ - `te-IN`: Telugu
294
+ - `en-IN`: English
295
+ - `gu-IN`: Gujarati
241
296
 
242
297
  input_audio_codec : typing.Optional[InputAudioCodec]
243
298
  Input Audio codec/format of the input file. PCM files are supported only at 16kHz sample rate.
@@ -310,7 +365,10 @@ class AsyncSpeechToTextClient:
310
365
  Conversation context can be passed as a prompt to boost model accuracy. However, the current system is at an experimentation stage and doesn't match the prompt performance of large language models.
311
366
 
312
367
  model : typing.Optional[SpeechToTextTranslateModel]
313
- Model to be used for converting speech to text in target language
368
+ Model to be used for speech to text translation.
369
+
370
+ - **saaras:v2.5** (default): Translation model that translates audio from any spoken Indic language to English.
371
+ - Example: Hindi audio → English text output
314
372
 
315
373
  input_audio_codec : typing.Optional[InputAudioCodec]
316
374
  Audio codec/format of the input file. Our API automatically detects all codec formats, but for PCM files specifically (pcm_s16le, pcm_l16, pcm_raw), you must pass this parameter. PCM files are supported only at 16kHz sample rate.
@@ -63,23 +63,49 @@ class RawSpeechToTextClient:
63
63
 
64
64
  model : typing.Optional[SpeechToTextModel]
65
65
  Specifies the model to use for speech-to-text conversion.
66
- - **saarika:v2.5** (default): Standard transcription model
67
- - **saarika:v3**: Advanced transcription model
68
- - **saaras:v3**: Advanced model with multiple output modes
66
+
67
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
68
+
69
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
69
70
 
70
71
  mode : typing.Optional[Mode]
71
72
  Mode of operation. **Only applicable when using saaras:v3 model.**
72
- - **transcribe** (default): Standard transcription
73
- - **translate**: Translation to English
74
- - **indic-en**: Indic to English translation
75
- - **verbatim**: Exact transcription
76
- - **translit**: Transliteration to Latin script
77
- - **codemix**: Code-mixed output
73
+
74
+ Example audio: 'मेरा फोन नंबर है 9840950950'
75
+
76
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
77
+ - Output: `मेरा फोन नंबर है 9840950950`
78
+
79
+ - **translate**: Translates speech from any supported Indic language to English.
80
+ - Output: `My phone number is 9840950950`
81
+
82
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
83
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
84
+
85
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
86
+ - Output: `mera phone number hai 9840950950`
87
+
88
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
89
+ - Output: `मेरा phone number है 9840950950`
78
90
 
79
91
  language_code : typing.Optional[SpeechToTextLanguage]
80
- Specifies the language of the input audio.
81
- For the `saarika:v2.5` model, it is optional.
82
- `unknown`: Use this when the language is not known; the API will detect it automatically.
92
+ Specifies the language of the input audio in BCP-47 format.
93
+
94
+ **Note:** This parameter is optional for the `saarika:v2.5` model.
95
+
96
+ **Available Options:**
97
+ - `unknown`: Use when the language is not known; the API will auto-detect.
98
+ - `hi-IN`: Hindi
99
+ - `bn-IN`: Bengali
100
+ - `kn-IN`: Kannada
101
+ - `ml-IN`: Malayalam
102
+ - `mr-IN`: Marathi
103
+ - `od-IN`: Odia
104
+ - `pa-IN`: Punjabi
105
+ - `ta-IN`: Tamil
106
+ - `te-IN`: Telugu
107
+ - `en-IN`: English
108
+ - `gu-IN`: Gujarati
83
109
 
84
110
  input_audio_codec : typing.Optional[InputAudioCodec]
85
111
  Input Audio codec/format of the input file. PCM files are supported only at 16kHz sample rate.
@@ -223,7 +249,10 @@ class RawSpeechToTextClient:
223
249
  Conversation context can be passed as a prompt to boost model accuracy. However, the current system is at an experimentation stage and doesn't match the prompt performance of large language models.
224
250
 
225
251
  model : typing.Optional[SpeechToTextTranslateModel]
226
- Model to be used for converting speech to text in target language
252
+ Model to be used for speech to text translation.
253
+
254
+ - **saaras:v2.5** (default): Translation model that translates audio from any spoken Indic language to English.
255
+ - Example: Hindi audio → English text output
227
256
 
228
257
  input_audio_codec : typing.Optional[InputAudioCodec]
229
258
  Audio codec/format of the input file. Our API automatically detects all codec formats, but for PCM files specifically (pcm_s16le, pcm_l16, pcm_raw), you must pass this parameter. PCM files are supported only at 16kHz sample rate.
@@ -370,23 +399,49 @@ class AsyncRawSpeechToTextClient:
370
399
 
371
400
  model : typing.Optional[SpeechToTextModel]
372
401
  Specifies the model to use for speech-to-text conversion.
373
- - **saarika:v2.5** (default): Standard transcription model
374
- - **saarika:v3**: Advanced transcription model
375
- - **saaras:v3**: Advanced model with multiple output modes
402
+
403
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
404
+
405
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
376
406
 
377
407
  mode : typing.Optional[Mode]
378
408
  Mode of operation. **Only applicable when using saaras:v3 model.**
379
- - **transcribe** (default): Standard transcription
380
- - **translate**: Translation to English
381
- - **indic-en**: Indic to English translation
382
- - **verbatim**: Exact transcription
383
- - **translit**: Transliteration to Latin script
384
- - **codemix**: Code-mixed output
409
+
410
+ Example audio: 'मेरा फोन नंबर है 9840950950'
411
+
412
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
413
+ - Output: `मेरा फोन नंबर है 9840950950`
414
+
415
+ - **translate**: Translates speech from any supported Indic language to English.
416
+ - Output: `My phone number is 9840950950`
417
+
418
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
419
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
420
+
421
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
422
+ - Output: `mera phone number hai 9840950950`
423
+
424
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
425
+ - Output: `मेरा phone number है 9840950950`
385
426
 
386
427
  language_code : typing.Optional[SpeechToTextLanguage]
387
- Specifies the language of the input audio.
388
- For the `saarika:v2.5` model, it is optional.
389
- `unknown`: Use this when the language is not known; the API will detect it automatically.
428
+ Specifies the language of the input audio in BCP-47 format.
429
+
430
+ **Note:** This parameter is optional for the `saarika:v2.5` model.
431
+
432
+ **Available Options:**
433
+ - `unknown`: Use when the language is not known; the API will auto-detect.
434
+ - `hi-IN`: Hindi
435
+ - `bn-IN`: Bengali
436
+ - `kn-IN`: Kannada
437
+ - `ml-IN`: Malayalam
438
+ - `mr-IN`: Marathi
439
+ - `od-IN`: Odia
440
+ - `pa-IN`: Punjabi
441
+ - `ta-IN`: Tamil
442
+ - `te-IN`: Telugu
443
+ - `en-IN`: English
444
+ - `gu-IN`: Gujarati
390
445
 
391
446
  input_audio_codec : typing.Optional[InputAudioCodec]
392
447
  Input Audio codec/format of the input file. PCM files are supported only at 16kHz sample rate.
@@ -530,7 +585,10 @@ class AsyncRawSpeechToTextClient:
530
585
  Conversation context can be passed as a prompt to boost model accuracy. However, the current system is at an experimentation stage and doesn't match the prompt performance of large language models.
531
586
 
532
587
  model : typing.Optional[SpeechToTextTranslateModel]
533
- Model to be used for converting speech to text in target language
588
+ Model to be used for speech to text translation.
589
+
590
+ - **saaras:v2.5** (default): Translation model that translates audio from any spoken Indic language to English.
591
+ - Example: Hindi audio → English text output
534
592
 
535
593
  input_audio_codec : typing.Optional[InputAudioCodec]
536
594
  Audio codec/format of the input file. Our API automatically detects all codec formats, but for PCM files specifically (pcm_s16le, pcm_l16, pcm_raw), you must pass this parameter. PCM files are supported only at 16kHz sample rate.
@@ -5,6 +5,7 @@
5
5
  from .types import (
6
6
  SpeechToTextStreamingFlushSignal,
7
7
  SpeechToTextStreamingHighVadSensitivity,
8
+ SpeechToTextStreamingInputAudioCodec,
8
9
  SpeechToTextStreamingLanguageCode,
9
10
  SpeechToTextStreamingMode,
10
11
  SpeechToTextStreamingModel,
@@ -14,6 +15,7 @@ from .types import (
14
15
  __all__ = [
15
16
  "SpeechToTextStreamingFlushSignal",
16
17
  "SpeechToTextStreamingHighVadSensitivity",
18
+ "SpeechToTextStreamingInputAudioCodec",
17
19
  "SpeechToTextStreamingLanguageCode",
18
20
  "SpeechToTextStreamingMode",
19
21
  "SpeechToTextStreamingModel",