sarvamai 0.1.23a4__tar.gz → 0.1.23a5__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (236)
  1. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/PKG-INFO +1 -1
  2. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/pyproject.toml +1 -1
  3. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/client_wrapper.py +2 -2
  4. sarvamai-0.1.23a5/src/sarvamai/requests/speech_to_text_job_parameters.py +73 -0
  5. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/speech_to_text_translate_job_parameters.py +4 -1
  6. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text/client.py +84 -26
  7. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text/raw_client.py +84 -26
  8. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_streaming/client.py +74 -18
  9. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_streaming/raw_client.py +74 -18
  10. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_mode.py +1 -1
  11. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_translate_streaming/client.py +8 -2
  12. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_translate_streaming/raw_client.py +8 -2
  13. sarvamai-0.1.23a5/src/sarvamai/types/mode.py +5 -0
  14. sarvamai-0.1.23a5/src/sarvamai/types/speech_to_text_job_parameters.py +85 -0
  15. sarvamai-0.1.23a5/src/sarvamai/types/speech_to_text_model.py +5 -0
  16. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/speech_to_text_translate_job_parameters.py +4 -1
  17. sarvamai-0.1.23a5/src/sarvamai/types/speech_to_text_translate_model.py +5 -0
  18. sarvamai-0.1.23a4/src/sarvamai/requests/speech_to_text_job_parameters.py +0 -41
  19. sarvamai-0.1.23a4/src/sarvamai/types/mode.py +0 -7
  20. sarvamai-0.1.23a4/src/sarvamai/types/speech_to_text_job_parameters.py +0 -53
  21. sarvamai-0.1.23a4/src/sarvamai/types/speech_to_text_model.py +0 -7
  22. sarvamai-0.1.23a4/src/sarvamai/types/speech_to_text_translate_model.py +0 -5
  23. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/README.md +0 -0
  24. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/__init__.py +0 -0
  25. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/chat/__init__.py +0 -0
  26. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/chat/client.py +0 -0
  27. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/chat/raw_client.py +0 -0
  28. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/client.py +0 -0
  29. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/__init__.py +0 -0
  30. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/api_error.py +0 -0
  31. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/datetime_utils.py +0 -0
  32. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/events.py +0 -0
  33. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/file.py +0 -0
  34. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/force_multipart.py +0 -0
  35. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/http_client.py +0 -0
  36. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/http_response.py +0 -0
  37. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/jsonable_encoder.py +0 -0
  38. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/pydantic_utilities.py +0 -0
  39. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/query_encoder.py +0 -0
  40. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/remove_none_from_dict.py +0 -0
  41. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/request_options.py +0 -0
  42. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/core/serialization.py +0 -0
  43. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/environment.py +0 -0
  44. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/errors/__init__.py +0 -0
  45. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/errors/bad_request_error.py +0 -0
  46. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/errors/forbidden_error.py +0 -0
  47. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/errors/internal_server_error.py +0 -0
  48. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/errors/service_unavailable_error.py +0 -0
  49. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/errors/too_many_requests_error.py +0 -0
  50. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/errors/unprocessable_entity_error.py +0 -0
  51. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/play.py +0 -0
  52. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/py.typed +0 -0
  53. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/__init__.py +0 -0
  54. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/audio_data.py +0 -0
  55. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/audio_message.py +0 -0
  56. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/audio_output.py +0 -0
  57. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/audio_output_data.py +0 -0
  58. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/base_job_parameters.py +0 -0
  59. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/bulk_job_callback.py +0 -0
  60. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/bulk_job_init_response_v_1.py +0 -0
  61. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/chat_completion_request_assistant_message.py +0 -0
  62. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/chat_completion_request_message.py +0 -0
  63. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/chat_completion_request_system_message.py +0 -0
  64. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/chat_completion_request_user_message.py +0 -0
  65. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/chat_completion_response_message.py +0 -0
  66. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/choice.py +0 -0
  67. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/completion_usage.py +0 -0
  68. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/config_message.py +0 -0
  69. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/configure_connection.py +0 -0
  70. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/configure_connection_data.py +0 -0
  71. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/create_chat_completion_response.py +0 -0
  72. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/diarized_entry.py +0 -0
  73. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/diarized_transcript.py +0 -0
  74. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/error_data.py +0 -0
  75. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/error_details.py +0 -0
  76. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/error_message.py +0 -0
  77. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/error_response.py +0 -0
  78. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/error_response_data.py +0 -0
  79. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/event_response.py +0 -0
  80. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/event_response_data.py +0 -0
  81. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/events_data.py +0 -0
  82. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/file_signed_url_details.py +0 -0
  83. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/files_download_response.py +0 -0
  84. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/files_request.py +0 -0
  85. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/files_upload_response.py +0 -0
  86. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/flush_signal.py +0 -0
  87. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/job_status_v_1_response.py +0 -0
  88. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/language_identification_response.py +0 -0
  89. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/ping_signal.py +0 -0
  90. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/send_text.py +0 -0
  91. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/send_text_data.py +0 -0
  92. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/speech_to_text_response.py +0 -0
  93. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/speech_to_text_response_data.py +0 -0
  94. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/speech_to_text_streaming_response.py +0 -0
  95. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/speech_to_text_transcription_data.py +0 -0
  96. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/speech_to_text_translate_response.py +0 -0
  97. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/speech_to_text_translate_response_data.py +0 -0
  98. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/speech_to_text_translate_streaming_response.py +0 -0
  99. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/speech_to_text_translate_transcription_data.py +0 -0
  100. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/stop_configuration.py +0 -0
  101. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/stt_flush_signal.py +0 -0
  102. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/task_detail_v_1.py +0 -0
  103. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/task_file_details.py +0 -0
  104. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/text_to_speech_response.py +0 -0
  105. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/timestamps_model.py +0 -0
  106. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/transcription_metrics.py +0 -0
  107. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/translation_response.py +0 -0
  108. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/requests/transliteration_response.py +0 -0
  109. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text/__init__.py +0 -0
  110. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_job/__init__.py +0 -0
  111. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_job/client.py +0 -0
  112. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_job/job.py +0 -0
  113. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_job/raw_client.py +0 -0
  114. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_streaming/__init__.py +0 -0
  115. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_streaming/socket_client.py +0 -0
  116. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_streaming/types/__init__.py +0 -0
  117. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_flush_signal.py +0 -0
  118. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_high_vad_sensitivity.py +0 -0
  119. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_language_code.py +0 -0
  120. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_model.py +0 -0
  121. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_streaming/types/speech_to_text_streaming_vad_signals.py +0 -0
  122. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_translate_job/__init__.py +0 -0
  123. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_translate_job/client.py +0 -0
  124. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_translate_job/job.py +0 -0
  125. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_translate_job/raw_client.py +0 -0
  126. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_translate_streaming/__init__.py +0 -0
  127. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_translate_streaming/socket_client.py +0 -0
  128. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_translate_streaming/types/__init__.py +0 -0
  129. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_translate_streaming/types/speech_to_text_translate_streaming_flush_signal.py +0 -0
  130. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_translate_streaming/types/speech_to_text_translate_streaming_high_vad_sensitivity.py +0 -0
  131. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/speech_to_text_translate_streaming/types/speech_to_text_translate_streaming_vad_signals.py +0 -0
  132. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text/__init__.py +0 -0
  133. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text/client.py +0 -0
  134. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text/raw_client.py +0 -0
  135. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text_to_speech/__init__.py +0 -0
  136. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text_to_speech/client.py +0 -0
  137. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text_to_speech/raw_client.py +0 -0
  138. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text_to_speech_streaming/__init__.py +0 -0
  139. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text_to_speech_streaming/client.py +0 -0
  140. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text_to_speech_streaming/raw_client.py +0 -0
  141. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text_to_speech_streaming/socket_client.py +0 -0
  142. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text_to_speech_streaming/types/__init__.py +0 -0
  143. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text_to_speech_streaming/types/text_to_speech_streaming_model.py +0 -0
  144. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/text_to_speech_streaming/types/text_to_speech_streaming_send_completion_event.py +0 -0
  145. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/__init__.py +0 -0
  146. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/audio_data.py +0 -0
  147. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/audio_message.py +0 -0
  148. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/audio_output.py +0 -0
  149. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/audio_output_data.py +0 -0
  150. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/base_job_parameters.py +0 -0
  151. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/bulk_job_callback.py +0 -0
  152. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/bulk_job_init_response_v_1.py +0 -0
  153. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/chat_completion_request_assistant_message.py +0 -0
  154. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/chat_completion_request_message.py +0 -0
  155. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/chat_completion_request_system_message.py +0 -0
  156. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/chat_completion_request_user_message.py +0 -0
  157. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/chat_completion_response_message.py +0 -0
  158. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/choice.py +0 -0
  159. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/completion_event_flag.py +0 -0
  160. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/completion_usage.py +0 -0
  161. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/config_message.py +0 -0
  162. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/configure_connection.py +0 -0
  163. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/configure_connection_data.py +0 -0
  164. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/configure_connection_data_model.py +0 -0
  165. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/configure_connection_data_output_audio_bitrate.py +0 -0
  166. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/configure_connection_data_output_audio_codec.py +0 -0
  167. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/configure_connection_data_speaker.py +0 -0
  168. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/configure_connection_data_target_language_code.py +0 -0
  169. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/connection_sample_rate.py +0 -0
  170. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/create_chat_completion_response.py +0 -0
  171. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/diarized_entry.py +0 -0
  172. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/diarized_transcript.py +0 -0
  173. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/error_code.py +0 -0
  174. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/error_data.py +0 -0
  175. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/error_details.py +0 -0
  176. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/error_message.py +0 -0
  177. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/error_response.py +0 -0
  178. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/error_response_data.py +0 -0
  179. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/event_response.py +0 -0
  180. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/event_response_data.py +0 -0
  181. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/events_data.py +0 -0
  182. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/events_data_signal_type.py +0 -0
  183. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/file_signed_url_details.py +0 -0
  184. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/files_download_response.py +0 -0
  185. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/files_request.py +0 -0
  186. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/files_upload_response.py +0 -0
  187. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/finish_reason.py +0 -0
  188. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/flush_signal.py +0 -0
  189. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/input_audio_codec.py +0 -0
  190. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/job_state.py +0 -0
  191. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/job_status_v_1_response.py +0 -0
  192. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/language_identification_response.py +0 -0
  193. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/numerals_format.py +0 -0
  194. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/ping_signal.py +0 -0
  195. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/reasoning_effort.py +0 -0
  196. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/response_type.py +0 -0
  197. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/role.py +0 -0
  198. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/sarvam_model_ids.py +0 -0
  199. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/send_text.py +0 -0
  200. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/send_text_data.py +0 -0
  201. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/speech_sample_rate.py +0 -0
  202. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/speech_to_text_language.py +0 -0
  203. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/speech_to_text_response.py +0 -0
  204. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/speech_to_text_response_data.py +0 -0
  205. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/speech_to_text_streaming_response.py +0 -0
  206. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/speech_to_text_transcription_data.py +0 -0
  207. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/speech_to_text_translate_language.py +0 -0
  208. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/speech_to_text_translate_response.py +0 -0
  209. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/speech_to_text_translate_response_data.py +0 -0
  210. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/speech_to_text_translate_streaming_response.py +0 -0
  211. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/speech_to_text_translate_transcription_data.py +0 -0
  212. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/spoken_form_numerals_format.py +0 -0
  213. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/stop_configuration.py +0 -0
  214. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/storage_container_type.py +0 -0
  215. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/stt_flush_signal.py +0 -0
  216. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/task_detail_v_1.py +0 -0
  217. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/task_file_details.py +0 -0
  218. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/task_state.py +0 -0
  219. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/text_to_speech_language.py +0 -0
  220. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/text_to_speech_model.py +0 -0
  221. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/text_to_speech_output_audio_codec.py +0 -0
  222. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/text_to_speech_response.py +0 -0
  223. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/text_to_speech_speaker.py +0 -0
  224. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/timestamps_model.py +0 -0
  225. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/transcription_metrics.py +0 -0
  226. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/translate_mode.py +0 -0
  227. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/translate_model.py +0 -0
  228. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/translate_source_language.py +0 -0
  229. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/translate_speaker_gender.py +0 -0
  230. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/translate_target_language.py +0 -0
  231. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/translation_response.py +0 -0
  232. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/translatiterate_target_language.py +0 -0
  233. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/transliterate_mode.py +0 -0
  234. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/transliterate_source_language.py +0 -0
  235. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/types/transliteration_response.py +0 -0
  236. {sarvamai-0.1.23a4 → sarvamai-0.1.23a5}/src/sarvamai/version.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: sarvamai
3
- Version: 0.1.23a4
3
+ Version: 0.1.23a5
4
4
  Summary:
5
5
  Requires-Python: >=3.8,<4.0
6
6
  Classifier: Intended Audience :: Developers
@@ -3,7 +3,7 @@ name = "sarvamai"
3
3
 
4
4
  [tool.poetry]
5
5
  name = "sarvamai"
6
- version = "0.1.23a4"
6
+ version = "0.1.23a5"
7
7
  description = ""
8
8
  readme = "README.md"
9
9
  authors = []
@@ -23,10 +23,10 @@ class BaseClientWrapper:
23
23
 
24
24
  def get_headers(self) -> typing.Dict[str, str]:
25
25
  headers: typing.Dict[str, str] = {
26
- "User-Agent": "sarvamai/0.1.23a4",
26
+ "User-Agent": "sarvamai/0.1.23a5",
27
27
  "X-Fern-Language": "Python",
28
28
  "X-Fern-SDK-Name": "sarvamai",
29
- "X-Fern-SDK-Version": "0.1.23a4",
29
+ "X-Fern-SDK-Version": "0.1.23a5",
30
30
  **(self.get_custom_headers() or {}),
31
31
  }
32
32
  headers["api-subscription-key"] = self.api_subscription_key
@@ -0,0 +1,73 @@
1
+ # This file was auto-generated by Fern from our API Definition.
2
+
3
+ import typing_extensions
4
+ from ..types.mode import Mode
5
+ from ..types.speech_to_text_model import SpeechToTextModel
6
+ from ..types.speech_to_text_translate_language import SpeechToTextTranslateLanguage
7
+
8
+
9
+ class SpeechToTextJobParametersParams(typing_extensions.TypedDict):
10
+ language_code: typing_extensions.NotRequired[SpeechToTextTranslateLanguage]
11
+ """
12
+ Specifies the language of the input audio in BCP-47 format.
13
+
14
+ **Available Options:**
15
+ - `unknown` (default): Use when the language is not known; the API will auto-detect.
16
+ - `hi-IN`: Hindi
17
+ - `bn-IN`: Bengali
18
+ - `kn-IN`: Kannada
19
+ - `ml-IN`: Malayalam
20
+ - `mr-IN`: Marathi
21
+ - `od-IN`: Odia
22
+ - `pa-IN`: Punjabi
23
+ - `ta-IN`: Tamil
24
+ - `te-IN`: Telugu
25
+ - `en-IN`: English
26
+ - `gu-IN`: Gujarati
27
+ """
28
+
29
+ model: typing_extensions.NotRequired[SpeechToTextModel]
30
+ """
31
+ Model to be used for speech to text.
32
+
33
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
34
+
35
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
36
+ """
37
+
38
+ mode: typing_extensions.NotRequired[Mode]
39
+ """
40
+ Mode of operation. **Only applicable when using saaras:v3 model.**
41
+
42
+ Example audio: 'मेरा फोन नंबर है 9840950950'
43
+
44
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
45
+ - Output: `मेरा फोन नंबर है 9840950950`
46
+
47
+ - **translate**: Translates speech from any supported Indic language to English.
48
+ - Output: `My phone number is 9840950950`
49
+
50
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
51
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
52
+
53
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
54
+ - Output: `mera phone number hai 9840950950`
55
+
56
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
57
+ - Output: `मेरा phone number है 9840950950`
58
+ """
59
+
60
+ with_timestamps: typing_extensions.NotRequired[bool]
61
+ """
62
+ Whether to include timestamps in the response
63
+ """
64
+
65
+ with_diarization: typing_extensions.NotRequired[bool]
66
+ """
67
+ Enables speaker diarization, which identifies and separates different speakers in the audio. In beta mode
68
+ """
69
+
70
+ num_speakers: typing_extensions.NotRequired[int]
71
+ """
72
+ Number of speakers to be detected in the audio. This is used when with_diarization is true.
73
+ """
@@ -12,7 +12,10 @@ class SpeechToTextTranslateJobParametersParams(typing_extensions.TypedDict):
12
12
 
13
13
  model: typing_extensions.NotRequired[SpeechToTextTranslateModel]
14
14
  """
15
- Model to be used for converting speech to text in target language
15
+ Model to be used for speech to text translation.
16
+
17
+ - **saaras:v2.5** (default): Translation model that translates audio from any spoken Indic language to English.
18
+ - Example: Hindi audio → English text output
16
19
  """
17
20
 
18
21
  with_diarization: typing_extensions.NotRequired[bool]
@@ -65,23 +65,49 @@ class SpeechToTextClient:
65
65
 
66
66
  model : typing.Optional[SpeechToTextModel]
67
67
  Specifies the model to use for speech-to-text conversion.
68
- - **saarika:v2.5** (default): Standard transcription model
69
- - **saarika:v3**: Advanced transcription model
70
- - **saaras:v3**: Advanced model with multiple output modes
68
+
69
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
70
+
71
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
71
72
 
72
73
  mode : typing.Optional[Mode]
73
74
  Mode of operation. **Only applicable when using saaras:v3 model.**
74
- - **transcribe** (default): Standard transcription
75
- - **translate**: Translation to English
76
- - **indic-en**: Indic to English translation
77
- - **verbatim**: Exact transcription
78
- - **translit**: Transliteration to Latin script
79
- - **codemix**: Code-mixed output
75
+
76
+ Example audio: 'मेरा फोन नंबर है 9840950950'
77
+
78
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
79
+ - Output: `मेरा फोन नंबर है 9840950950`
80
+
81
+ - **translate**: Translates speech from any supported Indic language to English.
82
+ - Output: `My phone number is 9840950950`
83
+
84
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
85
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
86
+
87
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
88
+ - Output: `mera phone number hai 9840950950`
89
+
90
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
91
+ - Output: `मेरा phone number है 9840950950`
80
92
 
81
93
  language_code : typing.Optional[SpeechToTextLanguage]
82
- Specifies the language of the input audio.
83
- For the `saarika:v2.5` model, it is optional.
84
- `unknown`: Use this when the language is not known; the API will detect it automatically.
94
+ Specifies the language of the input audio in BCP-47 format.
95
+
96
+ **Note:** This parameter is optional for `saarika:v2.5` model.
97
+
98
+ **Available Options:**
99
+ - `unknown`: Use when the language is not known; the API will auto-detect.
100
+ - `hi-IN`: Hindi
101
+ - `bn-IN`: Bengali
102
+ - `kn-IN`: Kannada
103
+ - `ml-IN`: Malayalam
104
+ - `mr-IN`: Marathi
105
+ - `od-IN`: Odia
106
+ - `pa-IN`: Punjabi
107
+ - `ta-IN`: Tamil
108
+ - `te-IN`: Telugu
109
+ - `en-IN`: English
110
+ - `gu-IN`: Gujarati
85
111
 
86
112
  input_audio_codec : typing.Optional[InputAudioCodec]
87
113
  Input Audio codec/format of the input file. PCM files are supported only at 16kHz sample rate.
@@ -146,7 +172,10 @@ class SpeechToTextClient:
146
172
  Conversation context can be passed as a prompt to boost model accuracy. However, the current system is at an experimentation stage and doesn't match the prompt performance of large language models.
147
173
 
148
174
  model : typing.Optional[SpeechToTextTranslateModel]
149
- Model to be used for converting speech to text in target language
175
+ Model to be used for speech to text translation.
176
+
177
+ - **saaras:v2.5** (default): Translation model that translates audio from any spoken Indic language to English.
178
+ - Example: Hindi audio → English text output
150
179
 
151
180
  input_audio_codec : typing.Optional[InputAudioCodec]
152
181
  Audio codec/format of the input file. Our API automatically detects all codec formats, but for PCM files specifically (pcm_s16le, pcm_l16, pcm_raw), you must pass this parameter. PCM files are supported only at 16kHz sample rate.
@@ -221,23 +250,49 @@ class AsyncSpeechToTextClient:
221
250
 
222
251
  model : typing.Optional[SpeechToTextModel]
223
252
  Specifies the model to use for speech-to-text conversion.
224
- - **saarika:v2.5** (default): Standard transcription model
225
- - **saarika:v3**: Advanced transcription model
226
- - **saaras:v3**: Advanced model with multiple output modes
253
+
254
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
255
+
256
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
227
257
 
228
258
  mode : typing.Optional[Mode]
229
259
  Mode of operation. **Only applicable when using saaras:v3 model.**
230
- - **transcribe** (default): Standard transcription
231
- - **translate**: Translation to English
232
- - **indic-en**: Indic to English translation
233
- - **verbatim**: Exact transcription
234
- - **translit**: Transliteration to Latin script
235
- - **codemix**: Code-mixed output
260
+
261
+ Example audio: 'मेरा फोन नंबर है 9840950950'
262
+
263
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
264
+ - Output: `मेरा फोन नंबर है 9840950950`
265
+
266
+ - **translate**: Translates speech from any supported Indic language to English.
267
+ - Output: `My phone number is 9840950950`
268
+
269
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
270
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
271
+
272
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
273
+ - Output: `mera phone number hai 9840950950`
274
+
275
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
276
+ - Output: `मेरा phone number है 9840950950`
236
277
 
237
278
  language_code : typing.Optional[SpeechToTextLanguage]
238
- Specifies the language of the input audio.
239
- For the `saarika:v2.5` model, it is optional.
240
- `unknown`: Use this when the language is not known; the API will detect it automatically.
279
+ Specifies the language of the input audio in BCP-47 format.
280
+
281
+ **Note:** This parameter is optional for the `saarika:v2.5` model.
282
+
283
+ **Available Options:**
284
+ - `unknown`: Use when the language is not known; the API will auto-detect.
285
+ - `hi-IN`: Hindi
286
+ - `bn-IN`: Bengali
287
+ - `kn-IN`: Kannada
288
+ - `ml-IN`: Malayalam
289
+ - `mr-IN`: Marathi
290
+ - `od-IN`: Odia
291
+ - `pa-IN`: Punjabi
292
+ - `ta-IN`: Tamil
293
+ - `te-IN`: Telugu
294
+ - `en-IN`: English
295
+ - `gu-IN`: Gujarati
241
296
 
242
297
  input_audio_codec : typing.Optional[InputAudioCodec]
243
298
  Audio codec/format of the input file. PCM files are supported only at 16kHz sample rate.
@@ -310,7 +365,10 @@ class AsyncSpeechToTextClient:
310
365
  Conversation context can be passed as a prompt to boost model accuracy. However, the current system is at an experimentation stage and doesn't match the prompt performance of large language models.
311
366
 
312
367
  model : typing.Optional[SpeechToTextTranslateModel]
313
- Model to be used for converting speech to text in target language
368
+ Model to be used for speech-to-text translation.
369
+
370
+ - **saaras:v2.5** (default): Translation model that translates audio from any spoken Indic language to English.
371
+ - Example: Hindi audio → English text output
314
372
 
315
373
  input_audio_codec : typing.Optional[InputAudioCodec]
316
374
  Audio codec/format of the input file. Our API automatically detects all codec formats, but for PCM files specifically (pcm_s16le, pcm_l16, pcm_raw), you must pass this parameter. PCM files are supported only at 16kHz sample rate.
@@ -63,23 +63,49 @@ class RawSpeechToTextClient:
63
63
 
64
64
  model : typing.Optional[SpeechToTextModel]
65
65
  Specifies the model to use for speech-to-text conversion.
66
- - **saarika:v2.5** (default): Standard transcription model
67
- - **saarika:v3**: Advanced transcription model
68
- - **saaras:v3**: Advanced model with multiple output modes
66
+
67
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
68
+
69
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
69
70
 
70
71
  mode : typing.Optional[Mode]
71
72
  Mode of operation. **Only applicable when using saaras:v3 model.**
72
- - **transcribe** (default): Standard transcription
73
- - **translate**: Translation to English
74
- - **indic-en**: Indic to English translation
75
- - **verbatim**: Exact transcription
76
- - **translit**: Transliteration to Latin script
77
- - **codemix**: Code-mixed output
73
+
74
+ Example audio: 'मेरा फोन नंबर है 9840950950'
75
+
76
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
77
+ - Output: `मेरा फोन नंबर है 9840950950`
78
+
79
+ - **translate**: Translates speech from any supported Indic language to English.
80
+ - Output: `My phone number is 9840950950`
81
+
82
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
83
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
84
+
85
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
86
+ - Output: `mera phone number hai 9840950950`
87
+
88
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
89
+ - Output: `मेरा phone number है 9840950950`
78
90
 
79
91
  language_code : typing.Optional[SpeechToTextLanguage]
80
- Specifies the language of the input audio.
81
- For the `saarika:v2.5` model, it is optional.
82
- `unknown`: Use this when the language is not known; the API will detect it automatically.
92
+ Specifies the language of the input audio in BCP-47 format.
93
+
94
+ **Note:** This parameter is optional for the `saarika:v2.5` model.
95
+
96
+ **Available Options:**
97
+ - `unknown`: Use when the language is not known; the API will auto-detect.
98
+ - `hi-IN`: Hindi
99
+ - `bn-IN`: Bengali
100
+ - `kn-IN`: Kannada
101
+ - `ml-IN`: Malayalam
102
+ - `mr-IN`: Marathi
103
+ - `od-IN`: Odia
104
+ - `pa-IN`: Punjabi
105
+ - `ta-IN`: Tamil
106
+ - `te-IN`: Telugu
107
+ - `en-IN`: English
108
+ - `gu-IN`: Gujarati
83
109
 
84
110
  input_audio_codec : typing.Optional[InputAudioCodec]
85
111
  Audio codec/format of the input file. PCM files are supported only at 16kHz sample rate.
@@ -223,7 +249,10 @@ class RawSpeechToTextClient:
223
249
  Conversation context can be passed as a prompt to boost model accuracy. However, the current system is at an experimentation stage and doesn't match the prompt performance of large language models.
224
250
 
225
251
  model : typing.Optional[SpeechToTextTranslateModel]
226
- Model to be used for converting speech to text in target language
252
+ Model to be used for speech-to-text translation.
253
+
254
+ - **saaras:v2.5** (default): Translation model that translates audio from any spoken Indic language to English.
255
+ - Example: Hindi audio → English text output
227
256
 
228
257
  input_audio_codec : typing.Optional[InputAudioCodec]
229
258
  Audio codec/format of the input file. Our API automatically detects all codec formats, but for PCM files specifically (pcm_s16le, pcm_l16, pcm_raw), you must pass this parameter. PCM files are supported only at 16kHz sample rate.
@@ -370,23 +399,49 @@ class AsyncRawSpeechToTextClient:
370
399
 
371
400
  model : typing.Optional[SpeechToTextModel]
372
401
  Specifies the model to use for speech-to-text conversion.
373
- - **saarika:v2.5** (default): Standard transcription model
374
- - **saarika:v3**: Advanced transcription model
375
- - **saaras:v3**: Advanced model with multiple output modes
402
+
403
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
404
+
405
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
376
406
 
377
407
  mode : typing.Optional[Mode]
378
408
  Mode of operation. **Only applicable when using saaras:v3 model.**
379
- - **transcribe** (default): Standard transcription
380
- - **translate**: Translation to English
381
- - **indic-en**: Indic to English translation
382
- - **verbatim**: Exact transcription
383
- - **translit**: Transliteration to Latin script
384
- - **codemix**: Code-mixed output
409
+
410
+ Example audio: 'मेरा फोन नंबर है 9840950950'
411
+
412
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
413
+ - Output: `मेरा फोन नंबर है 9840950950`
414
+
415
+ - **translate**: Translates speech from any supported Indic language to English.
416
+ - Output: `My phone number is 9840950950`
417
+
418
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
419
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
420
+
421
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
422
+ - Output: `mera phone number hai 9840950950`
423
+
424
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
425
+ - Output: `मेरा phone number है 9840950950`
385
426
 
386
427
  language_code : typing.Optional[SpeechToTextLanguage]
387
- Specifies the language of the input audio.
388
- For the `saarika:v2.5` model, it is optional.
389
- `unknown`: Use this when the language is not known; the API will detect it automatically.
428
+ Specifies the language of the input audio in BCP-47 format.
429
+
430
+ **Note:** This parameter is optional for the `saarika:v2.5` model.
431
+
432
+ **Available Options:**
433
+ - `unknown`: Use when the language is not known; the API will auto-detect.
434
+ - `hi-IN`: Hindi
435
+ - `bn-IN`: Bengali
436
+ - `kn-IN`: Kannada
437
+ - `ml-IN`: Malayalam
438
+ - `mr-IN`: Marathi
439
+ - `od-IN`: Odia
440
+ - `pa-IN`: Punjabi
441
+ - `ta-IN`: Tamil
442
+ - `te-IN`: Telugu
443
+ - `en-IN`: English
444
+ - `gu-IN`: Gujarati
390
445
 
391
446
  input_audio_codec : typing.Optional[InputAudioCodec]
392
447
  Audio codec/format of the input file. PCM files are supported only at 16kHz sample rate.
@@ -530,7 +585,10 @@ class AsyncRawSpeechToTextClient:
530
585
  Conversation context can be passed as a prompt to boost model accuracy. However, the current system is at an experimentation stage and doesn't match the prompt performance of large language models.
531
586
 
532
587
  model : typing.Optional[SpeechToTextTranslateModel]
533
- Model to be used for converting speech to text in target language
588
+ Model to be used for speech-to-text translation.
589
+
590
+ - **saaras:v2.5** (default): Translation model that translates audio from any spoken Indic language to English.
591
+ - Example: Hindi audio → English text output
534
592
 
535
593
  input_audio_codec : typing.Optional[InputAudioCodec]
536
594
  Audio codec/format of the input file. Our API automatically detects all codec formats, but for PCM files specifically (pcm_s16le, pcm_l16, pcm_raw), you must pass this parameter. PCM files are supported only at 16kHz sample rate.
@@ -63,19 +63,47 @@ class SpeechToTextStreamingClient:
63
63
  Parameters
64
64
  ----------
65
65
  language_code : SpeechToTextStreamingLanguageCode
66
- Language code for speech recognition (BCP-47 format)
66
+ Specifies the language of the input audio in BCP-47 format.
67
+
68
+ **Available Options:**
69
+ - `hi-IN`: Hindi
70
+ - `bn-IN`: Bengali
71
+ - `gu-IN`: Gujarati
72
+ - `kn-IN`: Kannada
73
+ - `ml-IN`: Malayalam
74
+ - `mr-IN`: Marathi
75
+ - `od-IN`: Odia
76
+ - `pa-IN`: Punjabi
77
+ - `ta-IN`: Tamil
78
+ - `te-IN`: Telugu
79
+ - `en-IN`: English
67
80
 
68
81
  model : typing.Optional[SpeechToTextStreamingModel]
69
- Speech to text model to use
82
+ Specifies the model to use for speech-to-text conversion.
83
+
84
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
85
+
86
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
70
87
 
71
88
  mode : typing.Optional[SpeechToTextStreamingMode]
72
- Mode of operation for saaras:v3 model. Only applicable when model is 'saaras:v3'.
73
- - transcribe: Standard Whisper transcription
74
- - translate: Standard Whisper translation to English
75
- - indic-en: Translate Indic languages to English
76
- - verbatim: Exact transcription in original script
77
- - translit: Transliteration to Latin script
78
- - codemix: Code-mixed output (native + English)
89
+ Mode of operation. **Only applicable when using saaras:v3 model.**
90
+
91
+ Example audio: 'मेरा फोन नंबर है 9840950950'
92
+
93
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
94
+ - Output: `मेरा फोन नंबर है 9840950950`
95
+
96
+ - **translate**: Translates speech from any supported Indic language to English.
97
+ - Output: `My phone number is 9840950950`
98
+
99
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
100
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
101
+
102
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
103
+ - Output: `mera phone number hai 9840950950`
104
+
105
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
106
+ - Output: `मेरा phone number है 9840950950`
79
107
 
80
108
  sample_rate : typing.Optional[str]
81
109
  Audio sample rate for the WebSocket connection. When specified as a connection parameter, only 16kHz and 8kHz are supported. 8kHz is only available via this connection parameter. If not specified, defaults to 16kHz.
@@ -178,19 +206,47 @@ class AsyncSpeechToTextStreamingClient:
178
206
  Parameters
179
207
  ----------
180
208
  language_code : SpeechToTextStreamingLanguageCode
181
- Language code for speech recognition (BCP-47 format)
209
+ Specifies the language of the input audio in BCP-47 format.
210
+
211
+ **Available Options:**
212
+ - `hi-IN`: Hindi
213
+ - `bn-IN`: Bengali
214
+ - `gu-IN`: Gujarati
215
+ - `kn-IN`: Kannada
216
+ - `ml-IN`: Malayalam
217
+ - `mr-IN`: Marathi
218
+ - `od-IN`: Odia
219
+ - `pa-IN`: Punjabi
220
+ - `ta-IN`: Tamil
221
+ - `te-IN`: Telugu
222
+ - `en-IN`: English
182
223
 
183
224
  model : typing.Optional[SpeechToTextStreamingModel]
184
- Speech to text model to use
225
+ Specifies the model to use for speech-to-text conversion.
226
+
227
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
228
+
229
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
185
230
 
186
231
  mode : typing.Optional[SpeechToTextStreamingMode]
187
- Mode of operation for saaras:v3 model. Only applicable when model is 'saaras:v3'.
188
- - transcribe: Standard Whisper transcription
189
- - translate: Standard Whisper translation to English
190
- - indic-en: Translate Indic languages to English
191
- - verbatim: Exact transcription in original script
192
- - translit: Transliteration to Latin script
193
- - codemix: Code-mixed output (native + English)
232
+ Mode of operation. **Only applicable when using saaras:v3 model.**
233
+
234
+ Example audio: 'मेरा फोन नंबर है 9840950950'
235
+
236
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
237
+ - Output: `मेरा फोन नंबर है 9840950950`
238
+
239
+ - **translate**: Translates speech from any supported Indic language to English.
240
+ - Output: `My phone number is 9840950950`
241
+
242
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
243
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
244
+
245
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
246
+ - Output: `mera phone number hai 9840950950`
247
+
248
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
249
+ - Output: `मेरा phone number है 9840950950`
194
250
 
195
251
  sample_rate : typing.Optional[str]
196
252
  Audio sample rate for the WebSocket connection. When specified as a connection parameter, only 16kHz and 8kHz are supported. 8kHz is only available via this connection parameter. If not specified, defaults to 16kHz.
@@ -51,19 +51,47 @@ class RawSpeechToTextStreamingClient:
51
51
  Parameters
52
52
  ----------
53
53
  language_code : SpeechToTextStreamingLanguageCode
54
- Language code for speech recognition (BCP-47 format)
54
+ Specifies the language of the input audio in BCP-47 format.
55
+
56
+ **Available Options:**
57
+ - `hi-IN`: Hindi
58
+ - `bn-IN`: Bengali
59
+ - `gu-IN`: Gujarati
60
+ - `kn-IN`: Kannada
61
+ - `ml-IN`: Malayalam
62
+ - `mr-IN`: Marathi
63
+ - `od-IN`: Odia
64
+ - `pa-IN`: Punjabi
65
+ - `ta-IN`: Tamil
66
+ - `te-IN`: Telugu
67
+ - `en-IN`: English
55
68
 
56
69
  model : typing.Optional[SpeechToTextStreamingModel]
57
- Speech to text model to use
70
+ Specifies the model to use for speech-to-text conversion.
71
+
72
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
73
+
74
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
58
75
 
59
76
  mode : typing.Optional[SpeechToTextStreamingMode]
60
- Mode of operation for saaras:v3 model. Only applicable when model is 'saaras:v3'.
61
- - transcribe: Standard Whisper transcription
62
- - translate: Standard Whisper translation to English
63
- - indic-en: Translate Indic languages to English
64
- - verbatim: Exact transcription in original script
65
- - translit: Transliteration to Latin script
66
- - codemix: Code-mixed output (native + English)
77
+ Mode of operation. **Only applicable when using saaras:v3 model.**
78
+
79
+ Example audio: 'मेरा फोन नंबर है 9840950950'
80
+
81
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
82
+ - Output: `मेरा फोन नंबर है 9840950950`
83
+
84
+ - **translate**: Translates speech from any supported Indic language to English.
85
+ - Output: `My phone number is 9840950950`
86
+
87
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
88
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
89
+
90
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
91
+ - Output: `mera phone number hai 9840950950`
92
+
93
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
94
+ - Output: `मेरा phone number है 9840950950`
67
95
 
68
96
  sample_rate : typing.Optional[str]
69
97
  Audio sample rate for the WebSocket connection. When specified as a connection parameter, only 16kHz and 8kHz are supported. 8kHz is only available via this connection parameter. If not specified, defaults to 16kHz.
@@ -155,19 +183,47 @@ class AsyncRawSpeechToTextStreamingClient:
155
183
  Parameters
156
184
  ----------
157
185
  language_code : SpeechToTextStreamingLanguageCode
158
- Language code for speech recognition (BCP-47 format)
186
+ Specifies the language of the input audio in BCP-47 format.
187
+
188
+ **Available Options:**
189
+ - `hi-IN`: Hindi
190
+ - `bn-IN`: Bengali
191
+ - `gu-IN`: Gujarati
192
+ - `kn-IN`: Kannada
193
+ - `ml-IN`: Malayalam
194
+ - `mr-IN`: Marathi
195
+ - `od-IN`: Odia
196
+ - `pa-IN`: Punjabi
197
+ - `ta-IN`: Tamil
198
+ - `te-IN`: Telugu
199
+ - `en-IN`: English
159
200
 
160
201
  model : typing.Optional[SpeechToTextStreamingModel]
161
- Speech to text model to use
202
+ Specifies the model to use for speech-to-text conversion.
203
+
204
+ - **saarika:v2.5** (default): Transcribes audio in the spoken language.
205
+
206
+ - **saaras:v3**: State-of-the-art model with flexible output formats. Supports multiple modes via the `mode` parameter: transcribe, translate, verbatim, translit, codemix.
162
207
 
163
208
  mode : typing.Optional[SpeechToTextStreamingMode]
164
- Mode of operation for saaras:v3 model. Only applicable when model is 'saaras:v3'.
165
- - transcribe: Standard Whisper transcription
166
- - translate: Standard Whisper translation to English
167
- - indic-en: Translate Indic languages to English
168
- - verbatim: Exact transcription in original script
169
- - translit: Transliteration to Latin script
170
- - codemix: Code-mixed output (native + English)
209
+ Mode of operation. **Only applicable when using saaras:v3 model.**
210
+
211
+ Example audio: 'मेरा फोन नंबर है 9840950950'
212
+
213
+ - **transcribe** (default): Standard transcription in the original language with proper formatting and number normalization.
214
+ - Output: `मेरा फोन नंबर है 9840950950`
215
+
216
+ - **translate**: Translates speech from any supported Indic language to English.
217
+ - Output: `My phone number is 9840950950`
218
+
219
+ - **verbatim**: Exact word-for-word transcription without normalization, preserving filler words and spoken numbers as-is.
220
+ - Output: `मेरा फोन नंबर है नौ आठ चार zero नौ पांच zero नौ पांच zero`
221
+
222
+ - **translit**: Romanization - Transliterates speech to Latin/Roman script only.
223
+ - Output: `mera phone number hai 9840950950`
224
+
225
+ - **codemix**: Code-mixed text with English words in English and Indic words in native script.
226
+ - Output: `मेरा phone number है 9840950950`
171
227
 
172
228
  sample_rate : typing.Optional[str]
173
229
  Audio sample rate for the WebSocket connection. When specified as a connection parameter, only 16kHz and 8kHz are supported. 8kHz is only available via this connection parameter. If not specified, defaults to 16kHz.