voice-router-dev 0.9.0 → 0.9.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,2 +1,2 @@
1
1
  import 'zod';
2
- export { B as AssemblyAIListFilterFieldName, L as AssemblyAIListFilterSchema, E as AssemblyAIStreamingConfig, x as AssemblyAIStreamingFieldName, J as AssemblyAIStreamingSchema, H as AssemblyAIStreamingUpdateConfig, y as AssemblyAIStreamingUpdateFieldName, K as AssemblyAIStreamingUpdateSchema, C as AssemblyAITranscriptionConfig, A as AssemblyAITranscriptionFieldName, I as AssemblyAITranscriptionSchema, R as AzureListFilterFieldName, U as AzureListFilterSchema, S as AzureTranscriptionConfig, Q as AzureTranscriptionFieldName, T as AzureTranscriptionSchema, q as DeepgramListFilterFieldName, w as DeepgramListFilterSchema, p as DeepgramStreamingFieldName, t as DeepgramStreamingOnlyConfig, v as DeepgramStreamingOnlySchema, r as DeepgramTranscriptionConfig, D as DeepgramTranscriptionFieldName, u as DeepgramTranscriptionSchema, Z as FieldConfig, aK as FieldConfigProvider, c as FieldOverrides, F as FieldType, i as GladiaListFilterFieldName, n as GladiaListFilterSchema, k as GladiaStreamingConfig, h as GladiaStreamingFieldName, m as GladiaStreamingSchema, j as GladiaTranscriptionConfig, G as GladiaTranscriptionFieldName, l as GladiaTranscriptionSchema, M as OpenAITranscriptionConfig, O as OpenAITranscriptionFieldName, N as OpenAITranscriptionSchema, P as ProviderFieldConfigs, a8 as SonioxListFilterFieldName, af as SonioxListFilterSchema, aa as SonioxStreamingConfig, a6 as SonioxStreamingFieldName, ad as SonioxStreamingSchema, ab as SonioxStreamingUpdateConfig, a7 as SonioxStreamingUpdateFieldName, ae as SonioxStreamingUpdateSchema, a9 as SonioxTranscriptionConfig, a5 as SonioxTranscriptionFieldName, ac as SonioxTranscriptionSchema, Y as SpeechmaticsListFilterFieldName, a4 as SpeechmaticsListFilterSchema, $ as SpeechmaticsStreamingConfig, W as SpeechmaticsStreamingFieldName, a2 as SpeechmaticsStreamingSchema, a0 as SpeechmaticsStreamingUpdateConfig, X as SpeechmaticsStreamingUpdateFieldName, a3 as SpeechmaticsStreamingUpdateSchema, _ as SpeechmaticsTranscriptionConfig, V as SpeechmaticsTranscriptionFieldName, a1 as SpeechmaticsTranscriptionSchema, ah as StreamingFieldName, ag as TranscriptionFieldName, aM as getAllFieldConfigs, au as getAssemblyAIFieldConfigs, ar as getAssemblyAIListFilterFields, as as getAssemblyAIStreamingFields, at as getAssemblyAIStreamingUpdateFields, aq as getAssemblyAITranscriptionFields, az as getAzureFieldConfigs, ay as getAzureListFilterFields, ax as getAzureTranscriptionFields, ap as getDeepgramFieldConfigs, an as getDeepgramListFilterFields, ao as getDeepgramStreamingFields, am as getDeepgramTranscriptionFields, al as getGladiaFieldConfigs, aj as getGladiaListFilterFields, ak as getGladiaStreamingFields, ai as getGladiaTranscriptionFields, aw as getOpenAIFieldConfigs, av as getOpenAITranscriptionFields, aL as getProviderFieldConfigs, aJ as getSonioxFieldConfigs, aG as getSonioxListFilterFields, aH as getSonioxStreamingFields, aI as getSonioxStreamingUpdateFields, aF as getSonioxTranscriptionFields, aE as getSpeechmaticsFieldConfigs, aB as getSpeechmaticsListFilterFields, aC as getSpeechmaticsStreamingFields, aD as getSpeechmaticsStreamingUpdateFields, aA as getSpeechmaticsTranscriptionFields } from './field-configs-DYiUtRUz.mjs';
2
+ export { B as AssemblyAIListFilterFieldName, L as AssemblyAIListFilterSchema, E as AssemblyAIStreamingConfig, x as AssemblyAIStreamingFieldName, J as AssemblyAIStreamingSchema, H as AssemblyAIStreamingUpdateConfig, y as AssemblyAIStreamingUpdateFieldName, K as AssemblyAIStreamingUpdateSchema, C as AssemblyAITranscriptionConfig, A as AssemblyAITranscriptionFieldName, I as AssemblyAITranscriptionSchema, R as AzureListFilterFieldName, U as AzureListFilterSchema, S as AzureTranscriptionConfig, Q as AzureTranscriptionFieldName, T as AzureTranscriptionSchema, q as DeepgramListFilterFieldName, w as DeepgramListFilterSchema, p as DeepgramStreamingFieldName, t as DeepgramStreamingOnlyConfig, v as DeepgramStreamingOnlySchema, r as DeepgramTranscriptionConfig, D as DeepgramTranscriptionFieldName, u as DeepgramTranscriptionSchema, Z as FieldConfig, aK as FieldConfigProvider, c as FieldOverrides, F as FieldType, i as GladiaListFilterFieldName, n as GladiaListFilterSchema, k as GladiaStreamingConfig, h as GladiaStreamingFieldName, m as GladiaStreamingSchema, j as GladiaTranscriptionConfig, G as GladiaTranscriptionFieldName, l as GladiaTranscriptionSchema, M as OpenAITranscriptionConfig, O as OpenAITranscriptionFieldName, N as OpenAITranscriptionSchema, P as ProviderFieldConfigs, a8 as SonioxListFilterFieldName, af as SonioxListFilterSchema, aa as SonioxStreamingConfig, a6 as SonioxStreamingFieldName, ad as SonioxStreamingSchema, ab as SonioxStreamingUpdateConfig, a7 as SonioxStreamingUpdateFieldName, ae as SonioxStreamingUpdateSchema, a9 as SonioxTranscriptionConfig, a5 as SonioxTranscriptionFieldName, ac as SonioxTranscriptionSchema, Y as SpeechmaticsListFilterFieldName, a4 as SpeechmaticsListFilterSchema, $ as SpeechmaticsStreamingConfig, W as SpeechmaticsStreamingFieldName, a2 as SpeechmaticsStreamingSchema, a0 as SpeechmaticsStreamingUpdateConfig, X as SpeechmaticsStreamingUpdateFieldName, a3 as SpeechmaticsStreamingUpdateSchema, _ as SpeechmaticsTranscriptionConfig, V as SpeechmaticsTranscriptionFieldName, a1 as SpeechmaticsTranscriptionSchema, ah as StreamingFieldName, ag as TranscriptionFieldName, aM as getAllFieldConfigs, au as getAssemblyAIFieldConfigs, ar as getAssemblyAIListFilterFields, as as getAssemblyAIStreamingFields, at as getAssemblyAIStreamingUpdateFields, aq as getAssemblyAITranscriptionFields, az as getAzureFieldConfigs, ay as getAzureListFilterFields, ax as getAzureTranscriptionFields, ap as getDeepgramFieldConfigs, an as getDeepgramListFilterFields, ao as getDeepgramStreamingFields, am as getDeepgramTranscriptionFields, al as getGladiaFieldConfigs, aj as getGladiaListFilterFields, ak as getGladiaStreamingFields, ai as getGladiaTranscriptionFields, aw as getOpenAIFieldConfigs, av as getOpenAITranscriptionFields, aL as getProviderFieldConfigs, aJ as getSonioxFieldConfigs, aG as getSonioxListFilterFields, aH as getSonioxStreamingFields, aI as getSonioxStreamingUpdateFields, aF as getSonioxTranscriptionFields, aE as getSpeechmaticsFieldConfigs, aB as getSpeechmaticsListFilterFields, aC as getSpeechmaticsStreamingFields, aD as getSpeechmaticsStreamingUpdateFields, aA as getSpeechmaticsTranscriptionFields } from './field-configs-FbtCPxzs.mjs';
@@ -1,2 +1,2 @@
1
1
  import 'zod';
2
- export { B as AssemblyAIListFilterFieldName, L as AssemblyAIListFilterSchema, E as AssemblyAIStreamingConfig, x as AssemblyAIStreamingFieldName, J as AssemblyAIStreamingSchema, H as AssemblyAIStreamingUpdateConfig, y as AssemblyAIStreamingUpdateFieldName, K as AssemblyAIStreamingUpdateSchema, C as AssemblyAITranscriptionConfig, A as AssemblyAITranscriptionFieldName, I as AssemblyAITranscriptionSchema, R as AzureListFilterFieldName, U as AzureListFilterSchema, S as AzureTranscriptionConfig, Q as AzureTranscriptionFieldName, T as AzureTranscriptionSchema, q as DeepgramListFilterFieldName, w as DeepgramListFilterSchema, p as DeepgramStreamingFieldName, t as DeepgramStreamingOnlyConfig, v as DeepgramStreamingOnlySchema, r as DeepgramTranscriptionConfig, D as DeepgramTranscriptionFieldName, u as DeepgramTranscriptionSchema, Z as FieldConfig, aK as FieldConfigProvider, c as FieldOverrides, F as FieldType, i as GladiaListFilterFieldName, n as GladiaListFilterSchema, k as GladiaStreamingConfig, h as GladiaStreamingFieldName, m as GladiaStreamingSchema, j as GladiaTranscriptionConfig, G as GladiaTranscriptionFieldName, l as GladiaTranscriptionSchema, M as OpenAITranscriptionConfig, O as OpenAITranscriptionFieldName, N as OpenAITranscriptionSchema, P as ProviderFieldConfigs, a8 as SonioxListFilterFieldName, af as SonioxListFilterSchema, aa as SonioxStreamingConfig, a6 as SonioxStreamingFieldName, ad as SonioxStreamingSchema, ab as SonioxStreamingUpdateConfig, a7 as SonioxStreamingUpdateFieldName, ae as SonioxStreamingUpdateSchema, a9 as SonioxTranscriptionConfig, a5 as SonioxTranscriptionFieldName, ac as SonioxTranscriptionSchema, Y as SpeechmaticsListFilterFieldName, a4 as SpeechmaticsListFilterSchema, $ as SpeechmaticsStreamingConfig, W as SpeechmaticsStreamingFieldName, a2 as SpeechmaticsStreamingSchema, a0 as SpeechmaticsStreamingUpdateConfig, X as SpeechmaticsStreamingUpdateFieldName, a3 as SpeechmaticsStreamingUpdateSchema, _ as SpeechmaticsTranscriptionConfig, V as SpeechmaticsTranscriptionFieldName, a1 as SpeechmaticsTranscriptionSchema, ah as StreamingFieldName, ag as TranscriptionFieldName, aM as getAllFieldConfigs, au as getAssemblyAIFieldConfigs, ar as getAssemblyAIListFilterFields, as as getAssemblyAIStreamingFields, at as getAssemblyAIStreamingUpdateFields, aq as getAssemblyAITranscriptionFields, az as getAzureFieldConfigs, ay as getAzureListFilterFields, ax as getAzureTranscriptionFields, ap as getDeepgramFieldConfigs, an as getDeepgramListFilterFields, ao as getDeepgramStreamingFields, am as getDeepgramTranscriptionFields, al as getGladiaFieldConfigs, aj as getGladiaListFilterFields, ak as getGladiaStreamingFields, ai as getGladiaTranscriptionFields, aw as getOpenAIFieldConfigs, av as getOpenAITranscriptionFields, aL as getProviderFieldConfigs, aJ as getSonioxFieldConfigs, aG as getSonioxListFilterFields, aH as getSonioxStreamingFields, aI as getSonioxStreamingUpdateFields, aF as getSonioxTranscriptionFields, aE as getSpeechmaticsFieldConfigs, aB as getSpeechmaticsListFilterFields, aC as getSpeechmaticsStreamingFields, aD as getSpeechmaticsStreamingUpdateFields, aA as getSpeechmaticsTranscriptionFields } from './field-configs-DYiUtRUz.js';
2
+ export { B as AssemblyAIListFilterFieldName, L as AssemblyAIListFilterSchema, E as AssemblyAIStreamingConfig, x as AssemblyAIStreamingFieldName, J as AssemblyAIStreamingSchema, H as AssemblyAIStreamingUpdateConfig, y as AssemblyAIStreamingUpdateFieldName, K as AssemblyAIStreamingUpdateSchema, C as AssemblyAITranscriptionConfig, A as AssemblyAITranscriptionFieldName, I as AssemblyAITranscriptionSchema, R as AzureListFilterFieldName, U as AzureListFilterSchema, S as AzureTranscriptionConfig, Q as AzureTranscriptionFieldName, T as AzureTranscriptionSchema, q as DeepgramListFilterFieldName, w as DeepgramListFilterSchema, p as DeepgramStreamingFieldName, t as DeepgramStreamingOnlyConfig, v as DeepgramStreamingOnlySchema, r as DeepgramTranscriptionConfig, D as DeepgramTranscriptionFieldName, u as DeepgramTranscriptionSchema, Z as FieldConfig, aK as FieldConfigProvider, c as FieldOverrides, F as FieldType, i as GladiaListFilterFieldName, n as GladiaListFilterSchema, k as GladiaStreamingConfig, h as GladiaStreamingFieldName, m as GladiaStreamingSchema, j as GladiaTranscriptionConfig, G as GladiaTranscriptionFieldName, l as GladiaTranscriptionSchema, M as OpenAITranscriptionConfig, O as OpenAITranscriptionFieldName, N as OpenAITranscriptionSchema, P as ProviderFieldConfigs, a8 as SonioxListFilterFieldName, af as SonioxListFilterSchema, aa as SonioxStreamingConfig, a6 as SonioxStreamingFieldName, ad as SonioxStreamingSchema, ab as SonioxStreamingUpdateConfig, a7 as SonioxStreamingUpdateFieldName, ae as SonioxStreamingUpdateSchema, a9 as SonioxTranscriptionConfig, a5 as SonioxTranscriptionFieldName, ac as SonioxTranscriptionSchema, Y as SpeechmaticsListFilterFieldName, a4 as SpeechmaticsListFilterSchema, $ as SpeechmaticsStreamingConfig, W as SpeechmaticsStreamingFieldName, a2 as SpeechmaticsStreamingSchema, a0 as SpeechmaticsStreamingUpdateConfig, X as SpeechmaticsStreamingUpdateFieldName, a3 as SpeechmaticsStreamingUpdateSchema, _ as SpeechmaticsTranscriptionConfig, V as SpeechmaticsTranscriptionFieldName, a1 as SpeechmaticsTranscriptionSchema, ah as StreamingFieldName, ag as TranscriptionFieldName, aM as getAllFieldConfigs, au as getAssemblyAIFieldConfigs, ar as getAssemblyAIListFilterFields, as as getAssemblyAIStreamingFields, at as getAssemblyAIStreamingUpdateFields, aq as getAssemblyAITranscriptionFields, az as getAzureFieldConfigs, ay as getAzureListFilterFields, ax as getAzureTranscriptionFields, ap as getDeepgramFieldConfigs, an as getDeepgramListFilterFields, ao as getDeepgramStreamingFields, am as getDeepgramTranscriptionFields, al as getGladiaFieldConfigs, aj as getGladiaListFilterFields, ak as getGladiaStreamingFields, ai as getGladiaTranscriptionFields, aw as getOpenAIFieldConfigs, av as getOpenAITranscriptionFields, aL as getProviderFieldConfigs, aJ as getSonioxFieldConfigs, aG as getSonioxListFilterFields, aH as getSonioxStreamingFields, aI as getSonioxStreamingUpdateFields, aF as getSonioxTranscriptionFields, aE as getSpeechmaticsFieldConfigs, aB as getSpeechmaticsListFilterFields, aC as getSpeechmaticsStreamingFields, aD as getSpeechmaticsStreamingUpdateFields, aA as getSpeechmaticsTranscriptionFields } from './field-configs-FbtCPxzs.js';
@@ -24662,7 +24662,7 @@ var createTemporaryApiKeyBody = import_zod10.z.object({
24662
24662
 
24663
24663
  // src/generated/soniox/streaming-types.zod.ts
24664
24664
  var import_zod11 = require("zod");
24665
- var sonioxAutoDetectedAudioFormatSchema = import_zod11.z.enum([
24665
+ var sonioxAudioFormatSchema = import_zod11.z.enum([
24666
24666
  "auto",
24667
24667
  "aac",
24668
24668
  "aiff",
@@ -24672,10 +24672,7 @@ var sonioxAutoDetectedAudioFormatSchema = import_zod11.z.enum([
24672
24672
  "mp3",
24673
24673
  "ogg",
24674
24674
  "wav",
24675
- "webm"
24676
- ]);
24677
- var sonioxPcmAudioEncodingSchema = import_zod11.z.enum([
24678
- // Signed PCM
24675
+ "webm",
24679
24676
  "pcm_s8",
24680
24677
  "pcm_s16le",
24681
24678
  "pcm_s16be",
@@ -24683,7 +24680,6 @@ var sonioxPcmAudioEncodingSchema = import_zod11.z.enum([
24683
24680
  "pcm_s24be",
24684
24681
  "pcm_s32le",
24685
24682
  "pcm_s32be",
24686
- // Unsigned PCM
24687
24683
  "pcm_u8",
24688
24684
  "pcm_u16le",
24689
24685
  "pcm_u16be",
@@ -24691,86 +24687,81 @@ var sonioxPcmAudioEncodingSchema = import_zod11.z.enum([
24691
24687
  "pcm_u24be",
24692
24688
  "pcm_u32le",
24693
24689
  "pcm_u32be",
24694
- // Float PCM
24695
24690
  "pcm_f32le",
24696
24691
  "pcm_f32be",
24697
24692
  "pcm_f64le",
24698
24693
  "pcm_f64be",
24699
- // Companded
24700
24694
  "mulaw",
24701
24695
  "alaw"
24702
24696
  ]);
24703
- var sonioxAudioFormatSchema = import_zod11.z.union([
24704
- sonioxAutoDetectedAudioFormatSchema,
24705
- sonioxPcmAudioEncodingSchema
24706
- ]);
24707
24697
  var sonioxOneWayTranslationSchema = import_zod11.z.object({
24708
24698
  type: import_zod11.z.literal("one_way"),
24709
- target_language: import_zod11.z.string().describe("Target language code for translation")
24699
+ target_language: import_zod11.z.string()
24710
24700
  });
24711
24701
  var sonioxTwoWayTranslationSchema = import_zod11.z.object({
24712
24702
  type: import_zod11.z.literal("two_way"),
24713
- language_a: import_zod11.z.string().describe("First language for bidirectional translation"),
24714
- language_b: import_zod11.z.string().describe("Second language for bidirectional translation")
24703
+ language_a: import_zod11.z.string(),
24704
+ language_b: import_zod11.z.string()
24715
24705
  });
24716
24706
  var sonioxTranslationConfigSchema = import_zod11.z.union([
24717
24707
  sonioxOneWayTranslationSchema,
24718
24708
  sonioxTwoWayTranslationSchema
24719
24709
  ]);
24720
24710
  var sonioxContextGeneralItemSchema = import_zod11.z.object({
24721
- key: import_zod11.z.string().describe("Context item key (e.g. 'Domain')"),
24722
- value: import_zod11.z.string().describe("Context item value (e.g. 'medicine')")
24711
+ key: import_zod11.z.string(),
24712
+ value: import_zod11.z.string()
24723
24713
  });
24724
24714
  var sonioxTranslationTermSchema = import_zod11.z.object({
24725
- source: import_zod11.z.string().describe("Source term"),
24726
- target: import_zod11.z.string().describe("Target term to translate to")
24715
+ source: import_zod11.z.string(),
24716
+ target: import_zod11.z.string()
24727
24717
  });
24728
24718
  var sonioxStructuredContextSchema = import_zod11.z.object({
24729
- general: import_zod11.z.array(sonioxContextGeneralItemSchema).optional().describe("General context items (key-value pairs)"),
24730
- text: import_zod11.z.string().optional().describe("Text context"),
24731
- terms: import_zod11.z.array(import_zod11.z.string()).optional().describe("Terms that might occur in speech"),
24732
- translation_terms: import_zod11.z.array(sonioxTranslationTermSchema).optional().describe("Hints how to translate specific terms (ignored if translation is not enabled)")
24719
+ general: import_zod11.z.array(sonioxContextGeneralItemSchema).optional(),
24720
+ text: import_zod11.z.string().optional(),
24721
+ terms: import_zod11.z.array(import_zod11.z.string()).optional(),
24722
+ translation_terms: import_zod11.z.array(sonioxTranslationTermSchema).optional()
24733
24723
  });
24734
24724
  var sonioxContextSchema = import_zod11.z.union([sonioxStructuredContextSchema, import_zod11.z.string()]);
24735
24725
  var sonioxRealtimeModelSchema = import_zod11.z.enum([
24726
+ "stt-rt-v4",
24736
24727
  "stt-rt-v3",
24737
24728
  "stt-rt-preview",
24738
24729
  "stt-rt-v3-preview",
24739
24730
  "stt-rt-preview-v2"
24740
24731
  ]);
24741
24732
  var streamingTranscriberParams3 = import_zod11.z.object({
24742
- model: sonioxRealtimeModelSchema.describe("Real-time model to use"),
24743
- audioFormat: sonioxAudioFormatSchema.optional().describe("Audio format specification. Use 'auto' for automatic detection"),
24744
- sampleRate: import_zod11.z.number().optional().describe("Sample rate in Hz (required for raw PCM formats)"),
24745
- numChannels: import_zod11.z.number().min(1).max(2).optional().describe("Number of audio channels (1 for mono, 2 for stereo) - required for raw PCM formats"),
24746
- languageHints: import_zod11.z.array(import_zod11.z.string()).optional().describe("Expected languages in the audio (ISO language codes)"),
24747
- context: sonioxContextSchema.optional().describe("Additional context to improve transcription accuracy"),
24748
- enableSpeakerDiarization: import_zod11.z.boolean().optional().describe("Enable speaker diarization - each token will include a speaker field"),
24749
- enableLanguageIdentification: import_zod11.z.boolean().optional().describe("Enable language identification - each token will include a language field"),
24750
- enableEndpointDetection: import_zod11.z.boolean().optional().describe("Enable endpoint detection to detect when a speaker has finished talking"),
24751
- translation: sonioxTranslationConfigSchema.optional().describe("Translation configuration"),
24752
- clientReferenceId: import_zod11.z.string().optional().describe("Optional tracking identifier (client-defined)")
24733
+ model: sonioxRealtimeModelSchema,
24734
+ audioFormat: sonioxAudioFormatSchema.optional(),
24735
+ sampleRate: import_zod11.z.number().optional(),
24736
+ numChannels: import_zod11.z.number().optional(),
24737
+ languageHints: import_zod11.z.array(import_zod11.z.string()).optional(),
24738
+ context: sonioxContextSchema.optional(),
24739
+ enableSpeakerDiarization: import_zod11.z.boolean().optional(),
24740
+ enableLanguageIdentification: import_zod11.z.boolean().optional(),
24741
+ enableEndpointDetection: import_zod11.z.boolean().optional(),
24742
+ translation: sonioxTranslationConfigSchema.optional(),
24743
+ clientReferenceId: import_zod11.z.string().optional()
24753
24744
  });
24754
- var sonioxTranslationStatusSchema = import_zod11.z.enum(["none", "original", "translation"]);
24745
+ var sonioxTranslationStatusSchema = import_zod11.z.enum(["original", "translation", "none"]);
24755
24746
  var sonioxTokenSchema = import_zod11.z.object({
24756
- text: import_zod11.z.string().describe("Token text content (subword, word, or space)"),
24757
- start_ms: import_zod11.z.number().optional().describe("Start time of the token in milliseconds"),
24758
- end_ms: import_zod11.z.number().optional().describe("End time of the token in milliseconds"),
24759
- confidence: import_zod11.z.number().min(0).max(1).optional().describe("Confidence score between 0.0 and 1.0"),
24760
- is_final: import_zod11.z.boolean().describe("Whether this token is final (confirmed) or provisional"),
24761
- speaker: import_zod11.z.string().optional().describe("Speaker identifier (only present when speaker diarization is enabled)"),
24762
- language: import_zod11.z.string().optional().describe("Detected language code (only present when language identification is enabled)"),
24763
- source_language: import_zod11.z.string().optional().describe("Original language code for translated tokens"),
24764
- translation_status: sonioxTranslationStatusSchema.optional().describe("Translation status: 'none', 'original', or 'translation'")
24747
+ text: import_zod11.z.string(),
24748
+ start_ms: import_zod11.z.number().optional(),
24749
+ end_ms: import_zod11.z.number().optional(),
24750
+ confidence: import_zod11.z.number(),
24751
+ is_final: import_zod11.z.boolean(),
24752
+ speaker: import_zod11.z.string().optional(),
24753
+ translation_status: sonioxTranslationStatusSchema.optional(),
24754
+ language: import_zod11.z.string().optional(),
24755
+ source_language: import_zod11.z.string().optional()
24765
24756
  });
24766
24757
  var sonioxStreamingResponseSchema = import_zod11.z.object({
24767
- text: import_zod11.z.string().optional().describe("Complete transcribed text"),
24768
- tokens: import_zod11.z.array(sonioxTokenSchema).describe("List of recognized tokens"),
24769
- final_audio_proc_ms: import_zod11.z.number().optional().describe("Milliseconds of audio processed into final tokens"),
24770
- total_audio_proc_ms: import_zod11.z.number().optional().describe("Milliseconds of audio processed (final + non-final)"),
24771
- finished: import_zod11.z.boolean().optional().describe("Whether the transcription is complete"),
24772
- error: import_zod11.z.string().optional().describe("Error message if an error occurred"),
24773
- error_code: import_zod11.z.number().optional().describe("Error code if an error occurred")
24758
+ text: import_zod11.z.string(),
24759
+ tokens: import_zod11.z.array(sonioxTokenSchema),
24760
+ final_audio_proc_ms: import_zod11.z.number(),
24761
+ total_audio_proc_ms: import_zod11.z.number(),
24762
+ finished: import_zod11.z.boolean().optional(),
24763
+ error_code: import_zod11.z.number().optional(),
24764
+ error_message: import_zod11.z.string().optional()
24774
24765
  });
24775
24766
  var sonioxRecorderStateSchema = import_zod11.z.enum([
24776
24767
  "Init",
@@ -24587,7 +24587,7 @@ var createTemporaryApiKeyBody = zod10.object({
24587
24587
 
24588
24588
  // src/generated/soniox/streaming-types.zod.ts
24589
24589
  import { z as zod11 } from "zod";
24590
- var sonioxAutoDetectedAudioFormatSchema = zod11.enum([
24590
+ var sonioxAudioFormatSchema = zod11.enum([
24591
24591
  "auto",
24592
24592
  "aac",
24593
24593
  "aiff",
@@ -24597,10 +24597,7 @@ var sonioxAutoDetectedAudioFormatSchema = zod11.enum([
24597
24597
  "mp3",
24598
24598
  "ogg",
24599
24599
  "wav",
24600
- "webm"
24601
- ]);
24602
- var sonioxPcmAudioEncodingSchema = zod11.enum([
24603
- // Signed PCM
24600
+ "webm",
24604
24601
  "pcm_s8",
24605
24602
  "pcm_s16le",
24606
24603
  "pcm_s16be",
@@ -24608,7 +24605,6 @@ var sonioxPcmAudioEncodingSchema = zod11.enum([
24608
24605
  "pcm_s24be",
24609
24606
  "pcm_s32le",
24610
24607
  "pcm_s32be",
24611
- // Unsigned PCM
24612
24608
  "pcm_u8",
24613
24609
  "pcm_u16le",
24614
24610
  "pcm_u16be",
@@ -24616,86 +24612,81 @@ var sonioxPcmAudioEncodingSchema = zod11.enum([
24616
24612
  "pcm_u24be",
24617
24613
  "pcm_u32le",
24618
24614
  "pcm_u32be",
24619
- // Float PCM
24620
24615
  "pcm_f32le",
24621
24616
  "pcm_f32be",
24622
24617
  "pcm_f64le",
24623
24618
  "pcm_f64be",
24624
- // Companded
24625
24619
  "mulaw",
24626
24620
  "alaw"
24627
24621
  ]);
24628
- var sonioxAudioFormatSchema = zod11.union([
24629
- sonioxAutoDetectedAudioFormatSchema,
24630
- sonioxPcmAudioEncodingSchema
24631
- ]);
24632
24622
  var sonioxOneWayTranslationSchema = zod11.object({
24633
24623
  type: zod11.literal("one_way"),
24634
- target_language: zod11.string().describe("Target language code for translation")
24624
+ target_language: zod11.string()
24635
24625
  });
24636
24626
  var sonioxTwoWayTranslationSchema = zod11.object({
24637
24627
  type: zod11.literal("two_way"),
24638
- language_a: zod11.string().describe("First language for bidirectional translation"),
24639
- language_b: zod11.string().describe("Second language for bidirectional translation")
24628
+ language_a: zod11.string(),
24629
+ language_b: zod11.string()
24640
24630
  });
24641
24631
  var sonioxTranslationConfigSchema = zod11.union([
24642
24632
  sonioxOneWayTranslationSchema,
24643
24633
  sonioxTwoWayTranslationSchema
24644
24634
  ]);
24645
24635
  var sonioxContextGeneralItemSchema = zod11.object({
24646
- key: zod11.string().describe("Context item key (e.g. 'Domain')"),
24647
- value: zod11.string().describe("Context item value (e.g. 'medicine')")
24636
+ key: zod11.string(),
24637
+ value: zod11.string()
24648
24638
  });
24649
24639
  var sonioxTranslationTermSchema = zod11.object({
24650
- source: zod11.string().describe("Source term"),
24651
- target: zod11.string().describe("Target term to translate to")
24640
+ source: zod11.string(),
24641
+ target: zod11.string()
24652
24642
  });
24653
24643
  var sonioxStructuredContextSchema = zod11.object({
24654
- general: zod11.array(sonioxContextGeneralItemSchema).optional().describe("General context items (key-value pairs)"),
24655
- text: zod11.string().optional().describe("Text context"),
24656
- terms: zod11.array(zod11.string()).optional().describe("Terms that might occur in speech"),
24657
- translation_terms: zod11.array(sonioxTranslationTermSchema).optional().describe("Hints how to translate specific terms (ignored if translation is not enabled)")
24644
+ general: zod11.array(sonioxContextGeneralItemSchema).optional(),
24645
+ text: zod11.string().optional(),
24646
+ terms: zod11.array(zod11.string()).optional(),
24647
+ translation_terms: zod11.array(sonioxTranslationTermSchema).optional()
24658
24648
  });
24659
24649
  var sonioxContextSchema = zod11.union([sonioxStructuredContextSchema, zod11.string()]);
24660
24650
  var sonioxRealtimeModelSchema = zod11.enum([
24651
+ "stt-rt-v4",
24661
24652
  "stt-rt-v3",
24662
24653
  "stt-rt-preview",
24663
24654
  "stt-rt-v3-preview",
24664
24655
  "stt-rt-preview-v2"
24665
24656
  ]);
24666
24657
  var streamingTranscriberParams3 = zod11.object({
24667
- model: sonioxRealtimeModelSchema.describe("Real-time model to use"),
24668
- audioFormat: sonioxAudioFormatSchema.optional().describe("Audio format specification. Use 'auto' for automatic detection"),
24669
- sampleRate: zod11.number().optional().describe("Sample rate in Hz (required for raw PCM formats)"),
24670
- numChannels: zod11.number().min(1).max(2).optional().describe("Number of audio channels (1 for mono, 2 for stereo) - required for raw PCM formats"),
24671
- languageHints: zod11.array(zod11.string()).optional().describe("Expected languages in the audio (ISO language codes)"),
24672
- context: sonioxContextSchema.optional().describe("Additional context to improve transcription accuracy"),
24673
- enableSpeakerDiarization: zod11.boolean().optional().describe("Enable speaker diarization - each token will include a speaker field"),
24674
- enableLanguageIdentification: zod11.boolean().optional().describe("Enable language identification - each token will include a language field"),
24675
- enableEndpointDetection: zod11.boolean().optional().describe("Enable endpoint detection to detect when a speaker has finished talking"),
24676
- translation: sonioxTranslationConfigSchema.optional().describe("Translation configuration"),
24677
- clientReferenceId: zod11.string().optional().describe("Optional tracking identifier (client-defined)")
24658
+ model: sonioxRealtimeModelSchema,
24659
+ audioFormat: sonioxAudioFormatSchema.optional(),
24660
+ sampleRate: zod11.number().optional(),
24661
+ numChannels: zod11.number().optional(),
24662
+ languageHints: zod11.array(zod11.string()).optional(),
24663
+ context: sonioxContextSchema.optional(),
24664
+ enableSpeakerDiarization: zod11.boolean().optional(),
24665
+ enableLanguageIdentification: zod11.boolean().optional(),
24666
+ enableEndpointDetection: zod11.boolean().optional(),
24667
+ translation: sonioxTranslationConfigSchema.optional(),
24668
+ clientReferenceId: zod11.string().optional()
24678
24669
  });
24679
- var sonioxTranslationStatusSchema = zod11.enum(["none", "original", "translation"]);
24670
+ var sonioxTranslationStatusSchema = zod11.enum(["original", "translation", "none"]);
24680
24671
  var sonioxTokenSchema = zod11.object({
24681
- text: zod11.string().describe("Token text content (subword, word, or space)"),
24682
- start_ms: zod11.number().optional().describe("Start time of the token in milliseconds"),
24683
- end_ms: zod11.number().optional().describe("End time of the token in milliseconds"),
24684
- confidence: zod11.number().min(0).max(1).optional().describe("Confidence score between 0.0 and 1.0"),
24685
- is_final: zod11.boolean().describe("Whether this token is final (confirmed) or provisional"),
24686
- speaker: zod11.string().optional().describe("Speaker identifier (only present when speaker diarization is enabled)"),
24687
- language: zod11.string().optional().describe("Detected language code (only present when language identification is enabled)"),
24688
- source_language: zod11.string().optional().describe("Original language code for translated tokens"),
24689
- translation_status: sonioxTranslationStatusSchema.optional().describe("Translation status: 'none', 'original', or 'translation'")
24672
+ text: zod11.string(),
24673
+ start_ms: zod11.number().optional(),
24674
+ end_ms: zod11.number().optional(),
24675
+ confidence: zod11.number(),
24676
+ is_final: zod11.boolean(),
24677
+ speaker: zod11.string().optional(),
24678
+ translation_status: sonioxTranslationStatusSchema.optional(),
24679
+ language: zod11.string().optional(),
24680
+ source_language: zod11.string().optional()
24690
24681
  });
24691
24682
  var sonioxStreamingResponseSchema = zod11.object({
24692
- text: zod11.string().optional().describe("Complete transcribed text"),
24693
- tokens: zod11.array(sonioxTokenSchema).describe("List of recognized tokens"),
24694
- final_audio_proc_ms: zod11.number().optional().describe("Milliseconds of audio processed into final tokens"),
24695
- total_audio_proc_ms: zod11.number().optional().describe("Milliseconds of audio processed (final + non-final)"),
24696
- finished: zod11.boolean().optional().describe("Whether the transcription is complete"),
24697
- error: zod11.string().optional().describe("Error message if an error occurred"),
24698
- error_code: zod11.number().optional().describe("Error code if an error occurred")
24683
+ text: zod11.string(),
24684
+ tokens: zod11.array(sonioxTokenSchema),
24685
+ final_audio_proc_ms: zod11.number(),
24686
+ total_audio_proc_ms: zod11.number(),
24687
+ finished: zod11.boolean().optional(),
24688
+ error_code: zod11.number().optional(),
24689
+ error_message: zod11.string().optional()
24699
24690
  });
24700
24691
  var sonioxRecorderStateSchema = zod11.enum([
24701
24692
  "Init",