@cartesia/cartesia-js 3.0.0-b3 → 3.0.0-b4
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +9 -0
- package/README.md +21 -21
- package/client.d.mts +2 -2
- package/client.d.mts.map +1 -1
- package/client.d.ts +2 -2
- package/client.d.ts.map +1 -1
- package/client.js.map +1 -1
- package/client.mjs.map +1 -1
- package/package.json +1 -1
- package/resources/access-token.d.mts +5 -0
- package/resources/access-token.d.mts.map +1 -1
- package/resources/access-token.d.ts +5 -0
- package/resources/access-token.d.ts.map +1 -1
- package/resources/agents/agents.js +1 -1
- package/resources/agents/agents.js.map +1 -1
- package/resources/agents/agents.mjs +1 -1
- package/resources/agents/agents.mjs.map +1 -1
- package/resources/agents/metrics/index.d.mts +1 -1
- package/resources/agents/metrics/index.d.mts.map +1 -1
- package/resources/agents/metrics/index.d.ts +1 -1
- package/resources/agents/metrics/index.d.ts.map +1 -1
- package/resources/agents/metrics/index.js.map +1 -1
- package/resources/agents/metrics/index.mjs.map +1 -1
- package/resources/agents/metrics/metrics.d.mts +2 -2
- package/resources/agents/metrics/metrics.d.mts.map +1 -1
- package/resources/agents/metrics/metrics.d.ts +2 -2
- package/resources/agents/metrics/metrics.d.ts.map +1 -1
- package/resources/agents/metrics/metrics.js.map +1 -1
- package/resources/agents/metrics/metrics.mjs.map +1 -1
- package/resources/agents/metrics/results.d.mts +23 -22
- package/resources/agents/metrics/results.d.mts.map +1 -1
- package/resources/agents/metrics/results.d.ts +23 -22
- package/resources/agents/metrics/results.d.ts.map +1 -1
- package/resources/agents/metrics/results.js +4 -5
- package/resources/agents/metrics/results.js.map +1 -1
- package/resources/agents/metrics/results.mjs +4 -5
- package/resources/agents/metrics/results.mjs.map +1 -1
- package/resources/index.d.mts +1 -1
- package/resources/index.d.mts.map +1 -1
- package/resources/index.d.ts +1 -1
- package/resources/index.d.ts.map +1 -1
- package/resources/index.js.map +1 -1
- package/resources/index.mjs.map +1 -1
- package/resources/infill.d.mts +3 -4
- package/resources/infill.d.mts.map +1 -1
- package/resources/infill.d.ts +3 -4
- package/resources/infill.d.ts.map +1 -1
- package/resources/infill.js +0 -2
- package/resources/infill.js.map +1 -1
- package/resources/infill.mjs +0 -2
- package/resources/infill.mjs.map +1 -1
- package/resources/pronunciation-dicts.d.mts +0 -8
- package/resources/pronunciation-dicts.d.mts.map +1 -1
- package/resources/pronunciation-dicts.d.ts +0 -8
- package/resources/pronunciation-dicts.d.ts.map +1 -1
- package/resources/pronunciation-dicts.js +0 -18
- package/resources/pronunciation-dicts.js.map +1 -1
- package/resources/pronunciation-dicts.mjs +0 -18
- package/resources/pronunciation-dicts.mjs.map +1 -1
- package/resources/stt.d.mts +1 -104
- package/resources/stt.d.mts.map +1 -1
- package/resources/stt.d.ts +1 -104
- package/resources/stt.d.ts.map +1 -1
- package/resources/tts/tts.d.mts +79 -115
- package/resources/tts/tts.d.mts.map +1 -1
- package/resources/tts/tts.d.ts +79 -115
- package/resources/tts/tts.d.ts.map +1 -1
- package/resources/voice-changer.d.mts +2 -2
- package/resources/voice-changer.d.mts.map +1 -1
- package/resources/voice-changer.d.ts +2 -2
- package/resources/voice-changer.d.ts.map +1 -1
- package/resources/voices.d.mts +70 -34
- package/resources/voices.d.mts.map +1 -1
- package/resources/voices.d.ts +70 -34
- package/resources/voices.d.ts.map +1 -1
- package/resources/voices.js +45 -3
- package/resources/voices.js.map +1 -1
- package/resources/voices.mjs +45 -3
- package/resources/voices.mjs.map +1 -1
- package/src/client.ts +2 -0
- package/src/resources/access-token.ts +6 -0
- package/src/resources/agents/agents.ts +1 -1
- package/src/resources/agents/metrics/index.ts +1 -0
- package/src/resources/agents/metrics/metrics.ts +2 -0
- package/src/resources/agents/metrics/results.ts +27 -23
- package/src/resources/index.ts +1 -0
- package/src/resources/infill.ts +3 -4
- package/src/resources/pronunciation-dicts.ts +0 -20
- package/src/resources/stt.ts +102 -104
- package/src/resources/tts/tts.ts +146 -128
- package/src/resources/voice-changer.ts +2 -2
- package/src/resources/voices.ts +105 -38
- package/src/version.ts +1 -1
- package/version.d.mts +1 -1
- package/version.d.ts +1 -1
- package/version.js +1 -1
- package/version.mjs +1 -1
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"pronunciation-dicts.mjs","sourceRoot":"","sources":["../src/resources/pronunciation-dicts.ts"],"names":[],"mappings":"AAAA,sFAAsF;OAE/E,EAAE,WAAW,EAAE;OAEf,EAAE,YAAY,EAAwC;OACtD,EAAE,YAAY,EAAE;OAEhB,EAAE,IAAI,EAAE;AAEf,MAAM,OAAO,kBAAmB,SAAQ,WAAW;IACjD;;OAEG;IACH,MAAM,CAAC,IAAmC,EAAE,OAAwB;QAClE,OAAO,IAAI,CAAC,OAAO,CAAC,IAAI,CAAC,uBAAuB,EAAE,EAAE,IAAI,EAAE,GAAG,OAAO,EAAE,CAAC,CAAC;IAC1E,CAAC;IAED;;OAEG;IACH,QAAQ,CAAC,EAAU,EAAE,OAAwB;QAC3C,OAAO,IAAI,CAAC,OAAO,CAAC,GAAG,CAAC,IAAI,CAAA,wBAAwB,EAAE,EAAE,EAAE,OAAO,CAAC,CAAC;IACrE,CAAC;IAED;;OAEG;IACH,MAAM,CACJ,EAAU,EACV,IAAmC,EACnC,OAAwB;QAExB,OAAO,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,IAAI,CAAA,wBAAwB,EAAE,EAAE,EAAE,EAAE,IAAI,EAAE,GAAG,OAAO,EAAE,CAAC,CAAC;IACpF,CAAC;IAED;;OAEG;IACH,IAAI,CACF,QAAwD,EAAE,EAC1D,OAAwB;QAExB,OAAO,IAAI,CAAC,OAAO,CAAC,UAAU,CAAC,uBAAuB,EAAE,CAAA,YAA+B,CAAA,EAAE;YACvF,KAAK;YACL,GAAG,OAAO;SACX,CAAC,CAAC;IACL,CAAC;IAED;;OAEG;IACH,MAAM,CAAC,EAAU,EAAE,OAAwB;QACzC,OAAO,IAAI,CAAC,OAAO,CAAC,MAAM,CAAC,IAAI,CAAA,wBAAwB,EAAE,EAAE,EAAE;YAC3D,GAAG,OAAO;YACV,OAAO,EAAE,YAAY,CAAC,CAAC,EAAE,MAAM,EAAE,KAAK,EAAE,EAAE,OAAO,EAAE,OAAO,CAAC,CAAC;SAC7D,CAAC,CAAC;IACL,CAAC;
|
|
1
|
+
{"version":3,"file":"pronunciation-dicts.mjs","sourceRoot":"","sources":["../src/resources/pronunciation-dicts.ts"],"names":[],"mappings":"AAAA,sFAAsF;OAE/E,EAAE,WAAW,EAAE;OAEf,EAAE,YAAY,EAAwC;OACtD,EAAE,YAAY,EAAE;OAEhB,EAAE,IAAI,EAAE;AAEf,MAAM,OAAO,kBAAmB,SAAQ,WAAW;IACjD;;OAEG;IACH,MAAM,CAAC,IAAmC,EAAE,OAAwB;QAClE,OAAO,IAAI,CAAC,OAAO,CAAC,IAAI,CAAC,uBAAuB,EAAE,EAAE,IAAI,EAAE,GAAG,OAAO,EAAE,CAAC,CAAC;IAC1E,CAAC;IAED;;OAEG;IACH,QAAQ,CAAC,EAAU,EAAE,OAAwB;QAC3C,OAAO,IAAI,CAAC,OAAO,CAAC,GAAG,CAAC,IAAI,CAAA,wBAAwB,EAAE,EAAE,EAAE,OAAO,CAAC,CAAC;IACrE,CAAC;IAED;;OAEG;IACH,MAAM,CACJ,EAAU,EACV,IAAmC,EACnC,OAAwB;QAExB,OAAO,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,IAAI,CAAA,wBAAwB,EAAE,EAAE,EAAE,EAAE,IAAI,EAAE,GAAG,OAAO,EAAE,CAAC,CAAC;IACpF,CAAC;IAED;;OAEG;IACH,IAAI,CACF,QAAwD,EAAE,EAC1D,OAAwB;QAExB,OAAO,IAAI,CAAC,OAAO,CAAC,UAAU,CAAC,uBAAuB,EAAE,CAAA,YAA+B,CAAA,EAAE;YACvF,KAAK;YACL,GAAG,OAAO;SACX,CAAC,CAAC;IACL,CAAC;IAED;;OAEG;IACH,MAAM,CAAC,EAAU,EAAE,OAAwB;QACzC,OAAO,IAAI,CAAC,OAAO,CAAC,MAAM,CAAC,IAAI,CAAA,wBAAwB,EAAE,EAAE,EAAE;YAC3D,GAAG,OAAO;YACV,OAAO,EAAE,YAAY,CAAC,CAAC,EAAE,MAAM,EAAE,KAAK,EAAE,EAAE,OAAO,EAAE,OAAO,CAAC,CAAC;SAC7D,CAAC,CAAC;IACL,CAAC;CACF"}
|
package/resources/stt.d.mts
CHANGED
|
@@ -86,111 +86,8 @@ export interface SttTranscribeParams {
|
|
|
86
86
|
/**
|
|
87
87
|
* Body param: The language of the input audio in ISO-639-1 format. Defaults to
|
|
88
88
|
* `en`.
|
|
89
|
-
*
|
|
90
|
-
* <Accordion title="Supported languages">
|
|
91
|
-
* - `en` (English)
|
|
92
|
-
* - `zh` (Chinese)
|
|
93
|
-
* - `de` (German)
|
|
94
|
-
* - `es` (Spanish)
|
|
95
|
-
* - `ru` (Russian)
|
|
96
|
-
* - `ko` (Korean)
|
|
97
|
-
* - `fr` (French)
|
|
98
|
-
* - `ja` (Japanese)
|
|
99
|
-
* - `pt` (Portuguese)
|
|
100
|
-
* - `tr` (Turkish)
|
|
101
|
-
* - `pl` (Polish)
|
|
102
|
-
* - `ca` (Catalan)
|
|
103
|
-
* - `nl` (Dutch)
|
|
104
|
-
* - `ar` (Arabic)
|
|
105
|
-
* - `sv` (Swedish)
|
|
106
|
-
* - `it` (Italian)
|
|
107
|
-
* - `id` (Indonesian)
|
|
108
|
-
* - `hi` (Hindi)
|
|
109
|
-
* - `fi` (Finnish)
|
|
110
|
-
* - `vi` (Vietnamese)
|
|
111
|
-
* - `he` (Hebrew)
|
|
112
|
-
* - `uk` (Ukrainian)
|
|
113
|
-
* - `el` (Greek)
|
|
114
|
-
* - `ms` (Malay)
|
|
115
|
-
* - `cs` (Czech)
|
|
116
|
-
* - `ro` (Romanian)
|
|
117
|
-
* - `da` (Danish)
|
|
118
|
-
* - `hu` (Hungarian)
|
|
119
|
-
* - `ta` (Tamil)
|
|
120
|
-
* - `no` (Norwegian)
|
|
121
|
-
* - `th` (Thai)
|
|
122
|
-
* - `ur` (Urdu)
|
|
123
|
-
* - `hr` (Croatian)
|
|
124
|
-
* - `bg` (Bulgarian)
|
|
125
|
-
* - `lt` (Lithuanian)
|
|
126
|
-
* - `la` (Latin)
|
|
127
|
-
* - `mi` (Maori)
|
|
128
|
-
* - `ml` (Malayalam)
|
|
129
|
-
* - `cy` (Welsh)
|
|
130
|
-
* - `sk` (Slovak)
|
|
131
|
-
* - `te` (Telugu)
|
|
132
|
-
* - `fa` (Persian)
|
|
133
|
-
* - `lv` (Latvian)
|
|
134
|
-
* - `bn` (Bengali)
|
|
135
|
-
* - `sr` (Serbian)
|
|
136
|
-
* - `az` (Azerbaijani)
|
|
137
|
-
* - `sl` (Slovenian)
|
|
138
|
-
* - `kn` (Kannada)
|
|
139
|
-
* - `et` (Estonian)
|
|
140
|
-
* - `mk` (Macedonian)
|
|
141
|
-
* - `br` (Breton)
|
|
142
|
-
* - `eu` (Basque)
|
|
143
|
-
* - `is` (Icelandic)
|
|
144
|
-
* - `hy` (Armenian)
|
|
145
|
-
* - `ne` (Nepali)
|
|
146
|
-
* - `mn` (Mongolian)
|
|
147
|
-
* - `bs` (Bosnian)
|
|
148
|
-
* - `kk` (Kazakh)
|
|
149
|
-
* - `sq` (Albanian)
|
|
150
|
-
* - `sw` (Swahili)
|
|
151
|
-
* - `gl` (Galician)
|
|
152
|
-
* - `mr` (Marathi)
|
|
153
|
-
* - `pa` (Punjabi)
|
|
154
|
-
* - `si` (Sinhala)
|
|
155
|
-
* - `km` (Khmer)
|
|
156
|
-
* - `sn` (Shona)
|
|
157
|
-
* - `yo` (Yoruba)
|
|
158
|
-
* - `so` (Somali)
|
|
159
|
-
* - `af` (Afrikaans)
|
|
160
|
-
* - `oc` (Occitan)
|
|
161
|
-
* - `ka` (Georgian)
|
|
162
|
-
* - `be` (Belarusian)
|
|
163
|
-
* - `tg` (Tajik)
|
|
164
|
-
* - `sd` (Sindhi)
|
|
165
|
-
* - `gu` (Gujarati)
|
|
166
|
-
* - `am` (Amharic)
|
|
167
|
-
* - `yi` (Yiddish)
|
|
168
|
-
* - `lo` (Lao)
|
|
169
|
-
* - `uz` (Uzbek)
|
|
170
|
-
* - `fo` (Faroese)
|
|
171
|
-
* - `ht` (Haitian Creole)
|
|
172
|
-
* - `ps` (Pashto)
|
|
173
|
-
* - `tk` (Turkmen)
|
|
174
|
-
* - `nn` (Nynorsk)
|
|
175
|
-
* - `mt` (Maltese)
|
|
176
|
-
* - `sa` (Sanskrit)
|
|
177
|
-
* - `lb` (Luxembourgish)
|
|
178
|
-
* - `my` (Myanmar)
|
|
179
|
-
* - `bo` (Tibetan)
|
|
180
|
-
* - `tl` (Tagalog)
|
|
181
|
-
* - `mg` (Malagasy)
|
|
182
|
-
* - `as` (Assamese)
|
|
183
|
-
* - `tt` (Tatar)
|
|
184
|
-
* - `haw` (Hawaiian)
|
|
185
|
-
* - `ln` (Lingala)
|
|
186
|
-
* - `ha` (Hausa)
|
|
187
|
-
* - `ba` (Bashkir)
|
|
188
|
-
* - `jw` (Javanese)
|
|
189
|
-
* - `su` (Sundanese)
|
|
190
|
-
* - `yue` (Cantonese)
|
|
191
|
-
* </Accordion>
|
|
192
89
|
*/
|
|
193
|
-
language?:
|
|
90
|
+
language?: 'en' | 'zh' | 'de' | 'es' | 'ru' | 'ko' | 'fr' | 'ja' | 'pt' | 'tr' | 'pl' | 'ca' | 'nl' | 'ar' | 'sv' | 'it' | 'id' | 'hi' | 'fi' | 'vi' | 'he' | 'uk' | 'el' | 'ms' | 'cs' | 'ro' | 'da' | 'hu' | 'ta' | 'no' | 'th' | 'ur' | 'hr' | 'bg' | 'lt' | 'la' | 'mi' | 'ml' | 'cy' | 'sk' | 'te' | 'fa' | 'lv' | 'bn' | 'sr' | 'az' | 'sl' | 'kn' | 'et' | 'mk' | 'br' | 'eu' | 'is' | 'hy' | 'ne' | 'mn' | 'bs' | 'kk' | 'sq' | 'sw' | 'gl' | 'mr' | 'pa' | 'si' | 'km' | 'sn' | 'yo' | 'so' | 'af' | 'oc' | 'ka' | 'be' | 'tg' | 'sd' | 'gu' | 'am' | 'yi' | 'lo' | 'uz' | 'fo' | 'ht' | 'ps' | 'tk' | 'nn' | 'mt' | 'sa' | 'lb' | 'my' | 'bo' | 'tl' | 'mg' | 'as' | 'tt' | 'haw' | 'ln' | 'ha' | 'ba' | 'jw' | 'su' | 'yue' | null;
|
|
194
91
|
/**
|
|
195
92
|
* Body param: ID of the model to use for transcription. Use `ink-whisper` for the
|
|
196
93
|
* latest Cartesia Whisper model.
|
package/resources/stt.d.mts.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"stt.d.mts","sourceRoot":"","sources":["../src/resources/stt.ts"],"names":[],"mappings":"OAEO,EAAE,WAAW,EAAE;OACf,EAAE,UAAU,EAAE;OACd,EAAE,KAAK,UAAU,EAAE;OACnB,EAAE,cAAc,EAAE;AAGzB,qBAAa,GAAI,SAAQ,WAAW;IAClC;;;;;;;;;;;;;;;;;;OAkBG;IACH,UAAU,CAAC,MAAM,EAAE,mBAAmB,EAAE,OAAO,CAAC,EAAE,cAAc,GAAG,UAAU,CAAC,qBAAqB,CAAC;CAOrG;AAED,MAAM,WAAW,qBAAqB;IACpC;;OAEG;IACH,IAAI,EAAE,MAAM,CAAC;IAEb;;OAEG;IACH,QAAQ,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAEzB;;OAEG;IACH,QAAQ,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAEzB;;;OAGG;IACH,KAAK,CAAC,EAAE,KAAK,CAAC,qBAAqB,CAAC,IAAI,CAAC,GAAG,IAAI,CAAC;CAClD;AAED,yBAAiB,qBAAqB,CAAC;IACrC,UAAiB,IAAI;QACnB;;WAEG;QACH,GAAG,EAAE,MAAM,CAAC;QAEZ;;WAEG;QACH,KAAK,EAAE,MAAM,CAAC;QAEd;;WAEG;QACH,IAAI,EAAE,MAAM,CAAC;KACd;CACF;AAED,MAAM,WAAW,mBAAmB;IAClC;;;;;;;;;;;;;OAaG;IACH,QAAQ,CAAC,EAAE,WAAW,GAAG,WAAW,GAAG,WAAW,GAAG,WAAW,GAAG,WAAW,GAAG,UAAU,GAAG,IAAI,CAAC;IAEnG;;OAEG;IACH,WAAW,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAE5B;;OAEG;IACH,IAAI,CAAC,EAAE,UAAU,CAAC;IAElB
|
|
1
|
+
{"version":3,"file":"stt.d.mts","sourceRoot":"","sources":["../src/resources/stt.ts"],"names":[],"mappings":"OAEO,EAAE,WAAW,EAAE;OACf,EAAE,UAAU,EAAE;OACd,EAAE,KAAK,UAAU,EAAE;OACnB,EAAE,cAAc,EAAE;AAGzB,qBAAa,GAAI,SAAQ,WAAW;IAClC;;;;;;;;;;;;;;;;;;OAkBG;IACH,UAAU,CAAC,MAAM,EAAE,mBAAmB,EAAE,OAAO,CAAC,EAAE,cAAc,GAAG,UAAU,CAAC,qBAAqB,CAAC;CAOrG;AAED,MAAM,WAAW,qBAAqB;IACpC;;OAEG;IACH,IAAI,EAAE,MAAM,CAAC;IAEb;;OAEG;IACH,QAAQ,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAEzB;;OAEG;IACH,QAAQ,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAEzB;;;OAGG;IACH,KAAK,CAAC,EAAE,KAAK,CAAC,qBAAqB,CAAC,IAAI,CAAC,GAAG,IAAI,CAAC;CAClD;AAED,yBAAiB,qBAAqB,CAAC;IACrC,UAAiB,IAAI;QACnB;;WAEG;QACH,GAAG,EAAE,MAAM,CAAC;QAEZ;;WAEG;QACH,KAAK,EAAE,MAAM,CAAC;QAEd;;WAEG;QACH,IAAI,EAAE,MAAM,CAAC;KACd;CACF;AAED,MAAM,WAAW,mBAAmB;IAClC;;;;;;;;;;;;;OAaG;IACH,QAAQ,CAAC,EAAE,WAAW,GAAG,WAAW,GAAG,WAAW,GAAG,WAAW,GAAG,WAAW,GAAG,UAAU,GAAG,IAAI,CAAC;IAEnG;;OAEG;IACH,WAAW,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAE5B;;OAEG;IACH,IAAI,CAAC,EAAE,UAAU,CAAC;IAElB;;;OAGG;IACH,QAAQ,CAAC,EACL,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,KAAK,GACL,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,KAAK,GACL,IAAI,CAAC;IAET;;;OAGG;IACH,KAAK,CAAC,EAAE,MAAM,CAAC;IAEf;;;OAGG;IACH,uBAAuB,CAAC,EAAE,KAAK,CAAC,MAAM,CAAC,GAAG,IAAI,CAAC;CAChD;AAED,MAAM,CAAC,OAAO,WAAW,GAAG,CAAC;IAC3B,OAAO,EACL,KAAK,qBAAqB,IAAI,qBAAqB,EACnD,KAAK,mBAAmB,IAAI,mBAAmB,GAChD,CAAC;CACH"}
|
package/resources/stt.d.ts
CHANGED
|
@@ -86,111 +86,8 @@ export interface SttTranscribeParams {
|
|
|
86
86
|
/**
|
|
87
87
|
* Body param: The language of the input audio in ISO-639-1 format. Defaults to
|
|
88
88
|
* `en`.
|
|
89
|
-
*
|
|
90
|
-
* <Accordion title="Supported languages">
|
|
91
|
-
* - `en` (English)
|
|
92
|
-
* - `zh` (Chinese)
|
|
93
|
-
* - `de` (German)
|
|
94
|
-
* - `es` (Spanish)
|
|
95
|
-
* - `ru` (Russian)
|
|
96
|
-
* - `ko` (Korean)
|
|
97
|
-
* - `fr` (French)
|
|
98
|
-
* - `ja` (Japanese)
|
|
99
|
-
* - `pt` (Portuguese)
|
|
100
|
-
* - `tr` (Turkish)
|
|
101
|
-
* - `pl` (Polish)
|
|
102
|
-
* - `ca` (Catalan)
|
|
103
|
-
* - `nl` (Dutch)
|
|
104
|
-
* - `ar` (Arabic)
|
|
105
|
-
* - `sv` (Swedish)
|
|
106
|
-
* - `it` (Italian)
|
|
107
|
-
* - `id` (Indonesian)
|
|
108
|
-
* - `hi` (Hindi)
|
|
109
|
-
* - `fi` (Finnish)
|
|
110
|
-
* - `vi` (Vietnamese)
|
|
111
|
-
* - `he` (Hebrew)
|
|
112
|
-
* - `uk` (Ukrainian)
|
|
113
|
-
* - `el` (Greek)
|
|
114
|
-
* - `ms` (Malay)
|
|
115
|
-
* - `cs` (Czech)
|
|
116
|
-
* - `ro` (Romanian)
|
|
117
|
-
* - `da` (Danish)
|
|
118
|
-
* - `hu` (Hungarian)
|
|
119
|
-
* - `ta` (Tamil)
|
|
120
|
-
* - `no` (Norwegian)
|
|
121
|
-
* - `th` (Thai)
|
|
122
|
-
* - `ur` (Urdu)
|
|
123
|
-
* - `hr` (Croatian)
|
|
124
|
-
* - `bg` (Bulgarian)
|
|
125
|
-
* - `lt` (Lithuanian)
|
|
126
|
-
* - `la` (Latin)
|
|
127
|
-
* - `mi` (Maori)
|
|
128
|
-
* - `ml` (Malayalam)
|
|
129
|
-
* - `cy` (Welsh)
|
|
130
|
-
* - `sk` (Slovak)
|
|
131
|
-
* - `te` (Telugu)
|
|
132
|
-
* - `fa` (Persian)
|
|
133
|
-
* - `lv` (Latvian)
|
|
134
|
-
* - `bn` (Bengali)
|
|
135
|
-
* - `sr` (Serbian)
|
|
136
|
-
* - `az` (Azerbaijani)
|
|
137
|
-
* - `sl` (Slovenian)
|
|
138
|
-
* - `kn` (Kannada)
|
|
139
|
-
* - `et` (Estonian)
|
|
140
|
-
* - `mk` (Macedonian)
|
|
141
|
-
* - `br` (Breton)
|
|
142
|
-
* - `eu` (Basque)
|
|
143
|
-
* - `is` (Icelandic)
|
|
144
|
-
* - `hy` (Armenian)
|
|
145
|
-
* - `ne` (Nepali)
|
|
146
|
-
* - `mn` (Mongolian)
|
|
147
|
-
* - `bs` (Bosnian)
|
|
148
|
-
* - `kk` (Kazakh)
|
|
149
|
-
* - `sq` (Albanian)
|
|
150
|
-
* - `sw` (Swahili)
|
|
151
|
-
* - `gl` (Galician)
|
|
152
|
-
* - `mr` (Marathi)
|
|
153
|
-
* - `pa` (Punjabi)
|
|
154
|
-
* - `si` (Sinhala)
|
|
155
|
-
* - `km` (Khmer)
|
|
156
|
-
* - `sn` (Shona)
|
|
157
|
-
* - `yo` (Yoruba)
|
|
158
|
-
* - `so` (Somali)
|
|
159
|
-
* - `af` (Afrikaans)
|
|
160
|
-
* - `oc` (Occitan)
|
|
161
|
-
* - `ka` (Georgian)
|
|
162
|
-
* - `be` (Belarusian)
|
|
163
|
-
* - `tg` (Tajik)
|
|
164
|
-
* - `sd` (Sindhi)
|
|
165
|
-
* - `gu` (Gujarati)
|
|
166
|
-
* - `am` (Amharic)
|
|
167
|
-
* - `yi` (Yiddish)
|
|
168
|
-
* - `lo` (Lao)
|
|
169
|
-
* - `uz` (Uzbek)
|
|
170
|
-
* - `fo` (Faroese)
|
|
171
|
-
* - `ht` (Haitian Creole)
|
|
172
|
-
* - `ps` (Pashto)
|
|
173
|
-
* - `tk` (Turkmen)
|
|
174
|
-
* - `nn` (Nynorsk)
|
|
175
|
-
* - `mt` (Maltese)
|
|
176
|
-
* - `sa` (Sanskrit)
|
|
177
|
-
* - `lb` (Luxembourgish)
|
|
178
|
-
* - `my` (Myanmar)
|
|
179
|
-
* - `bo` (Tibetan)
|
|
180
|
-
* - `tl` (Tagalog)
|
|
181
|
-
* - `mg` (Malagasy)
|
|
182
|
-
* - `as` (Assamese)
|
|
183
|
-
* - `tt` (Tatar)
|
|
184
|
-
* - `haw` (Hawaiian)
|
|
185
|
-
* - `ln` (Lingala)
|
|
186
|
-
* - `ha` (Hausa)
|
|
187
|
-
* - `ba` (Bashkir)
|
|
188
|
-
* - `jw` (Javanese)
|
|
189
|
-
* - `su` (Sundanese)
|
|
190
|
-
* - `yue` (Cantonese)
|
|
191
|
-
* </Accordion>
|
|
192
89
|
*/
|
|
193
|
-
language?:
|
|
90
|
+
language?: 'en' | 'zh' | 'de' | 'es' | 'ru' | 'ko' | 'fr' | 'ja' | 'pt' | 'tr' | 'pl' | 'ca' | 'nl' | 'ar' | 'sv' | 'it' | 'id' | 'hi' | 'fi' | 'vi' | 'he' | 'uk' | 'el' | 'ms' | 'cs' | 'ro' | 'da' | 'hu' | 'ta' | 'no' | 'th' | 'ur' | 'hr' | 'bg' | 'lt' | 'la' | 'mi' | 'ml' | 'cy' | 'sk' | 'te' | 'fa' | 'lv' | 'bn' | 'sr' | 'az' | 'sl' | 'kn' | 'et' | 'mk' | 'br' | 'eu' | 'is' | 'hy' | 'ne' | 'mn' | 'bs' | 'kk' | 'sq' | 'sw' | 'gl' | 'mr' | 'pa' | 'si' | 'km' | 'sn' | 'yo' | 'so' | 'af' | 'oc' | 'ka' | 'be' | 'tg' | 'sd' | 'gu' | 'am' | 'yi' | 'lo' | 'uz' | 'fo' | 'ht' | 'ps' | 'tk' | 'nn' | 'mt' | 'sa' | 'lb' | 'my' | 'bo' | 'tl' | 'mg' | 'as' | 'tt' | 'haw' | 'ln' | 'ha' | 'ba' | 'jw' | 'su' | 'yue' | null;
|
|
194
91
|
/**
|
|
195
92
|
* Body param: ID of the model to use for transcription. Use `ink-whisper` for the
|
|
196
93
|
* latest Cartesia Whisper model.
|
package/resources/stt.d.ts.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"stt.d.ts","sourceRoot":"","sources":["../src/resources/stt.ts"],"names":[],"mappings":"OAEO,EAAE,WAAW,EAAE;OACf,EAAE,UAAU,EAAE;OACd,EAAE,KAAK,UAAU,EAAE;OACnB,EAAE,cAAc,EAAE;AAGzB,qBAAa,GAAI,SAAQ,WAAW;IAClC;;;;;;;;;;;;;;;;;;OAkBG;IACH,UAAU,CAAC,MAAM,EAAE,mBAAmB,EAAE,OAAO,CAAC,EAAE,cAAc,GAAG,UAAU,CAAC,qBAAqB,CAAC;CAOrG;AAED,MAAM,WAAW,qBAAqB;IACpC;;OAEG;IACH,IAAI,EAAE,MAAM,CAAC;IAEb;;OAEG;IACH,QAAQ,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAEzB;;OAEG;IACH,QAAQ,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAEzB;;;OAGG;IACH,KAAK,CAAC,EAAE,KAAK,CAAC,qBAAqB,CAAC,IAAI,CAAC,GAAG,IAAI,CAAC;CAClD;AAED,yBAAiB,qBAAqB,CAAC;IACrC,UAAiB,IAAI;QACnB;;WAEG;QACH,GAAG,EAAE,MAAM,CAAC;QAEZ;;WAEG;QACH,KAAK,EAAE,MAAM,CAAC;QAEd;;WAEG;QACH,IAAI,EAAE,MAAM,CAAC;KACd;CACF;AAED,MAAM,WAAW,mBAAmB;IAClC;;;;;;;;;;;;;OAaG;IACH,QAAQ,CAAC,EAAE,WAAW,GAAG,WAAW,GAAG,WAAW,GAAG,WAAW,GAAG,WAAW,GAAG,UAAU,GAAG,IAAI,CAAC;IAEnG;;OAEG;IACH,WAAW,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAE5B;;OAEG;IACH,IAAI,CAAC,EAAE,UAAU,CAAC;IAElB
|
|
1
|
+
{"version":3,"file":"stt.d.ts","sourceRoot":"","sources":["../src/resources/stt.ts"],"names":[],"mappings":"OAEO,EAAE,WAAW,EAAE;OACf,EAAE,UAAU,EAAE;OACd,EAAE,KAAK,UAAU,EAAE;OACnB,EAAE,cAAc,EAAE;AAGzB,qBAAa,GAAI,SAAQ,WAAW;IAClC;;;;;;;;;;;;;;;;;;OAkBG;IACH,UAAU,CAAC,MAAM,EAAE,mBAAmB,EAAE,OAAO,CAAC,EAAE,cAAc,GAAG,UAAU,CAAC,qBAAqB,CAAC;CAOrG;AAED,MAAM,WAAW,qBAAqB;IACpC;;OAEG;IACH,IAAI,EAAE,MAAM,CAAC;IAEb;;OAEG;IACH,QAAQ,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAEzB;;OAEG;IACH,QAAQ,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAEzB;;;OAGG;IACH,KAAK,CAAC,EAAE,KAAK,CAAC,qBAAqB,CAAC,IAAI,CAAC,GAAG,IAAI,CAAC;CAClD;AAED,yBAAiB,qBAAqB,CAAC;IACrC,UAAiB,IAAI;QACnB;;WAEG;QACH,GAAG,EAAE,MAAM,CAAC;QAEZ;;WAEG;QACH,KAAK,EAAE,MAAM,CAAC;QAEd;;WAEG;QACH,IAAI,EAAE,MAAM,CAAC;KACd;CACF;AAED,MAAM,WAAW,mBAAmB;IAClC;;;;;;;;;;;;;OAaG;IACH,QAAQ,CAAC,EAAE,WAAW,GAAG,WAAW,GAAG,WAAW,GAAG,WAAW,GAAG,WAAW,GAAG,UAAU,GAAG,IAAI,CAAC;IAEnG;;OAEG;IACH,WAAW,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAE5B;;OAEG;IACH,IAAI,CAAC,EAAE,UAAU,CAAC;IAElB;;;OAGG;IACH,QAAQ,CAAC,EACL,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,KAAK,GACL,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,IAAI,GACJ,KAAK,GACL,IAAI,CAAC;IAET;;;OAGG;IACH,KAAK,CAAC,EAAE,MAAM,CAAC;IAEf;;;OAGG;IACH,uBAAuB,CAAC,EAAE,KAAK,CAAC,MAAM,CAAC,GAAG,IAAI,CAAC;CAChD;AAED,MAAM,CAAC,OAAO,WAAW,GAAG,CAAC;IAC3B,OAAO,EACL,KAAK,qBAAqB,IAAI,qBAAqB,EACnD,KAAK,mBAAmB,IAAI,mBAAmB,GAChD,CAAC;CACH"}
|
package/resources/tts/tts.d.mts
CHANGED
|
@@ -15,39 +15,28 @@ export declare class TTS extends APIResource {
|
|
|
15
15
|
generateSse(body: TTSGenerateSseParams, options?: RequestOptions): APIPromise<void>;
|
|
16
16
|
}
|
|
17
17
|
/**
|
|
18
|
-
* Configure the various attributes of the generated speech. These
|
|
19
|
-
*
|
|
18
|
+
* Configure the various attributes of the generated speech. These are only for
|
|
19
|
+
* `sonic-3` and have no effect on earlier models.
|
|
20
|
+
*
|
|
21
|
+
* See
|
|
22
|
+
* [Volume, Speed, and Emotion in Sonic-3](/build-with-cartesia/sonic-3/volume-speed-emotion)
|
|
23
|
+
* for a guide on this option.
|
|
20
24
|
*/
|
|
21
25
|
export interface GenerationConfig {
|
|
22
26
|
/**
|
|
23
|
-
*
|
|
24
|
-
*/
|
|
25
|
-
experimental?: GenerationConfig.Experimental | null;
|
|
26
|
-
/**
|
|
27
|
-
* Adjust the speed of the generated speech between -1.0 (slower) and 1.0 (faster).
|
|
28
|
-
* 0.0 is the default speed.
|
|
27
|
+
* Guide the emotion of the generated speech.
|
|
29
28
|
*/
|
|
30
|
-
|
|
29
|
+
emotion?: 'neutral' | 'happy' | 'excited' | 'enthusiastic' | 'elated' | 'euphoric' | 'triumphant' | 'amazed' | 'surprised' | 'flirtatious' | 'curious' | 'content' | 'peaceful' | 'serene' | 'calm' | 'grateful' | 'affectionate' | 'trust' | 'sympathetic' | 'anticipation' | 'mysterious' | 'angry' | 'mad' | 'outraged' | 'frustrated' | 'agitated' | 'threatened' | 'disgusted' | 'contempt' | 'envious' | 'sarcastic' | 'ironic' | 'sad' | 'dejected' | 'melancholic' | 'disappointed' | 'hurt' | 'guilty' | 'bored' | 'tired' | 'rejected' | 'nostalgic' | 'wistful' | 'apologetic' | 'hesitant' | 'insecure' | 'confused' | 'resigned' | 'anxious' | 'panicked' | 'alarmed' | 'scared' | 'proud' | 'confident' | 'distant' | 'skeptical' | 'contemplative' | 'determined';
|
|
31
30
|
/**
|
|
32
|
-
* Adjust the
|
|
33
|
-
* (
|
|
31
|
+
* Adjust the speed of the generated speech between 0.6x and 1.5x the original
|
|
32
|
+
* speed (default is 1.0x). Valid values are between [0.6, 1.5] inclusive.
|
|
34
33
|
*/
|
|
35
|
-
|
|
36
|
-
}
|
|
37
|
-
export declare namespace GenerationConfig {
|
|
34
|
+
speed?: number;
|
|
38
35
|
/**
|
|
39
|
-
*
|
|
36
|
+
* Adjust the volume of the generated speech between 0.5x and 2.0x the original
|
|
37
|
+
* volume (default is 1.0x). Valid values are between [0.5, 2.0] inclusive.
|
|
40
38
|
*/
|
|
41
|
-
|
|
42
|
-
/**
|
|
43
|
-
* Toggle accent localization: 0 (disabled, default) or 1 (enabled). When enabled,
|
|
44
|
-
* the voice adapts to match the transcript language's accent while preserving
|
|
45
|
-
* vocal characteristics. When disabled, maintains the original voice accent. For
|
|
46
|
-
* more information, see
|
|
47
|
-
* [Localize Voices](/build-with-sonic/capabilities/localize-voices).
|
|
48
|
-
*/
|
|
49
|
-
accent_localization?: number | null;
|
|
50
|
-
}
|
|
39
|
+
volume?: number;
|
|
51
40
|
}
|
|
52
41
|
export interface GenerationRequest {
|
|
53
42
|
/**
|
|
@@ -86,27 +75,27 @@ export interface GenerationRequest {
|
|
|
86
75
|
* defaults to `false`.
|
|
87
76
|
*/
|
|
88
77
|
continue?: boolean | null;
|
|
89
|
-
/**
|
|
90
|
-
* The maximum duration of the audio in seconds. You do not usually need to specify
|
|
91
|
-
* this. If the duration is not appropriate for the length of the transcript, the
|
|
92
|
-
* output audio may be truncated.
|
|
93
|
-
*/
|
|
94
|
-
duration?: number | null;
|
|
95
78
|
/**
|
|
96
79
|
* Whether to flush the context.
|
|
97
80
|
*/
|
|
98
81
|
flush?: boolean | null;
|
|
99
82
|
/**
|
|
100
|
-
*
|
|
83
|
+
* Configure the various attributes of the generated speech. These are only for
|
|
84
|
+
* `sonic-3` and have no effect on earlier models.
|
|
101
85
|
*
|
|
102
|
-
*
|
|
103
|
-
*
|
|
104
|
-
*
|
|
86
|
+
* See
|
|
87
|
+
* [Volume, Speed, and Emotion in Sonic-3](/build-with-cartesia/sonic-3/volume-speed-emotion)
|
|
88
|
+
* for a guide on this option.
|
|
105
89
|
*/
|
|
106
|
-
|
|
90
|
+
generation_config?: GenerationConfig;
|
|
91
|
+
/**
|
|
92
|
+
* The language that the given voice should speak the transcript in. For valid
|
|
93
|
+
* options, see [Models](/build-with-cartesia/tts-models).
|
|
94
|
+
*/
|
|
95
|
+
language?: VoicesAPI.SupportedLanguage;
|
|
107
96
|
/**
|
|
108
97
|
* The maximum time in milliseconds to buffer text before starting generation.
|
|
109
|
-
* Values between [0,
|
|
98
|
+
* Values between [0, 5000]ms are supported. Defaults to 3000ms.
|
|
110
99
|
*
|
|
111
100
|
* When set, the model will buffer incoming text chunks until it's confident it has
|
|
112
101
|
* enough context to generate high-quality speech, or the buffer delay elapses,
|
|
@@ -118,21 +107,17 @@ export interface GenerationRequest {
|
|
|
118
107
|
*/
|
|
119
108
|
max_buffer_delay_ms?: number | null;
|
|
120
109
|
/**
|
|
121
|
-
*
|
|
122
|
-
*
|
|
123
|
-
* element of the list. If there are conflicts with dict items, the latest dict
|
|
124
|
-
* will take precedence.
|
|
110
|
+
* The ID of a pronunciation dictionary to use for the generation. Pronunciation
|
|
111
|
+
* dictionaries are supported by `sonic-3` models and newer.
|
|
125
112
|
*/
|
|
126
|
-
|
|
113
|
+
pronunciation_dict_id?: string | null;
|
|
127
114
|
/**
|
|
128
|
-
*
|
|
129
|
-
*
|
|
130
|
-
*
|
|
131
|
-
*
|
|
132
|
-
* Influences the speed of the generated speech. Faster speeds may reduce
|
|
133
|
-
* hallucination rate.
|
|
115
|
+
* @deprecated Use `generation_config.speed` for sonic-3. Speed setting for the
|
|
116
|
+
* model. Defaults to `normal`. This feature is experimental and may not work for
|
|
117
|
+
* all voices. Influences the speed of the generated speech. Faster speeds may
|
|
118
|
+
* reduce hallucination rate.
|
|
134
119
|
*/
|
|
135
|
-
speed?: ModelSpeed
|
|
120
|
+
speed?: ModelSpeed;
|
|
136
121
|
/**
|
|
137
122
|
* Whether to use normalized timestamps (True) or original timestamps (False).
|
|
138
123
|
*/
|
|
@@ -142,21 +127,19 @@ export declare namespace GenerationRequest {
|
|
|
142
127
|
interface OutputFormat {
|
|
143
128
|
container: 'raw';
|
|
144
129
|
encoding: InfillAPI.RawEncoding;
|
|
145
|
-
sample_rate:
|
|
130
|
+
sample_rate: 8000 | 16000 | 22050 | 24000 | 44100 | 48000;
|
|
146
131
|
}
|
|
147
132
|
}
|
|
148
133
|
/**
|
|
149
|
-
*
|
|
150
|
-
*
|
|
151
|
-
*
|
|
152
|
-
*
|
|
153
|
-
* Influences the speed of the generated speech. Faster speeds may reduce
|
|
154
|
-
* hallucination rate.
|
|
134
|
+
* @deprecated Use `generation_config.speed` for sonic-3. Speed setting for the
|
|
135
|
+
* model. Defaults to `normal`. This feature is experimental and may not work for
|
|
136
|
+
* all voices. Influences the speed of the generated speech. Faster speeds may
|
|
137
|
+
* reduce hallucination rate.
|
|
155
138
|
*/
|
|
156
139
|
export type ModelSpeed = 'slow' | 'normal' | 'fast';
|
|
157
140
|
export interface RawOutputFormat {
|
|
158
141
|
encoding: InfillAPI.RawEncoding;
|
|
159
|
-
sample_rate:
|
|
142
|
+
sample_rate: 8000 | 16000 | 22050 | 24000 | 44100 | 48000;
|
|
160
143
|
}
|
|
161
144
|
export interface VoiceSpecifier {
|
|
162
145
|
/**
|
|
@@ -189,11 +172,8 @@ export declare namespace WebsocketClientEvent {
|
|
|
189
172
|
export type WebsocketResponse = WebsocketResponse.Chunk | WebsocketResponse.FlushDone | WebsocketResponse.Done | WebsocketResponse.Timestamps | WebsocketResponse.Error | WebsocketResponse.PhonemeTimestamps;
|
|
190
173
|
export declare namespace WebsocketResponse {
|
|
191
174
|
interface Chunk {
|
|
192
|
-
data: string;
|
|
193
175
|
done: boolean;
|
|
194
176
|
status_code: number;
|
|
195
|
-
step_time: number;
|
|
196
|
-
type: 'chunk';
|
|
197
177
|
/**
|
|
198
178
|
* A unique identifier for the context. You can use any unique identifier, like a
|
|
199
179
|
* UUID or human ID.
|
|
@@ -202,6 +182,7 @@ export declare namespace WebsocketResponse {
|
|
|
202
182
|
* conversation IDs) as context IDs.
|
|
203
183
|
*/
|
|
204
184
|
context_id?: string | null;
|
|
185
|
+
type?: 'chunk';
|
|
205
186
|
}
|
|
206
187
|
interface FlushDone {
|
|
207
188
|
done: boolean;
|
|
@@ -279,45 +260,36 @@ export interface TTSGenerateParams {
|
|
|
279
260
|
transcript: string;
|
|
280
261
|
voice: VoiceSpecifier;
|
|
281
262
|
/**
|
|
282
|
-
*
|
|
283
|
-
*
|
|
284
|
-
*
|
|
263
|
+
* Configure the various attributes of the generated speech. These are only for
|
|
264
|
+
* `sonic-3` and have no effect on earlier models.
|
|
265
|
+
*
|
|
266
|
+
* See
|
|
267
|
+
* [Volume, Speed, and Emotion in Sonic-3](/build-with-cartesia/sonic-3/volume-speed-emotion)
|
|
268
|
+
* for a guide on this option.
|
|
285
269
|
*/
|
|
286
|
-
|
|
270
|
+
generation_config?: GenerationConfig;
|
|
287
271
|
/**
|
|
288
|
-
*
|
|
289
|
-
*
|
|
290
|
-
*/
|
|
291
|
-
generation_config?: GenerationConfig | null;
|
|
292
|
-
/**
|
|
293
|
-
* The language that the given voice should speak the transcript in.
|
|
294
|
-
*
|
|
295
|
-
* Options: English (en), French (fr), German (de), Spanish (es), Portuguese (pt),
|
|
296
|
-
* Chinese (zh), Japanese (ja), Hindi (hi), Italian (it), Korean (ko), Dutch (nl),
|
|
297
|
-
* Polish (pl), Russian (ru), Swedish (sv), Turkish (tr).
|
|
272
|
+
* The language that the given voice should speak the transcript in. For valid
|
|
273
|
+
* options, see [Models](/build-with-cartesia/tts-models).
|
|
298
274
|
*/
|
|
299
275
|
language?: VoicesAPI.SupportedLanguage | null;
|
|
300
276
|
/**
|
|
301
|
-
*
|
|
302
|
-
*
|
|
303
|
-
* element of the list. If there are conflicts with dict items, the latest dict
|
|
304
|
-
* will take precedence.
|
|
277
|
+
* The ID of a pronunciation dictionary to use for the generation. Pronunciation
|
|
278
|
+
* dictionaries are supported by `sonic-3` models and newer.
|
|
305
279
|
*/
|
|
306
|
-
|
|
280
|
+
pronunciation_dict_id?: string | null;
|
|
307
281
|
/**
|
|
308
282
|
* Whether to save the generated audio file. When true, the response will include a
|
|
309
283
|
* `Cartesia-File-ID` header.
|
|
310
284
|
*/
|
|
311
285
|
save?: boolean | null;
|
|
312
286
|
/**
|
|
313
|
-
*
|
|
314
|
-
*
|
|
315
|
-
*
|
|
316
|
-
*
|
|
317
|
-
* Influences the speed of the generated speech. Faster speeds may reduce
|
|
318
|
-
* hallucination rate.
|
|
287
|
+
* @deprecated Use `generation_config.speed` for sonic-3. Speed setting for the
|
|
288
|
+
* model. Defaults to `normal`. This feature is experimental and may not work for
|
|
289
|
+
* all voices. Influences the speed of the generated speech. Faster speeds may
|
|
290
|
+
* reduce hallucination rate.
|
|
319
291
|
*/
|
|
320
|
-
speed?: ModelSpeed
|
|
292
|
+
speed?: ModelSpeed;
|
|
321
293
|
}
|
|
322
294
|
export declare namespace TTSGenerateParams {
|
|
323
295
|
interface RawOutputFormat extends TTSAPI.RawOutputFormat {
|
|
@@ -327,12 +299,8 @@ export declare namespace TTSGenerateParams {
|
|
|
327
299
|
container?: 'wav';
|
|
328
300
|
}
|
|
329
301
|
interface MP3OutputFormat {
|
|
330
|
-
|
|
331
|
-
|
|
332
|
-
* 64000, 96000, 128000, 192000.
|
|
333
|
-
*/
|
|
334
|
-
bit_rate: number;
|
|
335
|
-
sample_rate: number;
|
|
302
|
+
bit_rate: 32000 | 64000 | 96000 | 128000 | 192000;
|
|
303
|
+
sample_rate: 8000 | 16000 | 22050 | 24000 | 44100 | 48000;
|
|
336
304
|
container?: 'mp3';
|
|
337
305
|
}
|
|
338
306
|
}
|
|
@@ -362,35 +330,31 @@ export interface TTSGenerateSseParams {
|
|
|
362
330
|
*/
|
|
363
331
|
context_id?: string | null;
|
|
364
332
|
/**
|
|
365
|
-
*
|
|
366
|
-
*
|
|
367
|
-
*
|
|
333
|
+
* Configure the various attributes of the generated speech. These are only for
|
|
334
|
+
* `sonic-3` and have no effect on earlier models.
|
|
335
|
+
*
|
|
336
|
+
* See
|
|
337
|
+
* [Volume, Speed, and Emotion in Sonic-3](/build-with-cartesia/sonic-3/volume-speed-emotion)
|
|
338
|
+
* for a guide on this option.
|
|
368
339
|
*/
|
|
369
|
-
|
|
340
|
+
generation_config?: GenerationConfig;
|
|
370
341
|
/**
|
|
371
|
-
* The language that the given voice should speak the transcript in.
|
|
372
|
-
*
|
|
373
|
-
* Options: English (en), French (fr), German (de), Spanish (es), Portuguese (pt),
|
|
374
|
-
* Chinese (zh), Japanese (ja), Hindi (hi), Italian (it), Korean (ko), Dutch (nl),
|
|
375
|
-
* Polish (pl), Russian (ru), Swedish (sv), Turkish (tr).
|
|
342
|
+
* The language that the given voice should speak the transcript in. For valid
|
|
343
|
+
* options, see [Models](/build-with-cartesia/tts-models).
|
|
376
344
|
*/
|
|
377
|
-
language?: VoicesAPI.SupportedLanguage
|
|
345
|
+
language?: VoicesAPI.SupportedLanguage;
|
|
378
346
|
/**
|
|
379
|
-
*
|
|
380
|
-
*
|
|
381
|
-
* element of the list. If there are conflicts with dict items, the latest dict
|
|
382
|
-
* will take precedence.
|
|
347
|
+
* The ID of a pronunciation dictionary to use for the generation. Pronunciation
|
|
348
|
+
* dictionaries are supported by `sonic-3` models and newer.
|
|
383
349
|
*/
|
|
384
|
-
|
|
350
|
+
pronunciation_dict_id?: string | null;
|
|
385
351
|
/**
|
|
386
|
-
*
|
|
387
|
-
*
|
|
388
|
-
*
|
|
389
|
-
*
|
|
390
|
-
* Influences the speed of the generated speech. Faster speeds may reduce
|
|
391
|
-
* hallucination rate.
|
|
352
|
+
* @deprecated Use `generation_config.speed` for sonic-3. Speed setting for the
|
|
353
|
+
* model. Defaults to `normal`. This feature is experimental and may not work for
|
|
354
|
+
* all voices. Influences the speed of the generated speech. Faster speeds may
|
|
355
|
+
* reduce hallucination rate.
|
|
392
356
|
*/
|
|
393
|
-
speed?: ModelSpeed
|
|
357
|
+
speed?: ModelSpeed;
|
|
394
358
|
/**
|
|
395
359
|
* Whether to use normalized timestamps (True) or original timestamps (False).
|
|
396
360
|
*/
|
|
@@ -400,7 +364,7 @@ export declare namespace TTSGenerateSseParams {
|
|
|
400
364
|
interface OutputFormat {
|
|
401
365
|
container: 'raw';
|
|
402
366
|
encoding: InfillAPI.RawEncoding;
|
|
403
|
-
sample_rate:
|
|
367
|
+
sample_rate: 8000 | 16000 | 22050 | 24000 | 44100 | 48000;
|
|
404
368
|
}
|
|
405
369
|
}
|
|
406
370
|
export declare namespace TTS {
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"tts.d.mts","sourceRoot":"","sources":["../../src/resources/tts/tts.ts"],"names":[],"mappings":"OAEO,EAAE,WAAW,EAAE;OACf,KAAK,MAAM;OACX,KAAK,SAAS;OACd,KAAK,SAAS;OACd,EAAE,UAAU,EAAE;OAEd,EAAE,cAAc,EAAE;AAEzB,qBAAa,GAAI,SAAQ,WAAW;IAClC;;OAEG;IACH,QAAQ,CAAC,IAAI,EAAE,iBAAiB,EAAE,OAAO,CAAC,EAAE,cAAc,GAAG,UAAU,CAAC,QAAQ,CAAC;IASjF;;OAEG;IACH,WAAW,CAAC,IAAI,EAAE,oBAAoB,EAAE,OAAO,CAAC,EAAE,cAAc,GAAG,UAAU,CAAC,IAAI,CAAC;CAOpF;AAED
|
|
1
|
+
{"version":3,"file":"tts.d.mts","sourceRoot":"","sources":["../../src/resources/tts/tts.ts"],"names":[],"mappings":"OAEO,EAAE,WAAW,EAAE;OACf,KAAK,MAAM;OACX,KAAK,SAAS;OACd,KAAK,SAAS;OACd,EAAE,UAAU,EAAE;OAEd,EAAE,cAAc,EAAE;AAEzB,qBAAa,GAAI,SAAQ,WAAW;IAClC;;OAEG;IACH,QAAQ,CAAC,IAAI,EAAE,iBAAiB,EAAE,OAAO,CAAC,EAAE,cAAc,GAAG,UAAU,CAAC,QAAQ,CAAC;IASjF;;OAEG;IACH,WAAW,CAAC,IAAI,EAAE,oBAAoB,EAAE,OAAO,CAAC,EAAE,cAAc,GAAG,UAAU,CAAC,IAAI,CAAC;CAOpF;AAED;;;;;;;GAOG;AACH,MAAM,WAAW,gBAAgB;IAC/B;;OAEG;IACH,OAAO,CAAC,EACJ,SAAS,GACT,OAAO,GACP,SAAS,GACT,cAAc,GACd,QAAQ,GACR,UAAU,GACV,YAAY,GACZ,QAAQ,GACR,WAAW,GACX,aAAa,GACb,SAAS,GACT,SAAS,GACT,UAAU,GACV,QAAQ,GACR,MAAM,GACN,UAAU,GACV,cAAc,GACd,OAAO,GACP,aAAa,GACb,cAAc,GACd,YAAY,GACZ,OAAO,GACP,KAAK,GACL,UAAU,GACV,YAAY,GACZ,UAAU,GACV,YAAY,GACZ,WAAW,GACX,UAAU,GACV,SAAS,GACT,WAAW,GACX,QAAQ,GACR,KAAK,GACL,UAAU,GACV,aAAa,GACb,cAAc,GACd,MAAM,GACN,QAAQ,GACR,OAAO,GACP,OAAO,GACP,UAAU,GACV,WAAW,GACX,SAAS,GACT,YAAY,GACZ,UAAU,GACV,UAAU,GACV,UAAU,GACV,UAAU,GACV,SAAS,GACT,UAAU,GACV,SAAS,GACT,QAAQ,GACR,OAAO,GACP,WAAW,GACX,SAAS,GACT,WAAW,GACX,eAAe,GACf,YAAY,CAAC;IAEjB;;;OAGG;IACH,KAAK,CAAC,EAAE,MAAM,CAAC;IAEf;;;OAGG;IACH,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AAED,MAAM,WAAW,iBAAiB;IAChC;;;OAGG;IACH,QAAQ,EAAE,MAAM,CAAC;IAEjB,aAAa,EAAE,iBAAiB,CAAC,YAAY,CAAC;IAE9C;;OAEG;IACH,UAAU,EAAE,MAAM,CAAC;IAEnB,KAAK,EAAE,cAAc,CAAC;IAEtB;;;;OAIG;IACH,sBAAsB,CAAC,EAAE,OAAO,GAAG,IAAI,CAAC;IAExC;;;;OAIG;IACH,cAAc,CAAC,EAAE,OAAO,GAAG,IAAI,CAAC;IAEhC;;;;;;OAMG;IACH,UAAU,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAE3B;;;OAGG;IACH,QAAQ,CAAC,EAAE,OAAO,GAAG,IAAI,CAAC;IAE1B;;OAEG;IACH,KAAK,CAAC,EAAE,OAAO,GAAG,IAAI,CAAC;IAEvB;;;;;;;OAOG;IACH,iBAAiB,CAAC,EAAE,gBAAgB,CAAC;IAErC;;;OAGG;IACH,QAAQ,CAAC,EAAE,SAAS,CAAC,iBAAiB,CAAC;IAEvC;;;;;;;;;;;OAWG;IACH,mBAAmB,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAEpC;;;OAGG;IACH,qBAAqB,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAEtC;;;;;OAKG;IACH,KAAK,CAAC,EAAE,UAAU,CAAC;IAEnB;;OAEG;IACH,yBAAyB,CAAC,EAAE,OAAO,GAAG,IAAI,CAAC;CAC5C;AAED,yBAAiB,iBAAiB,CAAC;IACjC,UAAiB,YAAY;QAC3B,SAAS,EAAE,KAAK,CAAC;QAEjB,QAAQ,EAAE,SAAS,CAAC,WAAW,CAAC;QAEhC,WAAW,EAAE,IAAI,GAAG,KAAK,GAAG,KAAK,GAAG,KAAK,GAAG,KAAK,GAAG,KAAK,CAAC;KAC3D;CACF;AAED;;;;;GAKG;AACH,MAAM,MAAM,UAAU,GAAG,MAAM,GAAG,QAAQ,GAAG,MAAM,CAAC;AAEpD,MAAM,WAAW,eAAe;IAC9B,QAAQ,EAAE,SAAS,CAAC,WAAW,CAAC;IAEhC,WAAW,EAAE,IAAI,GAAG,KAAK,GAAG,KAAK,GAAG,KAAK,GAAG,KAAK,GAAG,KAAK,CAAC;CAC3D;AAED,MAAM,WAAW,cAAc;IAC7B;;OAEG;IACH,EAAE,EAAE,MAAM,CAAC;IAEX,IAAI,EAAE,IAAI,CAAC;CACZ;AAED;;GAEG;AACH,MAAM,MAAM,oBAAoB,GAAG,iBAAiB,GAAG,oBAAoB,CAAC,oBAAoB,CAAC;AAEjG,yBAAiB,oBAAoB,CAAC;IACpC;;;OAGG;IACH,UAAiB,oBAAoB;QACnC;;;WAGG;QACH,MAAM,EAAE,IAAI,CAAC;QAEb;;WAEG;QACH,UAAU,EAAE,MAAM,CAAC;KACpB;CACF;AAED,MAAM,MAAM,iBAAiB,GACzB,iBAAiB,CAAC,KAAK,GACvB,iBAAiB,CAAC,SAAS,GAC3B,iBAAiB,CAAC,IAAI,GACtB,iBAAiB,CAAC,UAAU,GAC5B,iBAAiB,CAAC,KAAK,GACvB,iBAAiB,CAAC,iBAAiB,CAAC;AAExC,yBAAiB,iBAAiB,CAAC;IACjC,UAAiB,KAAK;QACpB,IAAI,EAAE,OAAO,CAAC;QAEd,WAAW,EAAE,MAAM,CAAC;QAEpB;;;;;;WAMG;QACH,UAAU,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;QAE3B,IAAI,CAAC,EAAE,OAAO,CAAC;KAChB;IAED,UAAiB,SAAS;QACxB,IAAI,EAAE,OAAO,CAAC;QAEd,WAAW,EAAE,MAAM,CAAC;QAEpB;;;;;;WAMG;QACH,UAAU,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;QAE3B,IAAI,CAAC,EAAE,YAAY,CAAC;KACrB;IAED,UAAiB,IAAI;QACnB,IAAI,EAAE,OAAO,CAAC;QAEd,WAAW,EAAE,MAAM,CAAC;QAEpB;;;;;;WAMG;QACH,UAAU,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;QAE3B,IAAI,CAAC,EAAE,MAAM,CAAC;KACf;IAED,UAAiB,UAAU;QACzB,IAAI,EAAE,OAAO,CAAC;QAEd,WAAW,EAAE,MAAM,CAAC;QAEpB;;;;;;WAMG;QACH,UAAU,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;QAE3B,IAAI,CAAC,EAAE,YAAY,CAAC;KACrB;IAED,UAAiB,KAAK;QACpB,IAAI,EAAE,OAAO,CAAC;QAEd,WAAW,EAAE,MAAM,CAAC;QAEpB;;;;;;WAMG;QACH,UAAU,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;QAE3B,IAAI,CAAC,EAAE,OAAO,CAAC;KAChB;IAED,UAAiB,iBAAiB;QAChC,IAAI,EAAE,OAAO,CAAC;QAEd,WAAW,EAAE,MAAM,CAAC;QAEpB;;;;;;WAMG;QACH,UAAU,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;QAE3B,IAAI,CAAC,EAAE,oBAAoB,CAAC;KAC7B;CACF;AAED,MAAM,WAAW,iBAAiB;IAChC;;;OAGG;IACH,QAAQ,EAAE,MAAM,CAAC;IAEjB,aAAa,EACT,iBAAiB,CAAC,eAAe,GACjC,iBAAiB,CAAC,eAAe,GACjC,iBAAiB,CAAC,eAAe,CAAC;IAEtC,UAAU,EAAE,MAAM,CAAC;IAEnB,KAAK,EAAE,cAAc,CAAC;IAEtB;;;;;;;OAOG;IACH,iBAAiB,CAAC,EAAE,gBAAgB,CAAC;IAErC;;;OAGG;IACH,QAAQ,CAAC,EAAE,SAAS,CAAC,iBAAiB,GAAG,IAAI,CAAC;IAE9C;;;OAGG;IACH,qBAAqB,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAEtC;;;OAGG;IACH,IAAI,CAAC,EAAE,OAAO,GAAG,IAAI,CAAC;IAEtB;;;;;OAKG;IACH,KAAK,CAAC,EAAE,UAAU,CAAC;CACpB;AAED,yBAAiB,iBAAiB,CAAC;IACjC,UAAiB,eAAgB,SAAQ,MAAM,CAAC,eAAe;QAC7D,SAAS,CAAC,EAAE,KAAK,CAAC;KACnB;IAED,UAAiB,eAAgB,SAAQ,MAAM,CAAC,eAAe;QAC7D,SAAS,CAAC,EAAE,KAAK,CAAC;KACnB;IAED,UAAiB,eAAe;QAC9B,QAAQ,EAAE,KAAK,GAAG,KAAK,GAAG,KAAK,GAAG,MAAM,GAAG,MAAM,CAAC;QAElD,WAAW,EAAE,IAAI,GAAG,KAAK,GAAG,KAAK,GAAG,KAAK,GAAG,KAAK,GAAG,KAAK,CAAC;QAE1D,SAAS,CAAC,EAAE,KAAK,CAAC;KACnB;CACF;AAED,MAAM,WAAW,oBAAoB;IACnC;;;OAGG;IACH,QAAQ,EAAE,MAAM,CAAC;IAEjB,aAAa,EAAE,oBAAoB,CAAC,YAAY,CAAC;IAEjD,UAAU,EAAE,MAAM,CAAC;IAEnB,KAAK,EAAE,cAAc,CAAC;IAEtB;;;;OAIG;IACH,sBAAsB,CAAC,EAAE,OAAO,GAAG,IAAI,CAAC;IAExC;;;;OAIG;IACH,cAAc,CAAC,EAAE,OAAO,GAAG,IAAI,CAAC;IAEhC;;OAEG;IACH,UAAU,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAE3B;;;;;;;OAOG;IACH,iBAAiB,CAAC,EAAE,gBAAgB,CAAC;IAErC;;;OAGG;IACH,QAAQ,CAAC,EAAE,SAAS,CAAC,iBAAiB,CAAC;IAEvC;;;OAGG;IACH,qBAAqB,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;IAEtC;;;;;OAKG;IACH,KAAK,CAAC,EAAE,UAAU,CAAC;IAEnB;;OAEG;IACH,yBAAyB,CAAC,EAAE,OAAO,GAAG,IAAI,CAAC;CAC5C;AAED,yBAAiB,oBAAoB,CAAC;IACpC,UAAiB,YAAY;QAC3B,SAAS,EAAE,KAAK,CAAC;QAEjB,QAAQ,EAAE,SAAS,CAAC,WAAW,CAAC;QAEhC,WAAW,EAAE,IAAI,GAAG,KAAK,GAAG,KAAK,GAAG,KAAK,GAAG,KAAK,GAAG,KAAK,CAAC;KAC3D;CACF;AAED,MAAM,CAAC,OAAO,WAAW,GAAG,CAAC;IAC3B,OAAO,EACL,KAAK,gBAAgB,IAAI,gBAAgB,EACzC,KAAK,iBAAiB,IAAI,iBAAiB,EAC3C,KAAK,UAAU,IAAI,UAAU,EAC7B,KAAK,eAAe,IAAI,eAAe,EACvC,KAAK,cAAc,IAAI,cAAc,EACrC,KAAK,oBAAoB,IAAI,oBAAoB,EACjD,KAAK,iBAAiB,IAAI,iBAAiB,EAC3C,KAAK,iBAAiB,IAAI,iBAAiB,EAC3C,KAAK,oBAAoB,IAAI,oBAAoB,GAClD,CAAC;CACH"}
|