@livekit/agents 1.1.0 → 1.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (959)
  1. package/dist/_exceptions.cjs.map +1 -1
  2. package/dist/_exceptions.d.ts.map +1 -1
  3. package/dist/_exceptions.js.map +1 -1
  4. package/dist/audio.cjs +89 -3
  5. package/dist/audio.cjs.map +1 -1
  6. package/dist/audio.d.cts +36 -1
  7. package/dist/audio.d.ts +36 -1
  8. package/dist/audio.d.ts.map +1 -1
  9. package/dist/audio.js +76 -2
  10. package/dist/audio.js.map +1 -1
  11. package/dist/beta/index.cjs +29 -0
  12. package/dist/beta/index.cjs.map +1 -0
  13. package/dist/beta/index.d.cts +2 -0
  14. package/dist/beta/index.d.ts +2 -0
  15. package/dist/beta/index.d.ts.map +1 -0
  16. package/dist/beta/index.js +7 -0
  17. package/dist/beta/index.js.map +1 -0
  18. package/dist/beta/workflows/index.cjs +29 -0
  19. package/dist/beta/workflows/index.cjs.map +1 -0
  20. package/dist/beta/workflows/index.d.cts +2 -0
  21. package/dist/beta/workflows/index.d.ts +2 -0
  22. package/dist/beta/workflows/index.d.ts.map +1 -0
  23. package/dist/beta/workflows/index.js +7 -0
  24. package/dist/beta/workflows/index.js.map +1 -0
  25. package/dist/beta/workflows/task_group.cjs +165 -0
  26. package/dist/beta/workflows/task_group.cjs.map +1 -0
  27. package/dist/beta/workflows/task_group.d.cts +32 -0
  28. package/dist/beta/workflows/task_group.d.ts +32 -0
  29. package/dist/beta/workflows/task_group.d.ts.map +1 -0
  30. package/dist/beta/workflows/task_group.js +141 -0
  31. package/dist/beta/workflows/task_group.js.map +1 -0
  32. package/dist/cli.cjs +44 -46
  33. package/dist/cli.cjs.map +1 -1
  34. package/dist/cli.d.cts +3 -3
  35. package/dist/cli.d.ts +3 -3
  36. package/dist/cli.d.ts.map +1 -1
  37. package/dist/cli.js +45 -47
  38. package/dist/cli.js.map +1 -1
  39. package/dist/connection_pool.cjs +242 -0
  40. package/dist/connection_pool.cjs.map +1 -0
  41. package/dist/connection_pool.d.cts +123 -0
  42. package/dist/connection_pool.d.ts +123 -0
  43. package/dist/connection_pool.d.ts.map +1 -0
  44. package/dist/connection_pool.js +218 -0
  45. package/dist/connection_pool.js.map +1 -0
  46. package/dist/connection_pool.test.cjs +256 -0
  47. package/dist/connection_pool.test.cjs.map +1 -0
  48. package/dist/connection_pool.test.js +255 -0
  49. package/dist/connection_pool.test.js.map +1 -0
  50. package/dist/constants.cjs +30 -0
  51. package/dist/constants.cjs.map +1 -1
  52. package/dist/constants.d.cts +10 -0
  53. package/dist/constants.d.ts +10 -0
  54. package/dist/constants.d.ts.map +1 -1
  55. package/dist/constants.js +20 -0
  56. package/dist/constants.js.map +1 -1
  57. package/dist/cpu.cjs +189 -0
  58. package/dist/cpu.cjs.map +1 -0
  59. package/dist/cpu.d.cts +24 -0
  60. package/dist/cpu.d.ts +24 -0
  61. package/dist/cpu.d.ts.map +1 -0
  62. package/dist/cpu.js +152 -0
  63. package/dist/cpu.js.map +1 -0
  64. package/dist/cpu.test.cjs +227 -0
  65. package/dist/cpu.test.cjs.map +1 -0
  66. package/dist/cpu.test.js +204 -0
  67. package/dist/cpu.test.js.map +1 -0
  68. package/dist/http_server.cjs +9 -6
  69. package/dist/http_server.cjs.map +1 -1
  70. package/dist/http_server.d.cts +5 -1
  71. package/dist/http_server.d.ts +5 -1
  72. package/dist/http_server.d.ts.map +1 -1
  73. package/dist/http_server.js +9 -6
  74. package/dist/http_server.js.map +1 -1
  75. package/dist/index.cjs +24 -9
  76. package/dist/index.cjs.map +1 -1
  77. package/dist/index.d.cts +15 -11
  78. package/dist/index.d.ts +15 -11
  79. package/dist/index.d.ts.map +1 -1
  80. package/dist/index.js +18 -9
  81. package/dist/index.js.map +1 -1
  82. package/dist/inference/api_protos.cjs +70 -2
  83. package/dist/inference/api_protos.cjs.map +1 -1
  84. package/dist/inference/api_protos.d.cts +373 -32
  85. package/dist/inference/api_protos.d.ts +373 -32
  86. package/dist/inference/api_protos.d.ts.map +1 -1
  87. package/dist/inference/api_protos.js +62 -2
  88. package/dist/inference/api_protos.js.map +1 -1
  89. package/dist/inference/index.cjs +8 -0
  90. package/dist/inference/index.cjs.map +1 -1
  91. package/dist/inference/index.d.cts +3 -4
  92. package/dist/inference/index.d.ts +3 -4
  93. package/dist/inference/index.d.ts.map +1 -1
  94. package/dist/inference/index.js +18 -3
  95. package/dist/inference/index.js.map +1 -1
  96. package/dist/inference/interruption/defaults.cjs +81 -0
  97. package/dist/inference/interruption/defaults.cjs.map +1 -0
  98. package/dist/inference/interruption/defaults.d.cts +19 -0
  99. package/dist/inference/interruption/defaults.d.ts +19 -0
  100. package/dist/inference/interruption/defaults.d.ts.map +1 -0
  101. package/dist/inference/interruption/defaults.js +46 -0
  102. package/dist/inference/interruption/defaults.js.map +1 -0
  103. package/dist/inference/interruption/errors.cjs +44 -0
  104. package/dist/inference/interruption/errors.cjs.map +1 -0
  105. package/dist/inference/interruption/errors.d.cts +12 -0
  106. package/dist/inference/interruption/errors.d.ts +12 -0
  107. package/dist/inference/interruption/errors.d.ts.map +1 -0
  108. package/dist/inference/interruption/errors.js +20 -0
  109. package/dist/inference/interruption/errors.js.map +1 -0
  110. package/dist/inference/interruption/http_transport.cjs +163 -0
  111. package/dist/inference/interruption/http_transport.cjs.map +1 -0
  112. package/dist/inference/interruption/http_transport.d.cts +65 -0
  113. package/dist/inference/interruption/http_transport.d.ts +65 -0
  114. package/dist/inference/interruption/http_transport.d.ts.map +1 -0
  115. package/dist/inference/interruption/http_transport.js +137 -0
  116. package/dist/inference/interruption/http_transport.js.map +1 -0
  117. package/dist/inference/interruption/interruption_cache_entry.cjs +58 -0
  118. package/dist/inference/interruption/interruption_cache_entry.cjs.map +1 -0
  119. package/dist/inference/interruption/interruption_cache_entry.d.cts +30 -0
  120. package/dist/inference/interruption/interruption_cache_entry.d.ts +30 -0
  121. package/dist/inference/interruption/interruption_cache_entry.d.ts.map +1 -0
  122. package/dist/inference/interruption/interruption_cache_entry.js +34 -0
  123. package/dist/inference/interruption/interruption_cache_entry.js.map +1 -0
  124. package/dist/inference/interruption/interruption_detector.cjs +198 -0
  125. package/dist/inference/interruption/interruption_detector.cjs.map +1 -0
  126. package/dist/inference/interruption/interruption_detector.d.cts +59 -0
  127. package/dist/inference/interruption/interruption_detector.d.ts +59 -0
  128. package/dist/inference/interruption/interruption_detector.d.ts.map +1 -0
  129. package/dist/inference/interruption/interruption_detector.js +164 -0
  130. package/dist/inference/interruption/interruption_detector.js.map +1 -0
  131. package/dist/inference/interruption/interruption_stream.cjs +368 -0
  132. package/dist/inference/interruption/interruption_stream.cjs.map +1 -0
  133. package/dist/inference/interruption/interruption_stream.d.cts +46 -0
  134. package/dist/inference/interruption/interruption_stream.d.ts +46 -0
  135. package/dist/inference/interruption/interruption_stream.d.ts.map +1 -0
  136. package/dist/inference/interruption/interruption_stream.js +344 -0
  137. package/dist/inference/interruption/interruption_stream.js.map +1 -0
  138. package/dist/inference/interruption/types.cjs +17 -0
  139. package/dist/inference/interruption/types.cjs.map +1 -0
  140. package/dist/inference/interruption/types.d.cts +66 -0
  141. package/dist/inference/interruption/types.d.ts +66 -0
  142. package/dist/inference/interruption/types.d.ts.map +1 -0
  143. package/dist/inference/interruption/types.js +1 -0
  144. package/dist/inference/interruption/types.js.map +1 -0
  145. package/dist/inference/interruption/utils.cjs +130 -0
  146. package/dist/inference/interruption/utils.cjs.map +1 -0
  147. package/dist/inference/interruption/utils.d.cts +41 -0
  148. package/dist/inference/interruption/utils.d.ts +41 -0
  149. package/dist/inference/interruption/utils.d.ts.map +1 -0
  150. package/dist/inference/interruption/utils.js +105 -0
  151. package/dist/inference/interruption/utils.js.map +1 -0
  152. package/dist/inference/interruption/utils.test.cjs +105 -0
  153. package/dist/inference/interruption/utils.test.cjs.map +1 -0
  154. package/dist/inference/interruption/utils.test.js +104 -0
  155. package/dist/inference/interruption/utils.test.js.map +1 -0
  156. package/dist/inference/interruption/ws_transport.cjs +347 -0
  157. package/dist/inference/interruption/ws_transport.cjs.map +1 -0
  158. package/dist/inference/interruption/ws_transport.d.cts +33 -0
  159. package/dist/inference/interruption/ws_transport.d.ts +33 -0
  160. package/dist/inference/interruption/ws_transport.d.ts.map +1 -0
  161. package/dist/inference/interruption/ws_transport.js +313 -0
  162. package/dist/inference/interruption/ws_transport.js.map +1 -0
  163. package/dist/inference/llm.cjs +106 -66
  164. package/dist/inference/llm.cjs.map +1 -1
  165. package/dist/inference/llm.d.cts +65 -43
  166. package/dist/inference/llm.d.ts +65 -43
  167. package/dist/inference/llm.d.ts.map +1 -1
  168. package/dist/inference/llm.js +100 -66
  169. package/dist/inference/llm.js.map +1 -1
  170. package/dist/inference/stt.cjs +319 -170
  171. package/dist/inference/stt.cjs.map +1 -1
  172. package/dist/inference/stt.d.cts +64 -15
  173. package/dist/inference/stt.d.ts +64 -15
  174. package/dist/inference/stt.d.ts.map +1 -1
  175. package/dist/inference/stt.js +319 -170
  176. package/dist/inference/stt.js.map +1 -1
  177. package/dist/inference/stt.test.cjs +218 -0
  178. package/dist/inference/stt.test.cjs.map +1 -0
  179. package/dist/inference/stt.test.js +217 -0
  180. package/dist/inference/stt.test.js.map +1 -0
  181. package/dist/inference/tts.cjs +249 -71
  182. package/dist/inference/tts.cjs.map +1 -1
  183. package/dist/inference/tts.d.cts +94 -17
  184. package/dist/inference/tts.d.ts +94 -17
  185. package/dist/inference/tts.d.ts.map +1 -1
  186. package/dist/inference/tts.js +249 -77
  187. package/dist/inference/tts.js.map +1 -1
  188. package/dist/inference/tts.test.cjs +305 -0
  189. package/dist/inference/tts.test.cjs.map +1 -0
  190. package/dist/inference/tts.test.js +304 -0
  191. package/dist/inference/tts.test.js.map +1 -0
  192. package/dist/inference/utils.cjs +26 -7
  193. package/dist/inference/utils.cjs.map +1 -1
  194. package/dist/inference/utils.d.cts +14 -1
  195. package/dist/inference/utils.d.ts +14 -1
  196. package/dist/inference/utils.d.ts.map +1 -1
  197. package/dist/inference/utils.js +18 -2
  198. package/dist/inference/utils.js.map +1 -1
  199. package/dist/ipc/inference_proc_executor.cjs +6 -3
  200. package/dist/ipc/inference_proc_executor.cjs.map +1 -1
  201. package/dist/ipc/inference_proc_executor.d.ts.map +1 -1
  202. package/dist/ipc/inference_proc_executor.js +6 -3
  203. package/dist/ipc/inference_proc_executor.js.map +1 -1
  204. package/dist/ipc/inference_proc_lazy_main.cjs +13 -1
  205. package/dist/ipc/inference_proc_lazy_main.cjs.map +1 -1
  206. package/dist/ipc/inference_proc_lazy_main.js +13 -1
  207. package/dist/ipc/inference_proc_lazy_main.js.map +1 -1
  208. package/dist/ipc/job_proc_executor.cjs +6 -1
  209. package/dist/ipc/job_proc_executor.cjs.map +1 -1
  210. package/dist/ipc/job_proc_executor.d.ts.map +1 -1
  211. package/dist/ipc/job_proc_executor.js +6 -1
  212. package/dist/ipc/job_proc_executor.js.map +1 -1
  213. package/dist/ipc/job_proc_lazy_main.cjs +89 -17
  214. package/dist/ipc/job_proc_lazy_main.cjs.map +1 -1
  215. package/dist/ipc/job_proc_lazy_main.js +68 -18
  216. package/dist/ipc/job_proc_lazy_main.js.map +1 -1
  217. package/dist/ipc/supervised_proc.cjs +34 -8
  218. package/dist/ipc/supervised_proc.cjs.map +1 -1
  219. package/dist/ipc/supervised_proc.d.cts +8 -0
  220. package/dist/ipc/supervised_proc.d.ts +8 -0
  221. package/dist/ipc/supervised_proc.d.ts.map +1 -1
  222. package/dist/ipc/supervised_proc.js +34 -8
  223. package/dist/ipc/supervised_proc.js.map +1 -1
  224. package/dist/ipc/supervised_proc.test.cjs +145 -0
  225. package/dist/ipc/supervised_proc.test.cjs.map +1 -0
  226. package/dist/ipc/supervised_proc.test.js +122 -0
  227. package/dist/ipc/supervised_proc.test.js.map +1 -0
  228. package/dist/job.cjs +109 -1
  229. package/dist/job.cjs.map +1 -1
  230. package/dist/job.d.cts +14 -0
  231. package/dist/job.d.ts +14 -0
  232. package/dist/job.d.ts.map +1 -1
  233. package/dist/job.js +99 -1
  234. package/dist/job.js.map +1 -1
  235. package/dist/language.cjs +394 -0
  236. package/dist/language.cjs.map +1 -0
  237. package/dist/language.d.cts +15 -0
  238. package/dist/language.d.ts +15 -0
  239. package/dist/language.d.ts.map +1 -0
  240. package/dist/language.js +363 -0
  241. package/dist/language.js.map +1 -0
  242. package/dist/language.test.cjs +43 -0
  243. package/dist/language.test.cjs.map +1 -0
  244. package/dist/language.test.js +49 -0
  245. package/dist/language.test.js.map +1 -0
  246. package/dist/llm/chat_context.cjs +345 -3
  247. package/dist/llm/chat_context.cjs.map +1 -1
  248. package/dist/llm/chat_context.d.cts +86 -2
  249. package/dist/llm/chat_context.d.ts +86 -2
  250. package/dist/llm/chat_context.d.ts.map +1 -1
  251. package/dist/llm/chat_context.js +344 -3
  252. package/dist/llm/chat_context.js.map +1 -1
  253. package/dist/llm/chat_context.test.cjs +692 -0
  254. package/dist/llm/chat_context.test.cjs.map +1 -1
  255. package/dist/llm/chat_context.test.js +692 -0
  256. package/dist/llm/chat_context.test.js.map +1 -1
  257. package/dist/llm/fallback_adapter.cjs +280 -0
  258. package/dist/llm/fallback_adapter.cjs.map +1 -0
  259. package/dist/llm/fallback_adapter.d.cts +73 -0
  260. package/dist/llm/fallback_adapter.d.ts +73 -0
  261. package/dist/llm/fallback_adapter.d.ts.map +1 -0
  262. package/dist/llm/fallback_adapter.js +256 -0
  263. package/dist/llm/fallback_adapter.js.map +1 -0
  264. package/dist/llm/fallback_adapter.test.cjs +176 -0
  265. package/dist/llm/fallback_adapter.test.cjs.map +1 -0
  266. package/dist/llm/fallback_adapter.test.js +175 -0
  267. package/dist/llm/fallback_adapter.test.js.map +1 -0
  268. package/dist/llm/index.cjs +11 -0
  269. package/dist/llm/index.cjs.map +1 -1
  270. package/dist/llm/index.d.cts +4 -3
  271. package/dist/llm/index.d.ts +4 -3
  272. package/dist/llm/index.d.ts.map +1 -1
  273. package/dist/llm/index.js +13 -1
  274. package/dist/llm/index.js.map +1 -1
  275. package/dist/llm/llm.cjs +65 -11
  276. package/dist/llm/llm.cjs.map +1 -1
  277. package/dist/llm/llm.d.cts +13 -2
  278. package/dist/llm/llm.d.ts +13 -2
  279. package/dist/llm/llm.d.ts.map +1 -1
  280. package/dist/llm/llm.js +65 -11
  281. package/dist/llm/llm.js.map +1 -1
  282. package/dist/llm/provider_format/google.cjs +6 -2
  283. package/dist/llm/provider_format/google.cjs.map +1 -1
  284. package/dist/llm/provider_format/google.d.cts +1 -1
  285. package/dist/llm/provider_format/google.d.ts +1 -1
  286. package/dist/llm/provider_format/google.d.ts.map +1 -1
  287. package/dist/llm/provider_format/google.js +6 -2
  288. package/dist/llm/provider_format/google.js.map +1 -1
  289. package/dist/llm/provider_format/google.test.cjs +48 -0
  290. package/dist/llm/provider_format/google.test.cjs.map +1 -1
  291. package/dist/llm/provider_format/google.test.js +54 -1
  292. package/dist/llm/provider_format/google.test.js.map +1 -1
  293. package/dist/llm/provider_format/index.cjs +2 -0
  294. package/dist/llm/provider_format/index.cjs.map +1 -1
  295. package/dist/llm/provider_format/index.d.cts +2 -2
  296. package/dist/llm/provider_format/index.d.ts +2 -2
  297. package/dist/llm/provider_format/index.d.ts.map +1 -1
  298. package/dist/llm/provider_format/index.js +6 -1
  299. package/dist/llm/provider_format/index.js.map +1 -1
  300. package/dist/llm/provider_format/openai.cjs +126 -24
  301. package/dist/llm/provider_format/openai.cjs.map +1 -1
  302. package/dist/llm/provider_format/openai.d.cts +1 -0
  303. package/dist/llm/provider_format/openai.d.ts +1 -0
  304. package/dist/llm/provider_format/openai.d.ts.map +1 -1
  305. package/dist/llm/provider_format/openai.js +124 -23
  306. package/dist/llm/provider_format/openai.js.map +1 -1
  307. package/dist/llm/provider_format/openai.test.cjs +393 -0
  308. package/dist/llm/provider_format/openai.test.cjs.map +1 -1
  309. package/dist/llm/provider_format/openai.test.js +400 -2
  310. package/dist/llm/provider_format/openai.test.js.map +1 -1
  311. package/dist/llm/provider_format/utils.cjs +5 -4
  312. package/dist/llm/provider_format/utils.cjs.map +1 -1
  313. package/dist/llm/provider_format/utils.d.ts.map +1 -1
  314. package/dist/llm/provider_format/utils.js +5 -4
  315. package/dist/llm/provider_format/utils.js.map +1 -1
  316. package/dist/llm/realtime.cjs +3 -0
  317. package/dist/llm/realtime.cjs.map +1 -1
  318. package/dist/llm/realtime.d.cts +15 -1
  319. package/dist/llm/realtime.d.ts +15 -1
  320. package/dist/llm/realtime.d.ts.map +1 -1
  321. package/dist/llm/realtime.js +3 -0
  322. package/dist/llm/realtime.js.map +1 -1
  323. package/dist/llm/remote_chat_context.cjs.map +1 -1
  324. package/dist/llm/remote_chat_context.d.cts +2 -0
  325. package/dist/llm/remote_chat_context.d.ts +2 -0
  326. package/dist/llm/remote_chat_context.d.ts.map +1 -1
  327. package/dist/llm/remote_chat_context.js.map +1 -1
  328. package/dist/llm/tool_context.cjs +50 -2
  329. package/dist/llm/tool_context.cjs.map +1 -1
  330. package/dist/llm/tool_context.d.cts +47 -11
  331. package/dist/llm/tool_context.d.ts +47 -11
  332. package/dist/llm/tool_context.d.ts.map +1 -1
  333. package/dist/llm/tool_context.js +48 -3
  334. package/dist/llm/tool_context.js.map +1 -1
  335. package/dist/llm/tool_context.test.cjs +197 -0
  336. package/dist/llm/tool_context.test.cjs.map +1 -1
  337. package/dist/llm/tool_context.test.js +175 -0
  338. package/dist/llm/tool_context.test.js.map +1 -1
  339. package/dist/llm/utils.cjs +107 -12
  340. package/dist/llm/utils.cjs.map +1 -1
  341. package/dist/llm/utils.d.cts +10 -3
  342. package/dist/llm/utils.d.ts +10 -3
  343. package/dist/llm/utils.d.ts.map +1 -1
  344. package/dist/llm/utils.js +106 -12
  345. package/dist/llm/utils.js.map +1 -1
  346. package/dist/llm/utils.test.cjs +90 -0
  347. package/dist/llm/utils.test.cjs.map +1 -1
  348. package/dist/llm/utils.test.js +98 -2
  349. package/dist/llm/utils.test.js.map +1 -1
  350. package/dist/llm/zod-utils.cjs +102 -0
  351. package/dist/llm/zod-utils.cjs.map +1 -0
  352. package/dist/llm/zod-utils.d.cts +65 -0
  353. package/dist/llm/zod-utils.d.ts +65 -0
  354. package/dist/llm/zod-utils.d.ts.map +1 -0
  355. package/dist/llm/zod-utils.js +64 -0
  356. package/dist/llm/zod-utils.js.map +1 -0
  357. package/dist/llm/zod-utils.test.cjs +472 -0
  358. package/dist/llm/zod-utils.test.cjs.map +1 -0
  359. package/dist/llm/zod-utils.test.js +455 -0
  360. package/dist/llm/zod-utils.test.js.map +1 -0
  361. package/dist/log.cjs +45 -14
  362. package/dist/log.cjs.map +1 -1
  363. package/dist/log.d.cts +8 -1
  364. package/dist/log.d.ts +8 -1
  365. package/dist/log.d.ts.map +1 -1
  366. package/dist/log.js +45 -15
  367. package/dist/log.js.map +1 -1
  368. package/dist/metrics/base.cjs.map +1 -1
  369. package/dist/metrics/base.d.cts +75 -19
  370. package/dist/metrics/base.d.ts +75 -19
  371. package/dist/metrics/base.d.ts.map +1 -1
  372. package/dist/metrics/index.cjs +5 -0
  373. package/dist/metrics/index.cjs.map +1 -1
  374. package/dist/metrics/index.d.cts +2 -1
  375. package/dist/metrics/index.d.ts +2 -1
  376. package/dist/metrics/index.d.ts.map +1 -1
  377. package/dist/metrics/index.js +6 -0
  378. package/dist/metrics/index.js.map +1 -1
  379. package/dist/metrics/model_usage.cjs +189 -0
  380. package/dist/metrics/model_usage.cjs.map +1 -0
  381. package/dist/metrics/model_usage.d.cts +92 -0
  382. package/dist/metrics/model_usage.d.ts +92 -0
  383. package/dist/metrics/model_usage.d.ts.map +1 -0
  384. package/dist/metrics/model_usage.js +164 -0
  385. package/dist/metrics/model_usage.js.map +1 -0
  386. package/dist/metrics/model_usage.test.cjs +474 -0
  387. package/dist/metrics/model_usage.test.cjs.map +1 -0
  388. package/dist/metrics/model_usage.test.js +476 -0
  389. package/dist/metrics/model_usage.test.js.map +1 -0
  390. package/dist/metrics/usage_collector.cjs +5 -2
  391. package/dist/metrics/usage_collector.cjs.map +1 -1
  392. package/dist/metrics/usage_collector.d.cts +10 -1
  393. package/dist/metrics/usage_collector.d.ts +10 -1
  394. package/dist/metrics/usage_collector.d.ts.map +1 -1
  395. package/dist/metrics/usage_collector.js +5 -2
  396. package/dist/metrics/usage_collector.js.map +1 -1
  397. package/dist/metrics/utils.cjs +23 -7
  398. package/dist/metrics/utils.cjs.map +1 -1
  399. package/dist/metrics/utils.d.ts.map +1 -1
  400. package/dist/metrics/utils.js +23 -7
  401. package/dist/metrics/utils.js.map +1 -1
  402. package/dist/stream/deferred_stream.cjs +31 -10
  403. package/dist/stream/deferred_stream.cjs.map +1 -1
  404. package/dist/stream/deferred_stream.d.cts +6 -1
  405. package/dist/stream/deferred_stream.d.ts +6 -1
  406. package/dist/stream/deferred_stream.d.ts.map +1 -1
  407. package/dist/stream/deferred_stream.js +31 -10
  408. package/dist/stream/deferred_stream.js.map +1 -1
  409. package/dist/stream/deferred_stream.test.cjs +2 -2
  410. package/dist/stream/deferred_stream.test.cjs.map +1 -1
  411. package/dist/stream/deferred_stream.test.js +2 -2
  412. package/dist/stream/deferred_stream.test.js.map +1 -1
  413. package/dist/stream/index.cjs +3 -0
  414. package/dist/stream/index.cjs.map +1 -1
  415. package/dist/stream/index.d.cts +1 -0
  416. package/dist/stream/index.d.ts +1 -0
  417. package/dist/stream/index.d.ts.map +1 -1
  418. package/dist/stream/index.js +2 -0
  419. package/dist/stream/index.js.map +1 -1
  420. package/dist/stream/multi_input_stream.cjs +139 -0
  421. package/dist/stream/multi_input_stream.cjs.map +1 -0
  422. package/dist/stream/multi_input_stream.d.cts +55 -0
  423. package/dist/stream/multi_input_stream.d.ts +55 -0
  424. package/dist/stream/multi_input_stream.d.ts.map +1 -0
  425. package/dist/stream/multi_input_stream.js +115 -0
  426. package/dist/stream/multi_input_stream.js.map +1 -0
  427. package/dist/stream/multi_input_stream.test.cjs +344 -0
  428. package/dist/stream/multi_input_stream.test.cjs.map +1 -0
  429. package/dist/stream/multi_input_stream.test.js +343 -0
  430. package/dist/stream/multi_input_stream.test.js.map +1 -0
  431. package/dist/stream/stream_channel.cjs +39 -1
  432. package/dist/stream/stream_channel.cjs.map +1 -1
  433. package/dist/stream/stream_channel.d.cts +5 -2
  434. package/dist/stream/stream_channel.d.ts +5 -2
  435. package/dist/stream/stream_channel.d.ts.map +1 -1
  436. package/dist/stream/stream_channel.js +39 -1
  437. package/dist/stream/stream_channel.js.map +1 -1
  438. package/dist/stream/stream_channel.test.cjs +27 -0
  439. package/dist/stream/stream_channel.test.cjs.map +1 -1
  440. package/dist/stream/stream_channel.test.js +27 -0
  441. package/dist/stream/stream_channel.test.js.map +1 -1
  442. package/dist/stt/stream_adapter.cjs +24 -9
  443. package/dist/stt/stream_adapter.cjs.map +1 -1
  444. package/dist/stt/stream_adapter.d.cts +7 -3
  445. package/dist/stt/stream_adapter.d.ts +7 -3
  446. package/dist/stt/stream_adapter.d.ts.map +1 -1
  447. package/dist/stt/stream_adapter.js +24 -9
  448. package/dist/stt/stream_adapter.js.map +1 -1
  449. package/dist/stt/stt.cjs +94 -19
  450. package/dist/stt/stt.cjs.map +1 -1
  451. package/dist/stt/stt.d.cts +68 -5
  452. package/dist/stt/stt.d.ts +68 -5
  453. package/dist/stt/stt.d.ts.map +1 -1
  454. package/dist/stt/stt.js +96 -21
  455. package/dist/stt/stt.js.map +1 -1
  456. package/dist/telemetry/index.cjs +72 -0
  457. package/dist/telemetry/index.cjs.map +1 -0
  458. package/dist/telemetry/index.d.cts +7 -0
  459. package/dist/telemetry/index.d.ts +7 -0
  460. package/dist/telemetry/index.d.ts.map +1 -0
  461. package/dist/telemetry/index.js +37 -0
  462. package/dist/telemetry/index.js.map +1 -0
  463. package/dist/telemetry/logging.cjs +65 -0
  464. package/dist/telemetry/logging.cjs.map +1 -0
  465. package/dist/telemetry/logging.d.cts +21 -0
  466. package/dist/telemetry/logging.d.ts +21 -0
  467. package/dist/telemetry/logging.d.ts.map +1 -0
  468. package/dist/telemetry/logging.js +40 -0
  469. package/dist/telemetry/logging.js.map +1 -0
  470. package/dist/telemetry/otel_http_exporter.cjs +166 -0
  471. package/dist/telemetry/otel_http_exporter.cjs.map +1 -0
  472. package/dist/telemetry/otel_http_exporter.d.cts +63 -0
  473. package/dist/telemetry/otel_http_exporter.d.ts +63 -0
  474. package/dist/telemetry/otel_http_exporter.d.ts.map +1 -0
  475. package/dist/telemetry/otel_http_exporter.js +142 -0
  476. package/dist/telemetry/otel_http_exporter.js.map +1 -0
  477. package/dist/telemetry/pino_otel_transport.cjs +217 -0
  478. package/dist/telemetry/pino_otel_transport.cjs.map +1 -0
  479. package/dist/telemetry/pino_otel_transport.d.cts +58 -0
  480. package/dist/telemetry/pino_otel_transport.d.ts +58 -0
  481. package/dist/telemetry/pino_otel_transport.d.ts.map +1 -0
  482. package/dist/telemetry/pino_otel_transport.js +189 -0
  483. package/dist/telemetry/pino_otel_transport.js.map +1 -0
  484. package/dist/telemetry/trace_types.cjs +233 -0
  485. package/dist/telemetry/trace_types.cjs.map +1 -0
  486. package/dist/telemetry/trace_types.d.cts +74 -0
  487. package/dist/telemetry/trace_types.d.ts +74 -0
  488. package/dist/telemetry/trace_types.d.ts.map +1 -0
  489. package/dist/telemetry/trace_types.js +141 -0
  490. package/dist/telemetry/trace_types.js.map +1 -0
  491. package/dist/telemetry/traces.cjs +484 -0
  492. package/dist/telemetry/traces.cjs.map +1 -0
  493. package/dist/telemetry/traces.d.cts +116 -0
  494. package/dist/telemetry/traces.d.ts +116 -0
  495. package/dist/telemetry/traces.d.ts.map +1 -0
  496. package/dist/telemetry/traces.js +449 -0
  497. package/dist/telemetry/traces.js.map +1 -0
  498. package/dist/telemetry/utils.cjs +86 -0
  499. package/dist/telemetry/utils.cjs.map +1 -0
  500. package/dist/telemetry/utils.d.cts +5 -0
  501. package/dist/telemetry/utils.d.ts +5 -0
  502. package/dist/telemetry/utils.d.ts.map +1 -0
  503. package/dist/telemetry/utils.js +51 -0
  504. package/dist/telemetry/utils.js.map +1 -0
  505. package/dist/tokenize/basic/sentence.cjs +3 -3
  506. package/dist/tokenize/basic/sentence.cjs.map +1 -1
  507. package/dist/tokenize/basic/sentence.js +3 -3
  508. package/dist/tokenize/basic/sentence.js.map +1 -1
  509. package/dist/tokenize/tokenizer.test.cjs +3 -1
  510. package/dist/tokenize/tokenizer.test.cjs.map +1 -1
  511. package/dist/tokenize/tokenizer.test.js +3 -1
  512. package/dist/tokenize/tokenizer.test.js.map +1 -1
  513. package/dist/transcription.cjs.map +1 -1
  514. package/dist/transcription.d.cts +6 -0
  515. package/dist/transcription.d.ts +6 -0
  516. package/dist/transcription.d.ts.map +1 -1
  517. package/dist/transcription.js.map +1 -1
  518. package/dist/tts/fallback_adapter.cjs +472 -0
  519. package/dist/tts/fallback_adapter.cjs.map +1 -0
  520. package/dist/tts/fallback_adapter.d.cts +110 -0
  521. package/dist/tts/fallback_adapter.d.ts +110 -0
  522. package/dist/tts/fallback_adapter.d.ts.map +1 -0
  523. package/dist/tts/fallback_adapter.js +448 -0
  524. package/dist/tts/fallback_adapter.js.map +1 -0
  525. package/dist/tts/index.cjs +3 -0
  526. package/dist/tts/index.cjs.map +1 -1
  527. package/dist/tts/index.d.cts +1 -0
  528. package/dist/tts/index.d.ts +1 -0
  529. package/dist/tts/index.d.ts.map +1 -1
  530. package/dist/tts/index.js +2 -0
  531. package/dist/tts/index.js.map +1 -1
  532. package/dist/tts/stream_adapter.cjs +25 -8
  533. package/dist/tts/stream_adapter.cjs.map +1 -1
  534. package/dist/tts/stream_adapter.d.cts +6 -3
  535. package/dist/tts/stream_adapter.d.ts +6 -3
  536. package/dist/tts/stream_adapter.d.ts.map +1 -1
  537. package/dist/tts/stream_adapter.js +25 -8
  538. package/dist/tts/stream_adapter.js.map +1 -1
  539. package/dist/tts/tts.cjs +189 -57
  540. package/dist/tts/tts.cjs.map +1 -1
  541. package/dist/tts/tts.d.cts +58 -6
  542. package/dist/tts/tts.d.ts +58 -6
  543. package/dist/tts/tts.d.ts.map +1 -1
  544. package/dist/tts/tts.js +191 -59
  545. package/dist/tts/tts.js.map +1 -1
  546. package/dist/typed_promise.cjs +48 -0
  547. package/dist/typed_promise.cjs.map +1 -0
  548. package/dist/typed_promise.d.cts +24 -0
  549. package/dist/typed_promise.d.ts +24 -0
  550. package/dist/typed_promise.d.ts.map +1 -0
  551. package/dist/typed_promise.js +28 -0
  552. package/dist/typed_promise.js.map +1 -0
  553. package/dist/types.cjs +24 -32
  554. package/dist/types.cjs.map +1 -1
  555. package/dist/types.d.cts +45 -10
  556. package/dist/types.d.ts +45 -10
  557. package/dist/types.d.ts.map +1 -1
  558. package/dist/types.js +20 -30
  559. package/dist/types.js.map +1 -1
  560. package/dist/utils.cjs +124 -28
  561. package/dist/utils.cjs.map +1 -1
  562. package/dist/utils.d.cts +41 -1
  563. package/dist/utils.d.ts +41 -1
  564. package/dist/utils.d.ts.map +1 -1
  565. package/dist/utils.js +119 -27
  566. package/dist/utils.js.map +1 -1
  567. package/dist/utils.test.cjs +73 -1
  568. package/dist/utils.test.cjs.map +1 -1
  569. package/dist/utils.test.js +74 -10
  570. package/dist/utils.test.js.map +1 -1
  571. package/dist/vad.cjs +35 -15
  572. package/dist/vad.cjs.map +1 -1
  573. package/dist/vad.d.cts +15 -5
  574. package/dist/vad.d.ts +15 -5
  575. package/dist/vad.d.ts.map +1 -1
  576. package/dist/vad.js +35 -15
  577. package/dist/vad.js.map +1 -1
  578. package/dist/version.cjs +1 -1
  579. package/dist/version.cjs.map +1 -1
  580. package/dist/version.d.cts +1 -1
  581. package/dist/version.d.ts +1 -1
  582. package/dist/version.d.ts.map +1 -1
  583. package/dist/version.js +1 -1
  584. package/dist/version.js.map +1 -1
  585. package/dist/voice/agent.cjs +258 -35
  586. package/dist/voice/agent.cjs.map +1 -1
  587. package/dist/voice/agent.d.cts +54 -13
  588. package/dist/voice/agent.d.ts +54 -13
  589. package/dist/voice/agent.d.ts.map +1 -1
  590. package/dist/voice/agent.js +254 -34
  591. package/dist/voice/agent.js.map +1 -1
  592. package/dist/voice/agent.test.cjs +314 -0
  593. package/dist/voice/agent.test.cjs.map +1 -1
  594. package/dist/voice/agent.test.js +316 -2
  595. package/dist/voice/agent.test.js.map +1 -1
  596. package/dist/voice/agent_activity.cjs +1116 -385
  597. package/dist/voice/agent_activity.cjs.map +1 -1
  598. package/dist/voice/agent_activity.d.cts +72 -11
  599. package/dist/voice/agent_activity.d.ts +72 -11
  600. package/dist/voice/agent_activity.d.ts.map +1 -1
  601. package/dist/voice/agent_activity.js +1119 -383
  602. package/dist/voice/agent_activity.js.map +1 -1
  603. package/dist/voice/agent_activity.test.cjs +135 -0
  604. package/dist/voice/agent_activity.test.cjs.map +1 -0
  605. package/dist/voice/agent_activity.test.js +134 -0
  606. package/dist/voice/agent_activity.test.js.map +1 -0
  607. package/dist/voice/agent_session.cjs +550 -90
  608. package/dist/voice/agent_session.cjs.map +1 -1
  609. package/dist/voice/agent_session.d.cts +185 -25
  610. package/dist/voice/agent_session.d.ts +185 -25
  611. package/dist/voice/agent_session.d.ts.map +1 -1
  612. package/dist/voice/agent_session.js +556 -91
  613. package/dist/voice/agent_session.js.map +1 -1
  614. package/dist/voice/audio_recognition.cjs +605 -46
  615. package/dist/voice/audio_recognition.cjs.map +1 -1
  616. package/dist/voice/audio_recognition.d.cts +96 -4
  617. package/dist/voice/audio_recognition.d.ts +96 -4
  618. package/dist/voice/audio_recognition.d.ts.map +1 -1
  619. package/dist/voice/audio_recognition.js +611 -47
  620. package/dist/voice/audio_recognition.js.map +1 -1
  621. package/dist/voice/audio_recognition_span.test.cjs +295 -0
  622. package/dist/voice/audio_recognition_span.test.cjs.map +1 -0
  623. package/dist/voice/audio_recognition_span.test.js +299 -0
  624. package/dist/voice/audio_recognition_span.test.js.map +1 -0
  625. package/dist/voice/avatar/datastream_io.cjs +7 -1
  626. package/dist/voice/avatar/datastream_io.cjs.map +1 -1
  627. package/dist/voice/avatar/datastream_io.d.cts +1 -0
  628. package/dist/voice/avatar/datastream_io.d.ts +1 -0
  629. package/dist/voice/avatar/datastream_io.d.ts.map +1 -1
  630. package/dist/voice/avatar/datastream_io.js +7 -1
  631. package/dist/voice/avatar/datastream_io.js.map +1 -1
  632. package/dist/voice/background_audio.cjs +367 -0
  633. package/dist/voice/background_audio.cjs.map +1 -0
  634. package/dist/voice/background_audio.d.cts +123 -0
  635. package/dist/voice/background_audio.d.ts +123 -0
  636. package/dist/voice/background_audio.d.ts.map +1 -0
  637. package/dist/voice/background_audio.js +343 -0
  638. package/dist/voice/background_audio.js.map +1 -0
  639. package/dist/voice/events.cjs +3 -0
  640. package/dist/voice/events.cjs.map +1 -1
  641. package/dist/voice/events.d.cts +16 -9
  642. package/dist/voice/events.d.ts +16 -9
  643. package/dist/voice/events.d.ts.map +1 -1
  644. package/dist/voice/events.js +3 -0
  645. package/dist/voice/events.js.map +1 -1
  646. package/dist/voice/generation.cjs +205 -41
  647. package/dist/voice/generation.cjs.map +1 -1
  648. package/dist/voice/generation.d.cts +21 -5
  649. package/dist/voice/generation.d.ts +21 -5
  650. package/dist/voice/generation.d.ts.map +1 -1
  651. package/dist/voice/generation.js +215 -43
  652. package/dist/voice/generation.js.map +1 -1
  653. package/dist/voice/generation_tools.test.cjs +236 -0
  654. package/dist/voice/generation_tools.test.cjs.map +1 -0
  655. package/dist/voice/generation_tools.test.js +235 -0
  656. package/dist/voice/generation_tools.test.js.map +1 -0
  657. package/dist/voice/index.cjs +33 -2
  658. package/dist/voice/index.cjs.map +1 -1
  659. package/dist/voice/index.d.cts +8 -2
  660. package/dist/voice/index.d.ts +8 -2
  661. package/dist/voice/index.d.ts.map +1 -1
  662. package/dist/voice/index.js +19 -2
  663. package/dist/voice/index.js.map +1 -1
  664. package/dist/voice/interruption_detection.test.cjs +114 -0
  665. package/dist/voice/interruption_detection.test.cjs.map +1 -0
  666. package/dist/voice/interruption_detection.test.js +113 -0
  667. package/dist/voice/interruption_detection.test.js.map +1 -0
  668. package/dist/voice/io.cjs +66 -6
  669. package/dist/voice/io.cjs.map +1 -1
  670. package/dist/voice/io.d.cts +67 -7
  671. package/dist/voice/io.d.ts +67 -7
  672. package/dist/voice/io.d.ts.map +1 -1
  673. package/dist/voice/io.js +62 -5
  674. package/dist/voice/io.js.map +1 -1
  675. package/dist/voice/recorder_io/index.cjs +23 -0
  676. package/dist/voice/recorder_io/index.cjs.map +1 -0
  677. package/dist/voice/recorder_io/index.d.cts +2 -0
  678. package/dist/voice/recorder_io/index.d.ts +2 -0
  679. package/dist/voice/recorder_io/index.d.ts.map +1 -0
  680. package/dist/voice/recorder_io/index.js +2 -0
  681. package/dist/voice/recorder_io/index.js.map +1 -0
  682. package/dist/voice/recorder_io/recorder_io.cjs +607 -0
  683. package/dist/voice/recorder_io/recorder_io.cjs.map +1 -0
  684. package/dist/voice/recorder_io/recorder_io.d.cts +106 -0
  685. package/dist/voice/recorder_io/recorder_io.d.ts +106 -0
  686. package/dist/voice/recorder_io/recorder_io.d.ts.map +1 -0
  687. package/dist/voice/recorder_io/recorder_io.js +573 -0
  688. package/dist/voice/recorder_io/recorder_io.js.map +1 -0
  689. package/dist/voice/remote_session.cjs +922 -0
  690. package/dist/voice/remote_session.cjs.map +1 -0
  691. package/dist/voice/remote_session.d.cts +108 -0
  692. package/dist/voice/remote_session.d.ts +108 -0
  693. package/dist/voice/remote_session.d.ts.map +1 -0
  694. package/dist/voice/remote_session.js +887 -0
  695. package/dist/voice/remote_session.js.map +1 -0
  696. package/dist/voice/report.cjs +88 -0
  697. package/dist/voice/report.cjs.map +1 -0
  698. package/dist/voice/report.d.cts +49 -0
  699. package/dist/voice/report.d.ts +49 -0
  700. package/dist/voice/report.d.ts.map +1 -0
  701. package/dist/voice/report.js +63 -0
  702. package/dist/voice/report.js.map +1 -0
  703. package/dist/voice/report.test.cjs +121 -0
  704. package/dist/voice/report.test.cjs.map +1 -0
  705. package/dist/voice/report.test.js +120 -0
  706. package/dist/voice/report.test.js.map +1 -0
  707. package/dist/voice/room_io/_input.cjs +40 -7
  708. package/dist/voice/room_io/_input.cjs.map +1 -1
  709. package/dist/voice/room_io/_input.d.cts +5 -2
  710. package/dist/voice/room_io/_input.d.ts +5 -2
  711. package/dist/voice/room_io/_input.d.ts.map +1 -1
  712. package/dist/voice/room_io/_input.js +41 -8
  713. package/dist/voice/room_io/_input.js.map +1 -1
  714. package/dist/voice/room_io/_output.cjs +19 -11
  715. package/dist/voice/room_io/_output.cjs.map +1 -1
  716. package/dist/voice/room_io/_output.d.cts +7 -4
  717. package/dist/voice/room_io/_output.d.ts +7 -4
  718. package/dist/voice/room_io/_output.d.ts.map +1 -1
  719. package/dist/voice/room_io/_output.js +20 -12
  720. package/dist/voice/room_io/_output.js.map +1 -1
  721. package/dist/voice/room_io/room_io.cjs +33 -6
  722. package/dist/voice/room_io/room_io.cjs.map +1 -1
  723. package/dist/voice/room_io/room_io.d.cts +29 -9
  724. package/dist/voice/room_io/room_io.d.ts +29 -9
  725. package/dist/voice/room_io/room_io.d.ts.map +1 -1
  726. package/dist/voice/room_io/room_io.js +33 -7
  727. package/dist/voice/room_io/room_io.js.map +1 -1
  728. package/dist/voice/speech_handle.cjs +22 -4
  729. package/dist/voice/speech_handle.cjs.map +1 -1
  730. package/dist/voice/speech_handle.d.cts +17 -2
  731. package/dist/voice/speech_handle.d.ts +17 -2
  732. package/dist/voice/speech_handle.d.ts.map +1 -1
  733. package/dist/voice/speech_handle.js +21 -4
  734. package/dist/voice/speech_handle.js.map +1 -1
  735. package/dist/voice/testing/fake_llm.cjs +127 -0
  736. package/dist/voice/testing/fake_llm.cjs.map +1 -0
  737. package/dist/voice/testing/fake_llm.d.cts +30 -0
  738. package/dist/voice/testing/fake_llm.d.ts +30 -0
  739. package/dist/voice/testing/fake_llm.d.ts.map +1 -0
  740. package/dist/voice/testing/fake_llm.js +103 -0
  741. package/dist/voice/testing/fake_llm.js.map +1 -0
  742. package/dist/voice/testing/index.cjs +57 -0
  743. package/dist/voice/testing/index.cjs.map +1 -0
  744. package/dist/voice/testing/index.d.cts +21 -0
  745. package/dist/voice/testing/index.d.ts +21 -0
  746. package/dist/voice/testing/index.d.ts.map +1 -0
  747. package/dist/voice/testing/index.js +35 -0
  748. package/dist/voice/testing/index.js.map +1 -0
  749. package/dist/voice/testing/run_result.cjs +817 -0
  750. package/dist/voice/testing/run_result.cjs.map +1 -0
  751. package/dist/voice/testing/run_result.d.cts +385 -0
  752. package/dist/voice/testing/run_result.d.ts +385 -0
  753. package/dist/voice/testing/run_result.d.ts.map +1 -0
  754. package/dist/voice/testing/run_result.js +790 -0
  755. package/dist/voice/testing/run_result.js.map +1 -0
  756. package/dist/voice/testing/types.cjs +46 -0
  757. package/dist/voice/testing/types.cjs.map +1 -0
  758. package/dist/voice/testing/types.d.cts +83 -0
  759. package/dist/voice/testing/types.d.ts +83 -0
  760. package/dist/voice/testing/types.d.ts.map +1 -0
  761. package/dist/voice/testing/types.js +19 -0
  762. package/dist/voice/testing/types.js.map +1 -0
  763. package/dist/voice/transcription/synchronizer.cjs +139 -15
  764. package/dist/voice/transcription/synchronizer.cjs.map +1 -1
  765. package/dist/voice/transcription/synchronizer.d.cts +35 -4
  766. package/dist/voice/transcription/synchronizer.d.ts +35 -4
  767. package/dist/voice/transcription/synchronizer.d.ts.map +1 -1
  768. package/dist/voice/transcription/synchronizer.js +143 -16
  769. package/dist/voice/transcription/synchronizer.js.map +1 -1
  770. package/dist/voice/transcription/synchronizer.test.cjs +151 -0
  771. package/dist/voice/transcription/synchronizer.test.cjs.map +1 -0
  772. package/dist/voice/transcription/synchronizer.test.js +150 -0
  773. package/dist/voice/transcription/synchronizer.test.js.map +1 -0
  774. package/dist/voice/turn_config/endpointing.cjs +33 -0
  775. package/dist/voice/turn_config/endpointing.cjs.map +1 -0
  776. package/dist/voice/turn_config/endpointing.d.cts +30 -0
  777. package/dist/voice/turn_config/endpointing.d.ts +30 -0
  778. package/dist/voice/turn_config/endpointing.d.ts.map +1 -0
  779. package/dist/voice/turn_config/endpointing.js +9 -0
  780. package/dist/voice/turn_config/endpointing.js.map +1 -0
  781. package/dist/voice/turn_config/interruption.cjs +37 -0
  782. package/dist/voice/turn_config/interruption.cjs.map +1 -0
  783. package/dist/voice/turn_config/interruption.d.cts +53 -0
  784. package/dist/voice/turn_config/interruption.d.ts +53 -0
  785. package/dist/voice/turn_config/interruption.d.ts.map +1 -0
  786. package/dist/voice/turn_config/interruption.js +13 -0
  787. package/dist/voice/turn_config/interruption.js.map +1 -0
  788. package/dist/voice/turn_config/turn_handling.cjs +35 -0
  789. package/dist/voice/turn_config/turn_handling.cjs.map +1 -0
  790. package/dist/voice/turn_config/turn_handling.d.cts +36 -0
  791. package/dist/voice/turn_config/turn_handling.d.ts +36 -0
  792. package/dist/voice/turn_config/turn_handling.d.ts.map +1 -0
  793. package/dist/voice/turn_config/turn_handling.js +11 -0
  794. package/dist/voice/turn_config/turn_handling.js.map +1 -0
  795. package/dist/voice/turn_config/utils.cjs +157 -0
  796. package/dist/voice/turn_config/utils.cjs.map +1 -0
  797. package/dist/voice/turn_config/utils.d.cts +37 -0
  798. package/dist/voice/turn_config/utils.d.ts +37 -0
  799. package/dist/voice/turn_config/utils.d.ts.map +1 -0
  800. package/dist/voice/turn_config/utils.js +131 -0
  801. package/dist/voice/turn_config/utils.js.map +1 -0
  802. package/dist/voice/turn_config/utils.test.cjs +128 -0
  803. package/dist/voice/turn_config/utils.test.cjs.map +1 -0
  804. package/dist/voice/turn_config/utils.test.js +127 -0
  805. package/dist/voice/turn_config/utils.test.js.map +1 -0
  806. package/dist/voice/utils.cjs +47 -0
  807. package/dist/voice/utils.cjs.map +1 -0
  808. package/dist/voice/utils.d.cts +4 -0
  809. package/dist/voice/utils.d.ts +4 -0
  810. package/dist/voice/utils.d.ts.map +1 -0
  811. package/dist/voice/utils.js +23 -0
  812. package/dist/voice/utils.js.map +1 -0
  813. package/dist/worker.cjs +44 -52
  814. package/dist/worker.cjs.map +1 -1
  815. package/dist/worker.d.cts +18 -8
  816. package/dist/worker.d.ts +18 -8
  817. package/dist/worker.d.ts.map +1 -1
  818. package/dist/worker.js +43 -43
  819. package/dist/worker.js.map +1 -1
  820. package/package.json +35 -13
  821. package/resources/NOTICE +2 -0
  822. package/resources/keyboard-typing.ogg +0 -0
  823. package/resources/keyboard-typing2.ogg +0 -0
  824. package/resources/office-ambience.ogg +0 -0
  825. package/src/_exceptions.ts +5 -0
  826. package/src/audio.ts +132 -1
  827. package/src/beta/index.ts +9 -0
  828. package/src/beta/workflows/index.ts +9 -0
  829. package/src/beta/workflows/task_group.ts +203 -0
  830. package/src/cli.ts +57 -66
  831. package/src/connection_pool.test.ts +346 -0
  832. package/src/connection_pool.ts +307 -0
  833. package/src/constants.ts +14 -0
  834. package/src/cpu.test.ts +239 -0
  835. package/src/cpu.ts +173 -0
  836. package/src/http_server.ts +18 -6
  837. package/src/index.ts +15 -13
  838. package/src/inference/api_protos.ts +85 -2
  839. package/src/inference/index.ts +32 -4
  840. package/src/inference/interruption/defaults.ts +51 -0
  841. package/src/inference/interruption/errors.ts +25 -0
  842. package/src/inference/interruption/http_transport.ts +207 -0
  843. package/src/inference/interruption/interruption_cache_entry.ts +50 -0
  844. package/src/inference/interruption/interruption_detector.ts +204 -0
  845. package/src/inference/interruption/interruption_stream.ts +467 -0
  846. package/src/inference/interruption/types.ts +84 -0
  847. package/src/inference/interruption/utils.test.ts +132 -0
  848. package/src/inference/interruption/utils.ts +137 -0
  849. package/src/inference/interruption/ws_transport.ts +416 -0
  850. package/src/inference/llm.ts +214 -163
  851. package/src/inference/stt.test.ts +253 -0
  852. package/src/inference/stt.ts +449 -208
  853. package/src/inference/tts.test.ts +354 -0
  854. package/src/inference/tts.ts +417 -115
  855. package/src/inference/utils.ts +30 -2
  856. package/src/ipc/inference_proc_executor.ts +11 -3
  857. package/src/ipc/inference_proc_lazy_main.ts +13 -1
  858. package/src/ipc/job_proc_executor.ts +11 -1
  859. package/src/ipc/job_proc_lazy_main.ts +86 -20
  860. package/src/ipc/supervised_proc.test.ts +153 -0
  861. package/src/ipc/supervised_proc.ts +39 -10
  862. package/src/job.ts +120 -1
  863. package/src/language.test.ts +62 -0
  864. package/src/language.ts +380 -0
  865. package/src/llm/__snapshots__/zod-utils.test.ts.snap +559 -0
  866. package/src/llm/chat_context.test.ts +787 -0
  867. package/src/llm/chat_context.ts +493 -2
  868. package/src/llm/fallback_adapter.test.ts +238 -0
  869. package/src/llm/fallback_adapter.ts +394 -0
  870. package/src/llm/index.ts +13 -0
  871. package/src/llm/llm.ts +77 -12
  872. package/src/llm/provider_format/google.test.ts +72 -1
  873. package/src/llm/provider_format/google.ts +10 -6
  874. package/src/llm/provider_format/index.ts +7 -2
  875. package/src/llm/provider_format/openai.test.ts +480 -2
  876. package/src/llm/provider_format/openai.ts +152 -21
  877. package/src/llm/provider_format/utils.ts +11 -5
  878. package/src/llm/realtime.ts +23 -2
  879. package/src/llm/remote_chat_context.ts +2 -2
  880. package/src/llm/tool_context.test.ts +210 -1
  881. package/src/llm/tool_context.ts +115 -17
  882. package/src/llm/utils.test.ts +103 -2
  883. package/src/llm/utils.ts +152 -16
  884. package/src/llm/zod-utils.test.ts +577 -0
  885. package/src/llm/zod-utils.ts +153 -0
  886. package/src/log.ts +71 -19
  887. package/src/metrics/base.ts +78 -19
  888. package/src/metrics/index.ts +12 -0
  889. package/src/metrics/model_usage.test.ts +545 -0
  890. package/src/metrics/model_usage.ts +262 -0
  891. package/src/metrics/usage_collector.ts +14 -3
  892. package/src/metrics/utils.ts +27 -7
  893. package/src/stream/deferred_stream.test.ts +3 -3
  894. package/src/stream/deferred_stream.ts +43 -11
  895. package/src/stream/index.ts +1 -0
  896. package/src/stream/multi_input_stream.test.ts +545 -0
  897. package/src/stream/multi_input_stream.ts +172 -0
  898. package/src/stream/stream_channel.test.ts +37 -0
  899. package/src/stream/stream_channel.ts +43 -3
  900. package/src/stt/stream_adapter.ts +30 -9
  901. package/src/stt/stt.ts +140 -23
  902. package/src/telemetry/index.ts +28 -0
  903. package/src/telemetry/logging.ts +55 -0
  904. package/src/telemetry/otel_http_exporter.ts +218 -0
  905. package/src/telemetry/pino_otel_transport.ts +265 -0
  906. package/src/telemetry/trace_types.ts +109 -0
  907. package/src/telemetry/traces.ts +673 -0
  908. package/src/telemetry/utils.ts +61 -0
  909. package/src/tokenize/basic/sentence.ts +3 -3
  910. package/src/tokenize/tokenizer.test.ts +4 -0
  911. package/src/transcription.ts +6 -0
  912. package/src/tts/fallback_adapter.ts +586 -0
  913. package/src/tts/index.ts +1 -0
  914. package/src/tts/stream_adapter.ts +38 -8
  915. package/src/tts/tts.ts +245 -62
  916. package/src/typed_promise.ts +67 -0
  917. package/src/types.ts +62 -33
  918. package/src/utils.test.ts +90 -10
  919. package/src/utils.ts +178 -33
  920. package/src/vad.ts +42 -18
  921. package/src/version.ts +1 -1
  922. package/src/voice/agent.test.ts +347 -2
  923. package/src/voice/agent.ts +346 -44
  924. package/src/voice/agent_activity.test.ts +194 -0
  925. package/src/voice/agent_activity.ts +1457 -388
  926. package/src/voice/agent_session.ts +817 -112
  927. package/src/voice/audio_recognition.ts +845 -70
  928. package/src/voice/audio_recognition_span.test.ts +341 -0
  929. package/src/voice/avatar/datastream_io.ts +9 -1
  930. package/src/voice/background_audio.ts +494 -0
  931. package/src/voice/events.ts +27 -7
  932. package/src/voice/generation.ts +310 -56
  933. package/src/voice/generation_tools.test.ts +268 -0
  934. package/src/voice/index.ts +17 -3
  935. package/src/voice/interruption_detection.test.ts +151 -0
  936. package/src/voice/io.ts +115 -12
  937. package/src/voice/recorder_io/index.ts +4 -0
  938. package/src/voice/recorder_io/recorder_io.ts +783 -0
  939. package/src/voice/remote_session.ts +1083 -0
  940. package/src/voice/report.test.ts +136 -0
  941. package/src/voice/report.ts +140 -0
  942. package/src/voice/room_io/_input.ts +45 -10
  943. package/src/voice/room_io/_output.ts +26 -14
  944. package/src/voice/room_io/room_io.ts +67 -22
  945. package/src/voice/speech_handle.ts +38 -6
  946. package/src/voice/testing/fake_llm.ts +138 -0
  947. package/src/voice/testing/index.ts +52 -0
  948. package/src/voice/testing/run_result.ts +995 -0
  949. package/src/voice/testing/types.ts +118 -0
  950. package/src/voice/transcription/synchronizer.test.ts +206 -0
  951. package/src/voice/transcription/synchronizer.ts +204 -19
  952. package/src/voice/turn_config/endpointing.ts +33 -0
  953. package/src/voice/turn_config/interruption.ts +56 -0
  954. package/src/voice/turn_config/turn_handling.ts +45 -0
  955. package/src/voice/turn_config/utils.test.ts +148 -0
  956. package/src/voice/turn_config/utils.ts +167 -0
  957. package/src/voice/utils.ts +29 -0
  958. package/src/worker.ts +92 -78
  959. package/src/llm/__snapshots__/utils.test.ts.snap +0 -65
@@ -0,0 +1,305 @@
1
+ "use strict";
2
+ var import_vitest = require("vitest");
3
+ var import_language = require("../language.cjs");
4
+ var import_log = require("../log.cjs");
5
+ var import_types = require("../types.cjs");
6
+ var import_tts = require("./tts.cjs");
7
+ (0, import_vitest.beforeAll)(() => {
8
+ (0, import_log.initializeLogger)({ level: "silent", pretty: false });
9
+ });
10
+ function makeTts(overrides = {}) {
11
+ const defaults = {
12
+ model: "cartesia/sonic",
13
+ apiKey: "test-key",
14
+ apiSecret: "test-secret",
15
+ baseURL: "https://example.livekit.cloud"
16
+ };
17
+ return new import_tts.TTS({ ...defaults, ...overrides });
18
+ }
19
+ (0, import_vitest.describe)("parseTTSModelString", () => {
20
+ (0, import_vitest.it)("simple model without voice", () => {
21
+ const [model, voice] = (0, import_tts.parseTTSModelString)("cartesia");
22
+ (0, import_vitest.expect)(model).toBe("cartesia");
23
+ (0, import_vitest.expect)(voice).toBeUndefined();
24
+ });
25
+ (0, import_vitest.it)("model with voice suffix", () => {
26
+ const [model, voice] = (0, import_tts.parseTTSModelString)("cartesia:my-voice-id");
27
+ (0, import_vitest.expect)(model).toBe("cartesia");
28
+ (0, import_vitest.expect)(voice).toBe("my-voice-id");
29
+ });
30
+ (0, import_vitest.it)("provider/model format without voice", () => {
31
+ const [model, voice] = (0, import_tts.parseTTSModelString)("cartesia/sonic");
32
+ (0, import_vitest.expect)(model).toBe("cartesia/sonic");
33
+ (0, import_vitest.expect)(voice).toBeUndefined();
34
+ });
35
+ (0, import_vitest.it)("provider/model format with voice", () => {
36
+ const [model, voice] = (0, import_tts.parseTTSModelString)("cartesia/sonic:my-voice-id");
37
+ (0, import_vitest.expect)(model).toBe("cartesia/sonic");
38
+ (0, import_vitest.expect)(voice).toBe("my-voice-id");
39
+ });
40
+ import_vitest.it.each([
41
+ ["elevenlabs/eleven_flash_v2:voice123", "elevenlabs/eleven_flash_v2", "voice123"],
42
+ ["rime:speaker-a", "rime", "speaker-a"],
43
+ ["rime/mist:narrator", "rime/mist", "narrator"],
44
+ ["inworld/inworld-tts-1:character", "inworld/inworld-tts-1", "character"],
45
+ ["cartesia/sonic-turbo:deep-voice", "cartesia/sonic-turbo", "deep-voice"]
46
+ ])("various providers and voices: %s", (modelStr, expectedModel, expectedVoice) => {
47
+ const [model, voice] = (0, import_tts.parseTTSModelString)(modelStr);
48
+ (0, import_vitest.expect)(model).toBe(expectedModel);
49
+ (0, import_vitest.expect)(voice).toBe(expectedVoice);
50
+ });
51
+ (0, import_vitest.it)("empty voice after colon", () => {
52
+ const [model, voice] = (0, import_tts.parseTTSModelString)("cartesia/sonic:");
53
+ (0, import_vitest.expect)(model).toBe("cartesia/sonic");
54
+ (0, import_vitest.expect)(voice).toBe("");
55
+ });
56
+ });
57
+ (0, import_vitest.describe)("normalizeTTSFallback", () => {
58
+ (0, import_vitest.it)("single string model", () => {
59
+ const result = (0, import_tts.normalizeTTSFallback)("cartesia/sonic");
60
+ (0, import_vitest.expect)(result).toEqual([{ model: "cartesia/sonic", voice: "" }]);
61
+ });
62
+ (0, import_vitest.it)("single string model with voice", () => {
63
+ const result = (0, import_tts.normalizeTTSFallback)("cartesia/sonic:my-voice");
64
+ (0, import_vitest.expect)(result).toEqual([{ model: "cartesia/sonic", voice: "my-voice" }]);
65
+ });
66
+ (0, import_vitest.it)("single FallbackModel dict", () => {
67
+ const fallback = { model: "cartesia/sonic", voice: "narrator" };
68
+ const result = (0, import_tts.normalizeTTSFallback)(fallback);
69
+ (0, import_vitest.expect)(result).toEqual([{ model: "cartesia/sonic", voice: "narrator" }]);
70
+ });
71
+ (0, import_vitest.it)("list of string models", () => {
72
+ const result = (0, import_tts.normalizeTTSFallback)(["cartesia/sonic", "elevenlabs/eleven_flash_v2"]);
73
+ (0, import_vitest.expect)(result).toEqual([
74
+ { model: "cartesia/sonic", voice: "" },
75
+ { model: "elevenlabs/eleven_flash_v2", voice: "" }
76
+ ]);
77
+ });
78
+ (0, import_vitest.it)("list of string models with voices", () => {
79
+ const result = (0, import_tts.normalizeTTSFallback)(["cartesia/sonic:voice1", "elevenlabs:voice2"]);
80
+ (0, import_vitest.expect)(result).toEqual([
81
+ { model: "cartesia/sonic", voice: "voice1" },
82
+ { model: "elevenlabs", voice: "voice2" }
83
+ ]);
84
+ });
85
+ (0, import_vitest.it)("list of FallbackModel dicts", () => {
86
+ const fallbacks = [
87
+ { model: "cartesia/sonic", voice: "narrator" },
88
+ { model: "elevenlabs", voice: "" }
89
+ ];
90
+ const result = (0, import_tts.normalizeTTSFallback)(fallbacks);
91
+ (0, import_vitest.expect)(result).toEqual([
92
+ { model: "cartesia/sonic", voice: "narrator" },
93
+ { model: "elevenlabs", voice: "" }
94
+ ]);
95
+ });
96
+ (0, import_vitest.it)("mixed list of strings and dicts", () => {
97
+ const result = (0, import_tts.normalizeTTSFallback)([
98
+ "cartesia/sonic:voice1",
99
+ { model: "elevenlabs/eleven_flash_v2", voice: "custom" },
100
+ "rime/mist"
101
+ ]);
102
+ (0, import_vitest.expect)(result).toEqual([
103
+ { model: "cartesia/sonic", voice: "voice1" },
104
+ { model: "elevenlabs/eleven_flash_v2", voice: "custom" },
105
+ { model: "rime/mist", voice: "" }
106
+ ]);
107
+ });
108
+ (0, import_vitest.it)("FallbackModel with extraKwargs is preserved", () => {
109
+ const fallback = {
110
+ model: "cartesia/sonic",
111
+ voice: "narrator",
112
+ extraKwargs: { duration: 30, speed: "fast" }
113
+ };
114
+ const result = (0, import_tts.normalizeTTSFallback)(fallback);
115
+ (0, import_vitest.expect)(result).toEqual([
116
+ {
117
+ model: "cartesia/sonic",
118
+ voice: "narrator",
119
+ extraKwargs: { duration: 30, speed: "fast" }
120
+ }
121
+ ]);
122
+ });
123
+ (0, import_vitest.it)("list with extraKwargs preserved", () => {
124
+ const result = (0, import_tts.normalizeTTSFallback)([
125
+ { model: "cartesia/sonic", voice: "v1", extraKwargs: { speed: "slow" } },
126
+ "elevenlabs:voice2",
127
+ { model: "rime/mist", voice: "", extraKwargs: { custom: true } }
128
+ ]);
129
+ (0, import_vitest.expect)(result).toEqual([
130
+ { model: "cartesia/sonic", voice: "v1", extraKwargs: { speed: "slow" } },
131
+ { model: "elevenlabs", voice: "voice2" },
132
+ { model: "rime/mist", voice: "", extraKwargs: { custom: true } }
133
+ ]);
134
+ });
135
+ (0, import_vitest.it)("empty list returns empty list", () => {
136
+ const result = (0, import_tts.normalizeTTSFallback)([]);
137
+ (0, import_vitest.expect)(result).toEqual([]);
138
+ });
139
+ (0, import_vitest.it)("FallbackModel with empty voice", () => {
140
+ const fallback = { model: "cartesia/sonic", voice: "" };
141
+ const result = (0, import_tts.normalizeTTSFallback)(fallback);
142
+ (0, import_vitest.expect)(result).toEqual([{ model: "cartesia/sonic", voice: "" }]);
143
+ });
144
+ });
145
+ (0, import_vitest.describe)("TTS constructor fallback and connOptions", () => {
146
+ (0, import_vitest.it)("normalizes language in constructor", () => {
147
+ const tts = makeTts({ language: "english" });
148
+ (0, import_vitest.expect)(tts["opts"].language).toBe("en");
149
+ });
150
+ (0, import_vitest.it)("normalizes updated language values", () => {
151
+ const tts = makeTts();
152
+ tts.updateOptions({ language: "en_US" });
153
+ (0, import_vitest.expect)(tts["opts"].language).toBe((0, import_language.normalizeLanguage)("en_US"));
154
+ });
155
+ (0, import_vitest.it)("fallback not given defaults to undefined", () => {
156
+ const tts = makeTts();
157
+ (0, import_vitest.expect)(tts["opts"].fallback).toBeUndefined();
158
+ });
159
+ (0, import_vitest.it)("fallback single string is normalized", () => {
160
+ const tts = makeTts({ fallback: "elevenlabs/eleven_flash_v2" });
161
+ (0, import_vitest.expect)(tts["opts"].fallback).toEqual([{ model: "elevenlabs/eleven_flash_v2", voice: "" }]);
162
+ });
163
+ (0, import_vitest.it)("fallback single string with voice is normalized", () => {
164
+ const tts = makeTts({ fallback: "cartesia/sonic:my-voice" });
165
+ (0, import_vitest.expect)(tts["opts"].fallback).toEqual([{ model: "cartesia/sonic", voice: "my-voice" }]);
166
+ });
167
+ (0, import_vitest.it)("fallback list of strings is normalized", () => {
168
+ const tts = makeTts({ fallback: ["cartesia/sonic", "elevenlabs"] });
169
+ (0, import_vitest.expect)(tts["opts"].fallback).toEqual([
170
+ { model: "cartesia/sonic", voice: "" },
171
+ { model: "elevenlabs", voice: "" }
172
+ ]);
173
+ });
174
+ (0, import_vitest.it)("fallback single FallbackModel is normalized to list", () => {
175
+ const tts = makeTts({ fallback: { model: "cartesia/sonic", voice: "narrator" } });
176
+ (0, import_vitest.expect)(tts["opts"].fallback).toEqual([{ model: "cartesia/sonic", voice: "narrator" }]);
177
+ });
178
+ (0, import_vitest.it)("fallback with extraKwargs is preserved", () => {
179
+ const tts = makeTts({
180
+ fallback: {
181
+ model: "cartesia/sonic",
182
+ voice: "narrator",
183
+ extraKwargs: { duration: 30, speed: "fast" }
184
+ }
185
+ });
186
+ (0, import_vitest.expect)(tts["opts"].fallback).toEqual([
187
+ {
188
+ model: "cartesia/sonic",
189
+ voice: "narrator",
190
+ extraKwargs: { duration: 30, speed: "fast" }
191
+ }
192
+ ]);
193
+ });
194
+ (0, import_vitest.it)("fallback mixed list is normalized", () => {
195
+ const tts = makeTts({
196
+ fallback: [
197
+ "cartesia/sonic:voice1",
198
+ { model: "elevenlabs", voice: "custom", extraKwargs: { speed: "slow" } },
199
+ "rime/mist"
200
+ ]
201
+ });
202
+ (0, import_vitest.expect)(tts["opts"].fallback).toEqual([
203
+ { model: "cartesia/sonic", voice: "voice1" },
204
+ { model: "elevenlabs", voice: "custom", extraKwargs: { speed: "slow" } },
205
+ { model: "rime/mist", voice: "" }
206
+ ]);
207
+ });
208
+ (0, import_vitest.it)("connOptions not given uses default", () => {
209
+ const tts = makeTts();
210
+ (0, import_vitest.expect)(tts["opts"].connOptions).toEqual(import_types.DEFAULT_API_CONNECT_OPTIONS);
211
+ });
212
+ (0, import_vitest.it)("connOptions custom timeout", () => {
213
+ const custom = { timeoutMs: 3e4, maxRetry: 3, retryIntervalMs: 2e3 };
214
+ const tts = makeTts({ connOptions: custom });
215
+ (0, import_vitest.expect)(tts["opts"].connOptions).toEqual(custom);
216
+ (0, import_vitest.expect)(tts["opts"].connOptions.timeoutMs).toBe(3e4);
217
+ });
218
+ (0, import_vitest.it)("connOptions custom maxRetry", () => {
219
+ const custom = { timeoutMs: 1e4, maxRetry: 5, retryIntervalMs: 2e3 };
220
+ const tts = makeTts({ connOptions: custom });
221
+ (0, import_vitest.expect)(tts["opts"].connOptions).toEqual(custom);
222
+ (0, import_vitest.expect)(tts["opts"].connOptions.maxRetry).toBe(5);
223
+ });
224
+ (0, import_vitest.it)("connOptions full custom", () => {
225
+ const custom = { timeoutMs: 6e4, maxRetry: 10, retryIntervalMs: 2e3 };
226
+ const tts = makeTts({ connOptions: custom });
227
+ (0, import_vitest.expect)(tts["opts"].connOptions).toEqual(custom);
228
+ (0, import_vitest.expect)(tts["opts"].connOptions.timeoutMs).toBe(6e4);
229
+ (0, import_vitest.expect)(tts["opts"].connOptions.maxRetry).toBe(10);
230
+ (0, import_vitest.expect)(tts["opts"].connOptions.retryIntervalMs).toBe(2e3);
231
+ });
232
+ });
233
+ (0, import_vitest.describe)("TTS provider modelOptions parity", () => {
234
+ (0, import_vitest.it)("preserves ElevenLabs inference model options", () => {
235
+ const modelOptions = {
236
+ speed: 1.2,
237
+ stability: 0.5,
238
+ similarity_boost: 0.8,
239
+ enable_logging: false
240
+ };
241
+ const tts = new import_tts.TTS({
242
+ model: "elevenlabs/eleven_flash_v2_5",
243
+ apiKey: "test-key",
244
+ apiSecret: "test-secret",
245
+ baseURL: "https://example.livekit.cloud",
246
+ modelOptions
247
+ });
248
+ (0, import_vitest.expect)(tts["opts"].modelOptions).toEqual(modelOptions);
249
+ });
250
+ (0, import_vitest.it)("accepts expanded Cartesia inference model options", () => {
251
+ const modelOptions = {
252
+ speed: 1.15,
253
+ emotion: "curious",
254
+ add_timestamps: true
255
+ };
256
+ const tts = new import_tts.TTS({
257
+ model: "cartesia/sonic",
258
+ apiKey: "test-key",
259
+ apiSecret: "test-secret",
260
+ baseURL: "https://example.livekit.cloud",
261
+ modelOptions
262
+ });
263
+ (0, import_vitest.expect)(tts["opts"].modelOptions).toEqual(modelOptions);
264
+ });
265
+ (0, import_vitest.it)("accepts Deepgram inference model options", () => {
266
+ const modelOptions = { mip_opt_out: true };
267
+ const tts = new import_tts.TTS({
268
+ model: "deepgram/aura-2",
269
+ apiKey: "test-key",
270
+ apiSecret: "test-secret",
271
+ baseURL: "https://example.livekit.cloud",
272
+ modelOptions
273
+ });
274
+ (0, import_vitest.expect)(tts["opts"].modelOptions).toEqual(modelOptions);
275
+ });
276
+ (0, import_vitest.it)("accepts Rime inference model options", () => {
277
+ const modelOptions = {
278
+ speed_alpha: 0.9,
279
+ pause_between_brackets: true
280
+ };
281
+ const tts = new import_tts.TTS({
282
+ model: "rime/mistv2",
283
+ apiKey: "test-key",
284
+ apiSecret: "test-secret",
285
+ baseURL: "https://example.livekit.cloud",
286
+ modelOptions
287
+ });
288
+ (0, import_vitest.expect)(tts["opts"].modelOptions).toEqual(modelOptions);
289
+ });
290
+ (0, import_vitest.it)("accepts Inworld inference model options", () => {
291
+ const modelOptions = {
292
+ timestamp_type: "WORD",
293
+ apply_text_normalization: "ON"
294
+ };
295
+ const tts = new import_tts.TTS({
296
+ model: "inworld/inworld-tts-1",
297
+ apiKey: "test-key",
298
+ apiSecret: "test-secret",
299
+ baseURL: "https://example.livekit.cloud",
300
+ modelOptions
301
+ });
302
+ (0, import_vitest.expect)(tts["opts"].modelOptions).toEqual(modelOptions);
303
+ });
304
+ });
305
+ //# sourceMappingURL=tts.test.cjs.map
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../../src/inference/tts.test.ts"],"sourcesContent":["// SPDX-FileCopyrightText: 2025 LiveKit, Inc.\n//\n// SPDX-License-Identifier: Apache-2.0\nimport { beforeAll, describe, expect, it } from 'vitest';\nimport { normalizeLanguage } from '../language.js';\nimport { initializeLogger } from '../log.js';\nimport { type APIConnectOptions, DEFAULT_API_CONNECT_OPTIONS } from '../types.js';\nimport { TTS, type TTSFallbackModel, normalizeTTSFallback, parseTTSModelString } from './tts.js';\n\nbeforeAll(() => {\n initializeLogger({ level: 'silent', pretty: false });\n});\n\n/** Helper to create TTS with required credentials. */\nfunction makeTts(overrides: Record<string, unknown> = {}) {\n const defaults = {\n model: 'cartesia/sonic' as const,\n apiKey: 'test-key',\n apiSecret: 'test-secret',\n baseURL: 'https://example.livekit.cloud',\n };\n return new TTS({ ...defaults, ...overrides });\n}\n\ndescribe('parseTTSModelString', () => {\n it('simple model without voice', () => {\n const [model, voice] = parseTTSModelString('cartesia');\n expect(model).toBe('cartesia');\n expect(voice).toBeUndefined();\n });\n\n it('model with voice suffix', () => {\n const [model, voice] = parseTTSModelString('cartesia:my-voice-id');\n expect(model).toBe('cartesia');\n expect(voice).toBe('my-voice-id');\n });\n\n it('provider/model format without voice', () => {\n const [model, voice] = parseTTSModelString('cartesia/sonic');\n expect(model).toBe('cartesia/sonic');\n expect(voice).toBeUndefined();\n });\n\n it('provider/model format with voice', () => {\n const [model, voice] = parseTTSModelString('cartesia/sonic:my-voice-id');\n expect(model).toBe('cartesia/sonic');\n expect(voice).toBe('my-voice-id');\n });\n\n it.each([\n ['elevenlabs/eleven_flash_v2:voice123', 'elevenlabs/eleven_flash_v2', 'voice123'],\n ['rime:speaker-a', 'rime', 'speaker-a'],\n ['rime/mist:narrator', 'rime/mist', 'narrator'],\n ['inworld/inworld-tts-1:character', 'inworld/inworld-tts-1', 
'character'],\n ['cartesia/sonic-turbo:deep-voice', 'cartesia/sonic-turbo', 'deep-voice'],\n ])('various providers and voices: %s', (modelStr, expectedModel, expectedVoice) => {\n const [model, voice] = parseTTSModelString(modelStr);\n expect(model).toBe(expectedModel);\n expect(voice).toBe(expectedVoice);\n });\n\n it('empty voice after colon', () => {\n const [model, voice] = parseTTSModelString('cartesia/sonic:');\n expect(model).toBe('cartesia/sonic');\n expect(voice).toBe('');\n });\n});\n\ndescribe('normalizeTTSFallback', () => {\n it('single string model', () => {\n const result = normalizeTTSFallback('cartesia/sonic');\n expect(result).toEqual([{ model: 'cartesia/sonic', voice: '' }]);\n });\n\n it('single string model with voice', () => {\n const result = normalizeTTSFallback('cartesia/sonic:my-voice');\n expect(result).toEqual([{ model: 'cartesia/sonic', voice: 'my-voice' }]);\n });\n\n it('single FallbackModel dict', () => {\n const fallback: TTSFallbackModel = { model: 'cartesia/sonic', voice: 'narrator' };\n const result = normalizeTTSFallback(fallback);\n expect(result).toEqual([{ model: 'cartesia/sonic', voice: 'narrator' }]);\n });\n\n it('list of string models', () => {\n const result = normalizeTTSFallback(['cartesia/sonic', 'elevenlabs/eleven_flash_v2']);\n expect(result).toEqual([\n { model: 'cartesia/sonic', voice: '' },\n { model: 'elevenlabs/eleven_flash_v2', voice: '' },\n ]);\n });\n\n it('list of string models with voices', () => {\n const result = normalizeTTSFallback(['cartesia/sonic:voice1', 'elevenlabs:voice2']);\n expect(result).toEqual([\n { model: 'cartesia/sonic', voice: 'voice1' },\n { model: 'elevenlabs', voice: 'voice2' },\n ]);\n });\n\n it('list of FallbackModel dicts', () => {\n const fallbacks: TTSFallbackModel[] = [\n { model: 'cartesia/sonic', voice: 'narrator' },\n { model: 'elevenlabs', voice: '' },\n ];\n const result = normalizeTTSFallback(fallbacks);\n expect(result).toEqual([\n { model: 'cartesia/sonic', voice: 
'narrator' },\n { model: 'elevenlabs', voice: '' },\n ]);\n });\n\n it('mixed list of strings and dicts', () => {\n const result = normalizeTTSFallback([\n 'cartesia/sonic:voice1',\n { model: 'elevenlabs/eleven_flash_v2', voice: 'custom' } as TTSFallbackModel,\n 'rime/mist',\n ]);\n expect(result).toEqual([\n { model: 'cartesia/sonic', voice: 'voice1' },\n { model: 'elevenlabs/eleven_flash_v2', voice: 'custom' },\n { model: 'rime/mist', voice: '' },\n ]);\n });\n\n it('FallbackModel with extraKwargs is preserved', () => {\n const fallback: TTSFallbackModel = {\n model: 'cartesia/sonic',\n voice: 'narrator',\n extraKwargs: { duration: 30.0, speed: 'fast' },\n };\n const result = normalizeTTSFallback(fallback);\n expect(result).toEqual([\n {\n model: 'cartesia/sonic',\n voice: 'narrator',\n extraKwargs: { duration: 30.0, speed: 'fast' },\n },\n ]);\n });\n\n it('list with extraKwargs preserved', () => {\n const result = normalizeTTSFallback([\n { model: 'cartesia/sonic', voice: 'v1', extraKwargs: { speed: 'slow' } } as TTSFallbackModel,\n 'elevenlabs:voice2',\n { model: 'rime/mist', voice: '', extraKwargs: { custom: true } } as TTSFallbackModel,\n ]);\n expect(result).toEqual([\n { model: 'cartesia/sonic', voice: 'v1', extraKwargs: { speed: 'slow' } },\n { model: 'elevenlabs', voice: 'voice2' },\n { model: 'rime/mist', voice: '', extraKwargs: { custom: true } },\n ]);\n });\n\n it('empty list returns empty list', () => {\n const result = normalizeTTSFallback([]);\n expect(result).toEqual([]);\n });\n\n it('FallbackModel with empty voice', () => {\n const fallback: TTSFallbackModel = { model: 'cartesia/sonic', voice: '' };\n const result = normalizeTTSFallback(fallback);\n expect(result).toEqual([{ model: 'cartesia/sonic', voice: '' }]);\n });\n});\n\ndescribe('TTS constructor fallback and connOptions', () => {\n it('normalizes language in constructor', () => {\n const tts = makeTts({ language: 'english' });\n expect(tts['opts'].language).toBe('en');\n });\n\n 
it('normalizes updated language values', () => {\n const tts = makeTts();\n tts.updateOptions({ language: 'en_US' });\n expect(tts['opts'].language).toBe(normalizeLanguage('en_US'));\n });\n\n it('fallback not given defaults to undefined', () => {\n const tts = makeTts();\n expect(tts['opts'].fallback).toBeUndefined();\n });\n\n it('fallback single string is normalized', () => {\n const tts = makeTts({ fallback: 'elevenlabs/eleven_flash_v2' });\n expect(tts['opts'].fallback).toEqual([{ model: 'elevenlabs/eleven_flash_v2', voice: '' }]);\n });\n\n it('fallback single string with voice is normalized', () => {\n const tts = makeTts({ fallback: 'cartesia/sonic:my-voice' });\n expect(tts['opts'].fallback).toEqual([{ model: 'cartesia/sonic', voice: 'my-voice' }]);\n });\n\n it('fallback list of strings is normalized', () => {\n const tts = makeTts({ fallback: ['cartesia/sonic', 'elevenlabs'] });\n expect(tts['opts'].fallback).toEqual([\n { model: 'cartesia/sonic', voice: '' },\n { model: 'elevenlabs', voice: '' },\n ]);\n });\n\n it('fallback single FallbackModel is normalized to list', () => {\n const tts = makeTts({ fallback: { model: 'cartesia/sonic', voice: 'narrator' } });\n expect(tts['opts'].fallback).toEqual([{ model: 'cartesia/sonic', voice: 'narrator' }]);\n });\n\n it('fallback with extraKwargs is preserved', () => {\n const tts = makeTts({\n fallback: {\n model: 'cartesia/sonic',\n voice: 'narrator',\n extraKwargs: { duration: 30.0, speed: 'fast' },\n },\n });\n expect(tts['opts'].fallback).toEqual([\n {\n model: 'cartesia/sonic',\n voice: 'narrator',\n extraKwargs: { duration: 30.0, speed: 'fast' },\n },\n ]);\n });\n\n it('fallback mixed list is normalized', () => {\n const tts = makeTts({\n fallback: [\n 'cartesia/sonic:voice1',\n { model: 'elevenlabs', voice: 'custom', extraKwargs: { speed: 'slow' } },\n 'rime/mist',\n ],\n });\n expect(tts['opts'].fallback).toEqual([\n { model: 'cartesia/sonic', voice: 'voice1' },\n { model: 'elevenlabs', voice: 
'custom', extraKwargs: { speed: 'slow' } },\n { model: 'rime/mist', voice: '' },\n ]);\n });\n\n it('connOptions not given uses default', () => {\n const tts = makeTts();\n expect(tts['opts'].connOptions).toEqual(DEFAULT_API_CONNECT_OPTIONS);\n });\n\n it('connOptions custom timeout', () => {\n const custom: APIConnectOptions = { timeoutMs: 30000, maxRetry: 3, retryIntervalMs: 2000 };\n const tts = makeTts({ connOptions: custom });\n expect(tts['opts'].connOptions).toEqual(custom);\n expect(tts['opts'].connOptions!.timeoutMs).toBe(30000);\n });\n\n it('connOptions custom maxRetry', () => {\n const custom: APIConnectOptions = { timeoutMs: 10000, maxRetry: 5, retryIntervalMs: 2000 };\n const tts = makeTts({ connOptions: custom });\n expect(tts['opts'].connOptions).toEqual(custom);\n expect(tts['opts'].connOptions!.maxRetry).toBe(5);\n });\n\n it('connOptions full custom', () => {\n const custom: APIConnectOptions = { timeoutMs: 60000, maxRetry: 10, retryIntervalMs: 2000 };\n const tts = makeTts({ connOptions: custom });\n expect(tts['opts'].connOptions).toEqual(custom);\n expect(tts['opts'].connOptions!.timeoutMs).toBe(60000);\n expect(tts['opts'].connOptions!.maxRetry).toBe(10);\n expect(tts['opts'].connOptions!.retryIntervalMs).toBe(2000);\n });\n});\n\ndescribe('TTS provider modelOptions parity', () => {\n it('preserves ElevenLabs inference model options', () => {\n const modelOptions = {\n speed: 1.2,\n stability: 0.5,\n similarity_boost: 0.8,\n enable_logging: false,\n };\n\n const tts = new TTS({\n model: 'elevenlabs/eleven_flash_v2_5' as const,\n apiKey: 'test-key',\n apiSecret: 'test-secret',\n baseURL: 'https://example.livekit.cloud',\n modelOptions,\n });\n\n expect(tts['opts'].modelOptions).toEqual(modelOptions);\n });\n\n it('accepts expanded Cartesia inference model options', () => {\n const modelOptions = {\n speed: 1.15,\n emotion: 'curious',\n add_timestamps: true,\n };\n\n const tts = new TTS({\n model: 'cartesia/sonic' as const,\n apiKey: 
'test-key',\n apiSecret: 'test-secret',\n baseURL: 'https://example.livekit.cloud',\n modelOptions,\n });\n\n expect(tts['opts'].modelOptions).toEqual(modelOptions);\n });\n\n it('accepts Deepgram inference model options', () => {\n const modelOptions = { mip_opt_out: true };\n\n const tts = new TTS({\n model: 'deepgram/aura-2' as const,\n apiKey: 'test-key',\n apiSecret: 'test-secret',\n baseURL: 'https://example.livekit.cloud',\n modelOptions,\n });\n\n expect(tts['opts'].modelOptions).toEqual(modelOptions);\n });\n\n it('accepts Rime inference model options', () => {\n const modelOptions = {\n speed_alpha: 0.9,\n pause_between_brackets: true,\n };\n\n const tts = new TTS({\n model: 'rime/mistv2' as const,\n apiKey: 'test-key',\n apiSecret: 'test-secret',\n baseURL: 'https://example.livekit.cloud',\n modelOptions,\n });\n\n expect(tts['opts'].modelOptions).toEqual(modelOptions);\n });\n\n it('accepts Inworld inference model options', () => {\n const modelOptions = {\n timestamp_type: 'WORD' as const,\n apply_text_normalization: 'ON' as const,\n };\n\n const tts = new TTS({\n model: 'inworld/inworld-tts-1' as const,\n apiKey: 'test-key',\n apiSecret: 'test-secret',\n baseURL: 'https://example.livekit.cloud',\n modelOptions,\n });\n\n expect(tts['opts'].modelOptions).toEqual(modelOptions);\n 
});\n});\n"],"mappings":";AAGA,oBAAgD;AAChD,sBAAkC;AAClC,iBAAiC;AACjC,mBAAoE;AACpE,iBAAsF;AAAA,IAEtF,yBAAU,MAAM;AACd,mCAAiB,EAAE,OAAO,UAAU,QAAQ,MAAM,CAAC;AACrD,CAAC;AAGD,SAAS,QAAQ,YAAqC,CAAC,GAAG;AACxD,QAAM,WAAW;AAAA,IACf,OAAO;AAAA,IACP,QAAQ;AAAA,IACR,WAAW;AAAA,IACX,SAAS;AAAA,EACX;AACA,SAAO,IAAI,eAAI,EAAE,GAAG,UAAU,GAAG,UAAU,CAAC;AAC9C;AAAA,IAEA,wBAAS,uBAAuB,MAAM;AACpC,wBAAG,8BAA8B,MAAM;AACrC,UAAM,CAAC,OAAO,KAAK,QAAI,gCAAoB,UAAU;AACrD,8BAAO,KAAK,EAAE,KAAK,UAAU;AAC7B,8BAAO,KAAK,EAAE,cAAc;AAAA,EAC9B,CAAC;AAED,wBAAG,2BAA2B,MAAM;AAClC,UAAM,CAAC,OAAO,KAAK,QAAI,gCAAoB,sBAAsB;AACjE,8BAAO,KAAK,EAAE,KAAK,UAAU;AAC7B,8BAAO,KAAK,EAAE,KAAK,aAAa;AAAA,EAClC,CAAC;AAED,wBAAG,uCAAuC,MAAM;AAC9C,UAAM,CAAC,OAAO,KAAK,QAAI,gCAAoB,gBAAgB;AAC3D,8BAAO,KAAK,EAAE,KAAK,gBAAgB;AACnC,8BAAO,KAAK,EAAE,cAAc;AAAA,EAC9B,CAAC;AAED,wBAAG,oCAAoC,MAAM;AAC3C,UAAM,CAAC,OAAO,KAAK,QAAI,gCAAoB,4BAA4B;AACvE,8BAAO,KAAK,EAAE,KAAK,gBAAgB;AACnC,8BAAO,KAAK,EAAE,KAAK,aAAa;AAAA,EAClC,CAAC;AAED,mBAAG,KAAK;AAAA,IACN,CAAC,uCAAuC,8BAA8B,UAAU;AAAA,IAChF,CAAC,kBAAkB,QAAQ,WAAW;AAAA,IACtC,CAAC,sBAAsB,aAAa,UAAU;AAAA,IAC9C,CAAC,mCAAmC,yBAAyB,WAAW;AAAA,IACxE,CAAC,mCAAmC,wBAAwB,YAAY;AAAA,EAC1E,CAAC,EAAE,oCAAoC,CAAC,UAAU,eAAe,kBAAkB;AACjF,UAAM,CAAC,OAAO,KAAK,QAAI,gCAAoB,QAAQ;AACnD,8BAAO,KAAK,EAAE,KAAK,aAAa;AAChC,8BAAO,KAAK,EAAE,KAAK,aAAa;AAAA,EAClC,CAAC;AAED,wBAAG,2BAA2B,MAAM;AAClC,UAAM,CAAC,OAAO,KAAK,QAAI,gCAAoB,iBAAiB;AAC5D,8BAAO,KAAK,EAAE,KAAK,gBAAgB;AACnC,8BAAO,KAAK,EAAE,KAAK,EAAE;AAAA,EACvB,CAAC;AACH,CAAC;AAAA,IAED,wBAAS,wBAAwB,MAAM;AACrC,wBAAG,uBAAuB,MAAM;AAC9B,UAAM,aAAS,iCAAqB,gBAAgB;AACpD,8BAAO,MAAM,EAAE,QAAQ,CAAC,EAAE,OAAO,kBAAkB,OAAO,GAAG,CAAC,CAAC;AAAA,EACjE,CAAC;AAED,wBAAG,kCAAkC,MAAM;AACzC,UAAM,aAAS,iCAAqB,yBAAyB;AAC7D,8BAAO,MAAM,EAAE,QAAQ,CAAC,EAAE,OAAO,kBAAkB,OAAO,WAAW,CAAC,CAAC;AAAA,EACzE,CAAC;AAED,wBAAG,6BAA6B,MAAM;AACpC,UAAM,WAA6B,EAAE,OAAO,kBAAkB,OAAO,WAAW;AAChF,UAAM,aAAS,iCAAqB,QAAQ;AAC5C,8BAAO,MAAM,EAAE,QAAQ,CAAC,EAAE,OAAO,kBAAkB,OAAO,WAAW,CAAC,CAAC;AAAA,EACzE,CAAC;AAED,wBAAG,yBAAyB,MAAM;AAChC,UAAM,aAAS,iCAAqB
,CAAC,kBAAkB,4BAA4B,CAAC;AACpF,8BAAO,MAAM,EAAE,QAAQ;AAAA,MACrB,EAAE,OAAO,kBAAkB,OAAO,GAAG;AAAA,MACrC,EAAE,OAAO,8BAA8B,OAAO,GAAG;AAAA,IACnD,CAAC;AAAA,EACH,CAAC;AAED,wBAAG,qCAAqC,MAAM;AAC5C,UAAM,aAAS,iCAAqB,CAAC,yBAAyB,mBAAmB,CAAC;AAClF,8BAAO,MAAM,EAAE,QAAQ;AAAA,MACrB,EAAE,OAAO,kBAAkB,OAAO,SAAS;AAAA,MAC3C,EAAE,OAAO,cAAc,OAAO,SAAS;AAAA,IACzC,CAAC;AAAA,EACH,CAAC;AAED,wBAAG,+BAA+B,MAAM;AACtC,UAAM,YAAgC;AAAA,MACpC,EAAE,OAAO,kBAAkB,OAAO,WAAW;AAAA,MAC7C,EAAE,OAAO,cAAc,OAAO,GAAG;AAAA,IACnC;AACA,UAAM,aAAS,iCAAqB,SAAS;AAC7C,8BAAO,MAAM,EAAE,QAAQ;AAAA,MACrB,EAAE,OAAO,kBAAkB,OAAO,WAAW;AAAA,MAC7C,EAAE,OAAO,cAAc,OAAO,GAAG;AAAA,IACnC,CAAC;AAAA,EACH,CAAC;AAED,wBAAG,mCAAmC,MAAM;AAC1C,UAAM,aAAS,iCAAqB;AAAA,MAClC;AAAA,MACA,EAAE,OAAO,8BAA8B,OAAO,SAAS;AAAA,MACvD;AAAA,IACF,CAAC;AACD,8BAAO,MAAM,EAAE,QAAQ;AAAA,MACrB,EAAE,OAAO,kBAAkB,OAAO,SAAS;AAAA,MAC3C,EAAE,OAAO,8BAA8B,OAAO,SAAS;AAAA,MACvD,EAAE,OAAO,aAAa,OAAO,GAAG;AAAA,IAClC,CAAC;AAAA,EACH,CAAC;AAED,wBAAG,+CAA+C,MAAM;AACtD,UAAM,WAA6B;AAAA,MACjC,OAAO;AAAA,MACP,OAAO;AAAA,MACP,aAAa,EAAE,UAAU,IAAM,OAAO,OAAO;AAAA,IAC/C;AACA,UAAM,aAAS,iCAAqB,QAAQ;AAC5C,8BAAO,MAAM,EAAE,QAAQ;AAAA,MACrB;AAAA,QACE,OAAO;AAAA,QACP,OAAO;AAAA,QACP,aAAa,EAAE,UAAU,IAAM,OAAO,OAAO;AAAA,MAC/C;AAAA,IACF,CAAC;AAAA,EACH,CAAC;AAED,wBAAG,mCAAmC,MAAM;AAC1C,UAAM,aAAS,iCAAqB;AAAA,MAClC,EAAE,OAAO,kBAAkB,OAAO,MAAM,aAAa,EAAE,OAAO,OAAO,EAAE;AAAA,MACvE;AAAA,MACA,EAAE,OAAO,aAAa,OAAO,IAAI,aAAa,EAAE,QAAQ,KAAK,EAAE;AAAA,IACjE,CAAC;AACD,8BAAO,MAAM,EAAE,QAAQ;AAAA,MACrB,EAAE,OAAO,kBAAkB,OAAO,MAAM,aAAa,EAAE,OAAO,OAAO,EAAE;AAAA,MACvE,EAAE,OAAO,cAAc,OAAO,SAAS;AAAA,MACvC,EAAE,OAAO,aAAa,OAAO,IAAI,aAAa,EAAE,QAAQ,KAAK,EAAE;AAAA,IACjE,CAAC;AAAA,EACH,CAAC;AAED,wBAAG,iCAAiC,MAAM;AACxC,UAAM,aAAS,iCAAqB,CAAC,CAAC;AACtC,8BAAO,MAAM,EAAE,QAAQ,CAAC,CAAC;AAAA,EAC3B,CAAC;AAED,wBAAG,kCAAkC,MAAM;AACzC,UAAM,WAA6B,EAAE,OAAO,kBAAkB,OAAO,GAAG;AACxE,UAAM,aAAS,iCAAqB,QAAQ;AAC5C,8BAAO,MAAM,EAAE,QAAQ,CAAC,EAAE,OAAO,kBAAkB,OAAO,GAAG,CAAC,CAAC;AAAA,EACjE,CAAC;AACH,CAAC;AAAA,IAED,wBAAS,4CAA4C,MAAM;AACzD,wBAAG,sCAAsC,MAAM;AAC7
C,UAAM,MAAM,QAAQ,EAAE,UAAU,UAAU,CAAC;AAC3C,8BAAO,IAAI,MAAM,EAAE,QAAQ,EAAE,KAAK,IAAI;AAAA,EACxC,CAAC;AAED,wBAAG,sCAAsC,MAAM;AAC7C,UAAM,MAAM,QAAQ;AACpB,QAAI,cAAc,EAAE,UAAU,QAAQ,CAAC;AACvC,8BAAO,IAAI,MAAM,EAAE,QAAQ,EAAE,SAAK,mCAAkB,OAAO,CAAC;AAAA,EAC9D,CAAC;AAED,wBAAG,4CAA4C,MAAM;AACnD,UAAM,MAAM,QAAQ;AACpB,8BAAO,IAAI,MAAM,EAAE,QAAQ,EAAE,cAAc;AAAA,EAC7C,CAAC;AAED,wBAAG,wCAAwC,MAAM;AAC/C,UAAM,MAAM,QAAQ,EAAE,UAAU,6BAA6B,CAAC;AAC9D,8BAAO,IAAI,MAAM,EAAE,QAAQ,EAAE,QAAQ,CAAC,EAAE,OAAO,8BAA8B,OAAO,GAAG,CAAC,CAAC;AAAA,EAC3F,CAAC;AAED,wBAAG,mDAAmD,MAAM;AAC1D,UAAM,MAAM,QAAQ,EAAE,UAAU,0BAA0B,CAAC;AAC3D,8BAAO,IAAI,MAAM,EAAE,QAAQ,EAAE,QAAQ,CAAC,EAAE,OAAO,kBAAkB,OAAO,WAAW,CAAC,CAAC;AAAA,EACvF,CAAC;AAED,wBAAG,0CAA0C,MAAM;AACjD,UAAM,MAAM,QAAQ,EAAE,UAAU,CAAC,kBAAkB,YAAY,EAAE,CAAC;AAClE,8BAAO,IAAI,MAAM,EAAE,QAAQ,EAAE,QAAQ;AAAA,MACnC,EAAE,OAAO,kBAAkB,OAAO,GAAG;AAAA,MACrC,EAAE,OAAO,cAAc,OAAO,GAAG;AAAA,IACnC,CAAC;AAAA,EACH,CAAC;AAED,wBAAG,uDAAuD,MAAM;AAC9D,UAAM,MAAM,QAAQ,EAAE,UAAU,EAAE,OAAO,kBAAkB,OAAO,WAAW,EAAE,CAAC;AAChF,8BAAO,IAAI,MAAM,EAAE,QAAQ,EAAE,QAAQ,CAAC,EAAE,OAAO,kBAAkB,OAAO,WAAW,CAAC,CAAC;AAAA,EACvF,CAAC;AAED,wBAAG,0CAA0C,MAAM;AACjD,UAAM,MAAM,QAAQ;AAAA,MAClB,UAAU;AAAA,QACR,OAAO;AAAA,QACP,OAAO;AAAA,QACP,aAAa,EAAE,UAAU,IAAM,OAAO,OAAO;AAAA,MAC/C;AAAA,IACF,CAAC;AACD,8BAAO,IAAI,MAAM,EAAE,QAAQ,EAAE,QAAQ;AAAA,MACnC;AAAA,QACE,OAAO;AAAA,QACP,OAAO;AAAA,QACP,aAAa,EAAE,UAAU,IAAM,OAAO,OAAO;AAAA,MAC/C;AAAA,IACF,CAAC;AAAA,EACH,CAAC;AAED,wBAAG,qCAAqC,MAAM;AAC5C,UAAM,MAAM,QAAQ;AAAA,MAClB,UAAU;AAAA,QACR;AAAA,QACA,EAAE,OAAO,cAAc,OAAO,UAAU,aAAa,EAAE,OAAO,OAAO,EAAE;AAAA,QACvE;AAAA,MACF;AAAA,IACF,CAAC;AACD,8BAAO,IAAI,MAAM,EAAE,QAAQ,EAAE,QAAQ;AAAA,MACnC,EAAE,OAAO,kBAAkB,OAAO,SAAS;AAAA,MAC3C,EAAE,OAAO,cAAc,OAAO,UAAU,aAAa,EAAE,OAAO,OAAO,EAAE;AAAA,MACvE,EAAE,OAAO,aAAa,OAAO,GAAG;AAAA,IAClC,CAAC;AAAA,EACH,CAAC;AAED,wBAAG,sCAAsC,MAAM;AAC7C,UAAM,MAAM,QAAQ;AACpB,8BAAO,IAAI,MAAM,EAAE,WAAW,EAAE,QAAQ,wCAA2B;AAAA,EACrE,CAAC;AAED,wBAAG,8BAA8B,MAAM;AACrC,UAAM,SAA4B,EAAE,WAAW,KAAO,UAAU,GAAG,iBAAiB,IAAK;AACzF,UAAM,MAA
M,QAAQ,EAAE,aAAa,OAAO,CAAC;AAC3C,8BAAO,IAAI,MAAM,EAAE,WAAW,EAAE,QAAQ,MAAM;AAC9C,8BAAO,IAAI,MAAM,EAAE,YAAa,SAAS,EAAE,KAAK,GAAK;AAAA,EACvD,CAAC;AAED,wBAAG,+BAA+B,MAAM;AACtC,UAAM,SAA4B,EAAE,WAAW,KAAO,UAAU,GAAG,iBAAiB,IAAK;AACzF,UAAM,MAAM,QAAQ,EAAE,aAAa,OAAO,CAAC;AAC3C,8BAAO,IAAI,MAAM,EAAE,WAAW,EAAE,QAAQ,MAAM;AAC9C,8BAAO,IAAI,MAAM,EAAE,YAAa,QAAQ,EAAE,KAAK,CAAC;AAAA,EAClD,CAAC;AAED,wBAAG,2BAA2B,MAAM;AAClC,UAAM,SAA4B,EAAE,WAAW,KAAO,UAAU,IAAI,iBAAiB,IAAK;AAC1F,UAAM,MAAM,QAAQ,EAAE,aAAa,OAAO,CAAC;AAC3C,8BAAO,IAAI,MAAM,EAAE,WAAW,EAAE,QAAQ,MAAM;AAC9C,8BAAO,IAAI,MAAM,EAAE,YAAa,SAAS,EAAE,KAAK,GAAK;AACrD,8BAAO,IAAI,MAAM,EAAE,YAAa,QAAQ,EAAE,KAAK,EAAE;AACjD,8BAAO,IAAI,MAAM,EAAE,YAAa,eAAe,EAAE,KAAK,GAAI;AAAA,EAC5D,CAAC;AACH,CAAC;AAAA,IAED,wBAAS,oCAAoC,MAAM;AACjD,wBAAG,gDAAgD,MAAM;AACvD,UAAM,eAAe;AAAA,MACnB,OAAO;AAAA,MACP,WAAW;AAAA,MACX,kBAAkB;AAAA,MAClB,gBAAgB;AAAA,IAClB;AAEA,UAAM,MAAM,IAAI,eAAI;AAAA,MAClB,OAAO;AAAA,MACP,QAAQ;AAAA,MACR,WAAW;AAAA,MACX,SAAS;AAAA,MACT;AAAA,IACF,CAAC;AAED,8BAAO,IAAI,MAAM,EAAE,YAAY,EAAE,QAAQ,YAAY;AAAA,EACvD,CAAC;AAED,wBAAG,qDAAqD,MAAM;AAC5D,UAAM,eAAe;AAAA,MACnB,OAAO;AAAA,MACP,SAAS;AAAA,MACT,gBAAgB;AAAA,IAClB;AAEA,UAAM,MAAM,IAAI,eAAI;AAAA,MAClB,OAAO;AAAA,MACP,QAAQ;AAAA,MACR,WAAW;AAAA,MACX,SAAS;AAAA,MACT;AAAA,IACF,CAAC;AAED,8BAAO,IAAI,MAAM,EAAE,YAAY,EAAE,QAAQ,YAAY;AAAA,EACvD,CAAC;AAED,wBAAG,4CAA4C,MAAM;AACnD,UAAM,eAAe,EAAE,aAAa,KAAK;AAEzC,UAAM,MAAM,IAAI,eAAI;AAAA,MAClB,OAAO;AAAA,MACP,QAAQ;AAAA,MACR,WAAW;AAAA,MACX,SAAS;AAAA,MACT;AAAA,IACF,CAAC;AAED,8BAAO,IAAI,MAAM,EAAE,YAAY,EAAE,QAAQ,YAAY;AAAA,EACvD,CAAC;AAED,wBAAG,wCAAwC,MAAM;AAC/C,UAAM,eAAe;AAAA,MACnB,aAAa;AAAA,MACb,wBAAwB;AAAA,IAC1B;AAEA,UAAM,MAAM,IAAI,eAAI;AAAA,MAClB,OAAO;AAAA,MACP,QAAQ;AAAA,MACR,WAAW;AAAA,MACX,SAAS;AAAA,MACT;AAAA,IACF,CAAC;AAED,8BAAO,IAAI,MAAM,EAAE,YAAY,EAAE,QAAQ,YAAY;AAAA,EACvD,CAAC;AAED,wBAAG,2CAA2C,MAAM;AAClD,UAAM,eAAe;AAAA,MACnB,gBAAgB;AAAA,MAChB,0BAA0B;AAAA,IAC5B;AAEA,UAAM,MAAM,IAAI,eAAI;AAAA,MAClB,OAAO;AAAA,MACP,QAAQ;AAAA,MACR,WAAW;AAAA,MACX,SAAS;AAAA,MACT;AAAA,IACF,CAAC;AAED,8BA
AO,IAAI,MAAM,EAAE,YAAY,EAAE,QAAQ,YAAY;AAAA,EACvD,CAAC;AACH,CAAC;","names":[]}
@@ -0,0 +1,304 @@
1
+ import { beforeAll, describe, expect, it } from "vitest";
2
+ import { normalizeLanguage } from "../language.js";
3
+ import { initializeLogger } from "../log.js";
4
+ import { DEFAULT_API_CONNECT_OPTIONS } from "../types.js";
5
+ import { TTS, normalizeTTSFallback, parseTTSModelString } from "./tts.js";
6
+ beforeAll(() => {
7
+ initializeLogger({ level: "silent", pretty: false });
8
+ });
9
+ function makeTts(overrides = {}) {
10
+ const defaults = {
11
+ model: "cartesia/sonic",
12
+ apiKey: "test-key",
13
+ apiSecret: "test-secret",
14
+ baseURL: "https://example.livekit.cloud"
15
+ };
16
+ return new TTS({ ...defaults, ...overrides });
17
+ }
18
+ describe("parseTTSModelString", () => {
19
+ it("simple model without voice", () => {
20
+ const [model, voice] = parseTTSModelString("cartesia");
21
+ expect(model).toBe("cartesia");
22
+ expect(voice).toBeUndefined();
23
+ });
24
+ it("model with voice suffix", () => {
25
+ const [model, voice] = parseTTSModelString("cartesia:my-voice-id");
26
+ expect(model).toBe("cartesia");
27
+ expect(voice).toBe("my-voice-id");
28
+ });
29
+ it("provider/model format without voice", () => {
30
+ const [model, voice] = parseTTSModelString("cartesia/sonic");
31
+ expect(model).toBe("cartesia/sonic");
32
+ expect(voice).toBeUndefined();
33
+ });
34
+ it("provider/model format with voice", () => {
35
+ const [model, voice] = parseTTSModelString("cartesia/sonic:my-voice-id");
36
+ expect(model).toBe("cartesia/sonic");
37
+ expect(voice).toBe("my-voice-id");
38
+ });
39
+ it.each([
40
+ ["elevenlabs/eleven_flash_v2:voice123", "elevenlabs/eleven_flash_v2", "voice123"],
41
+ ["rime:speaker-a", "rime", "speaker-a"],
42
+ ["rime/mist:narrator", "rime/mist", "narrator"],
43
+ ["inworld/inworld-tts-1:character", "inworld/inworld-tts-1", "character"],
44
+ ["cartesia/sonic-turbo:deep-voice", "cartesia/sonic-turbo", "deep-voice"]
45
+ ])("various providers and voices: %s", (modelStr, expectedModel, expectedVoice) => {
46
+ const [model, voice] = parseTTSModelString(modelStr);
47
+ expect(model).toBe(expectedModel);
48
+ expect(voice).toBe(expectedVoice);
49
+ });
50
+ it("empty voice after colon", () => {
51
+ const [model, voice] = parseTTSModelString("cartesia/sonic:");
52
+ expect(model).toBe("cartesia/sonic");
53
+ expect(voice).toBe("");
54
+ });
55
+ });
56
+ describe("normalizeTTSFallback", () => {
57
+ it("single string model", () => {
58
+ const result = normalizeTTSFallback("cartesia/sonic");
59
+ expect(result).toEqual([{ model: "cartesia/sonic", voice: "" }]);
60
+ });
61
+ it("single string model with voice", () => {
62
+ const result = normalizeTTSFallback("cartesia/sonic:my-voice");
63
+ expect(result).toEqual([{ model: "cartesia/sonic", voice: "my-voice" }]);
64
+ });
65
+ it("single FallbackModel dict", () => {
66
+ const fallback = { model: "cartesia/sonic", voice: "narrator" };
67
+ const result = normalizeTTSFallback(fallback);
68
+ expect(result).toEqual([{ model: "cartesia/sonic", voice: "narrator" }]);
69
+ });
70
+ it("list of string models", () => {
71
+ const result = normalizeTTSFallback(["cartesia/sonic", "elevenlabs/eleven_flash_v2"]);
72
+ expect(result).toEqual([
73
+ { model: "cartesia/sonic", voice: "" },
74
+ { model: "elevenlabs/eleven_flash_v2", voice: "" }
75
+ ]);
76
+ });
77
+ it("list of string models with voices", () => {
78
+ const result = normalizeTTSFallback(["cartesia/sonic:voice1", "elevenlabs:voice2"]);
79
+ expect(result).toEqual([
80
+ { model: "cartesia/sonic", voice: "voice1" },
81
+ { model: "elevenlabs", voice: "voice2" }
82
+ ]);
83
+ });
84
+ it("list of FallbackModel dicts", () => {
85
+ const fallbacks = [
86
+ { model: "cartesia/sonic", voice: "narrator" },
87
+ { model: "elevenlabs", voice: "" }
88
+ ];
89
+ const result = normalizeTTSFallback(fallbacks);
90
+ expect(result).toEqual([
91
+ { model: "cartesia/sonic", voice: "narrator" },
92
+ { model: "elevenlabs", voice: "" }
93
+ ]);
94
+ });
95
+ it("mixed list of strings and dicts", () => {
96
+ const result = normalizeTTSFallback([
97
+ "cartesia/sonic:voice1",
98
+ { model: "elevenlabs/eleven_flash_v2", voice: "custom" },
99
+ "rime/mist"
100
+ ]);
101
+ expect(result).toEqual([
102
+ { model: "cartesia/sonic", voice: "voice1" },
103
+ { model: "elevenlabs/eleven_flash_v2", voice: "custom" },
104
+ { model: "rime/mist", voice: "" }
105
+ ]);
106
+ });
107
+ it("FallbackModel with extraKwargs is preserved", () => {
108
+ const fallback = {
109
+ model: "cartesia/sonic",
110
+ voice: "narrator",
111
+ extraKwargs: { duration: 30, speed: "fast" }
112
+ };
113
+ const result = normalizeTTSFallback(fallback);
114
+ expect(result).toEqual([
115
+ {
116
+ model: "cartesia/sonic",
117
+ voice: "narrator",
118
+ extraKwargs: { duration: 30, speed: "fast" }
119
+ }
120
+ ]);
121
+ });
122
+ it("list with extraKwargs preserved", () => {
123
+ const result = normalizeTTSFallback([
124
+ { model: "cartesia/sonic", voice: "v1", extraKwargs: { speed: "slow" } },
125
+ "elevenlabs:voice2",
126
+ { model: "rime/mist", voice: "", extraKwargs: { custom: true } }
127
+ ]);
128
+ expect(result).toEqual([
129
+ { model: "cartesia/sonic", voice: "v1", extraKwargs: { speed: "slow" } },
130
+ { model: "elevenlabs", voice: "voice2" },
131
+ { model: "rime/mist", voice: "", extraKwargs: { custom: true } }
132
+ ]);
133
+ });
134
+ it("empty list returns empty list", () => {
135
+ const result = normalizeTTSFallback([]);
136
+ expect(result).toEqual([]);
137
+ });
138
+ it("FallbackModel with empty voice", () => {
139
+ const fallback = { model: "cartesia/sonic", voice: "" };
140
+ const result = normalizeTTSFallback(fallback);
141
+ expect(result).toEqual([{ model: "cartesia/sonic", voice: "" }]);
142
+ });
143
+ });
144
+ describe("TTS constructor fallback and connOptions", () => {
145
+ it("normalizes language in constructor", () => {
146
+ const tts = makeTts({ language: "english" });
147
+ expect(tts["opts"].language).toBe("en");
148
+ });
149
+ it("normalizes updated language values", () => {
150
+ const tts = makeTts();
151
+ tts.updateOptions({ language: "en_US" });
152
+ expect(tts["opts"].language).toBe(normalizeLanguage("en_US"));
153
+ });
154
+ it("fallback not given defaults to undefined", () => {
155
+ const tts = makeTts();
156
+ expect(tts["opts"].fallback).toBeUndefined();
157
+ });
158
+ it("fallback single string is normalized", () => {
159
+ const tts = makeTts({ fallback: "elevenlabs/eleven_flash_v2" });
160
+ expect(tts["opts"].fallback).toEqual([{ model: "elevenlabs/eleven_flash_v2", voice: "" }]);
161
+ });
162
+ it("fallback single string with voice is normalized", () => {
163
+ const tts = makeTts({ fallback: "cartesia/sonic:my-voice" });
164
+ expect(tts["opts"].fallback).toEqual([{ model: "cartesia/sonic", voice: "my-voice" }]);
165
+ });
166
+ it("fallback list of strings is normalized", () => {
167
+ const tts = makeTts({ fallback: ["cartesia/sonic", "elevenlabs"] });
168
+ expect(tts["opts"].fallback).toEqual([
169
+ { model: "cartesia/sonic", voice: "" },
170
+ { model: "elevenlabs", voice: "" }
171
+ ]);
172
+ });
173
+ it("fallback single FallbackModel is normalized to list", () => {
174
+ const tts = makeTts({ fallback: { model: "cartesia/sonic", voice: "narrator" } });
175
+ expect(tts["opts"].fallback).toEqual([{ model: "cartesia/sonic", voice: "narrator" }]);
176
+ });
177
+ it("fallback with extraKwargs is preserved", () => {
178
+ const tts = makeTts({
179
+ fallback: {
180
+ model: "cartesia/sonic",
181
+ voice: "narrator",
182
+ extraKwargs: { duration: 30, speed: "fast" }
183
+ }
184
+ });
185
+ expect(tts["opts"].fallback).toEqual([
186
+ {
187
+ model: "cartesia/sonic",
188
+ voice: "narrator",
189
+ extraKwargs: { duration: 30, speed: "fast" }
190
+ }
191
+ ]);
192
+ });
193
+ it("fallback mixed list is normalized", () => {
194
+ const tts = makeTts({
195
+ fallback: [
196
+ "cartesia/sonic:voice1",
197
+ { model: "elevenlabs", voice: "custom", extraKwargs: { speed: "slow" } },
198
+ "rime/mist"
199
+ ]
200
+ });
201
+ expect(tts["opts"].fallback).toEqual([
202
+ { model: "cartesia/sonic", voice: "voice1" },
203
+ { model: "elevenlabs", voice: "custom", extraKwargs: { speed: "slow" } },
204
+ { model: "rime/mist", voice: "" }
205
+ ]);
206
+ });
207
+ it("connOptions not given uses default", () => {
208
+ const tts = makeTts();
209
+ expect(tts["opts"].connOptions).toEqual(DEFAULT_API_CONNECT_OPTIONS);
210
+ });
211
+ it("connOptions custom timeout", () => {
212
+ const custom = { timeoutMs: 3e4, maxRetry: 3, retryIntervalMs: 2e3 };
213
+ const tts = makeTts({ connOptions: custom });
214
+ expect(tts["opts"].connOptions).toEqual(custom);
215
+ expect(tts["opts"].connOptions.timeoutMs).toBe(3e4);
216
+ });
217
+ it("connOptions custom maxRetry", () => {
218
+ const custom = { timeoutMs: 1e4, maxRetry: 5, retryIntervalMs: 2e3 };
219
+ const tts = makeTts({ connOptions: custom });
220
+ expect(tts["opts"].connOptions).toEqual(custom);
221
+ expect(tts["opts"].connOptions.maxRetry).toBe(5);
222
+ });
223
+ it("connOptions full custom", () => {
224
+ const custom = { timeoutMs: 6e4, maxRetry: 10, retryIntervalMs: 2e3 };
225
+ const tts = makeTts({ connOptions: custom });
226
+ expect(tts["opts"].connOptions).toEqual(custom);
227
+ expect(tts["opts"].connOptions.timeoutMs).toBe(6e4);
228
+ expect(tts["opts"].connOptions.maxRetry).toBe(10);
229
+ expect(tts["opts"].connOptions.retryIntervalMs).toBe(2e3);
230
+ });
231
+ });
232
+ describe("TTS provider modelOptions parity", () => {
233
+ it("preserves ElevenLabs inference model options", () => {
234
+ const modelOptions = {
235
+ speed: 1.2,
236
+ stability: 0.5,
237
+ similarity_boost: 0.8,
238
+ enable_logging: false
239
+ };
240
+ const tts = new TTS({
241
+ model: "elevenlabs/eleven_flash_v2_5",
242
+ apiKey: "test-key",
243
+ apiSecret: "test-secret",
244
+ baseURL: "https://example.livekit.cloud",
245
+ modelOptions
246
+ });
247
+ expect(tts["opts"].modelOptions).toEqual(modelOptions);
248
+ });
249
+ it("accepts expanded Cartesia inference model options", () => {
250
+ const modelOptions = {
251
+ speed: 1.15,
252
+ emotion: "curious",
253
+ add_timestamps: true
254
+ };
255
+ const tts = new TTS({
256
+ model: "cartesia/sonic",
257
+ apiKey: "test-key",
258
+ apiSecret: "test-secret",
259
+ baseURL: "https://example.livekit.cloud",
260
+ modelOptions
261
+ });
262
+ expect(tts["opts"].modelOptions).toEqual(modelOptions);
263
+ });
264
+ it("accepts Deepgram inference model options", () => {
265
+ const modelOptions = { mip_opt_out: true };
266
+ const tts = new TTS({
267
+ model: "deepgram/aura-2",
268
+ apiKey: "test-key",
269
+ apiSecret: "test-secret",
270
+ baseURL: "https://example.livekit.cloud",
271
+ modelOptions
272
+ });
273
+ expect(tts["opts"].modelOptions).toEqual(modelOptions);
274
+ });
275
+ it("accepts Rime inference model options", () => {
276
+ const modelOptions = {
277
+ speed_alpha: 0.9,
278
+ pause_between_brackets: true
279
+ };
280
+ const tts = new TTS({
281
+ model: "rime/mistv2",
282
+ apiKey: "test-key",
283
+ apiSecret: "test-secret",
284
+ baseURL: "https://example.livekit.cloud",
285
+ modelOptions
286
+ });
287
+ expect(tts["opts"].modelOptions).toEqual(modelOptions);
288
+ });
289
+ it("accepts Inworld inference model options", () => {
290
+ const modelOptions = {
291
+ timestamp_type: "WORD",
292
+ apply_text_normalization: "ON"
293
+ };
294
+ const tts = new TTS({
295
+ model: "inworld/inworld-tts-1",
296
+ apiKey: "test-key",
297
+ apiSecret: "test-secret",
298
+ baseURL: "https://example.livekit.cloud",
299
+ modelOptions
300
+ });
301
+ expect(tts["opts"].modelOptions).toEqual(modelOptions);
302
+ });
303
+ });
304
+ //# sourceMappingURL=tts.test.js.map