@livekit/agents 1.1.0 → 1.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (942) hide show
  1. package/dist/audio.cjs +89 -3
  2. package/dist/audio.cjs.map +1 -1
  3. package/dist/audio.d.cts +36 -1
  4. package/dist/audio.d.ts +36 -1
  5. package/dist/audio.d.ts.map +1 -1
  6. package/dist/audio.js +76 -2
  7. package/dist/audio.js.map +1 -1
  8. package/dist/beta/index.cjs +29 -0
  9. package/dist/beta/index.cjs.map +1 -0
  10. package/dist/beta/index.d.cts +2 -0
  11. package/dist/beta/index.d.ts +2 -0
  12. package/dist/beta/index.d.ts.map +1 -0
  13. package/dist/beta/index.js +7 -0
  14. package/dist/beta/index.js.map +1 -0
  15. package/dist/beta/workflows/index.cjs +29 -0
  16. package/dist/beta/workflows/index.cjs.map +1 -0
  17. package/dist/beta/workflows/index.d.cts +2 -0
  18. package/dist/beta/workflows/index.d.ts +2 -0
  19. package/dist/beta/workflows/index.d.ts.map +1 -0
  20. package/dist/beta/workflows/index.js +7 -0
  21. package/dist/beta/workflows/index.js.map +1 -0
  22. package/dist/beta/workflows/task_group.cjs +162 -0
  23. package/dist/beta/workflows/task_group.cjs.map +1 -0
  24. package/dist/beta/workflows/task_group.d.cts +32 -0
  25. package/dist/beta/workflows/task_group.d.ts +32 -0
  26. package/dist/beta/workflows/task_group.d.ts.map +1 -0
  27. package/dist/beta/workflows/task_group.js +138 -0
  28. package/dist/beta/workflows/task_group.js.map +1 -0
  29. package/dist/cli.cjs +44 -46
  30. package/dist/cli.cjs.map +1 -1
  31. package/dist/cli.d.cts +3 -3
  32. package/dist/cli.d.ts +3 -3
  33. package/dist/cli.d.ts.map +1 -1
  34. package/dist/cli.js +45 -47
  35. package/dist/cli.js.map +1 -1
  36. package/dist/connection_pool.cjs +242 -0
  37. package/dist/connection_pool.cjs.map +1 -0
  38. package/dist/connection_pool.d.cts +123 -0
  39. package/dist/connection_pool.d.ts +123 -0
  40. package/dist/connection_pool.d.ts.map +1 -0
  41. package/dist/connection_pool.js +218 -0
  42. package/dist/connection_pool.js.map +1 -0
  43. package/dist/connection_pool.test.cjs +256 -0
  44. package/dist/connection_pool.test.cjs.map +1 -0
  45. package/dist/connection_pool.test.js +255 -0
  46. package/dist/connection_pool.test.js.map +1 -0
  47. package/dist/constants.cjs +30 -0
  48. package/dist/constants.cjs.map +1 -1
  49. package/dist/constants.d.cts +10 -0
  50. package/dist/constants.d.ts +10 -0
  51. package/dist/constants.d.ts.map +1 -1
  52. package/dist/constants.js +20 -0
  53. package/dist/constants.js.map +1 -1
  54. package/dist/cpu.cjs +189 -0
  55. package/dist/cpu.cjs.map +1 -0
  56. package/dist/cpu.d.cts +24 -0
  57. package/dist/cpu.d.ts +24 -0
  58. package/dist/cpu.d.ts.map +1 -0
  59. package/dist/cpu.js +152 -0
  60. package/dist/cpu.js.map +1 -0
  61. package/dist/cpu.test.cjs +227 -0
  62. package/dist/cpu.test.cjs.map +1 -0
  63. package/dist/cpu.test.js +204 -0
  64. package/dist/cpu.test.js.map +1 -0
  65. package/dist/http_server.cjs +9 -6
  66. package/dist/http_server.cjs.map +1 -1
  67. package/dist/http_server.d.cts +5 -1
  68. package/dist/http_server.d.ts +5 -1
  69. package/dist/http_server.d.ts.map +1 -1
  70. package/dist/http_server.js +9 -6
  71. package/dist/http_server.js.map +1 -1
  72. package/dist/index.cjs +24 -9
  73. package/dist/index.cjs.map +1 -1
  74. package/dist/index.d.cts +15 -11
  75. package/dist/index.d.ts +15 -11
  76. package/dist/index.d.ts.map +1 -1
  77. package/dist/index.js +18 -9
  78. package/dist/index.js.map +1 -1
  79. package/dist/inference/api_protos.cjs +70 -2
  80. package/dist/inference/api_protos.cjs.map +1 -1
  81. package/dist/inference/api_protos.d.cts +373 -32
  82. package/dist/inference/api_protos.d.ts +373 -32
  83. package/dist/inference/api_protos.d.ts.map +1 -1
  84. package/dist/inference/api_protos.js +62 -2
  85. package/dist/inference/api_protos.js.map +1 -1
  86. package/dist/inference/index.cjs +8 -0
  87. package/dist/inference/index.cjs.map +1 -1
  88. package/dist/inference/index.d.cts +3 -4
  89. package/dist/inference/index.d.ts +3 -4
  90. package/dist/inference/index.d.ts.map +1 -1
  91. package/dist/inference/index.js +18 -3
  92. package/dist/inference/index.js.map +1 -1
  93. package/dist/inference/interruption/defaults.cjs +81 -0
  94. package/dist/inference/interruption/defaults.cjs.map +1 -0
  95. package/dist/inference/interruption/defaults.d.cts +19 -0
  96. package/dist/inference/interruption/defaults.d.ts +19 -0
  97. package/dist/inference/interruption/defaults.d.ts.map +1 -0
  98. package/dist/inference/interruption/defaults.js +46 -0
  99. package/dist/inference/interruption/defaults.js.map +1 -0
  100. package/dist/inference/interruption/errors.cjs +44 -0
  101. package/dist/inference/interruption/errors.cjs.map +1 -0
  102. package/dist/inference/interruption/errors.d.cts +12 -0
  103. package/dist/inference/interruption/errors.d.ts +12 -0
  104. package/dist/inference/interruption/errors.d.ts.map +1 -0
  105. package/dist/inference/interruption/errors.js +20 -0
  106. package/dist/inference/interruption/errors.js.map +1 -0
  107. package/dist/inference/interruption/http_transport.cjs +163 -0
  108. package/dist/inference/interruption/http_transport.cjs.map +1 -0
  109. package/dist/inference/interruption/http_transport.d.cts +63 -0
  110. package/dist/inference/interruption/http_transport.d.ts +63 -0
  111. package/dist/inference/interruption/http_transport.d.ts.map +1 -0
  112. package/dist/inference/interruption/http_transport.js +137 -0
  113. package/dist/inference/interruption/http_transport.js.map +1 -0
  114. package/dist/inference/interruption/interruption_cache_entry.cjs +58 -0
  115. package/dist/inference/interruption/interruption_cache_entry.cjs.map +1 -0
  116. package/dist/inference/interruption/interruption_cache_entry.d.cts +30 -0
  117. package/dist/inference/interruption/interruption_cache_entry.d.ts +30 -0
  118. package/dist/inference/interruption/interruption_cache_entry.d.ts.map +1 -0
  119. package/dist/inference/interruption/interruption_cache_entry.js +34 -0
  120. package/dist/inference/interruption/interruption_cache_entry.js.map +1 -0
  121. package/dist/inference/interruption/interruption_detector.cjs +198 -0
  122. package/dist/inference/interruption/interruption_detector.cjs.map +1 -0
  123. package/dist/inference/interruption/interruption_detector.d.cts +59 -0
  124. package/dist/inference/interruption/interruption_detector.d.ts +59 -0
  125. package/dist/inference/interruption/interruption_detector.d.ts.map +1 -0
  126. package/dist/inference/interruption/interruption_detector.js +164 -0
  127. package/dist/inference/interruption/interruption_detector.js.map +1 -0
  128. package/dist/inference/interruption/interruption_stream.cjs +368 -0
  129. package/dist/inference/interruption/interruption_stream.cjs.map +1 -0
  130. package/dist/inference/interruption/interruption_stream.d.cts +46 -0
  131. package/dist/inference/interruption/interruption_stream.d.ts +46 -0
  132. package/dist/inference/interruption/interruption_stream.d.ts.map +1 -0
  133. package/dist/inference/interruption/interruption_stream.js +344 -0
  134. package/dist/inference/interruption/interruption_stream.js.map +1 -0
  135. package/dist/inference/interruption/types.cjs +17 -0
  136. package/dist/inference/interruption/types.cjs.map +1 -0
  137. package/dist/inference/interruption/types.d.cts +66 -0
  138. package/dist/inference/interruption/types.d.ts +66 -0
  139. package/dist/inference/interruption/types.d.ts.map +1 -0
  140. package/dist/inference/interruption/types.js +1 -0
  141. package/dist/inference/interruption/types.js.map +1 -0
  142. package/dist/inference/interruption/utils.cjs +130 -0
  143. package/dist/inference/interruption/utils.cjs.map +1 -0
  144. package/dist/inference/interruption/utils.d.cts +41 -0
  145. package/dist/inference/interruption/utils.d.ts +41 -0
  146. package/dist/inference/interruption/utils.d.ts.map +1 -0
  147. package/dist/inference/interruption/utils.js +105 -0
  148. package/dist/inference/interruption/utils.js.map +1 -0
  149. package/dist/inference/interruption/utils.test.cjs +105 -0
  150. package/dist/inference/interruption/utils.test.cjs.map +1 -0
  151. package/dist/inference/interruption/utils.test.js +104 -0
  152. package/dist/inference/interruption/utils.test.js.map +1 -0
  153. package/dist/inference/interruption/ws_transport.cjs +342 -0
  154. package/dist/inference/interruption/ws_transport.cjs.map +1 -0
  155. package/dist/inference/interruption/ws_transport.d.cts +33 -0
  156. package/dist/inference/interruption/ws_transport.d.ts +33 -0
  157. package/dist/inference/interruption/ws_transport.d.ts.map +1 -0
  158. package/dist/inference/interruption/ws_transport.js +308 -0
  159. package/dist/inference/interruption/ws_transport.js.map +1 -0
  160. package/dist/inference/llm.cjs +106 -66
  161. package/dist/inference/llm.cjs.map +1 -1
  162. package/dist/inference/llm.d.cts +65 -43
  163. package/dist/inference/llm.d.ts +65 -43
  164. package/dist/inference/llm.d.ts.map +1 -1
  165. package/dist/inference/llm.js +100 -66
  166. package/dist/inference/llm.js.map +1 -1
  167. package/dist/inference/stt.cjs +319 -170
  168. package/dist/inference/stt.cjs.map +1 -1
  169. package/dist/inference/stt.d.cts +64 -15
  170. package/dist/inference/stt.d.ts +64 -15
  171. package/dist/inference/stt.d.ts.map +1 -1
  172. package/dist/inference/stt.js +319 -170
  173. package/dist/inference/stt.js.map +1 -1
  174. package/dist/inference/stt.test.cjs +218 -0
  175. package/dist/inference/stt.test.cjs.map +1 -0
  176. package/dist/inference/stt.test.js +217 -0
  177. package/dist/inference/stt.test.js.map +1 -0
  178. package/dist/inference/tts.cjs +249 -71
  179. package/dist/inference/tts.cjs.map +1 -1
  180. package/dist/inference/tts.d.cts +55 -16
  181. package/dist/inference/tts.d.ts +55 -16
  182. package/dist/inference/tts.d.ts.map +1 -1
  183. package/dist/inference/tts.js +249 -77
  184. package/dist/inference/tts.js.map +1 -1
  185. package/dist/inference/tts.test.cjs +233 -0
  186. package/dist/inference/tts.test.cjs.map +1 -0
  187. package/dist/inference/tts.test.js +232 -0
  188. package/dist/inference/tts.test.js.map +1 -0
  189. package/dist/inference/utils.cjs +26 -7
  190. package/dist/inference/utils.cjs.map +1 -1
  191. package/dist/inference/utils.d.cts +14 -1
  192. package/dist/inference/utils.d.ts +14 -1
  193. package/dist/inference/utils.d.ts.map +1 -1
  194. package/dist/inference/utils.js +18 -2
  195. package/dist/inference/utils.js.map +1 -1
  196. package/dist/ipc/inference_proc_executor.cjs +6 -3
  197. package/dist/ipc/inference_proc_executor.cjs.map +1 -1
  198. package/dist/ipc/inference_proc_executor.d.ts.map +1 -1
  199. package/dist/ipc/inference_proc_executor.js +6 -3
  200. package/dist/ipc/inference_proc_executor.js.map +1 -1
  201. package/dist/ipc/inference_proc_lazy_main.cjs +13 -1
  202. package/dist/ipc/inference_proc_lazy_main.cjs.map +1 -1
  203. package/dist/ipc/inference_proc_lazy_main.js +13 -1
  204. package/dist/ipc/inference_proc_lazy_main.js.map +1 -1
  205. package/dist/ipc/job_proc_executor.cjs +6 -1
  206. package/dist/ipc/job_proc_executor.cjs.map +1 -1
  207. package/dist/ipc/job_proc_executor.d.ts.map +1 -1
  208. package/dist/ipc/job_proc_executor.js +6 -1
  209. package/dist/ipc/job_proc_executor.js.map +1 -1
  210. package/dist/ipc/job_proc_lazy_main.cjs +89 -17
  211. package/dist/ipc/job_proc_lazy_main.cjs.map +1 -1
  212. package/dist/ipc/job_proc_lazy_main.js +68 -18
  213. package/dist/ipc/job_proc_lazy_main.js.map +1 -1
  214. package/dist/ipc/supervised_proc.cjs +34 -8
  215. package/dist/ipc/supervised_proc.cjs.map +1 -1
  216. package/dist/ipc/supervised_proc.d.cts +8 -0
  217. package/dist/ipc/supervised_proc.d.ts +8 -0
  218. package/dist/ipc/supervised_proc.d.ts.map +1 -1
  219. package/dist/ipc/supervised_proc.js +34 -8
  220. package/dist/ipc/supervised_proc.js.map +1 -1
  221. package/dist/ipc/supervised_proc.test.cjs +145 -0
  222. package/dist/ipc/supervised_proc.test.cjs.map +1 -0
  223. package/dist/ipc/supervised_proc.test.js +122 -0
  224. package/dist/ipc/supervised_proc.test.js.map +1 -0
  225. package/dist/job.cjs +109 -1
  226. package/dist/job.cjs.map +1 -1
  227. package/dist/job.d.cts +14 -0
  228. package/dist/job.d.ts +14 -0
  229. package/dist/job.d.ts.map +1 -1
  230. package/dist/job.js +99 -1
  231. package/dist/job.js.map +1 -1
  232. package/dist/language.cjs +394 -0
  233. package/dist/language.cjs.map +1 -0
  234. package/dist/language.d.cts +15 -0
  235. package/dist/language.d.ts +15 -0
  236. package/dist/language.d.ts.map +1 -0
  237. package/dist/language.js +363 -0
  238. package/dist/language.js.map +1 -0
  239. package/dist/language.test.cjs +43 -0
  240. package/dist/language.test.cjs.map +1 -0
  241. package/dist/language.test.js +49 -0
  242. package/dist/language.test.js.map +1 -0
  243. package/dist/llm/chat_context.cjs +274 -3
  244. package/dist/llm/chat_context.cjs.map +1 -1
  245. package/dist/llm/chat_context.d.cts +86 -2
  246. package/dist/llm/chat_context.d.ts +86 -2
  247. package/dist/llm/chat_context.d.ts.map +1 -1
  248. package/dist/llm/chat_context.js +273 -3
  249. package/dist/llm/chat_context.js.map +1 -1
  250. package/dist/llm/chat_context.test.cjs +574 -0
  251. package/dist/llm/chat_context.test.cjs.map +1 -1
  252. package/dist/llm/chat_context.test.js +574 -0
  253. package/dist/llm/chat_context.test.js.map +1 -1
  254. package/dist/llm/fallback_adapter.cjs +278 -0
  255. package/dist/llm/fallback_adapter.cjs.map +1 -0
  256. package/dist/llm/fallback_adapter.d.cts +73 -0
  257. package/dist/llm/fallback_adapter.d.ts +73 -0
  258. package/dist/llm/fallback_adapter.d.ts.map +1 -0
  259. package/dist/llm/fallback_adapter.js +254 -0
  260. package/dist/llm/fallback_adapter.js.map +1 -0
  261. package/dist/llm/fallback_adapter.test.cjs +176 -0
  262. package/dist/llm/fallback_adapter.test.cjs.map +1 -0
  263. package/dist/llm/fallback_adapter.test.js +175 -0
  264. package/dist/llm/fallback_adapter.test.js.map +1 -0
  265. package/dist/llm/index.cjs +9 -0
  266. package/dist/llm/index.cjs.map +1 -1
  267. package/dist/llm/index.d.cts +4 -3
  268. package/dist/llm/index.d.ts +4 -3
  269. package/dist/llm/index.d.ts.map +1 -1
  270. package/dist/llm/index.js +11 -1
  271. package/dist/llm/index.js.map +1 -1
  272. package/dist/llm/llm.cjs +65 -11
  273. package/dist/llm/llm.cjs.map +1 -1
  274. package/dist/llm/llm.d.cts +13 -2
  275. package/dist/llm/llm.d.ts +13 -2
  276. package/dist/llm/llm.d.ts.map +1 -1
  277. package/dist/llm/llm.js +65 -11
  278. package/dist/llm/llm.js.map +1 -1
  279. package/dist/llm/provider_format/google.cjs +6 -2
  280. package/dist/llm/provider_format/google.cjs.map +1 -1
  281. package/dist/llm/provider_format/google.d.cts +1 -1
  282. package/dist/llm/provider_format/google.d.ts +1 -1
  283. package/dist/llm/provider_format/google.d.ts.map +1 -1
  284. package/dist/llm/provider_format/google.js +6 -2
  285. package/dist/llm/provider_format/google.js.map +1 -1
  286. package/dist/llm/provider_format/google.test.cjs +48 -0
  287. package/dist/llm/provider_format/google.test.cjs.map +1 -1
  288. package/dist/llm/provider_format/google.test.js +54 -1
  289. package/dist/llm/provider_format/google.test.js.map +1 -1
  290. package/dist/llm/provider_format/index.cjs +2 -0
  291. package/dist/llm/provider_format/index.cjs.map +1 -1
  292. package/dist/llm/provider_format/index.d.cts +2 -2
  293. package/dist/llm/provider_format/index.d.ts +2 -2
  294. package/dist/llm/provider_format/index.d.ts.map +1 -1
  295. package/dist/llm/provider_format/index.js +6 -1
  296. package/dist/llm/provider_format/index.js.map +1 -1
  297. package/dist/llm/provider_format/openai.cjs +126 -24
  298. package/dist/llm/provider_format/openai.cjs.map +1 -1
  299. package/dist/llm/provider_format/openai.d.cts +1 -0
  300. package/dist/llm/provider_format/openai.d.ts +1 -0
  301. package/dist/llm/provider_format/openai.d.ts.map +1 -1
  302. package/dist/llm/provider_format/openai.js +124 -23
  303. package/dist/llm/provider_format/openai.js.map +1 -1
  304. package/dist/llm/provider_format/openai.test.cjs +393 -0
  305. package/dist/llm/provider_format/openai.test.cjs.map +1 -1
  306. package/dist/llm/provider_format/openai.test.js +400 -2
  307. package/dist/llm/provider_format/openai.test.js.map +1 -1
  308. package/dist/llm/provider_format/utils.cjs +5 -4
  309. package/dist/llm/provider_format/utils.cjs.map +1 -1
  310. package/dist/llm/provider_format/utils.d.ts.map +1 -1
  311. package/dist/llm/provider_format/utils.js +5 -4
  312. package/dist/llm/provider_format/utils.js.map +1 -1
  313. package/dist/llm/realtime.cjs +3 -0
  314. package/dist/llm/realtime.cjs.map +1 -1
  315. package/dist/llm/realtime.d.cts +15 -1
  316. package/dist/llm/realtime.d.ts +15 -1
  317. package/dist/llm/realtime.d.ts.map +1 -1
  318. package/dist/llm/realtime.js +3 -0
  319. package/dist/llm/realtime.js.map +1 -1
  320. package/dist/llm/remote_chat_context.cjs.map +1 -1
  321. package/dist/llm/remote_chat_context.d.cts +2 -0
  322. package/dist/llm/remote_chat_context.d.ts +2 -0
  323. package/dist/llm/remote_chat_context.d.ts.map +1 -1
  324. package/dist/llm/remote_chat_context.js.map +1 -1
  325. package/dist/llm/tool_context.cjs +50 -2
  326. package/dist/llm/tool_context.cjs.map +1 -1
  327. package/dist/llm/tool_context.d.cts +47 -11
  328. package/dist/llm/tool_context.d.ts +47 -11
  329. package/dist/llm/tool_context.d.ts.map +1 -1
  330. package/dist/llm/tool_context.js +48 -3
  331. package/dist/llm/tool_context.js.map +1 -1
  332. package/dist/llm/tool_context.test.cjs +197 -0
  333. package/dist/llm/tool_context.test.cjs.map +1 -1
  334. package/dist/llm/tool_context.test.js +175 -0
  335. package/dist/llm/tool_context.test.js.map +1 -1
  336. package/dist/llm/utils.cjs +18 -12
  337. package/dist/llm/utils.cjs.map +1 -1
  338. package/dist/llm/utils.d.cts +2 -3
  339. package/dist/llm/utils.d.ts +2 -3
  340. package/dist/llm/utils.d.ts.map +1 -1
  341. package/dist/llm/utils.js +18 -12
  342. package/dist/llm/utils.js.map +1 -1
  343. package/dist/llm/zod-utils.cjs +102 -0
  344. package/dist/llm/zod-utils.cjs.map +1 -0
  345. package/dist/llm/zod-utils.d.cts +65 -0
  346. package/dist/llm/zod-utils.d.ts +65 -0
  347. package/dist/llm/zod-utils.d.ts.map +1 -0
  348. package/dist/llm/zod-utils.js +64 -0
  349. package/dist/llm/zod-utils.js.map +1 -0
  350. package/dist/llm/zod-utils.test.cjs +472 -0
  351. package/dist/llm/zod-utils.test.cjs.map +1 -0
  352. package/dist/llm/zod-utils.test.js +455 -0
  353. package/dist/llm/zod-utils.test.js.map +1 -0
  354. package/dist/log.cjs +45 -14
  355. package/dist/log.cjs.map +1 -1
  356. package/dist/log.d.cts +8 -1
  357. package/dist/log.d.ts +8 -1
  358. package/dist/log.d.ts.map +1 -1
  359. package/dist/log.js +45 -15
  360. package/dist/log.js.map +1 -1
  361. package/dist/metrics/base.cjs.map +1 -1
  362. package/dist/metrics/base.d.cts +75 -19
  363. package/dist/metrics/base.d.ts +75 -19
  364. package/dist/metrics/base.d.ts.map +1 -1
  365. package/dist/metrics/index.cjs +5 -0
  366. package/dist/metrics/index.cjs.map +1 -1
  367. package/dist/metrics/index.d.cts +2 -1
  368. package/dist/metrics/index.d.ts +2 -1
  369. package/dist/metrics/index.d.ts.map +1 -1
  370. package/dist/metrics/index.js +6 -0
  371. package/dist/metrics/index.js.map +1 -1
  372. package/dist/metrics/model_usage.cjs +189 -0
  373. package/dist/metrics/model_usage.cjs.map +1 -0
  374. package/dist/metrics/model_usage.d.cts +92 -0
  375. package/dist/metrics/model_usage.d.ts +92 -0
  376. package/dist/metrics/model_usage.d.ts.map +1 -0
  377. package/dist/metrics/model_usage.js +164 -0
  378. package/dist/metrics/model_usage.js.map +1 -0
  379. package/dist/metrics/model_usage.test.cjs +474 -0
  380. package/dist/metrics/model_usage.test.cjs.map +1 -0
  381. package/dist/metrics/model_usage.test.js +476 -0
  382. package/dist/metrics/model_usage.test.js.map +1 -0
  383. package/dist/metrics/usage_collector.cjs +5 -2
  384. package/dist/metrics/usage_collector.cjs.map +1 -1
  385. package/dist/metrics/usage_collector.d.cts +10 -1
  386. package/dist/metrics/usage_collector.d.ts +10 -1
  387. package/dist/metrics/usage_collector.d.ts.map +1 -1
  388. package/dist/metrics/usage_collector.js +5 -2
  389. package/dist/metrics/usage_collector.js.map +1 -1
  390. package/dist/metrics/utils.cjs +23 -7
  391. package/dist/metrics/utils.cjs.map +1 -1
  392. package/dist/metrics/utils.d.ts.map +1 -1
  393. package/dist/metrics/utils.js +23 -7
  394. package/dist/metrics/utils.js.map +1 -1
  395. package/dist/stream/deferred_stream.cjs +31 -10
  396. package/dist/stream/deferred_stream.cjs.map +1 -1
  397. package/dist/stream/deferred_stream.d.cts +6 -1
  398. package/dist/stream/deferred_stream.d.ts +6 -1
  399. package/dist/stream/deferred_stream.d.ts.map +1 -1
  400. package/dist/stream/deferred_stream.js +31 -10
  401. package/dist/stream/deferred_stream.js.map +1 -1
  402. package/dist/stream/deferred_stream.test.cjs +2 -2
  403. package/dist/stream/deferred_stream.test.cjs.map +1 -1
  404. package/dist/stream/deferred_stream.test.js +2 -2
  405. package/dist/stream/deferred_stream.test.js.map +1 -1
  406. package/dist/stream/index.cjs +3 -0
  407. package/dist/stream/index.cjs.map +1 -1
  408. package/dist/stream/index.d.cts +1 -0
  409. package/dist/stream/index.d.ts +1 -0
  410. package/dist/stream/index.d.ts.map +1 -1
  411. package/dist/stream/index.js +2 -0
  412. package/dist/stream/index.js.map +1 -1
  413. package/dist/stream/multi_input_stream.cjs +139 -0
  414. package/dist/stream/multi_input_stream.cjs.map +1 -0
  415. package/dist/stream/multi_input_stream.d.cts +55 -0
  416. package/dist/stream/multi_input_stream.d.ts +55 -0
  417. package/dist/stream/multi_input_stream.d.ts.map +1 -0
  418. package/dist/stream/multi_input_stream.js +115 -0
  419. package/dist/stream/multi_input_stream.js.map +1 -0
  420. package/dist/stream/multi_input_stream.test.cjs +344 -0
  421. package/dist/stream/multi_input_stream.test.cjs.map +1 -0
  422. package/dist/stream/multi_input_stream.test.js +343 -0
  423. package/dist/stream/multi_input_stream.test.js.map +1 -0
  424. package/dist/stream/stream_channel.cjs +39 -1
  425. package/dist/stream/stream_channel.cjs.map +1 -1
  426. package/dist/stream/stream_channel.d.cts +5 -2
  427. package/dist/stream/stream_channel.d.ts +5 -2
  428. package/dist/stream/stream_channel.d.ts.map +1 -1
  429. package/dist/stream/stream_channel.js +39 -1
  430. package/dist/stream/stream_channel.js.map +1 -1
  431. package/dist/stream/stream_channel.test.cjs +27 -0
  432. package/dist/stream/stream_channel.test.cjs.map +1 -1
  433. package/dist/stream/stream_channel.test.js +27 -0
  434. package/dist/stream/stream_channel.test.js.map +1 -1
  435. package/dist/stt/stream_adapter.cjs +24 -9
  436. package/dist/stt/stream_adapter.cjs.map +1 -1
  437. package/dist/stt/stream_adapter.d.cts +7 -3
  438. package/dist/stt/stream_adapter.d.ts +7 -3
  439. package/dist/stt/stream_adapter.d.ts.map +1 -1
  440. package/dist/stt/stream_adapter.js +24 -9
  441. package/dist/stt/stream_adapter.js.map +1 -1
  442. package/dist/stt/stt.cjs +86 -19
  443. package/dist/stt/stt.cjs.map +1 -1
  444. package/dist/stt/stt.d.cts +60 -5
  445. package/dist/stt/stt.d.ts +60 -5
  446. package/dist/stt/stt.d.ts.map +1 -1
  447. package/dist/stt/stt.js +88 -21
  448. package/dist/stt/stt.js.map +1 -1
  449. package/dist/telemetry/index.cjs +72 -0
  450. package/dist/telemetry/index.cjs.map +1 -0
  451. package/dist/telemetry/index.d.cts +7 -0
  452. package/dist/telemetry/index.d.ts +7 -0
  453. package/dist/telemetry/index.d.ts.map +1 -0
  454. package/dist/telemetry/index.js +37 -0
  455. package/dist/telemetry/index.js.map +1 -0
  456. package/dist/telemetry/logging.cjs +65 -0
  457. package/dist/telemetry/logging.cjs.map +1 -0
  458. package/dist/telemetry/logging.d.cts +21 -0
  459. package/dist/telemetry/logging.d.ts +21 -0
  460. package/dist/telemetry/logging.d.ts.map +1 -0
  461. package/dist/telemetry/logging.js +40 -0
  462. package/dist/telemetry/logging.js.map +1 -0
  463. package/dist/telemetry/otel_http_exporter.cjs +166 -0
  464. package/dist/telemetry/otel_http_exporter.cjs.map +1 -0
  465. package/dist/telemetry/otel_http_exporter.d.cts +63 -0
  466. package/dist/telemetry/otel_http_exporter.d.ts +63 -0
  467. package/dist/telemetry/otel_http_exporter.d.ts.map +1 -0
  468. package/dist/telemetry/otel_http_exporter.js +142 -0
  469. package/dist/telemetry/otel_http_exporter.js.map +1 -0
  470. package/dist/telemetry/pino_otel_transport.cjs +217 -0
  471. package/dist/telemetry/pino_otel_transport.cjs.map +1 -0
  472. package/dist/telemetry/pino_otel_transport.d.cts +58 -0
  473. package/dist/telemetry/pino_otel_transport.d.ts +58 -0
  474. package/dist/telemetry/pino_otel_transport.d.ts.map +1 -0
  475. package/dist/telemetry/pino_otel_transport.js +189 -0
  476. package/dist/telemetry/pino_otel_transport.js.map +1 -0
  477. package/dist/telemetry/trace_types.cjs +233 -0
  478. package/dist/telemetry/trace_types.cjs.map +1 -0
  479. package/dist/telemetry/trace_types.d.cts +74 -0
  480. package/dist/telemetry/trace_types.d.ts +74 -0
  481. package/dist/telemetry/trace_types.d.ts.map +1 -0
  482. package/dist/telemetry/trace_types.js +141 -0
  483. package/dist/telemetry/trace_types.js.map +1 -0
  484. package/dist/telemetry/traces.cjs +484 -0
  485. package/dist/telemetry/traces.cjs.map +1 -0
  486. package/dist/telemetry/traces.d.cts +116 -0
  487. package/dist/telemetry/traces.d.ts +116 -0
  488. package/dist/telemetry/traces.d.ts.map +1 -0
  489. package/dist/telemetry/traces.js +449 -0
  490. package/dist/telemetry/traces.js.map +1 -0
  491. package/dist/telemetry/utils.cjs +86 -0
  492. package/dist/telemetry/utils.cjs.map +1 -0
  493. package/dist/telemetry/utils.d.cts +5 -0
  494. package/dist/telemetry/utils.d.ts +5 -0
  495. package/dist/telemetry/utils.d.ts.map +1 -0
  496. package/dist/telemetry/utils.js +51 -0
  497. package/dist/telemetry/utils.js.map +1 -0
  498. package/dist/tokenize/basic/sentence.cjs +3 -3
  499. package/dist/tokenize/basic/sentence.cjs.map +1 -1
  500. package/dist/tokenize/basic/sentence.js +3 -3
  501. package/dist/tokenize/basic/sentence.js.map +1 -1
  502. package/dist/tokenize/tokenizer.test.cjs +3 -1
  503. package/dist/tokenize/tokenizer.test.cjs.map +1 -1
  504. package/dist/tokenize/tokenizer.test.js +3 -1
  505. package/dist/tokenize/tokenizer.test.js.map +1 -1
  506. package/dist/transcription.cjs.map +1 -1
  507. package/dist/transcription.d.cts +6 -0
  508. package/dist/transcription.d.ts +6 -0
  509. package/dist/transcription.d.ts.map +1 -1
  510. package/dist/transcription.js.map +1 -1
  511. package/dist/tts/fallback_adapter.cjs +466 -0
  512. package/dist/tts/fallback_adapter.cjs.map +1 -0
  513. package/dist/tts/fallback_adapter.d.cts +110 -0
  514. package/dist/tts/fallback_adapter.d.ts +110 -0
  515. package/dist/tts/fallback_adapter.d.ts.map +1 -0
  516. package/dist/tts/fallback_adapter.js +442 -0
  517. package/dist/tts/fallback_adapter.js.map +1 -0
  518. package/dist/tts/index.cjs +3 -0
  519. package/dist/tts/index.cjs.map +1 -1
  520. package/dist/tts/index.d.cts +1 -0
  521. package/dist/tts/index.d.ts +1 -0
  522. package/dist/tts/index.d.ts.map +1 -1
  523. package/dist/tts/index.js +2 -0
  524. package/dist/tts/index.js.map +1 -1
  525. package/dist/tts/stream_adapter.cjs +25 -8
  526. package/dist/tts/stream_adapter.cjs.map +1 -1
  527. package/dist/tts/stream_adapter.d.cts +6 -3
  528. package/dist/tts/stream_adapter.d.ts +6 -3
  529. package/dist/tts/stream_adapter.d.ts.map +1 -1
  530. package/dist/tts/stream_adapter.js +25 -8
  531. package/dist/tts/stream_adapter.js.map +1 -1
  532. package/dist/tts/tts.cjs +189 -57
  533. package/dist/tts/tts.cjs.map +1 -1
  534. package/dist/tts/tts.d.cts +58 -6
  535. package/dist/tts/tts.d.ts +58 -6
  536. package/dist/tts/tts.d.ts.map +1 -1
  537. package/dist/tts/tts.js +191 -59
  538. package/dist/tts/tts.js.map +1 -1
  539. package/dist/types.cjs +24 -32
  540. package/dist/types.cjs.map +1 -1
  541. package/dist/types.d.cts +45 -10
  542. package/dist/types.d.ts +45 -10
  543. package/dist/types.d.ts.map +1 -1
  544. package/dist/types.js +20 -30
  545. package/dist/types.js.map +1 -1
  546. package/dist/utils.cjs +122 -26
  547. package/dist/utils.cjs.map +1 -1
  548. package/dist/utils.d.cts +41 -1
  549. package/dist/utils.d.ts +41 -1
  550. package/dist/utils.d.ts.map +1 -1
  551. package/dist/utils.js +117 -25
  552. package/dist/utils.js.map +1 -1
  553. package/dist/utils.test.cjs +73 -1
  554. package/dist/utils.test.cjs.map +1 -1
  555. package/dist/utils.test.js +74 -10
  556. package/dist/utils.test.js.map +1 -1
  557. package/dist/vad.cjs +35 -15
  558. package/dist/vad.cjs.map +1 -1
  559. package/dist/vad.d.cts +15 -5
  560. package/dist/vad.d.ts +15 -5
  561. package/dist/vad.d.ts.map +1 -1
  562. package/dist/vad.js +35 -15
  563. package/dist/vad.js.map +1 -1
  564. package/dist/version.cjs +1 -1
  565. package/dist/version.cjs.map +1 -1
  566. package/dist/version.d.cts +1 -1
  567. package/dist/version.d.ts +1 -1
  568. package/dist/version.d.ts.map +1 -1
  569. package/dist/version.js +1 -1
  570. package/dist/version.js.map +1 -1
  571. package/dist/voice/agent.cjs +258 -35
  572. package/dist/voice/agent.cjs.map +1 -1
  573. package/dist/voice/agent.d.cts +54 -13
  574. package/dist/voice/agent.d.ts +54 -13
  575. package/dist/voice/agent.d.ts.map +1 -1
  576. package/dist/voice/agent.js +254 -34
  577. package/dist/voice/agent.js.map +1 -1
  578. package/dist/voice/agent.test.cjs +314 -0
  579. package/dist/voice/agent.test.cjs.map +1 -1
  580. package/dist/voice/agent.test.js +316 -2
  581. package/dist/voice/agent.test.js.map +1 -1
  582. package/dist/voice/agent_activity.cjs +1116 -385
  583. package/dist/voice/agent_activity.cjs.map +1 -1
  584. package/dist/voice/agent_activity.d.cts +72 -11
  585. package/dist/voice/agent_activity.d.ts +72 -11
  586. package/dist/voice/agent_activity.d.ts.map +1 -1
  587. package/dist/voice/agent_activity.js +1119 -383
  588. package/dist/voice/agent_activity.js.map +1 -1
  589. package/dist/voice/agent_activity.test.cjs +135 -0
  590. package/dist/voice/agent_activity.test.cjs.map +1 -0
  591. package/dist/voice/agent_activity.test.js +134 -0
  592. package/dist/voice/agent_activity.test.js.map +1 -0
  593. package/dist/voice/agent_session.cjs +550 -90
  594. package/dist/voice/agent_session.cjs.map +1 -1
  595. package/dist/voice/agent_session.d.cts +185 -25
  596. package/dist/voice/agent_session.d.ts +185 -25
  597. package/dist/voice/agent_session.d.ts.map +1 -1
  598. package/dist/voice/agent_session.js +556 -91
  599. package/dist/voice/agent_session.js.map +1 -1
  600. package/dist/voice/audio_recognition.cjs +605 -46
  601. package/dist/voice/audio_recognition.cjs.map +1 -1
  602. package/dist/voice/audio_recognition.d.cts +96 -4
  603. package/dist/voice/audio_recognition.d.ts +96 -4
  604. package/dist/voice/audio_recognition.d.ts.map +1 -1
  605. package/dist/voice/audio_recognition.js +611 -47
  606. package/dist/voice/audio_recognition.js.map +1 -1
  607. package/dist/voice/audio_recognition_span.test.cjs +295 -0
  608. package/dist/voice/audio_recognition_span.test.cjs.map +1 -0
  609. package/dist/voice/audio_recognition_span.test.js +299 -0
  610. package/dist/voice/audio_recognition_span.test.js.map +1 -0
  611. package/dist/voice/avatar/datastream_io.cjs +7 -1
  612. package/dist/voice/avatar/datastream_io.cjs.map +1 -1
  613. package/dist/voice/avatar/datastream_io.d.cts +1 -0
  614. package/dist/voice/avatar/datastream_io.d.ts +1 -0
  615. package/dist/voice/avatar/datastream_io.d.ts.map +1 -1
  616. package/dist/voice/avatar/datastream_io.js +7 -1
  617. package/dist/voice/avatar/datastream_io.js.map +1 -1
  618. package/dist/voice/background_audio.cjs +367 -0
  619. package/dist/voice/background_audio.cjs.map +1 -0
  620. package/dist/voice/background_audio.d.cts +123 -0
  621. package/dist/voice/background_audio.d.ts +123 -0
  622. package/dist/voice/background_audio.d.ts.map +1 -0
  623. package/dist/voice/background_audio.js +343 -0
  624. package/dist/voice/background_audio.js.map +1 -0
  625. package/dist/voice/events.cjs +3 -0
  626. package/dist/voice/events.cjs.map +1 -1
  627. package/dist/voice/events.d.cts +16 -9
  628. package/dist/voice/events.d.ts +16 -9
  629. package/dist/voice/events.d.ts.map +1 -1
  630. package/dist/voice/events.js +3 -0
  631. package/dist/voice/events.js.map +1 -1
  632. package/dist/voice/generation.cjs +205 -41
  633. package/dist/voice/generation.cjs.map +1 -1
  634. package/dist/voice/generation.d.cts +21 -5
  635. package/dist/voice/generation.d.ts +21 -5
  636. package/dist/voice/generation.d.ts.map +1 -1
  637. package/dist/voice/generation.js +215 -43
  638. package/dist/voice/generation.js.map +1 -1
  639. package/dist/voice/generation_tools.test.cjs +236 -0
  640. package/dist/voice/generation_tools.test.cjs.map +1 -0
  641. package/dist/voice/generation_tools.test.js +235 -0
  642. package/dist/voice/generation_tools.test.js.map +1 -0
  643. package/dist/voice/index.cjs +33 -2
  644. package/dist/voice/index.cjs.map +1 -1
  645. package/dist/voice/index.d.cts +8 -2
  646. package/dist/voice/index.d.ts +8 -2
  647. package/dist/voice/index.d.ts.map +1 -1
  648. package/dist/voice/index.js +19 -2
  649. package/dist/voice/index.js.map +1 -1
  650. package/dist/voice/interruption_detection.test.cjs +114 -0
  651. package/dist/voice/interruption_detection.test.cjs.map +1 -0
  652. package/dist/voice/interruption_detection.test.js +113 -0
  653. package/dist/voice/interruption_detection.test.js.map +1 -0
  654. package/dist/voice/io.cjs +66 -6
  655. package/dist/voice/io.cjs.map +1 -1
  656. package/dist/voice/io.d.cts +67 -7
  657. package/dist/voice/io.d.ts +67 -7
  658. package/dist/voice/io.d.ts.map +1 -1
  659. package/dist/voice/io.js +62 -5
  660. package/dist/voice/io.js.map +1 -1
  661. package/dist/voice/recorder_io/index.cjs +23 -0
  662. package/dist/voice/recorder_io/index.cjs.map +1 -0
  663. package/dist/voice/recorder_io/index.d.cts +2 -0
  664. package/dist/voice/recorder_io/index.d.ts +2 -0
  665. package/dist/voice/recorder_io/index.d.ts.map +1 -0
  666. package/dist/voice/recorder_io/index.js +2 -0
  667. package/dist/voice/recorder_io/index.js.map +1 -0
  668. package/dist/voice/recorder_io/recorder_io.cjs +607 -0
  669. package/dist/voice/recorder_io/recorder_io.cjs.map +1 -0
  670. package/dist/voice/recorder_io/recorder_io.d.cts +106 -0
  671. package/dist/voice/recorder_io/recorder_io.d.ts +106 -0
  672. package/dist/voice/recorder_io/recorder_io.d.ts.map +1 -0
  673. package/dist/voice/recorder_io/recorder_io.js +573 -0
  674. package/dist/voice/recorder_io/recorder_io.js.map +1 -0
  675. package/dist/voice/remote_session.cjs +922 -0
  676. package/dist/voice/remote_session.cjs.map +1 -0
  677. package/dist/voice/remote_session.d.cts +108 -0
  678. package/dist/voice/remote_session.d.ts +108 -0
  679. package/dist/voice/remote_session.d.ts.map +1 -0
  680. package/dist/voice/remote_session.js +887 -0
  681. package/dist/voice/remote_session.js.map +1 -0
  682. package/dist/voice/report.cjs +88 -0
  683. package/dist/voice/report.cjs.map +1 -0
  684. package/dist/voice/report.d.cts +49 -0
  685. package/dist/voice/report.d.ts +49 -0
  686. package/dist/voice/report.d.ts.map +1 -0
  687. package/dist/voice/report.js +63 -0
  688. package/dist/voice/report.js.map +1 -0
  689. package/dist/voice/report.test.cjs +121 -0
  690. package/dist/voice/report.test.cjs.map +1 -0
  691. package/dist/voice/report.test.js +120 -0
  692. package/dist/voice/report.test.js.map +1 -0
  693. package/dist/voice/room_io/_input.cjs +40 -7
  694. package/dist/voice/room_io/_input.cjs.map +1 -1
  695. package/dist/voice/room_io/_input.d.cts +5 -2
  696. package/dist/voice/room_io/_input.d.ts +5 -2
  697. package/dist/voice/room_io/_input.d.ts.map +1 -1
  698. package/dist/voice/room_io/_input.js +41 -8
  699. package/dist/voice/room_io/_input.js.map +1 -1
  700. package/dist/voice/room_io/_output.cjs +19 -11
  701. package/dist/voice/room_io/_output.cjs.map +1 -1
  702. package/dist/voice/room_io/_output.d.cts +7 -4
  703. package/dist/voice/room_io/_output.d.ts +7 -4
  704. package/dist/voice/room_io/_output.d.ts.map +1 -1
  705. package/dist/voice/room_io/_output.js +20 -12
  706. package/dist/voice/room_io/_output.js.map +1 -1
  707. package/dist/voice/room_io/room_io.cjs +33 -6
  708. package/dist/voice/room_io/room_io.cjs.map +1 -1
  709. package/dist/voice/room_io/room_io.d.cts +29 -9
  710. package/dist/voice/room_io/room_io.d.ts +29 -9
  711. package/dist/voice/room_io/room_io.d.ts.map +1 -1
  712. package/dist/voice/room_io/room_io.js +33 -7
  713. package/dist/voice/room_io/room_io.js.map +1 -1
  714. package/dist/voice/speech_handle.cjs +22 -4
  715. package/dist/voice/speech_handle.cjs.map +1 -1
  716. package/dist/voice/speech_handle.d.cts +17 -2
  717. package/dist/voice/speech_handle.d.ts +17 -2
  718. package/dist/voice/speech_handle.d.ts.map +1 -1
  719. package/dist/voice/speech_handle.js +21 -4
  720. package/dist/voice/speech_handle.js.map +1 -1
  721. package/dist/voice/testing/fake_llm.cjs +127 -0
  722. package/dist/voice/testing/fake_llm.cjs.map +1 -0
  723. package/dist/voice/testing/fake_llm.d.cts +30 -0
  724. package/dist/voice/testing/fake_llm.d.ts +30 -0
  725. package/dist/voice/testing/fake_llm.d.ts.map +1 -0
  726. package/dist/voice/testing/fake_llm.js +103 -0
  727. package/dist/voice/testing/fake_llm.js.map +1 -0
  728. package/dist/voice/testing/index.cjs +57 -0
  729. package/dist/voice/testing/index.cjs.map +1 -0
  730. package/dist/voice/testing/index.d.cts +21 -0
  731. package/dist/voice/testing/index.d.ts +21 -0
  732. package/dist/voice/testing/index.d.ts.map +1 -0
  733. package/dist/voice/testing/index.js +35 -0
  734. package/dist/voice/testing/index.js.map +1 -0
  735. package/dist/voice/testing/run_result.cjs +817 -0
  736. package/dist/voice/testing/run_result.cjs.map +1 -0
  737. package/dist/voice/testing/run_result.d.cts +385 -0
  738. package/dist/voice/testing/run_result.d.ts +385 -0
  739. package/dist/voice/testing/run_result.d.ts.map +1 -0
  740. package/dist/voice/testing/run_result.js +790 -0
  741. package/dist/voice/testing/run_result.js.map +1 -0
  742. package/dist/voice/testing/types.cjs +46 -0
  743. package/dist/voice/testing/types.cjs.map +1 -0
  744. package/dist/voice/testing/types.d.cts +83 -0
  745. package/dist/voice/testing/types.d.ts +83 -0
  746. package/dist/voice/testing/types.d.ts.map +1 -0
  747. package/dist/voice/testing/types.js +19 -0
  748. package/dist/voice/testing/types.js.map +1 -0
  749. package/dist/voice/transcription/synchronizer.cjs +139 -15
  750. package/dist/voice/transcription/synchronizer.cjs.map +1 -1
  751. package/dist/voice/transcription/synchronizer.d.cts +35 -4
  752. package/dist/voice/transcription/synchronizer.d.ts +35 -4
  753. package/dist/voice/transcription/synchronizer.d.ts.map +1 -1
  754. package/dist/voice/transcription/synchronizer.js +143 -16
  755. package/dist/voice/transcription/synchronizer.js.map +1 -1
  756. package/dist/voice/transcription/synchronizer.test.cjs +151 -0
  757. package/dist/voice/transcription/synchronizer.test.cjs.map +1 -0
  758. package/dist/voice/transcription/synchronizer.test.js +150 -0
  759. package/dist/voice/transcription/synchronizer.test.js.map +1 -0
  760. package/dist/voice/turn_config/endpointing.cjs +33 -0
  761. package/dist/voice/turn_config/endpointing.cjs.map +1 -0
  762. package/dist/voice/turn_config/endpointing.d.cts +30 -0
  763. package/dist/voice/turn_config/endpointing.d.ts +30 -0
  764. package/dist/voice/turn_config/endpointing.d.ts.map +1 -0
  765. package/dist/voice/turn_config/endpointing.js +9 -0
  766. package/dist/voice/turn_config/endpointing.js.map +1 -0
  767. package/dist/voice/turn_config/interruption.cjs +37 -0
  768. package/dist/voice/turn_config/interruption.cjs.map +1 -0
  769. package/dist/voice/turn_config/interruption.d.cts +53 -0
  770. package/dist/voice/turn_config/interruption.d.ts +53 -0
  771. package/dist/voice/turn_config/interruption.d.ts.map +1 -0
  772. package/dist/voice/turn_config/interruption.js +13 -0
  773. package/dist/voice/turn_config/interruption.js.map +1 -0
  774. package/dist/voice/turn_config/turn_handling.cjs +35 -0
  775. package/dist/voice/turn_config/turn_handling.cjs.map +1 -0
  776. package/dist/voice/turn_config/turn_handling.d.cts +36 -0
  777. package/dist/voice/turn_config/turn_handling.d.ts +36 -0
  778. package/dist/voice/turn_config/turn_handling.d.ts.map +1 -0
  779. package/dist/voice/turn_config/turn_handling.js +11 -0
  780. package/dist/voice/turn_config/turn_handling.js.map +1 -0
  781. package/dist/voice/turn_config/utils.cjs +157 -0
  782. package/dist/voice/turn_config/utils.cjs.map +1 -0
  783. package/dist/voice/turn_config/utils.d.cts +37 -0
  784. package/dist/voice/turn_config/utils.d.ts +37 -0
  785. package/dist/voice/turn_config/utils.d.ts.map +1 -0
  786. package/dist/voice/turn_config/utils.js +131 -0
  787. package/dist/voice/turn_config/utils.js.map +1 -0
  788. package/dist/voice/turn_config/utils.test.cjs +128 -0
  789. package/dist/voice/turn_config/utils.test.cjs.map +1 -0
  790. package/dist/voice/turn_config/utils.test.js +127 -0
  791. package/dist/voice/turn_config/utils.test.js.map +1 -0
  792. package/dist/voice/utils.cjs +47 -0
  793. package/dist/voice/utils.cjs.map +1 -0
  794. package/dist/voice/utils.d.cts +4 -0
  795. package/dist/voice/utils.d.ts +4 -0
  796. package/dist/voice/utils.d.ts.map +1 -0
  797. package/dist/voice/utils.js +23 -0
  798. package/dist/voice/utils.js.map +1 -0
  799. package/dist/worker.cjs +44 -52
  800. package/dist/worker.cjs.map +1 -1
  801. package/dist/worker.d.cts +18 -8
  802. package/dist/worker.d.ts +18 -8
  803. package/dist/worker.d.ts.map +1 -1
  804. package/dist/worker.js +43 -43
  805. package/dist/worker.js.map +1 -1
  806. package/package.json +32 -12
  807. package/resources/NOTICE +2 -0
  808. package/resources/keyboard-typing.ogg +0 -0
  809. package/resources/keyboard-typing2.ogg +0 -0
  810. package/resources/office-ambience.ogg +0 -0
  811. package/src/audio.ts +132 -1
  812. package/src/beta/index.ts +9 -0
  813. package/src/beta/workflows/index.ts +9 -0
  814. package/src/beta/workflows/task_group.ts +194 -0
  815. package/src/cli.ts +57 -66
  816. package/src/connection_pool.test.ts +346 -0
  817. package/src/connection_pool.ts +307 -0
  818. package/src/constants.ts +14 -0
  819. package/src/cpu.test.ts +239 -0
  820. package/src/cpu.ts +173 -0
  821. package/src/http_server.ts +18 -6
  822. package/src/index.ts +15 -13
  823. package/src/inference/api_protos.ts +85 -2
  824. package/src/inference/index.ts +32 -4
  825. package/src/inference/interruption/defaults.ts +51 -0
  826. package/src/inference/interruption/errors.ts +25 -0
  827. package/src/inference/interruption/http_transport.ts +206 -0
  828. package/src/inference/interruption/interruption_cache_entry.ts +50 -0
  829. package/src/inference/interruption/interruption_detector.ts +204 -0
  830. package/src/inference/interruption/interruption_stream.ts +467 -0
  831. package/src/inference/interruption/types.ts +84 -0
  832. package/src/inference/interruption/utils.test.ts +132 -0
  833. package/src/inference/interruption/utils.ts +137 -0
  834. package/src/inference/interruption/ws_transport.ts +406 -0
  835. package/src/inference/llm.ts +214 -163
  836. package/src/inference/stt.test.ts +253 -0
  837. package/src/inference/stt.ts +449 -208
  838. package/src/inference/tts.test.ts +267 -0
  839. package/src/inference/tts.ts +377 -115
  840. package/src/inference/utils.ts +30 -2
  841. package/src/ipc/inference_proc_executor.ts +11 -3
  842. package/src/ipc/inference_proc_lazy_main.ts +13 -1
  843. package/src/ipc/job_proc_executor.ts +11 -1
  844. package/src/ipc/job_proc_lazy_main.ts +86 -20
  845. package/src/ipc/supervised_proc.test.ts +153 -0
  846. package/src/ipc/supervised_proc.ts +39 -10
  847. package/src/job.ts +120 -1
  848. package/src/language.test.ts +62 -0
  849. package/src/language.ts +380 -0
  850. package/src/llm/__snapshots__/zod-utils.test.ts.snap +559 -0
  851. package/src/llm/chat_context.test.ts +655 -0
  852. package/src/llm/chat_context.ts +412 -2
  853. package/src/llm/fallback_adapter.test.ts +238 -0
  854. package/src/llm/fallback_adapter.ts +391 -0
  855. package/src/llm/index.ts +11 -0
  856. package/src/llm/llm.ts +77 -12
  857. package/src/llm/provider_format/google.test.ts +72 -1
  858. package/src/llm/provider_format/google.ts +10 -6
  859. package/src/llm/provider_format/index.ts +7 -2
  860. package/src/llm/provider_format/openai.test.ts +480 -2
  861. package/src/llm/provider_format/openai.ts +152 -21
  862. package/src/llm/provider_format/utils.ts +11 -5
  863. package/src/llm/realtime.ts +23 -2
  864. package/src/llm/remote_chat_context.ts +2 -2
  865. package/src/llm/tool_context.test.ts +210 -1
  866. package/src/llm/tool_context.ts +115 -17
  867. package/src/llm/utils.ts +24 -16
  868. package/src/llm/zod-utils.test.ts +577 -0
  869. package/src/llm/zod-utils.ts +153 -0
  870. package/src/log.ts +71 -19
  871. package/src/metrics/base.ts +78 -19
  872. package/src/metrics/index.ts +12 -0
  873. package/src/metrics/model_usage.test.ts +545 -0
  874. package/src/metrics/model_usage.ts +262 -0
  875. package/src/metrics/usage_collector.ts +14 -3
  876. package/src/metrics/utils.ts +27 -7
  877. package/src/stream/deferred_stream.test.ts +3 -3
  878. package/src/stream/deferred_stream.ts +43 -11
  879. package/src/stream/index.ts +1 -0
  880. package/src/stream/multi_input_stream.test.ts +545 -0
  881. package/src/stream/multi_input_stream.ts +172 -0
  882. package/src/stream/stream_channel.test.ts +37 -0
  883. package/src/stream/stream_channel.ts +43 -3
  884. package/src/stt/stream_adapter.ts +30 -9
  885. package/src/stt/stt.ts +131 -22
  886. package/src/telemetry/index.ts +28 -0
  887. package/src/telemetry/logging.ts +55 -0
  888. package/src/telemetry/otel_http_exporter.ts +218 -0
  889. package/src/telemetry/pino_otel_transport.ts +265 -0
  890. package/src/telemetry/trace_types.ts +109 -0
  891. package/src/telemetry/traces.ts +673 -0
  892. package/src/telemetry/utils.ts +61 -0
  893. package/src/tokenize/basic/sentence.ts +3 -3
  894. package/src/tokenize/tokenizer.test.ts +4 -0
  895. package/src/transcription.ts +6 -0
  896. package/src/tts/fallback_adapter.ts +579 -0
  897. package/src/tts/index.ts +1 -0
  898. package/src/tts/stream_adapter.ts +38 -8
  899. package/src/tts/tts.ts +245 -62
  900. package/src/types.ts +62 -33
  901. package/src/utils.test.ts +90 -10
  902. package/src/utils.ts +176 -31
  903. package/src/vad.ts +42 -18
  904. package/src/version.ts +1 -1
  905. package/src/voice/agent.test.ts +347 -2
  906. package/src/voice/agent.ts +346 -44
  907. package/src/voice/agent_activity.test.ts +194 -0
  908. package/src/voice/agent_activity.ts +1457 -388
  909. package/src/voice/agent_session.ts +817 -112
  910. package/src/voice/audio_recognition.ts +845 -70
  911. package/src/voice/audio_recognition_span.test.ts +341 -0
  912. package/src/voice/avatar/datastream_io.ts +9 -1
  913. package/src/voice/background_audio.ts +494 -0
  914. package/src/voice/events.ts +27 -7
  915. package/src/voice/generation.ts +310 -56
  916. package/src/voice/generation_tools.test.ts +268 -0
  917. package/src/voice/index.ts +17 -3
  918. package/src/voice/interruption_detection.test.ts +151 -0
  919. package/src/voice/io.ts +115 -12
  920. package/src/voice/recorder_io/index.ts +4 -0
  921. package/src/voice/recorder_io/recorder_io.ts +783 -0
  922. package/src/voice/remote_session.ts +1083 -0
  923. package/src/voice/report.test.ts +136 -0
  924. package/src/voice/report.ts +140 -0
  925. package/src/voice/room_io/_input.ts +45 -10
  926. package/src/voice/room_io/_output.ts +26 -14
  927. package/src/voice/room_io/room_io.ts +67 -22
  928. package/src/voice/speech_handle.ts +38 -6
  929. package/src/voice/testing/fake_llm.ts +138 -0
  930. package/src/voice/testing/index.ts +52 -0
  931. package/src/voice/testing/run_result.ts +995 -0
  932. package/src/voice/testing/types.ts +118 -0
  933. package/src/voice/transcription/synchronizer.test.ts +206 -0
  934. package/src/voice/transcription/synchronizer.ts +204 -19
  935. package/src/voice/turn_config/endpointing.ts +33 -0
  936. package/src/voice/turn_config/interruption.ts +56 -0
  937. package/src/voice/turn_config/turn_handling.ts +45 -0
  938. package/src/voice/turn_config/utils.test.ts +148 -0
  939. package/src/voice/turn_config/utils.ts +167 -0
  940. package/src/voice/utils.ts +29 -0
  941. package/src/worker.ts +92 -78
  942. package/src/llm/__snapshots__/utils.test.ts.snap +0 -65
@@ -0,0 +1,783 @@
1
+ // SPDX-FileCopyrightText: 2025 LiveKit, Inc.
2
+ //
3
+ // SPDX-License-Identifier: Apache-2.0
4
+ import ffmpegInstaller from '@ffmpeg-installer/ffmpeg';
5
+ import { Mutex } from '@livekit/mutex';
6
+ import { AudioFrame, AudioResampler } from '@livekit/rtc-node';
7
+ import ffmpeg from 'fluent-ffmpeg';
8
+ import fs from 'node:fs';
9
+ import path from 'node:path';
10
+ import { PassThrough } from 'node:stream';
11
+ import type { ReadableStream } from 'node:stream/web';
12
+ import { TransformStream } from 'node:stream/web';
13
+ import { log } from '../../log.js';
14
+ import { isStreamReaderReleaseError } from '../../stream/deferred_stream.js';
15
+ import { type StreamChannel, createStreamChannel } from '../../stream/stream_channel.js';
16
+ import { Future, Task, cancelAndWait, delay } from '../../utils.js';
17
+ import type { AgentSession } from '../agent_session.js';
18
+ import { AudioInput, AudioOutput, type PlaybackFinishedEvent } from '../io.js';
19
+
20
+ ffmpeg.setFfmpegPath(ffmpegInstaller.path);
21
+
22
+ const WRITE_INTERVAL_MS = 2500;
23
+ const DEFAULT_SAMPLE_RATE = 48000;
24
+
25
+ export interface RecorderOptions {
26
+ agentSession: AgentSession;
27
+ sampleRate?: number;
28
+ }
29
+
30
+ interface ResampleAndMixOptions {
31
+ frames: AudioFrame[];
32
+ resampler: AudioResampler | undefined;
33
+ flush?: boolean;
34
+ }
35
+
36
+ export class RecorderIO {
37
+ private inRecord?: RecorderAudioInput;
38
+ private outRecord?: RecorderAudioOutput;
39
+
40
+ private inChan: StreamChannel<AudioFrame[]> = createStreamChannel<AudioFrame[]>();
41
+ private outChan: StreamChannel<AudioFrame[]> = createStreamChannel<AudioFrame[]>();
42
+
43
+ private session: AgentSession;
44
+ private sampleRate: number;
45
+
46
+ private _outputPath?: string;
47
+ private forwardTask?: Task<void>;
48
+ private encodeTask?: Task<void>;
49
+
50
+ private closeFuture: Future<void> = new Future();
51
+ private lock: Mutex = new Mutex();
52
+ private started: boolean = false;
53
+
54
+ // FFmpeg streaming state
55
+ private pcmStream?: PassThrough;
56
+ private ffmpegPromise?: Promise<void>;
57
+ private inResampler?: AudioResampler;
58
+ private outResampler?: AudioResampler;
59
+
60
+ private logger = log();
61
+
62
+ constructor(opts: RecorderOptions) {
63
+ const { agentSession, sampleRate = DEFAULT_SAMPLE_RATE } = opts;
64
+
65
+ this.session = agentSession;
66
+ this.sampleRate = sampleRate;
67
+ }
68
+
69
+ async start(outputPath: string): Promise<void> {
70
+ const unlock = await this.lock.lock();
71
+
72
+ try {
73
+ if (this.started) return;
74
+
75
+ if (!this.inRecord || !this.outRecord) {
76
+ throw new Error(
77
+ 'RecorderIO not properly initialized: both `recordInput()` and `recordOutput()` must be called before starting the recorder.',
78
+ );
79
+ }
80
+
81
+ this._outputPath = outputPath;
82
+ this.started = true;
83
+ this.closeFuture = new Future();
84
+
85
+ // Ensure output directory exists
86
+ const dir = path.dirname(outputPath);
87
+ if (!fs.existsSync(dir)) {
88
+ fs.mkdirSync(dir, { recursive: true });
89
+ }
90
+
91
+ this.forwardTask = Task.from(({ signal }) => this.forward(signal));
92
+ this.encodeTask = Task.from(() => this.encode(), undefined, 'recorder_io_encode_task');
93
+ } finally {
94
+ unlock();
95
+ }
96
+ }
97
+
98
+ async close(): Promise<void> {
99
+ const unlock = await this.lock.lock();
100
+
101
+ try {
102
+ if (!this.started) return;
103
+
104
+ await this.inChan.close();
105
+ await this.outChan.close();
106
+ await this.closeFuture.await;
107
+ await cancelAndWait([this.forwardTask!, this.encodeTask!]);
108
+ await this.inRecord?.close();
109
+
110
+ this.started = false;
111
+ } finally {
112
+ unlock();
113
+ }
114
+ }
115
+
116
+ recordInput(audioInput: AudioInput): RecorderAudioInput {
117
+ this.inRecord = new RecorderAudioInput(this, audioInput);
118
+ return this.inRecord;
119
+ }
120
+
121
+ recordOutput(audioOutput: AudioOutput): RecorderAudioOutput {
122
+ this.outRecord = new RecorderAudioOutput(this, audioOutput, (buf) => this.writeCb(buf));
123
+ return this.outRecord;
124
+ }
125
+
126
+ private writeCb(buf: AudioFrame[]): void {
127
+ const inputBuf = this.inRecord!.takeBuf(this.outRecord?._lastSpeechEndTime);
128
+ this.inChan.write(inputBuf);
129
+ this.outChan.write(buf);
130
+ }
131
+
132
+ get recording(): boolean {
133
+ return this.started;
134
+ }
135
+
136
+ get outputPath(): string | undefined {
137
+ return this._outputPath;
138
+ }
139
+
140
+ get recordingStartedAt(): number | undefined {
141
+ const inT = this.inRecord?.startedWallTime;
142
+ const outT = this.outRecord?.startedWallTime;
143
+
144
+ if (inT === undefined) {
145
+ return outT;
146
+ }
147
+
148
+ if (outT === undefined) {
149
+ return inT;
150
+ }
151
+
152
+ return Math.min(inT, outT);
153
+ }
154
+
155
+ /**
156
+ * Forward task: periodically flush input buffer to encoder
157
+ */
158
+ private async forward(signal: AbortSignal): Promise<void> {
159
+ while (!signal.aborted) {
160
+ try {
161
+ await delay(WRITE_INTERVAL_MS, { signal });
162
+ } catch {
163
+ // Aborted
164
+ break;
165
+ }
166
+
167
+ if (this.outRecord!.hasPendingData) {
168
+ // If the output is currently playing audio, wait for it to stay in sync
169
+ continue;
170
+ }
171
+
172
+ // Flush input buffer
173
+ const inputBuf = this.inRecord!.takeBuf(this.outRecord!._lastSpeechEndTime);
174
+ this.inChan
175
+ .write(inputBuf)
176
+ .catch((err) => this.logger.error({ err }, 'Error writing RecorderIO input buffer'));
177
+ this.outChan
178
+ .write([])
179
+ .catch((err) => this.logger.error({ err }, 'Error writing RecorderIO output buffer'));
180
+ }
181
+ }
182
+
183
+ /**
184
+ * Start FFmpeg process for streaming encoding
185
+ */
186
+ private startFFmpeg(): void {
187
+ if (this.pcmStream) return;
188
+
189
+ this.pcmStream = new PassThrough();
190
+
191
+ this.ffmpegPromise = new Promise<void>((resolve, reject) => {
192
+ ffmpeg(this.pcmStream!)
193
+ .inputFormat('s16le')
194
+ .inputOptions([`-ar ${this.sampleRate}`, '-ac 2'])
195
+ .audioCodec('libopus')
196
+ .audioChannels(2)
197
+ .audioFrequency(this.sampleRate)
198
+ .format('ogg')
199
+ .output(this._outputPath!)
200
+ .on('end', () => {
201
+ this.logger.debug('FFmpeg encoding finished');
202
+ resolve();
203
+ })
204
+ .on('error', (err) => {
205
+ // Ignore errors from intentional stream closure or SIGINT during shutdown
206
+ if (
207
+ err.message?.includes('Output stream closed') ||
208
+ err.message?.includes('received signal 2') ||
209
+ err.message?.includes('SIGKILL') ||
210
+ err.message?.includes('SIGINT')
211
+ ) {
212
+ resolve();
213
+ } else {
214
+ this.logger.error({ err }, 'FFmpeg encoding error');
215
+ reject(err);
216
+ }
217
+ })
218
+ .run();
219
+ });
220
+ }
221
+
222
+ /**
223
+ * Resample and mix frames to mono Float32
224
+ */
225
+ private resampleAndMix(opts: ResampleAndMixOptions): {
226
+ samples: Float32Array;
227
+ resampler: AudioResampler | undefined;
228
+ } {
229
+ const INV_INT16 = 1.0 / 32768.0;
230
+ const { frames, flush = false } = opts;
231
+ let { resampler } = opts;
232
+
233
+ if (frames.length === 0 && !flush) {
234
+ return { samples: new Float32Array(0), resampler };
235
+ }
236
+
237
+ if (!resampler && frames.length > 0) {
238
+ const firstFrame = frames[0]!;
239
+ resampler = new AudioResampler(firstFrame.sampleRate, this.sampleRate, firstFrame.channels);
240
+ }
241
+
242
+ const resampledFrames: AudioFrame[] = [];
243
+ for (const frame of frames) {
244
+ if (resampler) {
245
+ resampledFrames.push(...resampler.push(frame));
246
+ }
247
+ }
248
+
249
+ if (flush && resampler) {
250
+ resampledFrames.push(...resampler.flush());
251
+ }
252
+
253
+ const totalSamples = resampledFrames.reduce((acc, frame) => acc + frame.samplesPerChannel, 0);
254
+ const samples = new Float32Array(totalSamples);
255
+
256
+ let pos = 0;
257
+ for (const frame of resampledFrames) {
258
+ const data = frame.data;
259
+ const numChannels = frame.channels;
260
+ for (let i = 0; i < frame.samplesPerChannel; i++) {
261
+ let sum = 0;
262
+ for (let ch = 0; ch < numChannels; ch++) {
263
+ sum += data[i * numChannels + ch]!;
264
+ }
265
+ samples[pos++] = (sum / numChannels) * INV_INT16;
266
+ }
267
+ }
268
+
269
+ return { samples, resampler };
270
+ }
271
+
272
+ /**
273
+ * Write PCM chunk to FFmpeg stream
274
+ */
275
+ private writePCM(leftSamples: Float32Array, rightSamples: Float32Array): void {
276
+ if (!this.pcmStream) {
277
+ this.startFFmpeg();
278
+ }
279
+
280
+ // Handle length mismatch by prepending silence
281
+ if (leftSamples.length !== rightSamples.length) {
282
+ const diff = Math.abs(leftSamples.length - rightSamples.length);
283
+ if (leftSamples.length < rightSamples.length) {
284
+ this.logger.warn(
285
+ `Input is shorter by ${diff} samples; silence has been prepended to align the input channel.`,
286
+ );
287
+ const padded = new Float32Array(rightSamples.length);
288
+ padded.set(leftSamples, diff);
289
+ leftSamples = padded;
290
+ } else {
291
+ const padded = new Float32Array(leftSamples.length);
292
+ padded.set(rightSamples, diff);
293
+ rightSamples = padded;
294
+ }
295
+ }
296
+
297
+ const maxLen = Math.max(leftSamples.length, rightSamples.length);
298
+ if (maxLen <= 0) return;
299
+
300
+ // Interleave stereo samples and convert back to Int16
301
+ const stereoData = new Int16Array(maxLen * 2);
302
+ for (let i = 0; i < maxLen; i++) {
303
+ stereoData[i * 2] = Math.max(
304
+ -32768,
305
+ Math.min(32767, Math.round((leftSamples[i] ?? 0) * 32768)),
306
+ );
307
+ stereoData[i * 2 + 1] = Math.max(
308
+ -32768,
309
+ Math.min(32767, Math.round((rightSamples[i] ?? 0) * 32768)),
310
+ );
311
+ }
312
+
313
+ this.pcmStream!.write(Buffer.from(stereoData.buffer));
314
+ }
315
+
316
+ /**
317
+ * Encode task: read from channels, mix to stereo, stream to FFmpeg
318
+ */
319
+ private async encode(): Promise<void> {
320
+ if (!this._outputPath) return;
321
+
322
+ const inReader = this.inChan.stream().getReader();
323
+ const outReader = this.outChan.stream().getReader();
324
+
325
+ try {
326
+ while (true) {
327
+ const [inResult, outResult] = await Promise.all([inReader.read(), outReader.read()]);
328
+
329
+ if (inResult.done || outResult.done) {
330
+ break;
331
+ }
332
+
333
+ const inputBuf = inResult.value;
334
+ const outputBuf = outResult.value;
335
+
336
+ const inMixed = this.resampleAndMix({ frames: inputBuf, resampler: this.inResampler });
337
+ this.inResampler = inMixed.resampler;
338
+
339
+ const outMixed = this.resampleAndMix({
340
+ frames: outputBuf,
341
+ resampler: this.outResampler,
342
+ flush: outputBuf.length > 0,
343
+ });
344
+ this.outResampler = outMixed.resampler;
345
+
346
+ // Stream PCM data directly to FFmpeg
347
+ this.writePCM(inMixed.samples, outMixed.samples);
348
+ }
349
+
350
+ // Close FFmpeg stream and wait for encoding to complete
351
+ if (this.pcmStream) {
352
+ this.pcmStream.end();
353
+ await this.ffmpegPromise;
354
+ }
355
+ } catch (err) {
356
+ this.logger.error({ err }, 'Error in encode task');
357
+ } finally {
358
+ inReader.releaseLock();
359
+ outReader.releaseLock();
360
+
361
+ if (!this.closeFuture.done) {
362
+ this.closeFuture.resolve();
363
+ }
364
+ }
365
+ }
366
+ }
367
+
368
+ class RecorderAudioInput extends AudioInput {
369
+ private source: AudioInput;
370
+ private recorderIO: RecorderIO;
371
+ private accFrames: AudioFrame[] = [];
372
+ private _startedWallTime?: number;
373
+ private _padded: boolean = false;
374
+ private logger = log();
375
+
376
+ constructor(recorderIO: RecorderIO, source: AudioInput) {
377
+ super();
378
+ this.recorderIO = recorderIO;
379
+ this.source = source;
380
+
381
+ // Set up the intercepting stream
382
+ this.multiStream.addInputStream(this.createInterceptingStream());
383
+ }
384
+
385
+ /**
386
+ * Wall-clock time when the first frame was captured
387
+ */
388
+ get startedWallTime(): number | undefined {
389
+ return this._startedWallTime;
390
+ }
391
+
392
+ /**
393
+ * Take accumulated frames and clear the buffer
394
+ * @param padSince - If provided and input started after this time, pad with silence
395
+ */
396
+ takeBuf(padSince?: number): AudioFrame[] {
397
+ let frames = this.accFrames;
398
+ this.accFrames = [];
399
+
400
+ if (
401
+ padSince !== undefined &&
402
+ this._startedWallTime !== undefined &&
403
+ this._startedWallTime > padSince &&
404
+ !this._padded &&
405
+ frames.length > 0
406
+ ) {
407
+ const padding = this._startedWallTime - padSince;
408
+ this.logger.warn(
409
+ {
410
+ lastAgentSpeechTime: padSince,
411
+ inputStartedTime: this._startedWallTime,
412
+ },
413
+ 'input speech started after last agent speech ended',
414
+ );
415
+ this._padded = true;
416
+ const firstFrame = frames[0]!;
417
+ frames = [
418
+ createSilenceFrame(padding / 1000, firstFrame.sampleRate, firstFrame.channels),
419
+ ...frames,
420
+ ];
421
+ } else if (
422
+ padSince !== undefined &&
423
+ this._startedWallTime === undefined &&
424
+ !this._padded &&
425
+ frames.length === 0
426
+ ) {
427
+ // We could pad with silence here with some fixed SR and channels,
428
+ // but it's better for the user to know that this is happening
429
+ this.logger.warn(
430
+ "input speech hasn't started yet, skipping silence padding, recording may be inaccurate until the speech starts",
431
+ );
432
+ }
433
+
434
+ return frames;
435
+ }
436
+
437
+ /**
438
+ * Creates a stream that intercepts frames from the source,
439
+ * accumulates them when recording, and passes them through unchanged.
440
+ */
441
+ private createInterceptingStream(): ReadableStream<AudioFrame> {
442
+ const sourceStream = this.source.stream;
443
+ const reader = sourceStream.getReader();
444
+
445
+ const transform = new TransformStream<AudioFrame, AudioFrame>({
446
+ transform: (frame, controller) => {
447
+ // Accumulate frames when recording is active
448
+ if (this.recorderIO.recording) {
449
+ if (this._startedWallTime === undefined) {
450
+ this._startedWallTime = Date.now();
451
+ }
452
+ this.accFrames.push(frame);
453
+ }
454
+
455
+ controller.enqueue(frame);
456
+ },
457
+ });
458
+
459
+ const pump = async () => {
460
+ const writer = transform.writable.getWriter();
461
+ let sourceError: unknown;
462
+
463
+ try {
464
+ while (true) {
465
+ const { done, value } = await reader.read();
466
+ if (done) break;
467
+ await writer.write(value);
468
+ }
469
+ } catch (e) {
470
+ if (isStreamReaderReleaseError(e)) return;
471
+ sourceError = e;
472
+ } finally {
473
+ if (sourceError) {
474
+ writer.abort(sourceError);
475
+ return;
476
+ }
477
+
478
+ writer.releaseLock();
479
+
480
+ try {
481
+ await transform.writable.close();
482
+ } catch {
483
+ // ignore "WritableStream is closed" errors
484
+ }
485
+ }
486
+ };
487
+
488
+ pump();
489
+
490
+ return transform.readable;
491
+ }
492
+
493
+ onAttached(): void {
494
+ this.source.onAttached();
495
+ }
496
+
497
+ onDetached(): void {
498
+ this.source.onDetached();
499
+ }
500
+ }
501
+
502
+ class RecorderAudioOutput extends AudioOutput {
503
+ private recorderIO: RecorderIO;
504
+ private writeFn: (buf: AudioFrame[]) => void;
505
+ private accFrames: AudioFrame[] = [];
506
+ private _startedWallTime?: number;
507
+ private _logger = log();
508
+
509
+ _lastSpeechEndTime?: number;
510
+ private _lastSpeechStartTime?: number;
511
+
512
+ // Pause tracking
513
+ private currentPauseStart?: number;
514
+ private pauseWallTimes: Array<[number, number]> = []; // [start, end] pairs
515
+
516
+ constructor(
517
+ recorderIO: RecorderIO,
518
+ audioOutput: AudioOutput,
519
+ writeFn: (buf: AudioFrame[]) => void,
520
+ ) {
521
+ super(audioOutput.sampleRate, audioOutput, { pause: true });
522
+ this.recorderIO = recorderIO;
523
+ this.writeFn = writeFn;
524
+ }
525
+
526
+ get startedWallTime(): number | undefined {
527
+ return this._startedWallTime;
528
+ }
529
+
530
+ get hasPendingData(): boolean {
531
+ return this.accFrames.length > 0;
532
+ }
533
+
534
+ pause(): void {
535
+ if (this.currentPauseStart === undefined && this.recorderIO.recording) {
536
+ this.currentPauseStart = Date.now();
537
+ }
538
+
539
+ if (this.nextInChain) {
540
+ this.nextInChain.pause();
541
+ }
542
+ }
543
+
544
+ /**
545
+ * Resume playback and record the pause interval
546
+ */
547
+ resume(): void {
548
+ if (this.currentPauseStart !== undefined && this.recorderIO.recording) {
549
+ this.pauseWallTimes.push([this.currentPauseStart, Date.now()]);
550
+ this.currentPauseStart = undefined;
551
+ }
552
+
553
+ if (this.nextInChain) {
554
+ this.nextInChain.resume();
555
+ }
556
+ }
557
+
558
+ private resetPauseState(): void {
559
+ this.currentPauseStart = undefined;
560
+ this.pauseWallTimes = [];
561
+ }
562
+
563
+ onPlaybackFinished(options: PlaybackFinishedEvent): void {
564
+ const finishTime = this.currentPauseStart ?? Date.now();
565
+ const trailingSilenceDuration = Math.max(0, Date.now() - finishTime);
566
+
567
+ // Convert playbackPosition from seconds to ms for internal calculations
568
+ let playbackPosition = options.playbackPosition * 1000;
569
+
570
+ if (this._lastSpeechStartTime === undefined) {
571
+ this._logger.warn(
572
+ {
573
+ finishTime,
574
+ playbackPosition,
575
+ interrupted: options.interrupted,
576
+ },
577
+ 'playback finished before speech started',
578
+ );
579
+ playbackPosition = 0;
580
+ }
581
+
582
+ // Clamp playbackPosition to actual elapsed time (all in ms)
583
+ playbackPosition = Math.max(
584
+ 0,
585
+ Math.min(finishTime - (this._lastSpeechStartTime ?? 0), playbackPosition),
586
+ );
587
+
588
+ // Convert back to seconds for the event
589
+ super.onPlaybackFinished({ ...options, playbackPosition: playbackPosition / 1000 });
590
+
591
+ if (!this.recorderIO.recording) {
592
+ return;
593
+ }
594
+
595
+ if (this.currentPauseStart !== undefined) {
596
+ this.pauseWallTimes.push([this.currentPauseStart, finishTime]);
597
+ this.currentPauseStart = undefined;
598
+ }
599
+
600
+ if (this.accFrames.length === 0) {
601
+ this.resetPauseState();
602
+ this._lastSpeechEndTime = Date.now();
603
+ this._lastSpeechStartTime = undefined;
604
+ return;
605
+ }
606
+
607
+ // pauseEvents stores (position, duration) in ms
608
+ const pauseEvents: Array<[number, number]> = [];
609
+ let playbackStartTime = finishTime - playbackPosition;
610
+
611
+ if (this.pauseWallTimes.length > 0) {
612
+ const totalPauseDuration = this.pauseWallTimes.reduce(
613
+ (sum, [start, end]) => sum + (end - start),
614
+ 0,
615
+ );
616
+ playbackStartTime = finishTime - playbackPosition - totalPauseDuration;
617
+
618
+ let accumulatedPause = 0;
619
+ for (const [pauseStart, pauseEnd] of this.pauseWallTimes) {
620
+ let position = pauseStart - playbackStartTime - accumulatedPause;
621
+ const duration = pauseEnd - pauseStart;
622
+ position = Math.max(0, Math.min(position, playbackPosition));
623
+ pauseEvents.push([position, duration]);
624
+ accumulatedPause += duration;
625
+ }
626
+ }
627
+
628
+ const buf: AudioFrame[] = [];
629
+ let accDur = 0;
630
+ const sampleRate = this.accFrames[0]!.sampleRate;
631
+ const numChannels = this.accFrames[0]!.channels;
632
+
633
+ let pauseIdx = 0;
634
+ let shouldBreak = false;
635
+
636
+ for (const frame of this.accFrames) {
637
+ let currentFrame = frame;
638
+ const frameDuration = (frame.samplesPerChannel / frame.sampleRate) * 1000;
639
+
640
+ if (frameDuration + accDur > playbackPosition) {
641
+ const [left] = splitFrame(currentFrame, (playbackPosition - accDur) / 1000);
642
+ currentFrame = left;
643
+ shouldBreak = true;
644
+ }
645
+
646
+ // Process any pauses before this frame starts
647
+ while (pauseIdx < pauseEvents.length && pauseEvents[pauseIdx]![0] <= accDur) {
648
+ const [, pauseDur] = pauseEvents[pauseIdx]!;
649
+ buf.push(createSilenceFrame(pauseDur / 1000, sampleRate, numChannels));
650
+ pauseIdx++;
651
+ }
652
+
653
+ // Process any pauses within this frame
654
+ const currentFrameDuration =
655
+ (currentFrame.samplesPerChannel / currentFrame.sampleRate) * 1000;
656
+ while (
657
+ pauseIdx < pauseEvents.length &&
658
+ pauseEvents[pauseIdx]![0] < accDur + currentFrameDuration
659
+ ) {
660
+ const [pausePos, pauseDur] = pauseEvents[pauseIdx]!;
661
+ const [left, right] = splitFrame(currentFrame, (pausePos - accDur) / 1000);
662
+ buf.push(left);
663
+ accDur += (left.samplesPerChannel / left.sampleRate) * 1000;
664
+ buf.push(createSilenceFrame(pauseDur / 1000, sampleRate, numChannels));
665
+
666
+ currentFrame = right;
667
+ pauseIdx++;
668
+ }
669
+
670
+ buf.push(currentFrame);
671
+ accDur += (currentFrame.samplesPerChannel / currentFrame.sampleRate) * 1000;
672
+
673
+ if (shouldBreak) {
674
+ break;
675
+ }
676
+ }
677
+
678
+ // Process remaining pauses
679
+ while (pauseIdx < pauseEvents.length) {
680
+ const [pausePos, pauseDur] = pauseEvents[pauseIdx]!;
681
+ if (pausePos <= playbackPosition) {
682
+ buf.push(createSilenceFrame(pauseDur / 1000, sampleRate, numChannels));
683
+ }
684
+ pauseIdx++;
685
+ }
686
+
687
+ if (buf.length > 0) {
688
+ if (trailingSilenceDuration > 0) {
689
+ buf.push(createSilenceFrame(trailingSilenceDuration / 1000, sampleRate, numChannels));
690
+ }
691
+ this.writeFn(buf);
692
+ }
693
+
694
+ this.accFrames = [];
695
+ this.resetPauseState();
696
+ this._lastSpeechEndTime = Date.now();
697
+ this._lastSpeechStartTime = undefined;
698
+ }
699
+
700
+ async captureFrame(frame: AudioFrame): Promise<void> {
701
+ if (this.nextInChain) {
702
+ await this.nextInChain.captureFrame(frame);
703
+ }
704
+
705
+ await super.captureFrame(frame);
706
+
707
+ if (this.recorderIO.recording) {
708
+ this.accFrames.push(frame);
709
+ }
710
+
711
+ if (this._startedWallTime === undefined) {
712
+ this._startedWallTime = Date.now();
713
+ }
714
+
715
+ if (this._lastSpeechStartTime === undefined) {
716
+ this._lastSpeechStartTime = Date.now();
717
+ }
718
+ }
719
+
720
+ flush(): void {
721
+ super.flush();
722
+
723
+ if (this.nextInChain) {
724
+ this.nextInChain.flush();
725
+ }
726
+ }
727
+
728
+ clearBuffer(): void {
729
+ if (this.nextInChain) {
730
+ this.nextInChain.clearBuffer();
731
+ }
732
+ }
733
+ }
734
+
735
+ /**
736
+ * Create a silent audio frame with the given duration
737
+ */
738
+ function createSilenceFrame(
739
+ durationInS: number,
740
+ sampleRate: number,
741
+ numChannels: number,
742
+ ): AudioFrame {
743
+ const samples = Math.floor(durationInS * sampleRate);
744
+ const data = new Int16Array(samples * numChannels); // Zero-filled by default
745
+ return new AudioFrame(data, sampleRate, numChannels, samples);
746
+ }
747
+
748
+ /**
749
+ * Split an audio frame at the given position (in seconds)
750
+ * Returns [left, right] frames
751
+ */
752
+ function splitFrame(frame: AudioFrame, position: number): [AudioFrame, AudioFrame] {
753
+ if (position <= 0) {
754
+ const emptyFrame = new AudioFrame(new Int16Array(0), frame.sampleRate, frame.channels, 0);
755
+ return [emptyFrame, frame];
756
+ }
757
+
758
+ const frameDuration = frame.samplesPerChannel / frame.sampleRate;
759
+ if (position >= frameDuration) {
760
+ const emptyFrame = new AudioFrame(new Int16Array(0), frame.sampleRate, frame.channels, 0);
761
+ return [frame, emptyFrame];
762
+ }
763
+
764
+ // samplesNeeded is samples per channel (i.e., sample count in time)
765
+ const samplesNeeded = Math.floor(position * frame.sampleRate);
766
+ // Int16Array: each element is one sample, interleaved by channel
767
+ // So total elements = samplesPerChannel * channels
768
+ const numChannels = frame.channels;
769
+
770
+ const leftData = frame.data.slice(0, samplesNeeded * numChannels);
771
+ const rightData = frame.data.slice(samplesNeeded * numChannels);
772
+
773
+ const leftFrame = new AudioFrame(leftData, frame.sampleRate, frame.channels, samplesNeeded);
774
+
775
+ const rightFrame = new AudioFrame(
776
+ rightData,
777
+ frame.sampleRate,
778
+ frame.channels,
779
+ frame.samplesPerChannel - samplesNeeded,
780
+ );
781
+
782
+ return [leftFrame, rightFrame];
783
+ }