@livekit/agents 1.1.0 → 1.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (959)
  1. package/dist/_exceptions.cjs.map +1 -1
  2. package/dist/_exceptions.d.ts.map +1 -1
  3. package/dist/_exceptions.js.map +1 -1
  4. package/dist/audio.cjs +89 -3
  5. package/dist/audio.cjs.map +1 -1
  6. package/dist/audio.d.cts +36 -1
  7. package/dist/audio.d.ts +36 -1
  8. package/dist/audio.d.ts.map +1 -1
  9. package/dist/audio.js +76 -2
  10. package/dist/audio.js.map +1 -1
  11. package/dist/beta/index.cjs +29 -0
  12. package/dist/beta/index.cjs.map +1 -0
  13. package/dist/beta/index.d.cts +2 -0
  14. package/dist/beta/index.d.ts +2 -0
  15. package/dist/beta/index.d.ts.map +1 -0
  16. package/dist/beta/index.js +7 -0
  17. package/dist/beta/index.js.map +1 -0
  18. package/dist/beta/workflows/index.cjs +29 -0
  19. package/dist/beta/workflows/index.cjs.map +1 -0
  20. package/dist/beta/workflows/index.d.cts +2 -0
  21. package/dist/beta/workflows/index.d.ts +2 -0
  22. package/dist/beta/workflows/index.d.ts.map +1 -0
  23. package/dist/beta/workflows/index.js +7 -0
  24. package/dist/beta/workflows/index.js.map +1 -0
  25. package/dist/beta/workflows/task_group.cjs +165 -0
  26. package/dist/beta/workflows/task_group.cjs.map +1 -0
  27. package/dist/beta/workflows/task_group.d.cts +32 -0
  28. package/dist/beta/workflows/task_group.d.ts +32 -0
  29. package/dist/beta/workflows/task_group.d.ts.map +1 -0
  30. package/dist/beta/workflows/task_group.js +141 -0
  31. package/dist/beta/workflows/task_group.js.map +1 -0
  32. package/dist/cli.cjs +44 -46
  33. package/dist/cli.cjs.map +1 -1
  34. package/dist/cli.d.cts +3 -3
  35. package/dist/cli.d.ts +3 -3
  36. package/dist/cli.d.ts.map +1 -1
  37. package/dist/cli.js +45 -47
  38. package/dist/cli.js.map +1 -1
  39. package/dist/connection_pool.cjs +242 -0
  40. package/dist/connection_pool.cjs.map +1 -0
  41. package/dist/connection_pool.d.cts +123 -0
  42. package/dist/connection_pool.d.ts +123 -0
  43. package/dist/connection_pool.d.ts.map +1 -0
  44. package/dist/connection_pool.js +218 -0
  45. package/dist/connection_pool.js.map +1 -0
  46. package/dist/connection_pool.test.cjs +256 -0
  47. package/dist/connection_pool.test.cjs.map +1 -0
  48. package/dist/connection_pool.test.js +255 -0
  49. package/dist/connection_pool.test.js.map +1 -0
  50. package/dist/constants.cjs +30 -0
  51. package/dist/constants.cjs.map +1 -1
  52. package/dist/constants.d.cts +10 -0
  53. package/dist/constants.d.ts +10 -0
  54. package/dist/constants.d.ts.map +1 -1
  55. package/dist/constants.js +20 -0
  56. package/dist/constants.js.map +1 -1
  57. package/dist/cpu.cjs +189 -0
  58. package/dist/cpu.cjs.map +1 -0
  59. package/dist/cpu.d.cts +24 -0
  60. package/dist/cpu.d.ts +24 -0
  61. package/dist/cpu.d.ts.map +1 -0
  62. package/dist/cpu.js +152 -0
  63. package/dist/cpu.js.map +1 -0
  64. package/dist/cpu.test.cjs +227 -0
  65. package/dist/cpu.test.cjs.map +1 -0
  66. package/dist/cpu.test.js +204 -0
  67. package/dist/cpu.test.js.map +1 -0
  68. package/dist/http_server.cjs +9 -6
  69. package/dist/http_server.cjs.map +1 -1
  70. package/dist/http_server.d.cts +5 -1
  71. package/dist/http_server.d.ts +5 -1
  72. package/dist/http_server.d.ts.map +1 -1
  73. package/dist/http_server.js +9 -6
  74. package/dist/http_server.js.map +1 -1
  75. package/dist/index.cjs +24 -9
  76. package/dist/index.cjs.map +1 -1
  77. package/dist/index.d.cts +15 -11
  78. package/dist/index.d.ts +15 -11
  79. package/dist/index.d.ts.map +1 -1
  80. package/dist/index.js +18 -9
  81. package/dist/index.js.map +1 -1
  82. package/dist/inference/api_protos.cjs +70 -2
  83. package/dist/inference/api_protos.cjs.map +1 -1
  84. package/dist/inference/api_protos.d.cts +373 -32
  85. package/dist/inference/api_protos.d.ts +373 -32
  86. package/dist/inference/api_protos.d.ts.map +1 -1
  87. package/dist/inference/api_protos.js +62 -2
  88. package/dist/inference/api_protos.js.map +1 -1
  89. package/dist/inference/index.cjs +8 -0
  90. package/dist/inference/index.cjs.map +1 -1
  91. package/dist/inference/index.d.cts +3 -4
  92. package/dist/inference/index.d.ts +3 -4
  93. package/dist/inference/index.d.ts.map +1 -1
  94. package/dist/inference/index.js +18 -3
  95. package/dist/inference/index.js.map +1 -1
  96. package/dist/inference/interruption/defaults.cjs +81 -0
  97. package/dist/inference/interruption/defaults.cjs.map +1 -0
  98. package/dist/inference/interruption/defaults.d.cts +19 -0
  99. package/dist/inference/interruption/defaults.d.ts +19 -0
  100. package/dist/inference/interruption/defaults.d.ts.map +1 -0
  101. package/dist/inference/interruption/defaults.js +46 -0
  102. package/dist/inference/interruption/defaults.js.map +1 -0
  103. package/dist/inference/interruption/errors.cjs +44 -0
  104. package/dist/inference/interruption/errors.cjs.map +1 -0
  105. package/dist/inference/interruption/errors.d.cts +12 -0
  106. package/dist/inference/interruption/errors.d.ts +12 -0
  107. package/dist/inference/interruption/errors.d.ts.map +1 -0
  108. package/dist/inference/interruption/errors.js +20 -0
  109. package/dist/inference/interruption/errors.js.map +1 -0
  110. package/dist/inference/interruption/http_transport.cjs +163 -0
  111. package/dist/inference/interruption/http_transport.cjs.map +1 -0
  112. package/dist/inference/interruption/http_transport.d.cts +65 -0
  113. package/dist/inference/interruption/http_transport.d.ts +65 -0
  114. package/dist/inference/interruption/http_transport.d.ts.map +1 -0
  115. package/dist/inference/interruption/http_transport.js +137 -0
  116. package/dist/inference/interruption/http_transport.js.map +1 -0
  117. package/dist/inference/interruption/interruption_cache_entry.cjs +58 -0
  118. package/dist/inference/interruption/interruption_cache_entry.cjs.map +1 -0
  119. package/dist/inference/interruption/interruption_cache_entry.d.cts +30 -0
  120. package/dist/inference/interruption/interruption_cache_entry.d.ts +30 -0
  121. package/dist/inference/interruption/interruption_cache_entry.d.ts.map +1 -0
  122. package/dist/inference/interruption/interruption_cache_entry.js +34 -0
  123. package/dist/inference/interruption/interruption_cache_entry.js.map +1 -0
  124. package/dist/inference/interruption/interruption_detector.cjs +198 -0
  125. package/dist/inference/interruption/interruption_detector.cjs.map +1 -0
  126. package/dist/inference/interruption/interruption_detector.d.cts +59 -0
  127. package/dist/inference/interruption/interruption_detector.d.ts +59 -0
  128. package/dist/inference/interruption/interruption_detector.d.ts.map +1 -0
  129. package/dist/inference/interruption/interruption_detector.js +164 -0
  130. package/dist/inference/interruption/interruption_detector.js.map +1 -0
  131. package/dist/inference/interruption/interruption_stream.cjs +368 -0
  132. package/dist/inference/interruption/interruption_stream.cjs.map +1 -0
  133. package/dist/inference/interruption/interruption_stream.d.cts +46 -0
  134. package/dist/inference/interruption/interruption_stream.d.ts +46 -0
  135. package/dist/inference/interruption/interruption_stream.d.ts.map +1 -0
  136. package/dist/inference/interruption/interruption_stream.js +344 -0
  137. package/dist/inference/interruption/interruption_stream.js.map +1 -0
  138. package/dist/inference/interruption/types.cjs +17 -0
  139. package/dist/inference/interruption/types.cjs.map +1 -0
  140. package/dist/inference/interruption/types.d.cts +66 -0
  141. package/dist/inference/interruption/types.d.ts +66 -0
  142. package/dist/inference/interruption/types.d.ts.map +1 -0
  143. package/dist/inference/interruption/types.js +1 -0
  144. package/dist/inference/interruption/types.js.map +1 -0
  145. package/dist/inference/interruption/utils.cjs +130 -0
  146. package/dist/inference/interruption/utils.cjs.map +1 -0
  147. package/dist/inference/interruption/utils.d.cts +41 -0
  148. package/dist/inference/interruption/utils.d.ts +41 -0
  149. package/dist/inference/interruption/utils.d.ts.map +1 -0
  150. package/dist/inference/interruption/utils.js +105 -0
  151. package/dist/inference/interruption/utils.js.map +1 -0
  152. package/dist/inference/interruption/utils.test.cjs +105 -0
  153. package/dist/inference/interruption/utils.test.cjs.map +1 -0
  154. package/dist/inference/interruption/utils.test.js +104 -0
  155. package/dist/inference/interruption/utils.test.js.map +1 -0
  156. package/dist/inference/interruption/ws_transport.cjs +347 -0
  157. package/dist/inference/interruption/ws_transport.cjs.map +1 -0
  158. package/dist/inference/interruption/ws_transport.d.cts +33 -0
  159. package/dist/inference/interruption/ws_transport.d.ts +33 -0
  160. package/dist/inference/interruption/ws_transport.d.ts.map +1 -0
  161. package/dist/inference/interruption/ws_transport.js +313 -0
  162. package/dist/inference/interruption/ws_transport.js.map +1 -0
  163. package/dist/inference/llm.cjs +106 -66
  164. package/dist/inference/llm.cjs.map +1 -1
  165. package/dist/inference/llm.d.cts +65 -43
  166. package/dist/inference/llm.d.ts +65 -43
  167. package/dist/inference/llm.d.ts.map +1 -1
  168. package/dist/inference/llm.js +100 -66
  169. package/dist/inference/llm.js.map +1 -1
  170. package/dist/inference/stt.cjs +319 -170
  171. package/dist/inference/stt.cjs.map +1 -1
  172. package/dist/inference/stt.d.cts +64 -15
  173. package/dist/inference/stt.d.ts +64 -15
  174. package/dist/inference/stt.d.ts.map +1 -1
  175. package/dist/inference/stt.js +319 -170
  176. package/dist/inference/stt.js.map +1 -1
  177. package/dist/inference/stt.test.cjs +218 -0
  178. package/dist/inference/stt.test.cjs.map +1 -0
  179. package/dist/inference/stt.test.js +217 -0
  180. package/dist/inference/stt.test.js.map +1 -0
  181. package/dist/inference/tts.cjs +249 -71
  182. package/dist/inference/tts.cjs.map +1 -1
  183. package/dist/inference/tts.d.cts +94 -17
  184. package/dist/inference/tts.d.ts +94 -17
  185. package/dist/inference/tts.d.ts.map +1 -1
  186. package/dist/inference/tts.js +249 -77
  187. package/dist/inference/tts.js.map +1 -1
  188. package/dist/inference/tts.test.cjs +305 -0
  189. package/dist/inference/tts.test.cjs.map +1 -0
  190. package/dist/inference/tts.test.js +304 -0
  191. package/dist/inference/tts.test.js.map +1 -0
  192. package/dist/inference/utils.cjs +26 -7
  193. package/dist/inference/utils.cjs.map +1 -1
  194. package/dist/inference/utils.d.cts +14 -1
  195. package/dist/inference/utils.d.ts +14 -1
  196. package/dist/inference/utils.d.ts.map +1 -1
  197. package/dist/inference/utils.js +18 -2
  198. package/dist/inference/utils.js.map +1 -1
  199. package/dist/ipc/inference_proc_executor.cjs +6 -3
  200. package/dist/ipc/inference_proc_executor.cjs.map +1 -1
  201. package/dist/ipc/inference_proc_executor.d.ts.map +1 -1
  202. package/dist/ipc/inference_proc_executor.js +6 -3
  203. package/dist/ipc/inference_proc_executor.js.map +1 -1
  204. package/dist/ipc/inference_proc_lazy_main.cjs +13 -1
  205. package/dist/ipc/inference_proc_lazy_main.cjs.map +1 -1
  206. package/dist/ipc/inference_proc_lazy_main.js +13 -1
  207. package/dist/ipc/inference_proc_lazy_main.js.map +1 -1
  208. package/dist/ipc/job_proc_executor.cjs +6 -1
  209. package/dist/ipc/job_proc_executor.cjs.map +1 -1
  210. package/dist/ipc/job_proc_executor.d.ts.map +1 -1
  211. package/dist/ipc/job_proc_executor.js +6 -1
  212. package/dist/ipc/job_proc_executor.js.map +1 -1
  213. package/dist/ipc/job_proc_lazy_main.cjs +89 -17
  214. package/dist/ipc/job_proc_lazy_main.cjs.map +1 -1
  215. package/dist/ipc/job_proc_lazy_main.js +68 -18
  216. package/dist/ipc/job_proc_lazy_main.js.map +1 -1
  217. package/dist/ipc/supervised_proc.cjs +34 -8
  218. package/dist/ipc/supervised_proc.cjs.map +1 -1
  219. package/dist/ipc/supervised_proc.d.cts +8 -0
  220. package/dist/ipc/supervised_proc.d.ts +8 -0
  221. package/dist/ipc/supervised_proc.d.ts.map +1 -1
  222. package/dist/ipc/supervised_proc.js +34 -8
  223. package/dist/ipc/supervised_proc.js.map +1 -1
  224. package/dist/ipc/supervised_proc.test.cjs +145 -0
  225. package/dist/ipc/supervised_proc.test.cjs.map +1 -0
  226. package/dist/ipc/supervised_proc.test.js +122 -0
  227. package/dist/ipc/supervised_proc.test.js.map +1 -0
  228. package/dist/job.cjs +109 -1
  229. package/dist/job.cjs.map +1 -1
  230. package/dist/job.d.cts +14 -0
  231. package/dist/job.d.ts +14 -0
  232. package/dist/job.d.ts.map +1 -1
  233. package/dist/job.js +99 -1
  234. package/dist/job.js.map +1 -1
  235. package/dist/language.cjs +394 -0
  236. package/dist/language.cjs.map +1 -0
  237. package/dist/language.d.cts +15 -0
  238. package/dist/language.d.ts +15 -0
  239. package/dist/language.d.ts.map +1 -0
  240. package/dist/language.js +363 -0
  241. package/dist/language.js.map +1 -0
  242. package/dist/language.test.cjs +43 -0
  243. package/dist/language.test.cjs.map +1 -0
  244. package/dist/language.test.js +49 -0
  245. package/dist/language.test.js.map +1 -0
  246. package/dist/llm/chat_context.cjs +345 -3
  247. package/dist/llm/chat_context.cjs.map +1 -1
  248. package/dist/llm/chat_context.d.cts +86 -2
  249. package/dist/llm/chat_context.d.ts +86 -2
  250. package/dist/llm/chat_context.d.ts.map +1 -1
  251. package/dist/llm/chat_context.js +344 -3
  252. package/dist/llm/chat_context.js.map +1 -1
  253. package/dist/llm/chat_context.test.cjs +692 -0
  254. package/dist/llm/chat_context.test.cjs.map +1 -1
  255. package/dist/llm/chat_context.test.js +692 -0
  256. package/dist/llm/chat_context.test.js.map +1 -1
  257. package/dist/llm/fallback_adapter.cjs +280 -0
  258. package/dist/llm/fallback_adapter.cjs.map +1 -0
  259. package/dist/llm/fallback_adapter.d.cts +73 -0
  260. package/dist/llm/fallback_adapter.d.ts +73 -0
  261. package/dist/llm/fallback_adapter.d.ts.map +1 -0
  262. package/dist/llm/fallback_adapter.js +256 -0
  263. package/dist/llm/fallback_adapter.js.map +1 -0
  264. package/dist/llm/fallback_adapter.test.cjs +176 -0
  265. package/dist/llm/fallback_adapter.test.cjs.map +1 -0
  266. package/dist/llm/fallback_adapter.test.js +175 -0
  267. package/dist/llm/fallback_adapter.test.js.map +1 -0
  268. package/dist/llm/index.cjs +11 -0
  269. package/dist/llm/index.cjs.map +1 -1
  270. package/dist/llm/index.d.cts +4 -3
  271. package/dist/llm/index.d.ts +4 -3
  272. package/dist/llm/index.d.ts.map +1 -1
  273. package/dist/llm/index.js +13 -1
  274. package/dist/llm/index.js.map +1 -1
  275. package/dist/llm/llm.cjs +65 -11
  276. package/dist/llm/llm.cjs.map +1 -1
  277. package/dist/llm/llm.d.cts +13 -2
  278. package/dist/llm/llm.d.ts +13 -2
  279. package/dist/llm/llm.d.ts.map +1 -1
  280. package/dist/llm/llm.js +65 -11
  281. package/dist/llm/llm.js.map +1 -1
  282. package/dist/llm/provider_format/google.cjs +6 -2
  283. package/dist/llm/provider_format/google.cjs.map +1 -1
  284. package/dist/llm/provider_format/google.d.cts +1 -1
  285. package/dist/llm/provider_format/google.d.ts +1 -1
  286. package/dist/llm/provider_format/google.d.ts.map +1 -1
  287. package/dist/llm/provider_format/google.js +6 -2
  288. package/dist/llm/provider_format/google.js.map +1 -1
  289. package/dist/llm/provider_format/google.test.cjs +48 -0
  290. package/dist/llm/provider_format/google.test.cjs.map +1 -1
  291. package/dist/llm/provider_format/google.test.js +54 -1
  292. package/dist/llm/provider_format/google.test.js.map +1 -1
  293. package/dist/llm/provider_format/index.cjs +2 -0
  294. package/dist/llm/provider_format/index.cjs.map +1 -1
  295. package/dist/llm/provider_format/index.d.cts +2 -2
  296. package/dist/llm/provider_format/index.d.ts +2 -2
  297. package/dist/llm/provider_format/index.d.ts.map +1 -1
  298. package/dist/llm/provider_format/index.js +6 -1
  299. package/dist/llm/provider_format/index.js.map +1 -1
  300. package/dist/llm/provider_format/openai.cjs +126 -24
  301. package/dist/llm/provider_format/openai.cjs.map +1 -1
  302. package/dist/llm/provider_format/openai.d.cts +1 -0
  303. package/dist/llm/provider_format/openai.d.ts +1 -0
  304. package/dist/llm/provider_format/openai.d.ts.map +1 -1
  305. package/dist/llm/provider_format/openai.js +124 -23
  306. package/dist/llm/provider_format/openai.js.map +1 -1
  307. package/dist/llm/provider_format/openai.test.cjs +393 -0
  308. package/dist/llm/provider_format/openai.test.cjs.map +1 -1
  309. package/dist/llm/provider_format/openai.test.js +400 -2
  310. package/dist/llm/provider_format/openai.test.js.map +1 -1
  311. package/dist/llm/provider_format/utils.cjs +5 -4
  312. package/dist/llm/provider_format/utils.cjs.map +1 -1
  313. package/dist/llm/provider_format/utils.d.ts.map +1 -1
  314. package/dist/llm/provider_format/utils.js +5 -4
  315. package/dist/llm/provider_format/utils.js.map +1 -1
  316. package/dist/llm/realtime.cjs +3 -0
  317. package/dist/llm/realtime.cjs.map +1 -1
  318. package/dist/llm/realtime.d.cts +15 -1
  319. package/dist/llm/realtime.d.ts +15 -1
  320. package/dist/llm/realtime.d.ts.map +1 -1
  321. package/dist/llm/realtime.js +3 -0
  322. package/dist/llm/realtime.js.map +1 -1
  323. package/dist/llm/remote_chat_context.cjs.map +1 -1
  324. package/dist/llm/remote_chat_context.d.cts +2 -0
  325. package/dist/llm/remote_chat_context.d.ts +2 -0
  326. package/dist/llm/remote_chat_context.d.ts.map +1 -1
  327. package/dist/llm/remote_chat_context.js.map +1 -1
  328. package/dist/llm/tool_context.cjs +50 -2
  329. package/dist/llm/tool_context.cjs.map +1 -1
  330. package/dist/llm/tool_context.d.cts +47 -11
  331. package/dist/llm/tool_context.d.ts +47 -11
  332. package/dist/llm/tool_context.d.ts.map +1 -1
  333. package/dist/llm/tool_context.js +48 -3
  334. package/dist/llm/tool_context.js.map +1 -1
  335. package/dist/llm/tool_context.test.cjs +197 -0
  336. package/dist/llm/tool_context.test.cjs.map +1 -1
  337. package/dist/llm/tool_context.test.js +175 -0
  338. package/dist/llm/tool_context.test.js.map +1 -1
  339. package/dist/llm/utils.cjs +107 -12
  340. package/dist/llm/utils.cjs.map +1 -1
  341. package/dist/llm/utils.d.cts +10 -3
  342. package/dist/llm/utils.d.ts +10 -3
  343. package/dist/llm/utils.d.ts.map +1 -1
  344. package/dist/llm/utils.js +106 -12
  345. package/dist/llm/utils.js.map +1 -1
  346. package/dist/llm/utils.test.cjs +90 -0
  347. package/dist/llm/utils.test.cjs.map +1 -1
  348. package/dist/llm/utils.test.js +98 -2
  349. package/dist/llm/utils.test.js.map +1 -1
  350. package/dist/llm/zod-utils.cjs +102 -0
  351. package/dist/llm/zod-utils.cjs.map +1 -0
  352. package/dist/llm/zod-utils.d.cts +65 -0
  353. package/dist/llm/zod-utils.d.ts +65 -0
  354. package/dist/llm/zod-utils.d.ts.map +1 -0
  355. package/dist/llm/zod-utils.js +64 -0
  356. package/dist/llm/zod-utils.js.map +1 -0
  357. package/dist/llm/zod-utils.test.cjs +472 -0
  358. package/dist/llm/zod-utils.test.cjs.map +1 -0
  359. package/dist/llm/zod-utils.test.js +455 -0
  360. package/dist/llm/zod-utils.test.js.map +1 -0
  361. package/dist/log.cjs +45 -14
  362. package/dist/log.cjs.map +1 -1
  363. package/dist/log.d.cts +8 -1
  364. package/dist/log.d.ts +8 -1
  365. package/dist/log.d.ts.map +1 -1
  366. package/dist/log.js +45 -15
  367. package/dist/log.js.map +1 -1
  368. package/dist/metrics/base.cjs.map +1 -1
  369. package/dist/metrics/base.d.cts +75 -19
  370. package/dist/metrics/base.d.ts +75 -19
  371. package/dist/metrics/base.d.ts.map +1 -1
  372. package/dist/metrics/index.cjs +5 -0
  373. package/dist/metrics/index.cjs.map +1 -1
  374. package/dist/metrics/index.d.cts +2 -1
  375. package/dist/metrics/index.d.ts +2 -1
  376. package/dist/metrics/index.d.ts.map +1 -1
  377. package/dist/metrics/index.js +6 -0
  378. package/dist/metrics/index.js.map +1 -1
  379. package/dist/metrics/model_usage.cjs +189 -0
  380. package/dist/metrics/model_usage.cjs.map +1 -0
  381. package/dist/metrics/model_usage.d.cts +92 -0
  382. package/dist/metrics/model_usage.d.ts +92 -0
  383. package/dist/metrics/model_usage.d.ts.map +1 -0
  384. package/dist/metrics/model_usage.js +164 -0
  385. package/dist/metrics/model_usage.js.map +1 -0
  386. package/dist/metrics/model_usage.test.cjs +474 -0
  387. package/dist/metrics/model_usage.test.cjs.map +1 -0
  388. package/dist/metrics/model_usage.test.js +476 -0
  389. package/dist/metrics/model_usage.test.js.map +1 -0
  390. package/dist/metrics/usage_collector.cjs +5 -2
  391. package/dist/metrics/usage_collector.cjs.map +1 -1
  392. package/dist/metrics/usage_collector.d.cts +10 -1
  393. package/dist/metrics/usage_collector.d.ts +10 -1
  394. package/dist/metrics/usage_collector.d.ts.map +1 -1
  395. package/dist/metrics/usage_collector.js +5 -2
  396. package/dist/metrics/usage_collector.js.map +1 -1
  397. package/dist/metrics/utils.cjs +23 -7
  398. package/dist/metrics/utils.cjs.map +1 -1
  399. package/dist/metrics/utils.d.ts.map +1 -1
  400. package/dist/metrics/utils.js +23 -7
  401. package/dist/metrics/utils.js.map +1 -1
  402. package/dist/stream/deferred_stream.cjs +31 -10
  403. package/dist/stream/deferred_stream.cjs.map +1 -1
  404. package/dist/stream/deferred_stream.d.cts +6 -1
  405. package/dist/stream/deferred_stream.d.ts +6 -1
  406. package/dist/stream/deferred_stream.d.ts.map +1 -1
  407. package/dist/stream/deferred_stream.js +31 -10
  408. package/dist/stream/deferred_stream.js.map +1 -1
  409. package/dist/stream/deferred_stream.test.cjs +2 -2
  410. package/dist/stream/deferred_stream.test.cjs.map +1 -1
  411. package/dist/stream/deferred_stream.test.js +2 -2
  412. package/dist/stream/deferred_stream.test.js.map +1 -1
  413. package/dist/stream/index.cjs +3 -0
  414. package/dist/stream/index.cjs.map +1 -1
  415. package/dist/stream/index.d.cts +1 -0
  416. package/dist/stream/index.d.ts +1 -0
  417. package/dist/stream/index.d.ts.map +1 -1
  418. package/dist/stream/index.js +2 -0
  419. package/dist/stream/index.js.map +1 -1
  420. package/dist/stream/multi_input_stream.cjs +139 -0
  421. package/dist/stream/multi_input_stream.cjs.map +1 -0
  422. package/dist/stream/multi_input_stream.d.cts +55 -0
  423. package/dist/stream/multi_input_stream.d.ts +55 -0
  424. package/dist/stream/multi_input_stream.d.ts.map +1 -0
  425. package/dist/stream/multi_input_stream.js +115 -0
  426. package/dist/stream/multi_input_stream.js.map +1 -0
  427. package/dist/stream/multi_input_stream.test.cjs +344 -0
  428. package/dist/stream/multi_input_stream.test.cjs.map +1 -0
  429. package/dist/stream/multi_input_stream.test.js +343 -0
  430. package/dist/stream/multi_input_stream.test.js.map +1 -0
  431. package/dist/stream/stream_channel.cjs +39 -1
  432. package/dist/stream/stream_channel.cjs.map +1 -1
  433. package/dist/stream/stream_channel.d.cts +5 -2
  434. package/dist/stream/stream_channel.d.ts +5 -2
  435. package/dist/stream/stream_channel.d.ts.map +1 -1
  436. package/dist/stream/stream_channel.js +39 -1
  437. package/dist/stream/stream_channel.js.map +1 -1
  438. package/dist/stream/stream_channel.test.cjs +27 -0
  439. package/dist/stream/stream_channel.test.cjs.map +1 -1
  440. package/dist/stream/stream_channel.test.js +27 -0
  441. package/dist/stream/stream_channel.test.js.map +1 -1
  442. package/dist/stt/stream_adapter.cjs +24 -9
  443. package/dist/stt/stream_adapter.cjs.map +1 -1
  444. package/dist/stt/stream_adapter.d.cts +7 -3
  445. package/dist/stt/stream_adapter.d.ts +7 -3
  446. package/dist/stt/stream_adapter.d.ts.map +1 -1
  447. package/dist/stt/stream_adapter.js +24 -9
  448. package/dist/stt/stream_adapter.js.map +1 -1
  449. package/dist/stt/stt.cjs +94 -19
  450. package/dist/stt/stt.cjs.map +1 -1
  451. package/dist/stt/stt.d.cts +68 -5
  452. package/dist/stt/stt.d.ts +68 -5
  453. package/dist/stt/stt.d.ts.map +1 -1
  454. package/dist/stt/stt.js +96 -21
  455. package/dist/stt/stt.js.map +1 -1
  456. package/dist/telemetry/index.cjs +72 -0
  457. package/dist/telemetry/index.cjs.map +1 -0
  458. package/dist/telemetry/index.d.cts +7 -0
  459. package/dist/telemetry/index.d.ts +7 -0
  460. package/dist/telemetry/index.d.ts.map +1 -0
  461. package/dist/telemetry/index.js +37 -0
  462. package/dist/telemetry/index.js.map +1 -0
  463. package/dist/telemetry/logging.cjs +65 -0
  464. package/dist/telemetry/logging.cjs.map +1 -0
  465. package/dist/telemetry/logging.d.cts +21 -0
  466. package/dist/telemetry/logging.d.ts +21 -0
  467. package/dist/telemetry/logging.d.ts.map +1 -0
  468. package/dist/telemetry/logging.js +40 -0
  469. package/dist/telemetry/logging.js.map +1 -0
  470. package/dist/telemetry/otel_http_exporter.cjs +166 -0
  471. package/dist/telemetry/otel_http_exporter.cjs.map +1 -0
  472. package/dist/telemetry/otel_http_exporter.d.cts +63 -0
  473. package/dist/telemetry/otel_http_exporter.d.ts +63 -0
  474. package/dist/telemetry/otel_http_exporter.d.ts.map +1 -0
  475. package/dist/telemetry/otel_http_exporter.js +142 -0
  476. package/dist/telemetry/otel_http_exporter.js.map +1 -0
  477. package/dist/telemetry/pino_otel_transport.cjs +217 -0
  478. package/dist/telemetry/pino_otel_transport.cjs.map +1 -0
  479. package/dist/telemetry/pino_otel_transport.d.cts +58 -0
  480. package/dist/telemetry/pino_otel_transport.d.ts +58 -0
  481. package/dist/telemetry/pino_otel_transport.d.ts.map +1 -0
  482. package/dist/telemetry/pino_otel_transport.js +189 -0
  483. package/dist/telemetry/pino_otel_transport.js.map +1 -0
  484. package/dist/telemetry/trace_types.cjs +233 -0
  485. package/dist/telemetry/trace_types.cjs.map +1 -0
  486. package/dist/telemetry/trace_types.d.cts +74 -0
  487. package/dist/telemetry/trace_types.d.ts +74 -0
  488. package/dist/telemetry/trace_types.d.ts.map +1 -0
  489. package/dist/telemetry/trace_types.js +141 -0
  490. package/dist/telemetry/trace_types.js.map +1 -0
  491. package/dist/telemetry/traces.cjs +484 -0
  492. package/dist/telemetry/traces.cjs.map +1 -0
  493. package/dist/telemetry/traces.d.cts +116 -0
  494. package/dist/telemetry/traces.d.ts +116 -0
  495. package/dist/telemetry/traces.d.ts.map +1 -0
  496. package/dist/telemetry/traces.js +449 -0
  497. package/dist/telemetry/traces.js.map +1 -0
  498. package/dist/telemetry/utils.cjs +86 -0
  499. package/dist/telemetry/utils.cjs.map +1 -0
  500. package/dist/telemetry/utils.d.cts +5 -0
  501. package/dist/telemetry/utils.d.ts +5 -0
  502. package/dist/telemetry/utils.d.ts.map +1 -0
  503. package/dist/telemetry/utils.js +51 -0
  504. package/dist/telemetry/utils.js.map +1 -0
  505. package/dist/tokenize/basic/sentence.cjs +3 -3
  506. package/dist/tokenize/basic/sentence.cjs.map +1 -1
  507. package/dist/tokenize/basic/sentence.js +3 -3
  508. package/dist/tokenize/basic/sentence.js.map +1 -1
  509. package/dist/tokenize/tokenizer.test.cjs +3 -1
  510. package/dist/tokenize/tokenizer.test.cjs.map +1 -1
  511. package/dist/tokenize/tokenizer.test.js +3 -1
  512. package/dist/tokenize/tokenizer.test.js.map +1 -1
  513. package/dist/transcription.cjs.map +1 -1
  514. package/dist/transcription.d.cts +6 -0
  515. package/dist/transcription.d.ts +6 -0
  516. package/dist/transcription.d.ts.map +1 -1
  517. package/dist/transcription.js.map +1 -1
  518. package/dist/tts/fallback_adapter.cjs +472 -0
  519. package/dist/tts/fallback_adapter.cjs.map +1 -0
  520. package/dist/tts/fallback_adapter.d.cts +110 -0
  521. package/dist/tts/fallback_adapter.d.ts +110 -0
  522. package/dist/tts/fallback_adapter.d.ts.map +1 -0
  523. package/dist/tts/fallback_adapter.js +448 -0
  524. package/dist/tts/fallback_adapter.js.map +1 -0
  525. package/dist/tts/index.cjs +3 -0
  526. package/dist/tts/index.cjs.map +1 -1
  527. package/dist/tts/index.d.cts +1 -0
  528. package/dist/tts/index.d.ts +1 -0
  529. package/dist/tts/index.d.ts.map +1 -1
  530. package/dist/tts/index.js +2 -0
  531. package/dist/tts/index.js.map +1 -1
  532. package/dist/tts/stream_adapter.cjs +25 -8
  533. package/dist/tts/stream_adapter.cjs.map +1 -1
  534. package/dist/tts/stream_adapter.d.cts +6 -3
  535. package/dist/tts/stream_adapter.d.ts +6 -3
  536. package/dist/tts/stream_adapter.d.ts.map +1 -1
  537. package/dist/tts/stream_adapter.js +25 -8
  538. package/dist/tts/stream_adapter.js.map +1 -1
  539. package/dist/tts/tts.cjs +189 -57
  540. package/dist/tts/tts.cjs.map +1 -1
  541. package/dist/tts/tts.d.cts +58 -6
  542. package/dist/tts/tts.d.ts +58 -6
  543. package/dist/tts/tts.d.ts.map +1 -1
  544. package/dist/tts/tts.js +191 -59
  545. package/dist/tts/tts.js.map +1 -1
  546. package/dist/typed_promise.cjs +48 -0
  547. package/dist/typed_promise.cjs.map +1 -0
  548. package/dist/typed_promise.d.cts +24 -0
  549. package/dist/typed_promise.d.ts +24 -0
  550. package/dist/typed_promise.d.ts.map +1 -0
  551. package/dist/typed_promise.js +28 -0
  552. package/dist/typed_promise.js.map +1 -0
  553. package/dist/types.cjs +24 -32
  554. package/dist/types.cjs.map +1 -1
  555. package/dist/types.d.cts +45 -10
  556. package/dist/types.d.ts +45 -10
  557. package/dist/types.d.ts.map +1 -1
  558. package/dist/types.js +20 -30
  559. package/dist/types.js.map +1 -1
  560. package/dist/utils.cjs +124 -28
  561. package/dist/utils.cjs.map +1 -1
  562. package/dist/utils.d.cts +41 -1
  563. package/dist/utils.d.ts +41 -1
  564. package/dist/utils.d.ts.map +1 -1
  565. package/dist/utils.js +119 -27
  566. package/dist/utils.js.map +1 -1
  567. package/dist/utils.test.cjs +73 -1
  568. package/dist/utils.test.cjs.map +1 -1
  569. package/dist/utils.test.js +74 -10
  570. package/dist/utils.test.js.map +1 -1
  571. package/dist/vad.cjs +35 -15
  572. package/dist/vad.cjs.map +1 -1
  573. package/dist/vad.d.cts +15 -5
  574. package/dist/vad.d.ts +15 -5
  575. package/dist/vad.d.ts.map +1 -1
  576. package/dist/vad.js +35 -15
  577. package/dist/vad.js.map +1 -1
  578. package/dist/version.cjs +1 -1
  579. package/dist/version.cjs.map +1 -1
  580. package/dist/version.d.cts +1 -1
  581. package/dist/version.d.ts +1 -1
  582. package/dist/version.d.ts.map +1 -1
  583. package/dist/version.js +1 -1
  584. package/dist/version.js.map +1 -1
  585. package/dist/voice/agent.cjs +258 -35
  586. package/dist/voice/agent.cjs.map +1 -1
  587. package/dist/voice/agent.d.cts +54 -13
  588. package/dist/voice/agent.d.ts +54 -13
  589. package/dist/voice/agent.d.ts.map +1 -1
  590. package/dist/voice/agent.js +254 -34
  591. package/dist/voice/agent.js.map +1 -1
  592. package/dist/voice/agent.test.cjs +314 -0
  593. package/dist/voice/agent.test.cjs.map +1 -1
  594. package/dist/voice/agent.test.js +316 -2
  595. package/dist/voice/agent.test.js.map +1 -1
  596. package/dist/voice/agent_activity.cjs +1116 -385
  597. package/dist/voice/agent_activity.cjs.map +1 -1
  598. package/dist/voice/agent_activity.d.cts +72 -11
  599. package/dist/voice/agent_activity.d.ts +72 -11
  600. package/dist/voice/agent_activity.d.ts.map +1 -1
  601. package/dist/voice/agent_activity.js +1119 -383
  602. package/dist/voice/agent_activity.js.map +1 -1
  603. package/dist/voice/agent_activity.test.cjs +135 -0
  604. package/dist/voice/agent_activity.test.cjs.map +1 -0
  605. package/dist/voice/agent_activity.test.js +134 -0
  606. package/dist/voice/agent_activity.test.js.map +1 -0
  607. package/dist/voice/agent_session.cjs +550 -90
  608. package/dist/voice/agent_session.cjs.map +1 -1
  609. package/dist/voice/agent_session.d.cts +185 -25
  610. package/dist/voice/agent_session.d.ts +185 -25
  611. package/dist/voice/agent_session.d.ts.map +1 -1
  612. package/dist/voice/agent_session.js +556 -91
  613. package/dist/voice/agent_session.js.map +1 -1
  614. package/dist/voice/audio_recognition.cjs +605 -46
  615. package/dist/voice/audio_recognition.cjs.map +1 -1
  616. package/dist/voice/audio_recognition.d.cts +96 -4
  617. package/dist/voice/audio_recognition.d.ts +96 -4
  618. package/dist/voice/audio_recognition.d.ts.map +1 -1
  619. package/dist/voice/audio_recognition.js +611 -47
  620. package/dist/voice/audio_recognition.js.map +1 -1
  621. package/dist/voice/audio_recognition_span.test.cjs +295 -0
  622. package/dist/voice/audio_recognition_span.test.cjs.map +1 -0
  623. package/dist/voice/audio_recognition_span.test.js +299 -0
  624. package/dist/voice/audio_recognition_span.test.js.map +1 -0
  625. package/dist/voice/avatar/datastream_io.cjs +7 -1
  626. package/dist/voice/avatar/datastream_io.cjs.map +1 -1
  627. package/dist/voice/avatar/datastream_io.d.cts +1 -0
  628. package/dist/voice/avatar/datastream_io.d.ts +1 -0
  629. package/dist/voice/avatar/datastream_io.d.ts.map +1 -1
  630. package/dist/voice/avatar/datastream_io.js +7 -1
  631. package/dist/voice/avatar/datastream_io.js.map +1 -1
  632. package/dist/voice/background_audio.cjs +367 -0
  633. package/dist/voice/background_audio.cjs.map +1 -0
  634. package/dist/voice/background_audio.d.cts +123 -0
  635. package/dist/voice/background_audio.d.ts +123 -0
  636. package/dist/voice/background_audio.d.ts.map +1 -0
  637. package/dist/voice/background_audio.js +343 -0
  638. package/dist/voice/background_audio.js.map +1 -0
  639. package/dist/voice/events.cjs +3 -0
  640. package/dist/voice/events.cjs.map +1 -1
  641. package/dist/voice/events.d.cts +16 -9
  642. package/dist/voice/events.d.ts +16 -9
  643. package/dist/voice/events.d.ts.map +1 -1
  644. package/dist/voice/events.js +3 -0
  645. package/dist/voice/events.js.map +1 -1
  646. package/dist/voice/generation.cjs +205 -41
  647. package/dist/voice/generation.cjs.map +1 -1
  648. package/dist/voice/generation.d.cts +21 -5
  649. package/dist/voice/generation.d.ts +21 -5
  650. package/dist/voice/generation.d.ts.map +1 -1
  651. package/dist/voice/generation.js +215 -43
  652. package/dist/voice/generation.js.map +1 -1
  653. package/dist/voice/generation_tools.test.cjs +236 -0
  654. package/dist/voice/generation_tools.test.cjs.map +1 -0
  655. package/dist/voice/generation_tools.test.js +235 -0
  656. package/dist/voice/generation_tools.test.js.map +1 -0
  657. package/dist/voice/index.cjs +33 -2
  658. package/dist/voice/index.cjs.map +1 -1
  659. package/dist/voice/index.d.cts +8 -2
  660. package/dist/voice/index.d.ts +8 -2
  661. package/dist/voice/index.d.ts.map +1 -1
  662. package/dist/voice/index.js +19 -2
  663. package/dist/voice/index.js.map +1 -1
  664. package/dist/voice/interruption_detection.test.cjs +114 -0
  665. package/dist/voice/interruption_detection.test.cjs.map +1 -0
  666. package/dist/voice/interruption_detection.test.js +113 -0
  667. package/dist/voice/interruption_detection.test.js.map +1 -0
  668. package/dist/voice/io.cjs +66 -6
  669. package/dist/voice/io.cjs.map +1 -1
  670. package/dist/voice/io.d.cts +67 -7
  671. package/dist/voice/io.d.ts +67 -7
  672. package/dist/voice/io.d.ts.map +1 -1
  673. package/dist/voice/io.js +62 -5
  674. package/dist/voice/io.js.map +1 -1
  675. package/dist/voice/recorder_io/index.cjs +23 -0
  676. package/dist/voice/recorder_io/index.cjs.map +1 -0
  677. package/dist/voice/recorder_io/index.d.cts +2 -0
  678. package/dist/voice/recorder_io/index.d.ts +2 -0
  679. package/dist/voice/recorder_io/index.d.ts.map +1 -0
  680. package/dist/voice/recorder_io/index.js +2 -0
  681. package/dist/voice/recorder_io/index.js.map +1 -0
  682. package/dist/voice/recorder_io/recorder_io.cjs +607 -0
  683. package/dist/voice/recorder_io/recorder_io.cjs.map +1 -0
  684. package/dist/voice/recorder_io/recorder_io.d.cts +106 -0
  685. package/dist/voice/recorder_io/recorder_io.d.ts +106 -0
  686. package/dist/voice/recorder_io/recorder_io.d.ts.map +1 -0
  687. package/dist/voice/recorder_io/recorder_io.js +573 -0
  688. package/dist/voice/recorder_io/recorder_io.js.map +1 -0
  689. package/dist/voice/remote_session.cjs +922 -0
  690. package/dist/voice/remote_session.cjs.map +1 -0
  691. package/dist/voice/remote_session.d.cts +108 -0
  692. package/dist/voice/remote_session.d.ts +108 -0
  693. package/dist/voice/remote_session.d.ts.map +1 -0
  694. package/dist/voice/remote_session.js +887 -0
  695. package/dist/voice/remote_session.js.map +1 -0
  696. package/dist/voice/report.cjs +88 -0
  697. package/dist/voice/report.cjs.map +1 -0
  698. package/dist/voice/report.d.cts +49 -0
  699. package/dist/voice/report.d.ts +49 -0
  700. package/dist/voice/report.d.ts.map +1 -0
  701. package/dist/voice/report.js +63 -0
  702. package/dist/voice/report.js.map +1 -0
  703. package/dist/voice/report.test.cjs +121 -0
  704. package/dist/voice/report.test.cjs.map +1 -0
  705. package/dist/voice/report.test.js +120 -0
  706. package/dist/voice/report.test.js.map +1 -0
  707. package/dist/voice/room_io/_input.cjs +40 -7
  708. package/dist/voice/room_io/_input.cjs.map +1 -1
  709. package/dist/voice/room_io/_input.d.cts +5 -2
  710. package/dist/voice/room_io/_input.d.ts +5 -2
  711. package/dist/voice/room_io/_input.d.ts.map +1 -1
  712. package/dist/voice/room_io/_input.js +41 -8
  713. package/dist/voice/room_io/_input.js.map +1 -1
  714. package/dist/voice/room_io/_output.cjs +19 -11
  715. package/dist/voice/room_io/_output.cjs.map +1 -1
  716. package/dist/voice/room_io/_output.d.cts +7 -4
  717. package/dist/voice/room_io/_output.d.ts +7 -4
  718. package/dist/voice/room_io/_output.d.ts.map +1 -1
  719. package/dist/voice/room_io/_output.js +20 -12
  720. package/dist/voice/room_io/_output.js.map +1 -1
  721. package/dist/voice/room_io/room_io.cjs +33 -6
  722. package/dist/voice/room_io/room_io.cjs.map +1 -1
  723. package/dist/voice/room_io/room_io.d.cts +29 -9
  724. package/dist/voice/room_io/room_io.d.ts +29 -9
  725. package/dist/voice/room_io/room_io.d.ts.map +1 -1
  726. package/dist/voice/room_io/room_io.js +33 -7
  727. package/dist/voice/room_io/room_io.js.map +1 -1
  728. package/dist/voice/speech_handle.cjs +22 -4
  729. package/dist/voice/speech_handle.cjs.map +1 -1
  730. package/dist/voice/speech_handle.d.cts +17 -2
  731. package/dist/voice/speech_handle.d.ts +17 -2
  732. package/dist/voice/speech_handle.d.ts.map +1 -1
  733. package/dist/voice/speech_handle.js +21 -4
  734. package/dist/voice/speech_handle.js.map +1 -1
  735. package/dist/voice/testing/fake_llm.cjs +127 -0
  736. package/dist/voice/testing/fake_llm.cjs.map +1 -0
  737. package/dist/voice/testing/fake_llm.d.cts +30 -0
  738. package/dist/voice/testing/fake_llm.d.ts +30 -0
  739. package/dist/voice/testing/fake_llm.d.ts.map +1 -0
  740. package/dist/voice/testing/fake_llm.js +103 -0
  741. package/dist/voice/testing/fake_llm.js.map +1 -0
  742. package/dist/voice/testing/index.cjs +57 -0
  743. package/dist/voice/testing/index.cjs.map +1 -0
  744. package/dist/voice/testing/index.d.cts +21 -0
  745. package/dist/voice/testing/index.d.ts +21 -0
  746. package/dist/voice/testing/index.d.ts.map +1 -0
  747. package/dist/voice/testing/index.js +35 -0
  748. package/dist/voice/testing/index.js.map +1 -0
  749. package/dist/voice/testing/run_result.cjs +817 -0
  750. package/dist/voice/testing/run_result.cjs.map +1 -0
  751. package/dist/voice/testing/run_result.d.cts +385 -0
  752. package/dist/voice/testing/run_result.d.ts +385 -0
  753. package/dist/voice/testing/run_result.d.ts.map +1 -0
  754. package/dist/voice/testing/run_result.js +790 -0
  755. package/dist/voice/testing/run_result.js.map +1 -0
  756. package/dist/voice/testing/types.cjs +46 -0
  757. package/dist/voice/testing/types.cjs.map +1 -0
  758. package/dist/voice/testing/types.d.cts +83 -0
  759. package/dist/voice/testing/types.d.ts +83 -0
  760. package/dist/voice/testing/types.d.ts.map +1 -0
  761. package/dist/voice/testing/types.js +19 -0
  762. package/dist/voice/testing/types.js.map +1 -0
  763. package/dist/voice/transcription/synchronizer.cjs +139 -15
  764. package/dist/voice/transcription/synchronizer.cjs.map +1 -1
  765. package/dist/voice/transcription/synchronizer.d.cts +35 -4
  766. package/dist/voice/transcription/synchronizer.d.ts +35 -4
  767. package/dist/voice/transcription/synchronizer.d.ts.map +1 -1
  768. package/dist/voice/transcription/synchronizer.js +143 -16
  769. package/dist/voice/transcription/synchronizer.js.map +1 -1
  770. package/dist/voice/transcription/synchronizer.test.cjs +151 -0
  771. package/dist/voice/transcription/synchronizer.test.cjs.map +1 -0
  772. package/dist/voice/transcription/synchronizer.test.js +150 -0
  773. package/dist/voice/transcription/synchronizer.test.js.map +1 -0
  774. package/dist/voice/turn_config/endpointing.cjs +33 -0
  775. package/dist/voice/turn_config/endpointing.cjs.map +1 -0
  776. package/dist/voice/turn_config/endpointing.d.cts +30 -0
  777. package/dist/voice/turn_config/endpointing.d.ts +30 -0
  778. package/dist/voice/turn_config/endpointing.d.ts.map +1 -0
  779. package/dist/voice/turn_config/endpointing.js +9 -0
  780. package/dist/voice/turn_config/endpointing.js.map +1 -0
  781. package/dist/voice/turn_config/interruption.cjs +37 -0
  782. package/dist/voice/turn_config/interruption.cjs.map +1 -0
  783. package/dist/voice/turn_config/interruption.d.cts +53 -0
  784. package/dist/voice/turn_config/interruption.d.ts +53 -0
  785. package/dist/voice/turn_config/interruption.d.ts.map +1 -0
  786. package/dist/voice/turn_config/interruption.js +13 -0
  787. package/dist/voice/turn_config/interruption.js.map +1 -0
  788. package/dist/voice/turn_config/turn_handling.cjs +35 -0
  789. package/dist/voice/turn_config/turn_handling.cjs.map +1 -0
  790. package/dist/voice/turn_config/turn_handling.d.cts +36 -0
  791. package/dist/voice/turn_config/turn_handling.d.ts +36 -0
  792. package/dist/voice/turn_config/turn_handling.d.ts.map +1 -0
  793. package/dist/voice/turn_config/turn_handling.js +11 -0
  794. package/dist/voice/turn_config/turn_handling.js.map +1 -0
  795. package/dist/voice/turn_config/utils.cjs +157 -0
  796. package/dist/voice/turn_config/utils.cjs.map +1 -0
  797. package/dist/voice/turn_config/utils.d.cts +37 -0
  798. package/dist/voice/turn_config/utils.d.ts +37 -0
  799. package/dist/voice/turn_config/utils.d.ts.map +1 -0
  800. package/dist/voice/turn_config/utils.js +131 -0
  801. package/dist/voice/turn_config/utils.js.map +1 -0
  802. package/dist/voice/turn_config/utils.test.cjs +128 -0
  803. package/dist/voice/turn_config/utils.test.cjs.map +1 -0
  804. package/dist/voice/turn_config/utils.test.js +127 -0
  805. package/dist/voice/turn_config/utils.test.js.map +1 -0
  806. package/dist/voice/utils.cjs +47 -0
  807. package/dist/voice/utils.cjs.map +1 -0
  808. package/dist/voice/utils.d.cts +4 -0
  809. package/dist/voice/utils.d.ts +4 -0
  810. package/dist/voice/utils.d.ts.map +1 -0
  811. package/dist/voice/utils.js +23 -0
  812. package/dist/voice/utils.js.map +1 -0
  813. package/dist/worker.cjs +44 -52
  814. package/dist/worker.cjs.map +1 -1
  815. package/dist/worker.d.cts +18 -8
  816. package/dist/worker.d.ts +18 -8
  817. package/dist/worker.d.ts.map +1 -1
  818. package/dist/worker.js +43 -43
  819. package/dist/worker.js.map +1 -1
  820. package/package.json +35 -13
  821. package/resources/NOTICE +2 -0
  822. package/resources/keyboard-typing.ogg +0 -0
  823. package/resources/keyboard-typing2.ogg +0 -0
  824. package/resources/office-ambience.ogg +0 -0
  825. package/src/_exceptions.ts +5 -0
  826. package/src/audio.ts +132 -1
  827. package/src/beta/index.ts +9 -0
  828. package/src/beta/workflows/index.ts +9 -0
  829. package/src/beta/workflows/task_group.ts +203 -0
  830. package/src/cli.ts +57 -66
  831. package/src/connection_pool.test.ts +346 -0
  832. package/src/connection_pool.ts +307 -0
  833. package/src/constants.ts +14 -0
  834. package/src/cpu.test.ts +239 -0
  835. package/src/cpu.ts +173 -0
  836. package/src/http_server.ts +18 -6
  837. package/src/index.ts +15 -13
  838. package/src/inference/api_protos.ts +85 -2
  839. package/src/inference/index.ts +32 -4
  840. package/src/inference/interruption/defaults.ts +51 -0
  841. package/src/inference/interruption/errors.ts +25 -0
  842. package/src/inference/interruption/http_transport.ts +207 -0
  843. package/src/inference/interruption/interruption_cache_entry.ts +50 -0
  844. package/src/inference/interruption/interruption_detector.ts +204 -0
  845. package/src/inference/interruption/interruption_stream.ts +467 -0
  846. package/src/inference/interruption/types.ts +84 -0
  847. package/src/inference/interruption/utils.test.ts +132 -0
  848. package/src/inference/interruption/utils.ts +137 -0
  849. package/src/inference/interruption/ws_transport.ts +416 -0
  850. package/src/inference/llm.ts +214 -163
  851. package/src/inference/stt.test.ts +253 -0
  852. package/src/inference/stt.ts +449 -208
  853. package/src/inference/tts.test.ts +354 -0
  854. package/src/inference/tts.ts +417 -115
  855. package/src/inference/utils.ts +30 -2
  856. package/src/ipc/inference_proc_executor.ts +11 -3
  857. package/src/ipc/inference_proc_lazy_main.ts +13 -1
  858. package/src/ipc/job_proc_executor.ts +11 -1
  859. package/src/ipc/job_proc_lazy_main.ts +86 -20
  860. package/src/ipc/supervised_proc.test.ts +153 -0
  861. package/src/ipc/supervised_proc.ts +39 -10
  862. package/src/job.ts +120 -1
  863. package/src/language.test.ts +62 -0
  864. package/src/language.ts +380 -0
  865. package/src/llm/__snapshots__/zod-utils.test.ts.snap +559 -0
  866. package/src/llm/chat_context.test.ts +787 -0
  867. package/src/llm/chat_context.ts +493 -2
  868. package/src/llm/fallback_adapter.test.ts +238 -0
  869. package/src/llm/fallback_adapter.ts +394 -0
  870. package/src/llm/index.ts +13 -0
  871. package/src/llm/llm.ts +77 -12
  872. package/src/llm/provider_format/google.test.ts +72 -1
  873. package/src/llm/provider_format/google.ts +10 -6
  874. package/src/llm/provider_format/index.ts +7 -2
  875. package/src/llm/provider_format/openai.test.ts +480 -2
  876. package/src/llm/provider_format/openai.ts +152 -21
  877. package/src/llm/provider_format/utils.ts +11 -5
  878. package/src/llm/realtime.ts +23 -2
  879. package/src/llm/remote_chat_context.ts +2 -2
  880. package/src/llm/tool_context.test.ts +210 -1
  881. package/src/llm/tool_context.ts +115 -17
  882. package/src/llm/utils.test.ts +103 -2
  883. package/src/llm/utils.ts +152 -16
  884. package/src/llm/zod-utils.test.ts +577 -0
  885. package/src/llm/zod-utils.ts +153 -0
  886. package/src/log.ts +71 -19
  887. package/src/metrics/base.ts +78 -19
  888. package/src/metrics/index.ts +12 -0
  889. package/src/metrics/model_usage.test.ts +545 -0
  890. package/src/metrics/model_usage.ts +262 -0
  891. package/src/metrics/usage_collector.ts +14 -3
  892. package/src/metrics/utils.ts +27 -7
  893. package/src/stream/deferred_stream.test.ts +3 -3
  894. package/src/stream/deferred_stream.ts +43 -11
  895. package/src/stream/index.ts +1 -0
  896. package/src/stream/multi_input_stream.test.ts +545 -0
  897. package/src/stream/multi_input_stream.ts +172 -0
  898. package/src/stream/stream_channel.test.ts +37 -0
  899. package/src/stream/stream_channel.ts +43 -3
  900. package/src/stt/stream_adapter.ts +30 -9
  901. package/src/stt/stt.ts +140 -23
  902. package/src/telemetry/index.ts +28 -0
  903. package/src/telemetry/logging.ts +55 -0
  904. package/src/telemetry/otel_http_exporter.ts +218 -0
  905. package/src/telemetry/pino_otel_transport.ts +265 -0
  906. package/src/telemetry/trace_types.ts +109 -0
  907. package/src/telemetry/traces.ts +673 -0
  908. package/src/telemetry/utils.ts +61 -0
  909. package/src/tokenize/basic/sentence.ts +3 -3
  910. package/src/tokenize/tokenizer.test.ts +4 -0
  911. package/src/transcription.ts +6 -0
  912. package/src/tts/fallback_adapter.ts +586 -0
  913. package/src/tts/index.ts +1 -0
  914. package/src/tts/stream_adapter.ts +38 -8
  915. package/src/tts/tts.ts +245 -62
  916. package/src/typed_promise.ts +67 -0
  917. package/src/types.ts +62 -33
  918. package/src/utils.test.ts +90 -10
  919. package/src/utils.ts +178 -33
  920. package/src/vad.ts +42 -18
  921. package/src/version.ts +1 -1
  922. package/src/voice/agent.test.ts +347 -2
  923. package/src/voice/agent.ts +346 -44
  924. package/src/voice/agent_activity.test.ts +194 -0
  925. package/src/voice/agent_activity.ts +1457 -388
  926. package/src/voice/agent_session.ts +817 -112
  927. package/src/voice/audio_recognition.ts +845 -70
  928. package/src/voice/audio_recognition_span.test.ts +341 -0
  929. package/src/voice/avatar/datastream_io.ts +9 -1
  930. package/src/voice/background_audio.ts +494 -0
  931. package/src/voice/events.ts +27 -7
  932. package/src/voice/generation.ts +310 -56
  933. package/src/voice/generation_tools.test.ts +268 -0
  934. package/src/voice/index.ts +17 -3
  935. package/src/voice/interruption_detection.test.ts +151 -0
  936. package/src/voice/io.ts +115 -12
  937. package/src/voice/recorder_io/index.ts +4 -0
  938. package/src/voice/recorder_io/recorder_io.ts +783 -0
  939. package/src/voice/remote_session.ts +1083 -0
  940. package/src/voice/report.test.ts +136 -0
  941. package/src/voice/report.ts +140 -0
  942. package/src/voice/room_io/_input.ts +45 -10
  943. package/src/voice/room_io/_output.ts +26 -14
  944. package/src/voice/room_io/room_io.ts +67 -22
  945. package/src/voice/speech_handle.ts +38 -6
  946. package/src/voice/testing/fake_llm.ts +138 -0
  947. package/src/voice/testing/index.ts +52 -0
  948. package/src/voice/testing/run_result.ts +995 -0
  949. package/src/voice/testing/types.ts +118 -0
  950. package/src/voice/transcription/synchronizer.test.ts +206 -0
  951. package/src/voice/transcription/synchronizer.ts +204 -19
  952. package/src/voice/turn_config/endpointing.ts +33 -0
  953. package/src/voice/turn_config/interruption.ts +56 -0
  954. package/src/voice/turn_config/turn_handling.ts +45 -0
  955. package/src/voice/turn_config/utils.test.ts +148 -0
  956. package/src/voice/turn_config/utils.ts +167 -0
  957. package/src/voice/utils.ts +29 -0
  958. package/src/worker.ts +92 -78
  959. package/src/llm/__snapshots__/utils.test.ts.snap +0 -65
@@ -18,26 +18,37 @@ var __copyProps = (to, from, except, desc) => {
18
18
  var __toCommonJS = (mod) => __copyProps(__defProp({}, "__esModule", { value: true }), mod);
19
19
  var agent_session_exports = {};
20
20
  __export(agent_session_exports, {
21
- AgentSession: () => AgentSession
21
+ AgentSession: () => AgentSession,
22
+ defaultAgentSessionOptions: () => defaultAgentSessionOptions
22
23
  });
23
24
  module.exports = __toCommonJS(agent_session_exports);
25
+ var import_mutex = require("@livekit/mutex");
26
+ var import_api = require("@opentelemetry/api");
24
27
  var import_node_events = require("node:events");
25
28
  var import_inference = require("../inference/index.cjs");
26
29
  var import_job = require("../job.cjs");
27
30
  var import_chat_context = require("../llm/chat_context.cjs");
28
31
  var import_log = require("../log.cjs");
32
+ var import_model_usage = require("../metrics/model_usage.cjs");
33
+ var import_telemetry = require("../telemetry/index.cjs");
34
+ var import_types = require("../types.cjs");
35
+ var import_utils = require("../utils.cjs");
29
36
  var import_agent_activity = require("./agent_activity.cjs");
30
37
  var import_events = require("./events.cjs");
31
38
  var import_io = require("./io.cjs");
39
+ var import_recorder_io = require("./recorder_io/index.cjs");
40
+ var import_remote_session = require("./remote_session.cjs");
32
41
  var import_room_io = require("./room_io/index.cjs");
33
- const defaultVoiceOptions = {
34
- allowInterruptions: true,
35
- discardAudioIfUninterruptible: true,
36
- minInterruptionDuration: 500,
37
- minInterruptionWords: 0,
38
- minEndpointingDelay: 500,
39
- maxEndpointingDelay: 6e3,
40
- maxToolSteps: 3
42
+ var import_run_result = require("./testing/run_result.cjs");
43
+ var import_utils2 = require("./turn_config/utils.cjs");
44
+ var import_utils3 = require("./utils.cjs");
45
+ const defaultAgentSessionOptions = {
46
+ maxToolSteps: 3,
47
+ preemptiveGeneration: true,
48
+ userAwayTimeout: 15,
49
+ aecWarmupDuration: 3e3,
50
+ turnHandling: {},
51
+ useTtsAlignedTranscript: true
41
52
  };
42
53
  class AgentSession extends import_node_events.EventEmitter {
43
54
  vad;
@@ -45,53 +56,97 @@ class AgentSession extends import_node_events.EventEmitter {
45
56
  llm;
46
57
  tts;
47
58
  turnDetection;
59
+ /** @deprecated use {@link sessionOptions } instead */
48
60
  options;
61
+ sessionOptions;
62
+ activityLock = new import_mutex.Mutex();
49
63
  agent;
50
64
  activity;
51
65
  nextActivity;
66
+ updateActivityTask;
52
67
  started = false;
53
- userState = "listening";
54
- roomIO;
55
- logger = (0, import_log.log)();
68
+ sessionHost;
56
69
  _chatCtx;
57
70
  _userData;
71
+ _userState = "listening";
58
72
  _agentState = "initializing";
59
73
  _input;
60
74
  _output;
61
75
  closingTask = null;
62
- constructor(opts) {
76
+ userAwayTimer = null;
77
+ _aecWarmupTimer = null;
78
+ // Connection options for STT, LLM, and TTS
79
+ _connOptions;
80
+ // Unrecoverable error counts, reset after agent speaking
81
+ llmErrorCounts = 0;
82
+ ttsErrorCounts = 0;
83
+ sessionSpan;
84
+ agentSpeakingSpan;
85
+ _interruptionDetection;
86
+ /** @internal */
87
+ _usageCollector = new import_model_usage.ModelUsageCollector();
88
+ /** @internal */
89
+ _roomIO;
90
+ /** @internal */
91
+ _aecWarmupRemaining = 0;
92
+ /** @internal */
93
+ _recorderIO;
94
+ /** @internal */
95
+ rootSpanContext;
96
+ /** @internal */
97
+ _recordedEvents = [];
98
+ /** @internal */
99
+ _enableRecording = false;
100
+ /** @internal - Timestamp when the session started (milliseconds) */
101
+ _startedAt;
102
+ /** @internal - Current run state for testing */
103
+ _globalRunState;
104
+ /** @internal */
105
+ _userSpeakingSpan;
106
+ logger = (0, import_log.log)();
107
+ constructor(options) {
108
+ var _a;
63
109
  super();
64
- const {
65
- vad,
66
- stt,
67
- llm,
68
- tts,
69
- turnDetection,
70
- userData,
71
- voiceOptions = defaultVoiceOptions
72
- } = opts;
110
+ const { agentSessionOptions: opts, legacyVoiceOptions } = (0, import_utils2.migrateLegacyOptions)(options);
111
+ const { vad, stt, llm, tts, userData, connOptions, ...resolvedSessionOptions } = opts;
112
+ this._connOptions = {
113
+ sttConnOptions: { ...import_types.DEFAULT_API_CONNECT_OPTIONS, ...connOptions == null ? void 0 : connOptions.sttConnOptions },
114
+ llmConnOptions: { ...import_types.DEFAULT_API_CONNECT_OPTIONS, ...connOptions == null ? void 0 : connOptions.llmConnOptions },
115
+ ttsConnOptions: { ...import_types.DEFAULT_API_CONNECT_OPTIONS, ...connOptions == null ? void 0 : connOptions.ttsConnOptions },
116
+ maxUnrecoverableErrors: (connOptions == null ? void 0 : connOptions.maxUnrecoverableErrors) ?? import_types.DEFAULT_SESSION_CONNECT_OPTIONS.maxUnrecoverableErrors
117
+ };
73
118
  this.vad = vad;
74
119
  if (typeof stt === "string") {
75
- this.stt = new import_inference.STT({ model: stt });
120
+ this.stt = import_inference.STT.fromModelString(stt);
76
121
  } else {
77
122
  this.stt = stt;
78
123
  }
79
124
  if (typeof llm === "string") {
80
- this.llm = new import_inference.LLM({ model: llm });
125
+ this.llm = import_inference.LLM.fromModelString(llm);
81
126
  } else {
82
127
  this.llm = llm;
83
128
  }
84
129
  if (typeof tts === "string") {
85
- this.tts = new import_inference.TTS({ model: tts });
130
+ this.tts = import_inference.TTS.fromModelString(tts);
86
131
  } else {
87
132
  this.tts = tts;
88
133
  }
89
- this.turnDetection = turnDetection;
134
+ this.turnDetection = resolvedSessionOptions.turnHandling.turnDetection;
135
+ this._interruptionDetection = (_a = resolvedSessionOptions.turnHandling.interruption) == null ? void 0 : _a.mode;
90
136
  this._userData = userData;
91
137
  this._input = new import_io.AgentInput(this.onAudioInputChanged);
92
138
  this._output = new import_io.AgentOutput(this.onAudioOutputChanged, this.onTextOutputChanged);
93
139
  this._chatCtx = import_chat_context.ChatContext.empty();
94
- this.options = { ...defaultVoiceOptions, ...voiceOptions };
140
+ this.sessionOptions = resolvedSessionOptions;
141
+ this.options = legacyVoiceOptions;
142
+ this._aecWarmupRemaining = this.sessionOptions.aecWarmupDuration ?? 0;
143
+ this._onUserInputTranscribed = this._onUserInputTranscribed.bind(this);
144
+ this.on(import_events.AgentSessionEventTypes.UserInputTranscribed, this._onUserInputTranscribed);
145
+ }
146
+ emit(event, ...args) {
147
+ const eventData = args[0];
148
+ this._recordedEvents.push(eventData);
149
+ return super.emit(event, ...args);
95
150
  }
96
151
  get input() {
97
152
  return this._input;
@@ -108,48 +163,100 @@ class AgentSession extends import_node_events.EventEmitter {
108
163
  get history() {
109
164
  return this._chatCtx;
110
165
  }
166
+ /** Connection options for STT, LLM, and TTS. */
167
+ get connOptions() {
168
+ return this._connOptions;
169
+ }
170
+ get interruptionDetection() {
171
+ return this._interruptionDetection;
172
+ }
173
+ /**
174
+ * Returns usage summaries for this session, one per model/provider combination.
175
+ */
176
+ get usage() {
177
+ return { modelUsage: this._usageCollector.flatten().map(import_model_usage.filterZeroValues) };
178
+ }
179
+ get useTtsAlignedTranscript() {
180
+ return this.sessionOptions.useTtsAlignedTranscript;
181
+ }
111
182
  set userData(value) {
112
183
  this._userData = value;
113
184
  }
114
- async start({
185
+ async _startImpl({
115
186
  agent,
116
187
  room,
117
188
  inputOptions,
118
- outputOptions
189
+ outputOptions,
190
+ span
119
191
  }) {
120
- if (this.started) {
121
- return;
122
- }
192
+ span.setAttribute(import_telemetry.traceTypes.ATTR_AGENT_LABEL, agent.id);
123
193
  this.agent = agent;
124
194
  this._updateAgentState("initializing");
125
195
  const tasks = [];
126
- if (this.input.audio && (inputOptions == null ? void 0 : inputOptions.audioEnabled) !== false) {
127
- this.logger.warn("RoomIO audio input is enabled but input.audio is already set, ignoring..");
128
- }
129
- if (this.output.audio && (outputOptions == null ? void 0 : outputOptions.audioEnabled) !== false) {
130
- this.logger.warn(
131
- "RoomIO audio output is enabled but output.audio is already set, ignoring.."
132
- );
196
+ if (room && !this._roomIO) {
197
+ if (this.input.audio && (inputOptions == null ? void 0 : inputOptions.audioEnabled) !== false) {
198
+ this.logger.warn(
199
+ "RoomIO audio input is enabled but input.audio is already set, ignoring.."
200
+ );
201
+ }
202
+ if (this.output.audio && (outputOptions == null ? void 0 : outputOptions.audioEnabled) !== false) {
203
+ this.logger.warn(
204
+ "RoomIO audio output is enabled but output.audio is already set, ignoring.."
205
+ );
206
+ }
207
+ if (this.output.transcription && (outputOptions == null ? void 0 : outputOptions.transcriptionEnabled) !== false) {
208
+ this.logger.warn(
209
+ "RoomIO transcription output is enabled but output.transcription is already set, ignoring.."
210
+ );
211
+ }
212
+ this._roomIO = new import_room_io.RoomIO({
213
+ agentSession: this,
214
+ room,
215
+ inputOptions,
216
+ outputOptions
217
+ });
218
+ this._roomIO.start();
219
+ const transport = new import_remote_session.RoomSessionTransport(room, this._roomIO);
220
+ this.sessionHost = new import_remote_session.SessionHost(transport);
221
+ this.sessionHost.registerSession(this);
222
+ if ((inputOptions == null ? void 0 : inputOptions.textEnabled) !== false) {
223
+ this.sessionHost.registerTextInput(
224
+ (inputOptions == null ? void 0 : inputOptions.textInputCallback) ?? import_room_io.DEFAULT_TEXT_INPUT_CALLBACK
225
+ );
226
+ }
133
227
  }
134
- if (this.output.transcription && (outputOptions == null ? void 0 : outputOptions.transcriptionEnabled) !== false) {
135
- this.logger.warn(
136
- "RoomIO transcription output is enabled but output.transcription is already set, ignoring.."
137
- );
228
+ let ctx = void 0;
229
+ try {
230
+ ctx = (0, import_job.getJobContext)();
231
+ } catch {
138
232
  }
139
- this.roomIO = new import_room_io.RoomIO({
140
- agentSession: this,
141
- room,
142
- inputOptions,
143
- outputOptions
144
- });
145
- this.roomIO.start();
146
- const ctx = (0, import_job.getJobContext)();
147
- if (ctx && ctx.room === room && !room.isConnected) {
148
- this.logger.debug("Auto-connecting to room via job context");
149
- tasks.push(ctx.connect());
233
+ if (ctx) {
234
+ if (room && ctx.room === room && !room.isConnected) {
235
+ this.logger.debug("Auto-connecting to room via job context");
236
+ tasks.push(ctx.connect());
237
+ }
238
+ if (ctx._primaryAgentSession === void 0) {
239
+ ctx._primaryAgentSession = this;
240
+ } else if (this._enableRecording) {
241
+ throw new Error(
242
+ "Only one `AgentSession` can be the primary at a time. If you want to ignore primary designation, use `session.start({ record: false })`."
243
+ );
244
+ }
245
+ if (this.input.audio && this.output.audio && this._enableRecording) {
246
+ this._recorderIO = new import_recorder_io.RecorderIO({ agentSession: this });
247
+ this.input.audio = this._recorderIO.recordInput(this.input.audio);
248
+ this.output.audio = this._recorderIO.recordOutput(this.output.audio);
249
+ const sessionDir = ctx.sessionDirectory;
250
+ if (sessionDir) {
251
+ tasks.push(this._recorderIO.start(`${sessionDir}/audio.ogg`));
252
+ }
253
+ }
150
254
  }
151
- tasks.push(this.updateActivity(this.agent));
255
+ tasks.push(this._updateActivity(this.agent, { waitOnEnter: false }));
152
256
  await Promise.allSettled(tasks);
257
+ if (this.sessionHost) {
258
+ await this.sessionHost.start();
259
+ }
153
260
  this.logger.debug(
154
261
  `using audio io: ${this.input.audio ? "`" + this.input.audio.constructor.name + "`" : "(none)"} -> \`AgentSession\` -> ${this.output.audio ? "`" + this.output.audio.constructor.name + "`" : "(none)"}`
155
262
  );
@@ -157,12 +264,70 @@ class AgentSession extends import_node_events.EventEmitter {
157
264
  `using transcript io: \`AgentSession\` -> ${this.output.transcription ? "`" + this.output.transcription.constructor.name + "`" : "(none)"}`
158
265
  );
159
266
  this.started = true;
267
+ this._startedAt = Date.now();
160
268
  this._updateAgentState("listening");
161
269
  }
270
+ async start({
271
+ agent,
272
+ room,
273
+ inputOptions,
274
+ outputOptions,
275
+ record
276
+ }) {
277
+ if (this.started) {
278
+ return;
279
+ }
280
+ this._usageCollector = new import_model_usage.ModelUsageCollector();
281
+ let ctx = void 0;
282
+ try {
283
+ ctx = (0, import_job.getJobContext)();
284
+ if (record === void 0) {
285
+ record = ctx.job.enableRecording;
286
+ }
287
+ this._enableRecording = record;
288
+ if (this._enableRecording) {
289
+ ctx.initRecording();
290
+ }
291
+ } catch (error) {
292
+ this.logger.warn("JobContext is not available");
293
+ }
294
+ this.sessionSpan = import_telemetry.tracer.startSpan({
295
+ name: "agent_session",
296
+ context: import_api.ROOT_CONTEXT
297
+ });
298
+ this.rootSpanContext = import_api.trace.setSpan(import_api.ROOT_CONTEXT, this.sessionSpan);
299
+ await this._startImpl({
300
+ agent,
301
+ room,
302
+ inputOptions,
303
+ outputOptions,
304
+ span: this.sessionSpan
305
+ });
306
+ }
162
307
  updateAgent(agent) {
163
308
  this.agent = agent;
164
- if (this.started) {
165
- this.updateActivity(agent);
309
+ if (!this.started) {
310
+ return;
311
+ }
312
+ const _updateActivityTask = async (oldTask2, agent2) => {
313
+ if (oldTask2) {
314
+ try {
315
+ await oldTask2.result;
316
+ } catch (error) {
317
+ this.logger.error(error, "previous updateAgent transition failed");
318
+ }
319
+ }
320
+ await this._updateActivity(agent2);
321
+ };
322
+ const oldTask = this.updateActivityTask;
323
+ this.updateActivityTask = import_utils.Task.from(
324
+ async () => _updateActivityTask(oldTask, agent),
325
+ void 0,
326
+ "AgentSession_updateActivityTask"
327
+ );
328
+ const runState = this._globalRunState;
329
+ if (runState) {
330
+ runState._watchHandle(this.updateActivityTask);
166
331
  }
167
332
  }
168
333
  commitUserTurn() {
@@ -181,13 +346,36 @@ class AgentSession extends import_node_events.EventEmitter {
181
346
  if (!this.activity) {
182
347
  throw new Error("AgentSession is not running");
183
348
  }
184
- return this.activity.say(text, options);
349
+ const doSay = (activity, nextActivity) => {
350
+ if (activity.schedulingPaused) {
351
+ if (!nextActivity) {
352
+ throw new Error("AgentSession is closing, cannot use say()");
353
+ }
354
+ return nextActivity.say(text, options);
355
+ }
356
+ return activity.say(text, options);
357
+ };
358
+ const runState = this._globalRunState;
359
+ let handle;
360
+ const activeSpan = import_api.trace.getActiveSpan();
361
+ if (!activeSpan && this.rootSpanContext) {
362
+ handle = import_api.context.with(
363
+ this.rootSpanContext,
364
+ () => doSay(this.activity, this.nextActivity)
365
+ );
366
+ } else {
367
+ handle = doSay(this.activity, this.nextActivity);
368
+ }
369
+ if (runState) {
370
+ runState._watchHandle(handle);
371
+ }
372
+ return handle;
185
373
  }
186
- interrupt() {
374
+ interrupt(options) {
187
375
  if (!this.activity) {
188
376
  throw new Error("AgentSession is not running");
189
377
  }
190
- return this.activity.interrupt();
378
+ return this.activity.interrupt(options);
191
379
  }
192
380
  generateReply(options) {
193
381
  if (!this.activity) {
@@ -197,26 +385,142 @@ class AgentSession extends import_node_events.EventEmitter {
197
385
  role: "user",
198
386
  content: options.userInput
199
387
  }) : void 0;
200
- if (this.activity.draining) {
201
- if (!this.nextActivity) {
202
- throw new Error("AgentSession is closing, cannot use generateReply()");
388
+ const doGenerateReply = (activity, nextActivity) => {
389
+ if (activity.schedulingPaused) {
390
+ if (!nextActivity) {
391
+ throw new Error("AgentSession is closing, cannot use generateReply()");
392
+ }
393
+ return nextActivity.generateReply({ userMessage, ...options });
203
394
  }
204
- return this.nextActivity.generateReply({ userMessage, ...options });
395
+ return activity.generateReply({ userMessage, ...options });
396
+ };
397
+ const activeSpan = import_api.trace.getActiveSpan();
398
+ let handle;
399
+ if (!activeSpan && this.rootSpanContext) {
400
+ handle = import_api.context.with(
401
+ this.rootSpanContext,
402
+ () => doGenerateReply(this.activity, this.nextActivity)
403
+ );
404
+ } else {
405
+ handle = doGenerateReply(this.activity, this.nextActivity);
406
+ }
407
+ if (this._globalRunState) {
408
+ this._globalRunState._watchHandle(handle);
205
409
  }
206
- return this.activity.generateReply({ userMessage, ...options });
410
+ return handle;
207
411
  }
208
- async updateActivity(agent) {
209
- this.nextActivity = new import_agent_activity.AgentActivity(agent, this);
210
- if (this.activity) {
211
- await this.activity.drain();
212
- await this.activity.close();
412
+ /**
413
+ * Run a test with user input and return a result for assertions.
414
+ *
415
+ * This method is primarily used for testing agent behavior without
416
+ * requiring a real room connection.
417
+ *
418
+ * @example
419
+ * ```typescript
420
+ * const result = await session.run({ userInput: 'Hello' });
421
+ * result.expect.nextEvent().isMessage({ role: 'assistant' });
422
+ * result.expect.noMoreEvents();
423
+ * ```
424
+ *
425
+ * @param options - Run options including user input and optional output type
426
+ * @returns A RunResult that resolves when the agent finishes responding
427
+ */
428
+ run({
429
+ userInput,
430
+ outputType
431
+ }) {
432
+ if (this._globalRunState && !this._globalRunState.done()) {
433
+ throw new Error("nested runs are not supported");
213
434
  }
214
- this.activity = this.nextActivity;
215
- this.nextActivity = void 0;
216
- await this.activity.start();
217
- if (this._input.audio) {
218
- this.activity.attachAudioInput(this._input.audio.stream);
435
+ const runState = new import_run_result.RunResult({
436
+ userInput,
437
+ outputType
438
+ });
439
+ this._globalRunState = runState;
440
+ (async () => {
441
+ try {
442
+ const unlock = await this.activityLock.lock();
443
+ unlock();
444
+ this.generateReply({ userInput });
445
+ } catch (e) {
446
+ runState._reject(e instanceof Error ? e : new Error(String(e)));
447
+ }
448
+ })();
449
+ return runState;
450
+ }
451
+ /** @internal */
452
+ async _updateActivity(agent, options = {}) {
453
+ const { previousActivity = "close", newActivity = "start", blockedTasks = [] } = options;
454
+ const waitOnEnter = options.waitOnEnter ?? newActivity === "start";
455
+ const runWithContext = async () => {
456
+ const unlock = await this.activityLock.lock();
457
+ let onEnterTask;
458
+ try {
459
+ this.agent = agent;
460
+ const prevActivityObj = this.activity;
461
+ if (newActivity === "start") {
462
+ const prevAgent = prevActivityObj == null ? void 0 : prevActivityObj.agent;
463
+ if (agent._agentActivity && // allow updating the same agent that is running
464
+ (agent !== prevAgent || previousActivity !== "close")) {
465
+ throw new Error("Cannot start agent: an activity is already running");
466
+ }
467
+ this.nextActivity = new import_agent_activity.AgentActivity(agent, this);
468
+ } else if (newActivity === "resume") {
469
+ if (!agent._agentActivity) {
470
+ throw new Error("Cannot resume agent: no existing activity to resume");
471
+ }
472
+ this.nextActivity = agent._agentActivity;
473
+ }
474
+ if (prevActivityObj && prevActivityObj !== this.nextActivity) {
475
+ if (previousActivity === "pause") {
476
+ await prevActivityObj.pause({ blockedTasks });
477
+ } else {
478
+ await prevActivityObj.drain();
479
+ await prevActivityObj.close();
480
+ }
481
+ }
482
+ this.activity = this.nextActivity;
483
+ this.nextActivity = void 0;
484
+ const runState = this._globalRunState;
485
+ const handoffItem = new import_chat_context.AgentHandoffItem({
486
+ oldAgentId: prevActivityObj == null ? void 0 : prevActivityObj.agent.id,
487
+ newAgentId: agent.id
488
+ });
489
+ if (runState) {
490
+ runState._agentHandoff({
491
+ item: handoffItem,
492
+ oldAgent: prevActivityObj == null ? void 0 : prevActivityObj.agent,
493
+ newAgent: this.activity.agent
494
+ });
495
+ }
496
+ this._chatCtx.insert(handoffItem);
497
+ this.logger.debug(
498
+ { previousAgentId: prevActivityObj == null ? void 0 : prevActivityObj.agent.id, newAgentId: agent.id },
499
+ "Agent handoff inserted into chat context"
500
+ );
501
+ if (newActivity === "start") {
502
+ await this.activity.start();
503
+ } else {
504
+ await this.activity.resume();
505
+ }
506
+ onEnterTask = this.activity._onEnterTask;
507
+ if (this._input.audio) {
508
+ this.activity.attachAudioInput(this._input.audio.stream);
509
+ }
510
+ } finally {
511
+ unlock();
512
+ }
513
+ if (waitOnEnter) {
514
+ if (!onEnterTask) {
515
+ throw new Error("expected onEnter task to be available while waitOnEnter=true");
516
+ }
517
+ await onEnterTask.result;
518
+ }
519
+ };
520
+ if (this.rootSpanContext) {
521
+ return import_api.context.with(this.rootSpanContext, runWithContext);
219
522
  }
523
+ return runWithContext();
220
524
  }
221
525
  get chatCtx() {
222
526
  return this._chatCtx.copy();
@@ -224,6 +528,9 @@ class AgentSession extends import_node_events.EventEmitter {
224
528
  get agentState() {
225
529
  return this._agentState;
226
530
  }
531
+ get userState() {
532
+ return this._userState;
533
+ }
227
534
  get currentAgent() {
228
535
  if (!this.agent) {
229
536
  throw new Error("AgentSession is not running");
@@ -233,6 +540,13 @@ class AgentSession extends import_node_events.EventEmitter {
233
540
  async close() {
234
541
  await this.closeImpl(import_events.CloseReason.USER_INITIATED);
235
542
  }
543
+ shutdown(options) {
544
+ const { drain = true, reason = import_events.CloseReason.USER_INITIATED } = options ?? {};
545
+ this._closeSoon({
546
+ reason,
547
+ drain
548
+ });
549
+ }
236
550
  /** @internal */
237
551
  _closeSoon({
238
552
  reason,
@@ -242,14 +556,30 @@ class AgentSession extends import_node_events.EventEmitter {
242
556
  if (this.closingTask) {
243
557
  return;
244
558
  }
245
- this.closeImpl(reason, error, drain);
559
+ this.closingTask = this.closeImpl(reason, error, drain).finally(() => {
560
+ this.closingTask = null;
561
+ });
246
562
  }
247
563
  /** @internal */
248
564
  _onError(error) {
249
565
  if (this.closingTask || error.recoverable) {
250
566
  return;
251
567
  }
252
- this.logger.error(error, "AgentSession is closing due to unrecoverable error");
568
+ if (error.type === "llm_error") {
569
+ this.llmErrorCounts += 1;
570
+ if (this.llmErrorCounts <= this._connOptions.maxUnrecoverableErrors) {
571
+ return;
572
+ }
573
+ } else if (error.type === "tts_error") {
574
+ this.ttsErrorCounts += 1;
575
+ if (this.ttsErrorCounts <= this._connOptions.maxUnrecoverableErrors) {
576
+ return;
577
+ }
578
+ } else if (error.type === "interruption_detection_error") {
579
+ this.logger.error(error.toString());
580
+ return;
581
+ }
582
+ this.logger.error(error, "AgentSession is closing due to an unrecoverable error");
253
583
  this.closingTask = (async () => {
254
584
  await this.closeImpl(import_events.CloseReason.ERROR, error);
255
585
  })().then(() => {
@@ -262,24 +592,79 @@ class AgentSession extends import_node_events.EventEmitter {
262
592
  this.emit(import_events.AgentSessionEventTypes.ConversationItemAdded, (0, import_events.createConversationItemAddedEvent)(item));
263
593
  }
264
594
  /** @internal */
265
- _updateAgentState(state) {
595
+ _toolItemsAdded(items) {
596
+ this._chatCtx.insert(items);
597
+ }
598
+ /** @internal */
599
+ _updateAgentState(state, options) {
600
+ var _a;
266
601
  if (this._agentState === state) {
267
602
  return;
268
603
  }
604
+ if (state === "speaking") {
605
+ this.llmErrorCounts = 0;
606
+ this.ttsErrorCounts = 0;
607
+ if (this.agentSpeakingSpan === void 0) {
608
+ this.agentSpeakingSpan = import_telemetry.tracer.startSpan({
609
+ name: "agent_speaking",
610
+ context: (options == null ? void 0 : options.otelContext) ?? this.rootSpanContext,
611
+ startTime: options == null ? void 0 : options.startTime
612
+ });
613
+ const localParticipant = (_a = this._roomIO) == null ? void 0 : _a.localParticipant;
614
+ if (localParticipant) {
615
+ (0, import_utils3.setParticipantSpanAttributes)(this.agentSpeakingSpan, localParticipant);
616
+ }
617
+ }
618
+ } else if (this.agentSpeakingSpan !== void 0) {
619
+ this.agentSpeakingSpan.end();
620
+ this.agentSpeakingSpan = void 0;
621
+ }
622
+ if (state === "speaking" && this._aecWarmupRemaining > 0 && this._aecWarmupTimer === null) {
623
+ this._aecWarmupTimer = setTimeout(() => this._onAecWarmupExpired(), this._aecWarmupRemaining);
624
+ this.logger.debug(
625
+ { warmupDurationMs: this._aecWarmupRemaining },
626
+ "aec warmup active, disabling interruptions"
627
+ );
628
+ }
269
629
  const oldState = this._agentState;
270
630
  this._agentState = state;
631
+ if (state === "listening" && this._userState === "listening") {
632
+ this._setUserAwayTimer();
633
+ } else {
634
+ this._cancelUserAwayTimer();
635
+ }
271
636
  this.emit(
272
637
  import_events.AgentSessionEventTypes.AgentStateChanged,
273
638
  (0, import_events.createAgentStateChangedEvent)(oldState, state)
274
639
  );
275
640
  }
276
641
  /** @internal */
277
- _updateUserState(state) {
278
- if (this.userState === state) {
642
+ _updateUserState(state, options) {
643
+ var _a;
644
+ if (this._userState === state) {
279
645
  return;
280
646
  }
281
- const oldState = this.userState;
282
- this.userState = state;
647
+ if (state === "speaking" && this._userSpeakingSpan === void 0) {
648
+ this._userSpeakingSpan = import_telemetry.tracer.startSpan({
649
+ name: "user_speaking",
650
+ context: (options == null ? void 0 : options.otelContext) ?? this.rootSpanContext,
651
+ startTime: options == null ? void 0 : options.lastSpeakingTime
652
+ });
653
+ const linked = (_a = this._roomIO) == null ? void 0 : _a.linkedParticipant;
654
+ if (linked) {
655
+ (0, import_utils3.setParticipantSpanAttributes)(this._userSpeakingSpan, linked);
656
+ }
657
+ } else if (this._userSpeakingSpan !== void 0) {
658
+ this._userSpeakingSpan.end(options == null ? void 0 : options.lastSpeakingTime);
659
+ this._userSpeakingSpan = void 0;
660
+ }
661
+ const oldState = this._userState;
662
+ this._userState = state;
663
+ if (state === "listening" && this._agentState === "listening") {
664
+ this._setUserAwayTimer();
665
+ } else {
666
+ this._cancelUserAwayTimer();
667
+ }
283
668
  this.emit(
284
669
  import_events.AgentSessionEventTypes.UserStateChanged,
285
670
  (0, import_events.createUserStateChangedEvent)(oldState, state)
@@ -298,38 +683,113 @@ class AgentSession extends import_node_events.EventEmitter {
298
683
  }
299
684
  onTextOutputChanged() {
300
685
  }
686
+ _setUserAwayTimer() {
687
+ this._cancelUserAwayTimer();
688
+ if (this.sessionOptions.userAwayTimeout === null || this.sessionOptions.userAwayTimeout === void 0) {
689
+ return;
690
+ }
691
+ if (this._roomIO && !this._roomIO.isParticipantAvailable) {
692
+ return;
693
+ }
694
+ this.userAwayTimer = setTimeout(() => {
695
+ this.logger.debug("User away timeout triggered");
696
+ this._updateUserState("away");
697
+ }, this.sessionOptions.userAwayTimeout * 1e3);
698
+ }
699
+ _cancelUserAwayTimer() {
700
+ if (this.userAwayTimer !== null) {
701
+ clearTimeout(this.userAwayTimer);
702
+ this.userAwayTimer = null;
703
+ }
704
+ }
705
+ /** @internal */
706
+ _onAecWarmupExpired() {
707
+ if (this._aecWarmupRemaining > 0) {
708
+ this.logger.debug("aec warmup expired, re-enabling interruptions");
709
+ }
710
+ this._aecWarmupRemaining = 0;
711
+ if (this._aecWarmupTimer !== null) {
712
+ clearTimeout(this._aecWarmupTimer);
713
+ this._aecWarmupTimer = null;
714
+ }
715
+ }
716
+ _onUserInputTranscribed(ev) {
717
+ if (this._userState === "away" && ev.isFinal) {
718
+ this.logger.debug("User returned from away state due to speech input");
719
+ this._updateUserState("listening");
720
+ }
721
+ }
301
722
  async closeImpl(reason, error = null, drain = false) {
302
- var _a, _b, _c;
723
+ if (this.rootSpanContext) {
724
+ return import_api.context.with(this.rootSpanContext, async () => {
725
+ await this.closeImplInner(reason, error, drain);
726
+ });
727
+ }
728
+ return this.closeImplInner(reason, error, drain);
729
+ }
730
+ async closeImplInner(reason, error = null, drain = false) {
731
+ var _a, _b, _c, _d;
303
732
  if (!this.started) {
304
733
  return;
305
734
  }
735
+ this._cancelUserAwayTimer();
736
+ this._onAecWarmupExpired();
737
+ this.off(import_events.AgentSessionEventTypes.UserInputTranscribed, this._onUserInputTranscribed);
306
738
  if (this.activity) {
307
739
  if (!drain) {
308
740
  try {
309
- this.activity.interrupt();
741
+ await this.activity.interrupt({ force: true }).await;
310
742
  } catch (error2) {
743
+ this.logger.warn({ error: error2 }, "Error interrupting activity");
311
744
  }
312
745
  }
313
746
  await this.activity.drain();
314
747
  await ((_a = this.activity.currentSpeech) == null ? void 0 : _a.waitForPlayout());
315
- this.activity.detachAudioInput();
748
+ if (reason !== import_events.CloseReason.ERROR) {
749
+ this.activity.commitUserTurn({ audioDetached: true, throwIfNotReady: false });
750
+ }
751
+ try {
752
+ this.activity.detachAudioInput();
753
+ } catch (error2) {
754
+ }
755
+ }
756
+ if (this._recorderIO) {
757
+ await this._recorderIO.close();
316
758
  }
317
759
  this.input.audio = null;
318
760
  this.output.audio = null;
319
761
  this.output.transcription = null;
320
- await ((_b = this.roomIO) == null ? void 0 : _b.close());
321
- this.roomIO = void 0;
322
- await ((_c = this.activity) == null ? void 0 : _c.close());
762
+ await ((_b = this.sessionHost) == null ? void 0 : _b.close());
763
+ this.sessionHost = void 0;
764
+ await ((_c = this._roomIO) == null ? void 0 : _c.close());
765
+ this._roomIO = void 0;
766
+ await ((_d = this.activity) == null ? void 0 : _d.close());
323
767
  this.activity = void 0;
768
+ if (this.sessionSpan) {
769
+ this.sessionSpan.end();
770
+ this.sessionSpan = void 0;
771
+ }
772
+ if (this._userSpeakingSpan) {
773
+ this._userSpeakingSpan.end();
774
+ this._userSpeakingSpan = void 0;
775
+ }
776
+ if (this.agentSpeakingSpan) {
777
+ this.agentSpeakingSpan.end();
778
+ this.agentSpeakingSpan = void 0;
779
+ }
324
780
  this.started = false;
325
781
  this.emit(import_events.AgentSessionEventTypes.Close, (0, import_events.createCloseEvent)(reason, error));
326
- this.userState = "listening";
782
+ this._userState = "listening";
327
783
  this._agentState = "initializing";
784
+ this.rootSpanContext = void 0;
785
+ this.llmErrorCounts = 0;
786
+ this.ttsErrorCounts = 0;
328
787
  this.logger.info({ reason, error }, "AgentSession closed");
329
788
  }
330
789
  }
331
790
  // Annotate the CommonJS export names for ESM import in node:
332
791
  0 && (module.exports = {
333
- AgentSession
792
+ AgentSession,
793
+ defaultAgentSessionOptions
334
794
  });
335
795
  //# sourceMappingURL=agent_session.cjs.map