@livekit/agents 0.0.0-20260120144724

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (987)
  1. package/LICENSE +201 -0
  2. package/README.md +17 -0
  3. package/dist/_exceptions.cjs +109 -0
  4. package/dist/_exceptions.cjs.map +1 -0
  5. package/dist/_exceptions.d.cts +64 -0
  6. package/dist/_exceptions.d.ts +64 -0
  7. package/dist/_exceptions.d.ts.map +1 -0
  8. package/dist/_exceptions.js +80 -0
  9. package/dist/_exceptions.js.map +1 -0
  10. package/dist/audio.cjs +170 -0
  11. package/dist/audio.cjs.map +1 -0
  12. package/dist/audio.d.cts +46 -0
  13. package/dist/audio.d.ts +46 -0
  14. package/dist/audio.d.ts.map +1 -0
  15. package/dist/audio.js +133 -0
  16. package/dist/audio.js.map +1 -0
  17. package/dist/cli.cjs +171 -0
  18. package/dist/cli.cjs.map +1 -0
  19. package/dist/cli.d.cts +14 -0
  20. package/dist/cli.d.ts +14 -0
  21. package/dist/cli.d.ts.map +1 -0
  22. package/dist/cli.js +145 -0
  23. package/dist/cli.js.map +1 -0
  24. package/dist/connection_pool.cjs +242 -0
  25. package/dist/connection_pool.cjs.map +1 -0
  26. package/dist/connection_pool.d.cts +123 -0
  27. package/dist/connection_pool.d.ts +123 -0
  28. package/dist/connection_pool.d.ts.map +1 -0
  29. package/dist/connection_pool.js +218 -0
  30. package/dist/connection_pool.js.map +1 -0
  31. package/dist/connection_pool.test.cjs +256 -0
  32. package/dist/connection_pool.test.cjs.map +1 -0
  33. package/dist/connection_pool.test.js +255 -0
  34. package/dist/connection_pool.test.js.map +1 -0
  35. package/dist/constants.cjs +44 -0
  36. package/dist/constants.cjs.map +1 -0
  37. package/dist/constants.d.cts +7 -0
  38. package/dist/constants.d.ts +7 -0
  39. package/dist/constants.d.ts.map +1 -0
  40. package/dist/constants.js +15 -0
  41. package/dist/constants.js.map +1 -0
  42. package/dist/generator.cjs +36 -0
  43. package/dist/generator.cjs.map +1 -0
  44. package/dist/generator.d.cts +23 -0
  45. package/dist/generator.d.ts +23 -0
  46. package/dist/generator.d.ts.map +1 -0
  47. package/dist/generator.js +11 -0
  48. package/dist/generator.js.map +1 -0
  49. package/dist/http_server.cjs +75 -0
  50. package/dist/http_server.cjs.map +1 -0
  51. package/dist/http_server.d.cts +20 -0
  52. package/dist/http_server.d.ts +20 -0
  53. package/dist/http_server.d.ts.map +1 -0
  54. package/dist/http_server.js +51 -0
  55. package/dist/http_server.js.map +1 -0
  56. package/dist/index.cjs +100 -0
  57. package/dist/index.cjs.map +1 -0
  58. package/dist/index.d.cts +35 -0
  59. package/dist/index.d.ts +35 -0
  60. package/dist/index.d.ts.map +1 -0
  61. package/dist/index.js +40 -0
  62. package/dist/index.js.map +1 -0
  63. package/dist/inference/api_protos.cjs +104 -0
  64. package/dist/inference/api_protos.cjs.map +1 -0
  65. package/dist/inference/api_protos.d.cts +222 -0
  66. package/dist/inference/api_protos.d.ts +222 -0
  67. package/dist/inference/api_protos.d.ts.map +1 -0
  68. package/dist/inference/api_protos.js +70 -0
  69. package/dist/inference/api_protos.js.map +1 -0
  70. package/dist/inference/index.cjs +56 -0
  71. package/dist/inference/index.cjs.map +1 -0
  72. package/dist/inference/index.d.cts +8 -0
  73. package/dist/inference/index.d.ts +8 -0
  74. package/dist/inference/index.d.ts.map +1 -0
  75. package/dist/inference/index.js +23 -0
  76. package/dist/inference/index.js.map +1 -0
  77. package/dist/inference/interruption/AdaptiveInterruptionDetector.cjs +152 -0
  78. package/dist/inference/interruption/AdaptiveInterruptionDetector.cjs.map +1 -0
  79. package/dist/inference/interruption/AdaptiveInterruptionDetector.d.cts +50 -0
  80. package/dist/inference/interruption/AdaptiveInterruptionDetector.d.ts +50 -0
  81. package/dist/inference/interruption/AdaptiveInterruptionDetector.d.ts.map +1 -0
  82. package/dist/inference/interruption/AdaptiveInterruptionDetector.js +125 -0
  83. package/dist/inference/interruption/AdaptiveInterruptionDetector.js.map +1 -0
  84. package/dist/inference/interruption/InterruptionStream.cjs +310 -0
  85. package/dist/inference/interruption/InterruptionStream.cjs.map +1 -0
  86. package/dist/inference/interruption/InterruptionStream.d.cts +57 -0
  87. package/dist/inference/interruption/InterruptionStream.d.ts +57 -0
  88. package/dist/inference/interruption/InterruptionStream.d.ts.map +1 -0
  89. package/dist/inference/interruption/InterruptionStream.js +288 -0
  90. package/dist/inference/interruption/InterruptionStream.js.map +1 -0
  91. package/dist/inference/interruption/defaults.cjs +76 -0
  92. package/dist/inference/interruption/defaults.cjs.map +1 -0
  93. package/dist/inference/interruption/defaults.d.cts +14 -0
  94. package/dist/inference/interruption/defaults.d.ts +14 -0
  95. package/dist/inference/interruption/defaults.d.ts.map +1 -0
  96. package/dist/inference/interruption/defaults.js +42 -0
  97. package/dist/inference/interruption/defaults.js.map +1 -0
  98. package/dist/inference/interruption/errors.cjs +2 -0
  99. package/dist/inference/interruption/errors.cjs.map +1 -0
  100. package/dist/inference/interruption/errors.d.cts +2 -0
  101. package/dist/inference/interruption/errors.d.ts +2 -0
  102. package/dist/inference/interruption/errors.d.ts.map +1 -0
  103. package/dist/inference/interruption/errors.js +1 -0
  104. package/dist/inference/interruption/errors.js.map +1 -0
  105. package/dist/inference/interruption/http_transport.cjs +57 -0
  106. package/dist/inference/interruption/http_transport.cjs.map +1 -0
  107. package/dist/inference/interruption/http_transport.d.cts +23 -0
  108. package/dist/inference/interruption/http_transport.d.ts +23 -0
  109. package/dist/inference/interruption/http_transport.d.ts.map +1 -0
  110. package/dist/inference/interruption/http_transport.js +33 -0
  111. package/dist/inference/interruption/http_transport.js.map +1 -0
  112. package/dist/inference/interruption/index.cjs +34 -0
  113. package/dist/inference/interruption/index.cjs.map +1 -0
  114. package/dist/inference/interruption/index.d.cts +5 -0
  115. package/dist/inference/interruption/index.d.ts +5 -0
  116. package/dist/inference/interruption/index.d.ts.map +1 -0
  117. package/dist/inference/interruption/index.js +7 -0
  118. package/dist/inference/interruption/index.js.map +1 -0
  119. package/dist/inference/interruption/interruption.cjs +85 -0
  120. package/dist/inference/interruption/interruption.cjs.map +1 -0
  121. package/dist/inference/interruption/interruption.d.cts +48 -0
  122. package/dist/inference/interruption/interruption.d.ts +48 -0
  123. package/dist/inference/interruption/interruption.d.ts.map +1 -0
  124. package/dist/inference/interruption/interruption.js +59 -0
  125. package/dist/inference/interruption/interruption.js.map +1 -0
  126. package/dist/inference/llm.cjs +347 -0
  127. package/dist/inference/llm.cjs.map +1 -0
  128. package/dist/inference/llm.d.cts +114 -0
  129. package/dist/inference/llm.d.ts +114 -0
  130. package/dist/inference/llm.d.ts.map +1 -0
  131. package/dist/inference/llm.js +318 -0
  132. package/dist/inference/llm.js.map +1 -0
  133. package/dist/inference/stt.cjs +371 -0
  134. package/dist/inference/stt.cjs.map +1 -0
  135. package/dist/inference/stt.d.cts +91 -0
  136. package/dist/inference/stt.d.ts +91 -0
  137. package/dist/inference/stt.d.ts.map +1 -0
  138. package/dist/inference/stt.js +350 -0
  139. package/dist/inference/stt.js.map +1 -0
  140. package/dist/inference/tts.cjs +439 -0
  141. package/dist/inference/tts.cjs.map +1 -0
  142. package/dist/inference/tts.d.cts +80 -0
  143. package/dist/inference/tts.d.ts +80 -0
  144. package/dist/inference/tts.d.ts.map +1 -0
  145. package/dist/inference/tts.js +417 -0
  146. package/dist/inference/tts.js.map +1 -0
  147. package/dist/inference/utils.cjs +89 -0
  148. package/dist/inference/utils.cjs.map +1 -0
  149. package/dist/inference/utils.d.cts +6 -0
  150. package/dist/inference/utils.d.ts +6 -0
  151. package/dist/inference/utils.d.ts.map +1 -0
  152. package/dist/inference/utils.js +63 -0
  153. package/dist/inference/utils.js.map +1 -0
  154. package/dist/inference/utils.test.cjs +20 -0
  155. package/dist/inference/utils.test.cjs.map +1 -0
  156. package/dist/inference/utils.test.js +19 -0
  157. package/dist/inference/utils.test.js.map +1 -0
  158. package/dist/inference_runner.cjs +37 -0
  159. package/dist/inference_runner.cjs.map +1 -0
  160. package/dist/inference_runner.d.cts +11 -0
  161. package/dist/inference_runner.d.ts +11 -0
  162. package/dist/inference_runner.d.ts.map +1 -0
  163. package/dist/inference_runner.js +13 -0
  164. package/dist/inference_runner.js.map +1 -0
  165. package/dist/ipc/index.cjs +23 -0
  166. package/dist/ipc/index.cjs.map +1 -0
  167. package/dist/ipc/index.d.cts +2 -0
  168. package/dist/ipc/index.d.ts +2 -0
  169. package/dist/ipc/index.d.ts.map +1 -0
  170. package/dist/ipc/index.js +2 -0
  171. package/dist/ipc/index.js.map +1 -0
  172. package/dist/ipc/inference_executor.cjs +17 -0
  173. package/dist/ipc/inference_executor.cjs.map +1 -0
  174. package/dist/ipc/inference_executor.d.cts +4 -0
  175. package/dist/ipc/inference_executor.d.ts +4 -0
  176. package/dist/ipc/inference_executor.d.ts.map +1 -0
  177. package/dist/ipc/inference_executor.js +1 -0
  178. package/dist/ipc/inference_executor.js.map +1 -0
  179. package/dist/ipc/inference_proc_executor.cjs +101 -0
  180. package/dist/ipc/inference_proc_executor.cjs.map +1 -0
  181. package/dist/ipc/inference_proc_executor.d.cts +23 -0
  182. package/dist/ipc/inference_proc_executor.d.ts +23 -0
  183. package/dist/ipc/inference_proc_executor.d.ts.map +1 -0
  184. package/dist/ipc/inference_proc_executor.js +75 -0
  185. package/dist/ipc/inference_proc_executor.js.map +1 -0
  186. package/dist/ipc/inference_proc_lazy_main.cjs +86 -0
  187. package/dist/ipc/inference_proc_lazy_main.cjs.map +1 -0
  188. package/dist/ipc/inference_proc_lazy_main.d.cts +2 -0
  189. package/dist/ipc/inference_proc_lazy_main.d.ts +2 -0
  190. package/dist/ipc/inference_proc_lazy_main.d.ts.map +1 -0
  191. package/dist/ipc/inference_proc_lazy_main.js +85 -0
  192. package/dist/ipc/inference_proc_lazy_main.js.map +1 -0
  193. package/dist/ipc/job_executor.cjs +34 -0
  194. package/dist/ipc/job_executor.cjs.map +1 -0
  195. package/dist/ipc/job_executor.d.cts +18 -0
  196. package/dist/ipc/job_executor.d.ts +18 -0
  197. package/dist/ipc/job_executor.d.ts.map +1 -0
  198. package/dist/ipc/job_executor.js +10 -0
  199. package/dist/ipc/job_executor.js.map +1 -0
  200. package/dist/ipc/job_proc_executor.cjs +115 -0
  201. package/dist/ipc/job_proc_executor.cjs.map +1 -0
  202. package/dist/ipc/job_proc_executor.d.cts +19 -0
  203. package/dist/ipc/job_proc_executor.d.ts +19 -0
  204. package/dist/ipc/job_proc_executor.d.ts.map +1 -0
  205. package/dist/ipc/job_proc_executor.js +89 -0
  206. package/dist/ipc/job_proc_executor.js.map +1 -0
  207. package/dist/ipc/job_proc_lazy_main.cjs +210 -0
  208. package/dist/ipc/job_proc_lazy_main.cjs.map +1 -0
  209. package/dist/ipc/job_proc_lazy_main.d.cts +2 -0
  210. package/dist/ipc/job_proc_lazy_main.d.ts +2 -0
  211. package/dist/ipc/job_proc_lazy_main.d.ts.map +1 -0
  212. package/dist/ipc/job_proc_lazy_main.js +187 -0
  213. package/dist/ipc/job_proc_lazy_main.js.map +1 -0
  214. package/dist/ipc/message.cjs +17 -0
  215. package/dist/ipc/message.cjs.map +1 -0
  216. package/dist/ipc/message.d.cts +58 -0
  217. package/dist/ipc/message.d.ts +58 -0
  218. package/dist/ipc/message.d.ts.map +1 -0
  219. package/dist/ipc/message.js +1 -0
  220. package/dist/ipc/message.js.map +1 -0
  221. package/dist/ipc/proc_pool.cjs +164 -0
  222. package/dist/ipc/proc_pool.cjs.map +1 -0
  223. package/dist/ipc/proc_pool.d.cts +31 -0
  224. package/dist/ipc/proc_pool.d.ts +31 -0
  225. package/dist/ipc/proc_pool.d.ts.map +1 -0
  226. package/dist/ipc/proc_pool.js +140 -0
  227. package/dist/ipc/proc_pool.js.map +1 -0
  228. package/dist/ipc/supervised_proc.cjs +229 -0
  229. package/dist/ipc/supervised_proc.cjs.map +1 -0
  230. package/dist/ipc/supervised_proc.d.cts +32 -0
  231. package/dist/ipc/supervised_proc.d.ts +32 -0
  232. package/dist/ipc/supervised_proc.d.ts.map +1 -0
  233. package/dist/ipc/supervised_proc.js +195 -0
  234. package/dist/ipc/supervised_proc.js.map +1 -0
  235. package/dist/ipc/supervised_proc.test.cjs +145 -0
  236. package/dist/ipc/supervised_proc.test.cjs.map +1 -0
  237. package/dist/ipc/supervised_proc.test.js +122 -0
  238. package/dist/ipc/supervised_proc.test.js.map +1 -0
  239. package/dist/job.cjs +373 -0
  240. package/dist/job.cjs.map +1 -0
  241. package/dist/job.d.cts +141 -0
  242. package/dist/job.d.ts +141 -0
  243. package/dist/job.d.ts.map +1 -0
  244. package/dist/job.js +332 -0
  245. package/dist/job.js.map +1 -0
  246. package/dist/llm/chat_context.cjs +527 -0
  247. package/dist/llm/chat_context.cjs.map +1 -0
  248. package/dist/llm/chat_context.d.cts +223 -0
  249. package/dist/llm/chat_context.d.ts +223 -0
  250. package/dist/llm/chat_context.d.ts.map +1 -0
  251. package/dist/llm/chat_context.js +496 -0
  252. package/dist/llm/chat_context.js.map +1 -0
  253. package/dist/llm/chat_context.test.cjs +911 -0
  254. package/dist/llm/chat_context.test.cjs.map +1 -0
  255. package/dist/llm/chat_context.test.js +916 -0
  256. package/dist/llm/chat_context.test.js.map +1 -0
  257. package/dist/llm/fallback_adapter.cjs +278 -0
  258. package/dist/llm/fallback_adapter.cjs.map +1 -0
  259. package/dist/llm/fallback_adapter.d.cts +73 -0
  260. package/dist/llm/fallback_adapter.d.ts +73 -0
  261. package/dist/llm/fallback_adapter.d.ts.map +1 -0
  262. package/dist/llm/fallback_adapter.js +254 -0
  263. package/dist/llm/fallback_adapter.js.map +1 -0
  264. package/dist/llm/fallback_adapter.test.cjs +176 -0
  265. package/dist/llm/fallback_adapter.test.cjs.map +1 -0
  266. package/dist/llm/fallback_adapter.test.js +175 -0
  267. package/dist/llm/fallback_adapter.test.js.map +1 -0
  268. package/dist/llm/index.cjs +79 -0
  269. package/dist/llm/index.cjs.map +1 -0
  270. package/dist/llm/index.d.cts +9 -0
  271. package/dist/llm/index.d.ts +9 -0
  272. package/dist/llm/index.d.ts.map +1 -0
  273. package/dist/llm/index.js +61 -0
  274. package/dist/llm/index.js.map +1 -0
  275. package/dist/llm/llm.cjs +226 -0
  276. package/dist/llm/llm.cjs.map +1 -0
  277. package/dist/llm/llm.d.cts +94 -0
  278. package/dist/llm/llm.d.ts +94 -0
  279. package/dist/llm/llm.d.ts.map +1 -0
  280. package/dist/llm/llm.js +201 -0
  281. package/dist/llm/llm.js.map +1 -0
  282. package/dist/llm/provider_format/google.cjs +132 -0
  283. package/dist/llm/provider_format/google.cjs.map +1 -0
  284. package/dist/llm/provider_format/google.d.cts +6 -0
  285. package/dist/llm/provider_format/google.d.ts +6 -0
  286. package/dist/llm/provider_format/google.d.ts.map +1 -0
  287. package/dist/llm/provider_format/google.js +108 -0
  288. package/dist/llm/provider_format/google.js.map +1 -0
  289. package/dist/llm/provider_format/google.test.cjs +724 -0
  290. package/dist/llm/provider_format/google.test.cjs.map +1 -0
  291. package/dist/llm/provider_format/google.test.js +728 -0
  292. package/dist/llm/provider_format/google.test.js.map +1 -0
  293. package/dist/llm/provider_format/index.cjs +40 -0
  294. package/dist/llm/provider_format/index.cjs.map +1 -0
  295. package/dist/llm/provider_format/index.d.cts +4 -0
  296. package/dist/llm/provider_format/index.d.ts +4 -0
  297. package/dist/llm/provider_format/index.d.ts.map +1 -0
  298. package/dist/llm/provider_format/index.js +16 -0
  299. package/dist/llm/provider_format/index.js.map +1 -0
  300. package/dist/llm/provider_format/openai.cjs +138 -0
  301. package/dist/llm/provider_format/openai.cjs.map +1 -0
  302. package/dist/llm/provider_format/openai.d.cts +3 -0
  303. package/dist/llm/provider_format/openai.d.ts +3 -0
  304. package/dist/llm/provider_format/openai.d.ts.map +1 -0
  305. package/dist/llm/provider_format/openai.js +114 -0
  306. package/dist/llm/provider_format/openai.js.map +1 -0
  307. package/dist/llm/provider_format/openai.test.cjs +557 -0
  308. package/dist/llm/provider_format/openai.test.cjs.map +1 -0
  309. package/dist/llm/provider_format/openai.test.js +561 -0
  310. package/dist/llm/provider_format/openai.test.js.map +1 -0
  311. package/dist/llm/provider_format/utils.cjs +146 -0
  312. package/dist/llm/provider_format/utils.cjs.map +1 -0
  313. package/dist/llm/provider_format/utils.d.cts +38 -0
  314. package/dist/llm/provider_format/utils.d.ts +38 -0
  315. package/dist/llm/provider_format/utils.d.ts.map +1 -0
  316. package/dist/llm/provider_format/utils.js +122 -0
  317. package/dist/llm/provider_format/utils.js.map +1 -0
  318. package/dist/llm/realtime.cjs +77 -0
  319. package/dist/llm/realtime.cjs.map +1 -0
  320. package/dist/llm/realtime.d.cts +106 -0
  321. package/dist/llm/realtime.d.ts +106 -0
  322. package/dist/llm/realtime.d.ts.map +1 -0
  323. package/dist/llm/realtime.js +52 -0
  324. package/dist/llm/realtime.js.map +1 -0
  325. package/dist/llm/remote_chat_context.cjs +112 -0
  326. package/dist/llm/remote_chat_context.cjs.map +1 -0
  327. package/dist/llm/remote_chat_context.d.cts +25 -0
  328. package/dist/llm/remote_chat_context.d.ts +25 -0
  329. package/dist/llm/remote_chat_context.d.ts.map +1 -0
  330. package/dist/llm/remote_chat_context.js +88 -0
  331. package/dist/llm/remote_chat_context.js.map +1 -0
  332. package/dist/llm/remote_chat_context.test.cjs +225 -0
  333. package/dist/llm/remote_chat_context.test.cjs.map +1 -0
  334. package/dist/llm/remote_chat_context.test.js +224 -0
  335. package/dist/llm/remote_chat_context.test.js.map +1 -0
  336. package/dist/llm/tool_context.cjs +152 -0
  337. package/dist/llm/tool_context.cjs.map +1 -0
  338. package/dist/llm/tool_context.d.cts +153 -0
  339. package/dist/llm/tool_context.d.ts +153 -0
  340. package/dist/llm/tool_context.d.ts.map +1 -0
  341. package/dist/llm/tool_context.js +119 -0
  342. package/dist/llm/tool_context.js.map +1 -0
  343. package/dist/llm/tool_context.test.cjs +359 -0
  344. package/dist/llm/tool_context.test.cjs.map +1 -0
  345. package/dist/llm/tool_context.test.js +336 -0
  346. package/dist/llm/tool_context.test.js.map +1 -0
  347. package/dist/llm/tool_context.type.test.cjs +92 -0
  348. package/dist/llm/tool_context.type.test.cjs.map +1 -0
  349. package/dist/llm/tool_context.type.test.js +91 -0
  350. package/dist/llm/tool_context.type.test.js.map +1 -0
  351. package/dist/llm/utils.cjs +267 -0
  352. package/dist/llm/utils.cjs.map +1 -0
  353. package/dist/llm/utils.d.cts +41 -0
  354. package/dist/llm/utils.d.ts +41 -0
  355. package/dist/llm/utils.d.ts.map +1 -0
  356. package/dist/llm/utils.js +230 -0
  357. package/dist/llm/utils.js.map +1 -0
  358. package/dist/llm/utils.test.cjs +513 -0
  359. package/dist/llm/utils.test.cjs.map +1 -0
  360. package/dist/llm/utils.test.js +490 -0
  361. package/dist/llm/utils.test.js.map +1 -0
  362. package/dist/llm/zod-utils.cjs +102 -0
  363. package/dist/llm/zod-utils.cjs.map +1 -0
  364. package/dist/llm/zod-utils.d.cts +65 -0
  365. package/dist/llm/zod-utils.d.ts +65 -0
  366. package/dist/llm/zod-utils.d.ts.map +1 -0
  367. package/dist/llm/zod-utils.js +64 -0
  368. package/dist/llm/zod-utils.js.map +1 -0
  369. package/dist/llm/zod-utils.test.cjs +472 -0
  370. package/dist/llm/zod-utils.test.cjs.map +1 -0
  371. package/dist/llm/zod-utils.test.js +455 -0
  372. package/dist/llm/zod-utils.test.js.map +1 -0
  373. package/dist/log.cjs +81 -0
  374. package/dist/log.cjs.map +1 -0
  375. package/dist/log.d.cts +20 -0
  376. package/dist/log.d.ts +20 -0
  377. package/dist/log.d.ts.map +1 -0
  378. package/dist/log.js +54 -0
  379. package/dist/log.js.map +1 -0
  380. package/dist/metrics/base.cjs +17 -0
  381. package/dist/metrics/base.cjs.map +1 -0
  382. package/dist/metrics/base.d.cts +150 -0
  383. package/dist/metrics/base.d.ts +150 -0
  384. package/dist/metrics/base.d.ts.map +1 -0
  385. package/dist/metrics/base.js +1 -0
  386. package/dist/metrics/base.js.map +1 -0
  387. package/dist/metrics/index.cjs +32 -0
  388. package/dist/metrics/index.cjs.map +1 -0
  389. package/dist/metrics/index.d.cts +4 -0
  390. package/dist/metrics/index.d.ts +4 -0
  391. package/dist/metrics/index.d.ts.map +1 -0
  392. package/dist/metrics/index.js +7 -0
  393. package/dist/metrics/index.js.map +1 -0
  394. package/dist/metrics/usage_collector.cjs +58 -0
  395. package/dist/metrics/usage_collector.cjs.map +1 -0
  396. package/dist/metrics/usage_collector.d.cts +15 -0
  397. package/dist/metrics/usage_collector.d.ts +15 -0
  398. package/dist/metrics/usage_collector.d.ts.map +1 -0
  399. package/dist/metrics/usage_collector.js +34 -0
  400. package/dist/metrics/usage_collector.js.map +1 -0
  401. package/dist/metrics/utils.cjs +74 -0
  402. package/dist/metrics/utils.cjs.map +1 -0
  403. package/dist/metrics/utils.d.cts +3 -0
  404. package/dist/metrics/utils.d.ts +3 -0
  405. package/dist/metrics/utils.d.ts.map +1 -0
  406. package/dist/metrics/utils.js +50 -0
  407. package/dist/metrics/utils.js.map +1 -0
  408. package/dist/plugin.cjs +62 -0
  409. package/dist/plugin.cjs.map +1 -0
  410. package/dist/plugin.d.cts +24 -0
  411. package/dist/plugin.d.ts +24 -0
  412. package/dist/plugin.d.ts.map +1 -0
  413. package/dist/plugin.js +37 -0
  414. package/dist/plugin.js.map +1 -0
  415. package/dist/stream/deferred_stream.cjs +106 -0
  416. package/dist/stream/deferred_stream.cjs.map +1 -0
  417. package/dist/stream/deferred_stream.d.cts +32 -0
  418. package/dist/stream/deferred_stream.d.ts +32 -0
  419. package/dist/stream/deferred_stream.d.ts.map +1 -0
  420. package/dist/stream/deferred_stream.js +81 -0
  421. package/dist/stream/deferred_stream.js.map +1 -0
  422. package/dist/stream/deferred_stream.test.cjs +527 -0
  423. package/dist/stream/deferred_stream.test.cjs.map +1 -0
  424. package/dist/stream/deferred_stream.test.js +526 -0
  425. package/dist/stream/deferred_stream.test.js.map +1 -0
  426. package/dist/stream/identity_transform.cjs +42 -0
  427. package/dist/stream/identity_transform.cjs.map +1 -0
  428. package/dist/stream/identity_transform.d.cts +6 -0
  429. package/dist/stream/identity_transform.d.ts +6 -0
  430. package/dist/stream/identity_transform.d.ts.map +1 -0
  431. package/dist/stream/identity_transform.js +18 -0
  432. package/dist/stream/identity_transform.js.map +1 -0
  433. package/dist/stream/identity_transform.test.cjs +125 -0
  434. package/dist/stream/identity_transform.test.cjs.map +1 -0
  435. package/dist/stream/identity_transform.test.js +124 -0
  436. package/dist/stream/identity_transform.test.js.map +1 -0
  437. package/dist/stream/index.cjs +38 -0
  438. package/dist/stream/index.cjs.map +1 -0
  439. package/dist/stream/index.d.cts +5 -0
  440. package/dist/stream/index.d.ts +5 -0
  441. package/dist/stream/index.d.ts.map +1 -0
  442. package/dist/stream/index.js +11 -0
  443. package/dist/stream/index.js.map +1 -0
  444. package/dist/stream/merge_readable_streams.cjs +59 -0
  445. package/dist/stream/merge_readable_streams.cjs.map +1 -0
  446. package/dist/stream/merge_readable_streams.d.cts +4 -0
  447. package/dist/stream/merge_readable_streams.d.ts +4 -0
  448. package/dist/stream/merge_readable_streams.d.ts.map +1 -0
  449. package/dist/stream/merge_readable_streams.js +35 -0
  450. package/dist/stream/merge_readable_streams.js.map +1 -0
  451. package/dist/stream/stream_channel.cjs +57 -0
  452. package/dist/stream/stream_channel.cjs.map +1 -0
  453. package/dist/stream/stream_channel.d.cts +11 -0
  454. package/dist/stream/stream_channel.d.ts +11 -0
  455. package/dist/stream/stream_channel.d.ts.map +1 -0
  456. package/dist/stream/stream_channel.js +33 -0
  457. package/dist/stream/stream_channel.js.map +1 -0
  458. package/dist/stream/stream_channel.test.cjs +124 -0
  459. package/dist/stream/stream_channel.test.cjs.map +1 -0
  460. package/dist/stream/stream_channel.test.js +123 -0
  461. package/dist/stream/stream_channel.test.js.map +1 -0
  462. package/dist/stt/index.cjs +38 -0
  463. package/dist/stt/index.cjs.map +1 -0
  464. package/dist/stt/index.d.cts +3 -0
  465. package/dist/stt/index.d.ts +3 -0
  466. package/dist/stt/index.d.ts.map +1 -0
  467. package/dist/stt/index.js +14 -0
  468. package/dist/stt/index.js.map +1 -0
  469. package/dist/stt/stream_adapter.cjs +115 -0
  470. package/dist/stt/stream_adapter.cjs.map +1 -0
  471. package/dist/stt/stream_adapter.d.cts +23 -0
  472. package/dist/stt/stream_adapter.d.ts +23 -0
  473. package/dist/stt/stream_adapter.d.ts.map +1 -0
  474. package/dist/stt/stream_adapter.js +90 -0
  475. package/dist/stt/stream_adapter.js.map +1 -0
  476. package/dist/stt/stt.cjs +253 -0
  477. package/dist/stt/stt.cjs.map +1 -0
  478. package/dist/stt/stt.d.cts +158 -0
  479. package/dist/stt/stt.d.ts +158 -0
  480. package/dist/stt/stt.d.ts.map +1 -0
  481. package/dist/stt/stt.js +227 -0
  482. package/dist/stt/stt.js.map +1 -0
  483. package/dist/telemetry/index.cjs +72 -0
  484. package/dist/telemetry/index.cjs.map +1 -0
  485. package/dist/telemetry/index.d.cts +7 -0
  486. package/dist/telemetry/index.d.ts +7 -0
  487. package/dist/telemetry/index.d.ts.map +1 -0
  488. package/dist/telemetry/index.js +37 -0
  489. package/dist/telemetry/index.js.map +1 -0
  490. package/dist/telemetry/logging.cjs +65 -0
  491. package/dist/telemetry/logging.cjs.map +1 -0
  492. package/dist/telemetry/logging.d.cts +21 -0
  493. package/dist/telemetry/logging.d.ts +21 -0
  494. package/dist/telemetry/logging.d.ts.map +1 -0
  495. package/dist/telemetry/logging.js +40 -0
  496. package/dist/telemetry/logging.js.map +1 -0
  497. package/dist/telemetry/otel_http_exporter.cjs +147 -0
  498. package/dist/telemetry/otel_http_exporter.cjs.map +1 -0
  499. package/dist/telemetry/otel_http_exporter.d.cts +62 -0
  500. package/dist/telemetry/otel_http_exporter.d.ts +62 -0
  501. package/dist/telemetry/otel_http_exporter.d.ts.map +1 -0
  502. package/dist/telemetry/otel_http_exporter.js +123 -0
  503. package/dist/telemetry/otel_http_exporter.js.map +1 -0
  504. package/dist/telemetry/pino_otel_transport.cjs +217 -0
  505. package/dist/telemetry/pino_otel_transport.cjs.map +1 -0
  506. package/dist/telemetry/pino_otel_transport.d.cts +58 -0
  507. package/dist/telemetry/pino_otel_transport.d.ts +58 -0
  508. package/dist/telemetry/pino_otel_transport.d.ts.map +1 -0
  509. package/dist/telemetry/pino_otel_transport.js +189 -0
  510. package/dist/telemetry/pino_otel_transport.js.map +1 -0
  511. package/dist/telemetry/trace_types.cjs +206 -0
  512. package/dist/telemetry/trace_types.cjs.map +1 -0
  513. package/dist/telemetry/trace_types.d.cts +61 -0
  514. package/dist/telemetry/trace_types.d.ts +61 -0
  515. package/dist/telemetry/trace_types.d.ts.map +1 -0
  516. package/dist/telemetry/trace_types.js +123 -0
  517. package/dist/telemetry/trace_types.js.map +1 -0
  518. package/dist/telemetry/traces.cjs +444 -0
  519. package/dist/telemetry/traces.cjs.map +1 -0
  520. package/dist/telemetry/traces.d.cts +114 -0
  521. package/dist/telemetry/traces.d.ts +114 -0
  522. package/dist/telemetry/traces.d.ts.map +1 -0
  523. package/dist/telemetry/traces.js +409 -0
  524. package/dist/telemetry/traces.js.map +1 -0
  525. package/dist/telemetry/utils.cjs +86 -0
  526. package/dist/telemetry/utils.cjs.map +1 -0
  527. package/dist/telemetry/utils.d.cts +5 -0
  528. package/dist/telemetry/utils.d.ts +5 -0
  529. package/dist/telemetry/utils.d.ts.map +1 -0
  530. package/dist/telemetry/utils.js +51 -0
  531. package/dist/telemetry/utils.js.map +1 -0
  532. package/dist/tokenize/basic/basic.cjs +105 -0
  533. package/dist/tokenize/basic/basic.cjs.map +1 -0
  534. package/dist/tokenize/basic/basic.d.cts +24 -0
  535. package/dist/tokenize/basic/basic.d.ts +24 -0
  536. package/dist/tokenize/basic/basic.d.ts.map +1 -0
  537. package/dist/tokenize/basic/basic.js +67 -0
  538. package/dist/tokenize/basic/basic.js.map +1 -0
  539. package/dist/tokenize/basic/hyphenator.cjs +425 -0
  540. package/dist/tokenize/basic/hyphenator.cjs.map +1 -0
  541. package/dist/tokenize/basic/hyphenator.d.cts +17 -0
  542. package/dist/tokenize/basic/hyphenator.d.ts +17 -0
  543. package/dist/tokenize/basic/hyphenator.d.ts.map +1 -0
  544. package/dist/tokenize/basic/hyphenator.js +401 -0
  545. package/dist/tokenize/basic/hyphenator.js.map +1 -0
  546. package/dist/tokenize/basic/index.cjs +37 -0
  547. package/dist/tokenize/basic/index.cjs.map +1 -0
  548. package/dist/tokenize/basic/index.d.cts +2 -0
  549. package/dist/tokenize/basic/index.d.ts +2 -0
  550. package/dist/tokenize/basic/index.d.ts.map +1 -0
  551. package/dist/tokenize/basic/index.js +15 -0
  552. package/dist/tokenize/basic/index.js.map +1 -0
  553. package/dist/tokenize/basic/paragraph.cjs +57 -0
  554. package/dist/tokenize/basic/paragraph.cjs.map +1 -0
  555. package/dist/tokenize/basic/paragraph.d.cts +5 -0
  556. package/dist/tokenize/basic/paragraph.d.ts +5 -0
  557. package/dist/tokenize/basic/paragraph.d.ts.map +1 -0
  558. package/dist/tokenize/basic/paragraph.js +33 -0
  559. package/dist/tokenize/basic/paragraph.js.map +1 -0
  560. package/dist/tokenize/basic/sentence.cjs +97 -0
  561. package/dist/tokenize/basic/sentence.cjs.map +1 -0
  562. package/dist/tokenize/basic/sentence.d.cts +5 -0
  563. package/dist/tokenize/basic/sentence.d.ts +5 -0
  564. package/dist/tokenize/basic/sentence.d.ts.map +1 -0
  565. package/dist/tokenize/basic/sentence.js +73 -0
  566. package/dist/tokenize/basic/sentence.js.map +1 -0
  567. package/dist/tokenize/basic/word.cjs +44 -0
  568. package/dist/tokenize/basic/word.cjs.map +1 -0
  569. package/dist/tokenize/basic/word.d.cts +5 -0
  570. package/dist/tokenize/basic/word.d.ts +5 -0
  571. package/dist/tokenize/basic/word.d.ts.map +1 -0
  572. package/dist/tokenize/basic/word.js +20 -0
  573. package/dist/tokenize/basic/word.js.map +1 -0
  574. package/dist/tokenize/index.cjs +55 -0
  575. package/dist/tokenize/index.cjs.map +1 -0
  576. package/dist/tokenize/index.d.cts +5 -0
  577. package/dist/tokenize/index.d.ts +5 -0
  578. package/dist/tokenize/index.d.ts.map +1 -0
  579. package/dist/tokenize/index.js +19 -0
  580. package/dist/tokenize/index.js.map +1 -0
  581. package/dist/tokenize/token_stream.cjs +168 -0
  582. package/dist/tokenize/token_stream.cjs.map +1 -0
  583. package/dist/tokenize/token_stream.d.cts +40 -0
  584. package/dist/tokenize/token_stream.d.ts +40 -0
  585. package/dist/tokenize/token_stream.d.ts.map +1 -0
  586. package/dist/tokenize/token_stream.js +142 -0
  587. package/dist/tokenize/token_stream.js.map +1 -0
  588. package/dist/tokenize/tokenizer.cjs +184 -0
  589. package/dist/tokenize/tokenizer.cjs.map +1 -0
  590. package/dist/tokenize/tokenizer.d.cts +55 -0
  591. package/dist/tokenize/tokenizer.d.ts +55 -0
  592. package/dist/tokenize/tokenizer.d.ts.map +1 -0
  593. package/dist/tokenize/tokenizer.js +156 -0
  594. package/dist/tokenize/tokenizer.js.map +1 -0
  595. package/dist/tokenize/tokenizer.test.cjs +220 -0
  596. package/dist/tokenize/tokenizer.test.cjs.map +1 -0
  597. package/dist/tokenize/tokenizer.test.js +219 -0
  598. package/dist/tokenize/tokenizer.test.js.map +1 -0
  599. package/dist/transcription.cjs +247 -0
  600. package/dist/transcription.cjs.map +1 -0
  601. package/dist/transcription.d.cts +31 -0
  602. package/dist/transcription.d.ts +31 -0
  603. package/dist/transcription.d.ts.map +1 -0
  604. package/dist/transcription.js +222 -0
  605. package/dist/transcription.js.map +1 -0
  606. package/dist/tts/index.cjs +38 -0
  607. package/dist/tts/index.cjs.map +1 -0
  608. package/dist/tts/index.d.cts +3 -0
  609. package/dist/tts/index.d.ts +3 -0
  610. package/dist/tts/index.d.ts.map +1 -0
  611. package/dist/tts/index.js +14 -0
  612. package/dist/tts/index.js.map +1 -0
  613. package/dist/tts/stream_adapter.cjs +105 -0
  614. package/dist/tts/stream_adapter.cjs.map +1 -0
  615. package/dist/tts/stream_adapter.d.cts +20 -0
  616. package/dist/tts/stream_adapter.d.ts +20 -0
  617. package/dist/tts/stream_adapter.d.ts.map +1 -0
  618. package/dist/tts/stream_adapter.js +80 -0
  619. package/dist/tts/stream_adapter.js.map +1 -0
  620. package/dist/tts/tts.cjs +431 -0
  621. package/dist/tts/tts.cjs.map +1 -0
  622. package/dist/tts/tts.d.cts +161 -0
  623. package/dist/tts/tts.d.ts +161 -0
  624. package/dist/tts/tts.d.ts.map +1 -0
  625. package/dist/tts/tts.js +405 -0
  626. package/dist/tts/tts.js.map +1 -0
  627. package/dist/types.cjs +49 -0
  628. package/dist/types.cjs.map +1 -0
  629. package/dist/types.d.cts +44 -0
  630. package/dist/types.d.ts +44 -0
  631. package/dist/types.d.ts.map +1 -0
  632. package/dist/types.js +23 -0
  633. package/dist/types.js.map +1 -0
  634. package/dist/utils/ws_transport.cjs +51 -0
  635. package/dist/utils/ws_transport.cjs.map +1 -0
  636. package/dist/utils/ws_transport.d.cts +9 -0
  637. package/dist/utils/ws_transport.d.ts +9 -0
  638. package/dist/utils/ws_transport.d.ts.map +1 -0
  639. package/dist/utils/ws_transport.js +17 -0
  640. package/dist/utils/ws_transport.js.map +1 -0
  641. package/dist/utils/ws_transport.test.cjs +212 -0
  642. package/dist/utils/ws_transport.test.cjs.map +1 -0
  643. package/dist/utils/ws_transport.test.js +211 -0
  644. package/dist/utils/ws_transport.test.js.map +1 -0
  645. package/dist/utils.cjs +669 -0
  646. package/dist/utils.cjs.map +1 -0
  647. package/dist/utils.d.cts +244 -0
  648. package/dist/utils.d.ts +244 -0
  649. package/dist/utils.d.ts.map +1 -0
  650. package/dist/utils.js +617 -0
  651. package/dist/utils.js.map +1 -0
  652. package/dist/utils.test.cjs +492 -0
  653. package/dist/utils.test.cjs.map +1 -0
  654. package/dist/utils.test.js +491 -0
  655. package/dist/utils.test.js.map +1 -0
  656. package/dist/vad.cjs +211 -0
  657. package/dist/vad.cjs.map +1 -0
  658. package/dist/vad.d.cts +105 -0
  659. package/dist/vad.d.ts +105 -0
  660. package/dist/vad.d.ts.map +1 -0
  661. package/dist/vad.js +185 -0
  662. package/dist/vad.js.map +1 -0
  663. package/dist/version.cjs +29 -0
  664. package/dist/version.cjs.map +1 -0
  665. package/dist/version.d.cts +2 -0
  666. package/dist/version.d.ts +2 -0
  667. package/dist/version.d.ts.map +1 -0
  668. package/dist/version.js +5 -0
  669. package/dist/version.js.map +1 -0
  670. package/dist/voice/agent.cjs +308 -0
  671. package/dist/voice/agent.cjs.map +1 -0
  672. package/dist/voice/agent.d.cts +83 -0
  673. package/dist/voice/agent.d.ts +83 -0
  674. package/dist/voice/agent.d.ts.map +1 -0
  675. package/dist/voice/agent.js +287 -0
  676. package/dist/voice/agent.js.map +1 -0
  677. package/dist/voice/agent.test.cjs +61 -0
  678. package/dist/voice/agent.test.cjs.map +1 -0
  679. package/dist/voice/agent.test.js +60 -0
  680. package/dist/voice/agent.test.js.map +1 -0
  681. package/dist/voice/agent_activity.cjs +1784 -0
  682. package/dist/voice/agent_activity.cjs.map +1 -0
  683. package/dist/voice/agent_activity.d.cts +116 -0
  684. package/dist/voice/agent_activity.d.ts +116 -0
  685. package/dist/voice/agent_activity.d.ts.map +1 -0
  686. package/dist/voice/agent_activity.js +1780 -0
  687. package/dist/voice/agent_activity.js.map +1 -0
  688. package/dist/voice/agent_session.cjs +592 -0
  689. package/dist/voice/agent_session.cjs.map +1 -0
  690. package/dist/voice/agent_session.d.cts +165 -0
  691. package/dist/voice/agent_session.d.ts +165 -0
  692. package/dist/voice/agent_session.d.ts.map +1 -0
  693. package/dist/voice/agent_session.js +582 -0
  694. package/dist/voice/agent_session.js.map +1 -0
  695. package/dist/voice/audio_recognition.cjs +668 -0
  696. package/dist/voice/audio_recognition.cjs.map +1 -0
  697. package/dist/voice/audio_recognition.d.cts +127 -0
  698. package/dist/voice/audio_recognition.d.ts +127 -0
  699. package/dist/voice/audio_recognition.d.ts.map +1 -0
  700. package/dist/voice/audio_recognition.js +647 -0
  701. package/dist/voice/audio_recognition.js.map +1 -0
  702. package/dist/voice/avatar/datastream_io.cjs +204 -0
  703. package/dist/voice/avatar/datastream_io.cjs.map +1 -0
  704. package/dist/voice/avatar/datastream_io.d.cts +37 -0
  705. package/dist/voice/avatar/datastream_io.d.ts +37 -0
  706. package/dist/voice/avatar/datastream_io.d.ts.map +1 -0
  707. package/dist/voice/avatar/datastream_io.js +188 -0
  708. package/dist/voice/avatar/datastream_io.js.map +1 -0
  709. package/dist/voice/avatar/index.cjs +23 -0
  710. package/dist/voice/avatar/index.cjs.map +1 -0
  711. package/dist/voice/avatar/index.d.cts +2 -0
  712. package/dist/voice/avatar/index.d.ts +2 -0
  713. package/dist/voice/avatar/index.d.ts.map +1 -0
  714. package/dist/voice/avatar/index.js +2 -0
  715. package/dist/voice/avatar/index.js.map +1 -0
  716. package/dist/voice/background_audio.cjs +366 -0
  717. package/dist/voice/background_audio.cjs.map +1 -0
  718. package/dist/voice/background_audio.d.cts +121 -0
  719. package/dist/voice/background_audio.d.ts +121 -0
  720. package/dist/voice/background_audio.d.ts.map +1 -0
  721. package/dist/voice/background_audio.js +342 -0
  722. package/dist/voice/background_audio.js.map +1 -0
  723. package/dist/voice/events.cjs +147 -0
  724. package/dist/voice/events.cjs.map +1 -0
  725. package/dist/voice/events.d.cts +127 -0
  726. package/dist/voice/events.d.ts +127 -0
  727. package/dist/voice/events.d.ts.map +1 -0
  728. package/dist/voice/events.js +112 -0
  729. package/dist/voice/events.js.map +1 -0
  730. package/dist/voice/generation.cjs +747 -0
  731. package/dist/voice/generation.cjs.map +1 -0
  732. package/dist/voice/generation.d.cts +116 -0
  733. package/dist/voice/generation.d.ts +116 -0
  734. package/dist/voice/generation.d.ts.map +1 -0
  735. package/dist/voice/generation.js +719 -0
  736. package/dist/voice/generation.js.map +1 -0
  737. package/dist/voice/generation_tools.test.cjs +236 -0
  738. package/dist/voice/generation_tools.test.cjs.map +1 -0
  739. package/dist/voice/generation_tools.test.js +235 -0
  740. package/dist/voice/generation_tools.test.js.map +1 -0
  741. package/dist/voice/index.cjs +49 -0
  742. package/dist/voice/index.cjs.map +1 -0
  743. package/dist/voice/index.d.cts +10 -0
  744. package/dist/voice/index.d.ts +10 -0
  745. package/dist/voice/index.d.ts.map +1 -0
  746. package/dist/voice/index.js +16 -0
  747. package/dist/voice/index.js.map +1 -0
  748. package/dist/voice/interruption_detection.test.cjs +114 -0
  749. package/dist/voice/interruption_detection.test.cjs.map +1 -0
  750. package/dist/voice/interruption_detection.test.js +113 -0
  751. package/dist/voice/interruption_detection.test.js.map +1 -0
  752. package/dist/voice/io.cjs +270 -0
  753. package/dist/voice/io.cjs.map +1 -0
  754. package/dist/voice/io.d.cts +126 -0
  755. package/dist/voice/io.d.ts +126 -0
  756. package/dist/voice/io.d.ts.map +1 -0
  757. package/dist/voice/io.js +242 -0
  758. package/dist/voice/io.js.map +1 -0
  759. package/dist/voice/recorder_io/index.cjs +23 -0
  760. package/dist/voice/recorder_io/index.cjs.map +1 -0
  761. package/dist/voice/recorder_io/index.d.cts +2 -0
  762. package/dist/voice/recorder_io/index.d.ts +2 -0
  763. package/dist/voice/recorder_io/index.d.ts.map +1 -0
  764. package/dist/voice/recorder_io/index.js +2 -0
  765. package/dist/voice/recorder_io/index.js.map +1 -0
  766. package/dist/voice/recorder_io/recorder_io.cjs +542 -0
  767. package/dist/voice/recorder_io/recorder_io.cjs.map +1 -0
  768. package/dist/voice/recorder_io/recorder_io.d.cts +100 -0
  769. package/dist/voice/recorder_io/recorder_io.d.ts +100 -0
  770. package/dist/voice/recorder_io/recorder_io.d.ts.map +1 -0
  771. package/dist/voice/recorder_io/recorder_io.js +508 -0
  772. package/dist/voice/recorder_io/recorder_io.js.map +1 -0
  773. package/dist/voice/report.cjs +75 -0
  774. package/dist/voice/report.cjs.map +1 -0
  775. package/dist/voice/report.d.cts +42 -0
  776. package/dist/voice/report.d.ts +42 -0
  777. package/dist/voice/report.d.ts.map +1 -0
  778. package/dist/voice/report.js +50 -0
  779. package/dist/voice/report.js.map +1 -0
  780. package/dist/voice/room_io/_input.cjs +133 -0
  781. package/dist/voice/room_io/_input.cjs.map +1 -0
  782. package/dist/voice/room_io/_input.d.cts +24 -0
  783. package/dist/voice/room_io/_input.d.ts +24 -0
  784. package/dist/voice/room_io/_input.d.ts.map +1 -0
  785. package/dist/voice/room_io/_input.js +114 -0
  786. package/dist/voice/room_io/_input.js.map +1 -0
  787. package/dist/voice/room_io/_output.cjs +359 -0
  788. package/dist/voice/room_io/_output.cjs.map +1 -0
  789. package/dist/voice/room_io/_output.d.cts +77 -0
  790. package/dist/voice/room_io/_output.d.ts +77 -0
  791. package/dist/voice/room_io/_output.d.ts.map +1 -0
  792. package/dist/voice/room_io/_output.js +343 -0
  793. package/dist/voice/room_io/_output.js.map +1 -0
  794. package/dist/voice/room_io/index.cjs +25 -0
  795. package/dist/voice/room_io/index.cjs.map +1 -0
  796. package/dist/voice/room_io/index.d.cts +3 -0
  797. package/dist/voice/room_io/index.d.ts +3 -0
  798. package/dist/voice/room_io/index.d.ts.map +1 -0
  799. package/dist/voice/room_io/index.js +3 -0
  800. package/dist/voice/room_io/index.js.map +1 -0
  801. package/dist/voice/room_io/room_io.cjs +373 -0
  802. package/dist/voice/room_io/room_io.cjs.map +1 -0
  803. package/dist/voice/room_io/room_io.d.cts +94 -0
  804. package/dist/voice/room_io/room_io.d.ts +94 -0
  805. package/dist/voice/room_io/room_io.d.ts.map +1 -0
  806. package/dist/voice/room_io/room_io.js +364 -0
  807. package/dist/voice/room_io/room_io.js.map +1 -0
  808. package/dist/voice/run_context.cjs +51 -0
  809. package/dist/voice/run_context.cjs.map +1 -0
  810. package/dist/voice/run_context.d.cts +22 -0
  811. package/dist/voice/run_context.d.ts +22 -0
  812. package/dist/voice/run_context.d.ts.map +1 -0
  813. package/dist/voice/run_context.js +27 -0
  814. package/dist/voice/run_context.js.map +1 -0
  815. package/dist/voice/speech_handle.cjs +228 -0
  816. package/dist/voice/speech_handle.cjs.map +1 -0
  817. package/dist/voice/speech_handle.d.cts +97 -0
  818. package/dist/voice/speech_handle.d.ts +97 -0
  819. package/dist/voice/speech_handle.d.ts.map +1 -0
  820. package/dist/voice/speech_handle.js +204 -0
  821. package/dist/voice/speech_handle.js.map +1 -0
  822. package/dist/voice/transcription/_utils.cjs +45 -0
  823. package/dist/voice/transcription/_utils.cjs.map +1 -0
  824. package/dist/voice/transcription/_utils.d.cts +3 -0
  825. package/dist/voice/transcription/_utils.d.ts +3 -0
  826. package/dist/voice/transcription/_utils.d.ts.map +1 -0
  827. package/dist/voice/transcription/_utils.js +21 -0
  828. package/dist/voice/transcription/_utils.js.map +1 -0
  829. package/dist/voice/transcription/index.cjs +23 -0
  830. package/dist/voice/transcription/index.cjs.map +1 -0
  831. package/dist/voice/transcription/index.d.cts +2 -0
  832. package/dist/voice/transcription/index.d.ts +2 -0
  833. package/dist/voice/transcription/index.d.ts.map +1 -0
  834. package/dist/voice/transcription/index.js +2 -0
  835. package/dist/voice/transcription/index.js.map +1 -0
  836. package/dist/voice/transcription/synchronizer.cjs +379 -0
  837. package/dist/voice/transcription/synchronizer.cjs.map +1 -0
  838. package/dist/voice/transcription/synchronizer.d.cts +87 -0
  839. package/dist/voice/transcription/synchronizer.d.ts +87 -0
  840. package/dist/voice/transcription/synchronizer.d.ts.map +1 -0
  841. package/dist/voice/transcription/synchronizer.js +354 -0
  842. package/dist/voice/transcription/synchronizer.js.map +1 -0
  843. package/dist/worker.cjs +680 -0
  844. package/dist/worker.cjs.map +1 -0
  845. package/dist/worker.d.cts +119 -0
  846. package/dist/worker.d.ts +119 -0
  847. package/dist/worker.d.ts.map +1 -0
  848. package/dist/worker.js +645 -0
  849. package/dist/worker.js.map +1 -0
  850. package/package.json +86 -0
  851. package/resources/NOTICE +2 -0
  852. package/resources/keyboard-typing.ogg +0 -0
  853. package/resources/keyboard-typing2.ogg +0 -0
  854. package/resources/office-ambience.ogg +0 -0
  855. package/src/_exceptions.ts +137 -0
  856. package/src/audio.ts +205 -0
  857. package/src/cli.ts +224 -0
  858. package/src/connection_pool.test.ts +346 -0
  859. package/src/connection_pool.ts +307 -0
  860. package/src/constants.ts +9 -0
  861. package/src/generator.ts +38 -0
  862. package/src/http_server.ts +64 -0
  863. package/src/index.ts +41 -0
  864. package/src/inference/api_protos.ts +82 -0
  865. package/src/inference/index.ts +32 -0
  866. package/src/inference/interruption/AdaptiveInterruptionDetector.ts +166 -0
  867. package/src/inference/interruption/InterruptionStream.ts +397 -0
  868. package/src/inference/interruption/defaults.ts +33 -0
  869. package/src/inference/interruption/errors.ts +0 -0
  870. package/src/inference/interruption/http_transport.ts +61 -0
  871. package/src/inference/interruption/index.ts +4 -0
  872. package/src/inference/interruption/interruption.ts +88 -0
  873. package/src/inference/llm.ts +532 -0
  874. package/src/inference/stt.ts +524 -0
  875. package/src/inference/tts.ts +574 -0
  876. package/src/inference/utils.test.ts +31 -0
  877. package/src/inference/utils.ts +81 -0
  878. package/src/inference_runner.ts +19 -0
  879. package/src/ipc/index.ts +5 -0
  880. package/src/ipc/inference_executor.ts +7 -0
  881. package/src/ipc/inference_proc_executor.ts +101 -0
  882. package/src/ipc/inference_proc_lazy_main.ts +115 -0
  883. package/src/ipc/job_executor.ts +23 -0
  884. package/src/ipc/job_proc_executor.ts +122 -0
  885. package/src/ipc/job_proc_lazy_main.ts +247 -0
  886. package/src/ipc/message.ts +52 -0
  887. package/src/ipc/proc_pool.ts +164 -0
  888. package/src/ipc/supervised_proc.test.ts +153 -0
  889. package/src/ipc/supervised_proc.ts +242 -0
  890. package/src/job.ts +461 -0
  891. package/src/llm/__snapshots__/chat_context.test.ts.snap +527 -0
  892. package/src/llm/__snapshots__/tool_context.test.ts.snap +177 -0
  893. package/src/llm/__snapshots__/zod-utils.test.ts.snap +559 -0
  894. package/src/llm/chat_context.test.ts +1057 -0
  895. package/src/llm/chat_context.ts +759 -0
  896. package/src/llm/fallback_adapter.test.ts +238 -0
  897. package/src/llm/fallback_adapter.ts +391 -0
  898. package/src/llm/index.ts +74 -0
  899. package/src/llm/llm.ts +303 -0
  900. package/src/llm/provider_format/google.test.ts +843 -0
  901. package/src/llm/provider_format/google.ts +134 -0
  902. package/src/llm/provider_format/index.ts +23 -0
  903. package/src/llm/provider_format/openai.test.ts +675 -0
  904. package/src/llm/provider_format/openai.ts +146 -0
  905. package/src/llm/provider_format/utils.ts +187 -0
  906. package/src/llm/realtime.ts +163 -0
  907. package/src/llm/remote_chat_context.test.ts +290 -0
  908. package/src/llm/remote_chat_context.ts +114 -0
  909. package/src/llm/tool_context.test.ts +407 -0
  910. package/src/llm/tool_context.ts +343 -0
  911. package/src/llm/tool_context.type.test.ts +115 -0
  912. package/src/llm/utils.test.ts +670 -0
  913. package/src/llm/utils.ts +336 -0
  914. package/src/llm/zod-utils.test.ts +577 -0
  915. package/src/llm/zod-utils.ts +153 -0
  916. package/src/log.ts +83 -0
  917. package/src/metrics/base.ts +168 -0
  918. package/src/metrics/index.ts +15 -0
  919. package/src/metrics/usage_collector.ts +46 -0
  920. package/src/metrics/utils.ts +64 -0
  921. package/src/plugin.ts +46 -0
  922. package/src/stream/deferred_stream.test.ts +755 -0
  923. package/src/stream/deferred_stream.ts +127 -0
  924. package/src/stream/identity_transform.test.ts +179 -0
  925. package/src/stream/identity_transform.ts +18 -0
  926. package/src/stream/index.ts +7 -0
  927. package/src/stream/merge_readable_streams.ts +40 -0
  928. package/src/stream/stream_channel.test.ts +166 -0
  929. package/src/stream/stream_channel.ts +44 -0
  930. package/src/stt/index.ts +15 -0
  931. package/src/stt/stream_adapter.ts +107 -0
  932. package/src/stt/stt.ts +374 -0
  933. package/src/telemetry/index.ts +28 -0
  934. package/src/telemetry/logging.ts +55 -0
  935. package/src/telemetry/otel_http_exporter.ts +195 -0
  936. package/src/telemetry/pino_otel_transport.ts +265 -0
  937. package/src/telemetry/trace_types.ts +95 -0
  938. package/src/telemetry/traces.ts +612 -0
  939. package/src/telemetry/utils.ts +61 -0
  940. package/src/tokenize/basic/basic.ts +83 -0
  941. package/src/tokenize/basic/hyphenator.ts +434 -0
  942. package/src/tokenize/basic/index.ts +11 -0
  943. package/src/tokenize/basic/paragraph.ts +43 -0
  944. package/src/tokenize/basic/sentence.ts +89 -0
  945. package/src/tokenize/basic/word.ts +27 -0
  946. package/src/tokenize/index.ts +16 -0
  947. package/src/tokenize/token_stream.ts +180 -0
  948. package/src/tokenize/tokenizer.test.ts +255 -0
  949. package/src/tokenize/tokenizer.ts +152 -0
  950. package/src/transcription.ts +307 -0
  951. package/src/tts/index.ts +12 -0
  952. package/src/tts/stream_adapter.ts +110 -0
  953. package/src/tts/tts.ts +598 -0
  954. package/src/types.ts +66 -0
  955. package/src/utils/ws_transport.test.ts +282 -0
  956. package/src/utils/ws_transport.ts +22 -0
  957. package/src/utils.test.ts +651 -0
  958. package/src/utils.ts +871 -0
  959. package/src/vad.ts +262 -0
  960. package/src/version.ts +5 -0
  961. package/src/voice/agent.test.ts +80 -0
  962. package/src/voice/agent.ts +418 -0
  963. package/src/voice/agent_activity.ts +2375 -0
  964. package/src/voice/agent_session.ts +866 -0
  965. package/src/voice/audio_recognition.ts +877 -0
  966. package/src/voice/avatar/datastream_io.ts +247 -0
  967. package/src/voice/avatar/index.ts +4 -0
  968. package/src/voice/background_audio.ts +491 -0
  969. package/src/voice/events.ts +261 -0
  970. package/src/voice/generation.ts +946 -0
  971. package/src/voice/generation_tools.test.ts +268 -0
  972. package/src/voice/index.ts +12 -0
  973. package/src/voice/interruption_detection.test.ts +151 -0
  974. package/src/voice/io.ts +347 -0
  975. package/src/voice/recorder_io/index.ts +4 -0
  976. package/src/voice/recorder_io/recorder_io.ts +690 -0
  977. package/src/voice/report.ts +100 -0
  978. package/src/voice/room_io/_input.ts +162 -0
  979. package/src/voice/room_io/_output.ts +439 -0
  980. package/src/voice/room_io/index.ts +5 -0
  981. package/src/voice/room_io/room_io.ts +518 -0
  982. package/src/voice/run_context.ts +34 -0
  983. package/src/voice/speech_handle.ts +250 -0
  984. package/src/voice/transcription/_utils.ts +25 -0
  985. package/src/voice/transcription/index.ts +4 -0
  986. package/src/voice/transcription/synchronizer.ts +477 -0
  987. package/src/worker.ts +798 -0
@@ -0,0 +1,866 @@
1
+ // SPDX-FileCopyrightText: 2024 LiveKit, Inc.
2
+ //
3
+ // SPDX-License-Identifier: Apache-2.0
4
+ import type { AudioFrame, Room } from '@livekit/rtc-node';
5
+ import type { TypedEventEmitter as TypedEmitter } from '@livekit/typed-emitter';
6
+ import type { Context, Span } from '@opentelemetry/api';
7
+ import { ROOT_CONTEXT, context as otelContext, trace } from '@opentelemetry/api';
8
+ import { EventEmitter } from 'node:events';
9
+ import type { ReadableStream } from 'node:stream/web';
10
+ import {
11
+ LLM as InferenceLLM,
12
+ STT as InferenceSTT,
13
+ TTS as InferenceTTS,
14
+ type LLMModels,
15
+ type STTModelString,
16
+ type TTSModelString,
17
+ } from '../inference/index.js';
18
+ import type { AdaptiveInterruptionDetector } from '../inference/interruption/AdaptiveInterruptionDetector.js';
19
+ import { type JobContext, getJobContext } from '../job.js';
20
+ import type { FunctionCall, FunctionCallOutput } from '../llm/chat_context.js';
21
+ import { AgentHandoffItem, ChatContext, ChatMessage } from '../llm/chat_context.js';
22
+ import type { LLM, RealtimeModel, RealtimeModelError, ToolChoice } from '../llm/index.js';
23
+ import type { LLMError } from '../llm/llm.js';
24
+ import { log } from '../log.js';
25
+ import type { STT } from '../stt/index.js';
26
+ import type { STTError } from '../stt/stt.js';
27
+ import { traceTypes, tracer } from '../telemetry/index.js';
28
+ import type { TTS, TTSError } from '../tts/tts.js';
29
+ import {
30
+ DEFAULT_API_CONNECT_OPTIONS,
31
+ DEFAULT_SESSION_CONNECT_OPTIONS,
32
+ type ResolvedSessionConnectOptions,
33
+ type SessionConnectOptions,
34
+ } from '../types.js';
35
+ import type { VAD } from '../vad.js';
36
+ import type { Agent } from './agent.js';
37
+ import { AgentActivity } from './agent_activity.js';
38
+ import type { _TurnDetector } from './audio_recognition.js';
39
+ import {
40
+ type AgentEvent,
41
+ AgentSessionEventTypes,
42
+ type AgentState,
43
+ type AgentStateChangedEvent,
44
+ type CloseEvent,
45
+ CloseReason,
46
+ type ConversationItemAddedEvent,
47
+ type ErrorEvent,
48
+ type FunctionToolsExecutedEvent,
49
+ type MetricsCollectedEvent,
50
+ type ShutdownReason,
51
+ type SpeechCreatedEvent,
52
+ type UserInputTranscribedEvent,
53
+ type UserState,
54
+ type UserStateChangedEvent,
55
+ createAgentStateChangedEvent,
56
+ createCloseEvent,
57
+ createConversationItemAddedEvent,
58
+ createUserStateChangedEvent,
59
+ } from './events.js';
60
+ import { AgentInput, AgentOutput } from './io.js';
61
+ import { RecorderIO } from './recorder_io/index.js';
62
+ import { RoomIO, type RoomInputOptions, type RoomOutputOptions } from './room_io/index.js';
63
+ import type { UnknownUserData } from './run_context.js';
64
+ import type { SpeechHandle } from './speech_handle.js';
65
+
66
/**
 * Tunable behavior of a voice session.
 *
 * `AgentSession` overlays the caller's partial overrides on `defaultVoiceOptions` to
 * obtain the effective values exposed as `session.options`.
 *
 * NOTE(review): units are not stated in this declaration; confirm them against the code
 * that consumes each duration before relying on them.
 */
export interface VoiceOptions {
  allowInterruptions: boolean;
  discardAudioIfUninterruptible: boolean;
  minInterruptionDuration: number;
  minInterruptionWords: number;
  minEndpointingDelay: number;
  maxEndpointingDelay: number;
  maxToolSteps: number;
  preemptiveGeneration: boolean;
  /** Optional; may also be explicitly `null`. */
  userAwayTimeout?: number | null;
}
77
+
78
/**
 * Baseline `VoiceOptions`.
 *
 * The `AgentSession` constructor spreads caller overrides on top of this object, so any
 * key the caller omits keeps the value listed here.
 */
const defaultVoiceOptions: VoiceOptions = {
  allowInterruptions: true,
  discardAudioIfUninterruptible: true,
  minInterruptionDuration: 500,
  minInterruptionWords: 0,
  minEndpointingDelay: 500,
  maxEndpointingDelay: 6000,
  maxToolSteps: 3,
  preemptiveGeneration: false,
  // NOTE(review): 15.0 next to 500/6000 suggests a different unit than the other
  // durations (seconds vs. milliseconds?) — confirm against the consumer.
  userAwayTimeout: 15.0,
} as const;
89
+
90
/**
 * Turn-detection setting accepted by `AgentSession`: one of the built-in mode names, or a
 * `_TurnDetector` value.
 */
export type TurnDetectionMode =
  | 'stt'
  | 'vad'
  | 'realtime_llm'
  | 'manual'
  | _TurnDetector;
91
+
92
/**
 * Listener signatures keyed by `AgentSessionEventTypes` member.
 *
 * This map parameterizes the typed emitter that `AgentSession` extends, so `on` / `emit`
 * are checked against the payload type of each event.
 */
export type AgentSessionCallbacks = {
  [AgentSessionEventTypes.UserInputTranscribed]: (ev: UserInputTranscribedEvent) => void;
  [AgentSessionEventTypes.AgentStateChanged]: (ev: AgentStateChangedEvent) => void;
  [AgentSessionEventTypes.UserStateChanged]: (ev: UserStateChangedEvent) => void;
  [AgentSessionEventTypes.ConversationItemAdded]: (ev: ConversationItemAddedEvent) => void;
  [AgentSessionEventTypes.FunctionToolsExecuted]: (ev: FunctionToolsExecutedEvent) => void;
  [AgentSessionEventTypes.MetricsCollected]: (ev: MetricsCollectedEvent) => void;
  [AgentSessionEventTypes.SpeechCreated]: (ev: SpeechCreatedEvent) => void;
  [AgentSessionEventTypes.Error]: (ev: ErrorEvent) => void;
  [AgentSessionEventTypes.Close]: (ev: CloseEvent) => void;
};
103
+
104
/**
 * Constructor options for `AgentSession`. Every field is optional.
 */
export type AgentSessionOptions<UserData = UnknownUserData> = {
  turnDetection?: TurnDetectionMode;
  /** An STT instance, or a model string resolved through `InferenceSTT.fromModelString`. */
  stt?: STT | STTModelString;
  vad?: VAD;
  /** An LLM / realtime model instance, or a model string resolved through `InferenceLLM.fromModelString`. */
  llm?: LLM | RealtimeModel | LLMModels;
  /** A TTS instance, or a model string resolved through `InferenceTTS.fromModelString`. */
  tts?: TTS | TTSModelString;
  interruptionDetector?: AdaptiveInterruptionDetector;
  /** Initial value for `session.userData`; reading that getter throws while it is undefined. */
  userData?: UserData;
  /** Partial overrides spread on top of `defaultVoiceOptions`. */
  voiceOptions?: Partial<VoiceOptions>;
  /** Partial connection settings merged with the default connect options. */
  connOptions?: SessionConnectOptions;
};
115
+
116
+ export class AgentSession<
117
+ UserData = UnknownUserData,
118
+ > extends (EventEmitter as new () => TypedEmitter<AgentSessionCallbacks>) {
119
// Pipeline components. The constructor stores instances as given and resolves
// model strings (stt / llm / tts) into inference-backed instances.
vad?: VAD;
stt?: STT;
llm?: LLM | RealtimeModel;
tts?: TTS;
turnDetection?: TurnDetectionMode;

/** Effective voice options: `defaultVoiceOptions` overlaid with the caller's overrides. */
readonly options: VoiceOptions;

private agent?: Agent;
private activity?: AgentActivity;
private nextActivity?: AgentActivity;
/** Flipped to `true` at the end of `_startImpl`; `start()` is a no-op once set. */
private started = false;
private userState: UserState = 'listening';

/** Room-backed IO created in `_startImpl`. */
private roomIO?: RoomIO;
private logger = log();

/** Session-wide chat context, exposed through the `history` getter. */
private _chatCtx: ChatContext;
private _userData: UserData | undefined;
private _agentState: AgentState = 'initializing';

private _input: AgentInput;
private _output: AgentOutput;

private closingTask: Promise<void> | null = null;
private userAwayTimer: NodeJS.Timeout | null = null;

// Connection options for STT, LLM, and TTS
private _connOptions: ResolvedSessionConnectOptions;

// Unrecoverable error counts, reset after agent speaking
private llmErrorCounts = 0;
private ttsErrorCounts = 0;

/** Span opened by `start()` under the name 'agent_session'. */
private sessionSpan?: Span;
private userSpeakingSpan?: Span;
private agentSpeakingSpan?: Span;

/** @internal */
_recorderIO?: RecorderIO;

/** @internal */
rootSpanContext?: Context;

/** @internal - Every payload passed through `emit`, in emission order. */
_recordedEvents: AgentEvent[] = [];

/** @internal */
_enableRecording = false;

/** @internal - Timestamp when the session started (milliseconds) */
_startedAt?: number;

interruptionDetector?: AdaptiveInterruptionDetector;
173
+
174
/**
 * Builds a session from the supplied components and options.
 *
 * String values for `stt`, `llm` and `tts` are turned into inference-backed instances via
 * the matching `fromModelString` factory; any other value is stored unchanged.
 *
 * @param opts - Components, user data, voice options and connection options.
 */
constructor(opts: AgentSessionOptions<UserData>) {
  super();

  // Caller-supplied connection settings win over the defaults, key by key.
  const conn = opts.connOptions;
  this._connOptions = {
    sttConnOptions: { ...DEFAULT_API_CONNECT_OPTIONS, ...conn?.sttConnOptions },
    llmConnOptions: { ...DEFAULT_API_CONNECT_OPTIONS, ...conn?.llmConnOptions },
    ttsConnOptions: { ...DEFAULT_API_CONNECT_OPTIONS, ...conn?.ttsConnOptions },
    maxUnrecoverableErrors:
      conn?.maxUnrecoverableErrors ?? DEFAULT_SESSION_CONNECT_OPTIONS.maxUnrecoverableErrors,
  };

  this.vad = opts.vad;
  this.stt = typeof opts.stt === 'string' ? InferenceSTT.fromModelString(opts.stt) : opts.stt;
  this.llm = typeof opts.llm === 'string' ? InferenceLLM.fromModelString(opts.llm) : opts.llm;
  this.tts = typeof opts.tts === 'string' ? InferenceTTS.fromModelString(opts.tts) : opts.tts;

  this.turnDetection = opts.turnDetection;
  this.interruptionDetector = opts.interruptionDetector;
  this._userData = opts.userData;

  // Swappable IO endpoints; the session is told whenever one of them is replaced.
  this._input = new AgentInput(this.onAudioInputChanged);
  this._output = new AgentOutput(this.onAudioOutputChanged, this.onTextOutputChanged);

  // Session-wide conversation history starts out empty.
  this._chatCtx = ChatContext.empty();
  // Spreading `undefined` is a no-op, so omitted overrides leave the defaults intact.
  this.options = { ...defaultVoiceOptions, ...opts.voiceOptions };

  // Bind once so the same function reference is the registered listener.
  this._onUserInputTranscribed = this._onUserInputTranscribed.bind(this);
  this.on(AgentSessionEventTypes.UserInputTranscribed, this._onUserInputTranscribed);
}
234
+
235
/**
 * Emits `event`, first appending its payload (the first argument) to `_recordedEvents`.
 *
 * @returns Whatever the underlying emitter's `emit` returns.
 */
emit<K extends keyof AgentSessionCallbacks>(
  event: K,
  ...args: Parameters<AgentSessionCallbacks[K]>
): boolean {
  const [payload] = args;
  this._recordedEvents.push(payload as AgentEvent);
  return super.emit(event, ...args);
}
243
+
244
/** Input side of the session's IO. */
get input(): AgentInput {
  return this._input;
}

/** Output side of the session's IO. */
get output(): AgentOutput {
  return this._output;
}

/**
 * User data attached to this session.
 *
 * @throws Error when no user data has been provided yet.
 */
get userData(): UserData {
  const data = this._userData;
  if (data === undefined) {
    throw new Error('Voice agent userData is not set');
  }

  return data;
}

set userData(value: UserData) {
  this._userData = value;
}

/** The session-wide chat context. */
get history(): ChatContext {
  return this._chatCtx;
}

/** Connection options for STT, LLM, and TTS. */
get connOptions(): ResolvedSessionConnectOptions {
  return this._connOptions;
}
272
+
273
/**
 * Performs the actual session startup on behalf of `start()`.
 *
 * Steps, in order: tag the span with the agent id, create and start the `RoomIO`,
 * look up the job context (optional), auto-connect the room and wire up recording
 * when applicable, start the agent activity, then mark the session as started.
 *
 * Startup tasks (room connect, recorder start, activity update) run concurrently and
 * are awaited with `Promise.allSettled`, so a failing task does not abort startup;
 * each failure is logged instead of being dropped silently.
 *
 * @throws Error when recording is enabled and the job context already has a primary
 *   `AgentSession`.
 */
private async _startImpl({
  agent,
  room,
  inputOptions,
  outputOptions,
  span,
}: {
  agent: Agent;
  room: Room;
  inputOptions?: Partial<RoomInputOptions>;
  outputOptions?: Partial<RoomOutputOptions>;
  span: Span;
}): Promise<void> {
  span.setAttribute(traceTypes.ATTR_AGENT_LABEL, agent.id);

  this.agent = agent;
  this._updateAgentState('initializing');

  const tasks: Promise<void>[] = [];
  // Check for existing input/output configuration and warn if needed
  if (this.input.audio && inputOptions?.audioEnabled !== false) {
    this.logger.warn('RoomIO audio input is enabled but input.audio is already set, ignoring..');
  }

  if (this.output.audio && outputOptions?.audioEnabled !== false) {
    this.logger.warn(
      'RoomIO audio output is enabled but output.audio is already set, ignoring..',
    );
  }

  if (this.output.transcription && outputOptions?.transcriptionEnabled !== false) {
    this.logger.warn(
      'RoomIO transcription output is enabled but output.transcription is already set, ignoring..',
    );
  }

  this.roomIO = new RoomIO({
    agentSession: this,
    room,
    inputOptions,
    outputOptions,
  });
  this.roomIO.start();

  let ctx: JobContext | undefined;
  try {
    ctx = getJobContext();
  } catch {
    // JobContext is not available in evals
    this.logger.warn('JobContext is not available');
  }

  if (ctx) {
    if (ctx.room === room && !room.isConnected) {
      this.logger.debug('Auto-connecting to room via job context');
      tasks.push(ctx.connect());
    }

    if (ctx._primaryAgentSession === undefined) {
      ctx._primaryAgentSession = this;
    } else if (this._enableRecording) {
      throw new Error(
        'Only one `AgentSession` can be the primary at a time. If you want to ignore primary designation, use `session.start({ record: false })`.',
      );
    }

    if (this.input.audio && this.output.audio && this._enableRecording) {
      // Route both audio directions through the recorder so it can capture them.
      this._recorderIO = new RecorderIO({ agentSession: this });
      this.input.audio = this._recorderIO.recordInput(this.input.audio);
      this.output.audio = this._recorderIO.recordOutput(this.output.audio);

      // Start recording to session directory
      const sessionDir = ctx.sessionDirectory;
      if (sessionDir) {
        tasks.push(this._recorderIO.start(`${sessionDir}/audio.ogg`));
      }
    }
  }

  // TODO(AJS-265): add shutdown callback to job context
  tasks.push(this.updateActivity(this.agent));

  // allSettled never rejects; surface individual failures so they are not lost.
  const outcomes = await Promise.allSettled(tasks);
  for (const outcome of outcomes) {
    if (outcome.status === 'rejected') {
      this.logger.error(`AgentSession startup task failed: ${String(outcome.reason)}`);
    }
  }

  // Log used IO configuration
  this.logger.debug(
    `using audio io: ${this.input.audio ? '`' + this.input.audio.constructor.name + '`' : '(none)'} -> \`AgentSession\` -> ${this.output.audio ? '`' + this.output.audio.constructor.name + '`' : '(none)'}`,
  );

  this.logger.debug(
    `using transcript io: \`AgentSession\` -> ${this.output.transcription ? '`' + this.output.transcription.constructor.name + '`' : '(none)'}`,
  );

  this.started = true;
  this._startedAt = Date.now();
  this._updateAgentState('listening');
}
370
+
371
/**
 * Starts the session for `agent` in `room`. Does nothing if the session has already
 * been started.
 *
 * When a job context is available, `record` defaults to the job's `enableRecording`
 * flag and recording is initialized on the context if enabled. Without a job context
 * the recording flag is left untouched.
 *
 * @param agent - Agent to run.
 * @param room - Room passed to the `RoomIO` that backs the session.
 * @param inputOptions - Optional room input overrides.
 * @param outputOptions - Optional room output overrides.
 * @param record - Explicit recording switch; falls back to the job setting when omitted.
 */
async start({
  agent,
  room,
  inputOptions,
  outputOptions,
  record,
}: {
  agent: Agent;
  room: Room;
  inputOptions?: Partial<RoomInputOptions>;
  outputOptions?: Partial<RoomOutputOptions>;
  record?: boolean;
}): Promise<void> {
  if (this.started) {
    return;
  }

  // Keep the context lookup separate from the recording setup so that a recording
  // failure is not misreported as a missing JobContext.
  let ctx: JobContext | undefined;
  try {
    ctx = getJobContext();
  } catch {
    // JobContext is not available in evals
    this.logger.warn('JobContext is not available');
  }

  if (ctx) {
    try {
      this._enableRecording = record === undefined ? ctx.job.enableRecording : record;

      if (this._enableRecording) {
        ctx.initRecording();
      }
    } catch (error) {
      // Still best-effort: startup continues, but the log names the real cause.
      this.logger.warn(`Failed to initialize session recording: ${String(error)}`);
    }
  }

  this.sessionSpan = tracer.startSpan({
    name: 'agent_session',
    context: ROOT_CONTEXT,
  });

  this.rootSpanContext = trace.setSpan(ROOT_CONTEXT, this.sessionSpan);

  await this._startImpl({
    agent,
    room,
    inputOptions,
    outputOptions,
    span: this.sessionSpan,
  });
}
421
+
422
/**
 * Makes `agent` the session's agent.
 *
 * When the session is already started, the activity is switched over to the
 * new agent in the background. This method is synchronous and cannot surface
 * a failure to the caller, so a rejected switch is logged instead of being
 * left as an unhandled promise rejection.
 */
updateAgent(agent: Agent): void {
  this.agent = agent;

  if (!this.started) {
    return;
  }

  this.updateActivity(agent).catch((error) => {
    this.logger.error(error, 'Failed to update agent activity');
  });
}
429
+
430
/**
 * Forwards a "commit user turn" request to the current activity.
 *
 * @throws Error when there is no current activity.
 */
commitUserTurn() {
  const current = this.activity;
  if (!current) {
    throw new Error('AgentSession is not running');
  }

  current.commitUserTurn();
}
437
+
438
/**
 * Forwards a "clear user turn" request to the current activity.
 *
 * @throws Error when there is no current activity.
 */
clearUserTurn() {
  const current = this.activity;
  if (!current) {
    throw new Error('AgentSession is not running');
  }

  current.clearUserTurn();
}
444
+
445
/**
 * Asks the current activity to say `text`.
 *
 * @param text - Text (or a stream of text) passed through to the activity.
 * @param options - Passed through unchanged to the activity.
 * @returns The speech handle returned by the activity.
 * @throws Error when there is no current activity.
 */
say(
  text: string | ReadableStream<string>,
  options?: {
    audio?: ReadableStream<AudioFrame>;
    allowInterruptions?: boolean;
    addToChatCtx?: boolean;
  },
): SpeechHandle {
  if (!this.activity) {
    throw new Error('AgentSession is not running');
  }

  const speak = () => this.activity!.say(text, options);

  // Attach to the session span only when the caller has no active span of
  // its own and a session span context exists.
  const hasActiveSpan = Boolean(trace.getActiveSpan());
  if (hasActiveSpan || !this.rootSpanContext) {
    return speak();
  }

  return otelContext.with(this.rootSpanContext, speak);
}
469
+
470
/**
 * Interrupts the current activity and returns whatever its `interrupt()`
 * returns.
 *
 * @throws Error when there is no current activity.
 */
interrupt() {
  const current = this.activity;
  if (!current) {
    throw new Error('AgentSession is not running');
  }

  return current.interrupt();
}
476
+
477
/**
 * Requests a reply from the agent.
 *
 * A truthy `userInput` is wrapped in a `user` chat message and passed along
 * with the original options. If the current activity is draining, the request
 * goes to the pending next activity instead.
 *
 * @returns The speech handle returned by the chosen activity.
 * @throws Error when there is no current activity, or when the current
 *   activity is draining and no next activity exists.
 */
generateReply(options?: {
  userInput?: string;
  instructions?: string;
  toolChoice?: ToolChoice;
  allowInterruptions?: boolean;
}): SpeechHandle {
  if (!this.activity) {
    throw new Error('AgentSession is not running');
  }

  let userMessage: ChatMessage | undefined = undefined;
  if (options?.userInput) {
    userMessage = new ChatMessage({
      role: 'user',
      content: options.userInput,
    });
  }

  const dispatch = () => {
    const current = this.activity!;
    const upcoming = this.nextActivity;

    if (!current.draining) {
      return current.generateReply({ userMessage, ...options });
    }
    if (!upcoming) {
      throw new Error('AgentSession is closing, cannot use generateReply()');
    }
    return upcoming.generateReply({ userMessage, ...options });
  };

  // Attach to the session span only when called outside of any active span.
  const hasActiveSpan = Boolean(trace.getActiveSpan());
  if (hasActiveSpan || !this.rootSpanContext) {
    return dispatch();
  }

  return otelContext.with(this.rootSpanContext, dispatch);
}
514
+
515
/**
 * Replaces the current activity with a new one built for `agent`.
 *
 * Steps, in order: create the next activity, drain and close the current one
 * (if any), promote the next activity, record an agent handoff item in the
 * chat context, start the new activity, and attach the audio input stream if
 * one is configured. Everything runs inside the session span context when
 * that context exists.
 */
private async updateActivity(agent: Agent): Promise<void> {
  const swapActivity = async () => {
    // TODO(AJS-129): add lock to agent activity core lifecycle
    this.nextActivity = new AgentActivity(agent, this);

    const outgoing = this.activity;

    if (this.activity) {
      await this.activity.drain();
      await this.activity.close();
    }

    this.activity = this.nextActivity;
    this.nextActivity = undefined;

    const handoff = new AgentHandoffItem({
      oldAgentId: outgoing?.agent.id,
      newAgentId: agent.id,
    });
    this._chatCtx.insert(handoff);

    this.logger.debug(
      { previousAgentId: outgoing?.agent.id, newAgentId: agent.id },
      'Agent handoff inserted into chat context',
    );

    await this.activity.start();

    const audioInput = this._input.audio;
    if (audioInput) {
      this.activity.attachAudioInput(audioInput.stream);
    }
  };

  // Run within the session span context if available.
  const spanContext = this.rootSpanContext;
  return spanContext ? otelContext.with(spanContext, swapActivity) : swapActivity();
}
555
+
556
/** Returns a copy of the session chat context, not the internal instance. */
get chatCtx(): ChatContext {
  const snapshot = this._chatCtx.copy();
  return snapshot;
}
559
+
560
/** Current agent state as last set through `_updateAgentState`. */
get agentState(): AgentState {
  const current = this._agentState;
  return current;
}
563
+
564
/**
 * The agent currently assigned to this session.
 *
 * @throws Error when no agent has been set.
 */
get currentAgent(): Agent {
  const assigned = this.agent;
  if (assigned) {
    return assigned;
  }

  throw new Error('AgentSession is not running');
}
571
+
572
/** Closes the session with the `USER_INITIATED` reason and waits for completion. */
async close(): Promise<void> {
  const reason = CloseReason.USER_INITIATED;
  await this.closeImpl(reason);
}
575
+
576
/**
 * Requests a shutdown without waiting for it to complete.
 *
 * @param options.drain - Defaults to `true` when omitted.
 * @param options.reason - Defaults to `CloseReason.USER_INITIATED` when omitted.
 */
shutdown(options?: { drain?: boolean; reason?: ShutdownReason }): void {
  const settings = options ?? {};
  const drain = settings.drain === undefined ? true : settings.drain;
  const reason = settings.reason === undefined ? CloseReason.USER_INITIATED : settings.reason;

  this._closeSoon({ reason, drain });
}
584
+
585
/**
 * @internal
 *
 * Starts closing the session in the background unless a close is already in
 * progress.
 *
 * The in-flight close is stored in `closingTask` so that repeated calls (and
 * `_onError`) see that a close is under way instead of starting another one.
 * The task is cleared once the close settles, and a failed close is logged
 * rather than left as an unhandled promise rejection.
 *
 * @param reason - Reason passed on to the close logic.
 * @param drain - Passed on to the close logic; defaults to `false`.
 * @param error - Optional error passed on to the close logic; defaults to `null`.
 */
_closeSoon({
  reason,
  drain = false,
  error = null,
}: {
  reason: ShutdownReason;
  drain?: boolean;
  error?: RealtimeModelError | STTError | TTSError | LLMError | null;
}): void {
  if (this.closingTask) {
    return;
  }

  this.closingTask = this.closeImpl(reason, error, drain)
    .catch((closeError) => {
      this.logger.error(closeError, 'Failed to close AgentSession');
    })
    .then(() => {
      this.closingTask = null;
    });
}
600
+
601
/**
 * @internal
 *
 * Reacts to an error reported by a model component.
 *
 * Recoverable errors, and errors arriving while a close is already in
 * progress, are ignored. LLM and TTS errors are counted separately and
 * tolerated until the count exceeds `maxUnrecoverableErrors`. Any other error
 * type closes the session immediately with `CloseReason.ERROR`.
 *
 * `closingTask` is always cleared once the close settles, even when closing
 * fails, and a failed close is logged rather than left as an unhandled
 * promise rejection.
 */
_onError(error: RealtimeModelError | STTError | TTSError | LLMError): void {
  if (this.closingTask || error.recoverable) {
    return;
  }

  // Track error counts per type to implement max_unrecoverable_errors logic
  if (error.type === 'llm_error') {
    this.llmErrorCounts += 1;
    if (this.llmErrorCounts <= this._connOptions.maxUnrecoverableErrors) {
      return;
    }
  } else if (error.type === 'tts_error') {
    this.ttsErrorCounts += 1;
    if (this.ttsErrorCounts <= this._connOptions.maxUnrecoverableErrors) {
      return;
    }
  }

  this.logger.error(error, 'AgentSession is closing due to unrecoverable error');

  this.closingTask = this.closeImpl(CloseReason.ERROR, error)
    .catch((closeError) => {
      this.logger.error(closeError, 'Failed to close AgentSession after unrecoverable error');
    })
    .then(() => {
      this.closingTask = null;
    });
}
628
+
629
/**
 * @internal
 *
 * Stores `item` in the session chat context, then emits a
 * `ConversationItemAdded` event for it.
 */
_conversationItemAdded(item: ChatMessage): void {
  this._chatCtx.insert(item);

  const event = createConversationItemAddedEvent(item);
  this.emit(AgentSessionEventTypes.ConversationItemAdded, event);
}
634
+
635
/**
 * @internal
 *
 * Stores function calls and function call outputs in the session chat
 * context. No event is emitted here.
 */
_toolItemsAdded(items: (FunctionCall | FunctionCallOutput)[]): void {
  const chatCtx = this._chatCtx;
  chatCtx.insert(items);
}
639
+
640
/**
 * @internal
 *
 * Moves the agent to `state`; does nothing when the state is unchanged.
 *
 * Entering `speaking` resets the LLM/TTS error counters, opens the
 * `agent_speaking` span if none is open, and notifies the activity that
 * speech started. Entering any other state ends an open `agent_speaking`
 * span, and notifies the activity that speech ended when the previous state
 * was `speaking`. Afterwards the user-away timer is armed only when both
 * agent and user are `listening` (otherwise cancelled), and an
 * `AgentStateChanged` event is emitted.
 */
_updateAgentState(state: AgentState) {
  const previous = this._agentState;
  if (previous === state) {
    return;
  }

  if (state === 'speaking') {
    // Reset error counts when agent starts speaking
    this.llmErrorCounts = 0;
    this.ttsErrorCounts = 0;

    if (this.agentSpeakingSpan === undefined) {
      this.agentSpeakingSpan = tracer.startSpan({
        name: 'agent_speaking',
        context: this.rootSpanContext,
      });

      // TODO(brian): PR4 - Set participant attributes if roomIO.room.localParticipant is available
      // (Ref: Python agent_session.py line 1161-1164)
    }

    // Notify AudioRecognition that agent started speaking (for interruption detection)
    this.activity?.notifyAgentSpeechStarted();
  } else {
    // Any non-speaking target state closes a still-open speaking span.
    if (this.agentSpeakingSpan !== undefined) {
      // TODO(brian): PR4 - Set ATTR_END_TIME attribute if available
      this.agentSpeakingSpan.end();
      this.agentSpeakingSpan = undefined;
    }

    if (previous === 'speaking') {
      // Notify AudioRecognition that agent stopped speaking (for interruption detection)
      this.activity?.notifyAgentSpeechEnded();
    }
  }

  this._agentState = state;

  // Handle user away timer based on state changes
  const bothListening = state === 'listening' && this.userState === 'listening';
  if (bothListening) {
    this._setUserAwayTimer();
  } else {
    this._cancelUserAwayTimer();
  }

  const event = createAgentStateChangedEvent(previous, state);
  this.emit(AgentSessionEventTypes.AgentStateChanged, event);
}
695
+
696
/**
 * @internal
 *
 * Moves the user to `state`; does nothing when the state is unchanged.
 *
 * Opens a `user_speaking` span when entering `speaking` with no span open;
 * in every other case an open span is ended. Afterwards the user-away timer
 * is armed only when both user and agent are `listening` (otherwise
 * cancelled), and a `UserStateChanged` event is emitted.
 *
 * @param _lastSpeakingTime - Currently unused (see the TODO below).
 */
_updateUserState(state: UserState, _lastSpeakingTime?: number) {
  const previous = this.userState;
  if (previous === state) {
    return;
  }

  const shouldOpenSpan = state === 'speaking' && this.userSpeakingSpan === undefined;
  if (shouldOpenSpan) {
    this.userSpeakingSpan = tracer.startSpan({
      name: 'user_speaking',
      context: this.rootSpanContext,
    });

    // TODO(brian): PR4 - Set participant attributes if roomIO.linkedParticipant is available
    // (Ref: Python agent_session.py line 1192-1195)
  } else if (this.userSpeakingSpan !== undefined) {
    // TODO(brian): PR4 - Set ATTR_END_TIME attribute with lastSpeakingTime if available
    this.userSpeakingSpan.end();
    this.userSpeakingSpan = undefined;
  }

  this.userState = state;

  // Handle user away timer based on state changes
  const bothListening = state === 'listening' && this._agentState === 'listening';
  if (bothListening) {
    this._setUserAwayTimer();
  } else {
    this._cancelUserAwayTimer();
  }

  const event = createUserStateChangedEvent(previous, state);
  this.emit(AgentSessionEventTypes.UserStateChanged, event);
}
731
+
732
+ // -- User changed input/output streams/sinks --
733
/**
 * Re-attaches the configured audio input stream to the current activity.
 * Does nothing unless the session is started, an activity exists, and an
 * audio input is configured.
 */
private onAudioInputChanged(): void {
  if (this.started && this.activity && this._input.audio) {
    this.activity.attachAudioInput(this._input.audio.stream);
  }
}
742
+
743
/** Hook for audio output changes; intentionally a no-op. */
private onAudioOutputChanged(): void {
  // nothing to do
}

/** Hook for text output changes; intentionally a no-op. */
private onTextOutputChanged(): void {
  // nothing to do
}
746
+
747
/**
 * (Re)arms the user-away timer.
 *
 * Any pending timer is cancelled first. No new timer is created when
 * `userAwayTimeout` is `null`/`undefined`, or when a `roomIO` exists and
 * reports that no participant is available. When the timer fires, the user
 * state becomes `away`. The timeout is multiplied by 1000 before being handed
 * to `setTimeout`.
 */
private _setUserAwayTimer(): void {
  this._cancelUserAwayTimer();

  const timeout = this.options.userAwayTimeout;
  const timeoutDisabled = timeout === null || timeout === undefined;
  if (timeoutDisabled) {
    return;
  }

  const participantMissing = this.roomIO && !this.roomIO.isParticipantAvailable;
  if (participantMissing) {
    return;
  }

  const markUserAway = () => {
    this.logger.debug('User away timeout triggered');
    this._updateUserState('away');
  };

  this.userAwayTimer = setTimeout(markUserAway, this.options.userAwayTimeout * 1000);
}
763
+
764
/** Clears the pending user-away timer, if any, and forgets its handle. */
private _cancelUserAwayTimer(): void {
  if (this.userAwayTimer === null) {
    return;
  }

  clearTimeout(this.userAwayTimer);
  this.userAwayTimer = null;
}
770
+
771
/**
 * Brings the user back from `away` to `listening` when a final transcript
 * arrives. Non-final transcripts, and transcripts received in any other user
 * state, are ignored.
 */
private _onUserInputTranscribed(ev: UserInputTranscribedEvent): void {
  const userIsAway = this.userState === 'away';
  if (!(userIsAway && ev.isFinal)) {
    return;
  }

  this.logger.debug('User returned from away state due to speech input');
  this._updateUserState('listening');
}
777
+
778
/**
 * Runs the close logic, inside the session span context when one exists.
 *
 * @param reason - Reason passed on to `closeImplInner`.
 * @param error - Optional error passed on to `closeImplInner`; defaults to `null`.
 * @param drain - Passed on to `closeImplInner`; defaults to `false`.
 */
private async closeImpl(
  reason: ShutdownReason,
  error: RealtimeModelError | LLMError | TTSError | STTError | null = null,
  drain: boolean = false,
): Promise<void> {
  const spanContext = this.rootSpanContext;

  if (!spanContext) {
    return this.closeImplInner(reason, error, drain);
  }

  const closeWithinSpan = async () => {
    await this.closeImplInner(reason, error, drain);
  };
  return otelContext.with(spanContext, closeWithinSpan);
}
791
+
792
/**
 * Tears the session down. Does nothing when the session is not started.
 *
 * Order of operations: cancel the user-away timer and remove the transcript
 * listener; interrupt the activity (unless `drain` is set), drain it, wait
 * for current speech playout and detach its audio input; close the recorder;
 * null out the inputs/outputs; close the room IO and the activity; end any
 * open spans; mark the session as stopped; emit the `Close` event; reset
 * state and error counters.
 *
 * @param reason - Reported in the `Close` event and the final log line.
 * @param error - Reported in the `Close` event and the final log line.
 * @param drain - When `false`, the activity is interrupted before draining.
 */
private async closeImplInner(
  reason: ShutdownReason,
  error: RealtimeModelError | LLMError | TTSError | STTError | null = null,
  drain: boolean = false,
): Promise<void> {
  if (!this.started) {
    return;
  }

  this._cancelUserAwayTimer();
  // NOTE(review): this only removes the listener if it was registered with
  // this exact function reference - confirm against the registration site.
  this.off(AgentSessionEventTypes.UserInputTranscribed, this._onUserInputTranscribed);

  if (this.activity) {
    if (!drain) {
      try {
        this.activity.interrupt();
      } catch {
        // TODO(shubhra): force interrupt or wait for it to finish?
        // it might be an audio played from the error callback
      }
    }

    await this.activity.drain();
    // wait any uninterruptible speech to finish
    await this.activity.currentSpeech?.waitForPlayout();

    try {
      this.activity.detachAudioInput();
    } catch {
      // Ignore detach errors during cleanup - source may not have been set
    }
  }

  // Close recorder before detaching inputs/outputs (keep reference for session report)
  if (this._recorderIO) {
    await this._recorderIO.close();
  }

  // detach the inputs and outputs
  this.input.audio = null;
  this.output.audio = null;
  this.output.transcription = null;

  await this.roomIO?.close();
  this.roomIO = undefined;

  await this.activity?.close();
  this.activity = undefined;

  // End whichever spans are still open.
  this.sessionSpan?.end();
  this.sessionSpan = undefined;

  this.userSpeakingSpan?.end();
  this.userSpeakingSpan = undefined;

  this.agentSpeakingSpan?.end();
  this.agentSpeakingSpan = undefined;

  this.started = false;

  const closeEvent = createCloseEvent(reason, error);
  this.emit(AgentSessionEventTypes.Close, closeEvent);

  // Reset state after the Close event has been emitted.
  this.userState = 'listening';
  this._agentState = 'initializing';
  this.rootSpanContext = undefined;
  this.llmErrorCounts = 0;
  this.ttsErrorCounts = 0;

  this.logger.info({ reason, error }, 'AgentSession closed');
}
866
+ }