@livekit/agents 0.7.8 → 1.0.0-next.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (627)
  1. package/dist/_exceptions.cjs +109 -0
  2. package/dist/_exceptions.cjs.map +1 -0
  3. package/dist/_exceptions.d.cts +64 -0
  4. package/dist/_exceptions.d.ts +64 -0
  5. package/dist/_exceptions.d.ts.map +1 -0
  6. package/dist/_exceptions.js +80 -0
  7. package/dist/_exceptions.js.map +1 -0
  8. package/dist/audio.cjs +10 -3
  9. package/dist/audio.cjs.map +1 -1
  10. package/dist/audio.d.cts +2 -0
  11. package/dist/audio.d.ts +2 -0
  12. package/dist/audio.d.ts.map +1 -1
  13. package/dist/audio.js +8 -2
  14. package/dist/audio.js.map +1 -1
  15. package/dist/cli.cjs +25 -0
  16. package/dist/cli.cjs.map +1 -1
  17. package/dist/cli.d.ts.map +1 -1
  18. package/dist/cli.js +25 -0
  19. package/dist/cli.js.map +1 -1
  20. package/dist/constants.cjs +6 -0
  21. package/dist/constants.cjs.map +1 -1
  22. package/dist/constants.d.cts +2 -0
  23. package/dist/constants.d.ts +2 -0
  24. package/dist/constants.d.ts.map +1 -1
  25. package/dist/constants.js +4 -0
  26. package/dist/constants.js.map +1 -1
  27. package/dist/http_server.cjs.map +1 -1
  28. package/dist/http_server.d.cts +1 -0
  29. package/dist/http_server.d.ts +1 -0
  30. package/dist/http_server.d.ts.map +1 -1
  31. package/dist/http_server.js.map +1 -1
  32. package/dist/index.cjs +27 -20
  33. package/dist/index.cjs.map +1 -1
  34. package/dist/index.d.cts +13 -10
  35. package/dist/index.d.ts +13 -10
  36. package/dist/index.d.ts.map +1 -1
  37. package/dist/index.js +15 -11
  38. package/dist/index.js.map +1 -1
  39. package/dist/inference_runner.cjs +0 -1
  40. package/dist/inference_runner.cjs.map +1 -1
  41. package/dist/inference_runner.d.cts +2 -3
  42. package/dist/inference_runner.d.ts +2 -3
  43. package/dist/inference_runner.d.ts.map +1 -1
  44. package/dist/inference_runner.js +0 -1
  45. package/dist/inference_runner.js.map +1 -1
  46. package/dist/ipc/inference_proc_executor.cjs +2 -2
  47. package/dist/ipc/inference_proc_executor.cjs.map +1 -1
  48. package/dist/ipc/inference_proc_executor.js +2 -2
  49. package/dist/ipc/inference_proc_executor.js.map +1 -1
  50. package/dist/ipc/job_executor.cjs.map +1 -1
  51. package/dist/ipc/job_executor.js.map +1 -1
  52. package/dist/ipc/job_proc_executor.cjs +1 -0
  53. package/dist/ipc/job_proc_executor.cjs.map +1 -1
  54. package/dist/ipc/job_proc_executor.js +1 -0
  55. package/dist/ipc/job_proc_executor.js.map +1 -1
  56. package/dist/ipc/job_proc_lazy_main.cjs +1 -1
  57. package/dist/ipc/job_proc_lazy_main.cjs.map +1 -1
  58. package/dist/ipc/job_proc_lazy_main.js +1 -1
  59. package/dist/ipc/job_proc_lazy_main.js.map +1 -1
  60. package/dist/ipc/supervised_proc.d.cts +1 -1
  61. package/dist/ipc/supervised_proc.d.ts +1 -1
  62. package/dist/ipc/supervised_proc.d.ts.map +1 -1
  63. package/dist/job.cjs +14 -2
  64. package/dist/job.cjs.map +1 -1
  65. package/dist/job.d.cts +8 -0
  66. package/dist/job.d.ts +8 -0
  67. package/dist/job.d.ts.map +1 -1
  68. package/dist/job.js +12 -1
  69. package/dist/job.js.map +1 -1
  70. package/dist/llm/chat_context.cjs +332 -82
  71. package/dist/llm/chat_context.cjs.map +1 -1
  72. package/dist/llm/chat_context.d.cts +152 -48
  73. package/dist/llm/chat_context.d.ts +152 -48
  74. package/dist/llm/chat_context.d.ts.map +1 -1
  75. package/dist/llm/chat_context.js +327 -81
  76. package/dist/llm/chat_context.js.map +1 -1
  77. package/dist/llm/chat_context.test.cjs +380 -0
  78. package/dist/llm/chat_context.test.cjs.map +1 -0
  79. package/dist/llm/chat_context.test.js +385 -0
  80. package/dist/llm/chat_context.test.js.map +1 -0
  81. package/dist/llm/index.cjs +37 -8
  82. package/dist/llm/index.cjs.map +1 -1
  83. package/dist/llm/index.d.cts +7 -3
  84. package/dist/llm/index.d.ts +7 -3
  85. package/dist/llm/index.d.ts.map +1 -1
  86. package/dist/llm/index.js +39 -9
  87. package/dist/llm/index.js.map +1 -1
  88. package/dist/llm/llm.cjs +98 -33
  89. package/dist/llm/llm.cjs.map +1 -1
  90. package/dist/llm/llm.d.cts +50 -24
  91. package/dist/llm/llm.d.ts +50 -24
  92. package/dist/llm/llm.d.ts.map +1 -1
  93. package/dist/llm/llm.js +99 -33
  94. package/dist/llm/llm.js.map +1 -1
  95. package/dist/llm/provider_format/google.cjs +128 -0
  96. package/dist/llm/provider_format/google.cjs.map +1 -0
  97. package/dist/llm/provider_format/google.d.cts +6 -0
  98. package/dist/llm/provider_format/google.d.ts +6 -0
  99. package/dist/llm/provider_format/google.d.ts.map +1 -0
  100. package/dist/llm/provider_format/google.js +104 -0
  101. package/dist/llm/provider_format/google.js.map +1 -0
  102. package/dist/llm/provider_format/google.test.cjs +676 -0
  103. package/dist/llm/provider_format/google.test.cjs.map +1 -0
  104. package/dist/llm/provider_format/google.test.js +675 -0
  105. package/dist/llm/provider_format/google.test.js.map +1 -0
  106. package/dist/llm/provider_format/index.cjs +40 -0
  107. package/dist/llm/provider_format/index.cjs.map +1 -0
  108. package/dist/llm/provider_format/index.d.cts +4 -0
  109. package/dist/llm/provider_format/index.d.ts +4 -0
  110. package/dist/llm/provider_format/index.d.ts.map +1 -0
  111. package/dist/llm/provider_format/index.js +16 -0
  112. package/dist/llm/provider_format/index.js.map +1 -0
  113. package/dist/llm/provider_format/openai.cjs +116 -0
  114. package/dist/llm/provider_format/openai.cjs.map +1 -0
  115. package/dist/llm/provider_format/openai.d.cts +3 -0
  116. package/dist/llm/provider_format/openai.d.ts +3 -0
  117. package/dist/llm/provider_format/openai.d.ts.map +1 -0
  118. package/dist/llm/provider_format/openai.js +92 -0
  119. package/dist/llm/provider_format/openai.js.map +1 -0
  120. package/dist/llm/provider_format/openai.test.cjs +490 -0
  121. package/dist/llm/provider_format/openai.test.cjs.map +1 -0
  122. package/dist/llm/provider_format/openai.test.js +489 -0
  123. package/dist/llm/provider_format/openai.test.js.map +1 -0
  124. package/dist/llm/provider_format/utils.cjs +146 -0
  125. package/dist/llm/provider_format/utils.cjs.map +1 -0
  126. package/dist/llm/provider_format/utils.d.cts +38 -0
  127. package/dist/llm/provider_format/utils.d.ts +38 -0
  128. package/dist/llm/provider_format/utils.d.ts.map +1 -0
  129. package/dist/llm/provider_format/utils.js +122 -0
  130. package/dist/llm/provider_format/utils.js.map +1 -0
  131. package/dist/llm/realtime.cjs +77 -0
  132. package/dist/llm/realtime.cjs.map +1 -0
  133. package/dist/llm/realtime.d.cts +98 -0
  134. package/dist/llm/realtime.d.ts +98 -0
  135. package/dist/llm/realtime.d.ts.map +1 -0
  136. package/dist/llm/realtime.js +52 -0
  137. package/dist/llm/realtime.js.map +1 -0
  138. package/dist/llm/remote_chat_context.cjs +112 -0
  139. package/dist/llm/remote_chat_context.cjs.map +1 -0
  140. package/dist/llm/remote_chat_context.d.cts +23 -0
  141. package/dist/llm/remote_chat_context.d.ts +23 -0
  142. package/dist/llm/remote_chat_context.d.ts.map +1 -0
  143. package/dist/llm/remote_chat_context.js +88 -0
  144. package/dist/llm/remote_chat_context.js.map +1 -0
  145. package/dist/llm/remote_chat_context.test.cjs +225 -0
  146. package/dist/llm/remote_chat_context.test.cjs.map +1 -0
  147. package/dist/llm/remote_chat_context.test.js +224 -0
  148. package/dist/llm/remote_chat_context.test.js.map +1 -0
  149. package/dist/llm/tool_context.cjs +111 -0
  150. package/dist/llm/tool_context.cjs.map +1 -0
  151. package/dist/llm/tool_context.d.cts +125 -0
  152. package/dist/llm/tool_context.d.ts +125 -0
  153. package/dist/llm/tool_context.d.ts.map +1 -0
  154. package/dist/llm/tool_context.js +80 -0
  155. package/dist/llm/tool_context.js.map +1 -0
  156. package/dist/llm/tool_context.test.cjs +162 -0
  157. package/dist/llm/tool_context.test.cjs.map +1 -0
  158. package/dist/llm/tool_context.test.js +161 -0
  159. package/dist/llm/tool_context.test.js.map +1 -0
  160. package/dist/llm/tool_context.type.test.cjs +92 -0
  161. package/dist/llm/tool_context.type.test.cjs.map +1 -0
  162. package/dist/llm/tool_context.type.test.js +91 -0
  163. package/dist/llm/tool_context.type.test.js.map +1 -0
  164. package/dist/llm/utils.cjs +260 -0
  165. package/dist/llm/utils.cjs.map +1 -0
  166. package/dist/llm/utils.d.cts +42 -0
  167. package/dist/llm/utils.d.ts +42 -0
  168. package/dist/llm/utils.d.ts.map +1 -0
  169. package/dist/llm/utils.js +223 -0
  170. package/dist/llm/utils.js.map +1 -0
  171. package/dist/llm/utils.test.cjs +513 -0
  172. package/dist/llm/utils.test.cjs.map +1 -0
  173. package/dist/llm/utils.test.js +490 -0
  174. package/dist/llm/utils.test.js.map +1 -0
  175. package/dist/metrics/base.cjs +0 -27
  176. package/dist/metrics/base.cjs.map +1 -1
  177. package/dist/metrics/base.d.cts +105 -63
  178. package/dist/metrics/base.d.ts +105 -63
  179. package/dist/metrics/base.d.ts.map +1 -1
  180. package/dist/metrics/base.js +0 -19
  181. package/dist/metrics/base.js.map +1 -1
  182. package/dist/metrics/index.cjs +0 -3
  183. package/dist/metrics/index.cjs.map +1 -1
  184. package/dist/metrics/index.d.cts +2 -3
  185. package/dist/metrics/index.d.ts +2 -3
  186. package/dist/metrics/index.d.ts.map +1 -1
  187. package/dist/metrics/index.js +0 -2
  188. package/dist/metrics/index.js.map +1 -1
  189. package/dist/metrics/usage_collector.cjs +17 -12
  190. package/dist/metrics/usage_collector.cjs.map +1 -1
  191. package/dist/metrics/usage_collector.d.cts +3 -2
  192. package/dist/metrics/usage_collector.d.ts +3 -2
  193. package/dist/metrics/usage_collector.d.ts.map +1 -1
  194. package/dist/metrics/usage_collector.js +17 -12
  195. package/dist/metrics/usage_collector.js.map +1 -1
  196. package/dist/metrics/utils.cjs +22 -59
  197. package/dist/metrics/utils.cjs.map +1 -1
  198. package/dist/metrics/utils.d.cts +1 -8
  199. package/dist/metrics/utils.d.ts +1 -8
  200. package/dist/metrics/utils.d.ts.map +1 -1
  201. package/dist/metrics/utils.js +22 -52
  202. package/dist/metrics/utils.js.map +1 -1
  203. package/dist/multimodal/index.cjs +0 -2
  204. package/dist/multimodal/index.cjs.map +1 -1
  205. package/dist/multimodal/index.d.cts +0 -1
  206. package/dist/multimodal/index.d.ts +0 -1
  207. package/dist/multimodal/index.d.ts.map +1 -1
  208. package/dist/multimodal/index.js +0 -1
  209. package/dist/multimodal/index.js.map +1 -1
  210. package/dist/plugin.cjs +24 -8
  211. package/dist/plugin.cjs.map +1 -1
  212. package/dist/plugin.d.cts +18 -4
  213. package/dist/plugin.d.ts +18 -4
  214. package/dist/plugin.d.ts.map +1 -1
  215. package/dist/plugin.js +22 -7
  216. package/dist/plugin.js.map +1 -1
  217. package/dist/stream/deferred_stream.cjs +98 -0
  218. package/dist/stream/deferred_stream.cjs.map +1 -0
  219. package/dist/stream/deferred_stream.d.cts +27 -0
  220. package/dist/stream/deferred_stream.d.ts +27 -0
  221. package/dist/stream/deferred_stream.d.ts.map +1 -0
  222. package/dist/stream/deferred_stream.js +73 -0
  223. package/dist/stream/deferred_stream.js.map +1 -0
  224. package/dist/stream/deferred_stream.test.cjs +527 -0
  225. package/dist/stream/deferred_stream.test.cjs.map +1 -0
  226. package/dist/stream/deferred_stream.test.js +526 -0
  227. package/dist/stream/deferred_stream.test.js.map +1 -0
  228. package/dist/stream/identity_transform.cjs +42 -0
  229. package/dist/stream/identity_transform.cjs.map +1 -0
  230. package/dist/stream/identity_transform.d.cts +6 -0
  231. package/dist/stream/identity_transform.d.ts +6 -0
  232. package/dist/stream/identity_transform.d.ts.map +1 -0
  233. package/dist/stream/identity_transform.js +18 -0
  234. package/dist/stream/identity_transform.js.map +1 -0
  235. package/dist/stream/identity_transform.test.cjs +125 -0
  236. package/dist/stream/identity_transform.test.cjs.map +1 -0
  237. package/dist/stream/identity_transform.test.js +124 -0
  238. package/dist/stream/identity_transform.test.js.map +1 -0
  239. package/dist/stream/index.cjs +38 -0
  240. package/dist/stream/index.cjs.map +1 -0
  241. package/dist/stream/index.d.cts +5 -0
  242. package/dist/stream/index.d.ts +5 -0
  243. package/dist/stream/index.d.ts.map +1 -0
  244. package/dist/stream/index.js +11 -0
  245. package/dist/stream/index.js.map +1 -0
  246. package/dist/stream/merge_readable_streams.cjs +59 -0
  247. package/dist/stream/merge_readable_streams.cjs.map +1 -0
  248. package/dist/stream/merge_readable_streams.d.cts +4 -0
  249. package/dist/stream/merge_readable_streams.d.ts +4 -0
  250. package/dist/stream/merge_readable_streams.d.ts.map +1 -0
  251. package/dist/stream/merge_readable_streams.js +35 -0
  252. package/dist/stream/merge_readable_streams.js.map +1 -0
  253. package/dist/stream/stream_channel.cjs +47 -0
  254. package/dist/stream/stream_channel.cjs.map +1 -0
  255. package/dist/stream/stream_channel.d.cts +9 -0
  256. package/dist/stream/stream_channel.d.ts +9 -0
  257. package/dist/stream/stream_channel.d.ts.map +1 -0
  258. package/dist/stream/stream_channel.js +23 -0
  259. package/dist/stream/stream_channel.js.map +1 -0
  260. package/dist/stream/stream_channel.test.cjs +97 -0
  261. package/dist/stream/stream_channel.test.cjs.map +1 -0
  262. package/dist/stream/stream_channel.test.js +96 -0
  263. package/dist/stream/stream_channel.test.js.map +1 -0
  264. package/dist/stt/stream_adapter.cjs +3 -4
  265. package/dist/stt/stream_adapter.cjs.map +1 -1
  266. package/dist/stt/stream_adapter.d.cts +1 -0
  267. package/dist/stt/stream_adapter.d.ts +1 -0
  268. package/dist/stt/stream_adapter.d.ts.map +1 -1
  269. package/dist/stt/stream_adapter.js +3 -4
  270. package/dist/stt/stream_adapter.js.map +1 -1
  271. package/dist/stt/stt.cjs +101 -10
  272. package/dist/stt/stt.cjs.map +1 -1
  273. package/dist/stt/stt.d.cts +26 -5
  274. package/dist/stt/stt.d.ts +26 -5
  275. package/dist/stt/stt.d.ts.map +1 -1
  276. package/dist/stt/stt.js +102 -11
  277. package/dist/stt/stt.js.map +1 -1
  278. package/dist/tokenize/basic/basic.cjs +10 -5
  279. package/dist/tokenize/basic/basic.cjs.map +1 -1
  280. package/dist/tokenize/basic/basic.d.cts +7 -1
  281. package/dist/tokenize/basic/basic.d.ts +7 -1
  282. package/dist/tokenize/basic/basic.d.ts.map +1 -1
  283. package/dist/tokenize/basic/basic.js +10 -5
  284. package/dist/tokenize/basic/basic.js.map +1 -1
  285. package/dist/tokenize/basic/sentence.cjs +14 -6
  286. package/dist/tokenize/basic/sentence.cjs.map +1 -1
  287. package/dist/tokenize/basic/sentence.d.cts +1 -1
  288. package/dist/tokenize/basic/sentence.d.ts +1 -1
  289. package/dist/tokenize/basic/sentence.d.ts.map +1 -1
  290. package/dist/tokenize/basic/sentence.js +14 -6
  291. package/dist/tokenize/basic/sentence.js.map +1 -1
  292. package/dist/tokenize/token_stream.cjs +5 -3
  293. package/dist/tokenize/token_stream.cjs.map +1 -1
  294. package/dist/tokenize/token_stream.d.cts +1 -0
  295. package/dist/tokenize/token_stream.d.ts +1 -0
  296. package/dist/tokenize/token_stream.d.ts.map +1 -1
  297. package/dist/tokenize/token_stream.js +6 -4
  298. package/dist/tokenize/token_stream.js.map +1 -1
  299. package/dist/transcription.cjs +1 -2
  300. package/dist/transcription.cjs.map +1 -1
  301. package/dist/transcription.d.ts.map +1 -1
  302. package/dist/transcription.js +2 -3
  303. package/dist/transcription.js.map +1 -1
  304. package/dist/tts/index.cjs +2 -4
  305. package/dist/tts/index.cjs.map +1 -1
  306. package/dist/tts/index.d.cts +1 -1
  307. package/dist/tts/index.d.ts +1 -1
  308. package/dist/tts/index.d.ts.map +1 -1
  309. package/dist/tts/index.js +1 -3
  310. package/dist/tts/index.js.map +1 -1
  311. package/dist/tts/stream_adapter.cjs +26 -13
  312. package/dist/tts/stream_adapter.cjs.map +1 -1
  313. package/dist/tts/stream_adapter.d.cts +1 -1
  314. package/dist/tts/stream_adapter.d.ts +1 -1
  315. package/dist/tts/stream_adapter.d.ts.map +1 -1
  316. package/dist/tts/stream_adapter.js +27 -14
  317. package/dist/tts/stream_adapter.js.map +1 -1
  318. package/dist/tts/tts.cjs +157 -25
  319. package/dist/tts/tts.cjs.map +1 -1
  320. package/dist/tts/tts.d.cts +29 -5
  321. package/dist/tts/tts.d.ts +29 -5
  322. package/dist/tts/tts.d.ts.map +1 -1
  323. package/dist/tts/tts.js +157 -24
  324. package/dist/tts/tts.js.map +1 -1
  325. package/dist/types.cjs +60 -0
  326. package/dist/types.cjs.map +1 -0
  327. package/dist/types.d.cts +13 -0
  328. package/dist/types.d.ts +13 -0
  329. package/dist/types.d.ts.map +1 -0
  330. package/dist/types.js +35 -0
  331. package/dist/types.js.map +1 -0
  332. package/dist/utils.cjs +281 -27
  333. package/dist/utils.cjs.map +1 -1
  334. package/dist/utils.d.cts +134 -9
  335. package/dist/utils.d.ts +134 -9
  336. package/dist/utils.d.ts.map +1 -1
  337. package/dist/utils.js +265 -26
  338. package/dist/utils.js.map +1 -1
  339. package/dist/utils.test.cjs +492 -0
  340. package/dist/utils.test.cjs.map +1 -0
  341. package/dist/utils.test.js +498 -0
  342. package/dist/utils.test.js.map +1 -0
  343. package/dist/vad.cjs +76 -20
  344. package/dist/vad.cjs.map +1 -1
  345. package/dist/vad.d.cts +25 -5
  346. package/dist/vad.d.ts +25 -5
  347. package/dist/vad.d.ts.map +1 -1
  348. package/dist/vad.js +76 -20
  349. package/dist/vad.js.map +1 -1
  350. package/dist/voice/agent.cjs +245 -0
  351. package/dist/voice/agent.cjs.map +1 -0
  352. package/dist/voice/agent.d.cts +78 -0
  353. package/dist/voice/agent.d.ts +78 -0
  354. package/dist/voice/agent.d.ts.map +1 -0
  355. package/dist/voice/agent.js +220 -0
  356. package/dist/voice/agent.js.map +1 -0
  357. package/dist/voice/agent.test.cjs +61 -0
  358. package/dist/voice/agent.test.cjs.map +1 -0
  359. package/dist/voice/agent.test.js +60 -0
  360. package/dist/voice/agent.test.js.map +1 -0
  361. package/dist/voice/agent_activity.cjs +1453 -0
  362. package/dist/voice/agent_activity.cjs.map +1 -0
  363. package/dist/voice/agent_activity.d.cts +94 -0
  364. package/dist/voice/agent_activity.d.ts +94 -0
  365. package/dist/voice/agent_activity.d.ts.map +1 -0
  366. package/dist/voice/agent_activity.js +1449 -0
  367. package/dist/voice/agent_activity.js.map +1 -0
  368. package/dist/voice/agent_session.cjs +312 -0
  369. package/dist/voice/agent_session.cjs.map +1 -0
  370. package/dist/voice/agent_session.d.cts +121 -0
  371. package/dist/voice/agent_session.d.ts +121 -0
  372. package/dist/voice/agent_session.d.ts.map +1 -0
  373. package/dist/voice/agent_session.js +295 -0
  374. package/dist/voice/agent_session.js.map +1 -0
  375. package/dist/voice/audio_recognition.cjs +375 -0
  376. package/dist/voice/audio_recognition.cjs.map +1 -0
  377. package/dist/voice/audio_recognition.d.cts +80 -0
  378. package/dist/voice/audio_recognition.d.ts +80 -0
  379. package/dist/voice/audio_recognition.d.ts.map +1 -0
  380. package/dist/voice/audio_recognition.js +351 -0
  381. package/dist/voice/audio_recognition.js.map +1 -0
  382. package/dist/voice/events.cjs +145 -0
  383. package/dist/voice/events.cjs.map +1 -0
  384. package/dist/voice/events.d.cts +124 -0
  385. package/dist/voice/events.d.ts +124 -0
  386. package/dist/voice/events.d.ts.map +1 -0
  387. package/dist/voice/events.js +110 -0
  388. package/dist/voice/events.js.map +1 -0
  389. package/dist/voice/generation.cjs +700 -0
  390. package/dist/voice/generation.cjs.map +1 -0
  391. package/dist/voice/generation.d.cts +115 -0
  392. package/dist/voice/generation.d.ts +115 -0
  393. package/dist/voice/generation.d.ts.map +1 -0
  394. package/dist/voice/generation.js +672 -0
  395. package/dist/voice/generation.js.map +1 -0
  396. package/dist/voice/index.cjs +40 -0
  397. package/dist/voice/index.cjs.map +1 -0
  398. package/dist/voice/index.d.cts +5 -0
  399. package/dist/voice/index.d.ts +5 -0
  400. package/dist/voice/index.d.ts.map +1 -0
  401. package/dist/voice/index.js +11 -0
  402. package/dist/voice/index.js.map +1 -0
  403. package/dist/voice/io.cjs +245 -0
  404. package/dist/voice/io.cjs.map +1 -0
  405. package/dist/voice/io.d.cts +101 -0
  406. package/dist/voice/io.d.ts +101 -0
  407. package/dist/voice/io.d.ts.map +1 -0
  408. package/dist/voice/io.js +217 -0
  409. package/dist/voice/io.js.map +1 -0
  410. package/dist/voice/room_io/_input.cjs +121 -0
  411. package/dist/voice/room_io/_input.cjs.map +1 -0
  412. package/dist/voice/room_io/_input.d.cts +24 -0
  413. package/dist/voice/room_io/_input.d.ts +24 -0
  414. package/dist/voice/room_io/_input.d.ts.map +1 -0
  415. package/dist/voice/room_io/_input.js +102 -0
  416. package/dist/voice/room_io/_input.js.map +1 -0
  417. package/dist/voice/room_io/_output.cjs +358 -0
  418. package/dist/voice/room_io/_output.cjs.map +1 -0
  419. package/dist/voice/room_io/_output.d.cts +75 -0
  420. package/dist/voice/room_io/_output.d.ts +75 -0
  421. package/dist/voice/room_io/_output.d.ts.map +1 -0
  422. package/dist/voice/room_io/_output.js +342 -0
  423. package/dist/voice/room_io/_output.js.map +1 -0
  424. package/dist/voice/room_io/index.cjs +25 -0
  425. package/dist/voice/room_io/index.cjs.map +1 -0
  426. package/dist/voice/room_io/index.d.cts +3 -0
  427. package/dist/voice/room_io/index.d.ts +3 -0
  428. package/dist/voice/room_io/index.d.ts.map +1 -0
  429. package/dist/voice/room_io/index.js +3 -0
  430. package/dist/voice/room_io/index.js.map +1 -0
  431. package/dist/voice/room_io/room_io.cjs +370 -0
  432. package/dist/voice/room_io/room_io.cjs.map +1 -0
  433. package/dist/voice/room_io/room_io.d.cts +73 -0
  434. package/dist/voice/room_io/room_io.d.ts +73 -0
  435. package/dist/voice/room_io/room_io.d.ts.map +1 -0
  436. package/dist/voice/room_io/room_io.js +361 -0
  437. package/dist/voice/room_io/room_io.js.map +1 -0
  438. package/dist/{pipeline/index.cjs → voice/run_context.cjs} +16 -11
  439. package/dist/voice/run_context.cjs.map +1 -0
  440. package/dist/voice/run_context.d.cts +12 -0
  441. package/dist/voice/run_context.d.ts +12 -0
  442. package/dist/voice/run_context.d.ts.map +1 -0
  443. package/dist/voice/run_context.js +14 -0
  444. package/dist/voice/run_context.js.map +1 -0
  445. package/dist/voice/speech_handle.cjs +105 -0
  446. package/dist/voice/speech_handle.cjs.map +1 -0
  447. package/dist/voice/speech_handle.d.cts +46 -0
  448. package/dist/voice/speech_handle.d.ts +46 -0
  449. package/dist/voice/speech_handle.d.ts.map +1 -0
  450. package/dist/voice/speech_handle.js +81 -0
  451. package/dist/voice/speech_handle.js.map +1 -0
  452. package/dist/voice/transcription/_utils.cjs +45 -0
  453. package/dist/voice/transcription/_utils.cjs.map +1 -0
  454. package/dist/voice/transcription/_utils.d.cts +3 -0
  455. package/dist/voice/transcription/_utils.d.ts +3 -0
  456. package/dist/voice/transcription/_utils.d.ts.map +1 -0
  457. package/dist/voice/transcription/_utils.js +21 -0
  458. package/dist/voice/transcription/_utils.js.map +1 -0
  459. package/dist/voice/transcription/index.cjs +23 -0
  460. package/dist/voice/transcription/index.cjs.map +1 -0
  461. package/dist/voice/transcription/index.d.cts +2 -0
  462. package/dist/voice/transcription/index.d.ts +2 -0
  463. package/dist/voice/transcription/index.d.ts.map +1 -0
  464. package/dist/voice/transcription/index.js +2 -0
  465. package/dist/voice/transcription/index.js.map +1 -0
  466. package/dist/voice/transcription/synchronizer.cjs +380 -0
  467. package/dist/voice/transcription/synchronizer.cjs.map +1 -0
  468. package/dist/voice/transcription/synchronizer.d.cts +86 -0
  469. package/dist/voice/transcription/synchronizer.d.ts +86 -0
  470. package/dist/voice/transcription/synchronizer.d.ts.map +1 -0
  471. package/dist/voice/transcription/synchronizer.js +355 -0
  472. package/dist/voice/transcription/synchronizer.js.map +1 -0
  473. package/dist/worker.cjs +22 -4
  474. package/dist/worker.cjs.map +1 -1
  475. package/dist/worker.d.cts +1 -1
  476. package/dist/worker.d.ts +1 -1
  477. package/dist/worker.d.ts.map +1 -1
  478. package/dist/worker.js +22 -4
  479. package/dist/worker.js.map +1 -1
  480. package/package.json +9 -2
  481. package/src/_exceptions.ts +137 -0
  482. package/src/audio.ts +12 -1
  483. package/src/cli.ts +37 -0
  484. package/src/constants.ts +2 -0
  485. package/src/http_server.ts +1 -0
  486. package/src/index.ts +13 -10
  487. package/src/inference_runner.ts +2 -3
  488. package/src/ipc/inference_proc_executor.ts +2 -2
  489. package/src/ipc/job_executor.ts +1 -1
  490. package/src/ipc/job_proc_executor.ts +1 -1
  491. package/src/ipc/job_proc_lazy_main.ts +1 -1
  492. package/src/job.ts +18 -0
  493. package/src/llm/__snapshots__/chat_context.test.ts.snap +527 -0
  494. package/src/llm/__snapshots__/tool_context.test.ts.snap +177 -0
  495. package/src/llm/__snapshots__/utils.test.ts.snap +65 -0
  496. package/src/llm/chat_context.test.ts +450 -0
  497. package/src/llm/chat_context.ts +501 -103
  498. package/src/llm/index.ts +53 -18
  499. package/src/llm/llm.ts +149 -50
  500. package/src/llm/provider_format/google.test.ts +772 -0
  501. package/src/llm/provider_format/google.ts +130 -0
  502. package/src/llm/provider_format/index.ts +23 -0
  503. package/src/llm/provider_format/openai.test.ts +581 -0
  504. package/src/llm/provider_format/openai.ts +118 -0
  505. package/src/llm/provider_format/utils.ts +183 -0
  506. package/src/llm/realtime.ts +151 -0
  507. package/src/llm/remote_chat_context.test.ts +290 -0
  508. package/src/llm/remote_chat_context.ts +114 -0
  509. package/src/llm/tool_context.test.ts +198 -0
  510. package/src/llm/tool_context.ts +259 -0
  511. package/src/llm/tool_context.type.test.ts +115 -0
  512. package/src/llm/utils.test.ts +670 -0
  513. package/src/llm/utils.ts +324 -0
  514. package/src/metrics/base.ts +110 -78
  515. package/src/metrics/index.ts +3 -9
  516. package/src/metrics/usage_collector.ts +19 -13
  517. package/src/metrics/utils.ts +24 -69
  518. package/src/multimodal/index.ts +0 -1
  519. package/src/plugin.ts +26 -8
  520. package/src/stream/deferred_stream.test.ts +755 -0
  521. package/src/stream/deferred_stream.ts +110 -0
  522. package/src/stream/identity_transform.test.ts +179 -0
  523. package/src/stream/identity_transform.ts +18 -0
  524. package/src/stream/index.ts +7 -0
  525. package/src/stream/merge_readable_streams.ts +40 -0
  526. package/src/stream/stream_channel.test.ts +129 -0
  527. package/src/stream/stream_channel.ts +32 -0
  528. package/src/stt/stream_adapter.ts +3 -5
  529. package/src/stt/stt.ts +135 -17
  530. package/src/tokenize/basic/basic.ts +13 -5
  531. package/src/tokenize/basic/sentence.ts +20 -6
  532. package/src/tokenize/token_stream.ts +7 -4
  533. package/src/transcription.ts +2 -3
  534. package/src/tts/index.ts +0 -1
  535. package/src/tts/stream_adapter.ts +42 -16
  536. package/src/tts/tts.ts +203 -21
  537. package/src/types.ts +42 -0
  538. package/src/utils.test.ts +658 -0
  539. package/src/utils.ts +375 -44
  540. package/src/vad.ts +90 -22
  541. package/src/voice/agent.test.ts +80 -0
  542. package/src/voice/agent.ts +332 -0
  543. package/src/voice/agent_activity.ts +1913 -0
  544. package/src/voice/agent_session.ts +460 -0
  545. package/src/voice/audio_recognition.ts +474 -0
  546. package/src/voice/events.ts +252 -0
  547. package/src/voice/generation.ts +881 -0
  548. package/src/voice/index.ts +7 -0
  549. package/src/voice/io.ts +304 -0
  550. package/src/voice/room_io/_input.ts +144 -0
  551. package/src/voice/room_io/_output.ts +436 -0
  552. package/src/voice/room_io/index.ts +5 -0
  553. package/src/voice/room_io/room_io.ts +495 -0
  554. package/src/voice/run_context.ts +20 -0
  555. package/src/voice/speech_handle.ts +104 -0
  556. package/src/voice/transcription/_utils.ts +25 -0
  557. package/src/voice/transcription/index.ts +4 -0
  558. package/src/voice/transcription/synchronizer.ts +478 -0
  559. package/src/worker.ts +22 -2
  560. package/dist/llm/function_context.cjs +0 -103
  561. package/dist/llm/function_context.cjs.map +0 -1
  562. package/dist/llm/function_context.d.cts +0 -47
  563. package/dist/llm/function_context.d.ts +0 -47
  564. package/dist/llm/function_context.d.ts.map +0 -1
  565. package/dist/llm/function_context.js +0 -78
  566. package/dist/llm/function_context.js.map +0 -1
  567. package/dist/llm/function_context.test.cjs +0 -218
  568. package/dist/llm/function_context.test.cjs.map +0 -1
  569. package/dist/llm/function_context.test.js +0 -217
  570. package/dist/llm/function_context.test.js.map +0 -1
  571. package/dist/multimodal/multimodal_agent.cjs +0 -451
  572. package/dist/multimodal/multimodal_agent.cjs.map +0 -1
  573. package/dist/multimodal/multimodal_agent.d.cts +0 -48
  574. package/dist/multimodal/multimodal_agent.d.ts +0 -48
  575. package/dist/multimodal/multimodal_agent.d.ts.map +0 -1
  576. package/dist/multimodal/multimodal_agent.js +0 -425
  577. package/dist/multimodal/multimodal_agent.js.map +0 -1
  578. package/dist/pipeline/agent_output.cjs +0 -197
  579. package/dist/pipeline/agent_output.cjs.map +0 -1
  580. package/dist/pipeline/agent_output.d.cts +0 -33
  581. package/dist/pipeline/agent_output.d.ts +0 -33
  582. package/dist/pipeline/agent_output.d.ts.map +0 -1
  583. package/dist/pipeline/agent_output.js +0 -172
  584. package/dist/pipeline/agent_output.js.map +0 -1
  585. package/dist/pipeline/agent_playout.cjs +0 -175
  586. package/dist/pipeline/agent_playout.cjs.map +0 -1
  587. package/dist/pipeline/agent_playout.d.cts +0 -40
  588. package/dist/pipeline/agent_playout.d.ts +0 -40
  589. package/dist/pipeline/agent_playout.d.ts.map +0 -1
  590. package/dist/pipeline/agent_playout.js +0 -139
  591. package/dist/pipeline/agent_playout.js.map +0 -1
  592. package/dist/pipeline/human_input.cjs +0 -171
  593. package/dist/pipeline/human_input.cjs.map +0 -1
  594. package/dist/pipeline/human_input.d.cts +0 -30
  595. package/dist/pipeline/human_input.d.ts +0 -30
  596. package/dist/pipeline/human_input.d.ts.map +0 -1
  597. package/dist/pipeline/human_input.js +0 -146
  598. package/dist/pipeline/human_input.js.map +0 -1
  599. package/dist/pipeline/index.cjs.map +0 -1
  600. package/dist/pipeline/index.d.cts +0 -2
  601. package/dist/pipeline/index.d.ts +0 -2
  602. package/dist/pipeline/index.d.ts.map +0 -1
  603. package/dist/pipeline/index.js +0 -11
  604. package/dist/pipeline/index.js.map +0 -1
  605. package/dist/pipeline/pipeline_agent.cjs +0 -849
  606. package/dist/pipeline/pipeline_agent.cjs.map +0 -1
  607. package/dist/pipeline/pipeline_agent.d.cts +0 -150
  608. package/dist/pipeline/pipeline_agent.d.ts +0 -150
  609. package/dist/pipeline/pipeline_agent.d.ts.map +0 -1
  610. package/dist/pipeline/pipeline_agent.js +0 -826
  611. package/dist/pipeline/pipeline_agent.js.map +0 -1
  612. package/dist/pipeline/speech_handle.cjs +0 -176
  613. package/dist/pipeline/speech_handle.cjs.map +0 -1
  614. package/dist/pipeline/speech_handle.d.cts +0 -37
  615. package/dist/pipeline/speech_handle.d.ts +0 -37
  616. package/dist/pipeline/speech_handle.d.ts.map +0 -1
  617. package/dist/pipeline/speech_handle.js +0 -152
  618. package/dist/pipeline/speech_handle.js.map +0 -1
  619. package/src/llm/function_context.test.ts +0 -248
  620. package/src/llm/function_context.ts +0 -142
  621. package/src/multimodal/multimodal_agent.ts +0 -555
  622. package/src/pipeline/agent_output.ts +0 -219
  623. package/src/pipeline/agent_playout.ts +0 -192
  624. package/src/pipeline/human_input.ts +0 -188
  625. package/src/pipeline/index.ts +0 -15
  626. package/src/pipeline/pipeline_agent.ts +0 -1185
  627. package/src/pipeline/speech_handle.ts +0 -201
@@ -1,826 +0,0 @@
1
- import {
2
- AudioSource,
3
- LocalAudioTrack,
4
- RoomEvent,
5
- TrackPublishOptions,
6
- TrackSource
7
- } from "@livekit/rtc-node";
8
- import { randomUUID } from "node:crypto";
9
- import EventEmitter from "node:events";
10
- import {
11
- ATTRIBUTE_TRANSCRIPTION_FINAL,
12
- ATTRIBUTE_TRANSCRIPTION_TRACK_ID,
13
- TOPIC_TRANSCRIPTION
14
- } from "../constants.js";
15
- import { ChatContext, ChatMessage, ChatRole, LLMEvent, LLMStream } from "../llm/index.js";
16
- import { log } from "../log.js";
17
- import { StreamAdapter as STTStreamAdapter, SpeechEventType } from "../stt/index.js";
18
- import {
19
- SentenceTokenizer as BasicSentenceTokenizer,
20
- WordTokenizer as BasicWordTokenizer,
21
- hyphenateWord
22
- } from "../tokenize/basic/index.js";
23
- import { TextAudioSynchronizer, defaultTextSyncOptions } from "../transcription.js";
24
- import { TTSEvent, StreamAdapter as TTSStreamAdapter } from "../tts/index.js";
25
- import { AsyncIterableQueue, CancellablePromise, Future, gracefullyCancel } from "../utils.js";
26
- import { VADEventType } from "../vad.js";
27
- import { AgentOutput } from "./agent_output.js";
28
- import { AgentPlayout, AgentPlayoutEvent } from "./agent_playout.js";
29
- import { HumanInput, HumanInputEvent } from "./human_input.js";
30
- import { SpeechHandle } from "./speech_handle.js";
31
/** Key of the local participant attribute that carries the agent state string. */
const AGENT_STATE_ATTRIBUTE = "lk.agent.state";

// Module-wide bookkeeping used to tag LLM/TTS metrics with a `sequenceId`.
// `speechData` is set while an answer is being synthesized and cleared afterwards;
// `lastSpeechData` keeps the most recently cleared value.
let lastSpeechData = undefined;
let speechData = undefined;
34
/**
 * Events emitted by the voice pipeline agent.
 *
 * Two-way lookup table: `VPAEvent.NAME` yields the numeric code and
 * `VPAEvent[code]` yields the name.
 */
const VPAEvent = (() => {
  // Position in this list is the numeric event code.
  const names = [
    "USER_STARTED_SPEAKING",
    "USER_STOPPED_SPEAKING",
    "AGENT_STARTED_SPEAKING",
    "AGENT_STOPPED_SPEAKING",
    "USER_SPEECH_COMMITTED",
    "AGENT_SPEECH_COMMITTED",
    "AGENT_SPEECH_INTERRUPTED",
    "FUNCTION_CALLS_COLLECTED",
    "FUNCTION_CALLS_FINISHED",
    "METRICS_COLLECTED",
  ];
  const table = {};
  names.forEach((name, code) => {
    table[name] = code;
    table[code] = name;
  });
  return table;
})();
47
/**
 * Per-function-call context: the agent, the LLM stream that requested the
 * call, free-form metadata and extra chat messages collected during the call.
 *
 * Constructing an instance makes it the "current" context returned by
 * `AgentCallContext.getCurrent()`.
 */
class AgentCallContext {
  #agent;
  #llmStream;
  #metadata = new Map();
  #extraChatMessages = [];
  static #current;

  /**
   * @param agent - agent on whose behalf the call runs
   * @param llmStream - LLM stream that produced the function calls
   */
  constructor(agent, llmStream) {
    this.#agent = agent;
    this.#llmStream = llmStream;
    AgentCallContext.#current = this;
  }

  /** @returns the most recently constructed context, or `undefined` if none exists yet. */
  static getCurrent() {
    return AgentCallContext.#current;
  }

  get agent() {
    return this.#agent;
  }

  /** Stores `value` under `key`, replacing any previous value. */
  storeMetadata(key, value) {
    this.#metadata.set(key, value);
  }

  /**
   * Looks up a metadata value.
   *
   * @param key - metadata key
   * @param orDefault - value returned when nothing (or `null`/`undefined`) is stored
   * @returns the stored value, or `orDefault`
   */
  getMetadata(key, orDefault = undefined) {
    // `??` rather than `||`: legitimately stored falsy values such as 0, ""
    // or false must be returned as-is instead of being replaced by the default.
    return this.#metadata.get(key) ?? orDefault;
  }

  get llmStream() {
    return this.#llmStream;
  }

  /** Messages added through `addExtraChatMessage`, in insertion order (live array). */
  get extraChatMessages() {
    return this.#extraChatMessages;
  }

  addExtraChatMessage(message) {
    this.#extraChatMessages.push(message);
  }
}
80
/**
 * Default `beforeLLMCallback`: starts a chat on the agent's LLM using the
 * given chat context and the agent's function context.
 *
 * @returns whatever `agent.llm.chat` returns
 */
const defaultBeforeLLMCallback = (agent, chatCtx) => {
  const { llm, fncCtx } = agent;
  return llm.chat({ chatCtx, fncCtx });
};
83
/** Default `beforeTTSCallback`: hands the text to the TTS unchanged. */
const defaultBeforeTTSCallback = (_agent, text) => text;
86
/**
 * Transcription settings used when the caller does not supply any:
 * user and agent transcription both enabled, with the basic sentence/word
 * tokenizers and the basic `hyphenateWord` helper.
 */
const defaultAgentTranscriptionOptions = {
  userTranscription: true,
  agentTranscription: true,
  agentTranscriptionSpeech: 1,
  sentenceTokenizer: new BasicSentenceTokenizer(),
  // The `false` argument is forwarded to the tokenizer constructor as-is.
  wordTokenizer: new BasicWordTokenizer(false),
  hyphenateWord: hyphenateWord,
};
94
/**
 * Baseline options for `VoicePipelineAgent`; caller-supplied options are
 * spread on top of these in the agent's constructor.
 */
const defaultVPAOptions = {
  chatCtx: new ChatContext(),

  // Interruption handling.
  allowInterruptions: true,
  interruptSpeechDuration: 50,
  interruptMinWords: 0,

  // Turn taking and tool use.
  minEndpointingDelay: 500,
  maxNestedFncCalls: 1,
  preemptiveSynthesis: false,

  // Hooks and transcription.
  beforeLLMCallback: defaultBeforeLLMCallback,
  beforeTTSCallback: defaultBeforeTTSCallback,
  transcription: defaultAgentTranscriptionOptions,
};
106
/**
 * Voice assistant that chains a VAD, an STT, an LLM and a TTS: it listens to a
 * linked remote participant, turns final transcripts into LLM replies and plays
 * the synthesized answer on a published audio track.
 *
 * Emits the events enumerated in `VPAEvent`.
 */
class VoicePipelineAgent extends EventEmitter {
  /** Minimum time played for the user speech to be committed to the chat context. */
  MIN_TIME_PLAYED_FOR_COMMIT = 1.5;
  /** Marker put on the speech queue after every handle; ends one drain pass of the queue. */
  static FLUSH_SENTINEL = Symbol("FLUSH_SENTINEL");
  #vad;
  #stt;
  #llm;
  #tts;
  #opts;
  #humanInput;
  #agentOutput;
  #trackPublishedFut = new Future();
  #pendingAgentReply;
  #agentReplyTask;
  #playingSpeech;
  transcribedText = "";
  #transcribedInterimText = "";
  #speechQueueOpen = new Future();
  #speechQueue = new AsyncIterableQueue();
  #updateStateTask;
  #started = false;
  #room;
  #participant = null;
  #deferredValidation;
  #logger = log();
  #agentPublication;
  #lastFinalTranscriptTime;
  #lastSpeechTime;
  #transcriptionId;
  #agentTranscribedText = "";

  /**
   * @param vad - voice activity detector
   * @param stt - speech-to-text; wrapped in a stream adapter when it is not streaming-capable
   * @param llm - language model
   * @param tts - text-to-speech; wrapped in a stream adapter when it is not streaming-capable
   * @param opts - options merged over `defaultVPAOptions`
   */
  constructor(vad, stt, llm, tts, opts = defaultVPAOptions) {
    super();
    this.#opts = { ...defaultVPAOptions, ...opts };
    // The default chat context is a single module-level instance. Give every
    // agent that did not bring its own context a private one, otherwise all
    // such agents would append to (and read from) the same conversation.
    if (this.#opts.chatCtx == null || this.#opts.chatCtx === defaultVPAOptions.chatCtx) {
      this.#opts.chatCtx = new ChatContext();
    }
    this.#vad = vad;
    this.#stt = stt.capabilities.streaming ? stt : new STTStreamAdapter(stt, vad);
    this.#llm = llm;
    this.#tts = tts.capabilities.streaming
      ? tts
      : new TTSStreamAdapter(tts, new BasicSentenceTokenizer());
    this.#deferredValidation = new DeferredReplyValidation(
      this.#validateReplyIfPossible.bind(this),
      this.#opts.minEndpointingDelay,
      this,
      this.#opts.turnDetector,
    );
  }

  get fncCtx() {
    return this.#opts.fncCtx;
  }

  set fncCtx(ctx) {
    this.#opts.fncCtx = ctx;
  }

  get chatCtx() {
    return this.#opts.chatCtx;
  }

  get llm() {
    return this.#llm;
  }

  get tts() {
    return this.#tts;
  }

  get stt() {
    return this.#stt;
  }

  get vad() {
    return this.#vad;
  }

  /**
   * Start the voice assistant.
   *
   * @param room - room to publish into and listen on
   * @param participant - remote participant (or its identity) to link to; when
   *   omitted, the first participant that connects afterwards is linked
   * @throws Error when the assistant has already been started
   */
  start(room, participant = null) {
    if (this.#started) {
      throw new Error("voice assistant already started");
    }
    // Record the start so the guard above and `close()` actually take effect.
    this.#started = true;

    // Re-emit component metrics as agent-level METRICS_COLLECTED events.
    this.#stt.on(SpeechEventType.METRICS_COLLECTED, (metrics) => {
      this.emit(VPAEvent.METRICS_COLLECTED, metrics);
    });
    this.#tts.on(TTSEvent.METRICS_COLLECTED, (metrics) => {
      if (!speechData) return;
      this.emit(VPAEvent.METRICS_COLLECTED, { ...metrics, sequenceId: speechData.sequenceId });
    });
    this.#llm.on(LLMEvent.METRICS_COLLECTED, (metrics) => {
      const sequenceId = speechData ? speechData.sequenceId : lastSpeechData?.sequenceId;
      if (!sequenceId) return;
      this.emit(VPAEvent.METRICS_COLLECTED, { ...metrics, sequenceId });
    });
    this.#vad.on(VADEventType.METRICS_COLLECTED, (metrics) => {
      this.emit(VPAEvent.METRICS_COLLECTED, metrics);
    });

    room.on(RoomEvent.ParticipantConnected, (connected) => {
      // Only link automatically while no participant is linked yet.
      if (this.#participant) return;
      this.#linkParticipant(connected.identity);
    });

    this.#room = room;
    this.#participant = participant;
    if (participant) {
      this.#linkParticipant(typeof participant === "string" ? participant : participant.identity);
    }
    // Runs for the lifetime of the agent; intentionally not awaited.
    this.#run();
  }

  /**
   * Play a speech source through the voice assistant.
   *
   * @param source - string, async iterable of strings, or an LLM stream
   * @param allowInterruptions - whether the user may interrupt this speech
   * @param addToChatCtx - whether the speech is recorded in the chat context
   * @returns the speech handle created for this utterance
   */
  async say(source, allowInterruptions = true, addToChatCtx = true) {
    await this.#trackPublishedFut.await;

    let speechSource = source;
    let callContext;
    let fncSource;
    if (addToChatCtx) {
      callContext = AgentCallContext.getCurrent();
      if (source instanceof LLMStream) {
        this.#logger.warn("LLMStream will be ignored for function call chat context");
      } else if (typeof source === "string") {
        fncSource = source;
      } else {
        // The iterable can be consumed only once: synthesis reads from a
        // queue that is fed below while the text is being collected.
        fncSource = source;
        speechSource = new AsyncIterableQueue();
      }
    }

    const newHandle = SpeechHandle.createAssistantSpeech(allowInterruptions, addToChatCtx);
    const synthesisHandle = this.#synthesizeAgentSpeech(newHandle.id, speechSource);
    newHandle.initialize(speechSource, synthesisHandle);

    if (this.#playingSpeech && !this.#playingSpeech.nestedSpeechFinished) {
      this.#playingSpeech.addNestedSpeech(newHandle);
    } else {
      this.#addSpeechForPlayout(newHandle);
    }

    if (callContext && fncSource) {
      let text;
      if (typeof speechSource === "string") {
        text = fncSource;
      } else {
        text = "";
        for await (const chunk of fncSource) {
          speechSource.put(chunk);
          text += chunk;
        }
        speechSource.close();
      }
      callContext.addExtraChatMessage(ChatMessage.create({ text, role: ChatRole.ASSISTANT }));
      this.#logger.child({ text }).debug("added speech to function call chat context");
    }
    return newHandle;
  }

  /**
   * Publishes the agent state as a local participant attribute after `delay`
   * milliseconds, cancelling any update that is still pending.
   */
  #updateState(state, delay = 0) {
    this.#updateStateTask?.cancel();
    this.#updateStateTask = new CancellablePromise(async (resolve, _, onCancel) => {
      let cancelled = false;
      onCancel(() => {
        cancelled = true;
      });
      await new Promise((wake) => setTimeout(wake, delay));
      if (this.#room?.isConnected && !cancelled) {
        await this.#room.localParticipant?.setAttributes({ [AGENT_STATE_ATTRIBUTE]: state });
      }
      resolve();
    });
  }

  /** Links the remote participant with the given identity and subscribes to its speech events. */
  #linkParticipant(participantIdentity) {
    if (!this.#room) {
      this.#logger.error("Room is not set");
      return;
    }
    this.#participant = this.#room.remoteParticipants.get(participantIdentity) || null;
    if (!this.#participant) {
      this.#logger.error(`Participant with identity ${participantIdentity} not found`);
      return;
    }

    this.#humanInput = new HumanInput(
      this.#room,
      this.#vad,
      this.#stt,
      this.#participant,
      this.#opts.noiseCancellation,
    );

    this.#humanInput.on(HumanInputEvent.START_OF_SPEECH, (event) => {
      this.emit(VPAEvent.USER_STARTED_SPEAKING);
      this.#deferredValidation.onHumanStartOfSpeech(event);
    });

    this.#humanInput.on(HumanInputEvent.VAD_INFERENCE_DONE, (event) => {
      if (!this.#trackPublishedFut.done) {
        return;
      }
      if (!this.#agentOutput) {
        throw new Error("agent output is undefined");
      }
      if (this.#opts.allowInterruptions) {
        // Lower the agent's volume as the speech probability rises.
        this.#agentOutput.playout.targetVolume = Math.max(0, 1 - event.probability);
      }
      if (event.speechDuration >= this.#opts.interruptSpeechDuration) {
        this.#interruptIfPossible();
      }
      if (event.rawAccumulatedSpeech > 0) {
        this.#lastSpeechTime = Date.now() - event.rawAccumulatedSilence;
      }
    });

    this.#humanInput.on(HumanInputEvent.END_OF_SPEECH, (event) => {
      this.emit(VPAEvent.USER_STOPPED_SPEAKING);
      this.#deferredValidation.onHumanEndOfSpeech(event);
    });

    this.#humanInput.on(HumanInputEvent.INTERIM_TRANSCRIPT, async (event) => {
      if (!this.#transcriptionId) {
        this.#transcriptionId = randomUUID();
      }
      this.#transcribedInterimText = event.alternatives[0].text;
      await this.#publishTranscription(
        this.#humanInput.participant.identity,
        this.#humanInput.subscribedTrack.sid,
        this.#transcribedInterimText,
        false,
        this.#transcriptionId,
      );
    });

    this.#humanInput.on(HumanInputEvent.FINAL_TRANSCRIPT, async (event) => {
      const newTranscript = event.alternatives[0].text;
      if (!newTranscript) return;
      if (!this.#transcriptionId) {
        this.#transcriptionId = randomUUID();
      }
      this.#lastFinalTranscriptTime = Date.now();
      this.transcribedText += (this.transcribedText ? " " : "") + newTranscript;
      await this.#publishTranscription(
        this.#humanInput.participant.identity,
        this.#humanInput.subscribedTrack.sid,
        this.transcribedText,
        true,
        this.#transcriptionId,
      );
      // The next interim/final transcript starts a new transcription segment.
      this.#transcriptionId = undefined;

      if (
        this.#opts.preemptiveSynthesis &&
        (!this.#playingSpeech || this.#playingSpeech.allowInterruptions)
      ) {
        this.#synthesizeAgentReply();
      }
      this.#deferredValidation.onHumanFinalTranscript(newTranscript);

      const words = this.#opts.transcription.wordTokenizer.tokenize(newTranscript);
      if (words.length >= 3) {
        this.#interruptIfPossible();
      }
    });
  }

  /** Publishes the agent audio track, then plays queued speech handles forever. */
  async #run() {
    this.#updateState("initializing");
    const audioSource = new AudioSource(this.#tts.sampleRate, this.#tts.numChannels);
    const track = LocalAudioTrack.createAudioTrack("assistant_voice", audioSource);
    this.#agentPublication = await this.#room?.localParticipant?.publishTrack(
      track,
      new TrackPublishOptions({ source: TrackSource.SOURCE_MICROPHONE }),
    );

    const agentPlayout = new AgentPlayout(audioSource);
    this.#agentOutput = new AgentOutput(agentPlayout, this.#tts);
    agentPlayout.on(AgentPlayoutEvent.PLAYOUT_STARTED, () => {
      this.emit(VPAEvent.AGENT_STARTED_SPEAKING);
      this.#updateState("speaking");
    });
    agentPlayout.on(AgentPlayoutEvent.PLAYOUT_STOPPED, (_) => {
      this.emit(VPAEvent.AGENT_STOPPED_SPEAKING);
      this.#updateState("listening");
    });
    this.#trackPublishedFut.resolve();

    while (true) {
      await this.#speechQueueOpen.await;
      for await (const speech of this.#speechQueue) {
        if (speech === VoicePipelineAgent.FLUSH_SENTINEL) break;
        this.#playingSpeech = speech;
        await this.#playSpeech(speech);
        this.#playingSpeech = undefined;
      }
      this.#speechQueueOpen = new Future();
    }
  }

  /** Replaces the pending reply with a fresh one built from the current transcript. */
  #synthesizeAgentReply() {
    this.#pendingAgentReply?.cancel();
    if (this.#humanInput && this.#humanInput.speaking) {
      this.#updateState("thinking", 200);
    }
    const newHandle = SpeechHandle.createAssistantReply(
      this.#opts.allowInterruptions,
      true,
      this.transcribedText,
    );
    this.#pendingAgentReply = newHandle;
    this.#agentReplyTask = this.#synthesizeAnswerTask(this.#agentReplyTask, newHandle);
  }

  /**
   * Cancels `oldTask`, then asks the LLM for an answer to `handle.userQuestion`
   * and initializes `handle` with the resulting synthesis.
   *
   * The returned promise is resolved on every exit path (cancelled, callback
   * returned `false`, handle interrupted, or an error), so that a later
   * `gracefullyCancel` of this task is not left waiting on a promise that
   * never settles.
   */
  #synthesizeAnswerTask(oldTask, handle) {
    return new CancellablePromise(async (resolve, _, onCancel) => {
      let cancelled = false;
      onCancel(() => {
        cancelled = true;
      });
      try {
        if (oldTask) {
          await gracefullyCancel(oldTask);
        }

        const copiedCtx = this.chatCtx.copy();
        const playingSpeech = this.#playingSpeech;
        if (playingSpeech && playingSpeech.initialized) {
          const userPartCommitted = !playingSpeech.userQuestion || playingSpeech.userCommitted;
          if (userPartCommitted && !playingSpeech.speechCommitted) {
            // Speech that is playing but not committed yet is still context for the LLM.
            copiedCtx.messages.push(
              ChatMessage.create({
                text: playingSpeech.synthesisHandle.text,
                role: ChatRole.ASSISTANT,
              }),
            );
          }
        }
        copiedCtx.messages.push(
          ChatMessage.create({
            text: handle?.userQuestion,
            role: ChatRole.USER,
          }),
        );

        speechData = { sequenceId: handle.id };
        try {
          // Stop instead of merely resolving: a cancelled task must not go on
          // to query the LLM or initialize the handle.
          if (cancelled) return;
          let llmStream = await this.#opts.beforeLLMCallback(this, copiedCtx);
          if (llmStream === false) {
            handle?.cancel();
            return;
          }
          if (cancelled) return;
          if (!(llmStream instanceof LLMStream)) {
            llmStream = await defaultBeforeLLMCallback(this, copiedCtx);
          }
          if (handle.interrupted) {
            return;
          }
          const synthesisHandle = this.#synthesizeAgentSpeech(handle.id, llmStream);
          handle.initialize(llmStream, synthesisHandle);
        } finally {
          lastSpeechData = speechData;
          speechData = undefined;
        }
      } finally {
        resolve();
      }
    });
  }

  /**
   * Plays one speech handle to completion: commits the user question and the
   * agent's speech to the chat context, executes collected function calls and
   * plays any nested speech they produce.
   */
  async #playSpeech(handle) {
    try {
      await handle.waitForInitialization();
    } catch {
      return;
    }
    await this.#agentPublication.waitForSubscription();

    const synthesisHandle = handle.synthesisHandle;
    if (synthesisHandle.interrupted) return;

    const userQuestion = handle.userQuestion;
    const playHandle = synthesisHandle.play();
    const joinFut = playHandle.join();
    const usesTools = () =>
      handle.source instanceof LLMStream && !!handle.source.functionCalls.length;

    const commitUserQuestionIfNeeded = () => {
      if (!userQuestion || synthesisHandle.interrupted || handle.userCommitted) return;
      // Hold back the commit while an interruptible, tool-free answer has
      // barely started playing.
      if (
        handle.allowInterruptions &&
        !usesTools() &&
        playHandle.timePlayed < this.MIN_TIME_PLAYED_FOR_COMMIT &&
        !joinFut.done
      ) {
        return;
      }
      this.#logger.child({ userTranscript: userQuestion }).debug("committed user transcript");
      const userMsg = ChatMessage.create({ text: userQuestion, role: ChatRole.USER });
      this.chatCtx.messages.push(userMsg);
      this.emit(VPAEvent.USER_SPEECH_COMMITTED, userMsg);
      this.transcribedText = this.transcribedText.slice(userQuestion.length);
      handle.markUserCommitted();
    };

    commitUserQuestionIfNeeded();
    while (!joinFut.done) {
      // Wake up when playout ends or after 500 ms, whichever comes first,
      // and release the timer so it cannot outlive the wait.
      let timer;
      try {
        await Promise.race([
          joinFut.await,
          new Promise((wake) => {
            timer = setTimeout(wake, 500);
          }),
        ]);
      } finally {
        clearTimeout(timer);
      }
      commitUserQuestionIfNeeded();
      if (handle.interrupted) break;
    }
    commitUserQuestionIfNeeded();

    let collectedText = this.#agentTranscribedText;
    const isUsingTools = usesTools();
    const interrupted = handle.interrupted;

    if (handle.addToChatCtx && (!userQuestion || handle.userCommitted)) {
      if (handle.extraToolsMessages) {
        this.chatCtx.messages.push(...handle.extraToolsMessages);
      }
      if (interrupted) {
        collectedText += "\u2026";
      }
      const msg = ChatMessage.create({ text: collectedText, role: ChatRole.ASSISTANT });
      this.chatCtx.messages.push(msg);
      handle.markSpeechCommitted();
      this.emit(
        interrupted ? VPAEvent.AGENT_SPEECH_INTERRUPTED : VPAEvent.AGENT_SPEECH_COMMITTED,
        msg,
      );
      this.#logger
        .child({
          agentTranscript: collectedText,
          interrupted,
          speechId: handle.id,
        })
        .debug("committed agent speech");
      handle.setDone();
    }

    const executeFunctionCalls = async () => {
      if (!isUsingTools || interrupted) return;
      if (handle.fncNestedDepth >= this.#opts.maxNestedFncCalls) {
        this.#logger
          .child({ speechId: handle.id, fncNestedDepth: handle.fncNestedDepth })
          .warn("max function calls nested depth reached");
        return;
      }
      if (userQuestion && !handle.userCommitted) {
        throw new Error("user speech should have been committed before using tools");
      }

      const llmStream = handle.source;
      const newFunctionCalls = llmStream.functionCalls;
      // Constructed for its side effect: becomes AgentCallContext.getCurrent().
      new AgentCallContext(this, llmStream);
      this.emit(VPAEvent.FUNCTION_CALLS_COLLECTED, newFunctionCalls);

      const calledFuncs = [];
      for (const func of newFunctionCalls) {
        // The task never rejects: failures are folded into an `{ error }` outcome.
        const task = func.func.execute(func.params).then(
          (result) => ({ name: func.name, toolCallId: func.toolCallId, result }),
          (error) => ({ name: func.name, toolCallId: func.toolCallId, error }),
        );
        calledFuncs.push({ ...func, task });
        this.#logger
          .child({ function: func.name, speechId: handle.id })
          .debug("executing AI function");
        const outcome = await task;
        if ("error" in outcome) {
          // A try/catch around the await can never fire (see above), so the
          // failure has to be detected on the outcome to be logged at all.
          this.#logger
            .child({ function: func.name, speechId: handle.id })
            .error("error executing AI function");
        }
      }

      const toolCallsInfo = [];
      const toolCallsResults = [];
      for (const fnc of calledFuncs) {
        const outcome = await fnc.task;
        if (!outcome || outcome.result === undefined) continue;
        toolCallsInfo.push(fnc);
        toolCallsResults.push(ChatMessage.createToolFromFunctionResult(outcome));
      }
      if (!toolCallsInfo.length) return;

      const extraToolsMessages = [
        ChatMessage.createToolCalls(toolCallsInfo, collectedText),
        ...toolCallsResults,
      ];
      const newSpeechHandle = SpeechHandle.createToolSpeech(
        handle.allowInterruptions,
        handle.addToChatCtx,
        handle.fncNestedDepth + 1,
        extraToolsMessages,
      );

      const chatCtx = handle.source.chatCtx.copy();
      chatCtx.messages.push(...extraToolsMessages);
      chatCtx.messages.push(...AgentCallContext.getCurrent().extraChatMessages);

      const answerLLMStream = this.llm.chat({
        chatCtx,
        fncCtx: this.fncCtx,
      });
      const answerSynthesis = this.#synthesizeAgentSpeech(newSpeechHandle.id, answerLLMStream);
      newSpeechHandle.initialize(answerLLMStream, answerSynthesis);
      handle.addNestedSpeech(newSpeechHandle);

      this.emit(VPAEvent.FUNCTION_CALLS_FINISHED, calledFuncs);
    };

    let finished = false;
    const task = executeFunctionCalls().then(() => {
      finished = true;
    });
    while (!handle.nestedSpeechFinished) {
      const changed = handle.nestedSpeechChanged();
      await Promise.race([changed, task]);
      // Drain nested speech in order; the list is empty once this loop exits.
      while (handle.nestedSpeechHandles.length) {
        const speech = handle.nestedSpeechHandles[0];
        this.#playingSpeech = speech;
        await this.#playSpeech(speech);
        handle.nestedSpeechHandles.shift();
        this.#playingSpeech = handle;
      }
      if (finished) {
        handle.markNestedSpeechFinished();
      }
    }
    handle.setDone();
  }

  /**
   * Publishes a transcription segment and also sends the text on the
   * transcription text-stream topic.
   */
  async #publishTranscription(participantIdentity, trackSid, text, isFinal, id) {
    this.#room.localParticipant.publishTranscription({
      participantIdentity,
      trackSid,
      segments: [
        {
          text,
          final: isFinal,
          id,
          startTime: BigInt(0),
          endTime: BigInt(0),
          language: "",
        },
      ],
    });
    const stream = await this.#room.localParticipant.streamText({
      senderIdentity: participantIdentity,
      topic: TOPIC_TRANSCRIPTION,
      attributes: {
        [ATTRIBUTE_TRANSCRIPTION_TRACK_ID]: trackSid,
        [ATTRIBUTE_TRANSCRIPTION_FINAL]: isFinal.toString(),
      },
    });
    await stream.write(text);
    await stream.close();
  }

  /**
   * Starts synthesis of `source` for the given speech id.
   *
   * @throws Error when the agent output is not initialized yet, or when
   *   `beforeTTSCallback` returns a falsy value
   */
  #synthesizeAgentSpeech(speechId, source) {
    const synchronizer = new TextAudioSynchronizer(defaultTextSyncOptions);
    synchronizer.on("textUpdated", async (text) => {
      this.#agentTranscribedText = text.text;
      await this.#publishTranscription(
        this.#room.localParticipant.identity,
        this.#agentPublication?.sid ?? "",
        text.text,
        text.final,
        text.id,
      );
    });

    if (!this.#agentOutput) {
      throw new Error("agent output should be initialized when ready");
    }

    const textSource =
      source instanceof LLMStream ? llmStreamToStringIterable(speechId, source) : source;
    const ttsSource = this.#opts.beforeTTSCallback(this, textSource);
    if (!ttsSource) {
      throw new Error("beforeTTSCallback must return string or AsyncIterable<string>");
    }
    return this.#agentOutput.synthesize(speechId, ttsSource, synchronizer);
  }

  /**
   * Called by the deferred validation once the user's turn is considered over:
   * queues the pending reply for playout (creating it first when preemptive
   * synthesis is disabled).
   */
  async #validateReplyIfPossible() {
    if (this.#playingSpeech && !this.#playingSpeech.allowInterruptions) {
      this.#logger
        .child({ speechId: this.#playingSpeech.id })
        .debug("skipping validation, agent is speaking and does not allow interruptions");
      return;
    }

    if (!this.#pendingAgentReply) {
      if (this.#opts.preemptiveSynthesis || !this.transcribedText) {
        return;
      }
      this.#synthesizeAgentReply();
    }
    if (!this.#pendingAgentReply) {
      throw new Error("pending agent reply is undefined");
    }

    // NOTE(review): this iterates the same queue that #run drains, so entries
    // seen here may not be seen by the playout loop — confirm this is intended.
    if (this.#speechQueueOpen.done) {
      for await (const speech of this.#speechQueue) {
        if (speech === VoicePipelineAgent.FLUSH_SENTINEL) break;
        if (!speech.isReply) continue;
        if (speech.allowInterruptions) speech.interrupt();
      }
    }

    this.#logger.child({ speechId: this.#pendingAgentReply.id }).debug("validated agent reply");

    if (this.#lastSpeechTime) {
      const timeSinceLastSpeech = Date.now() - this.#lastSpeechTime;
      const transcriptionDelay = Math.max(
        (this.#lastFinalTranscriptTime || 0) - this.#lastSpeechTime,
        0,
      );
      const metrics = {
        timestamp: Date.now(),
        sequenceId: this.#pendingAgentReply.id,
        endOfUtteranceDelay: timeSinceLastSpeech,
        transcriptionDelay,
      };
      this.emit(VPAEvent.METRICS_COLLECTED, metrics);
    }

    this.#addSpeechForPlayout(this.#pendingAgentReply);
    this.#pendingAgentReply = undefined;
    this.#transcribedInterimText = "";
  }

  /** Interrupts the playing speech when it allows it and enough interim words were heard. */
  #interruptIfPossible() {
    const playing = this.#playingSpeech;
    if (!playing || !playing.allowInterruptions || playing.interrupted) {
      return;
    }
    if (this.#opts.interruptMinWords !== 0) {
      const interimWords = this.#opts.transcription.wordTokenizer.tokenize(
        this.#transcribedInterimText,
      );
      if (interimWords.length < this.#opts.interruptMinWords) {
        return;
      }
    }
    playing.interrupt();
  }

  /** Queues a handle followed by the flush marker and wakes the playout loop. */
  #addSpeechForPlayout(handle) {
    this.#speechQueue.put(handle);
    this.#speechQueue.put(VoicePipelineAgent.FLUSH_SENTINEL);
    this.#speechQueueOpen.resolve();
  }

  /** Close the voice assistant: stops reacting to newly connected participants. */
  async close() {
    if (!this.#started) {
      return;
    }
    this.#room?.removeAllListeners(RoomEvent.ParticipantConnected);
  }
}
716
/**
 * Adapts an LLM stream to an async iterable of text: yields the non-empty
 * `delta.content` of each chunk's first choice and skips everything else.
 * Logs the time until the first yielded token at debug level.
 *
 * @param speechId - id attached to the debug log entry
 * @param stream - async iterable of LLM chunks
 */
async function* llmStreamToStringIterable(speechId, stream) {
  const startedAt = Date.now();
  let awaitingFirstToken = true;
  for await (const { choices } of stream) {
    const content = choices[0]?.delta.content;
    if (!content) {
      continue;
    }
    if (awaitingFirstToken) {
      awaitingFirstToken = false;
      const elapsed = Math.round(Date.now() - startedAt);
      log().child({ speechId, elapsed }).debug("received first LLM token");
    }
    yield content;
  }
}
730
/**
 * Decides when the user's turn is over: after a final transcript or an end of
 * speech it waits for an endpointing delay (optionally adjusted by a turn
 * detector) and then invokes the validation callback. A new run, or the user
 * starting to speak again, cancels the pending one.
 */
class DeferredReplyValidation {
  // if the STT gives us punctuation, we can try to validate the reply faster.
  PUNCTUATION = ".!?";
  PUNCTUATION_REDUCE_FACTOR = 0.75;
  // How late (compared to end of speech) a final transcript may arrive, in
  // milliseconds. It is compared against a `Date.now()` difference, so the
  // former value of 1.5 amounted to 1.5 ms.
  LATE_TRANSCRIPT_TOLERANCE = 1500;
  // Delay, in milliseconds, applied when the turn detector considers an end of turn unlikely.
  UNLIKELY_ENDPOINT_DELAY = 6e3;
  #validateFunc;
  #validatingPromise;
  #lastFinalTranscript = "";
  #lastRecvEndOfSpeechTime = 0;
  #speaking = false;
  #endOfSpeechDelay;
  #finalTranscriptDelay;
  #turnDetector;
  #agent;
  // Controller of the run that is still pending; undefined while idle.
  #abort;

  /**
   * @param validateFunc - callback invoked when the delay elapses
   * @param minEndpointingDelay - base delay in milliseconds
   * @param agent - provides `chatCtx` and `transcribedText` for the turn detector
   * @param turnDetector - optional end-of-turn predictor
   */
  constructor(validateFunc, minEndpointingDelay, agent, turnDetector) {
    this.#validateFunc = validateFunc;
    this.#endOfSpeechDelay = minEndpointingDelay;
    this.#finalTranscriptDelay = minEndpointingDelay;
    this.#agent = agent;
    this.#turnDetector = turnDetector;
  }

  /** Whether a validation run is pending (scheduled and neither fired nor cancelled). */
  get validating() {
    return this.#abort !== undefined;
  }

  /** Records the final transcript and, unless the user is speaking, schedules a validation. */
  onHumanFinalTranscript(transcript) {
    this.#lastFinalTranscript = transcript.trim();
    if (this.#speaking) return;

    const sinceEndOfSpeech = Date.now() - this.#lastRecvEndOfSpeechTime;
    const baseDelay =
      sinceEndOfSpeech < this.LATE_TRANSCRIPT_TOLERANCE
        ? this.#endOfSpeechDelay
        : this.#finalTranscriptDelay;
    // Punctuation shortens the wait; without it the full delay applies
    // (previously the delay collapsed to 1 ms in that case).
    const delay = this.#endWithPunctuation()
      ? baseDelay * this.PUNCTUATION_REDUCE_FACTOR
      : baseDelay;
    this.#run(delay);
  }

  // eslint-disable-next-line @typescript-eslint/no-unused-vars
  onHumanStartOfSpeech(_) {
    this.#speaking = true;
    // The user is talking again: drop any pending validation.
    this.#cancelPending();
  }

  // eslint-disable-next-line @typescript-eslint/no-unused-vars
  onHumanEndOfSpeech(_) {
    this.#speaking = false;
    this.#lastRecvEndOfSpeechTime = Date.now();
    if (this.#lastFinalTranscript) {
      // NOTE(review): the unpunctuated fallback is a fixed 1000 ms rather than
      // the configured delay — confirm this is intended.
      const delay = this.#endWithPunctuation()
        ? this.#endOfSpeechDelay * this.PUNCTUATION_REDUCE_FACTOR
        : 1e3;
      this.#run(delay);
    }
  }

  // TODO(nbsp): aclose

  #endWithPunctuation() {
    const transcript = this.#lastFinalTranscript;
    return transcript.length > 0 && this.PUNCTUATION.includes(transcript[transcript.length - 1]);
  }

  #resetStates() {
    this.#lastFinalTranscript = "";
    this.#lastRecvEndOfSpeechTime = 0;
  }

  /** Aborts the pending run, if any, and marks the validator idle. */
  #cancelPending() {
    this.#abort?.abort();
    this.#abort = undefined;
  }

  /** Cancels the pending run and schedules a new one that fires after `delay` ms. */
  #run(delay) {
    this.#cancelPending();
    const controller = new AbortController();
    this.#abort = controller;

    const detectCtx = this.#agent.chatCtx.copy();
    detectCtx.append({ text: this.#agent.transcribedText, role: ChatRole.USER });
    this.#validatingPromise = this.#schedule(delay, detectCtx, controller);
  }

  /**
   * Optionally consults the turn detector to adjust the delay, then arms the
   * timer that triggers the validation callback.
   */
  async #schedule(delay, chatCtx, controller) {
    const { signal } = controller;
    if (this.#lastFinalTranscript && !this.#speaking && this.#turnDetector) {
      const startTime = Date.now();
      const eotProb = await this.#turnDetector.predictEndOfTurn(chatCtx);
      const unlikelyThreshold = this.#turnDetector.unlikelyThreshold;
      const elapsed = Date.now() - startTime;
      if (eotProb < unlikelyThreshold) {
        delay = this.UNLIKELY_ENDPOINT_DELAY;
      }
      // The prediction time already counts towards the wait.
      delay = Math.max(0, delay - elapsed);
    }

    // The run may have been aborted while the prediction was in flight; an
    // "abort" listener registered now would never fire, so check explicitly.
    if (signal.aborted) return;

    const timeout = setTimeout(() => {
      if (this.#abort === controller) {
        this.#abort = undefined;
      }
      this.#resetStates();
      this.#validateFunc();
    }, delay);
    signal.addEventListener("abort", () => clearTimeout(timeout), { once: true });
  }
}
820
- export {
821
- AGENT_STATE_ATTRIBUTE,
822
- AgentCallContext,
823
- VPAEvent,
824
- VoicePipelineAgent
825
- };
826
- //# sourceMappingURL=pipeline_agent.js.map