@livekit/agents 0.7.9 → 1.0.0-next.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (627) hide show
  1. package/dist/_exceptions.cjs +109 -0
  2. package/dist/_exceptions.cjs.map +1 -0
  3. package/dist/_exceptions.d.cts +64 -0
  4. package/dist/_exceptions.d.ts +64 -0
  5. package/dist/_exceptions.d.ts.map +1 -0
  6. package/dist/_exceptions.js +80 -0
  7. package/dist/_exceptions.js.map +1 -0
  8. package/dist/audio.cjs +10 -3
  9. package/dist/audio.cjs.map +1 -1
  10. package/dist/audio.d.cts +2 -0
  11. package/dist/audio.d.ts +2 -0
  12. package/dist/audio.d.ts.map +1 -1
  13. package/dist/audio.js +8 -2
  14. package/dist/audio.js.map +1 -1
  15. package/dist/cli.cjs +25 -0
  16. package/dist/cli.cjs.map +1 -1
  17. package/dist/cli.d.ts.map +1 -1
  18. package/dist/cli.js +25 -0
  19. package/dist/cli.js.map +1 -1
  20. package/dist/constants.cjs +6 -3
  21. package/dist/constants.cjs.map +1 -1
  22. package/dist/constants.d.cts +2 -1
  23. package/dist/constants.d.ts +2 -1
  24. package/dist/constants.d.ts.map +1 -1
  25. package/dist/constants.js +4 -2
  26. package/dist/constants.js.map +1 -1
  27. package/dist/http_server.cjs.map +1 -1
  28. package/dist/http_server.d.cts +1 -0
  29. package/dist/http_server.d.ts +1 -0
  30. package/dist/http_server.d.ts.map +1 -1
  31. package/dist/http_server.js.map +1 -1
  32. package/dist/index.cjs +27 -20
  33. package/dist/index.cjs.map +1 -1
  34. package/dist/index.d.cts +13 -10
  35. package/dist/index.d.ts +13 -10
  36. package/dist/index.d.ts.map +1 -1
  37. package/dist/index.js +15 -11
  38. package/dist/index.js.map +1 -1
  39. package/dist/inference_runner.cjs +0 -1
  40. package/dist/inference_runner.cjs.map +1 -1
  41. package/dist/inference_runner.d.cts +2 -3
  42. package/dist/inference_runner.d.ts +2 -3
  43. package/dist/inference_runner.d.ts.map +1 -1
  44. package/dist/inference_runner.js +0 -1
  45. package/dist/inference_runner.js.map +1 -1
  46. package/dist/ipc/inference_proc_executor.cjs +2 -2
  47. package/dist/ipc/inference_proc_executor.cjs.map +1 -1
  48. package/dist/ipc/inference_proc_executor.js +2 -2
  49. package/dist/ipc/inference_proc_executor.js.map +1 -1
  50. package/dist/ipc/job_executor.cjs.map +1 -1
  51. package/dist/ipc/job_executor.js.map +1 -1
  52. package/dist/ipc/job_proc_executor.cjs +1 -0
  53. package/dist/ipc/job_proc_executor.cjs.map +1 -1
  54. package/dist/ipc/job_proc_executor.js +1 -0
  55. package/dist/ipc/job_proc_executor.js.map +1 -1
  56. package/dist/ipc/job_proc_lazy_main.cjs +1 -1
  57. package/dist/ipc/job_proc_lazy_main.cjs.map +1 -1
  58. package/dist/ipc/job_proc_lazy_main.js +1 -1
  59. package/dist/ipc/job_proc_lazy_main.js.map +1 -1
  60. package/dist/ipc/supervised_proc.d.cts +1 -1
  61. package/dist/ipc/supervised_proc.d.ts +1 -1
  62. package/dist/ipc/supervised_proc.d.ts.map +1 -1
  63. package/dist/job.cjs +14 -2
  64. package/dist/job.cjs.map +1 -1
  65. package/dist/job.d.cts +8 -0
  66. package/dist/job.d.ts +8 -0
  67. package/dist/job.d.ts.map +1 -1
  68. package/dist/job.js +12 -1
  69. package/dist/job.js.map +1 -1
  70. package/dist/llm/chat_context.cjs +332 -82
  71. package/dist/llm/chat_context.cjs.map +1 -1
  72. package/dist/llm/chat_context.d.cts +152 -48
  73. package/dist/llm/chat_context.d.ts +152 -48
  74. package/dist/llm/chat_context.d.ts.map +1 -1
  75. package/dist/llm/chat_context.js +327 -81
  76. package/dist/llm/chat_context.js.map +1 -1
  77. package/dist/llm/chat_context.test.cjs +380 -0
  78. package/dist/llm/chat_context.test.cjs.map +1 -0
  79. package/dist/llm/chat_context.test.js +385 -0
  80. package/dist/llm/chat_context.test.js.map +1 -0
  81. package/dist/llm/index.cjs +37 -8
  82. package/dist/llm/index.cjs.map +1 -1
  83. package/dist/llm/index.d.cts +7 -3
  84. package/dist/llm/index.d.ts +7 -3
  85. package/dist/llm/index.d.ts.map +1 -1
  86. package/dist/llm/index.js +39 -9
  87. package/dist/llm/index.js.map +1 -1
  88. package/dist/llm/llm.cjs +97 -33
  89. package/dist/llm/llm.cjs.map +1 -1
  90. package/dist/llm/llm.d.cts +50 -24
  91. package/dist/llm/llm.d.ts +50 -24
  92. package/dist/llm/llm.d.ts.map +1 -1
  93. package/dist/llm/llm.js +98 -33
  94. package/dist/llm/llm.js.map +1 -1
  95. package/dist/llm/provider_format/google.cjs +128 -0
  96. package/dist/llm/provider_format/google.cjs.map +1 -0
  97. package/dist/llm/provider_format/google.d.cts +6 -0
  98. package/dist/llm/provider_format/google.d.ts +6 -0
  99. package/dist/llm/provider_format/google.d.ts.map +1 -0
  100. package/dist/llm/provider_format/google.js +104 -0
  101. package/dist/llm/provider_format/google.js.map +1 -0
  102. package/dist/llm/provider_format/google.test.cjs +676 -0
  103. package/dist/llm/provider_format/google.test.cjs.map +1 -0
  104. package/dist/llm/provider_format/google.test.js +675 -0
  105. package/dist/llm/provider_format/google.test.js.map +1 -0
  106. package/dist/llm/provider_format/index.cjs +40 -0
  107. package/dist/llm/provider_format/index.cjs.map +1 -0
  108. package/dist/llm/provider_format/index.d.cts +4 -0
  109. package/dist/llm/provider_format/index.d.ts +4 -0
  110. package/dist/llm/provider_format/index.d.ts.map +1 -0
  111. package/dist/llm/provider_format/index.js +16 -0
  112. package/dist/llm/provider_format/index.js.map +1 -0
  113. package/dist/llm/provider_format/openai.cjs +116 -0
  114. package/dist/llm/provider_format/openai.cjs.map +1 -0
  115. package/dist/llm/provider_format/openai.d.cts +3 -0
  116. package/dist/llm/provider_format/openai.d.ts +3 -0
  117. package/dist/llm/provider_format/openai.d.ts.map +1 -0
  118. package/dist/llm/provider_format/openai.js +92 -0
  119. package/dist/llm/provider_format/openai.js.map +1 -0
  120. package/dist/llm/provider_format/openai.test.cjs +490 -0
  121. package/dist/llm/provider_format/openai.test.cjs.map +1 -0
  122. package/dist/llm/provider_format/openai.test.js +489 -0
  123. package/dist/llm/provider_format/openai.test.js.map +1 -0
  124. package/dist/llm/provider_format/utils.cjs +146 -0
  125. package/dist/llm/provider_format/utils.cjs.map +1 -0
  126. package/dist/llm/provider_format/utils.d.cts +38 -0
  127. package/dist/llm/provider_format/utils.d.ts +38 -0
  128. package/dist/llm/provider_format/utils.d.ts.map +1 -0
  129. package/dist/llm/provider_format/utils.js +122 -0
  130. package/dist/llm/provider_format/utils.js.map +1 -0
  131. package/dist/llm/realtime.cjs +77 -0
  132. package/dist/llm/realtime.cjs.map +1 -0
  133. package/dist/llm/realtime.d.cts +98 -0
  134. package/dist/llm/realtime.d.ts +98 -0
  135. package/dist/llm/realtime.d.ts.map +1 -0
  136. package/dist/llm/realtime.js +52 -0
  137. package/dist/llm/realtime.js.map +1 -0
  138. package/dist/llm/remote_chat_context.cjs +112 -0
  139. package/dist/llm/remote_chat_context.cjs.map +1 -0
  140. package/dist/llm/remote_chat_context.d.cts +23 -0
  141. package/dist/llm/remote_chat_context.d.ts +23 -0
  142. package/dist/llm/remote_chat_context.d.ts.map +1 -0
  143. package/dist/llm/remote_chat_context.js +88 -0
  144. package/dist/llm/remote_chat_context.js.map +1 -0
  145. package/dist/llm/remote_chat_context.test.cjs +225 -0
  146. package/dist/llm/remote_chat_context.test.cjs.map +1 -0
  147. package/dist/llm/remote_chat_context.test.js +224 -0
  148. package/dist/llm/remote_chat_context.test.js.map +1 -0
  149. package/dist/llm/tool_context.cjs +111 -0
  150. package/dist/llm/tool_context.cjs.map +1 -0
  151. package/dist/llm/tool_context.d.cts +125 -0
  152. package/dist/llm/tool_context.d.ts +125 -0
  153. package/dist/llm/tool_context.d.ts.map +1 -0
  154. package/dist/llm/tool_context.js +80 -0
  155. package/dist/llm/tool_context.js.map +1 -0
  156. package/dist/llm/tool_context.test.cjs +162 -0
  157. package/dist/llm/tool_context.test.cjs.map +1 -0
  158. package/dist/llm/tool_context.test.js +161 -0
  159. package/dist/llm/tool_context.test.js.map +1 -0
  160. package/dist/llm/tool_context.type.test.cjs +92 -0
  161. package/dist/llm/tool_context.type.test.cjs.map +1 -0
  162. package/dist/llm/tool_context.type.test.js +91 -0
  163. package/dist/llm/tool_context.type.test.js.map +1 -0
  164. package/dist/llm/utils.cjs +260 -0
  165. package/dist/llm/utils.cjs.map +1 -0
  166. package/dist/llm/utils.d.cts +42 -0
  167. package/dist/llm/utils.d.ts +42 -0
  168. package/dist/llm/utils.d.ts.map +1 -0
  169. package/dist/llm/utils.js +223 -0
  170. package/dist/llm/utils.js.map +1 -0
  171. package/dist/llm/utils.test.cjs +513 -0
  172. package/dist/llm/utils.test.cjs.map +1 -0
  173. package/dist/llm/utils.test.js +490 -0
  174. package/dist/llm/utils.test.js.map +1 -0
  175. package/dist/metrics/base.cjs +0 -27
  176. package/dist/metrics/base.cjs.map +1 -1
  177. package/dist/metrics/base.d.cts +105 -63
  178. package/dist/metrics/base.d.ts +105 -63
  179. package/dist/metrics/base.d.ts.map +1 -1
  180. package/dist/metrics/base.js +0 -19
  181. package/dist/metrics/base.js.map +1 -1
  182. package/dist/metrics/index.cjs +0 -3
  183. package/dist/metrics/index.cjs.map +1 -1
  184. package/dist/metrics/index.d.cts +2 -3
  185. package/dist/metrics/index.d.ts +2 -3
  186. package/dist/metrics/index.d.ts.map +1 -1
  187. package/dist/metrics/index.js +0 -2
  188. package/dist/metrics/index.js.map +1 -1
  189. package/dist/metrics/usage_collector.cjs +17 -12
  190. package/dist/metrics/usage_collector.cjs.map +1 -1
  191. package/dist/metrics/usage_collector.d.cts +3 -2
  192. package/dist/metrics/usage_collector.d.ts +3 -2
  193. package/dist/metrics/usage_collector.d.ts.map +1 -1
  194. package/dist/metrics/usage_collector.js +17 -12
  195. package/dist/metrics/usage_collector.js.map +1 -1
  196. package/dist/metrics/utils.cjs +22 -59
  197. package/dist/metrics/utils.cjs.map +1 -1
  198. package/dist/metrics/utils.d.cts +1 -8
  199. package/dist/metrics/utils.d.ts +1 -8
  200. package/dist/metrics/utils.d.ts.map +1 -1
  201. package/dist/metrics/utils.js +22 -52
  202. package/dist/metrics/utils.js.map +1 -1
  203. package/dist/multimodal/index.cjs +0 -2
  204. package/dist/multimodal/index.cjs.map +1 -1
  205. package/dist/multimodal/index.d.cts +0 -1
  206. package/dist/multimodal/index.d.ts +0 -1
  207. package/dist/multimodal/index.d.ts.map +1 -1
  208. package/dist/multimodal/index.js +0 -1
  209. package/dist/multimodal/index.js.map +1 -1
  210. package/dist/plugin.cjs +24 -8
  211. package/dist/plugin.cjs.map +1 -1
  212. package/dist/plugin.d.cts +18 -4
  213. package/dist/plugin.d.ts +18 -4
  214. package/dist/plugin.d.ts.map +1 -1
  215. package/dist/plugin.js +22 -7
  216. package/dist/plugin.js.map +1 -1
  217. package/dist/stream/deferred_stream.cjs +98 -0
  218. package/dist/stream/deferred_stream.cjs.map +1 -0
  219. package/dist/stream/deferred_stream.d.cts +27 -0
  220. package/dist/stream/deferred_stream.d.ts +27 -0
  221. package/dist/stream/deferred_stream.d.ts.map +1 -0
  222. package/dist/stream/deferred_stream.js +73 -0
  223. package/dist/stream/deferred_stream.js.map +1 -0
  224. package/dist/stream/deferred_stream.test.cjs +527 -0
  225. package/dist/stream/deferred_stream.test.cjs.map +1 -0
  226. package/dist/stream/deferred_stream.test.js +526 -0
  227. package/dist/stream/deferred_stream.test.js.map +1 -0
  228. package/dist/stream/identity_transform.cjs +42 -0
  229. package/dist/stream/identity_transform.cjs.map +1 -0
  230. package/dist/stream/identity_transform.d.cts +6 -0
  231. package/dist/stream/identity_transform.d.ts +6 -0
  232. package/dist/stream/identity_transform.d.ts.map +1 -0
  233. package/dist/stream/identity_transform.js +18 -0
  234. package/dist/stream/identity_transform.js.map +1 -0
  235. package/dist/stream/identity_transform.test.cjs +125 -0
  236. package/dist/stream/identity_transform.test.cjs.map +1 -0
  237. package/dist/stream/identity_transform.test.js +124 -0
  238. package/dist/stream/identity_transform.test.js.map +1 -0
  239. package/dist/stream/index.cjs +38 -0
  240. package/dist/stream/index.cjs.map +1 -0
  241. package/dist/stream/index.d.cts +5 -0
  242. package/dist/stream/index.d.ts +5 -0
  243. package/dist/stream/index.d.ts.map +1 -0
  244. package/dist/stream/index.js +11 -0
  245. package/dist/stream/index.js.map +1 -0
  246. package/dist/stream/merge_readable_streams.cjs +59 -0
  247. package/dist/stream/merge_readable_streams.cjs.map +1 -0
  248. package/dist/stream/merge_readable_streams.d.cts +4 -0
  249. package/dist/stream/merge_readable_streams.d.ts +4 -0
  250. package/dist/stream/merge_readable_streams.d.ts.map +1 -0
  251. package/dist/stream/merge_readable_streams.js +35 -0
  252. package/dist/stream/merge_readable_streams.js.map +1 -0
  253. package/dist/stream/stream_channel.cjs +47 -0
  254. package/dist/stream/stream_channel.cjs.map +1 -0
  255. package/dist/stream/stream_channel.d.cts +9 -0
  256. package/dist/stream/stream_channel.d.ts +9 -0
  257. package/dist/stream/stream_channel.d.ts.map +1 -0
  258. package/dist/stream/stream_channel.js +23 -0
  259. package/dist/stream/stream_channel.js.map +1 -0
  260. package/dist/stream/stream_channel.test.cjs +97 -0
  261. package/dist/stream/stream_channel.test.cjs.map +1 -0
  262. package/dist/stream/stream_channel.test.js +96 -0
  263. package/dist/stream/stream_channel.test.js.map +1 -0
  264. package/dist/stt/stream_adapter.cjs +3 -4
  265. package/dist/stt/stream_adapter.cjs.map +1 -1
  266. package/dist/stt/stream_adapter.d.cts +1 -0
  267. package/dist/stt/stream_adapter.d.ts +1 -0
  268. package/dist/stt/stream_adapter.d.ts.map +1 -1
  269. package/dist/stt/stream_adapter.js +3 -4
  270. package/dist/stt/stream_adapter.js.map +1 -1
  271. package/dist/stt/stt.cjs +100 -10
  272. package/dist/stt/stt.cjs.map +1 -1
  273. package/dist/stt/stt.d.cts +26 -5
  274. package/dist/stt/stt.d.ts +26 -5
  275. package/dist/stt/stt.d.ts.map +1 -1
  276. package/dist/stt/stt.js +101 -11
  277. package/dist/stt/stt.js.map +1 -1
  278. package/dist/tokenize/basic/basic.cjs +10 -5
  279. package/dist/tokenize/basic/basic.cjs.map +1 -1
  280. package/dist/tokenize/basic/basic.d.cts +7 -1
  281. package/dist/tokenize/basic/basic.d.ts +7 -1
  282. package/dist/tokenize/basic/basic.d.ts.map +1 -1
  283. package/dist/tokenize/basic/basic.js +10 -5
  284. package/dist/tokenize/basic/basic.js.map +1 -1
  285. package/dist/tokenize/basic/sentence.cjs +14 -6
  286. package/dist/tokenize/basic/sentence.cjs.map +1 -1
  287. package/dist/tokenize/basic/sentence.d.cts +1 -1
  288. package/dist/tokenize/basic/sentence.d.ts +1 -1
  289. package/dist/tokenize/basic/sentence.d.ts.map +1 -1
  290. package/dist/tokenize/basic/sentence.js +14 -6
  291. package/dist/tokenize/basic/sentence.js.map +1 -1
  292. package/dist/tokenize/token_stream.cjs +5 -3
  293. package/dist/tokenize/token_stream.cjs.map +1 -1
  294. package/dist/tokenize/token_stream.d.cts +1 -0
  295. package/dist/tokenize/token_stream.d.ts +1 -0
  296. package/dist/tokenize/token_stream.d.ts.map +1 -1
  297. package/dist/tokenize/token_stream.js +6 -4
  298. package/dist/tokenize/token_stream.js.map +1 -1
  299. package/dist/transcription.cjs +1 -2
  300. package/dist/transcription.cjs.map +1 -1
  301. package/dist/transcription.d.ts.map +1 -1
  302. package/dist/transcription.js +2 -3
  303. package/dist/transcription.js.map +1 -1
  304. package/dist/tts/index.cjs +2 -4
  305. package/dist/tts/index.cjs.map +1 -1
  306. package/dist/tts/index.d.cts +1 -1
  307. package/dist/tts/index.d.ts +1 -1
  308. package/dist/tts/index.d.ts.map +1 -1
  309. package/dist/tts/index.js +1 -3
  310. package/dist/tts/index.js.map +1 -1
  311. package/dist/tts/stream_adapter.cjs +26 -13
  312. package/dist/tts/stream_adapter.cjs.map +1 -1
  313. package/dist/tts/stream_adapter.d.cts +1 -1
  314. package/dist/tts/stream_adapter.d.ts +1 -1
  315. package/dist/tts/stream_adapter.d.ts.map +1 -1
  316. package/dist/tts/stream_adapter.js +27 -14
  317. package/dist/tts/stream_adapter.js.map +1 -1
  318. package/dist/tts/tts.cjs +156 -25
  319. package/dist/tts/tts.cjs.map +1 -1
  320. package/dist/tts/tts.d.cts +29 -5
  321. package/dist/tts/tts.d.ts +29 -5
  322. package/dist/tts/tts.d.ts.map +1 -1
  323. package/dist/tts/tts.js +156 -24
  324. package/dist/tts/tts.js.map +1 -1
  325. package/dist/types.cjs +60 -0
  326. package/dist/types.cjs.map +1 -0
  327. package/dist/types.d.cts +13 -0
  328. package/dist/types.d.ts +13 -0
  329. package/dist/types.d.ts.map +1 -0
  330. package/dist/types.js +35 -0
  331. package/dist/types.js.map +1 -0
  332. package/dist/utils.cjs +298 -27
  333. package/dist/utils.cjs.map +1 -1
  334. package/dist/utils.d.cts +145 -9
  335. package/dist/utils.d.ts +145 -9
  336. package/dist/utils.d.ts.map +1 -1
  337. package/dist/utils.js +281 -26
  338. package/dist/utils.js.map +1 -1
  339. package/dist/utils.test.cjs +491 -0
  340. package/dist/utils.test.cjs.map +1 -0
  341. package/dist/utils.test.js +498 -0
  342. package/dist/utils.test.js.map +1 -0
  343. package/dist/vad.cjs +76 -20
  344. package/dist/vad.cjs.map +1 -1
  345. package/dist/vad.d.cts +25 -5
  346. package/dist/vad.d.ts +25 -5
  347. package/dist/vad.d.ts.map +1 -1
  348. package/dist/vad.js +76 -20
  349. package/dist/vad.js.map +1 -1
  350. package/dist/voice/agent.cjs +245 -0
  351. package/dist/voice/agent.cjs.map +1 -0
  352. package/dist/voice/agent.d.cts +78 -0
  353. package/dist/voice/agent.d.ts +78 -0
  354. package/dist/voice/agent.d.ts.map +1 -0
  355. package/dist/voice/agent.js +220 -0
  356. package/dist/voice/agent.js.map +1 -0
  357. package/dist/voice/agent.test.cjs +61 -0
  358. package/dist/voice/agent.test.cjs.map +1 -0
  359. package/dist/voice/agent.test.js +60 -0
  360. package/dist/voice/agent.test.js.map +1 -0
  361. package/dist/voice/agent_activity.cjs +1453 -0
  362. package/dist/voice/agent_activity.cjs.map +1 -0
  363. package/dist/voice/agent_activity.d.cts +94 -0
  364. package/dist/voice/agent_activity.d.ts +94 -0
  365. package/dist/voice/agent_activity.d.ts.map +1 -0
  366. package/dist/voice/agent_activity.js +1449 -0
  367. package/dist/voice/agent_activity.js.map +1 -0
  368. package/dist/voice/agent_session.cjs +312 -0
  369. package/dist/voice/agent_session.cjs.map +1 -0
  370. package/dist/voice/agent_session.d.cts +121 -0
  371. package/dist/voice/agent_session.d.ts +121 -0
  372. package/dist/voice/agent_session.d.ts.map +1 -0
  373. package/dist/voice/agent_session.js +295 -0
  374. package/dist/voice/agent_session.js.map +1 -0
  375. package/dist/voice/audio_recognition.cjs +374 -0
  376. package/dist/voice/audio_recognition.cjs.map +1 -0
  377. package/dist/voice/audio_recognition.d.cts +80 -0
  378. package/dist/voice/audio_recognition.d.ts +80 -0
  379. package/dist/voice/audio_recognition.d.ts.map +1 -0
  380. package/dist/voice/audio_recognition.js +350 -0
  381. package/dist/voice/audio_recognition.js.map +1 -0
  382. package/dist/voice/events.cjs +145 -0
  383. package/dist/voice/events.cjs.map +1 -0
  384. package/dist/voice/events.d.cts +124 -0
  385. package/dist/voice/events.d.ts +124 -0
  386. package/dist/voice/events.d.ts.map +1 -0
  387. package/dist/voice/events.js +110 -0
  388. package/dist/voice/events.js.map +1 -0
  389. package/dist/voice/generation.cjs +700 -0
  390. package/dist/voice/generation.cjs.map +1 -0
  391. package/dist/voice/generation.d.cts +115 -0
  392. package/dist/voice/generation.d.ts +115 -0
  393. package/dist/voice/generation.d.ts.map +1 -0
  394. package/dist/voice/generation.js +672 -0
  395. package/dist/voice/generation.js.map +1 -0
  396. package/dist/voice/index.cjs +40 -0
  397. package/dist/voice/index.cjs.map +1 -0
  398. package/dist/voice/index.d.cts +5 -0
  399. package/dist/voice/index.d.ts +5 -0
  400. package/dist/voice/index.d.ts.map +1 -0
  401. package/dist/voice/index.js +11 -0
  402. package/dist/voice/index.js.map +1 -0
  403. package/dist/voice/io.cjs +245 -0
  404. package/dist/voice/io.cjs.map +1 -0
  405. package/dist/voice/io.d.cts +101 -0
  406. package/dist/voice/io.d.ts +101 -0
  407. package/dist/voice/io.d.ts.map +1 -0
  408. package/dist/voice/io.js +217 -0
  409. package/dist/voice/io.js.map +1 -0
  410. package/dist/voice/room_io/_input.cjs +121 -0
  411. package/dist/voice/room_io/_input.cjs.map +1 -0
  412. package/dist/voice/room_io/_input.d.cts +24 -0
  413. package/dist/voice/room_io/_input.d.ts +24 -0
  414. package/dist/voice/room_io/_input.d.ts.map +1 -0
  415. package/dist/voice/room_io/_input.js +102 -0
  416. package/dist/voice/room_io/_input.js.map +1 -0
  417. package/dist/voice/room_io/_output.cjs +358 -0
  418. package/dist/voice/room_io/_output.cjs.map +1 -0
  419. package/dist/voice/room_io/_output.d.cts +75 -0
  420. package/dist/voice/room_io/_output.d.ts +75 -0
  421. package/dist/voice/room_io/_output.d.ts.map +1 -0
  422. package/dist/voice/room_io/_output.js +342 -0
  423. package/dist/voice/room_io/_output.js.map +1 -0
  424. package/dist/voice/room_io/index.cjs +25 -0
  425. package/dist/voice/room_io/index.cjs.map +1 -0
  426. package/dist/voice/room_io/index.d.cts +3 -0
  427. package/dist/voice/room_io/index.d.ts +3 -0
  428. package/dist/voice/room_io/index.d.ts.map +1 -0
  429. package/dist/voice/room_io/index.js +3 -0
  430. package/dist/voice/room_io/index.js.map +1 -0
  431. package/dist/voice/room_io/room_io.cjs +370 -0
  432. package/dist/voice/room_io/room_io.cjs.map +1 -0
  433. package/dist/voice/room_io/room_io.d.cts +73 -0
  434. package/dist/voice/room_io/room_io.d.ts +73 -0
  435. package/dist/voice/room_io/room_io.d.ts.map +1 -0
  436. package/dist/voice/room_io/room_io.js +361 -0
  437. package/dist/voice/room_io/room_io.js.map +1 -0
  438. package/dist/{pipeline/index.cjs → voice/run_context.cjs} +16 -11
  439. package/dist/voice/run_context.cjs.map +1 -0
  440. package/dist/voice/run_context.d.cts +12 -0
  441. package/dist/voice/run_context.d.ts +12 -0
  442. package/dist/voice/run_context.d.ts.map +1 -0
  443. package/dist/voice/run_context.js +14 -0
  444. package/dist/voice/run_context.js.map +1 -0
  445. package/dist/voice/speech_handle.cjs +105 -0
  446. package/dist/voice/speech_handle.cjs.map +1 -0
  447. package/dist/voice/speech_handle.d.cts +46 -0
  448. package/dist/voice/speech_handle.d.ts +46 -0
  449. package/dist/voice/speech_handle.d.ts.map +1 -0
  450. package/dist/voice/speech_handle.js +81 -0
  451. package/dist/voice/speech_handle.js.map +1 -0
  452. package/dist/voice/transcription/_utils.cjs +45 -0
  453. package/dist/voice/transcription/_utils.cjs.map +1 -0
  454. package/dist/voice/transcription/_utils.d.cts +3 -0
  455. package/dist/voice/transcription/_utils.d.ts +3 -0
  456. package/dist/voice/transcription/_utils.d.ts.map +1 -0
  457. package/dist/voice/transcription/_utils.js +21 -0
  458. package/dist/voice/transcription/_utils.js.map +1 -0
  459. package/dist/voice/transcription/index.cjs +23 -0
  460. package/dist/voice/transcription/index.cjs.map +1 -0
  461. package/dist/voice/transcription/index.d.cts +2 -0
  462. package/dist/voice/transcription/index.d.ts +2 -0
  463. package/dist/voice/transcription/index.d.ts.map +1 -0
  464. package/dist/voice/transcription/index.js +2 -0
  465. package/dist/voice/transcription/index.js.map +1 -0
  466. package/dist/voice/transcription/synchronizer.cjs +379 -0
  467. package/dist/voice/transcription/synchronizer.cjs.map +1 -0
  468. package/dist/voice/transcription/synchronizer.d.cts +86 -0
  469. package/dist/voice/transcription/synchronizer.d.ts +86 -0
  470. package/dist/voice/transcription/synchronizer.d.ts.map +1 -0
  471. package/dist/voice/transcription/synchronizer.js +354 -0
  472. package/dist/voice/transcription/synchronizer.js.map +1 -0
  473. package/dist/worker.cjs +22 -4
  474. package/dist/worker.cjs.map +1 -1
  475. package/dist/worker.d.cts +1 -1
  476. package/dist/worker.d.ts +1 -1
  477. package/dist/worker.d.ts.map +1 -1
  478. package/dist/worker.js +22 -4
  479. package/dist/worker.js.map +1 -1
  480. package/package.json +8 -2
  481. package/src/_exceptions.ts +137 -0
  482. package/src/audio.ts +12 -1
  483. package/src/cli.ts +37 -0
  484. package/src/constants.ts +2 -1
  485. package/src/http_server.ts +1 -0
  486. package/src/index.ts +13 -10
  487. package/src/inference_runner.ts +2 -3
  488. package/src/ipc/inference_proc_executor.ts +2 -2
  489. package/src/ipc/job_executor.ts +1 -1
  490. package/src/ipc/job_proc_executor.ts +1 -1
  491. package/src/ipc/job_proc_lazy_main.ts +1 -1
  492. package/src/job.ts +18 -0
  493. package/src/llm/__snapshots__/chat_context.test.ts.snap +527 -0
  494. package/src/llm/__snapshots__/tool_context.test.ts.snap +177 -0
  495. package/src/llm/__snapshots__/utils.test.ts.snap +65 -0
  496. package/src/llm/chat_context.test.ts +450 -0
  497. package/src/llm/chat_context.ts +501 -103
  498. package/src/llm/index.ts +53 -18
  499. package/src/llm/llm.ts +148 -50
  500. package/src/llm/provider_format/google.test.ts +772 -0
  501. package/src/llm/provider_format/google.ts +130 -0
  502. package/src/llm/provider_format/index.ts +23 -0
  503. package/src/llm/provider_format/openai.test.ts +581 -0
  504. package/src/llm/provider_format/openai.ts +118 -0
  505. package/src/llm/provider_format/utils.ts +183 -0
  506. package/src/llm/realtime.ts +151 -0
  507. package/src/llm/remote_chat_context.test.ts +290 -0
  508. package/src/llm/remote_chat_context.ts +114 -0
  509. package/src/llm/tool_context.test.ts +198 -0
  510. package/src/llm/tool_context.ts +259 -0
  511. package/src/llm/tool_context.type.test.ts +115 -0
  512. package/src/llm/utils.test.ts +670 -0
  513. package/src/llm/utils.ts +324 -0
  514. package/src/metrics/base.ts +110 -78
  515. package/src/metrics/index.ts +3 -9
  516. package/src/metrics/usage_collector.ts +19 -13
  517. package/src/metrics/utils.ts +24 -69
  518. package/src/multimodal/index.ts +0 -1
  519. package/src/plugin.ts +26 -8
  520. package/src/stream/deferred_stream.test.ts +755 -0
  521. package/src/stream/deferred_stream.ts +110 -0
  522. package/src/stream/identity_transform.test.ts +179 -0
  523. package/src/stream/identity_transform.ts +18 -0
  524. package/src/stream/index.ts +7 -0
  525. package/src/stream/merge_readable_streams.ts +40 -0
  526. package/src/stream/stream_channel.test.ts +129 -0
  527. package/src/stream/stream_channel.ts +32 -0
  528. package/src/stt/stream_adapter.ts +3 -5
  529. package/src/stt/stt.ts +134 -17
  530. package/src/tokenize/basic/basic.ts +13 -5
  531. package/src/tokenize/basic/sentence.ts +20 -6
  532. package/src/tokenize/token_stream.ts +7 -4
  533. package/src/transcription.ts +2 -3
  534. package/src/tts/index.ts +0 -1
  535. package/src/tts/stream_adapter.ts +42 -16
  536. package/src/tts/tts.ts +202 -21
  537. package/src/types.ts +42 -0
  538. package/src/utils.test.ts +658 -0
  539. package/src/utils.ts +402 -44
  540. package/src/vad.ts +90 -22
  541. package/src/voice/agent.test.ts +80 -0
  542. package/src/voice/agent.ts +332 -0
  543. package/src/voice/agent_activity.ts +1913 -0
  544. package/src/voice/agent_session.ts +460 -0
  545. package/src/voice/audio_recognition.ts +473 -0
  546. package/src/voice/events.ts +252 -0
  547. package/src/voice/generation.ts +881 -0
  548. package/src/voice/index.ts +7 -0
  549. package/src/voice/io.ts +304 -0
  550. package/src/voice/room_io/_input.ts +144 -0
  551. package/src/voice/room_io/_output.ts +436 -0
  552. package/src/voice/room_io/index.ts +5 -0
  553. package/src/voice/room_io/room_io.ts +495 -0
  554. package/src/voice/run_context.ts +20 -0
  555. package/src/voice/speech_handle.ts +104 -0
  556. package/src/voice/transcription/_utils.ts +25 -0
  557. package/src/voice/transcription/index.ts +4 -0
  558. package/src/voice/transcription/synchronizer.ts +477 -0
  559. package/src/worker.ts +22 -2
  560. package/dist/llm/function_context.cjs +0 -103
  561. package/dist/llm/function_context.cjs.map +0 -1
  562. package/dist/llm/function_context.d.cts +0 -47
  563. package/dist/llm/function_context.d.ts +0 -47
  564. package/dist/llm/function_context.d.ts.map +0 -1
  565. package/dist/llm/function_context.js +0 -78
  566. package/dist/llm/function_context.js.map +0 -1
  567. package/dist/llm/function_context.test.cjs +0 -218
  568. package/dist/llm/function_context.test.cjs.map +0 -1
  569. package/dist/llm/function_context.test.js +0 -217
  570. package/dist/llm/function_context.test.js.map +0 -1
  571. package/dist/multimodal/multimodal_agent.cjs +0 -486
  572. package/dist/multimodal/multimodal_agent.cjs.map +0 -1
  573. package/dist/multimodal/multimodal_agent.d.cts +0 -48
  574. package/dist/multimodal/multimodal_agent.d.ts +0 -48
  575. package/dist/multimodal/multimodal_agent.d.ts.map +0 -1
  576. package/dist/multimodal/multimodal_agent.js +0 -461
  577. package/dist/multimodal/multimodal_agent.js.map +0 -1
  578. package/dist/pipeline/agent_output.cjs +0 -197
  579. package/dist/pipeline/agent_output.cjs.map +0 -1
  580. package/dist/pipeline/agent_output.d.cts +0 -33
  581. package/dist/pipeline/agent_output.d.ts +0 -33
  582. package/dist/pipeline/agent_output.d.ts.map +0 -1
  583. package/dist/pipeline/agent_output.js +0 -172
  584. package/dist/pipeline/agent_output.js.map +0 -1
  585. package/dist/pipeline/agent_playout.cjs +0 -175
  586. package/dist/pipeline/agent_playout.cjs.map +0 -1
  587. package/dist/pipeline/agent_playout.d.cts +0 -40
  588. package/dist/pipeline/agent_playout.d.ts +0 -40
  589. package/dist/pipeline/agent_playout.d.ts.map +0 -1
  590. package/dist/pipeline/agent_playout.js +0 -139
  591. package/dist/pipeline/agent_playout.js.map +0 -1
  592. package/dist/pipeline/human_input.cjs +0 -171
  593. package/dist/pipeline/human_input.cjs.map +0 -1
  594. package/dist/pipeline/human_input.d.cts +0 -30
  595. package/dist/pipeline/human_input.d.ts +0 -30
  596. package/dist/pipeline/human_input.d.ts.map +0 -1
  597. package/dist/pipeline/human_input.js +0 -146
  598. package/dist/pipeline/human_input.js.map +0 -1
  599. package/dist/pipeline/index.cjs.map +0 -1
  600. package/dist/pipeline/index.d.cts +0 -2
  601. package/dist/pipeline/index.d.ts +0 -2
  602. package/dist/pipeline/index.d.ts.map +0 -1
  603. package/dist/pipeline/index.js +0 -11
  604. package/dist/pipeline/index.js.map +0 -1
  605. package/dist/pipeline/pipeline_agent.cjs +0 -859
  606. package/dist/pipeline/pipeline_agent.cjs.map +0 -1
  607. package/dist/pipeline/pipeline_agent.d.cts +0 -150
  608. package/dist/pipeline/pipeline_agent.d.ts +0 -150
  609. package/dist/pipeline/pipeline_agent.d.ts.map +0 -1
  610. package/dist/pipeline/pipeline_agent.js +0 -837
  611. package/dist/pipeline/pipeline_agent.js.map +0 -1
  612. package/dist/pipeline/speech_handle.cjs +0 -176
  613. package/dist/pipeline/speech_handle.cjs.map +0 -1
  614. package/dist/pipeline/speech_handle.d.cts +0 -37
  615. package/dist/pipeline/speech_handle.d.ts +0 -37
  616. package/dist/pipeline/speech_handle.d.ts.map +0 -1
  617. package/dist/pipeline/speech_handle.js +0 -152
  618. package/dist/pipeline/speech_handle.js.map +0 -1
  619. package/src/llm/function_context.test.ts +0 -248
  620. package/src/llm/function_context.ts +0 -142
  621. package/src/multimodal/multimodal_agent.ts +0 -592
  622. package/src/pipeline/agent_output.ts +0 -219
  623. package/src/pipeline/agent_playout.ts +0 -192
  624. package/src/pipeline/human_input.ts +0 -188
  625. package/src/pipeline/index.ts +0 -15
  626. package/src/pipeline/pipeline_agent.ts +0 -1197
  627. package/src/pipeline/speech_handle.ts +0 -201
@@ -0,0 +1,672 @@
1
+ import { AudioResampler } from "@livekit/rtc-node";
2
+ import { ZodObject } from "zod";
3
+ import {
4
+ ChatMessage,
5
+ FunctionCall,
6
+ FunctionCallOutput
7
+ } from "../llm/chat_context.js";
8
+ import {
9
+ isAgentHandoff,
10
+ isFunctionTool,
11
+ isToolError
12
+ } from "../llm/tool_context.js";
13
+ import { log } from "../log.js";
14
+ import { IdentityTransform } from "../stream/identity_transform.js";
15
+ import { Future, Task, shortuuid, toError } from "../utils.js";
16
+ import { asyncLocalStorage, isStopResponse } from "./agent.js";
17
+ import { RunContext } from "./run_context.js";
18
+ class _LLMGenerationData {
19
+ constructor(textStream, toolCallStream) {
20
+ this.textStream = textStream;
21
+ this.toolCallStream = toolCallStream;
22
+ this.id = shortuuid("item_");
23
+ this.generatedToolCalls = [];
24
+ }
25
+ generatedText = "";
26
+ generatedToolCalls;
27
+ id;
28
+ }
29
+ class _ToolOutput {
30
+ output;
31
+ firstToolFut;
32
+ constructor() {
33
+ this.output = [];
34
+ this.firstToolFut = new Future();
35
+ }
36
+ }
37
+ class _SanitizedOutput {
38
+ toolCall;
39
+ toolCallOutput;
40
+ replyRequired;
41
+ agentTask;
42
+ constructor(toolCall, toolCallOutput, replyRequired, agentTask) {
43
+ this.toolCall = toolCall;
44
+ this.toolCallOutput = toolCallOutput;
45
+ this.replyRequired = replyRequired;
46
+ this.agentTask = agentTask;
47
+ }
48
+ static create(params) {
49
+ const { toolCall, toolCallOutput, replyRequired = true, agentTask } = params;
50
+ return new _SanitizedOutput(toolCall, toolCallOutput, replyRequired, agentTask);
51
+ }
52
+ }
53
+ function isValidToolOutput(toolOutput) {
54
+ const validTypes = ["string", "number", "boolean"];
55
+ if (validTypes.includes(typeof toolOutput)) {
56
+ return true;
57
+ }
58
+ if (toolOutput === void 0 || toolOutput === null) {
59
+ return true;
60
+ }
61
+ if (Array.isArray(toolOutput)) {
62
+ return toolOutput.every(isValidToolOutput);
63
+ }
64
+ if (toolOutput instanceof Set) {
65
+ return Array.from(toolOutput).every(isValidToolOutput);
66
+ }
67
+ if (toolOutput instanceof Map) {
68
+ return Array.from(toolOutput.values()).every(isValidToolOutput);
69
+ }
70
+ if (toolOutput instanceof Object) {
71
+ return Object.entries(toolOutput).every(
72
+ ([key, value]) => validTypes.includes(typeof key) && isValidToolOutput(value)
73
+ );
74
+ }
75
+ return false;
76
+ }
77
+ class ToolExecutionOutput {
78
+ constructor(toolCall, toolCallOutput, agentTask, rawOutput, rawException, replyRequired) {
79
+ this.toolCall = toolCall;
80
+ this.toolCallOutput = toolCallOutput;
81
+ this.agentTask = agentTask;
82
+ this.rawOutput = rawOutput;
83
+ this.rawException = rawException;
84
+ this.replyRequired = replyRequired;
85
+ }
86
+ static create(params) {
87
+ const {
88
+ toolCall,
89
+ toolCallOutput,
90
+ agentTask,
91
+ rawOutput,
92
+ rawException,
93
+ replyRequired = true
94
+ } = params;
95
+ return new ToolExecutionOutput(
96
+ toolCall,
97
+ toolCallOutput,
98
+ agentTask,
99
+ rawOutput,
100
+ rawException,
101
+ replyRequired
102
+ );
103
+ }
104
+ }
105
+ class _JsOutput {
106
+ toolCall;
107
+ output;
108
+ exception;
109
+ #logger = log();
110
+ constructor(toolCall, output, exception) {
111
+ this.toolCall = toolCall;
112
+ this.output = output;
113
+ this.exception = exception;
114
+ }
115
+ static create(params) {
116
+ const { toolCall, output = void 0, exception = void 0 } = params;
117
+ return new _JsOutput(toolCall, output, exception);
118
+ }
119
+ sanitize() {
120
+ if (isToolError(this.exception)) {
121
+ return _SanitizedOutput.create({
122
+ toolCall: FunctionCall.create({ ...this.toolCall }),
123
+ toolCallOutput: FunctionCallOutput.create({
124
+ name: this.toolCall.name,
125
+ callId: this.toolCall.callId,
126
+ output: this.exception.message,
127
+ isError: true
128
+ })
129
+ });
130
+ }
131
+ if (isStopResponse(this.exception)) {
132
+ return _SanitizedOutput.create({
133
+ toolCall: FunctionCall.create({ ...this.toolCall })
134
+ });
135
+ }
136
+ if (this.exception !== void 0) {
137
+ return _SanitizedOutput.create({
138
+ toolCall: FunctionCall.create({ ...this.toolCall }),
139
+ toolCallOutput: FunctionCallOutput.create({
140
+ name: this.toolCall.name,
141
+ callId: this.toolCall.callId,
142
+ output: "An internal error occurred while executing the tool.",
143
+ // Don't send the actual error message, as it may contain sensitive information
144
+ isError: true
145
+ })
146
+ });
147
+ }
148
+ let agentTask = void 0;
149
+ let toolOutput = this.output;
150
+ if (isAgentHandoff(this.output)) {
151
+ agentTask = this.output.agent;
152
+ toolOutput = this.output.returns;
153
+ }
154
+ if (!isValidToolOutput(toolOutput)) {
155
+ this.#logger.error(
156
+ {
157
+ callId: this.toolCall.callId,
158
+ function: this.toolCall.name
159
+ },
160
+ `AI function ${this.toolCall.name} returned an invalid output`
161
+ );
162
+ return _SanitizedOutput.create({
163
+ toolCall: FunctionCall.create({ ...this.toolCall }),
164
+ toolCallOutput: void 0
165
+ });
166
+ }
167
+ return _SanitizedOutput.create({
168
+ toolCall: FunctionCall.create({ ...this.toolCall }),
169
+ toolCallOutput: FunctionCallOutput.create({
170
+ name: this.toolCall.name,
171
+ callId: this.toolCall.callId,
172
+ output: toolOutput !== void 0 ? JSON.stringify(toolOutput) : "",
173
+ // take the string representation of the output
174
+ isError: false
175
+ }),
176
+ replyRequired: toolOutput !== void 0,
177
+ // require a reply if the tool returned an output
178
+ agentTask
179
+ });
180
+ }
181
+ }
182
+ function createToolOutput(params) {
183
+ const { toolCall, output, exception } = params;
184
+ const logger = log();
185
+ let finalOutput = output;
186
+ let finalException = exception;
187
+ if (output instanceof Error) {
188
+ finalException = output;
189
+ finalOutput = void 0;
190
+ }
191
+ if (isToolError(finalException)) {
192
+ return ToolExecutionOutput.create({
193
+ toolCall: FunctionCall.create({ ...toolCall }),
194
+ toolCallOutput: FunctionCallOutput.create({
195
+ name: toolCall.name,
196
+ callId: toolCall.callId,
197
+ output: finalException.message,
198
+ isError: true
199
+ }),
200
+ rawOutput: finalOutput,
201
+ rawException: finalException
202
+ });
203
+ }
204
+ if (isStopResponse(finalException)) {
205
+ return ToolExecutionOutput.create({
206
+ toolCall: FunctionCall.create({ ...toolCall }),
207
+ rawOutput: finalOutput,
208
+ rawException: finalException
209
+ });
210
+ }
211
+ if (finalException !== void 0) {
212
+ return ToolExecutionOutput.create({
213
+ toolCall: FunctionCall.create({ ...toolCall }),
214
+ toolCallOutput: FunctionCallOutput.create({
215
+ name: toolCall.name,
216
+ callId: toolCall.callId,
217
+ output: "An internal error occurred",
218
+ // Don't send the actual error message, as it may contain sensitive information
219
+ isError: true
220
+ }),
221
+ rawOutput: finalOutput,
222
+ rawException: finalException
223
+ });
224
+ }
225
+ let agentTask = void 0;
226
+ let toolOutput = finalOutput;
227
+ if (isAgentHandoff(finalOutput)) {
228
+ agentTask = finalOutput.agent;
229
+ toolOutput = finalOutput.returns;
230
+ }
231
+ if (!isValidToolOutput(toolOutput)) {
232
+ logger.error(
233
+ {
234
+ callId: toolCall.callId,
235
+ output: finalOutput
236
+ },
237
+ `AI function ${toolCall.name} returned an invalid output`
238
+ );
239
+ return ToolExecutionOutput.create({
240
+ toolCall: FunctionCall.create({ ...toolCall }),
241
+ rawOutput: finalOutput,
242
+ rawException: finalException
243
+ });
244
+ }
245
+ return ToolExecutionOutput.create({
246
+ toolCall: FunctionCall.create({ ...toolCall }),
247
+ toolCallOutput: FunctionCallOutput.create({
248
+ name: toolCall.name,
249
+ callId: toolCall.callId,
250
+ output: toolOutput !== void 0 ? JSON.stringify(toolOutput) : "",
251
+ // take the string representation of the output
252
+ isError: false
253
+ }),
254
+ replyRequired: toolOutput !== void 0,
255
+ // require a reply if the tool returned an output
256
+ agentTask,
257
+ rawOutput: finalOutput,
258
+ rawException: finalException
259
+ });
260
+ }
261
+ const INSTRUCTIONS_MESSAGE_ID = "lk.agent_task.instructions";
262
+ function updateInstructions(options) {
263
+ const { chatCtx, instructions, addIfMissing } = options;
264
+ const idx = chatCtx.indexById(INSTRUCTIONS_MESSAGE_ID);
265
+ if (idx !== void 0) {
266
+ if (chatCtx.items[idx].type === "message") {
267
+ chatCtx.items[idx] = ChatMessage.create({
268
+ id: INSTRUCTIONS_MESSAGE_ID,
269
+ role: "system",
270
+ content: [instructions],
271
+ createdAt: chatCtx.items[idx].createdAt
272
+ });
273
+ } else {
274
+ throw new Error('expected the instructions inside the chatCtx to be of type "message"');
275
+ }
276
+ } else if (addIfMissing) {
277
+ chatCtx.items.unshift(
278
+ ChatMessage.create({
279
+ id: INSTRUCTIONS_MESSAGE_ID,
280
+ role: "system",
281
+ content: [instructions]
282
+ })
283
+ );
284
+ }
285
+ }
286
+ function performLLMInference(node, chatCtx, toolCtx, modelSettings, controller) {
287
+ const textStream = new IdentityTransform();
288
+ const toolCallStream = new IdentityTransform();
289
+ const textWriter = textStream.writable.getWriter();
290
+ const toolCallWriter = toolCallStream.writable.getWriter();
291
+ const data = new _LLMGenerationData(textStream.readable, toolCallStream.readable);
292
+ const inferenceTask = async (signal) => {
293
+ let llmStreamReader = null;
294
+ let llmStream = null;
295
+ try {
296
+ llmStream = await node(chatCtx, toolCtx, modelSettings);
297
+ if (llmStream === null) {
298
+ await textWriter.close();
299
+ return;
300
+ }
301
+ llmStreamReader = llmStream.getReader();
302
+ while (true) {
303
+ if (signal.aborted) {
304
+ break;
305
+ }
306
+ const { done, value: chunk } = await llmStreamReader.read();
307
+ if (done) {
308
+ break;
309
+ }
310
+ if (typeof chunk === "string") {
311
+ data.generatedText += chunk;
312
+ await textWriter.write(chunk);
313
+ } else {
314
+ if (chunk.delta === void 0) {
315
+ continue;
316
+ }
317
+ if (chunk.delta.toolCalls) {
318
+ for (const tool of chunk.delta.toolCalls) {
319
+ if (tool.type !== "function_call") continue;
320
+ const toolCall = FunctionCall.create({
321
+ callId: `${data.id}/fnc_${data.generatedToolCalls.length}`,
322
+ name: tool.name,
323
+ args: tool.args
324
+ });
325
+ data.generatedToolCalls.push(toolCall);
326
+ await toolCallWriter.write(toolCall);
327
+ }
328
+ }
329
+ if (chunk.delta.content) {
330
+ data.generatedText += chunk.delta.content;
331
+ await textWriter.write(chunk.delta.content);
332
+ }
333
+ }
334
+ }
335
+ } catch (error) {
336
+ if (error instanceof DOMException && error.name === "AbortError") {
337
+ return;
338
+ }
339
+ throw error;
340
+ } finally {
341
+ llmStreamReader == null ? void 0 : llmStreamReader.releaseLock();
342
+ await (llmStream == null ? void 0 : llmStream.cancel());
343
+ await textWriter.close();
344
+ await toolCallWriter.close();
345
+ }
346
+ };
347
+ return [
348
+ Task.from((controller2) => inferenceTask(controller2.signal), controller, "performLLMInference"),
349
+ data
350
+ ];
351
+ }
352
+ function performTTSInference(node, text, modelSettings, controller) {
353
+ const audioStream = new IdentityTransform();
354
+ const outputWriter = audioStream.writable.getWriter();
355
+ const audioOutputStream = audioStream.readable;
356
+ const inferenceTask = async (signal) => {
357
+ let ttsStreamReader = null;
358
+ let ttsStream = null;
359
+ try {
360
+ ttsStream = await node(text, modelSettings);
361
+ if (ttsStream === null) {
362
+ await outputWriter.close();
363
+ return;
364
+ }
365
+ ttsStreamReader = ttsStream.getReader();
366
+ while (true) {
367
+ if (signal.aborted) {
368
+ break;
369
+ }
370
+ const { done, value: chunk } = await ttsStreamReader.read();
371
+ if (done) {
372
+ break;
373
+ }
374
+ await outputWriter.write(chunk);
375
+ }
376
+ } catch (error) {
377
+ if (error instanceof DOMException && error.name === "AbortError") {
378
+ return;
379
+ }
380
+ throw error;
381
+ } finally {
382
+ ttsStreamReader == null ? void 0 : ttsStreamReader.releaseLock();
383
+ await (ttsStream == null ? void 0 : ttsStream.cancel());
384
+ await outputWriter.close();
385
+ }
386
+ };
387
+ return [
388
+ Task.from((controller2) => inferenceTask(controller2.signal), controller, "performTTSInference"),
389
+ audioOutputStream
390
+ ];
391
+ }
392
+ async function forwardText(source, out, signal, textOutput) {
393
+ const reader = source.getReader();
394
+ try {
395
+ while (true) {
396
+ if (signal.aborted) {
397
+ break;
398
+ }
399
+ const { done, value: delta } = await reader.read();
400
+ if (done) break;
401
+ out.text += delta;
402
+ if (textOutput !== null) {
403
+ await textOutput.captureText(delta);
404
+ }
405
+ if (!out.firstTextFut.done) {
406
+ out.firstTextFut.resolve();
407
+ }
408
+ }
409
+ } finally {
410
+ if (textOutput !== null) {
411
+ textOutput.flush();
412
+ }
413
+ reader == null ? void 0 : reader.releaseLock();
414
+ }
415
+ }
416
+ function performTextForwarding(source, controller, textOutput) {
417
+ const out = {
418
+ text: "",
419
+ firstTextFut: new Future()
420
+ };
421
+ return [
422
+ Task.from(
423
+ (controller2) => forwardText(source, out, controller2.signal, textOutput),
424
+ controller,
425
+ "performTextForwarding"
426
+ ),
427
+ out
428
+ ];
429
+ }
430
+ async function forwardAudio(ttsStream, audioOuput, out, signal) {
431
+ const reader = ttsStream.getReader();
432
+ let resampler = null;
433
+ try {
434
+ while (true) {
435
+ if (signal == null ? void 0 : signal.aborted) {
436
+ break;
437
+ }
438
+ const { done, value: frame } = await reader.read();
439
+ if (done) break;
440
+ out.audio.push(frame);
441
+ if (!out.firstFrameFut.done && audioOuput.sampleRate && audioOuput.sampleRate !== frame.sampleRate && !resampler) {
442
+ resampler = new AudioResampler(frame.sampleRate, audioOuput.sampleRate, 1);
443
+ }
444
+ if (resampler) {
445
+ for (const f of resampler.push(frame)) {
446
+ await audioOuput.captureFrame(f);
447
+ }
448
+ } else {
449
+ await audioOuput.captureFrame(frame);
450
+ }
451
+ if (!out.firstFrameFut.done) {
452
+ out.firstFrameFut.resolve();
453
+ }
454
+ }
455
+ } finally {
456
+ reader == null ? void 0 : reader.releaseLock();
457
+ if (resampler) {
458
+ for (const f of resampler.flush()) {
459
+ await audioOuput.captureFrame(f);
460
+ }
461
+ }
462
+ audioOuput.flush();
463
+ }
464
+ }
465
+ function performAudioForwarding(ttsStream, audioOutput, controller) {
466
+ const out = {
467
+ audio: [],
468
+ firstFrameFut: new Future()
469
+ };
470
+ return [
471
+ Task.from(
472
+ (controller2) => forwardAudio(ttsStream, audioOutput, out, controller2.signal),
473
+ controller,
474
+ "performAudioForwarding"
475
+ ),
476
+ out
477
+ ];
478
+ }
479
+ function performToolExecutions({
480
+ session,
481
+ speechHandle,
482
+ toolCtx,
483
+ toolChoice,
484
+ toolCallStream,
485
+ onToolExecutionStarted = () => {
486
+ },
487
+ onToolExecutionCompleted = () => {
488
+ },
489
+ controller
490
+ }) {
491
+ const logger = log();
492
+ const toolOutput = {
493
+ output: [],
494
+ firstToolStartedFuture: new Future()
495
+ };
496
+ const toolCompleted = (out) => {
497
+ onToolExecutionCompleted(out);
498
+ toolOutput.output.push(out);
499
+ };
500
+ const executeToolsTask = async (controller2) => {
501
+ const signal = controller2.signal;
502
+ const reader = toolCallStream.getReader();
503
+ const tasks = [];
504
+ while (!signal.aborted) {
505
+ const { done, value: toolCall } = await reader.read();
506
+ if (signal.aborted) break;
507
+ if (done) break;
508
+ if (toolChoice === "none") {
509
+ logger.error(
510
+ {
511
+ function: toolCall.name,
512
+ speech_id: speechHandle.id
513
+ },
514
+ "received a tool call with toolChoice set to 'none', ignoring"
515
+ );
516
+ continue;
517
+ }
518
+ const tool = toolCtx[toolCall.name];
519
+ if (!tool) {
520
+ logger.warn(
521
+ {
522
+ function: toolCall.name,
523
+ speech_id: speechHandle.id
524
+ },
525
+ `unknown AI function ${toolCall.name}`
526
+ );
527
+ continue;
528
+ }
529
+ if (!isFunctionTool(tool)) {
530
+ logger.error(
531
+ {
532
+ function: toolCall.name,
533
+ speech_id: speechHandle.id
534
+ },
535
+ `unknown tool type: ${typeof tool}`
536
+ );
537
+ continue;
538
+ }
539
+ let parsedArgs;
540
+ try {
541
+ const jsonArgs = JSON.parse(toolCall.args);
542
+ if (tool.parameters instanceof ZodObject) {
543
+ parsedArgs = tool.parameters.parse(jsonArgs);
544
+ } else {
545
+ parsedArgs = jsonArgs;
546
+ }
547
+ } catch (rawError) {
548
+ const error = toError(rawError);
549
+ logger.error(
550
+ {
551
+ function: toolCall.name,
552
+ arguments: toolCall.args,
553
+ speech_id: speechHandle.id,
554
+ error: error.message
555
+ },
556
+ `tried to call AI function ${toolCall.name} with invalid arguments`
557
+ );
558
+ toolCompleted(
559
+ createToolOutput({
560
+ toolCall,
561
+ exception: error
562
+ })
563
+ );
564
+ continue;
565
+ }
566
+ if (!toolOutput.firstToolStartedFuture.done) {
567
+ toolOutput.firstToolStartedFuture.resolve();
568
+ }
569
+ onToolExecutionStarted(toolCall);
570
+ logger.info(
571
+ {
572
+ function: toolCall.name,
573
+ arguments: parsedArgs,
574
+ speech_id: speechHandle.id
575
+ },
576
+ "Executing LLM tool call"
577
+ );
578
+ const toolExecution = asyncLocalStorage.run({ functionCall: toolCall }, async () => {
579
+ return await tool.execute(parsedArgs, {
580
+ ctx: new RunContext(session, speechHandle, toolCall),
581
+ toolCallId: toolCall.callId,
582
+ abortSignal: signal
583
+ });
584
+ });
585
+ const tracableToolExecution = async (toolExecTask) => {
586
+ let toolOutput2;
587
+ try {
588
+ const { result, isAborted } = await waitUntilAborted(toolExecTask, signal);
589
+ toolOutput2 = createToolOutput({
590
+ toolCall,
591
+ exception: isAborted ? new Error("tool call was aborted") : void 0,
592
+ output: isAborted ? void 0 : result
593
+ });
594
+ } catch (rawError) {
595
+ logger.error(
596
+ {
597
+ function: toolCall.name,
598
+ speech_id: speechHandle.id,
599
+ error: toError(rawError).message
600
+ },
601
+ "exception occurred while executing tool"
602
+ );
603
+ toolOutput2 = createToolOutput({
604
+ toolCall,
605
+ exception: toError(rawError)
606
+ });
607
+ } finally {
608
+ if (!toolOutput2) throw new Error("toolOutput is undefined");
609
+ toolCompleted(toolOutput2);
610
+ }
611
+ };
612
+ tasks.push(tracableToolExecution(toolExecution));
613
+ }
614
+ await Promise.allSettled(tasks);
615
+ if (toolOutput.output.length > 0) {
616
+ logger.debug(
617
+ {
618
+ speech_id: speechHandle.id
619
+ },
620
+ "tools execution completed"
621
+ );
622
+ }
623
+ };
624
+ return [Task.from(executeToolsTask, controller, "performToolExecutions"), toolOutput];
625
+ }
626
+ async function waitUntilAborted(promise, signal) {
627
+ const abortFut = new Future();
628
+ const resolveAbort = () => {
629
+ if (!abortFut.done) {
630
+ abortFut.resolve({ result: void 0, isAborted: true });
631
+ }
632
+ };
633
+ signal.addEventListener("abort", resolveAbort);
634
+ promise.then((r) => {
635
+ if (!abortFut.done) {
636
+ abortFut.resolve({ result: r, isAborted: false });
637
+ }
638
+ }).catch((e) => {
639
+ if (!abortFut.done) {
640
+ abortFut.reject(e);
641
+ }
642
+ }).finally(() => {
643
+ signal.removeEventListener("abort", resolveAbort);
644
+ });
645
+ return await abortFut.await;
646
+ }
647
+ function removeInstructions(chatCtx) {
648
+ while (true) {
649
+ const idx = chatCtx.indexById(INSTRUCTIONS_MESSAGE_ID);
650
+ if (idx !== void 0) {
651
+ chatCtx.items.splice(idx, 1);
652
+ } else {
653
+ break;
654
+ }
655
+ }
656
+ }
657
+ export {
658
+ ToolExecutionOutput,
659
+ _JsOutput,
660
+ _LLMGenerationData,
661
+ _SanitizedOutput,
662
+ _ToolOutput,
663
+ createToolOutput,
664
+ performAudioForwarding,
665
+ performLLMInference,
666
+ performTTSInference,
667
+ performTextForwarding,
668
+ performToolExecutions,
669
+ removeInstructions,
670
+ updateInstructions
671
+ };
672
+ //# sourceMappingURL=generation.js.map