@livekit/agents 1.1.0 → 1.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (942)
  1. package/dist/audio.cjs +89 -3
  2. package/dist/audio.cjs.map +1 -1
  3. package/dist/audio.d.cts +36 -1
  4. package/dist/audio.d.ts +36 -1
  5. package/dist/audio.d.ts.map +1 -1
  6. package/dist/audio.js +76 -2
  7. package/dist/audio.js.map +1 -1
  8. package/dist/beta/index.cjs +29 -0
  9. package/dist/beta/index.cjs.map +1 -0
  10. package/dist/beta/index.d.cts +2 -0
  11. package/dist/beta/index.d.ts +2 -0
  12. package/dist/beta/index.d.ts.map +1 -0
  13. package/dist/beta/index.js +7 -0
  14. package/dist/beta/index.js.map +1 -0
  15. package/dist/beta/workflows/index.cjs +29 -0
  16. package/dist/beta/workflows/index.cjs.map +1 -0
  17. package/dist/beta/workflows/index.d.cts +2 -0
  18. package/dist/beta/workflows/index.d.ts +2 -0
  19. package/dist/beta/workflows/index.d.ts.map +1 -0
  20. package/dist/beta/workflows/index.js +7 -0
  21. package/dist/beta/workflows/index.js.map +1 -0
  22. package/dist/beta/workflows/task_group.cjs +162 -0
  23. package/dist/beta/workflows/task_group.cjs.map +1 -0
  24. package/dist/beta/workflows/task_group.d.cts +32 -0
  25. package/dist/beta/workflows/task_group.d.ts +32 -0
  26. package/dist/beta/workflows/task_group.d.ts.map +1 -0
  27. package/dist/beta/workflows/task_group.js +138 -0
  28. package/dist/beta/workflows/task_group.js.map +1 -0
  29. package/dist/cli.cjs +44 -46
  30. package/dist/cli.cjs.map +1 -1
  31. package/dist/cli.d.cts +3 -3
  32. package/dist/cli.d.ts +3 -3
  33. package/dist/cli.d.ts.map +1 -1
  34. package/dist/cli.js +45 -47
  35. package/dist/cli.js.map +1 -1
  36. package/dist/connection_pool.cjs +242 -0
  37. package/dist/connection_pool.cjs.map +1 -0
  38. package/dist/connection_pool.d.cts +123 -0
  39. package/dist/connection_pool.d.ts +123 -0
  40. package/dist/connection_pool.d.ts.map +1 -0
  41. package/dist/connection_pool.js +218 -0
  42. package/dist/connection_pool.js.map +1 -0
  43. package/dist/connection_pool.test.cjs +256 -0
  44. package/dist/connection_pool.test.cjs.map +1 -0
  45. package/dist/connection_pool.test.js +255 -0
  46. package/dist/connection_pool.test.js.map +1 -0
  47. package/dist/constants.cjs +30 -0
  48. package/dist/constants.cjs.map +1 -1
  49. package/dist/constants.d.cts +10 -0
  50. package/dist/constants.d.ts +10 -0
  51. package/dist/constants.d.ts.map +1 -1
  52. package/dist/constants.js +20 -0
  53. package/dist/constants.js.map +1 -1
  54. package/dist/cpu.cjs +189 -0
  55. package/dist/cpu.cjs.map +1 -0
  56. package/dist/cpu.d.cts +24 -0
  57. package/dist/cpu.d.ts +24 -0
  58. package/dist/cpu.d.ts.map +1 -0
  59. package/dist/cpu.js +152 -0
  60. package/dist/cpu.js.map +1 -0
  61. package/dist/cpu.test.cjs +227 -0
  62. package/dist/cpu.test.cjs.map +1 -0
  63. package/dist/cpu.test.js +204 -0
  64. package/dist/cpu.test.js.map +1 -0
  65. package/dist/http_server.cjs +9 -6
  66. package/dist/http_server.cjs.map +1 -1
  67. package/dist/http_server.d.cts +5 -1
  68. package/dist/http_server.d.ts +5 -1
  69. package/dist/http_server.d.ts.map +1 -1
  70. package/dist/http_server.js +9 -6
  71. package/dist/http_server.js.map +1 -1
  72. package/dist/index.cjs +24 -9
  73. package/dist/index.cjs.map +1 -1
  74. package/dist/index.d.cts +15 -11
  75. package/dist/index.d.ts +15 -11
  76. package/dist/index.d.ts.map +1 -1
  77. package/dist/index.js +18 -9
  78. package/dist/index.js.map +1 -1
  79. package/dist/inference/api_protos.cjs +70 -2
  80. package/dist/inference/api_protos.cjs.map +1 -1
  81. package/dist/inference/api_protos.d.cts +373 -32
  82. package/dist/inference/api_protos.d.ts +373 -32
  83. package/dist/inference/api_protos.d.ts.map +1 -1
  84. package/dist/inference/api_protos.js +62 -2
  85. package/dist/inference/api_protos.js.map +1 -1
  86. package/dist/inference/index.cjs +8 -0
  87. package/dist/inference/index.cjs.map +1 -1
  88. package/dist/inference/index.d.cts +3 -4
  89. package/dist/inference/index.d.ts +3 -4
  90. package/dist/inference/index.d.ts.map +1 -1
  91. package/dist/inference/index.js +18 -3
  92. package/dist/inference/index.js.map +1 -1
  93. package/dist/inference/interruption/defaults.cjs +81 -0
  94. package/dist/inference/interruption/defaults.cjs.map +1 -0
  95. package/dist/inference/interruption/defaults.d.cts +19 -0
  96. package/dist/inference/interruption/defaults.d.ts +19 -0
  97. package/dist/inference/interruption/defaults.d.ts.map +1 -0
  98. package/dist/inference/interruption/defaults.js +46 -0
  99. package/dist/inference/interruption/defaults.js.map +1 -0
  100. package/dist/inference/interruption/errors.cjs +44 -0
  101. package/dist/inference/interruption/errors.cjs.map +1 -0
  102. package/dist/inference/interruption/errors.d.cts +12 -0
  103. package/dist/inference/interruption/errors.d.ts +12 -0
  104. package/dist/inference/interruption/errors.d.ts.map +1 -0
  105. package/dist/inference/interruption/errors.js +20 -0
  106. package/dist/inference/interruption/errors.js.map +1 -0
  107. package/dist/inference/interruption/http_transport.cjs +163 -0
  108. package/dist/inference/interruption/http_transport.cjs.map +1 -0
  109. package/dist/inference/interruption/http_transport.d.cts +63 -0
  110. package/dist/inference/interruption/http_transport.d.ts +63 -0
  111. package/dist/inference/interruption/http_transport.d.ts.map +1 -0
  112. package/dist/inference/interruption/http_transport.js +137 -0
  113. package/dist/inference/interruption/http_transport.js.map +1 -0
  114. package/dist/inference/interruption/interruption_cache_entry.cjs +58 -0
  115. package/dist/inference/interruption/interruption_cache_entry.cjs.map +1 -0
  116. package/dist/inference/interruption/interruption_cache_entry.d.cts +30 -0
  117. package/dist/inference/interruption/interruption_cache_entry.d.ts +30 -0
  118. package/dist/inference/interruption/interruption_cache_entry.d.ts.map +1 -0
  119. package/dist/inference/interruption/interruption_cache_entry.js +34 -0
  120. package/dist/inference/interruption/interruption_cache_entry.js.map +1 -0
  121. package/dist/inference/interruption/interruption_detector.cjs +198 -0
  122. package/dist/inference/interruption/interruption_detector.cjs.map +1 -0
  123. package/dist/inference/interruption/interruption_detector.d.cts +59 -0
  124. package/dist/inference/interruption/interruption_detector.d.ts +59 -0
  125. package/dist/inference/interruption/interruption_detector.d.ts.map +1 -0
  126. package/dist/inference/interruption/interruption_detector.js +164 -0
  127. package/dist/inference/interruption/interruption_detector.js.map +1 -0
  128. package/dist/inference/interruption/interruption_stream.cjs +368 -0
  129. package/dist/inference/interruption/interruption_stream.cjs.map +1 -0
  130. package/dist/inference/interruption/interruption_stream.d.cts +46 -0
  131. package/dist/inference/interruption/interruption_stream.d.ts +46 -0
  132. package/dist/inference/interruption/interruption_stream.d.ts.map +1 -0
  133. package/dist/inference/interruption/interruption_stream.js +344 -0
  134. package/dist/inference/interruption/interruption_stream.js.map +1 -0
  135. package/dist/inference/interruption/types.cjs +17 -0
  136. package/dist/inference/interruption/types.cjs.map +1 -0
  137. package/dist/inference/interruption/types.d.cts +66 -0
  138. package/dist/inference/interruption/types.d.ts +66 -0
  139. package/dist/inference/interruption/types.d.ts.map +1 -0
  140. package/dist/inference/interruption/types.js +1 -0
  141. package/dist/inference/interruption/types.js.map +1 -0
  142. package/dist/inference/interruption/utils.cjs +130 -0
  143. package/dist/inference/interruption/utils.cjs.map +1 -0
  144. package/dist/inference/interruption/utils.d.cts +41 -0
  145. package/dist/inference/interruption/utils.d.ts +41 -0
  146. package/dist/inference/interruption/utils.d.ts.map +1 -0
  147. package/dist/inference/interruption/utils.js +105 -0
  148. package/dist/inference/interruption/utils.js.map +1 -0
  149. package/dist/inference/interruption/utils.test.cjs +105 -0
  150. package/dist/inference/interruption/utils.test.cjs.map +1 -0
  151. package/dist/inference/interruption/utils.test.js +104 -0
  152. package/dist/inference/interruption/utils.test.js.map +1 -0
  153. package/dist/inference/interruption/ws_transport.cjs +342 -0
  154. package/dist/inference/interruption/ws_transport.cjs.map +1 -0
  155. package/dist/inference/interruption/ws_transport.d.cts +33 -0
  156. package/dist/inference/interruption/ws_transport.d.ts +33 -0
  157. package/dist/inference/interruption/ws_transport.d.ts.map +1 -0
  158. package/dist/inference/interruption/ws_transport.js +308 -0
  159. package/dist/inference/interruption/ws_transport.js.map +1 -0
  160. package/dist/inference/llm.cjs +106 -66
  161. package/dist/inference/llm.cjs.map +1 -1
  162. package/dist/inference/llm.d.cts +65 -43
  163. package/dist/inference/llm.d.ts +65 -43
  164. package/dist/inference/llm.d.ts.map +1 -1
  165. package/dist/inference/llm.js +100 -66
  166. package/dist/inference/llm.js.map +1 -1
  167. package/dist/inference/stt.cjs +319 -170
  168. package/dist/inference/stt.cjs.map +1 -1
  169. package/dist/inference/stt.d.cts +64 -15
  170. package/dist/inference/stt.d.ts +64 -15
  171. package/dist/inference/stt.d.ts.map +1 -1
  172. package/dist/inference/stt.js +319 -170
  173. package/dist/inference/stt.js.map +1 -1
  174. package/dist/inference/stt.test.cjs +218 -0
  175. package/dist/inference/stt.test.cjs.map +1 -0
  176. package/dist/inference/stt.test.js +217 -0
  177. package/dist/inference/stt.test.js.map +1 -0
  178. package/dist/inference/tts.cjs +249 -71
  179. package/dist/inference/tts.cjs.map +1 -1
  180. package/dist/inference/tts.d.cts +55 -16
  181. package/dist/inference/tts.d.ts +55 -16
  182. package/dist/inference/tts.d.ts.map +1 -1
  183. package/dist/inference/tts.js +249 -77
  184. package/dist/inference/tts.js.map +1 -1
  185. package/dist/inference/tts.test.cjs +233 -0
  186. package/dist/inference/tts.test.cjs.map +1 -0
  187. package/dist/inference/tts.test.js +232 -0
  188. package/dist/inference/tts.test.js.map +1 -0
  189. package/dist/inference/utils.cjs +26 -7
  190. package/dist/inference/utils.cjs.map +1 -1
  191. package/dist/inference/utils.d.cts +14 -1
  192. package/dist/inference/utils.d.ts +14 -1
  193. package/dist/inference/utils.d.ts.map +1 -1
  194. package/dist/inference/utils.js +18 -2
  195. package/dist/inference/utils.js.map +1 -1
  196. package/dist/ipc/inference_proc_executor.cjs +6 -3
  197. package/dist/ipc/inference_proc_executor.cjs.map +1 -1
  198. package/dist/ipc/inference_proc_executor.d.ts.map +1 -1
  199. package/dist/ipc/inference_proc_executor.js +6 -3
  200. package/dist/ipc/inference_proc_executor.js.map +1 -1
  201. package/dist/ipc/inference_proc_lazy_main.cjs +13 -1
  202. package/dist/ipc/inference_proc_lazy_main.cjs.map +1 -1
  203. package/dist/ipc/inference_proc_lazy_main.js +13 -1
  204. package/dist/ipc/inference_proc_lazy_main.js.map +1 -1
  205. package/dist/ipc/job_proc_executor.cjs +6 -1
  206. package/dist/ipc/job_proc_executor.cjs.map +1 -1
  207. package/dist/ipc/job_proc_executor.d.ts.map +1 -1
  208. package/dist/ipc/job_proc_executor.js +6 -1
  209. package/dist/ipc/job_proc_executor.js.map +1 -1
  210. package/dist/ipc/job_proc_lazy_main.cjs +89 -17
  211. package/dist/ipc/job_proc_lazy_main.cjs.map +1 -1
  212. package/dist/ipc/job_proc_lazy_main.js +68 -18
  213. package/dist/ipc/job_proc_lazy_main.js.map +1 -1
  214. package/dist/ipc/supervised_proc.cjs +34 -8
  215. package/dist/ipc/supervised_proc.cjs.map +1 -1
  216. package/dist/ipc/supervised_proc.d.cts +8 -0
  217. package/dist/ipc/supervised_proc.d.ts +8 -0
  218. package/dist/ipc/supervised_proc.d.ts.map +1 -1
  219. package/dist/ipc/supervised_proc.js +34 -8
  220. package/dist/ipc/supervised_proc.js.map +1 -1
  221. package/dist/ipc/supervised_proc.test.cjs +145 -0
  222. package/dist/ipc/supervised_proc.test.cjs.map +1 -0
  223. package/dist/ipc/supervised_proc.test.js +122 -0
  224. package/dist/ipc/supervised_proc.test.js.map +1 -0
  225. package/dist/job.cjs +109 -1
  226. package/dist/job.cjs.map +1 -1
  227. package/dist/job.d.cts +14 -0
  228. package/dist/job.d.ts +14 -0
  229. package/dist/job.d.ts.map +1 -1
  230. package/dist/job.js +99 -1
  231. package/dist/job.js.map +1 -1
  232. package/dist/language.cjs +394 -0
  233. package/dist/language.cjs.map +1 -0
  234. package/dist/language.d.cts +15 -0
  235. package/dist/language.d.ts +15 -0
  236. package/dist/language.d.ts.map +1 -0
  237. package/dist/language.js +363 -0
  238. package/dist/language.js.map +1 -0
  239. package/dist/language.test.cjs +43 -0
  240. package/dist/language.test.cjs.map +1 -0
  241. package/dist/language.test.js +49 -0
  242. package/dist/language.test.js.map +1 -0
  243. package/dist/llm/chat_context.cjs +274 -3
  244. package/dist/llm/chat_context.cjs.map +1 -1
  245. package/dist/llm/chat_context.d.cts +86 -2
  246. package/dist/llm/chat_context.d.ts +86 -2
  247. package/dist/llm/chat_context.d.ts.map +1 -1
  248. package/dist/llm/chat_context.js +273 -3
  249. package/dist/llm/chat_context.js.map +1 -1
  250. package/dist/llm/chat_context.test.cjs +574 -0
  251. package/dist/llm/chat_context.test.cjs.map +1 -1
  252. package/dist/llm/chat_context.test.js +574 -0
  253. package/dist/llm/chat_context.test.js.map +1 -1
  254. package/dist/llm/fallback_adapter.cjs +278 -0
  255. package/dist/llm/fallback_adapter.cjs.map +1 -0
  256. package/dist/llm/fallback_adapter.d.cts +73 -0
  257. package/dist/llm/fallback_adapter.d.ts +73 -0
  258. package/dist/llm/fallback_adapter.d.ts.map +1 -0
  259. package/dist/llm/fallback_adapter.js +254 -0
  260. package/dist/llm/fallback_adapter.js.map +1 -0
  261. package/dist/llm/fallback_adapter.test.cjs +176 -0
  262. package/dist/llm/fallback_adapter.test.cjs.map +1 -0
  263. package/dist/llm/fallback_adapter.test.js +175 -0
  264. package/dist/llm/fallback_adapter.test.js.map +1 -0
  265. package/dist/llm/index.cjs +9 -0
  266. package/dist/llm/index.cjs.map +1 -1
  267. package/dist/llm/index.d.cts +4 -3
  268. package/dist/llm/index.d.ts +4 -3
  269. package/dist/llm/index.d.ts.map +1 -1
  270. package/dist/llm/index.js +11 -1
  271. package/dist/llm/index.js.map +1 -1
  272. package/dist/llm/llm.cjs +65 -11
  273. package/dist/llm/llm.cjs.map +1 -1
  274. package/dist/llm/llm.d.cts +13 -2
  275. package/dist/llm/llm.d.ts +13 -2
  276. package/dist/llm/llm.d.ts.map +1 -1
  277. package/dist/llm/llm.js +65 -11
  278. package/dist/llm/llm.js.map +1 -1
  279. package/dist/llm/provider_format/google.cjs +6 -2
  280. package/dist/llm/provider_format/google.cjs.map +1 -1
  281. package/dist/llm/provider_format/google.d.cts +1 -1
  282. package/dist/llm/provider_format/google.d.ts +1 -1
  283. package/dist/llm/provider_format/google.d.ts.map +1 -1
  284. package/dist/llm/provider_format/google.js +6 -2
  285. package/dist/llm/provider_format/google.js.map +1 -1
  286. package/dist/llm/provider_format/google.test.cjs +48 -0
  287. package/dist/llm/provider_format/google.test.cjs.map +1 -1
  288. package/dist/llm/provider_format/google.test.js +54 -1
  289. package/dist/llm/provider_format/google.test.js.map +1 -1
  290. package/dist/llm/provider_format/index.cjs +2 -0
  291. package/dist/llm/provider_format/index.cjs.map +1 -1
  292. package/dist/llm/provider_format/index.d.cts +2 -2
  293. package/dist/llm/provider_format/index.d.ts +2 -2
  294. package/dist/llm/provider_format/index.d.ts.map +1 -1
  295. package/dist/llm/provider_format/index.js +6 -1
  296. package/dist/llm/provider_format/index.js.map +1 -1
  297. package/dist/llm/provider_format/openai.cjs +126 -24
  298. package/dist/llm/provider_format/openai.cjs.map +1 -1
  299. package/dist/llm/provider_format/openai.d.cts +1 -0
  300. package/dist/llm/provider_format/openai.d.ts +1 -0
  301. package/dist/llm/provider_format/openai.d.ts.map +1 -1
  302. package/dist/llm/provider_format/openai.js +124 -23
  303. package/dist/llm/provider_format/openai.js.map +1 -1
  304. package/dist/llm/provider_format/openai.test.cjs +393 -0
  305. package/dist/llm/provider_format/openai.test.cjs.map +1 -1
  306. package/dist/llm/provider_format/openai.test.js +400 -2
  307. package/dist/llm/provider_format/openai.test.js.map +1 -1
  308. package/dist/llm/provider_format/utils.cjs +5 -4
  309. package/dist/llm/provider_format/utils.cjs.map +1 -1
  310. package/dist/llm/provider_format/utils.d.ts.map +1 -1
  311. package/dist/llm/provider_format/utils.js +5 -4
  312. package/dist/llm/provider_format/utils.js.map +1 -1
  313. package/dist/llm/realtime.cjs +3 -0
  314. package/dist/llm/realtime.cjs.map +1 -1
  315. package/dist/llm/realtime.d.cts +15 -1
  316. package/dist/llm/realtime.d.ts +15 -1
  317. package/dist/llm/realtime.d.ts.map +1 -1
  318. package/dist/llm/realtime.js +3 -0
  319. package/dist/llm/realtime.js.map +1 -1
  320. package/dist/llm/remote_chat_context.cjs.map +1 -1
  321. package/dist/llm/remote_chat_context.d.cts +2 -0
  322. package/dist/llm/remote_chat_context.d.ts +2 -0
  323. package/dist/llm/remote_chat_context.d.ts.map +1 -1
  324. package/dist/llm/remote_chat_context.js.map +1 -1
  325. package/dist/llm/tool_context.cjs +50 -2
  326. package/dist/llm/tool_context.cjs.map +1 -1
  327. package/dist/llm/tool_context.d.cts +47 -11
  328. package/dist/llm/tool_context.d.ts +47 -11
  329. package/dist/llm/tool_context.d.ts.map +1 -1
  330. package/dist/llm/tool_context.js +48 -3
  331. package/dist/llm/tool_context.js.map +1 -1
  332. package/dist/llm/tool_context.test.cjs +197 -0
  333. package/dist/llm/tool_context.test.cjs.map +1 -1
  334. package/dist/llm/tool_context.test.js +175 -0
  335. package/dist/llm/tool_context.test.js.map +1 -1
  336. package/dist/llm/utils.cjs +18 -12
  337. package/dist/llm/utils.cjs.map +1 -1
  338. package/dist/llm/utils.d.cts +2 -3
  339. package/dist/llm/utils.d.ts +2 -3
  340. package/dist/llm/utils.d.ts.map +1 -1
  341. package/dist/llm/utils.js +18 -12
  342. package/dist/llm/utils.js.map +1 -1
  343. package/dist/llm/zod-utils.cjs +102 -0
  344. package/dist/llm/zod-utils.cjs.map +1 -0
  345. package/dist/llm/zod-utils.d.cts +65 -0
  346. package/dist/llm/zod-utils.d.ts +65 -0
  347. package/dist/llm/zod-utils.d.ts.map +1 -0
  348. package/dist/llm/zod-utils.js +64 -0
  349. package/dist/llm/zod-utils.js.map +1 -0
  350. package/dist/llm/zod-utils.test.cjs +472 -0
  351. package/dist/llm/zod-utils.test.cjs.map +1 -0
  352. package/dist/llm/zod-utils.test.js +455 -0
  353. package/dist/llm/zod-utils.test.js.map +1 -0
  354. package/dist/log.cjs +45 -14
  355. package/dist/log.cjs.map +1 -1
  356. package/dist/log.d.cts +8 -1
  357. package/dist/log.d.ts +8 -1
  358. package/dist/log.d.ts.map +1 -1
  359. package/dist/log.js +45 -15
  360. package/dist/log.js.map +1 -1
  361. package/dist/metrics/base.cjs.map +1 -1
  362. package/dist/metrics/base.d.cts +75 -19
  363. package/dist/metrics/base.d.ts +75 -19
  364. package/dist/metrics/base.d.ts.map +1 -1
  365. package/dist/metrics/index.cjs +5 -0
  366. package/dist/metrics/index.cjs.map +1 -1
  367. package/dist/metrics/index.d.cts +2 -1
  368. package/dist/metrics/index.d.ts +2 -1
  369. package/dist/metrics/index.d.ts.map +1 -1
  370. package/dist/metrics/index.js +6 -0
  371. package/dist/metrics/index.js.map +1 -1
  372. package/dist/metrics/model_usage.cjs +189 -0
  373. package/dist/metrics/model_usage.cjs.map +1 -0
  374. package/dist/metrics/model_usage.d.cts +92 -0
  375. package/dist/metrics/model_usage.d.ts +92 -0
  376. package/dist/metrics/model_usage.d.ts.map +1 -0
  377. package/dist/metrics/model_usage.js +164 -0
  378. package/dist/metrics/model_usage.js.map +1 -0
  379. package/dist/metrics/model_usage.test.cjs +474 -0
  380. package/dist/metrics/model_usage.test.cjs.map +1 -0
  381. package/dist/metrics/model_usage.test.js +476 -0
  382. package/dist/metrics/model_usage.test.js.map +1 -0
  383. package/dist/metrics/usage_collector.cjs +5 -2
  384. package/dist/metrics/usage_collector.cjs.map +1 -1
  385. package/dist/metrics/usage_collector.d.cts +10 -1
  386. package/dist/metrics/usage_collector.d.ts +10 -1
  387. package/dist/metrics/usage_collector.d.ts.map +1 -1
  388. package/dist/metrics/usage_collector.js +5 -2
  389. package/dist/metrics/usage_collector.js.map +1 -1
  390. package/dist/metrics/utils.cjs +23 -7
  391. package/dist/metrics/utils.cjs.map +1 -1
  392. package/dist/metrics/utils.d.ts.map +1 -1
  393. package/dist/metrics/utils.js +23 -7
  394. package/dist/metrics/utils.js.map +1 -1
  395. package/dist/stream/deferred_stream.cjs +31 -10
  396. package/dist/stream/deferred_stream.cjs.map +1 -1
  397. package/dist/stream/deferred_stream.d.cts +6 -1
  398. package/dist/stream/deferred_stream.d.ts +6 -1
  399. package/dist/stream/deferred_stream.d.ts.map +1 -1
  400. package/dist/stream/deferred_stream.js +31 -10
  401. package/dist/stream/deferred_stream.js.map +1 -1
  402. package/dist/stream/deferred_stream.test.cjs +2 -2
  403. package/dist/stream/deferred_stream.test.cjs.map +1 -1
  404. package/dist/stream/deferred_stream.test.js +2 -2
  405. package/dist/stream/deferred_stream.test.js.map +1 -1
  406. package/dist/stream/index.cjs +3 -0
  407. package/dist/stream/index.cjs.map +1 -1
  408. package/dist/stream/index.d.cts +1 -0
  409. package/dist/stream/index.d.ts +1 -0
  410. package/dist/stream/index.d.ts.map +1 -1
  411. package/dist/stream/index.js +2 -0
  412. package/dist/stream/index.js.map +1 -1
  413. package/dist/stream/multi_input_stream.cjs +139 -0
  414. package/dist/stream/multi_input_stream.cjs.map +1 -0
  415. package/dist/stream/multi_input_stream.d.cts +55 -0
  416. package/dist/stream/multi_input_stream.d.ts +55 -0
  417. package/dist/stream/multi_input_stream.d.ts.map +1 -0
  418. package/dist/stream/multi_input_stream.js +115 -0
  419. package/dist/stream/multi_input_stream.js.map +1 -0
  420. package/dist/stream/multi_input_stream.test.cjs +344 -0
  421. package/dist/stream/multi_input_stream.test.cjs.map +1 -0
  422. package/dist/stream/multi_input_stream.test.js +343 -0
  423. package/dist/stream/multi_input_stream.test.js.map +1 -0
  424. package/dist/stream/stream_channel.cjs +39 -1
  425. package/dist/stream/stream_channel.cjs.map +1 -1
  426. package/dist/stream/stream_channel.d.cts +5 -2
  427. package/dist/stream/stream_channel.d.ts +5 -2
  428. package/dist/stream/stream_channel.d.ts.map +1 -1
  429. package/dist/stream/stream_channel.js +39 -1
  430. package/dist/stream/stream_channel.js.map +1 -1
  431. package/dist/stream/stream_channel.test.cjs +27 -0
  432. package/dist/stream/stream_channel.test.cjs.map +1 -1
  433. package/dist/stream/stream_channel.test.js +27 -0
  434. package/dist/stream/stream_channel.test.js.map +1 -1
  435. package/dist/stt/stream_adapter.cjs +24 -9
  436. package/dist/stt/stream_adapter.cjs.map +1 -1
  437. package/dist/stt/stream_adapter.d.cts +7 -3
  438. package/dist/stt/stream_adapter.d.ts +7 -3
  439. package/dist/stt/stream_adapter.d.ts.map +1 -1
  440. package/dist/stt/stream_adapter.js +24 -9
  441. package/dist/stt/stream_adapter.js.map +1 -1
  442. package/dist/stt/stt.cjs +86 -19
  443. package/dist/stt/stt.cjs.map +1 -1
  444. package/dist/stt/stt.d.cts +60 -5
  445. package/dist/stt/stt.d.ts +60 -5
  446. package/dist/stt/stt.d.ts.map +1 -1
  447. package/dist/stt/stt.js +88 -21
  448. package/dist/stt/stt.js.map +1 -1
  449. package/dist/telemetry/index.cjs +72 -0
  450. package/dist/telemetry/index.cjs.map +1 -0
  451. package/dist/telemetry/index.d.cts +7 -0
  452. package/dist/telemetry/index.d.ts +7 -0
  453. package/dist/telemetry/index.d.ts.map +1 -0
  454. package/dist/telemetry/index.js +37 -0
  455. package/dist/telemetry/index.js.map +1 -0
  456. package/dist/telemetry/logging.cjs +65 -0
  457. package/dist/telemetry/logging.cjs.map +1 -0
  458. package/dist/telemetry/logging.d.cts +21 -0
  459. package/dist/telemetry/logging.d.ts +21 -0
  460. package/dist/telemetry/logging.d.ts.map +1 -0
  461. package/dist/telemetry/logging.js +40 -0
  462. package/dist/telemetry/logging.js.map +1 -0
  463. package/dist/telemetry/otel_http_exporter.cjs +166 -0
  464. package/dist/telemetry/otel_http_exporter.cjs.map +1 -0
  465. package/dist/telemetry/otel_http_exporter.d.cts +63 -0
  466. package/dist/telemetry/otel_http_exporter.d.ts +63 -0
  467. package/dist/telemetry/otel_http_exporter.d.ts.map +1 -0
  468. package/dist/telemetry/otel_http_exporter.js +142 -0
  469. package/dist/telemetry/otel_http_exporter.js.map +1 -0
  470. package/dist/telemetry/pino_otel_transport.cjs +217 -0
  471. package/dist/telemetry/pino_otel_transport.cjs.map +1 -0
  472. package/dist/telemetry/pino_otel_transport.d.cts +58 -0
  473. package/dist/telemetry/pino_otel_transport.d.ts +58 -0
  474. package/dist/telemetry/pino_otel_transport.d.ts.map +1 -0
  475. package/dist/telemetry/pino_otel_transport.js +189 -0
  476. package/dist/telemetry/pino_otel_transport.js.map +1 -0
  477. package/dist/telemetry/trace_types.cjs +233 -0
  478. package/dist/telemetry/trace_types.cjs.map +1 -0
  479. package/dist/telemetry/trace_types.d.cts +74 -0
  480. package/dist/telemetry/trace_types.d.ts +74 -0
  481. package/dist/telemetry/trace_types.d.ts.map +1 -0
  482. package/dist/telemetry/trace_types.js +141 -0
  483. package/dist/telemetry/trace_types.js.map +1 -0
  484. package/dist/telemetry/traces.cjs +484 -0
  485. package/dist/telemetry/traces.cjs.map +1 -0
  486. package/dist/telemetry/traces.d.cts +116 -0
  487. package/dist/telemetry/traces.d.ts +116 -0
  488. package/dist/telemetry/traces.d.ts.map +1 -0
  489. package/dist/telemetry/traces.js +449 -0
  490. package/dist/telemetry/traces.js.map +1 -0
  491. package/dist/telemetry/utils.cjs +86 -0
  492. package/dist/telemetry/utils.cjs.map +1 -0
  493. package/dist/telemetry/utils.d.cts +5 -0
  494. package/dist/telemetry/utils.d.ts +5 -0
  495. package/dist/telemetry/utils.d.ts.map +1 -0
  496. package/dist/telemetry/utils.js +51 -0
  497. package/dist/telemetry/utils.js.map +1 -0
  498. package/dist/tokenize/basic/sentence.cjs +3 -3
  499. package/dist/tokenize/basic/sentence.cjs.map +1 -1
  500. package/dist/tokenize/basic/sentence.js +3 -3
  501. package/dist/tokenize/basic/sentence.js.map +1 -1
  502. package/dist/tokenize/tokenizer.test.cjs +3 -1
  503. package/dist/tokenize/tokenizer.test.cjs.map +1 -1
  504. package/dist/tokenize/tokenizer.test.js +3 -1
  505. package/dist/tokenize/tokenizer.test.js.map +1 -1
  506. package/dist/transcription.cjs.map +1 -1
  507. package/dist/transcription.d.cts +6 -0
  508. package/dist/transcription.d.ts +6 -0
  509. package/dist/transcription.d.ts.map +1 -1
  510. package/dist/transcription.js.map +1 -1
  511. package/dist/tts/fallback_adapter.cjs +466 -0
  512. package/dist/tts/fallback_adapter.cjs.map +1 -0
  513. package/dist/tts/fallback_adapter.d.cts +110 -0
  514. package/dist/tts/fallback_adapter.d.ts +110 -0
  515. package/dist/tts/fallback_adapter.d.ts.map +1 -0
  516. package/dist/tts/fallback_adapter.js +442 -0
  517. package/dist/tts/fallback_adapter.js.map +1 -0
  518. package/dist/tts/index.cjs +3 -0
  519. package/dist/tts/index.cjs.map +1 -1
  520. package/dist/tts/index.d.cts +1 -0
  521. package/dist/tts/index.d.ts +1 -0
  522. package/dist/tts/index.d.ts.map +1 -1
  523. package/dist/tts/index.js +2 -0
  524. package/dist/tts/index.js.map +1 -1
  525. package/dist/tts/stream_adapter.cjs +25 -8
  526. package/dist/tts/stream_adapter.cjs.map +1 -1
  527. package/dist/tts/stream_adapter.d.cts +6 -3
  528. package/dist/tts/stream_adapter.d.ts +6 -3
  529. package/dist/tts/stream_adapter.d.ts.map +1 -1
  530. package/dist/tts/stream_adapter.js +25 -8
  531. package/dist/tts/stream_adapter.js.map +1 -1
  532. package/dist/tts/tts.cjs +189 -57
  533. package/dist/tts/tts.cjs.map +1 -1
  534. package/dist/tts/tts.d.cts +58 -6
  535. package/dist/tts/tts.d.ts +58 -6
  536. package/dist/tts/tts.d.ts.map +1 -1
  537. package/dist/tts/tts.js +191 -59
  538. package/dist/tts/tts.js.map +1 -1
  539. package/dist/types.cjs +24 -32
  540. package/dist/types.cjs.map +1 -1
  541. package/dist/types.d.cts +45 -10
  542. package/dist/types.d.ts +45 -10
  543. package/dist/types.d.ts.map +1 -1
  544. package/dist/types.js +20 -30
  545. package/dist/types.js.map +1 -1
  546. package/dist/utils.cjs +122 -26
  547. package/dist/utils.cjs.map +1 -1
  548. package/dist/utils.d.cts +41 -1
  549. package/dist/utils.d.ts +41 -1
  550. package/dist/utils.d.ts.map +1 -1
  551. package/dist/utils.js +117 -25
  552. package/dist/utils.js.map +1 -1
  553. package/dist/utils.test.cjs +73 -1
  554. package/dist/utils.test.cjs.map +1 -1
  555. package/dist/utils.test.js +74 -10
  556. package/dist/utils.test.js.map +1 -1
  557. package/dist/vad.cjs +35 -15
  558. package/dist/vad.cjs.map +1 -1
  559. package/dist/vad.d.cts +15 -5
  560. package/dist/vad.d.ts +15 -5
  561. package/dist/vad.d.ts.map +1 -1
  562. package/dist/vad.js +35 -15
  563. package/dist/vad.js.map +1 -1
  564. package/dist/version.cjs +1 -1
  565. package/dist/version.cjs.map +1 -1
  566. package/dist/version.d.cts +1 -1
  567. package/dist/version.d.ts +1 -1
  568. package/dist/version.d.ts.map +1 -1
  569. package/dist/version.js +1 -1
  570. package/dist/version.js.map +1 -1
  571. package/dist/voice/agent.cjs +258 -35
  572. package/dist/voice/agent.cjs.map +1 -1
  573. package/dist/voice/agent.d.cts +54 -13
  574. package/dist/voice/agent.d.ts +54 -13
  575. package/dist/voice/agent.d.ts.map +1 -1
  576. package/dist/voice/agent.js +254 -34
  577. package/dist/voice/agent.js.map +1 -1
  578. package/dist/voice/agent.test.cjs +314 -0
  579. package/dist/voice/agent.test.cjs.map +1 -1
  580. package/dist/voice/agent.test.js +316 -2
  581. package/dist/voice/agent.test.js.map +1 -1
  582. package/dist/voice/agent_activity.cjs +1116 -385
  583. package/dist/voice/agent_activity.cjs.map +1 -1
  584. package/dist/voice/agent_activity.d.cts +72 -11
  585. package/dist/voice/agent_activity.d.ts +72 -11
  586. package/dist/voice/agent_activity.d.ts.map +1 -1
  587. package/dist/voice/agent_activity.js +1119 -383
  588. package/dist/voice/agent_activity.js.map +1 -1
  589. package/dist/voice/agent_activity.test.cjs +135 -0
  590. package/dist/voice/agent_activity.test.cjs.map +1 -0
  591. package/dist/voice/agent_activity.test.js +134 -0
  592. package/dist/voice/agent_activity.test.js.map +1 -0
  593. package/dist/voice/agent_session.cjs +550 -90
  594. package/dist/voice/agent_session.cjs.map +1 -1
  595. package/dist/voice/agent_session.d.cts +185 -25
  596. package/dist/voice/agent_session.d.ts +185 -25
  597. package/dist/voice/agent_session.d.ts.map +1 -1
  598. package/dist/voice/agent_session.js +556 -91
  599. package/dist/voice/agent_session.js.map +1 -1
  600. package/dist/voice/audio_recognition.cjs +605 -46
  601. package/dist/voice/audio_recognition.cjs.map +1 -1
  602. package/dist/voice/audio_recognition.d.cts +96 -4
  603. package/dist/voice/audio_recognition.d.ts +96 -4
  604. package/dist/voice/audio_recognition.d.ts.map +1 -1
  605. package/dist/voice/audio_recognition.js +611 -47
  606. package/dist/voice/audio_recognition.js.map +1 -1
  607. package/dist/voice/audio_recognition_span.test.cjs +295 -0
  608. package/dist/voice/audio_recognition_span.test.cjs.map +1 -0
  609. package/dist/voice/audio_recognition_span.test.js +299 -0
  610. package/dist/voice/audio_recognition_span.test.js.map +1 -0
  611. package/dist/voice/avatar/datastream_io.cjs +7 -1
  612. package/dist/voice/avatar/datastream_io.cjs.map +1 -1
  613. package/dist/voice/avatar/datastream_io.d.cts +1 -0
  614. package/dist/voice/avatar/datastream_io.d.ts +1 -0
  615. package/dist/voice/avatar/datastream_io.d.ts.map +1 -1
  616. package/dist/voice/avatar/datastream_io.js +7 -1
  617. package/dist/voice/avatar/datastream_io.js.map +1 -1
  618. package/dist/voice/background_audio.cjs +367 -0
  619. package/dist/voice/background_audio.cjs.map +1 -0
  620. package/dist/voice/background_audio.d.cts +123 -0
  621. package/dist/voice/background_audio.d.ts +123 -0
  622. package/dist/voice/background_audio.d.ts.map +1 -0
  623. package/dist/voice/background_audio.js +343 -0
  624. package/dist/voice/background_audio.js.map +1 -0
  625. package/dist/voice/events.cjs +3 -0
  626. package/dist/voice/events.cjs.map +1 -1
  627. package/dist/voice/events.d.cts +16 -9
  628. package/dist/voice/events.d.ts +16 -9
  629. package/dist/voice/events.d.ts.map +1 -1
  630. package/dist/voice/events.js +3 -0
  631. package/dist/voice/events.js.map +1 -1
  632. package/dist/voice/generation.cjs +205 -41
  633. package/dist/voice/generation.cjs.map +1 -1
  634. package/dist/voice/generation.d.cts +21 -5
  635. package/dist/voice/generation.d.ts +21 -5
  636. package/dist/voice/generation.d.ts.map +1 -1
  637. package/dist/voice/generation.js +215 -43
  638. package/dist/voice/generation.js.map +1 -1
  639. package/dist/voice/generation_tools.test.cjs +236 -0
  640. package/dist/voice/generation_tools.test.cjs.map +1 -0
  641. package/dist/voice/generation_tools.test.js +235 -0
  642. package/dist/voice/generation_tools.test.js.map +1 -0
  643. package/dist/voice/index.cjs +33 -2
  644. package/dist/voice/index.cjs.map +1 -1
  645. package/dist/voice/index.d.cts +8 -2
  646. package/dist/voice/index.d.ts +8 -2
  647. package/dist/voice/index.d.ts.map +1 -1
  648. package/dist/voice/index.js +19 -2
  649. package/dist/voice/index.js.map +1 -1
  650. package/dist/voice/interruption_detection.test.cjs +114 -0
  651. package/dist/voice/interruption_detection.test.cjs.map +1 -0
  652. package/dist/voice/interruption_detection.test.js +113 -0
  653. package/dist/voice/interruption_detection.test.js.map +1 -0
  654. package/dist/voice/io.cjs +66 -6
  655. package/dist/voice/io.cjs.map +1 -1
  656. package/dist/voice/io.d.cts +67 -7
  657. package/dist/voice/io.d.ts +67 -7
  658. package/dist/voice/io.d.ts.map +1 -1
  659. package/dist/voice/io.js +62 -5
  660. package/dist/voice/io.js.map +1 -1
  661. package/dist/voice/recorder_io/index.cjs +23 -0
  662. package/dist/voice/recorder_io/index.cjs.map +1 -0
  663. package/dist/voice/recorder_io/index.d.cts +2 -0
  664. package/dist/voice/recorder_io/index.d.ts +2 -0
  665. package/dist/voice/recorder_io/index.d.ts.map +1 -0
  666. package/dist/voice/recorder_io/index.js +2 -0
  667. package/dist/voice/recorder_io/index.js.map +1 -0
  668. package/dist/voice/recorder_io/recorder_io.cjs +607 -0
  669. package/dist/voice/recorder_io/recorder_io.cjs.map +1 -0
  670. package/dist/voice/recorder_io/recorder_io.d.cts +106 -0
  671. package/dist/voice/recorder_io/recorder_io.d.ts +106 -0
  672. package/dist/voice/recorder_io/recorder_io.d.ts.map +1 -0
  673. package/dist/voice/recorder_io/recorder_io.js +573 -0
  674. package/dist/voice/recorder_io/recorder_io.js.map +1 -0
  675. package/dist/voice/remote_session.cjs +922 -0
  676. package/dist/voice/remote_session.cjs.map +1 -0
  677. package/dist/voice/remote_session.d.cts +108 -0
  678. package/dist/voice/remote_session.d.ts +108 -0
  679. package/dist/voice/remote_session.d.ts.map +1 -0
  680. package/dist/voice/remote_session.js +887 -0
  681. package/dist/voice/remote_session.js.map +1 -0
  682. package/dist/voice/report.cjs +88 -0
  683. package/dist/voice/report.cjs.map +1 -0
  684. package/dist/voice/report.d.cts +49 -0
  685. package/dist/voice/report.d.ts +49 -0
  686. package/dist/voice/report.d.ts.map +1 -0
  687. package/dist/voice/report.js +63 -0
  688. package/dist/voice/report.js.map +1 -0
  689. package/dist/voice/report.test.cjs +121 -0
  690. package/dist/voice/report.test.cjs.map +1 -0
  691. package/dist/voice/report.test.js +120 -0
  692. package/dist/voice/report.test.js.map +1 -0
  693. package/dist/voice/room_io/_input.cjs +40 -7
  694. package/dist/voice/room_io/_input.cjs.map +1 -1
  695. package/dist/voice/room_io/_input.d.cts +5 -2
  696. package/dist/voice/room_io/_input.d.ts +5 -2
  697. package/dist/voice/room_io/_input.d.ts.map +1 -1
  698. package/dist/voice/room_io/_input.js +41 -8
  699. package/dist/voice/room_io/_input.js.map +1 -1
  700. package/dist/voice/room_io/_output.cjs +19 -11
  701. package/dist/voice/room_io/_output.cjs.map +1 -1
  702. package/dist/voice/room_io/_output.d.cts +7 -4
  703. package/dist/voice/room_io/_output.d.ts +7 -4
  704. package/dist/voice/room_io/_output.d.ts.map +1 -1
  705. package/dist/voice/room_io/_output.js +20 -12
  706. package/dist/voice/room_io/_output.js.map +1 -1
  707. package/dist/voice/room_io/room_io.cjs +33 -6
  708. package/dist/voice/room_io/room_io.cjs.map +1 -1
  709. package/dist/voice/room_io/room_io.d.cts +29 -9
  710. package/dist/voice/room_io/room_io.d.ts +29 -9
  711. package/dist/voice/room_io/room_io.d.ts.map +1 -1
  712. package/dist/voice/room_io/room_io.js +33 -7
  713. package/dist/voice/room_io/room_io.js.map +1 -1
  714. package/dist/voice/speech_handle.cjs +22 -4
  715. package/dist/voice/speech_handle.cjs.map +1 -1
  716. package/dist/voice/speech_handle.d.cts +17 -2
  717. package/dist/voice/speech_handle.d.ts +17 -2
  718. package/dist/voice/speech_handle.d.ts.map +1 -1
  719. package/dist/voice/speech_handle.js +21 -4
  720. package/dist/voice/speech_handle.js.map +1 -1
  721. package/dist/voice/testing/fake_llm.cjs +127 -0
  722. package/dist/voice/testing/fake_llm.cjs.map +1 -0
  723. package/dist/voice/testing/fake_llm.d.cts +30 -0
  724. package/dist/voice/testing/fake_llm.d.ts +30 -0
  725. package/dist/voice/testing/fake_llm.d.ts.map +1 -0
  726. package/dist/voice/testing/fake_llm.js +103 -0
  727. package/dist/voice/testing/fake_llm.js.map +1 -0
  728. package/dist/voice/testing/index.cjs +57 -0
  729. package/dist/voice/testing/index.cjs.map +1 -0
  730. package/dist/voice/testing/index.d.cts +21 -0
  731. package/dist/voice/testing/index.d.ts +21 -0
  732. package/dist/voice/testing/index.d.ts.map +1 -0
  733. package/dist/voice/testing/index.js +35 -0
  734. package/dist/voice/testing/index.js.map +1 -0
  735. package/dist/voice/testing/run_result.cjs +817 -0
  736. package/dist/voice/testing/run_result.cjs.map +1 -0
  737. package/dist/voice/testing/run_result.d.cts +385 -0
  738. package/dist/voice/testing/run_result.d.ts +385 -0
  739. package/dist/voice/testing/run_result.d.ts.map +1 -0
  740. package/dist/voice/testing/run_result.js +790 -0
  741. package/dist/voice/testing/run_result.js.map +1 -0
  742. package/dist/voice/testing/types.cjs +46 -0
  743. package/dist/voice/testing/types.cjs.map +1 -0
  744. package/dist/voice/testing/types.d.cts +83 -0
  745. package/dist/voice/testing/types.d.ts +83 -0
  746. package/dist/voice/testing/types.d.ts.map +1 -0
  747. package/dist/voice/testing/types.js +19 -0
  748. package/dist/voice/testing/types.js.map +1 -0
  749. package/dist/voice/transcription/synchronizer.cjs +139 -15
  750. package/dist/voice/transcription/synchronizer.cjs.map +1 -1
  751. package/dist/voice/transcription/synchronizer.d.cts +35 -4
  752. package/dist/voice/transcription/synchronizer.d.ts +35 -4
  753. package/dist/voice/transcription/synchronizer.d.ts.map +1 -1
  754. package/dist/voice/transcription/synchronizer.js +143 -16
  755. package/dist/voice/transcription/synchronizer.js.map +1 -1
  756. package/dist/voice/transcription/synchronizer.test.cjs +151 -0
  757. package/dist/voice/transcription/synchronizer.test.cjs.map +1 -0
  758. package/dist/voice/transcription/synchronizer.test.js +150 -0
  759. package/dist/voice/transcription/synchronizer.test.js.map +1 -0
  760. package/dist/voice/turn_config/endpointing.cjs +33 -0
  761. package/dist/voice/turn_config/endpointing.cjs.map +1 -0
  762. package/dist/voice/turn_config/endpointing.d.cts +30 -0
  763. package/dist/voice/turn_config/endpointing.d.ts +30 -0
  764. package/dist/voice/turn_config/endpointing.d.ts.map +1 -0
  765. package/dist/voice/turn_config/endpointing.js +9 -0
  766. package/dist/voice/turn_config/endpointing.js.map +1 -0
  767. package/dist/voice/turn_config/interruption.cjs +37 -0
  768. package/dist/voice/turn_config/interruption.cjs.map +1 -0
  769. package/dist/voice/turn_config/interruption.d.cts +53 -0
  770. package/dist/voice/turn_config/interruption.d.ts +53 -0
  771. package/dist/voice/turn_config/interruption.d.ts.map +1 -0
  772. package/dist/voice/turn_config/interruption.js +13 -0
  773. package/dist/voice/turn_config/interruption.js.map +1 -0
  774. package/dist/voice/turn_config/turn_handling.cjs +35 -0
  775. package/dist/voice/turn_config/turn_handling.cjs.map +1 -0
  776. package/dist/voice/turn_config/turn_handling.d.cts +36 -0
  777. package/dist/voice/turn_config/turn_handling.d.ts +36 -0
  778. package/dist/voice/turn_config/turn_handling.d.ts.map +1 -0
  779. package/dist/voice/turn_config/turn_handling.js +11 -0
  780. package/dist/voice/turn_config/turn_handling.js.map +1 -0
  781. package/dist/voice/turn_config/utils.cjs +157 -0
  782. package/dist/voice/turn_config/utils.cjs.map +1 -0
  783. package/dist/voice/turn_config/utils.d.cts +37 -0
  784. package/dist/voice/turn_config/utils.d.ts +37 -0
  785. package/dist/voice/turn_config/utils.d.ts.map +1 -0
  786. package/dist/voice/turn_config/utils.js +131 -0
  787. package/dist/voice/turn_config/utils.js.map +1 -0
  788. package/dist/voice/turn_config/utils.test.cjs +128 -0
  789. package/dist/voice/turn_config/utils.test.cjs.map +1 -0
  790. package/dist/voice/turn_config/utils.test.js +127 -0
  791. package/dist/voice/turn_config/utils.test.js.map +1 -0
  792. package/dist/voice/utils.cjs +47 -0
  793. package/dist/voice/utils.cjs.map +1 -0
  794. package/dist/voice/utils.d.cts +4 -0
  795. package/dist/voice/utils.d.ts +4 -0
  796. package/dist/voice/utils.d.ts.map +1 -0
  797. package/dist/voice/utils.js +23 -0
  798. package/dist/voice/utils.js.map +1 -0
  799. package/dist/worker.cjs +44 -52
  800. package/dist/worker.cjs.map +1 -1
  801. package/dist/worker.d.cts +18 -8
  802. package/dist/worker.d.ts +18 -8
  803. package/dist/worker.d.ts.map +1 -1
  804. package/dist/worker.js +43 -43
  805. package/dist/worker.js.map +1 -1
  806. package/package.json +32 -12
  807. package/resources/NOTICE +2 -0
  808. package/resources/keyboard-typing.ogg +0 -0
  809. package/resources/keyboard-typing2.ogg +0 -0
  810. package/resources/office-ambience.ogg +0 -0
  811. package/src/audio.ts +132 -1
  812. package/src/beta/index.ts +9 -0
  813. package/src/beta/workflows/index.ts +9 -0
  814. package/src/beta/workflows/task_group.ts +194 -0
  815. package/src/cli.ts +57 -66
  816. package/src/connection_pool.test.ts +346 -0
  817. package/src/connection_pool.ts +307 -0
  818. package/src/constants.ts +14 -0
  819. package/src/cpu.test.ts +239 -0
  820. package/src/cpu.ts +173 -0
  821. package/src/http_server.ts +18 -6
  822. package/src/index.ts +15 -13
  823. package/src/inference/api_protos.ts +85 -2
  824. package/src/inference/index.ts +32 -4
  825. package/src/inference/interruption/defaults.ts +51 -0
  826. package/src/inference/interruption/errors.ts +25 -0
  827. package/src/inference/interruption/http_transport.ts +206 -0
  828. package/src/inference/interruption/interruption_cache_entry.ts +50 -0
  829. package/src/inference/interruption/interruption_detector.ts +204 -0
  830. package/src/inference/interruption/interruption_stream.ts +467 -0
  831. package/src/inference/interruption/types.ts +84 -0
  832. package/src/inference/interruption/utils.test.ts +132 -0
  833. package/src/inference/interruption/utils.ts +137 -0
  834. package/src/inference/interruption/ws_transport.ts +406 -0
  835. package/src/inference/llm.ts +214 -163
  836. package/src/inference/stt.test.ts +253 -0
  837. package/src/inference/stt.ts +449 -208
  838. package/src/inference/tts.test.ts +267 -0
  839. package/src/inference/tts.ts +377 -115
  840. package/src/inference/utils.ts +30 -2
  841. package/src/ipc/inference_proc_executor.ts +11 -3
  842. package/src/ipc/inference_proc_lazy_main.ts +13 -1
  843. package/src/ipc/job_proc_executor.ts +11 -1
  844. package/src/ipc/job_proc_lazy_main.ts +86 -20
  845. package/src/ipc/supervised_proc.test.ts +153 -0
  846. package/src/ipc/supervised_proc.ts +39 -10
  847. package/src/job.ts +120 -1
  848. package/src/language.test.ts +62 -0
  849. package/src/language.ts +380 -0
  850. package/src/llm/__snapshots__/zod-utils.test.ts.snap +559 -0
  851. package/src/llm/chat_context.test.ts +655 -0
  852. package/src/llm/chat_context.ts +412 -2
  853. package/src/llm/fallback_adapter.test.ts +238 -0
  854. package/src/llm/fallback_adapter.ts +391 -0
  855. package/src/llm/index.ts +11 -0
  856. package/src/llm/llm.ts +77 -12
  857. package/src/llm/provider_format/google.test.ts +72 -1
  858. package/src/llm/provider_format/google.ts +10 -6
  859. package/src/llm/provider_format/index.ts +7 -2
  860. package/src/llm/provider_format/openai.test.ts +480 -2
  861. package/src/llm/provider_format/openai.ts +152 -21
  862. package/src/llm/provider_format/utils.ts +11 -5
  863. package/src/llm/realtime.ts +23 -2
  864. package/src/llm/remote_chat_context.ts +2 -2
  865. package/src/llm/tool_context.test.ts +210 -1
  866. package/src/llm/tool_context.ts +115 -17
  867. package/src/llm/utils.ts +24 -16
  868. package/src/llm/zod-utils.test.ts +577 -0
  869. package/src/llm/zod-utils.ts +153 -0
  870. package/src/log.ts +71 -19
  871. package/src/metrics/base.ts +78 -19
  872. package/src/metrics/index.ts +12 -0
  873. package/src/metrics/model_usage.test.ts +545 -0
  874. package/src/metrics/model_usage.ts +262 -0
  875. package/src/metrics/usage_collector.ts +14 -3
  876. package/src/metrics/utils.ts +27 -7
  877. package/src/stream/deferred_stream.test.ts +3 -3
  878. package/src/stream/deferred_stream.ts +43 -11
  879. package/src/stream/index.ts +1 -0
  880. package/src/stream/multi_input_stream.test.ts +545 -0
  881. package/src/stream/multi_input_stream.ts +172 -0
  882. package/src/stream/stream_channel.test.ts +37 -0
  883. package/src/stream/stream_channel.ts +43 -3
  884. package/src/stt/stream_adapter.ts +30 -9
  885. package/src/stt/stt.ts +131 -22
  886. package/src/telemetry/index.ts +28 -0
  887. package/src/telemetry/logging.ts +55 -0
  888. package/src/telemetry/otel_http_exporter.ts +218 -0
  889. package/src/telemetry/pino_otel_transport.ts +265 -0
  890. package/src/telemetry/trace_types.ts +109 -0
  891. package/src/telemetry/traces.ts +673 -0
  892. package/src/telemetry/utils.ts +61 -0
  893. package/src/tokenize/basic/sentence.ts +3 -3
  894. package/src/tokenize/tokenizer.test.ts +4 -0
  895. package/src/transcription.ts +6 -0
  896. package/src/tts/fallback_adapter.ts +579 -0
  897. package/src/tts/index.ts +1 -0
  898. package/src/tts/stream_adapter.ts +38 -8
  899. package/src/tts/tts.ts +245 -62
  900. package/src/types.ts +62 -33
  901. package/src/utils.test.ts +90 -10
  902. package/src/utils.ts +176 -31
  903. package/src/vad.ts +42 -18
  904. package/src/version.ts +1 -1
  905. package/src/voice/agent.test.ts +347 -2
  906. package/src/voice/agent.ts +346 -44
  907. package/src/voice/agent_activity.test.ts +194 -0
  908. package/src/voice/agent_activity.ts +1457 -388
  909. package/src/voice/agent_session.ts +817 -112
  910. package/src/voice/audio_recognition.ts +845 -70
  911. package/src/voice/audio_recognition_span.test.ts +341 -0
  912. package/src/voice/avatar/datastream_io.ts +9 -1
  913. package/src/voice/background_audio.ts +494 -0
  914. package/src/voice/events.ts +27 -7
  915. package/src/voice/generation.ts +310 -56
  916. package/src/voice/generation_tools.test.ts +268 -0
  917. package/src/voice/index.ts +17 -3
  918. package/src/voice/interruption_detection.test.ts +151 -0
  919. package/src/voice/io.ts +115 -12
  920. package/src/voice/recorder_io/index.ts +4 -0
  921. package/src/voice/recorder_io/recorder_io.ts +783 -0
  922. package/src/voice/remote_session.ts +1083 -0
  923. package/src/voice/report.test.ts +136 -0
  924. package/src/voice/report.ts +140 -0
  925. package/src/voice/room_io/_input.ts +45 -10
  926. package/src/voice/room_io/_output.ts +26 -14
  927. package/src/voice/room_io/room_io.ts +67 -22
  928. package/src/voice/speech_handle.ts +38 -6
  929. package/src/voice/testing/fake_llm.ts +138 -0
  930. package/src/voice/testing/index.ts +52 -0
  931. package/src/voice/testing/run_result.ts +995 -0
  932. package/src/voice/testing/types.ts +118 -0
  933. package/src/voice/transcription/synchronizer.test.ts +206 -0
  934. package/src/voice/transcription/synchronizer.ts +204 -19
  935. package/src/voice/turn_config/endpointing.ts +33 -0
  936. package/src/voice/turn_config/interruption.ts +56 -0
  937. package/src/voice/turn_config/turn_handling.ts +45 -0
  938. package/src/voice/turn_config/utils.test.ts +148 -0
  939. package/src/voice/turn_config/utils.ts +167 -0
  940. package/src/voice/utils.ts +29 -0
  941. package/src/worker.ts +92 -78
  942. package/src/llm/__snapshots__/utils.test.ts.snap +0 -65
@@ -22,15 +22,24 @@ __export(audio_recognition_exports, {
22
22
  });
23
23
  module.exports = __toCommonJS(audio_recognition_exports);
24
24
  var import_rtc_node = require("@livekit/rtc-node");
25
+ var import_api = require("@opentelemetry/api");
25
26
  var import_web = require("node:stream/web");
27
+ var import_exceptions = require("../_exceptions.cjs");
28
+ var import_defaults = require("../inference/interruption/defaults.cjs");
29
+ var import_errors = require("../inference/interruption/errors.cjs");
30
+ var import_interruption_stream = require("../inference/interruption/interruption_stream.cjs");
31
+ var import_types = require("../inference/interruption/types.cjs");
26
32
  var import_chat_context = require("../llm/chat_context.cjs");
27
33
  var import_log = require("../log.cjs");
28
34
  var import_deferred_stream = require("../stream/deferred_stream.cjs");
29
35
  var import_identity_transform = require("../stream/identity_transform.cjs");
30
36
  var import_merge_readable_streams = require("../stream/merge_readable_streams.cjs");
37
+ var import_stream_channel = require("../stream/stream_channel.cjs");
31
38
  var import_stt = require("../stt/stt.cjs");
39
+ var import_telemetry = require("../telemetry/index.cjs");
32
40
  var import_utils = require("../utils.cjs");
33
41
  var import_vad = require("../vad.cjs");
42
+ var import_utils2 = require("./utils.cjs");
34
43
  class AudioRecognition {
35
44
  hooks;
36
45
  stt;
@@ -40,15 +49,23 @@ class AudioRecognition {
40
49
  minEndpointingDelay;
41
50
  maxEndpointingDelay;
42
51
  lastLanguage;
52
+ rootSpanContext;
53
+ sttModel;
54
+ sttProvider;
55
+ getLinkedParticipant;
43
56
  deferredInputStream;
44
57
  logger = (0, import_log.log)();
45
58
  lastFinalTranscriptTime = 0;
46
59
  audioTranscript = "";
47
60
  audioInterimTranscript = "";
48
- lastSpeakingTime = 0;
61
+ audioPreflightTranscript = "";
62
+ finalTranscriptConfidence = [];
63
+ lastSpeakingTime;
64
+ speechStartTime;
49
65
  userTurnCommitted = false;
50
66
  speaking = false;
51
67
  sampleRate;
68
+ userTurnSpan;
52
69
  vadInputStream;
53
70
  sttInputStream;
54
71
  silenceAudioTransform = new import_identity_transform.IdentityTransform();
@@ -58,6 +75,15 @@ class AudioRecognition {
58
75
  commitUserTurnTask;
59
76
  vadTask;
60
77
  sttTask;
78
+ interruptionTask;
79
+ // interruption detection
80
+ interruptionDetection;
81
+ _inputStartedAt;
82
+ ignoreUserTranscriptUntil;
83
+ transcriptBuffer;
84
+ isInterruptionEnabled;
85
+ isAgentSpeaking;
86
+ interruptionStreamChannel;
61
87
  constructor(opts) {
62
88
  this.hooks = opts.recognitionHooks;
63
89
  this.stt = opts.stt;
@@ -67,10 +93,33 @@ class AudioRecognition {
67
93
  this.minEndpointingDelay = opts.minEndpointingDelay;
68
94
  this.maxEndpointingDelay = opts.maxEndpointingDelay;
69
95
  this.lastLanguage = void 0;
96
+ this.rootSpanContext = opts.rootSpanContext;
97
+ this.sttModel = opts.sttModel;
98
+ this.sttProvider = opts.sttProvider;
99
+ this.getLinkedParticipant = opts.getLinkedParticipant;
70
100
  this.deferredInputStream = new import_deferred_stream.DeferredReadableStream();
71
- const [vadInputStream, sttInputStream] = this.deferredInputStream.stream.tee();
72
- this.vadInputStream = vadInputStream;
73
- this.sttInputStream = (0, import_merge_readable_streams.mergeReadableStreams)(sttInputStream, this.silenceAudioTransform.readable);
101
+ this.interruptionDetection = opts.interruptionDetection;
102
+ this.transcriptBuffer = [];
103
+ this.isInterruptionEnabled = !!(opts.interruptionDetection && opts.vad);
104
+ this.isAgentSpeaking = false;
105
+ if (opts.interruptionDetection) {
106
+ const [vadInputStream, teedInput] = this.deferredInputStream.stream.tee();
107
+ const [inputStream, sttInputStream] = teedInput.tee();
108
+ this.vadInputStream = vadInputStream;
109
+ this.sttInputStream = (0, import_merge_readable_streams.mergeReadableStreams)(
110
+ sttInputStream,
111
+ this.silenceAudioTransform.readable
112
+ );
113
+ this.interruptionStreamChannel = (0, import_stream_channel.createStreamChannel)();
114
+ this.interruptionStreamChannel.addStreamInput(inputStream);
115
+ } else {
116
+ const [vadInputStream, sttInputStream] = this.deferredInputStream.stream.tee();
117
+ this.vadInputStream = vadInputStream;
118
+ this.sttInputStream = (0, import_merge_readable_streams.mergeReadableStreams)(
119
+ sttInputStream,
120
+ this.silenceAudioTransform.readable
121
+ );
122
+ }
74
123
  this.silenceAudioWriter = this.silenceAudioTransform.writable.getWriter();
75
124
  }
76
125
  /**
@@ -82,6 +131,14 @@ class AudioRecognition {
82
131
  }
83
132
  return this.audioTranscript;
84
133
  }
134
+ /** @internal */
135
+ get inputStartedAt() {
136
+ return this._inputStartedAt;
137
+ }
138
+ /** @internal */
139
+ updateOptions(options) {
140
+ this.turnDetectionMode = options.turnDetection;
141
+ }
85
142
  async start() {
86
143
  this.vadTask = import_utils.Task.from(({ signal }) => this.createVadTask(this.vad, signal));
87
144
  this.vadTask.result.catch((err) => {
@@ -91,9 +148,194 @@ class AudioRecognition {
91
148
  this.sttTask.result.catch((err) => {
92
149
  this.logger.error(`Error running STT task: ${err}`);
93
150
  });
151
+ this.interruptionTask = import_utils.Task.from(
152
+ ({ signal }) => this.createInterruptionTask(this.interruptionDetection, signal)
153
+ );
154
+ this.interruptionTask.result.catch((err) => {
155
+ this.logger.error(`Error running interruption task: ${err}`);
156
+ });
157
+ }
158
+ async stop() {
159
+ var _a, _b, _c;
160
+ await ((_a = this.sttTask) == null ? void 0 : _a.cancelAndWait());
161
+ await ((_b = this.vadTask) == null ? void 0 : _b.cancelAndWait());
162
+ await ((_c = this.interruptionTask) == null ? void 0 : _c.cancelAndWait());
163
+ }
164
+ async disableInterruptionDetection() {
165
+ var _a, _b;
166
+ this.isInterruptionEnabled = false;
167
+ this.interruptionDetection = void 0;
168
+ await ((_a = this.interruptionTask) == null ? void 0 : _a.cancelAndWait());
169
+ this.interruptionTask = void 0;
170
+ await ((_b = this.interruptionStreamChannel) == null ? void 0 : _b.close());
171
+ this.interruptionStreamChannel = void 0;
172
+ }
173
+ async onStartOfAgentSpeech() {
174
+ this.isAgentSpeaking = true;
175
+ return this.trySendInterruptionSentinel(import_interruption_stream.InterruptionStreamSentinel.agentSpeechStarted());
176
+ }
177
+ async onEndOfAgentSpeech(ignoreUserTranscriptUntil) {
178
+ if (!this.isInterruptionEnabled) {
179
+ this.isAgentSpeaking = false;
180
+ return;
181
+ }
182
+ const inputOpen = await this.trySendInterruptionSentinel(
183
+ import_interruption_stream.InterruptionStreamSentinel.agentSpeechEnded()
184
+ );
185
+ if (!inputOpen) {
186
+ this.isAgentSpeaking = false;
187
+ return;
188
+ }
189
+ if (this.isAgentSpeaking) {
190
+ if (this.ignoreUserTranscriptUntil === void 0) {
191
+ this.onEndOfOverlapSpeech(Date.now());
192
+ }
193
+ this.ignoreUserTranscriptUntil = this.ignoreUserTranscriptUntil ? Math.min(ignoreUserTranscriptUntil, this.ignoreUserTranscriptUntil) : ignoreUserTranscriptUntil;
194
+ await this.flushHeldTranscripts();
195
+ }
196
+ this.isAgentSpeaking = false;
197
+ }
198
+ /** Start interruption inference when agent is speaking and overlap speech starts. */
199
+ async onStartOfOverlapSpeech(speechDuration, startedAt, userSpeakingSpan) {
200
+ if (this.isAgentSpeaking) {
201
+ this.trySendInterruptionSentinel(
202
+ import_interruption_stream.InterruptionStreamSentinel.overlapSpeechStarted(
203
+ speechDuration,
204
+ startedAt,
205
+ userSpeakingSpan
206
+ )
207
+ );
208
+ }
209
+ }
210
+ /** End interruption inference when overlap speech ends. */
211
+ async onEndOfOverlapSpeech(endedAt, userSpeakingSpan) {
212
+ if (!this.isInterruptionEnabled) {
213
+ return;
214
+ }
215
+ if (userSpeakingSpan && userSpeakingSpan.isRecording()) {
216
+ userSpeakingSpan.setAttribute(import_telemetry.traceTypes.ATTR_IS_INTERRUPTION, "false");
217
+ }
218
+ return this.trySendInterruptionSentinel(import_interruption_stream.InterruptionStreamSentinel.overlapSpeechEnded(endedAt));
219
+ }
220
+ /**
221
+ * Flush held transcripts whose *end time* is after the ignoreUserTranscriptUntil timestamp.
222
+ * If the event has no timestamps, we assume it is the same as the next valid event.
223
+ */
224
+ async flushHeldTranscripts() {
225
+ if (!this.isInterruptionEnabled || this.ignoreUserTranscriptUntil === void 0 || this.transcriptBuffer.length === 0) {
226
+ return;
227
+ }
228
+ if (!this._inputStartedAt) {
229
+ this.transcriptBuffer = [];
230
+ this.ignoreUserTranscriptUntil = void 0;
231
+ return;
232
+ }
233
+ let emitFromIndex = null;
234
+ let shouldFlush = false;
235
+ for (let i = 0; i < this.transcriptBuffer.length; i++) {
236
+ const ev = this.transcriptBuffer[i];
237
+ if (!ev || !ev.alternatives || ev.alternatives.length === 0) {
238
+ emitFromIndex = Math.min(emitFromIndex ?? i, i);
239
+ continue;
240
+ }
241
+ const firstAlternative = ev.alternatives[0];
242
+ if (firstAlternative.startTime === firstAlternative.endTime && firstAlternative.startTime === 0) {
243
+ this.transcriptBuffer = [];
244
+ this.ignoreUserTranscriptUntil = void 0;
245
+ return;
246
+ }
247
+ if (this.#alternativeEndsBeforeIgnoreWindow(firstAlternative)) {
248
+ emitFromIndex = null;
249
+ } else {
250
+ emitFromIndex = Math.min(emitFromIndex ?? i, i);
251
+ shouldFlush = true;
252
+ break;
253
+ }
254
+ }
255
+ const eventsToEmit = emitFromIndex !== null && shouldFlush ? this.transcriptBuffer.slice(emitFromIndex) : [];
256
+ this.transcriptBuffer = [];
257
+ this.ignoreUserTranscriptUntil = void 0;
258
+ for (const event of eventsToEmit) {
259
+ this.logger.trace(
260
+ {
261
+ event: event.type
262
+ },
263
+ "re-emitting held user transcript"
264
+ );
265
+ this.onSTTEvent(event);
266
+ }
267
+ }
268
+ #alternativeEndsBeforeIgnoreWindow(alternative) {
269
+ if (this.ignoreUserTranscriptUntil === void 0 || !this._inputStartedAt || alternative.startTime <= 0) {
270
+ return false;
271
+ }
272
+ return alternative.startTime * 1e3 + this._inputStartedAt < this.ignoreUserTranscriptUntil;
273
+ }
274
+ shouldHoldSttEvent(ev) {
275
+ if (!this.isInterruptionEnabled) {
276
+ return false;
277
+ }
278
+ if (this.isAgentSpeaking) {
279
+ return true;
280
+ }
281
+ if (ev.type === import_stt.SpeechEventType.START_OF_SPEECH) {
282
+ this.ignoreUserTranscriptUntil = void 0;
283
+ this.transcriptBuffer = [];
284
+ return false;
285
+ }
286
+ if (this.ignoreUserTranscriptUntil === void 0) {
287
+ return false;
288
+ }
289
+ if (!ev.alternatives || ev.alternatives.length === 0) {
290
+ return true;
291
+ }
292
+ const alternative = ev.alternatives[0];
293
+ if (alternative.startTime !== alternative.endTime && this.#alternativeEndsBeforeIgnoreWindow(alternative)) {
294
+ return true;
295
+ }
296
+ return false;
297
+ }
298
+ async trySendInterruptionSentinel(frame) {
299
+ if (this.isInterruptionEnabled && this.interruptionStreamChannel && !this.interruptionStreamChannel.closed) {
300
+ try {
301
+ await this.interruptionStreamChannel.write(frame);
302
+ return true;
303
+ } catch (e) {
304
+ this.logger.warn(
305
+ `could not forward interruption sentinel: ${e instanceof Error ? e.message : String(e)}`
306
+ );
307
+ }
308
+ }
309
+ return false;
310
+ }
311
+ ensureUserTurnSpan(startTime) {
312
+ var _a;
313
+ if (this.userTurnSpan && this.userTurnSpan.isRecording()) {
314
+ return this.userTurnSpan;
315
+ }
316
+ this.userTurnSpan = import_telemetry.tracer.startSpan({
317
+ name: "user_turn",
318
+ context: this.rootSpanContext,
319
+ startTime
320
+ });
321
+ const participant = (_a = this.getLinkedParticipant) == null ? void 0 : _a.call(this);
322
+ if (participant) {
323
+ (0, import_utils2.setParticipantSpanAttributes)(this.userTurnSpan, participant);
324
+ }
325
+ if (this.sttModel) {
326
+ this.userTurnSpan.setAttribute(import_telemetry.traceTypes.ATTR_GEN_AI_REQUEST_MODEL, this.sttModel);
327
+ }
328
+ if (this.sttProvider) {
329
+ this.userTurnSpan.setAttribute(import_telemetry.traceTypes.ATTR_GEN_AI_PROVIDER_NAME, this.sttProvider);
330
+ }
331
+ return this.userTurnSpan;
332
+ }
333
+ userTurnContext(span) {
334
+ const base = this.rootSpanContext ?? import_api.ROOT_CONTEXT;
335
+ return import_api.trace.setSpan(base, span);
94
336
  }
95
337
  async onSTTEvent(ev) {
96
- var _a, _b, _c, _d, _e, _f, _g, _h, _i;
338
+ var _a, _b, _c, _d, _e, _f, _g, _h, _i, _j, _k, _l, _m, _n, _o, _p, _q, _r;
97
339
  if (this.turnDetectionMode === "manual" && this.userTurnCommitted && (this.bounceEOUTask === void 0 || this.bounceEOUTask.done || ev.type == import_stt.SpeechEventType.INTERIM_TRANSCRIPT)) {
98
340
  this.logger.debug(
99
341
  {
@@ -106,14 +348,27 @@ class AudioRecognition {
106
348
  );
107
349
  return;
108
350
  }
351
+ if (ev.type !== import_stt.SpeechEventType.RECOGNITION_USAGE && this.isInterruptionEnabled) {
352
+ if (this.shouldHoldSttEvent(ev)) {
353
+ this.logger.trace(
354
+ { event: ev.type, ignoreUserTranscriptUntil: this.ignoreUserTranscriptUntil },
355
+ "holding STT event until ignore_user_transcript_until expires"
356
+ );
357
+ this.transcriptBuffer.push(ev);
358
+ return;
359
+ } else {
360
+ await this.flushHeldTranscripts();
361
+ }
362
+ }
109
363
  switch (ev.type) {
110
364
  case import_stt.SpeechEventType.FINAL_TRANSCRIPT:
111
- this.hooks.onFinalTranscript(ev);
112
365
  const transcript = (_c = (_b = ev.alternatives) == null ? void 0 : _b[0]) == null ? void 0 : _c.text;
113
- this.lastLanguage = (_e = (_d = ev.alternatives) == null ? void 0 : _d[0]) == null ? void 0 : _e.language;
366
+ const confidence = ((_e = (_d = ev.alternatives) == null ? void 0 : _d[0]) == null ? void 0 : _e.confidence) ?? 0;
367
+ this.lastLanguage = (_g = (_f = ev.alternatives) == null ? void 0 : _f[0]) == null ? void 0 : _g.language;
114
368
  if (!transcript) {
115
369
  return;
116
370
  }
371
+ this.hooks.onFinalTranscript(ev);
117
372
  this.logger.debug(
118
373
  {
119
374
  user_transcript: transcript,
@@ -124,26 +379,124 @@ class AudioRecognition {
124
379
  this.lastFinalTranscriptTime = Date.now();
125
380
  this.audioTranscript += ` ${transcript}`;
126
381
  this.audioTranscript = this.audioTranscript.trimStart();
382
+ this.finalTranscriptConfidence.push(confidence);
383
+ const transcriptChanged = this.audioTranscript !== this.audioPreflightTranscript;
127
384
  this.audioInterimTranscript = "";
128
- if (!this.speaking) {
129
- if (!this.vad) {
130
- this.lastSpeakingTime = Date.now();
385
+ this.audioPreflightTranscript = "";
386
+ if (!this.vad || this.lastSpeakingTime === void 0) {
387
+ this.lastSpeakingTime = Date.now();
388
+ }
389
+ if (this.vadBaseTurnDetection || this.userTurnCommitted) {
390
+ if (transcriptChanged) {
391
+ this.logger.debug(
392
+ { transcript: this.audioTranscript },
393
+ "triggering preemptive generation (FINAL_TRANSCRIPT)"
394
+ );
395
+ this.hooks.onPreemptiveGeneration({
396
+ newTranscript: this.audioTranscript,
397
+ transcriptConfidence: this.finalTranscriptConfidence.length > 0 ? this.finalTranscriptConfidence.reduce((a, b) => a + b, 0) / this.finalTranscriptConfidence.length : 0
398
+ });
131
399
  }
132
- if (this.vadBaseTurnDetection || this.userTurnCommitted) {
400
+ if (!this.speaking) {
133
401
  const chatCtx = this.hooks.retrieveChatCtx();
134
402
  this.logger.debug("running EOU detection on stt FINAL_TRANSCRIPT");
135
403
  this.runEOUDetection(chatCtx);
136
404
  }
137
405
  }
138
406
  break;
407
+ case import_stt.SpeechEventType.PREFLIGHT_TRANSCRIPT:
408
+ this.hooks.onInterimTranscript(ev);
409
+ const preflightTranscript = ((_i = (_h = ev.alternatives) == null ? void 0 : _h[0]) == null ? void 0 : _i.text) ?? "";
410
+ const preflightConfidence = ((_k = (_j = ev.alternatives) == null ? void 0 : _j[0]) == null ? void 0 : _k.confidence) ?? 0;
411
+ const preflightLanguage = (_m = (_l = ev.alternatives) == null ? void 0 : _l[0]) == null ? void 0 : _m.language;
412
+ const MIN_LANGUAGE_DETECTION_LENGTH = 5;
413
+ if (!this.lastLanguage || preflightLanguage && preflightTranscript.length > MIN_LANGUAGE_DETECTION_LENGTH) {
414
+ this.lastLanguage = preflightLanguage;
415
+ }
416
+ if (!preflightTranscript) {
417
+ return;
418
+ }
419
+ this.logger.debug(
420
+ {
421
+ user_transcript: preflightTranscript,
422
+ language: this.lastLanguage
423
+ },
424
+ "received user preflight transcript"
425
+ );
426
+ this.lastFinalTranscriptTime = Date.now();
427
+ this.audioPreflightTranscript = `${this.audioTranscript} ${preflightTranscript}`.trimStart();
428
+ this.audioInterimTranscript = preflightTranscript;
429
+ if (!this.vad || this.lastSpeakingTime === void 0) {
430
+ this.lastSpeakingTime = Date.now();
431
+ }
432
+ if (this.turnDetectionMode !== "manual" || this.userTurnCommitted) {
433
+ const confidenceVals = [...this.finalTranscriptConfidence, preflightConfidence];
434
+ this.logger.debug(
435
+ {
436
+ transcript: this.audioPreflightTranscript.length > 100 ? this.audioPreflightTranscript.slice(0, 100) + "..." : this.audioPreflightTranscript
437
+ },
438
+ "triggering preemptive generation (PREFLIGHT_TRANSCRIPT)"
439
+ );
440
+ this.hooks.onPreemptiveGeneration({
441
+ newTranscript: this.audioPreflightTranscript,
442
+ transcriptConfidence: confidenceVals.length > 0 ? confidenceVals.reduce((a, b) => a + b, 0) / confidenceVals.length : 0
443
+ });
444
+ }
445
+ break;
139
446
  case import_stt.SpeechEventType.INTERIM_TRANSCRIPT:
140
- this.logger.debug({ transcript: (_g = (_f = ev.alternatives) == null ? void 0 : _f[0]) == null ? void 0 : _g.text }, "interim transcript");
447
+ this.logger.debug({ transcript: (_o = (_n = ev.alternatives) == null ? void 0 : _n[0]) == null ? void 0 : _o.text }, "interim transcript");
141
448
  this.hooks.onInterimTranscript(ev);
142
- this.audioInterimTranscript = ((_i = (_h = ev.alternatives) == null ? void 0 : _h[0]) == null ? void 0 : _i.text) ?? "";
449
+ this.audioInterimTranscript = ((_q = (_p = ev.alternatives) == null ? void 0 : _p[0]) == null ? void 0 : _q.text) ?? "";
450
+ break;
451
+ case import_stt.SpeechEventType.START_OF_SPEECH:
452
+ if (this.turnDetectionMode !== "stt") break;
453
+ {
454
+ const span = this.ensureUserTurnSpan(Date.now());
455
+ const ctx = this.userTurnContext(span);
456
+ import_api.context.with(ctx, () => {
457
+ this.hooks.onStartOfSpeech({
458
+ type: import_vad.VADEventType.START_OF_SPEECH,
459
+ samplesIndex: 0,
460
+ timestamp: Date.now(),
461
+ speechDuration: 0,
462
+ silenceDuration: 0,
463
+ frames: [],
464
+ probability: 0,
465
+ inferenceDuration: 0,
466
+ speaking: true,
467
+ rawAccumulatedSilence: 0,
468
+ rawAccumulatedSpeech: 0
469
+ });
470
+ });
471
+ }
472
+ this.speaking = true;
473
+ this.lastSpeakingTime = Date.now();
474
+ (_r = this.bounceEOUTask) == null ? void 0 : _r.cancel();
143
475
  break;
144
476
  case import_stt.SpeechEventType.END_OF_SPEECH:
145
477
  if (this.turnDetectionMode !== "stt") break;
478
+ {
479
+ const span = this.ensureUserTurnSpan();
480
+ const ctx = this.userTurnContext(span);
481
+ import_api.context.with(ctx, () => {
482
+ this.hooks.onEndOfSpeech({
483
+ type: import_vad.VADEventType.END_OF_SPEECH,
484
+ samplesIndex: 0,
485
+ timestamp: Date.now(),
486
+ speechDuration: 0,
487
+ silenceDuration: 0,
488
+ frames: [],
489
+ probability: 0,
490
+ inferenceDuration: 0,
491
+ speaking: false,
492
+ rawAccumulatedSilence: 0,
493
+ rawAccumulatedSpeech: 0
494
+ });
495
+ });
496
+ }
497
+ this.speaking = false;
146
498
  this.userTurnCommitted = true;
499
+ this.lastSpeakingTime = Date.now();
147
500
  if (!this.speaking) {
148
501
  const chatCtx = this.hooks.retrieveChatCtx();
149
502
  this.logger.debug("running EOU detection on stt END_OF_SPEECH");
@@ -151,6 +504,11 @@ class AudioRecognition {
151
504
  }
152
505
  }
153
506
  }
507
+ onOverlapSpeechEvent(ev) {
508
+ if (ev.isInterruption) {
509
+ this.hooks.onInterruption(ev);
510
+ }
511
+ }
154
512
  runEOUDetection(chatCtx) {
155
513
  var _a;
156
514
  this.logger.debug(
@@ -171,48 +529,94 @@ class AudioRecognition {
171
529
  // disable EOU model if manual turn detection enabled
172
530
  this.audioTranscript && this.turnDetectionMode !== "manual" ? this.turnDetector : void 0
173
531
  );
174
- const bounceEOUTask = (lastSpeakingTime) => async (controller) => {
532
+ const bounceEOUTask = (lastSpeakingTime, lastFinalTranscriptTime, speechStartTime) => async (controller) => {
175
533
  let endpointingDelay = this.minEndpointingDelay;
534
+ const userTurnSpan = this.ensureUserTurnSpan();
535
+ const userTurnCtx = this.userTurnContext(userTurnSpan);
176
536
  if (turnDetector) {
177
- this.logger.debug("Running turn detector model");
178
- if (!turnDetector.supportsLanguage(this.lastLanguage)) {
179
- this.logger.debug(`Turn detector does not support language ${this.lastLanguage}`);
180
- } else {
181
- const endOfTurnProbability = await turnDetector.predictEndOfTurn(chatCtx);
182
- this.logger.debug(
183
- { endOfTurnProbability, language: this.lastLanguage },
184
- "end of turn probability"
185
- );
186
- const unlikelyThreshold = await turnDetector.unlikelyThreshold(this.lastLanguage);
187
- this.logger.debug(
188
- {
189
- unlikelyThreshold,
190
- endOfTurnProbability,
191
- language: this.lastLanguage,
192
- transcript: this.audioTranscript
193
- },
194
- "EOU Detection"
195
- );
196
- if (unlikelyThreshold && endOfTurnProbability < unlikelyThreshold) {
197
- endpointingDelay = this.maxEndpointingDelay;
537
+ await import_telemetry.tracer.startActiveSpan(
538
+ async (span) => {
539
+ this.logger.debug("Running turn detector model");
540
+ let endOfTurnProbability = 0;
541
+ let unlikelyThreshold;
542
+ if (!await turnDetector.supportsLanguage(this.lastLanguage)) {
543
+ this.logger.debug(`Turn detector does not support language ${this.lastLanguage}`);
544
+ } else {
545
+ try {
546
+ endOfTurnProbability = await turnDetector.predictEndOfTurn(chatCtx);
547
+ unlikelyThreshold = await turnDetector.unlikelyThreshold(this.lastLanguage);
548
+ this.logger.debug(
549
+ { endOfTurnProbability, unlikelyThreshold, language: this.lastLanguage },
550
+ "end of turn probability"
551
+ );
552
+ if (unlikelyThreshold && endOfTurnProbability < unlikelyThreshold) {
553
+ endpointingDelay = this.maxEndpointingDelay;
554
+ }
555
+ } catch (error) {
556
+ this.logger.error(error, "Error predicting end of turn");
557
+ }
558
+ }
559
+ span.setAttribute(
560
+ import_telemetry.traceTypes.ATTR_CHAT_CTX,
561
+ JSON.stringify(chatCtx.toJSON({ excludeTimestamp: false }))
562
+ );
563
+ span.setAttribute(import_telemetry.traceTypes.ATTR_EOU_PROBABILITY, endOfTurnProbability);
564
+ span.setAttribute(import_telemetry.traceTypes.ATTR_EOU_UNLIKELY_THRESHOLD, unlikelyThreshold ?? 0);
565
+ span.setAttribute(import_telemetry.traceTypes.ATTR_EOU_DELAY, endpointingDelay);
566
+ span.setAttribute(import_telemetry.traceTypes.ATTR_EOU_LANGUAGE, this.lastLanguage ?? "");
567
+ },
568
+ {
569
+ name: "eou_detection",
570
+ context: userTurnCtx
198
571
  }
199
- }
572
+ );
573
+ }
574
+ let extraSleep = endpointingDelay;
575
+ if (lastSpeakingTime !== void 0) {
576
+ extraSleep += lastSpeakingTime - Date.now();
577
+ }
578
+ if (extraSleep > 0) {
579
+ await (0, import_utils.delay)(Math.max(extraSleep, 0), { signal: controller.signal });
200
580
  }
201
- const extraSleep = lastSpeakingTime + endpointingDelay - Date.now();
202
- await (0, import_utils.delay)(Math.max(extraSleep, 0), { signal: controller.signal });
203
581
  this.logger.debug({ transcript: this.audioTranscript }, "end of user turn");
582
+ const confidenceAvg = this.finalTranscriptConfidence.length > 0 ? this.finalTranscriptConfidence.reduce((a, b) => a + b, 0) / this.finalTranscriptConfidence.length : 0;
583
+ let startedSpeakingAt;
584
+ let stoppedSpeakingAt;
585
+ let transcriptionDelay;
586
+ let endOfUtteranceDelay;
587
+ if (lastFinalTranscriptTime !== 0 && lastSpeakingTime !== void 0 && speechStartTime !== void 0) {
588
+ startedSpeakingAt = speechStartTime;
589
+ stoppedSpeakingAt = lastSpeakingTime;
590
+ transcriptionDelay = Math.max(lastFinalTranscriptTime - lastSpeakingTime, 0);
591
+ endOfUtteranceDelay = Date.now() - lastSpeakingTime;
592
+ }
204
593
  const committed = await this.hooks.onEndOfTurn({
205
594
  newTranscript: this.audioTranscript,
206
- transcriptionDelay: Math.max(this.lastFinalTranscriptTime - lastSpeakingTime, 0),
207
- endOfUtteranceDelay: Date.now() - lastSpeakingTime
595
+ transcriptConfidence: confidenceAvg,
596
+ transcriptionDelay: transcriptionDelay ?? 0,
597
+ endOfUtteranceDelay: endOfUtteranceDelay ?? 0,
598
+ startedSpeakingAt,
599
+ stoppedSpeakingAt
208
600
  });
209
601
  if (committed) {
602
+ this._endUserTurnSpan({
603
+ transcript: this.audioTranscript,
604
+ confidence: confidenceAvg,
605
+ transcriptionDelay: transcriptionDelay ?? 0,
606
+ endOfUtteranceDelay: endOfUtteranceDelay ?? 0
607
+ });
210
608
  this.audioTranscript = "";
609
+ this.finalTranscriptConfidence = [];
610
+ this.lastSpeakingTime = void 0;
611
+ this.lastFinalTranscriptTime = 0;
612
+ this.speechStartTime = void 0;
211
613
  }
212
614
  this.userTurnCommitted = false;
213
615
  };
214
616
  (_a = this.bounceEOUTask) == null ? void 0 : _a.cancel();
215
- this.bounceEOUTask = import_utils.Task.from(bounceEOUTask(this.lastSpeakingTime));
617
+ this.bounceEOUTask = import_utils.Task.from(
618
+ bounceEOUTask(this.lastSpeakingTime, this.lastFinalTranscriptTime, this.speechStartTime)
619
+ );
216
620
  this.bounceEOUTask.result.then(() => {
217
621
  this.logger.debug("EOU detection task completed");
218
622
  }).catch((err) => {
@@ -283,7 +687,12 @@ class AudioRecognition {
283
687
  switch (ev.type) {
284
688
  case import_vad.VADEventType.START_OF_SPEECH:
285
689
  this.logger.debug("VAD task: START_OF_SPEECH");
286
- this.hooks.onStartOfSpeech(ev);
690
+ {
691
+ const startTime = Date.now() - ev.speechDuration;
692
+ const span = this.ensureUserTurnSpan(startTime);
693
+ const ctx = this.userTurnContext(span);
694
+ import_api.context.with(ctx, () => this.hooks.onStartOfSpeech(ev));
695
+ }
287
696
  this.speaking = true;
288
697
  if (ev.frames.length > 0 && ev.frames[0]) {
289
698
  this.sampleRate = ev.frames[0].sampleRate;
@@ -292,12 +701,21 @@ class AudioRecognition {
292
701
  break;
293
702
  case import_vad.VADEventType.INFERENCE_DONE:
294
703
  this.hooks.onVADInferenceDone(ev);
704
+ if (ev.rawAccumulatedSpeech > 0) {
705
+ this.lastSpeakingTime = Date.now();
706
+ if (this.speechStartTime === void 0) {
707
+ this.speechStartTime = Date.now() - ev.rawAccumulatedSpeech;
708
+ }
709
+ }
295
710
  break;
296
711
  case import_vad.VADEventType.END_OF_SPEECH:
297
712
  this.logger.debug("VAD task: END_OF_SPEECH");
298
- this.hooks.onEndOfSpeech(ev);
713
+ {
714
+ const span = this.ensureUserTurnSpan();
715
+ const ctx = this.userTurnContext(span);
716
+ import_api.context.with(ctx, () => this.hooks.onEndOfSpeech(ev));
717
+ }
299
718
  this.speaking = false;
300
- this.lastSpeakingTime = Date.now() - ev.silenceDuration;
301
719
  if (this.vadBaseTurnDetection || this.turnDetectionMode === "stt" && this.userTurnCommitted) {
302
720
  const chatCtx = this.hooks.retrieveChatCtx();
303
721
  this.runEOUDetection(chatCtx);
@@ -311,6 +729,115 @@ class AudioRecognition {
311
729
  this.logger.debug("VAD task closed");
312
730
  }
313
731
  }
732
+ async createInterruptionTask(interruptionDetection, signal) {
733
+ if (!interruptionDetection || !this.interruptionStreamChannel) return;
734
+ let numRetries = 0;
735
+ const maxRetries = import_defaults.apiConnectDefaults.maxRetries;
736
+ while (!signal.aborted) {
737
+ const stream = interruptionDetection.createStream();
738
+ const eventReader = stream.stream().getReader();
739
+ const cleanup = async () => {
740
+ try {
741
+ signal.removeEventListener("abort", cleanup);
742
+ eventReader.releaseLock();
743
+ await stream.close();
744
+ } catch (e) {
745
+ this.logger.debug("createInterruptionTask: error during cleanup:", e);
746
+ }
747
+ };
748
+ signal.addEventListener("abort", cleanup, { once: true });
749
+ let forwardTask;
750
+ try {
751
+ if (numRetries > 0 && this.isAgentSpeaking) {
752
+ await stream.pushFrame(import_interruption_stream.InterruptionStreamSentinel.agentSpeechStarted());
753
+ }
754
+ forwardTask = (async () => {
755
+ const inputReader = this.interruptionStreamChannel.stream().getReader();
756
+ const abortPromise2 = (0, import_utils.waitForAbort)(signal);
757
+ try {
758
+ while (!signal.aborted) {
759
+ const res = await Promise.race([inputReader.read(), abortPromise2]);
760
+ if (!res) break;
761
+ const { value, done } = res;
762
+ if (done) break;
763
+ if (value instanceof import_rtc_node.AudioFrame) {
764
+ const frameDurationMs = value.samplesPerChannel / value.sampleRate * 1e3;
765
+ this._inputStartedAt ??= Date.now() - frameDurationMs;
766
+ } else {
767
+ this._inputStartedAt ??= Date.now();
768
+ }
769
+ await stream.pushFrame(value);
770
+ }
771
+ } finally {
772
+ inputReader.releaseLock();
773
+ }
774
+ })();
775
+ const abortPromise = (0, import_utils.waitForAbort)(signal);
776
+ while (!signal.aborted) {
777
+ const res = await Promise.race([eventReader.read(), abortPromise]);
778
+ if (!res) break;
779
+ const { done, value: ev } = res;
780
+ if (done) break;
781
+ this.onOverlapSpeechEvent(ev);
782
+ }
783
+ break;
784
+ } catch (e) {
785
+ if (signal.aborted) break;
786
+ if ((0, import_exceptions.isAPIError)(e)) {
787
+ if (maxRetries === 0 || !e.retryable) {
788
+ interruptionDetection.emitError(
789
+ new import_errors.InterruptionDetectionError(
790
+ e.message,
791
+ Date.now(),
792
+ interruptionDetection.label,
793
+ false
794
+ )
795
+ );
796
+ break;
797
+ } else if (numRetries >= maxRetries) {
798
+ interruptionDetection.emitError(
799
+ new import_errors.InterruptionDetectionError(
800
+ `failed to detect interruption after ${numRetries} attempts`,
801
+ Date.now(),
802
+ interruptionDetection.label,
803
+ false
804
+ )
805
+ );
806
+ break;
807
+ } else {
808
+ const retryInterval = (0, import_defaults.intervalForRetry)(numRetries);
809
+ interruptionDetection.emitError(
810
+ new import_errors.InterruptionDetectionError(
811
+ e.message,
812
+ Date.now(),
813
+ interruptionDetection.label,
814
+ true
815
+ )
816
+ );
817
+ this.logger.warn(
818
+ { model: interruptionDetection.label, attempt: numRetries },
819
+ `failed to detect interruption, retrying in ${retryInterval}ms`
820
+ );
821
+ numRetries++;
822
+ await (0, import_utils.delay)(retryInterval, { signal });
823
+ }
824
+ } else {
825
+ const msg = e instanceof Error ? e.message : String(e);
826
+ interruptionDetection.emitError(
827
+ new import_errors.InterruptionDetectionError(msg, Date.now(), interruptionDetection.label, false)
828
+ );
829
+ this.logger.error(e, "Error in interruption task");
830
+ break;
831
+ }
832
+ } finally {
833
+ await cleanup();
834
+ await (forwardTask == null ? void 0 : forwardTask.catch((e) => {
835
+ this.logger.debug({ err: e }, "interruption task exited with error");
836
+ }));
837
+ }
838
+ }
839
+ this.logger.debug("Interruption task closed");
840
+ }
314
841
  setInputAudioStream(audioStream) {
315
842
  this.deferredInputStream.setSource(audioStream);
316
843
  }
@@ -321,6 +848,8 @@ class AudioRecognition {
321
848
  var _a;
322
849
  this.audioTranscript = "";
323
850
  this.audioInterimTranscript = "";
851
+ this.audioPreflightTranscript = "";
852
+ this.finalTranscriptConfidence = [];
324
853
  this.userTurnCommitted = false;
325
854
  (_a = this.sttTask) == null ? void 0 : _a.cancelAndWait().finally(() => {
326
855
  this.sttTask = import_utils.Task.from(({ signal }) => this.createSttTask(this.stt, signal));
@@ -355,19 +884,49 @@ class AudioRecognition {
355
884
  this.commitUserTurnTask.result.then(() => {
356
885
  this.logger.debug("User turn committed");
357
886
  }).catch((err) => {
887
+ if (err instanceof Error && err.name === "AbortError") {
888
+ this.logger.debug("User turn commit task cancelled");
889
+ return;
890
+ }
358
891
  this.logger.error(err, "Error in user turn commit task:");
359
892
  });
360
893
  }
361
894
  async close() {
362
- var _a, _b, _c, _d;
895
+ var _a, _b, _c, _d, _e, _f;
363
896
  this.detachInputAudioStream();
897
+ this.silenceAudioWriter.releaseLock();
364
898
  await ((_a = this.commitUserTurnTask) == null ? void 0 : _a.cancelAndWait());
365
899
  await ((_b = this.sttTask) == null ? void 0 : _b.cancelAndWait());
366
900
  await ((_c = this.vadTask) == null ? void 0 : _c.cancelAndWait());
367
901
  await ((_d = this.bounceEOUTask) == null ? void 0 : _d.cancelAndWait());
902
+ await ((_e = this.interruptionTask) == null ? void 0 : _e.cancelAndWait());
903
+ await ((_f = this.interruptionStreamChannel) == null ? void 0 : _f.close());
904
+ }
905
+ _endUserTurnSpan({
906
+ transcript,
907
+ confidence,
908
+ transcriptionDelay,
909
+ endOfUtteranceDelay
910
+ }) {
911
+ if (this.userTurnSpan) {
912
+ this.userTurnSpan.setAttributes({
913
+ [import_telemetry.traceTypes.ATTR_USER_TRANSCRIPT]: transcript,
914
+ [import_telemetry.traceTypes.ATTR_TRANSCRIPT_CONFIDENCE]: confidence,
915
+ [import_telemetry.traceTypes.ATTR_TRANSCRIPTION_DELAY]: transcriptionDelay,
916
+ [import_telemetry.traceTypes.ATTR_END_OF_TURN_DELAY]: endOfUtteranceDelay
917
+ });
918
+ this.userTurnSpan.end();
919
+ this.userTurnSpan = void 0;
920
+ }
368
921
  }
369
922
  get vadBaseTurnDetection() {
370
- return ["vad", void 0].includes(this.turnDetectionMode);
923
+ if (typeof this.turnDetectionMode === "object") {
924
+ return false;
925
+ }
926
+ if (this.turnDetectionMode === void 0 || this.turnDetectionMode === "vad") {
927
+ return true;
928
+ }
929
+ return false;
371
930
  }
372
931
  }
373
932
  // Annotate the CommonJS export names for ESM import in node: