@livekit/agents 1.0.47 → 1.1.0-dev.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (444)
  1. package/dist/beta/index.cjs +29 -0
  2. package/dist/beta/index.cjs.map +1 -0
  3. package/dist/beta/index.d.cts +2 -0
  4. package/dist/beta/index.d.ts +2 -0
  5. package/dist/beta/index.d.ts.map +1 -0
  6. package/dist/beta/index.js +7 -0
  7. package/dist/beta/index.js.map +1 -0
  8. package/dist/beta/workflows/index.cjs +29 -0
  9. package/dist/beta/workflows/index.cjs.map +1 -0
  10. package/dist/beta/workflows/index.d.cts +2 -0
  11. package/dist/beta/workflows/index.d.ts +2 -0
  12. package/dist/beta/workflows/index.d.ts.map +1 -0
  13. package/dist/beta/workflows/index.js +7 -0
  14. package/dist/beta/workflows/index.js.map +1 -0
  15. package/dist/beta/workflows/task_group.cjs +162 -0
  16. package/dist/beta/workflows/task_group.cjs.map +1 -0
  17. package/dist/beta/workflows/task_group.d.cts +32 -0
  18. package/dist/beta/workflows/task_group.d.ts +32 -0
  19. package/dist/beta/workflows/task_group.d.ts.map +1 -0
  20. package/dist/beta/workflows/task_group.js +138 -0
  21. package/dist/beta/workflows/task_group.js.map +1 -0
  22. package/dist/constants.cjs +27 -0
  23. package/dist/constants.cjs.map +1 -1
  24. package/dist/constants.d.cts +9 -0
  25. package/dist/constants.d.ts +9 -0
  26. package/dist/constants.d.ts.map +1 -1
  27. package/dist/constants.js +18 -0
  28. package/dist/constants.js.map +1 -1
  29. package/dist/index.cjs +3 -0
  30. package/dist/index.cjs.map +1 -1
  31. package/dist/index.d.cts +2 -1
  32. package/dist/index.d.ts +2 -1
  33. package/dist/index.d.ts.map +1 -1
  34. package/dist/index.js +2 -0
  35. package/dist/index.js.map +1 -1
  36. package/dist/inference/api_protos.d.cts +12 -12
  37. package/dist/inference/api_protos.d.ts +12 -12
  38. package/dist/inference/interruption/defaults.cjs +81 -0
  39. package/dist/inference/interruption/defaults.cjs.map +1 -0
  40. package/dist/inference/interruption/defaults.d.cts +19 -0
  41. package/dist/inference/interruption/defaults.d.ts +19 -0
  42. package/dist/inference/interruption/defaults.d.ts.map +1 -0
  43. package/dist/inference/interruption/defaults.js +46 -0
  44. package/dist/inference/interruption/defaults.js.map +1 -0
  45. package/dist/inference/interruption/errors.cjs +44 -0
  46. package/dist/inference/interruption/errors.cjs.map +1 -0
  47. package/dist/inference/interruption/errors.d.cts +12 -0
  48. package/dist/inference/interruption/errors.d.ts +12 -0
  49. package/dist/inference/interruption/errors.d.ts.map +1 -0
  50. package/dist/inference/interruption/errors.js +20 -0
  51. package/dist/inference/interruption/errors.js.map +1 -0
  52. package/dist/inference/interruption/http_transport.cjs +147 -0
  53. package/dist/inference/interruption/http_transport.cjs.map +1 -0
  54. package/dist/inference/interruption/http_transport.d.cts +63 -0
  55. package/dist/inference/interruption/http_transport.d.ts +63 -0
  56. package/dist/inference/interruption/http_transport.d.ts.map +1 -0
  57. package/dist/inference/interruption/http_transport.js +121 -0
  58. package/dist/inference/interruption/http_transport.js.map +1 -0
  59. package/dist/inference/interruption/interruption_cache_entry.cjs +58 -0
  60. package/dist/inference/interruption/interruption_cache_entry.cjs.map +1 -0
  61. package/dist/inference/interruption/interruption_cache_entry.d.cts +30 -0
  62. package/dist/inference/interruption/interruption_cache_entry.d.ts +30 -0
  63. package/dist/inference/interruption/interruption_cache_entry.d.ts.map +1 -0
  64. package/dist/inference/interruption/interruption_cache_entry.js +34 -0
  65. package/dist/inference/interruption/interruption_cache_entry.js.map +1 -0
  66. package/dist/inference/interruption/interruption_detector.cjs +181 -0
  67. package/dist/inference/interruption/interruption_detector.cjs.map +1 -0
  68. package/dist/inference/interruption/interruption_detector.d.cts +59 -0
  69. package/dist/inference/interruption/interruption_detector.d.ts +59 -0
  70. package/dist/inference/interruption/interruption_detector.d.ts.map +1 -0
  71. package/dist/inference/interruption/interruption_detector.js +147 -0
  72. package/dist/inference/interruption/interruption_detector.js.map +1 -0
  73. package/dist/inference/interruption/interruption_stream.cjs +368 -0
  74. package/dist/inference/interruption/interruption_stream.cjs.map +1 -0
  75. package/dist/inference/interruption/interruption_stream.d.cts +46 -0
  76. package/dist/inference/interruption/interruption_stream.d.ts +46 -0
  77. package/dist/inference/interruption/interruption_stream.d.ts.map +1 -0
  78. package/dist/inference/interruption/interruption_stream.js +344 -0
  79. package/dist/inference/interruption/interruption_stream.js.map +1 -0
  80. package/dist/inference/interruption/types.cjs +17 -0
  81. package/dist/inference/interruption/types.cjs.map +1 -0
  82. package/dist/inference/interruption/types.d.cts +66 -0
  83. package/dist/inference/interruption/types.d.ts +66 -0
  84. package/dist/inference/interruption/types.d.ts.map +1 -0
  85. package/dist/inference/interruption/types.js +1 -0
  86. package/dist/inference/interruption/types.js.map +1 -0
  87. package/dist/inference/interruption/utils.cjs +130 -0
  88. package/dist/inference/interruption/utils.cjs.map +1 -0
  89. package/dist/inference/interruption/utils.d.cts +41 -0
  90. package/dist/inference/interruption/utils.d.ts +41 -0
  91. package/dist/inference/interruption/utils.d.ts.map +1 -0
  92. package/dist/inference/interruption/utils.js +105 -0
  93. package/dist/inference/interruption/utils.js.map +1 -0
  94. package/dist/inference/interruption/utils.test.cjs +105 -0
  95. package/dist/inference/interruption/utils.test.cjs.map +1 -0
  96. package/dist/inference/interruption/utils.test.js +104 -0
  97. package/dist/inference/interruption/utils.test.js.map +1 -0
  98. package/dist/inference/interruption/ws_transport.cjs +329 -0
  99. package/dist/inference/interruption/ws_transport.cjs.map +1 -0
  100. package/dist/inference/interruption/ws_transport.d.cts +33 -0
  101. package/dist/inference/interruption/ws_transport.d.ts +33 -0
  102. package/dist/inference/interruption/ws_transport.d.ts.map +1 -0
  103. package/dist/inference/interruption/ws_transport.js +295 -0
  104. package/dist/inference/interruption/ws_transport.js.map +1 -0
  105. package/dist/inference/llm.cjs +14 -10
  106. package/dist/inference/llm.cjs.map +1 -1
  107. package/dist/inference/llm.d.cts +2 -1
  108. package/dist/inference/llm.d.ts +2 -1
  109. package/dist/inference/llm.d.ts.map +1 -1
  110. package/dist/inference/llm.js +8 -10
  111. package/dist/inference/llm.js.map +1 -1
  112. package/dist/inference/stt.cjs +7 -2
  113. package/dist/inference/stt.cjs.map +1 -1
  114. package/dist/inference/stt.d.cts +2 -0
  115. package/dist/inference/stt.d.ts +2 -0
  116. package/dist/inference/stt.d.ts.map +1 -1
  117. package/dist/inference/stt.js +8 -3
  118. package/dist/inference/stt.js.map +1 -1
  119. package/dist/inference/tts.cjs +7 -2
  120. package/dist/inference/tts.cjs.map +1 -1
  121. package/dist/inference/tts.d.cts +2 -0
  122. package/dist/inference/tts.d.ts +2 -0
  123. package/dist/inference/tts.d.ts.map +1 -1
  124. package/dist/inference/tts.js +8 -3
  125. package/dist/inference/tts.js.map +1 -1
  126. package/dist/inference/utils.cjs +26 -7
  127. package/dist/inference/utils.cjs.map +1 -1
  128. package/dist/inference/utils.d.cts +13 -0
  129. package/dist/inference/utils.d.ts +13 -0
  130. package/dist/inference/utils.d.ts.map +1 -1
  131. package/dist/inference/utils.js +18 -2
  132. package/dist/inference/utils.js.map +1 -1
  133. package/dist/llm/chat_context.cjs +108 -2
  134. package/dist/llm/chat_context.cjs.map +1 -1
  135. package/dist/llm/chat_context.d.cts +28 -1
  136. package/dist/llm/chat_context.d.ts +28 -1
  137. package/dist/llm/chat_context.d.ts.map +1 -1
  138. package/dist/llm/chat_context.js +108 -2
  139. package/dist/llm/chat_context.js.map +1 -1
  140. package/dist/llm/chat_context.test.cjs +43 -0
  141. package/dist/llm/chat_context.test.cjs.map +1 -1
  142. package/dist/llm/chat_context.test.js +43 -0
  143. package/dist/llm/chat_context.test.js.map +1 -1
  144. package/dist/llm/index.cjs +2 -0
  145. package/dist/llm/index.cjs.map +1 -1
  146. package/dist/llm/index.d.cts +2 -2
  147. package/dist/llm/index.d.ts +2 -2
  148. package/dist/llm/index.d.ts.map +1 -1
  149. package/dist/llm/index.js +3 -1
  150. package/dist/llm/index.js.map +1 -1
  151. package/dist/llm/llm.cjs +16 -1
  152. package/dist/llm/llm.cjs.map +1 -1
  153. package/dist/llm/llm.d.cts +9 -0
  154. package/dist/llm/llm.d.ts +9 -0
  155. package/dist/llm/llm.d.ts.map +1 -1
  156. package/dist/llm/llm.js +16 -1
  157. package/dist/llm/llm.js.map +1 -1
  158. package/dist/llm/provider_format/index.d.cts +1 -1
  159. package/dist/llm/provider_format/index.d.ts +1 -1
  160. package/dist/llm/realtime.cjs +3 -0
  161. package/dist/llm/realtime.cjs.map +1 -1
  162. package/dist/llm/realtime.d.cts +1 -0
  163. package/dist/llm/realtime.d.ts +1 -0
  164. package/dist/llm/realtime.d.ts.map +1 -1
  165. package/dist/llm/realtime.js +3 -0
  166. package/dist/llm/realtime.js.map +1 -1
  167. package/dist/llm/tool_context.cjs +7 -0
  168. package/dist/llm/tool_context.cjs.map +1 -1
  169. package/dist/llm/tool_context.d.cts +10 -2
  170. package/dist/llm/tool_context.d.ts +10 -2
  171. package/dist/llm/tool_context.d.ts.map +1 -1
  172. package/dist/llm/tool_context.js +6 -0
  173. package/dist/llm/tool_context.js.map +1 -1
  174. package/dist/metrics/base.cjs.map +1 -1
  175. package/dist/metrics/base.d.cts +45 -1
  176. package/dist/metrics/base.d.ts +45 -1
  177. package/dist/metrics/base.d.ts.map +1 -1
  178. package/dist/metrics/index.cjs +5 -0
  179. package/dist/metrics/index.cjs.map +1 -1
  180. package/dist/metrics/index.d.cts +2 -1
  181. package/dist/metrics/index.d.ts +2 -1
  182. package/dist/metrics/index.d.ts.map +1 -1
  183. package/dist/metrics/index.js +6 -0
  184. package/dist/metrics/index.js.map +1 -1
  185. package/dist/metrics/model_usage.cjs +189 -0
  186. package/dist/metrics/model_usage.cjs.map +1 -0
  187. package/dist/metrics/model_usage.d.cts +92 -0
  188. package/dist/metrics/model_usage.d.ts +92 -0
  189. package/dist/metrics/model_usage.d.ts.map +1 -0
  190. package/dist/metrics/model_usage.js +164 -0
  191. package/dist/metrics/model_usage.js.map +1 -0
  192. package/dist/metrics/model_usage.test.cjs +474 -0
  193. package/dist/metrics/model_usage.test.cjs.map +1 -0
  194. package/dist/metrics/model_usage.test.js +476 -0
  195. package/dist/metrics/model_usage.test.js.map +1 -0
  196. package/dist/metrics/usage_collector.cjs +3 -0
  197. package/dist/metrics/usage_collector.cjs.map +1 -1
  198. package/dist/metrics/usage_collector.d.cts +9 -0
  199. package/dist/metrics/usage_collector.d.ts +9 -0
  200. package/dist/metrics/usage_collector.d.ts.map +1 -1
  201. package/dist/metrics/usage_collector.js +3 -0
  202. package/dist/metrics/usage_collector.js.map +1 -1
  203. package/dist/metrics/utils.cjs +9 -0
  204. package/dist/metrics/utils.cjs.map +1 -1
  205. package/dist/metrics/utils.d.ts.map +1 -1
  206. package/dist/metrics/utils.js +9 -0
  207. package/dist/metrics/utils.js.map +1 -1
  208. package/dist/stream/multi_input_stream.test.cjs +4 -0
  209. package/dist/stream/multi_input_stream.test.cjs.map +1 -1
  210. package/dist/stream/multi_input_stream.test.js +5 -1
  211. package/dist/stream/multi_input_stream.test.js.map +1 -1
  212. package/dist/stream/stream_channel.cjs +31 -0
  213. package/dist/stream/stream_channel.cjs.map +1 -1
  214. package/dist/stream/stream_channel.d.cts +4 -2
  215. package/dist/stream/stream_channel.d.ts +4 -2
  216. package/dist/stream/stream_channel.d.ts.map +1 -1
  217. package/dist/stream/stream_channel.js +31 -0
  218. package/dist/stream/stream_channel.js.map +1 -1
  219. package/dist/stt/stt.cjs +34 -2
  220. package/dist/stt/stt.cjs.map +1 -1
  221. package/dist/stt/stt.d.cts +22 -0
  222. package/dist/stt/stt.d.ts +22 -0
  223. package/dist/stt/stt.d.ts.map +1 -1
  224. package/dist/stt/stt.js +34 -2
  225. package/dist/stt/stt.js.map +1 -1
  226. package/dist/telemetry/otel_http_exporter.cjs +24 -5
  227. package/dist/telemetry/otel_http_exporter.cjs.map +1 -1
  228. package/dist/telemetry/otel_http_exporter.d.cts +1 -0
  229. package/dist/telemetry/otel_http_exporter.d.ts +1 -0
  230. package/dist/telemetry/otel_http_exporter.d.ts.map +1 -1
  231. package/dist/telemetry/otel_http_exporter.js +24 -5
  232. package/dist/telemetry/otel_http_exporter.js.map +1 -1
  233. package/dist/telemetry/trace_types.cjs +5 -5
  234. package/dist/telemetry/trace_types.cjs.map +1 -1
  235. package/dist/telemetry/trace_types.d.cts +9 -5
  236. package/dist/telemetry/trace_types.d.ts +9 -5
  237. package/dist/telemetry/trace_types.d.ts.map +1 -1
  238. package/dist/telemetry/trace_types.js +5 -5
  239. package/dist/telemetry/trace_types.js.map +1 -1
  240. package/dist/telemetry/traces.cjs +47 -8
  241. package/dist/telemetry/traces.cjs.map +1 -1
  242. package/dist/telemetry/traces.d.ts.map +1 -1
  243. package/dist/telemetry/traces.js +47 -8
  244. package/dist/telemetry/traces.js.map +1 -1
  245. package/dist/tts/tts.cjs +64 -2
  246. package/dist/tts/tts.cjs.map +1 -1
  247. package/dist/tts/tts.d.cts +34 -0
  248. package/dist/tts/tts.d.ts +34 -0
  249. package/dist/tts/tts.d.ts.map +1 -1
  250. package/dist/tts/tts.js +64 -2
  251. package/dist/tts/tts.js.map +1 -1
  252. package/dist/utils.cjs +1 -0
  253. package/dist/utils.cjs.map +1 -1
  254. package/dist/utils.d.ts.map +1 -1
  255. package/dist/utils.js +1 -0
  256. package/dist/utils.js.map +1 -1
  257. package/dist/version.cjs +1 -1
  258. package/dist/version.js +1 -1
  259. package/dist/voice/agent.cjs +34 -4
  260. package/dist/voice/agent.cjs.map +1 -1
  261. package/dist/voice/agent.d.cts +11 -2
  262. package/dist/voice/agent.d.ts +11 -2
  263. package/dist/voice/agent.d.ts.map +1 -1
  264. package/dist/voice/agent.js +34 -4
  265. package/dist/voice/agent.js.map +1 -1
  266. package/dist/voice/agent_activity.cjs +292 -44
  267. package/dist/voice/agent_activity.cjs.map +1 -1
  268. package/dist/voice/agent_activity.d.cts +27 -6
  269. package/dist/voice/agent_activity.d.ts +27 -6
  270. package/dist/voice/agent_activity.d.ts.map +1 -1
  271. package/dist/voice/agent_activity.js +293 -45
  272. package/dist/voice/agent_activity.js.map +1 -1
  273. package/dist/voice/agent_session.cjs +105 -48
  274. package/dist/voice/agent_session.cjs.map +1 -1
  275. package/dist/voice/agent_session.d.cts +90 -20
  276. package/dist/voice/agent_session.d.ts +90 -20
  277. package/dist/voice/agent_session.d.ts.map +1 -1
  278. package/dist/voice/agent_session.js +105 -46
  279. package/dist/voice/agent_session.js.map +1 -1
  280. package/dist/voice/audio_recognition.cjs +287 -6
  281. package/dist/voice/audio_recognition.cjs.map +1 -1
  282. package/dist/voice/audio_recognition.d.cts +42 -3
  283. package/dist/voice/audio_recognition.d.ts +42 -3
  284. package/dist/voice/audio_recognition.d.ts.map +1 -1
  285. package/dist/voice/audio_recognition.js +289 -7
  286. package/dist/voice/audio_recognition.js.map +1 -1
  287. package/dist/voice/client_events.cjs +554 -0
  288. package/dist/voice/client_events.cjs.map +1 -0
  289. package/dist/voice/client_events.d.cts +195 -0
  290. package/dist/voice/client_events.d.ts +195 -0
  291. package/dist/voice/client_events.d.ts.map +1 -0
  292. package/dist/voice/client_events.js +548 -0
  293. package/dist/voice/client_events.js.map +1 -0
  294. package/dist/voice/events.cjs +1 -0
  295. package/dist/voice/events.cjs.map +1 -1
  296. package/dist/voice/events.d.cts +8 -5
  297. package/dist/voice/events.d.ts +8 -5
  298. package/dist/voice/events.d.ts.map +1 -1
  299. package/dist/voice/events.js +1 -0
  300. package/dist/voice/events.js.map +1 -1
  301. package/dist/voice/generation.cjs +43 -8
  302. package/dist/voice/generation.cjs.map +1 -1
  303. package/dist/voice/generation.d.cts +3 -3
  304. package/dist/voice/generation.d.ts +3 -3
  305. package/dist/voice/generation.d.ts.map +1 -1
  306. package/dist/voice/generation.js +43 -8
  307. package/dist/voice/generation.js.map +1 -1
  308. package/dist/voice/index.cjs +1 -0
  309. package/dist/voice/index.cjs.map +1 -1
  310. package/dist/voice/index.d.cts +1 -0
  311. package/dist/voice/index.d.ts +1 -0
  312. package/dist/voice/index.d.ts.map +1 -1
  313. package/dist/voice/index.js +1 -0
  314. package/dist/voice/index.js.map +1 -1
  315. package/dist/voice/report.cjs +20 -8
  316. package/dist/voice/report.cjs.map +1 -1
  317. package/dist/voice/report.d.cts +5 -0
  318. package/dist/voice/report.d.ts +5 -0
  319. package/dist/voice/report.d.ts.map +1 -1
  320. package/dist/voice/report.js +20 -8
  321. package/dist/voice/report.js.map +1 -1
  322. package/dist/voice/report.test.cjs +106 -0
  323. package/dist/voice/report.test.cjs.map +1 -0
  324. package/dist/voice/report.test.js +105 -0
  325. package/dist/voice/report.test.js.map +1 -0
  326. package/dist/voice/room_io/room_io.cjs +16 -41
  327. package/dist/voice/room_io/room_io.cjs.map +1 -1
  328. package/dist/voice/room_io/room_io.d.cts +4 -9
  329. package/dist/voice/room_io/room_io.d.ts +4 -9
  330. package/dist/voice/room_io/room_io.d.ts.map +1 -1
  331. package/dist/voice/room_io/room_io.js +17 -43
  332. package/dist/voice/room_io/room_io.js.map +1 -1
  333. package/dist/voice/testing/fake_llm.cjs +127 -0
  334. package/dist/voice/testing/fake_llm.cjs.map +1 -0
  335. package/dist/voice/testing/fake_llm.d.cts +30 -0
  336. package/dist/voice/testing/fake_llm.d.ts +30 -0
  337. package/dist/voice/testing/fake_llm.d.ts.map +1 -0
  338. package/dist/voice/testing/fake_llm.js +103 -0
  339. package/dist/voice/testing/fake_llm.js.map +1 -0
  340. package/dist/voice/testing/index.cjs +3 -0
  341. package/dist/voice/testing/index.cjs.map +1 -1
  342. package/dist/voice/testing/index.d.cts +1 -0
  343. package/dist/voice/testing/index.d.ts +1 -0
  344. package/dist/voice/testing/index.d.ts.map +1 -1
  345. package/dist/voice/testing/index.js +2 -0
  346. package/dist/voice/testing/index.js.map +1 -1
  347. package/dist/voice/turn_config/endpointing.cjs +33 -0
  348. package/dist/voice/turn_config/endpointing.cjs.map +1 -0
  349. package/dist/voice/turn_config/endpointing.d.cts +30 -0
  350. package/dist/voice/turn_config/endpointing.d.ts +30 -0
  351. package/dist/voice/turn_config/endpointing.d.ts.map +1 -0
  352. package/dist/voice/turn_config/endpointing.js +9 -0
  353. package/dist/voice/turn_config/endpointing.js.map +1 -0
  354. package/dist/voice/turn_config/interruption.cjs +37 -0
  355. package/dist/voice/turn_config/interruption.cjs.map +1 -0
  356. package/dist/voice/turn_config/interruption.d.cts +53 -0
  357. package/dist/voice/turn_config/interruption.d.ts +53 -0
  358. package/dist/voice/turn_config/interruption.d.ts.map +1 -0
  359. package/dist/voice/turn_config/interruption.js +13 -0
  360. package/dist/voice/turn_config/interruption.js.map +1 -0
  361. package/dist/voice/turn_config/turn_handling.cjs +35 -0
  362. package/dist/voice/turn_config/turn_handling.cjs.map +1 -0
  363. package/dist/voice/turn_config/turn_handling.d.cts +36 -0
  364. package/dist/voice/turn_config/turn_handling.d.ts +36 -0
  365. package/dist/voice/turn_config/turn_handling.d.ts.map +1 -0
  366. package/dist/voice/turn_config/turn_handling.js +11 -0
  367. package/dist/voice/turn_config/turn_handling.js.map +1 -0
  368. package/dist/voice/turn_config/utils.cjs +97 -0
  369. package/dist/voice/turn_config/utils.cjs.map +1 -0
  370. package/dist/voice/turn_config/utils.d.cts +25 -0
  371. package/dist/voice/turn_config/utils.d.ts +25 -0
  372. package/dist/voice/turn_config/utils.d.ts.map +1 -0
  373. package/dist/voice/turn_config/utils.js +73 -0
  374. package/dist/voice/turn_config/utils.js.map +1 -0
  375. package/dist/voice/turn_config/utils.test.cjs +86 -0
  376. package/dist/voice/turn_config/utils.test.cjs.map +1 -0
  377. package/dist/voice/turn_config/utils.test.js +85 -0
  378. package/dist/voice/turn_config/utils.test.js.map +1 -0
  379. package/dist/voice/wire_format.cjs +798 -0
  380. package/dist/voice/wire_format.cjs.map +1 -0
  381. package/dist/voice/wire_format.d.cts +5503 -0
  382. package/dist/voice/wire_format.d.ts +5503 -0
  383. package/dist/voice/wire_format.d.ts.map +1 -0
  384. package/dist/voice/wire_format.js +728 -0
  385. package/dist/voice/wire_format.js.map +1 -0
  386. package/package.json +2 -1
  387. package/src/beta/index.ts +9 -0
  388. package/src/beta/workflows/index.ts +9 -0
  389. package/src/beta/workflows/task_group.ts +194 -0
  390. package/src/constants.ts +13 -0
  391. package/src/index.ts +2 -1
  392. package/src/inference/interruption/defaults.ts +51 -0
  393. package/src/inference/interruption/errors.ts +25 -0
  394. package/src/inference/interruption/http_transport.ts +187 -0
  395. package/src/inference/interruption/interruption_cache_entry.ts +50 -0
  396. package/src/inference/interruption/interruption_detector.ts +188 -0
  397. package/src/inference/interruption/interruption_stream.ts +467 -0
  398. package/src/inference/interruption/types.ts +84 -0
  399. package/src/inference/interruption/utils.test.ts +132 -0
  400. package/src/inference/interruption/utils.ts +137 -0
  401. package/src/inference/interruption/ws_transport.ts +402 -0
  402. package/src/inference/llm.ts +9 -12
  403. package/src/inference/stt.ts +10 -3
  404. package/src/inference/tts.ts +10 -3
  405. package/src/inference/utils.ts +29 -1
  406. package/src/llm/chat_context.test.ts +48 -0
  407. package/src/llm/chat_context.ts +161 -0
  408. package/src/llm/index.ts +2 -0
  409. package/src/llm/llm.ts +16 -0
  410. package/src/llm/realtime.ts +4 -0
  411. package/src/llm/tool_context.ts +14 -0
  412. package/src/metrics/base.ts +48 -1
  413. package/src/metrics/index.ts +11 -0
  414. package/src/metrics/model_usage.test.ts +545 -0
  415. package/src/metrics/model_usage.ts +262 -0
  416. package/src/metrics/usage_collector.ts +11 -0
  417. package/src/metrics/utils.ts +11 -0
  418. package/src/stream/multi_input_stream.test.ts +6 -1
  419. package/src/stream/stream_channel.ts +34 -2
  420. package/src/stt/stt.ts +38 -0
  421. package/src/telemetry/otel_http_exporter.ts +28 -5
  422. package/src/telemetry/trace_types.ts +11 -8
  423. package/src/telemetry/traces.ts +111 -54
  424. package/src/tts/tts.ts +69 -1
  425. package/src/utils.ts +5 -0
  426. package/src/voice/agent.ts +41 -3
  427. package/src/voice/agent_activity.ts +371 -34
  428. package/src/voice/agent_session.ts +207 -59
  429. package/src/voice/audio_recognition.ts +385 -9
  430. package/src/voice/client_events.ts +838 -0
  431. package/src/voice/events.ts +14 -4
  432. package/src/voice/generation.ts +52 -9
  433. package/src/voice/index.ts +1 -0
  434. package/src/voice/report.test.ts +117 -0
  435. package/src/voice/report.ts +29 -6
  436. package/src/voice/room_io/room_io.ts +21 -64
  437. package/src/voice/testing/fake_llm.ts +138 -0
  438. package/src/voice/testing/index.ts +2 -0
  439. package/src/voice/turn_config/endpointing.ts +33 -0
  440. package/src/voice/turn_config/interruption.ts +56 -0
  441. package/src/voice/turn_config/turn_handling.ts +45 -0
  442. package/src/voice/turn_config/utils.test.ts +100 -0
  443. package/src/voice/turn_config/utils.ts +103 -0
  444. package/src/voice/wire_format.ts +827 -0
@@ -0,0 +1,545 @@
1
+ // SPDX-FileCopyrightText: 2024 LiveKit, Inc.
2
+ //
3
+ // SPDX-License-Identifier: Apache-2.0
4
+ import { beforeEach, describe, expect, it } from 'vitest';
5
+ import type { LLMMetrics, RealtimeModelMetrics, STTMetrics, TTSMetrics } from './base.js';
6
+ import {
7
+ type LLMModelUsage,
8
+ ModelUsageCollector,
9
+ type STTModelUsage,
10
+ type TTSModelUsage,
11
+ filterZeroValues,
12
+ } from './model_usage.js';
13
+
14
+ describe('model_usage', () => {
15
+ describe('filterZeroValues', () => {
16
+ it('should filter out zero values from LLMModelUsage', () => {
17
+ const usage: LLMModelUsage = {
18
+ type: 'llm_usage',
19
+ provider: 'openai',
20
+ model: 'gpt-4o',
21
+ inputTokens: 100,
22
+ inputCachedTokens: 0,
23
+ inputAudioTokens: 0,
24
+ inputCachedAudioTokens: 0,
25
+ inputTextTokens: 0,
26
+ inputCachedTextTokens: 0,
27
+ inputImageTokens: 0,
28
+ inputCachedImageTokens: 0,
29
+ outputTokens: 50,
30
+ outputAudioTokens: 0,
31
+ outputTextTokens: 0,
32
+ sessionDurationMs: 0,
33
+ };
34
+
35
+ const filtered = filterZeroValues(usage);
36
+
37
+ expect(filtered.type).toBe('llm_usage');
38
+ expect(filtered.provider).toBe('openai');
39
+ expect(filtered.model).toBe('gpt-4o');
40
+ expect(filtered.inputTokens).toBe(100);
41
+ expect(filtered.outputTokens).toBe(50);
42
+ // Zero values should be filtered out
43
+ expect(filtered.inputCachedTokens).toBeUndefined();
44
+ expect(filtered.inputAudioTokens).toBeUndefined();
45
+ expect(filtered.sessionDurationMs).toBeUndefined();
46
+ });
47
+
48
+ it('should filter out zero values from TTSModelUsage', () => {
49
+ const usage: TTSModelUsage = {
50
+ type: 'tts_usage',
51
+ provider: 'elevenlabs',
52
+ model: 'eleven_turbo_v2',
53
+ inputTokens: 0,
54
+ outputTokens: 0,
55
+ charactersCount: 500,
56
+ audioDurationMs: 3000,
57
+ };
58
+
59
+ const filtered = filterZeroValues(usage);
60
+
61
+ expect(filtered.type).toBe('tts_usage');
62
+ expect(filtered.provider).toBe('elevenlabs');
63
+ expect(filtered.charactersCount).toBe(500);
64
+ expect(filtered.audioDurationMs).toBe(3000);
65
+ expect(filtered.inputTokens).toBeUndefined();
66
+ expect(filtered.outputTokens).toBeUndefined();
67
+ });
68
+
69
+ it('should keep all values when none are zero', () => {
70
+ const usage: STTModelUsage = {
71
+ type: 'stt_usage',
72
+ provider: 'deepgram',
73
+ model: 'nova-2',
74
+ inputTokens: 10,
75
+ outputTokens: 20,
76
+ audioDurationMs: 5000,
77
+ };
78
+
79
+ const filtered = filterZeroValues(usage);
80
+
81
+ expect(Object.keys(filtered)).toHaveLength(6);
82
+ expect(filtered).toEqual(usage);
83
+ });
84
+ });
85
+
86
+ describe('ModelUsageCollector', () => {
87
+ let collector: ModelUsageCollector;
88
+
89
+ beforeEach(() => {
90
+ collector = new ModelUsageCollector();
91
+ });
92
+
93
+ describe('collect LLM metrics', () => {
94
+ it('should aggregate LLM metrics by provider and model', () => {
95
+ const metrics1: LLMMetrics = {
96
+ type: 'llm_metrics',
97
+ label: 'test',
98
+ requestId: 'req1',
99
+ timestamp: Date.now(),
100
+ durationMs: 100,
101
+ ttftMs: 50,
102
+ cancelled: false,
103
+ completionTokens: 100,
104
+ promptTokens: 200,
105
+ promptCachedTokens: 50,
106
+ totalTokens: 300,
107
+ tokensPerSecond: 10,
108
+ metadata: {
109
+ modelProvider: 'openai',
110
+ modelName: 'gpt-4o',
111
+ },
112
+ };
113
+
114
+ const metrics2: LLMMetrics = {
115
+ type: 'llm_metrics',
116
+ label: 'test',
117
+ requestId: 'req2',
118
+ timestamp: Date.now(),
119
+ durationMs: 150,
120
+ ttftMs: 60,
121
+ cancelled: false,
122
+ completionTokens: 150,
123
+ promptTokens: 300,
124
+ promptCachedTokens: 75,
125
+ totalTokens: 450,
126
+ tokensPerSecond: 12,
127
+ metadata: {
128
+ modelProvider: 'openai',
129
+ modelName: 'gpt-4o',
130
+ },
131
+ };
132
+
133
+ collector.collect(metrics1);
134
+ collector.collect(metrics2);
135
+
136
+ const usage = collector.flatten();
137
+ expect(usage).toHaveLength(1);
138
+
139
+ const llmUsage = usage[0] as LLMModelUsage;
140
+ expect(llmUsage.type).toBe('llm_usage');
141
+ expect(llmUsage.provider).toBe('openai');
142
+ expect(llmUsage.model).toBe('gpt-4o');
143
+ expect(llmUsage.inputTokens).toBe(500); // 200 + 300
144
+ expect(llmUsage.inputCachedTokens).toBe(125); // 50 + 75
145
+ expect(llmUsage.outputTokens).toBe(250); // 100 + 150
146
+ });
147
+
148
+ it('should separate metrics by different providers', () => {
149
+ const openaiMetrics: LLMMetrics = {
150
+ type: 'llm_metrics',
151
+ label: 'test',
152
+ requestId: 'req1',
153
+ timestamp: Date.now(),
154
+ durationMs: 100,
155
+ ttftMs: 50,
156
+ cancelled: false,
157
+ completionTokens: 100,
158
+ promptTokens: 200,
159
+ promptCachedTokens: 0,
160
+ totalTokens: 300,
161
+ tokensPerSecond: 10,
162
+ metadata: {
163
+ modelProvider: 'openai',
164
+ modelName: 'gpt-4o',
165
+ },
166
+ };
167
+
168
+ const anthropicMetrics: LLMMetrics = {
169
+ type: 'llm_metrics',
170
+ label: 'test',
171
+ requestId: 'req2',
172
+ timestamp: Date.now(),
173
+ durationMs: 120,
174
+ ttftMs: 55,
175
+ cancelled: false,
176
+ completionTokens: 80,
177
+ promptTokens: 150,
178
+ promptCachedTokens: 0,
179
+ totalTokens: 230,
180
+ tokensPerSecond: 8,
181
+ metadata: {
182
+ modelProvider: 'anthropic',
183
+ modelName: 'claude-3-5-sonnet',
184
+ },
185
+ };
186
+
187
+ collector.collect(openaiMetrics);
188
+ collector.collect(anthropicMetrics);
189
+
190
+ const usage = collector.flatten();
191
+ expect(usage).toHaveLength(2);
192
+
193
+ const openaiUsage = usage.find(
194
+ (u) => u.type === 'llm_usage' && u.provider === 'openai',
195
+ ) as LLMModelUsage;
196
+ const anthropicUsage = usage.find(
197
+ (u) => u.type === 'llm_usage' && u.provider === 'anthropic',
198
+ ) as LLMModelUsage;
199
+
200
+ expect(openaiUsage.inputTokens).toBe(200);
201
+ expect(openaiUsage.outputTokens).toBe(100);
202
+ expect(anthropicUsage.inputTokens).toBe(150);
203
+ expect(anthropicUsage.outputTokens).toBe(80);
204
+ });
205
+ });
206
+
207
+ describe('collect TTS metrics', () => {
208
+ it('should aggregate TTS metrics by provider and model', () => {
209
+ const metrics1: TTSMetrics = {
210
+ type: 'tts_metrics',
211
+ label: 'test',
212
+ requestId: 'req1',
213
+ timestamp: Date.now(),
214
+ ttfbMs: 100,
215
+ durationMs: 500,
216
+ audioDurationMs: 3000,
217
+ cancelled: false,
218
+ charactersCount: 100,
219
+ inputTokens: 10,
220
+ outputTokens: 20,
221
+ streamed: true,
222
+ metadata: {
223
+ modelProvider: 'elevenlabs',
224
+ modelName: 'eleven_turbo_v2',
225
+ },
226
+ };
227
+
228
+ const metrics2: TTSMetrics = {
229
+ type: 'tts_metrics',
230
+ label: 'test',
231
+ requestId: 'req2',
232
+ timestamp: Date.now(),
233
+ ttfbMs: 120,
234
+ durationMs: 600,
235
+ audioDurationMs: 4000,
236
+ cancelled: false,
237
+ charactersCount: 200,
238
+ inputTokens: 15,
239
+ outputTokens: 25,
240
+ streamed: true,
241
+ metadata: {
242
+ modelProvider: 'elevenlabs',
243
+ modelName: 'eleven_turbo_v2',
244
+ },
245
+ };
246
+
247
+ collector.collect(metrics1);
248
+ collector.collect(metrics2);
249
+
250
+ const usage = collector.flatten();
251
+ expect(usage).toHaveLength(1);
252
+
253
+ const ttsUsage = usage[0] as TTSModelUsage;
254
+ expect(ttsUsage.type).toBe('tts_usage');
255
+ expect(ttsUsage.provider).toBe('elevenlabs');
256
+ expect(ttsUsage.model).toBe('eleven_turbo_v2');
257
+ expect(ttsUsage.charactersCount).toBe(300); // 100 + 200
258
+ expect(ttsUsage.audioDurationMs).toBe(7000); // 3000 + 4000
259
+ expect(ttsUsage.inputTokens).toBe(25); // 10 + 15
260
+ expect(ttsUsage.outputTokens).toBe(45); // 20 + 25
261
+ });
262
+ });
263
+
264
describe('collect STT metrics', () => {
  it('should aggregate STT metrics by provider and model', () => {
    // Both samples target the same provider/model pair; only the request id,
    // audio duration and token counts vary between them.
    const buildSttSample = (
      requestId: string,
      audioDurationMs: number,
      inputTokens: number,
      outputTokens: number,
    ): STTMetrics => ({
      type: 'stt_metrics',
      label: 'test',
      requestId,
      timestamp: Date.now(),
      durationMs: 0,
      audioDurationMs,
      inputTokens,
      outputTokens,
      streamed: true,
      metadata: {
        modelProvider: 'deepgram',
        modelName: 'nova-2',
      },
    });

    const firstSample = buildSttSample('req1', 5000, 50, 100);
    const secondSample = buildSttSample('req2', 3000, 30, 60);

    for (const sample of [firstSample, secondSample]) {
      collector.collect(sample);
    }

    // The two samples are expected to collapse into a single usage entry.
    const flattened = collector.flatten();
    expect(flattened).toHaveLength(1);

    const aggregated = flattened[0] as STTModelUsage;
    expect(aggregated.type).toBe('stt_usage');
    expect(aggregated.provider).toBe('deepgram');
    expect(aggregated.model).toBe('nova-2');
    // Numeric fields are expected to be summed across both samples.
    expect(aggregated.audioDurationMs).toBe(8000); // 5000 + 3000
    expect(aggregated.inputTokens).toBe(80); // 50 + 30
    expect(aggregated.outputTokens).toBe(160); // 100 + 60
  });
});
313
+
314
describe('collect realtime model metrics', () => {
  it('should aggregate realtime model metrics with detailed token breakdown', () => {
    // Per-modality breakdown of the prompt side, including the cached subset.
    const promptBreakdown = {
      audioTokens: 200,
      textTokens: 250,
      imageTokens: 50,
      cachedTokens: 100,
      cachedTokensDetails: {
        audioTokens: 30,
        textTokens: 50,
        imageTokens: 20,
      },
    };

    // Per-modality breakdown of the completion side.
    const completionBreakdown = {
      textTokens: 200,
      audioTokens: 100,
      imageTokens: 0,
    };

    const realtimeSample: RealtimeModelMetrics = {
      type: 'realtime_model_metrics',
      label: 'test',
      requestId: 'req1',
      timestamp: Date.now(),
      durationMs: 1000,
      ttftMs: 100,
      cancelled: false,
      inputTokens: 500,
      outputTokens: 300,
      totalTokens: 800,
      tokensPerSecond: 10,
      sessionDurationMs: 5000,
      inputTokenDetails: promptBreakdown,
      outputTokenDetails: completionBreakdown,
      metadata: {
        modelProvider: 'openai',
        modelName: 'gpt-4o-realtime',
      },
    };

    collector.collect(realtimeSample);

    const flattened = collector.flatten();
    expect(flattened).toHaveLength(1);

    // The realtime sample is expected to surface as an LLM usage entry.
    const summary = flattened[0] as LLMModelUsage;
    expect(summary.type).toBe('llm_usage');
    expect(summary.provider).toBe('openai');
    expect(summary.model).toBe('gpt-4o-realtime');

    // Input-side totals and their cached counterparts.
    expect(summary.inputTokens).toBe(500);
    expect(summary.inputCachedTokens).toBe(100);
    expect(summary.inputAudioTokens).toBe(200);
    expect(summary.inputCachedAudioTokens).toBe(30);
    expect(summary.inputTextTokens).toBe(250);
    expect(summary.inputCachedTextTokens).toBe(50);
    expect(summary.inputImageTokens).toBe(50);
    expect(summary.inputCachedImageTokens).toBe(20);

    // Output-side totals and session duration.
    expect(summary.outputTokens).toBe(300);
    expect(summary.outputTextTokens).toBe(200);
    expect(summary.outputAudioTokens).toBe(100);
    expect(summary.sessionDurationMs).toBe(5000);
  });
});
374
+
375
describe('mixed metrics collection', () => {
  it('should collect and separate LLM, TTS, and STT metrics', () => {
    const llmSample: LLMMetrics = {
      type: 'llm_metrics',
      label: 'test',
      requestId: 'req1',
      timestamp: Date.now(),
      durationMs: 100,
      ttftMs: 50,
      cancelled: false,
      completionTokens: 100,
      promptTokens: 200,
      promptCachedTokens: 0,
      totalTokens: 300,
      tokensPerSecond: 10,
      metadata: {
        modelProvider: 'openai',
        modelName: 'gpt-4o',
      },
    };

    const ttsSample: TTSMetrics = {
      type: 'tts_metrics',
      label: 'test',
      requestId: 'req2',
      timestamp: Date.now(),
      ttfbMs: 100,
      durationMs: 500,
      audioDurationMs: 3000,
      cancelled: false,
      charactersCount: 100,
      streamed: true,
      metadata: {
        modelProvider: 'elevenlabs',
        modelName: 'eleven_turbo_v2',
      },
    };

    const sttSample: STTMetrics = {
      type: 'stt_metrics',
      label: 'test',
      requestId: 'req3',
      timestamp: Date.now(),
      durationMs: 0,
      audioDurationMs: 5000,
      streamed: true,
      metadata: {
        modelProvider: 'deepgram',
        modelName: 'nova-2',
      },
    };

    // Feed one sample of each kind, in LLM -> TTS -> STT order.
    for (const sample of [llmSample, ttsSample, sttSample]) {
      collector.collect(sample);
    }

    // One usage entry per metric kind is expected.
    const flattened = collector.flatten();
    expect(flattened).toHaveLength(3);

    // Look up the usage entry carrying the given type tag, if any.
    const entryOfType = (tag: string) => flattened.find((entry) => entry.type === tag);

    const llmEntry = entryOfType('llm_usage');
    const ttsEntry = entryOfType('tts_usage');
    const sttEntry = entryOfType('stt_usage');

    expect(llmEntry).toBeDefined();
    expect(ttsEntry).toBeDefined();
    expect(sttEntry).toBeDefined();
  });
});
443
+
444
describe('flatten returns copies', () => {
  it('should return deep copies of usage objects', () => {
    const llmSample: LLMMetrics = {
      type: 'llm_metrics',
      label: 'test',
      requestId: 'req1',
      timestamp: Date.now(),
      durationMs: 100,
      ttftMs: 50,
      cancelled: false,
      completionTokens: 100,
      promptTokens: 200,
      promptCachedTokens: 0,
      totalTokens: 300,
      tokensPerSecond: 10,
      metadata: {
        modelProvider: 'openai',
        modelName: 'gpt-4o',
      },
    };

    collector.collect(llmSample);

    // Take two independent snapshots and compare their first entries.
    const [firstSnapshot] = collector.flatten();
    const [secondSnapshot] = collector.flatten();

    // Same contents...
    expect(firstSnapshot).toEqual(secondSnapshot);

    // ...but distinct object identities.
    expect(firstSnapshot).not.toBe(secondSnapshot);

    // Writing to one snapshot must leave the other untouched.
    (firstSnapshot as LLMModelUsage).inputTokens = 9999;
    expect((secondSnapshot as LLMModelUsage).inputTokens).toBe(200);
  });
});
481
+
482
describe('handles missing metadata', () => {
  it('should use empty strings when metadata is missing', () => {
    // Deliberately built without a `metadata` field.
    const sampleWithoutMetadata: LLMMetrics = {
      type: 'llm_metrics',
      label: 'test',
      requestId: 'req1',
      timestamp: Date.now(),
      durationMs: 100,
      ttftMs: 50,
      cancelled: false,
      completionTokens: 100,
      promptTokens: 200,
      promptCachedTokens: 0,
      totalTokens: 300,
      tokensPerSecond: 10,
    };

    collector.collect(sampleWithoutMetadata);

    const flattened = collector.flatten();
    expect(flattened).toHaveLength(1);

    // Provider and model are expected to fall back to empty strings.
    const { provider, model } = flattened[0] as LLMModelUsage;
    expect(provider).toBe('');
    expect(model).toBe('');
  });
});
510
+
511
describe('ignores VAD and EOU metrics', () => {
  it('should not collect VAD metrics', () => {
    const vadSample = {
      type: 'vad_metrics' as const,
      label: 'test',
      timestamp: Date.now(),
      idleTimeMs: 100,
      inferenceDurationTotalMs: 50,
      inferenceCount: 10,
    };

    collector.collect(vadSample);

    // A VAD sample is expected to produce no usage entries.
    expect(collector.flatten()).toHaveLength(0);
  });

  it('should not collect EOU metrics', () => {
    const eouSample = {
      type: 'eou_metrics' as const,
      timestamp: Date.now(),
      endOfUtteranceDelayMs: 100,
      transcriptionDelayMs: 50,
      onUserTurnCompletedDelayMs: 30,
      lastSpeakingTimeMs: Date.now(),
    };

    collector.collect(eouSample);

    // An EOU sample is expected to produce no usage entries.
    expect(collector.flatten()).toHaveLength(0);
  });
});
544
+ });
545
+ });