npm - @livekit/agents - Versions diffs - 0.0.0-20260120144724 - Mend

@livekit/agents 0.0.0-20260120144724

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (987) hide show

package/LICENSE +201 -0
package/README.md +17 -0
package/dist/_exceptions.cjs +109 -0
package/dist/_exceptions.cjs.map +1 -0
package/dist/_exceptions.d.cts +64 -0
package/dist/_exceptions.d.ts +64 -0
package/dist/_exceptions.d.ts.map +1 -0
package/dist/_exceptions.js +80 -0
package/dist/_exceptions.js.map +1 -0
package/dist/audio.cjs +170 -0
package/dist/audio.cjs.map +1 -0
package/dist/audio.d.cts +46 -0
package/dist/audio.d.ts +46 -0
package/dist/audio.d.ts.map +1 -0
package/dist/audio.js +133 -0
package/dist/audio.js.map +1 -0
package/dist/cli.cjs +171 -0
package/dist/cli.cjs.map +1 -0
package/dist/cli.d.cts +14 -0
package/dist/cli.d.ts +14 -0
package/dist/cli.d.ts.map +1 -0
package/dist/cli.js +145 -0
package/dist/cli.js.map +1 -0
package/dist/connection_pool.cjs +242 -0
package/dist/connection_pool.cjs.map +1 -0
package/dist/connection_pool.d.cts +123 -0
package/dist/connection_pool.d.ts +123 -0
package/dist/connection_pool.d.ts.map +1 -0
package/dist/connection_pool.js +218 -0
package/dist/connection_pool.js.map +1 -0
package/dist/connection_pool.test.cjs +256 -0
package/dist/connection_pool.test.cjs.map +1 -0
package/dist/connection_pool.test.js +255 -0
package/dist/connection_pool.test.js.map +1 -0
package/dist/constants.cjs +44 -0
package/dist/constants.cjs.map +1 -0
package/dist/constants.d.cts +7 -0
package/dist/constants.d.ts +7 -0
package/dist/constants.d.ts.map +1 -0
package/dist/constants.js +15 -0
package/dist/constants.js.map +1 -0
package/dist/generator.cjs +36 -0
package/dist/generator.cjs.map +1 -0
package/dist/generator.d.cts +23 -0
package/dist/generator.d.ts +23 -0
package/dist/generator.d.ts.map +1 -0
package/dist/generator.js +11 -0
package/dist/generator.js.map +1 -0
package/dist/http_server.cjs +75 -0
package/dist/http_server.cjs.map +1 -0
package/dist/http_server.d.cts +20 -0
package/dist/http_server.d.ts +20 -0
package/dist/http_server.d.ts.map +1 -0
package/dist/http_server.js +51 -0
package/dist/http_server.js.map +1 -0
package/dist/index.cjs +100 -0
package/dist/index.cjs.map +1 -0
package/dist/index.d.cts +35 -0
package/dist/index.d.ts +35 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +40 -0
package/dist/index.js.map +1 -0
package/dist/inference/api_protos.cjs +104 -0
package/dist/inference/api_protos.cjs.map +1 -0
package/dist/inference/api_protos.d.cts +222 -0
package/dist/inference/api_protos.d.ts +222 -0
package/dist/inference/api_protos.d.ts.map +1 -0
package/dist/inference/api_protos.js +70 -0
package/dist/inference/api_protos.js.map +1 -0
package/dist/inference/index.cjs +56 -0
package/dist/inference/index.cjs.map +1 -0
package/dist/inference/index.d.cts +8 -0
package/dist/inference/index.d.ts +8 -0
package/dist/inference/index.d.ts.map +1 -0
package/dist/inference/index.js +23 -0
package/dist/inference/index.js.map +1 -0
package/dist/inference/interruption/AdaptiveInterruptionDetector.cjs +152 -0
package/dist/inference/interruption/AdaptiveInterruptionDetector.cjs.map +1 -0
package/dist/inference/interruption/AdaptiveInterruptionDetector.d.cts +50 -0
package/dist/inference/interruption/AdaptiveInterruptionDetector.d.ts +50 -0
package/dist/inference/interruption/AdaptiveInterruptionDetector.d.ts.map +1 -0
package/dist/inference/interruption/AdaptiveInterruptionDetector.js +125 -0
package/dist/inference/interruption/AdaptiveInterruptionDetector.js.map +1 -0
package/dist/inference/interruption/InterruptionStream.cjs +310 -0
package/dist/inference/interruption/InterruptionStream.cjs.map +1 -0
package/dist/inference/interruption/InterruptionStream.d.cts +57 -0
package/dist/inference/interruption/InterruptionStream.d.ts +57 -0
package/dist/inference/interruption/InterruptionStream.d.ts.map +1 -0
package/dist/inference/interruption/InterruptionStream.js +288 -0
package/dist/inference/interruption/InterruptionStream.js.map +1 -0
package/dist/inference/interruption/defaults.cjs +76 -0
package/dist/inference/interruption/defaults.cjs.map +1 -0
package/dist/inference/interruption/defaults.d.cts +14 -0
package/dist/inference/interruption/defaults.d.ts +14 -0
package/dist/inference/interruption/defaults.d.ts.map +1 -0
package/dist/inference/interruption/defaults.js +42 -0
package/dist/inference/interruption/defaults.js.map +1 -0
package/dist/inference/interruption/errors.cjs +2 -0
package/dist/inference/interruption/errors.cjs.map +1 -0
package/dist/inference/interruption/errors.d.cts +2 -0
package/dist/inference/interruption/errors.d.ts +2 -0
package/dist/inference/interruption/errors.d.ts.map +1 -0
package/dist/inference/interruption/errors.js +1 -0
package/dist/inference/interruption/errors.js.map +1 -0
package/dist/inference/interruption/http_transport.cjs +57 -0
package/dist/inference/interruption/http_transport.cjs.map +1 -0
package/dist/inference/interruption/http_transport.d.cts +23 -0
package/dist/inference/interruption/http_transport.d.ts +23 -0
package/dist/inference/interruption/http_transport.d.ts.map +1 -0
package/dist/inference/interruption/http_transport.js +33 -0
package/dist/inference/interruption/http_transport.js.map +1 -0
package/dist/inference/interruption/index.cjs +34 -0
package/dist/inference/interruption/index.cjs.map +1 -0
package/dist/inference/interruption/index.d.cts +5 -0
package/dist/inference/interruption/index.d.ts +5 -0
package/dist/inference/interruption/index.d.ts.map +1 -0
package/dist/inference/interruption/index.js +7 -0
package/dist/inference/interruption/index.js.map +1 -0
package/dist/inference/interruption/interruption.cjs +85 -0
package/dist/inference/interruption/interruption.cjs.map +1 -0
package/dist/inference/interruption/interruption.d.cts +48 -0
package/dist/inference/interruption/interruption.d.ts +48 -0
package/dist/inference/interruption/interruption.d.ts.map +1 -0
package/dist/inference/interruption/interruption.js +59 -0
package/dist/inference/interruption/interruption.js.map +1 -0
package/dist/inference/llm.cjs +347 -0
package/dist/inference/llm.cjs.map +1 -0
package/dist/inference/llm.d.cts +114 -0
package/dist/inference/llm.d.ts +114 -0
package/dist/inference/llm.d.ts.map +1 -0
package/dist/inference/llm.js +318 -0
package/dist/inference/llm.js.map +1 -0
package/dist/inference/stt.cjs +371 -0
package/dist/inference/stt.cjs.map +1 -0
package/dist/inference/stt.d.cts +91 -0
package/dist/inference/stt.d.ts +91 -0
package/dist/inference/stt.d.ts.map +1 -0
package/dist/inference/stt.js +350 -0
package/dist/inference/stt.js.map +1 -0
package/dist/inference/tts.cjs +439 -0
package/dist/inference/tts.cjs.map +1 -0
package/dist/inference/tts.d.cts +80 -0
package/dist/inference/tts.d.ts +80 -0
package/dist/inference/tts.d.ts.map +1 -0
package/dist/inference/tts.js +417 -0
package/dist/inference/tts.js.map +1 -0
package/dist/inference/utils.cjs +89 -0
package/dist/inference/utils.cjs.map +1 -0
package/dist/inference/utils.d.cts +6 -0
package/dist/inference/utils.d.ts +6 -0
package/dist/inference/utils.d.ts.map +1 -0
package/dist/inference/utils.js +63 -0
package/dist/inference/utils.js.map +1 -0
package/dist/inference/utils.test.cjs +20 -0
package/dist/inference/utils.test.cjs.map +1 -0
package/dist/inference/utils.test.js +19 -0
package/dist/inference/utils.test.js.map +1 -0
package/dist/inference_runner.cjs +37 -0
package/dist/inference_runner.cjs.map +1 -0
package/dist/inference_runner.d.cts +11 -0
package/dist/inference_runner.d.ts +11 -0
package/dist/inference_runner.d.ts.map +1 -0
package/dist/inference_runner.js +13 -0
package/dist/inference_runner.js.map +1 -0
package/dist/ipc/index.cjs +23 -0
package/dist/ipc/index.cjs.map +1 -0
package/dist/ipc/index.d.cts +2 -0
package/dist/ipc/index.d.ts +2 -0
package/dist/ipc/index.d.ts.map +1 -0
package/dist/ipc/index.js +2 -0
package/dist/ipc/index.js.map +1 -0
package/dist/ipc/inference_executor.cjs +17 -0
package/dist/ipc/inference_executor.cjs.map +1 -0
package/dist/ipc/inference_executor.d.cts +4 -0
package/dist/ipc/inference_executor.d.ts +4 -0
package/dist/ipc/inference_executor.d.ts.map +1 -0
package/dist/ipc/inference_executor.js +1 -0
package/dist/ipc/inference_executor.js.map +1 -0
package/dist/ipc/inference_proc_executor.cjs +101 -0
package/dist/ipc/inference_proc_executor.cjs.map +1 -0
package/dist/ipc/inference_proc_executor.d.cts +23 -0
package/dist/ipc/inference_proc_executor.d.ts +23 -0
package/dist/ipc/inference_proc_executor.d.ts.map +1 -0
package/dist/ipc/inference_proc_executor.js +75 -0
package/dist/ipc/inference_proc_executor.js.map +1 -0
package/dist/ipc/inference_proc_lazy_main.cjs +86 -0
package/dist/ipc/inference_proc_lazy_main.cjs.map +1 -0
package/dist/ipc/inference_proc_lazy_main.d.cts +2 -0
package/dist/ipc/inference_proc_lazy_main.d.ts +2 -0
package/dist/ipc/inference_proc_lazy_main.d.ts.map +1 -0
package/dist/ipc/inference_proc_lazy_main.js +85 -0
package/dist/ipc/inference_proc_lazy_main.js.map +1 -0
package/dist/ipc/job_executor.cjs +34 -0
package/dist/ipc/job_executor.cjs.map +1 -0
package/dist/ipc/job_executor.d.cts +18 -0
package/dist/ipc/job_executor.d.ts +18 -0
package/dist/ipc/job_executor.d.ts.map +1 -0
package/dist/ipc/job_executor.js +10 -0
package/dist/ipc/job_executor.js.map +1 -0
package/dist/ipc/job_proc_executor.cjs +115 -0
package/dist/ipc/job_proc_executor.cjs.map +1 -0
package/dist/ipc/job_proc_executor.d.cts +19 -0
package/dist/ipc/job_proc_executor.d.ts +19 -0
package/dist/ipc/job_proc_executor.d.ts.map +1 -0
package/dist/ipc/job_proc_executor.js +89 -0
package/dist/ipc/job_proc_executor.js.map +1 -0
package/dist/ipc/job_proc_lazy_main.cjs +210 -0
package/dist/ipc/job_proc_lazy_main.cjs.map +1 -0
package/dist/ipc/job_proc_lazy_main.d.cts +2 -0
package/dist/ipc/job_proc_lazy_main.d.ts +2 -0
package/dist/ipc/job_proc_lazy_main.d.ts.map +1 -0
package/dist/ipc/job_proc_lazy_main.js +187 -0
package/dist/ipc/job_proc_lazy_main.js.map +1 -0
package/dist/ipc/message.cjs +17 -0
package/dist/ipc/message.cjs.map +1 -0
package/dist/ipc/message.d.cts +58 -0
package/dist/ipc/message.d.ts +58 -0
package/dist/ipc/message.d.ts.map +1 -0
package/dist/ipc/message.js +1 -0
package/dist/ipc/message.js.map +1 -0
package/dist/ipc/proc_pool.cjs +164 -0
package/dist/ipc/proc_pool.cjs.map +1 -0
package/dist/ipc/proc_pool.d.cts +31 -0
package/dist/ipc/proc_pool.d.ts +31 -0
package/dist/ipc/proc_pool.d.ts.map +1 -0
package/dist/ipc/proc_pool.js +140 -0
package/dist/ipc/proc_pool.js.map +1 -0
package/dist/ipc/supervised_proc.cjs +229 -0
package/dist/ipc/supervised_proc.cjs.map +1 -0
package/dist/ipc/supervised_proc.d.cts +32 -0
package/dist/ipc/supervised_proc.d.ts +32 -0
package/dist/ipc/supervised_proc.d.ts.map +1 -0
package/dist/ipc/supervised_proc.js +195 -0
package/dist/ipc/supervised_proc.js.map +1 -0
package/dist/ipc/supervised_proc.test.cjs +145 -0
package/dist/ipc/supervised_proc.test.cjs.map +1 -0
package/dist/ipc/supervised_proc.test.js +122 -0
package/dist/ipc/supervised_proc.test.js.map +1 -0
package/dist/job.cjs +373 -0
package/dist/job.cjs.map +1 -0
package/dist/job.d.cts +141 -0
package/dist/job.d.ts +141 -0
package/dist/job.d.ts.map +1 -0
package/dist/job.js +332 -0
package/dist/job.js.map +1 -0
package/dist/llm/chat_context.cjs +527 -0
package/dist/llm/chat_context.cjs.map +1 -0
package/dist/llm/chat_context.d.cts +223 -0
package/dist/llm/chat_context.d.ts +223 -0
package/dist/llm/chat_context.d.ts.map +1 -0
package/dist/llm/chat_context.js +496 -0
package/dist/llm/chat_context.js.map +1 -0
package/dist/llm/chat_context.test.cjs +911 -0
package/dist/llm/chat_context.test.cjs.map +1 -0
package/dist/llm/chat_context.test.js +916 -0
package/dist/llm/chat_context.test.js.map +1 -0
package/dist/llm/fallback_adapter.cjs +278 -0
package/dist/llm/fallback_adapter.cjs.map +1 -0
package/dist/llm/fallback_adapter.d.cts +73 -0
package/dist/llm/fallback_adapter.d.ts +73 -0
package/dist/llm/fallback_adapter.d.ts.map +1 -0
package/dist/llm/fallback_adapter.js +254 -0
package/dist/llm/fallback_adapter.js.map +1 -0
package/dist/llm/fallback_adapter.test.cjs +176 -0
package/dist/llm/fallback_adapter.test.cjs.map +1 -0
package/dist/llm/fallback_adapter.test.js +175 -0
package/dist/llm/fallback_adapter.test.js.map +1 -0
package/dist/llm/index.cjs +79 -0
package/dist/llm/index.cjs.map +1 -0
package/dist/llm/index.d.cts +9 -0
package/dist/llm/index.d.ts +9 -0
package/dist/llm/index.d.ts.map +1 -0
package/dist/llm/index.js +61 -0
package/dist/llm/index.js.map +1 -0
package/dist/llm/llm.cjs +226 -0
package/dist/llm/llm.cjs.map +1 -0
package/dist/llm/llm.d.cts +94 -0
package/dist/llm/llm.d.ts +94 -0
package/dist/llm/llm.d.ts.map +1 -0
package/dist/llm/llm.js +201 -0
package/dist/llm/llm.js.map +1 -0
package/dist/llm/provider_format/google.cjs +132 -0
package/dist/llm/provider_format/google.cjs.map +1 -0
package/dist/llm/provider_format/google.d.cts +6 -0
package/dist/llm/provider_format/google.d.ts +6 -0
package/dist/llm/provider_format/google.d.ts.map +1 -0
package/dist/llm/provider_format/google.js +108 -0
package/dist/llm/provider_format/google.js.map +1 -0
package/dist/llm/provider_format/google.test.cjs +724 -0
package/dist/llm/provider_format/google.test.cjs.map +1 -0
package/dist/llm/provider_format/google.test.js +728 -0
package/dist/llm/provider_format/google.test.js.map +1 -0
package/dist/llm/provider_format/index.cjs +40 -0
package/dist/llm/provider_format/index.cjs.map +1 -0
package/dist/llm/provider_format/index.d.cts +4 -0
package/dist/llm/provider_format/index.d.ts +4 -0
package/dist/llm/provider_format/index.d.ts.map +1 -0
package/dist/llm/provider_format/index.js +16 -0
package/dist/llm/provider_format/index.js.map +1 -0
package/dist/llm/provider_format/openai.cjs +138 -0
package/dist/llm/provider_format/openai.cjs.map +1 -0
package/dist/llm/provider_format/openai.d.cts +3 -0
package/dist/llm/provider_format/openai.d.ts +3 -0
package/dist/llm/provider_format/openai.d.ts.map +1 -0
package/dist/llm/provider_format/openai.js +114 -0
package/dist/llm/provider_format/openai.js.map +1 -0
package/dist/llm/provider_format/openai.test.cjs +557 -0
package/dist/llm/provider_format/openai.test.cjs.map +1 -0
package/dist/llm/provider_format/openai.test.js +561 -0
package/dist/llm/provider_format/openai.test.js.map +1 -0
package/dist/llm/provider_format/utils.cjs +146 -0
package/dist/llm/provider_format/utils.cjs.map +1 -0
package/dist/llm/provider_format/utils.d.cts +38 -0
package/dist/llm/provider_format/utils.d.ts +38 -0
package/dist/llm/provider_format/utils.d.ts.map +1 -0
package/dist/llm/provider_format/utils.js +122 -0
package/dist/llm/provider_format/utils.js.map +1 -0
package/dist/llm/realtime.cjs +77 -0
package/dist/llm/realtime.cjs.map +1 -0
package/dist/llm/realtime.d.cts +106 -0
package/dist/llm/realtime.d.ts +106 -0
package/dist/llm/realtime.d.ts.map +1 -0
package/dist/llm/realtime.js +52 -0
package/dist/llm/realtime.js.map +1 -0
package/dist/llm/remote_chat_context.cjs +112 -0
package/dist/llm/remote_chat_context.cjs.map +1 -0
package/dist/llm/remote_chat_context.d.cts +25 -0
package/dist/llm/remote_chat_context.d.ts +25 -0
package/dist/llm/remote_chat_context.d.ts.map +1 -0
package/dist/llm/remote_chat_context.js +88 -0
package/dist/llm/remote_chat_context.js.map +1 -0
package/dist/llm/remote_chat_context.test.cjs +225 -0
package/dist/llm/remote_chat_context.test.cjs.map +1 -0
package/dist/llm/remote_chat_context.test.js +224 -0
package/dist/llm/remote_chat_context.test.js.map +1 -0
package/dist/llm/tool_context.cjs +152 -0
package/dist/llm/tool_context.cjs.map +1 -0
package/dist/llm/tool_context.d.cts +153 -0
package/dist/llm/tool_context.d.ts +153 -0
package/dist/llm/tool_context.d.ts.map +1 -0
package/dist/llm/tool_context.js +119 -0
package/dist/llm/tool_context.js.map +1 -0
package/dist/llm/tool_context.test.cjs +359 -0
package/dist/llm/tool_context.test.cjs.map +1 -0
package/dist/llm/tool_context.test.js +336 -0
package/dist/llm/tool_context.test.js.map +1 -0
package/dist/llm/tool_context.type.test.cjs +92 -0
package/dist/llm/tool_context.type.test.cjs.map +1 -0
package/dist/llm/tool_context.type.test.js +91 -0
package/dist/llm/tool_context.type.test.js.map +1 -0
package/dist/llm/utils.cjs +267 -0
package/dist/llm/utils.cjs.map +1 -0
package/dist/llm/utils.d.cts +41 -0
package/dist/llm/utils.d.ts +41 -0
package/dist/llm/utils.d.ts.map +1 -0
package/dist/llm/utils.js +230 -0
package/dist/llm/utils.js.map +1 -0
package/dist/llm/utils.test.cjs +513 -0
package/dist/llm/utils.test.cjs.map +1 -0
package/dist/llm/utils.test.js +490 -0
package/dist/llm/utils.test.js.map +1 -0
package/dist/llm/zod-utils.cjs +102 -0
package/dist/llm/zod-utils.cjs.map +1 -0
package/dist/llm/zod-utils.d.cts +65 -0
package/dist/llm/zod-utils.d.ts +65 -0
package/dist/llm/zod-utils.d.ts.map +1 -0
package/dist/llm/zod-utils.js +64 -0
package/dist/llm/zod-utils.js.map +1 -0
package/dist/llm/zod-utils.test.cjs +472 -0
package/dist/llm/zod-utils.test.cjs.map +1 -0
package/dist/llm/zod-utils.test.js +455 -0
package/dist/llm/zod-utils.test.js.map +1 -0
package/dist/log.cjs +81 -0
package/dist/log.cjs.map +1 -0
package/dist/log.d.cts +20 -0
package/dist/log.d.ts +20 -0
package/dist/log.d.ts.map +1 -0
package/dist/log.js +54 -0
package/dist/log.js.map +1 -0
package/dist/metrics/base.cjs +17 -0
package/dist/metrics/base.cjs.map +1 -0
package/dist/metrics/base.d.cts +150 -0
package/dist/metrics/base.d.ts +150 -0
package/dist/metrics/base.d.ts.map +1 -0
package/dist/metrics/base.js +1 -0
package/dist/metrics/base.js.map +1 -0
package/dist/metrics/index.cjs +32 -0
package/dist/metrics/index.cjs.map +1 -0
package/dist/metrics/index.d.cts +4 -0
package/dist/metrics/index.d.ts +4 -0
package/dist/metrics/index.d.ts.map +1 -0
package/dist/metrics/index.js +7 -0
package/dist/metrics/index.js.map +1 -0
package/dist/metrics/usage_collector.cjs +58 -0
package/dist/metrics/usage_collector.cjs.map +1 -0
package/dist/metrics/usage_collector.d.cts +15 -0
package/dist/metrics/usage_collector.d.ts +15 -0
package/dist/metrics/usage_collector.d.ts.map +1 -0
package/dist/metrics/usage_collector.js +34 -0
package/dist/metrics/usage_collector.js.map +1 -0
package/dist/metrics/utils.cjs +74 -0
package/dist/metrics/utils.cjs.map +1 -0
package/dist/metrics/utils.d.cts +3 -0
package/dist/metrics/utils.d.ts +3 -0
package/dist/metrics/utils.d.ts.map +1 -0
package/dist/metrics/utils.js +50 -0
package/dist/metrics/utils.js.map +1 -0
package/dist/plugin.cjs +62 -0
package/dist/plugin.cjs.map +1 -0
package/dist/plugin.d.cts +24 -0
package/dist/plugin.d.ts +24 -0
package/dist/plugin.d.ts.map +1 -0
package/dist/plugin.js +37 -0
package/dist/plugin.js.map +1 -0
package/dist/stream/deferred_stream.cjs +106 -0
package/dist/stream/deferred_stream.cjs.map +1 -0
package/dist/stream/deferred_stream.d.cts +32 -0
package/dist/stream/deferred_stream.d.ts +32 -0
package/dist/stream/deferred_stream.d.ts.map +1 -0
package/dist/stream/deferred_stream.js +81 -0
package/dist/stream/deferred_stream.js.map +1 -0
package/dist/stream/deferred_stream.test.cjs +527 -0
package/dist/stream/deferred_stream.test.cjs.map +1 -0
package/dist/stream/deferred_stream.test.js +526 -0
package/dist/stream/deferred_stream.test.js.map +1 -0
package/dist/stream/identity_transform.cjs +42 -0
package/dist/stream/identity_transform.cjs.map +1 -0
package/dist/stream/identity_transform.d.cts +6 -0
package/dist/stream/identity_transform.d.ts +6 -0
package/dist/stream/identity_transform.d.ts.map +1 -0
package/dist/stream/identity_transform.js +18 -0
package/dist/stream/identity_transform.js.map +1 -0
package/dist/stream/identity_transform.test.cjs +125 -0
package/dist/stream/identity_transform.test.cjs.map +1 -0
package/dist/stream/identity_transform.test.js +124 -0
package/dist/stream/identity_transform.test.js.map +1 -0
package/dist/stream/index.cjs +38 -0
package/dist/stream/index.cjs.map +1 -0
package/dist/stream/index.d.cts +5 -0
package/dist/stream/index.d.ts +5 -0
package/dist/stream/index.d.ts.map +1 -0
package/dist/stream/index.js +11 -0
package/dist/stream/index.js.map +1 -0
package/dist/stream/merge_readable_streams.cjs +59 -0
package/dist/stream/merge_readable_streams.cjs.map +1 -0
package/dist/stream/merge_readable_streams.d.cts +4 -0
package/dist/stream/merge_readable_streams.d.ts +4 -0
package/dist/stream/merge_readable_streams.d.ts.map +1 -0
package/dist/stream/merge_readable_streams.js +35 -0
package/dist/stream/merge_readable_streams.js.map +1 -0
package/dist/stream/stream_channel.cjs +57 -0
package/dist/stream/stream_channel.cjs.map +1 -0
package/dist/stream/stream_channel.d.cts +11 -0
package/dist/stream/stream_channel.d.ts +11 -0
package/dist/stream/stream_channel.d.ts.map +1 -0
package/dist/stream/stream_channel.js +33 -0
package/dist/stream/stream_channel.js.map +1 -0
package/dist/stream/stream_channel.test.cjs +124 -0
package/dist/stream/stream_channel.test.cjs.map +1 -0
package/dist/stream/stream_channel.test.js +123 -0
package/dist/stream/stream_channel.test.js.map +1 -0
package/dist/stt/index.cjs +38 -0
package/dist/stt/index.cjs.map +1 -0
package/dist/stt/index.d.cts +3 -0
package/dist/stt/index.d.ts +3 -0
package/dist/stt/index.d.ts.map +1 -0
package/dist/stt/index.js +14 -0
package/dist/stt/index.js.map +1 -0
package/dist/stt/stream_adapter.cjs +115 -0
package/dist/stt/stream_adapter.cjs.map +1 -0
package/dist/stt/stream_adapter.d.cts +23 -0
package/dist/stt/stream_adapter.d.ts +23 -0
package/dist/stt/stream_adapter.d.ts.map +1 -0
package/dist/stt/stream_adapter.js +90 -0
package/dist/stt/stream_adapter.js.map +1 -0
package/dist/stt/stt.cjs +253 -0
package/dist/stt/stt.cjs.map +1 -0
package/dist/stt/stt.d.cts +158 -0
package/dist/stt/stt.d.ts +158 -0
package/dist/stt/stt.d.ts.map +1 -0
package/dist/stt/stt.js +227 -0
package/dist/stt/stt.js.map +1 -0
package/dist/telemetry/index.cjs +72 -0
package/dist/telemetry/index.cjs.map +1 -0
package/dist/telemetry/index.d.cts +7 -0
package/dist/telemetry/index.d.ts +7 -0
package/dist/telemetry/index.d.ts.map +1 -0
package/dist/telemetry/index.js +37 -0
package/dist/telemetry/index.js.map +1 -0
package/dist/telemetry/logging.cjs +65 -0
package/dist/telemetry/logging.cjs.map +1 -0
package/dist/telemetry/logging.d.cts +21 -0
package/dist/telemetry/logging.d.ts +21 -0
package/dist/telemetry/logging.d.ts.map +1 -0
package/dist/telemetry/logging.js +40 -0
package/dist/telemetry/logging.js.map +1 -0
package/dist/telemetry/otel_http_exporter.cjs +147 -0
package/dist/telemetry/otel_http_exporter.cjs.map +1 -0
package/dist/telemetry/otel_http_exporter.d.cts +62 -0
package/dist/telemetry/otel_http_exporter.d.ts +62 -0
package/dist/telemetry/otel_http_exporter.d.ts.map +1 -0
package/dist/telemetry/otel_http_exporter.js +123 -0
package/dist/telemetry/otel_http_exporter.js.map +1 -0
package/dist/telemetry/pino_otel_transport.cjs +217 -0
package/dist/telemetry/pino_otel_transport.cjs.map +1 -0
package/dist/telemetry/pino_otel_transport.d.cts +58 -0
package/dist/telemetry/pino_otel_transport.d.ts +58 -0
package/dist/telemetry/pino_otel_transport.d.ts.map +1 -0
package/dist/telemetry/pino_otel_transport.js +189 -0
package/dist/telemetry/pino_otel_transport.js.map +1 -0
package/dist/telemetry/trace_types.cjs +206 -0
package/dist/telemetry/trace_types.cjs.map +1 -0
package/dist/telemetry/trace_types.d.cts +61 -0
package/dist/telemetry/trace_types.d.ts +61 -0
package/dist/telemetry/trace_types.d.ts.map +1 -0
package/dist/telemetry/trace_types.js +123 -0
package/dist/telemetry/trace_types.js.map +1 -0
package/dist/telemetry/traces.cjs +444 -0
package/dist/telemetry/traces.cjs.map +1 -0
package/dist/telemetry/traces.d.cts +114 -0
package/dist/telemetry/traces.d.ts +114 -0
package/dist/telemetry/traces.d.ts.map +1 -0
package/dist/telemetry/traces.js +409 -0
package/dist/telemetry/traces.js.map +1 -0
package/dist/telemetry/utils.cjs +86 -0
package/dist/telemetry/utils.cjs.map +1 -0
package/dist/telemetry/utils.d.cts +5 -0
package/dist/telemetry/utils.d.ts +5 -0
package/dist/telemetry/utils.d.ts.map +1 -0
package/dist/telemetry/utils.js +51 -0
package/dist/telemetry/utils.js.map +1 -0
package/dist/tokenize/basic/basic.cjs +105 -0
package/dist/tokenize/basic/basic.cjs.map +1 -0
package/dist/tokenize/basic/basic.d.cts +24 -0
package/dist/tokenize/basic/basic.d.ts +24 -0
package/dist/tokenize/basic/basic.d.ts.map +1 -0
package/dist/tokenize/basic/basic.js +67 -0
package/dist/tokenize/basic/basic.js.map +1 -0
package/dist/tokenize/basic/hyphenator.cjs +425 -0
package/dist/tokenize/basic/hyphenator.cjs.map +1 -0
package/dist/tokenize/basic/hyphenator.d.cts +17 -0
package/dist/tokenize/basic/hyphenator.d.ts +17 -0
package/dist/tokenize/basic/hyphenator.d.ts.map +1 -0
package/dist/tokenize/basic/hyphenator.js +401 -0
package/dist/tokenize/basic/hyphenator.js.map +1 -0
package/dist/tokenize/basic/index.cjs +37 -0
package/dist/tokenize/basic/index.cjs.map +1 -0
package/dist/tokenize/basic/index.d.cts +2 -0
package/dist/tokenize/basic/index.d.ts +2 -0
package/dist/tokenize/basic/index.d.ts.map +1 -0
package/dist/tokenize/basic/index.js +15 -0
package/dist/tokenize/basic/index.js.map +1 -0
package/dist/tokenize/basic/paragraph.cjs +57 -0
package/dist/tokenize/basic/paragraph.cjs.map +1 -0
package/dist/tokenize/basic/paragraph.d.cts +5 -0
package/dist/tokenize/basic/paragraph.d.ts +5 -0
package/dist/tokenize/basic/paragraph.d.ts.map +1 -0
package/dist/tokenize/basic/paragraph.js +33 -0
package/dist/tokenize/basic/paragraph.js.map +1 -0
package/dist/tokenize/basic/sentence.cjs +97 -0
package/dist/tokenize/basic/sentence.cjs.map +1 -0
package/dist/tokenize/basic/sentence.d.cts +5 -0
package/dist/tokenize/basic/sentence.d.ts +5 -0
package/dist/tokenize/basic/sentence.d.ts.map +1 -0
package/dist/tokenize/basic/sentence.js +73 -0
package/dist/tokenize/basic/sentence.js.map +1 -0
package/dist/tokenize/basic/word.cjs +44 -0
package/dist/tokenize/basic/word.cjs.map +1 -0
package/dist/tokenize/basic/word.d.cts +5 -0
package/dist/tokenize/basic/word.d.ts +5 -0
package/dist/tokenize/basic/word.d.ts.map +1 -0
package/dist/tokenize/basic/word.js +20 -0
package/dist/tokenize/basic/word.js.map +1 -0
package/dist/tokenize/index.cjs +55 -0
package/dist/tokenize/index.cjs.map +1 -0
package/dist/tokenize/index.d.cts +5 -0
package/dist/tokenize/index.d.ts +5 -0
package/dist/tokenize/index.d.ts.map +1 -0
package/dist/tokenize/index.js +19 -0
package/dist/tokenize/index.js.map +1 -0
package/dist/tokenize/token_stream.cjs +168 -0
package/dist/tokenize/token_stream.cjs.map +1 -0
package/dist/tokenize/token_stream.d.cts +40 -0
package/dist/tokenize/token_stream.d.ts +40 -0
package/dist/tokenize/token_stream.d.ts.map +1 -0
package/dist/tokenize/token_stream.js +142 -0
package/dist/tokenize/token_stream.js.map +1 -0
package/dist/tokenize/tokenizer.cjs +184 -0
package/dist/tokenize/tokenizer.cjs.map +1 -0
package/dist/tokenize/tokenizer.d.cts +55 -0
package/dist/tokenize/tokenizer.d.ts +55 -0
package/dist/tokenize/tokenizer.d.ts.map +1 -0
package/dist/tokenize/tokenizer.js +156 -0
package/dist/tokenize/tokenizer.js.map +1 -0
package/dist/tokenize/tokenizer.test.cjs +220 -0
package/dist/tokenize/tokenizer.test.cjs.map +1 -0
package/dist/tokenize/tokenizer.test.js +219 -0
package/dist/tokenize/tokenizer.test.js.map +1 -0
package/dist/transcription.cjs +247 -0
package/dist/transcription.cjs.map +1 -0
package/dist/transcription.d.cts +31 -0
package/dist/transcription.d.ts +31 -0
package/dist/transcription.d.ts.map +1 -0
package/dist/transcription.js +222 -0
package/dist/transcription.js.map +1 -0
package/dist/tts/index.cjs +38 -0
package/dist/tts/index.cjs.map +1 -0
package/dist/tts/index.d.cts +3 -0
package/dist/tts/index.d.ts +3 -0
package/dist/tts/index.d.ts.map +1 -0
package/dist/tts/index.js +14 -0
package/dist/tts/index.js.map +1 -0
package/dist/tts/stream_adapter.cjs +105 -0
package/dist/tts/stream_adapter.cjs.map +1 -0
package/dist/tts/stream_adapter.d.cts +20 -0
package/dist/tts/stream_adapter.d.ts +20 -0
package/dist/tts/stream_adapter.d.ts.map +1 -0
package/dist/tts/stream_adapter.js +80 -0
package/dist/tts/stream_adapter.js.map +1 -0
package/dist/tts/tts.cjs +431 -0
package/dist/tts/tts.cjs.map +1 -0
package/dist/tts/tts.d.cts +161 -0
package/dist/tts/tts.d.ts +161 -0
package/dist/tts/tts.d.ts.map +1 -0
package/dist/tts/tts.js +405 -0
package/dist/tts/tts.js.map +1 -0
package/dist/types.cjs +49 -0
package/dist/types.cjs.map +1 -0
package/dist/types.d.cts +44 -0
package/dist/types.d.ts +44 -0
package/dist/types.d.ts.map +1 -0
package/dist/types.js +23 -0
package/dist/types.js.map +1 -0
package/dist/utils/ws_transport.cjs +51 -0
package/dist/utils/ws_transport.cjs.map +1 -0
package/dist/utils/ws_transport.d.cts +9 -0
package/dist/utils/ws_transport.d.ts +9 -0
package/dist/utils/ws_transport.d.ts.map +1 -0
package/dist/utils/ws_transport.js +17 -0
package/dist/utils/ws_transport.js.map +1 -0
package/dist/utils/ws_transport.test.cjs +212 -0
package/dist/utils/ws_transport.test.cjs.map +1 -0
package/dist/utils/ws_transport.test.js +211 -0
package/dist/utils/ws_transport.test.js.map +1 -0
package/dist/utils.cjs +669 -0
package/dist/utils.cjs.map +1 -0
package/dist/utils.d.cts +244 -0
package/dist/utils.d.ts +244 -0
package/dist/utils.d.ts.map +1 -0
package/dist/utils.js +617 -0
package/dist/utils.js.map +1 -0
package/dist/utils.test.cjs +492 -0
package/dist/utils.test.cjs.map +1 -0
package/dist/utils.test.js +491 -0
package/dist/utils.test.js.map +1 -0
package/dist/vad.cjs +211 -0
package/dist/vad.cjs.map +1 -0
package/dist/vad.d.cts +105 -0
package/dist/vad.d.ts +105 -0
package/dist/vad.d.ts.map +1 -0
package/dist/vad.js +185 -0
package/dist/vad.js.map +1 -0
package/dist/version.cjs +29 -0
package/dist/version.cjs.map +1 -0
package/dist/version.d.cts +2 -0
package/dist/version.d.ts +2 -0
package/dist/version.d.ts.map +1 -0
package/dist/version.js +5 -0
package/dist/version.js.map +1 -0
package/dist/voice/agent.cjs +308 -0
package/dist/voice/agent.cjs.map +1 -0
package/dist/voice/agent.d.cts +83 -0
package/dist/voice/agent.d.ts +83 -0
package/dist/voice/agent.d.ts.map +1 -0
package/dist/voice/agent.js +287 -0
package/dist/voice/agent.js.map +1 -0
package/dist/voice/agent.test.cjs +61 -0
package/dist/voice/agent.test.cjs.map +1 -0
package/dist/voice/agent.test.js +60 -0
package/dist/voice/agent.test.js.map +1 -0
package/dist/voice/agent_activity.cjs +1784 -0
package/dist/voice/agent_activity.cjs.map +1 -0
package/dist/voice/agent_activity.d.cts +116 -0
package/dist/voice/agent_activity.d.ts +116 -0
package/dist/voice/agent_activity.d.ts.map +1 -0
package/dist/voice/agent_activity.js +1780 -0
package/dist/voice/agent_activity.js.map +1 -0
package/dist/voice/agent_session.cjs +592 -0
package/dist/voice/agent_session.cjs.map +1 -0
package/dist/voice/agent_session.d.cts +165 -0
package/dist/voice/agent_session.d.ts +165 -0
package/dist/voice/agent_session.d.ts.map +1 -0
package/dist/voice/agent_session.js +582 -0
package/dist/voice/agent_session.js.map +1 -0
package/dist/voice/audio_recognition.cjs +668 -0
package/dist/voice/audio_recognition.cjs.map +1 -0
package/dist/voice/audio_recognition.d.cts +127 -0
package/dist/voice/audio_recognition.d.ts +127 -0
package/dist/voice/audio_recognition.d.ts.map +1 -0
package/dist/voice/audio_recognition.js +647 -0
package/dist/voice/audio_recognition.js.map +1 -0
package/dist/voice/avatar/datastream_io.cjs +204 -0
package/dist/voice/avatar/datastream_io.cjs.map +1 -0
package/dist/voice/avatar/datastream_io.d.cts +37 -0
package/dist/voice/avatar/datastream_io.d.ts +37 -0
package/dist/voice/avatar/datastream_io.d.ts.map +1 -0
package/dist/voice/avatar/datastream_io.js +188 -0
package/dist/voice/avatar/datastream_io.js.map +1 -0
package/dist/voice/avatar/index.cjs +23 -0
package/dist/voice/avatar/index.cjs.map +1 -0
package/dist/voice/avatar/index.d.cts +2 -0
package/dist/voice/avatar/index.d.ts +2 -0
package/dist/voice/avatar/index.d.ts.map +1 -0
package/dist/voice/avatar/index.js +2 -0
package/dist/voice/avatar/index.js.map +1 -0
package/dist/voice/background_audio.cjs +366 -0
package/dist/voice/background_audio.cjs.map +1 -0
package/dist/voice/background_audio.d.cts +121 -0
package/dist/voice/background_audio.d.ts +121 -0
package/dist/voice/background_audio.d.ts.map +1 -0
package/dist/voice/background_audio.js +342 -0
package/dist/voice/background_audio.js.map +1 -0
package/dist/voice/events.cjs +147 -0
package/dist/voice/events.cjs.map +1 -0
package/dist/voice/events.d.cts +127 -0
package/dist/voice/events.d.ts +127 -0
package/dist/voice/events.d.ts.map +1 -0
package/dist/voice/events.js +112 -0
package/dist/voice/events.js.map +1 -0
package/dist/voice/generation.cjs +747 -0
package/dist/voice/generation.cjs.map +1 -0
package/dist/voice/generation.d.cts +116 -0
package/dist/voice/generation.d.ts +116 -0
package/dist/voice/generation.d.ts.map +1 -0
package/dist/voice/generation.js +719 -0
package/dist/voice/generation.js.map +1 -0
package/dist/voice/generation_tools.test.cjs +236 -0
package/dist/voice/generation_tools.test.cjs.map +1 -0
package/dist/voice/generation_tools.test.js +235 -0
package/dist/voice/generation_tools.test.js.map +1 -0
package/dist/voice/index.cjs +49 -0
package/dist/voice/index.cjs.map +1 -0
package/dist/voice/index.d.cts +10 -0
package/dist/voice/index.d.ts +10 -0
package/dist/voice/index.d.ts.map +1 -0
package/dist/voice/index.js +16 -0
package/dist/voice/index.js.map +1 -0
package/dist/voice/interruption_detection.test.cjs +114 -0
package/dist/voice/interruption_detection.test.cjs.map +1 -0
package/dist/voice/interruption_detection.test.js +113 -0
package/dist/voice/interruption_detection.test.js.map +1 -0
package/dist/voice/io.cjs +270 -0
package/dist/voice/io.cjs.map +1 -0
package/dist/voice/io.d.cts +126 -0
package/dist/voice/io.d.ts +126 -0
package/dist/voice/io.d.ts.map +1 -0
package/dist/voice/io.js +242 -0
package/dist/voice/io.js.map +1 -0
package/dist/voice/recorder_io/index.cjs +23 -0
package/dist/voice/recorder_io/index.cjs.map +1 -0
package/dist/voice/recorder_io/index.d.cts +2 -0
package/dist/voice/recorder_io/index.d.ts +2 -0
package/dist/voice/recorder_io/index.d.ts.map +1 -0
package/dist/voice/recorder_io/index.js +2 -0
package/dist/voice/recorder_io/index.js.map +1 -0
package/dist/voice/recorder_io/recorder_io.cjs +542 -0
package/dist/voice/recorder_io/recorder_io.cjs.map +1 -0
package/dist/voice/recorder_io/recorder_io.d.cts +100 -0
package/dist/voice/recorder_io/recorder_io.d.ts +100 -0
package/dist/voice/recorder_io/recorder_io.d.ts.map +1 -0
package/dist/voice/recorder_io/recorder_io.js +508 -0
package/dist/voice/recorder_io/recorder_io.js.map +1 -0
package/dist/voice/report.cjs +75 -0
package/dist/voice/report.cjs.map +1 -0
package/dist/voice/report.d.cts +42 -0
package/dist/voice/report.d.ts +42 -0
package/dist/voice/report.d.ts.map +1 -0
package/dist/voice/report.js +50 -0
package/dist/voice/report.js.map +1 -0
package/dist/voice/room_io/_input.cjs +133 -0
package/dist/voice/room_io/_input.cjs.map +1 -0
package/dist/voice/room_io/_input.d.cts +24 -0
package/dist/voice/room_io/_input.d.ts +24 -0
package/dist/voice/room_io/_input.d.ts.map +1 -0
package/dist/voice/room_io/_input.js +114 -0
package/dist/voice/room_io/_input.js.map +1 -0
package/dist/voice/room_io/_output.cjs +359 -0
package/dist/voice/room_io/_output.cjs.map +1 -0
package/dist/voice/room_io/_output.d.cts +77 -0
package/dist/voice/room_io/_output.d.ts +77 -0
package/dist/voice/room_io/_output.d.ts.map +1 -0
package/dist/voice/room_io/_output.js +343 -0
package/dist/voice/room_io/_output.js.map +1 -0
package/dist/voice/room_io/index.cjs +25 -0
package/dist/voice/room_io/index.cjs.map +1 -0
package/dist/voice/room_io/index.d.cts +3 -0
package/dist/voice/room_io/index.d.ts +3 -0
package/dist/voice/room_io/index.d.ts.map +1 -0
package/dist/voice/room_io/index.js +3 -0
package/dist/voice/room_io/index.js.map +1 -0
package/dist/voice/room_io/room_io.cjs +373 -0
package/dist/voice/room_io/room_io.cjs.map +1 -0
package/dist/voice/room_io/room_io.d.cts +94 -0
package/dist/voice/room_io/room_io.d.ts +94 -0
package/dist/voice/room_io/room_io.d.ts.map +1 -0
package/dist/voice/room_io/room_io.js +364 -0
package/dist/voice/room_io/room_io.js.map +1 -0
package/dist/voice/run_context.cjs +51 -0
package/dist/voice/run_context.cjs.map +1 -0
package/dist/voice/run_context.d.cts +22 -0
package/dist/voice/run_context.d.ts +22 -0
package/dist/voice/run_context.d.ts.map +1 -0
package/dist/voice/run_context.js +27 -0
package/dist/voice/run_context.js.map +1 -0
package/dist/voice/speech_handle.cjs +228 -0
package/dist/voice/speech_handle.cjs.map +1 -0
package/dist/voice/speech_handle.d.cts +97 -0
package/dist/voice/speech_handle.d.ts +97 -0
package/dist/voice/speech_handle.d.ts.map +1 -0
package/dist/voice/speech_handle.js +204 -0
package/dist/voice/speech_handle.js.map +1 -0
package/dist/voice/transcription/_utils.cjs +45 -0
package/dist/voice/transcription/_utils.cjs.map +1 -0
package/dist/voice/transcription/_utils.d.cts +3 -0
package/dist/voice/transcription/_utils.d.ts +3 -0
package/dist/voice/transcription/_utils.d.ts.map +1 -0
package/dist/voice/transcription/_utils.js +21 -0
package/dist/voice/transcription/_utils.js.map +1 -0
package/dist/voice/transcription/index.cjs +23 -0
package/dist/voice/transcription/index.cjs.map +1 -0
package/dist/voice/transcription/index.d.cts +2 -0
package/dist/voice/transcription/index.d.ts +2 -0
package/dist/voice/transcription/index.d.ts.map +1 -0
package/dist/voice/transcription/index.js +2 -0
package/dist/voice/transcription/index.js.map +1 -0
package/dist/voice/transcription/synchronizer.cjs +379 -0
package/dist/voice/transcription/synchronizer.cjs.map +1 -0
package/dist/voice/transcription/synchronizer.d.cts +87 -0
package/dist/voice/transcription/synchronizer.d.ts +87 -0
package/dist/voice/transcription/synchronizer.d.ts.map +1 -0
package/dist/voice/transcription/synchronizer.js +354 -0
package/dist/voice/transcription/synchronizer.js.map +1 -0
package/dist/worker.cjs +680 -0
package/dist/worker.cjs.map +1 -0
package/dist/worker.d.cts +119 -0
package/dist/worker.d.ts +119 -0
package/dist/worker.d.ts.map +1 -0
package/dist/worker.js +645 -0
package/dist/worker.js.map +1 -0
package/package.json +86 -0
package/resources/NOTICE +2 -0
package/resources/keyboard-typing.ogg +0 -0
package/resources/keyboard-typing2.ogg +0 -0
package/resources/office-ambience.ogg +0 -0
package/src/_exceptions.ts +137 -0
package/src/audio.ts +205 -0
package/src/cli.ts +224 -0
package/src/connection_pool.test.ts +346 -0
package/src/connection_pool.ts +307 -0
package/src/constants.ts +9 -0
package/src/generator.ts +38 -0
package/src/http_server.ts +64 -0
package/src/index.ts +41 -0
package/src/inference/api_protos.ts +82 -0
package/src/inference/index.ts +32 -0
package/src/inference/interruption/AdaptiveInterruptionDetector.ts +166 -0
package/src/inference/interruption/InterruptionStream.ts +397 -0
package/src/inference/interruption/defaults.ts +33 -0
package/src/inference/interruption/errors.ts +0 -0
package/src/inference/interruption/http_transport.ts +61 -0
package/src/inference/interruption/index.ts +4 -0
package/src/inference/interruption/interruption.ts +88 -0
package/src/inference/llm.ts +532 -0
package/src/inference/stt.ts +524 -0
package/src/inference/tts.ts +574 -0
package/src/inference/utils.test.ts +31 -0
package/src/inference/utils.ts +81 -0
package/src/inference_runner.ts +19 -0
package/src/ipc/index.ts +5 -0
package/src/ipc/inference_executor.ts +7 -0
package/src/ipc/inference_proc_executor.ts +101 -0
package/src/ipc/inference_proc_lazy_main.ts +115 -0
package/src/ipc/job_executor.ts +23 -0
package/src/ipc/job_proc_executor.ts +122 -0
package/src/ipc/job_proc_lazy_main.ts +247 -0
package/src/ipc/message.ts +52 -0
package/src/ipc/proc_pool.ts +164 -0
package/src/ipc/supervised_proc.test.ts +153 -0
package/src/ipc/supervised_proc.ts +242 -0
package/src/job.ts +461 -0
package/src/llm/__snapshots__/chat_context.test.ts.snap +527 -0
package/src/llm/__snapshots__/tool_context.test.ts.snap +177 -0
package/src/llm/__snapshots__/zod-utils.test.ts.snap +559 -0
package/src/llm/chat_context.test.ts +1057 -0
package/src/llm/chat_context.ts +759 -0
package/src/llm/fallback_adapter.test.ts +238 -0
package/src/llm/fallback_adapter.ts +391 -0
package/src/llm/index.ts +74 -0
package/src/llm/llm.ts +303 -0
package/src/llm/provider_format/google.test.ts +843 -0
package/src/llm/provider_format/google.ts +134 -0
package/src/llm/provider_format/index.ts +23 -0
package/src/llm/provider_format/openai.test.ts +675 -0
package/src/llm/provider_format/openai.ts +146 -0
package/src/llm/provider_format/utils.ts +187 -0
package/src/llm/realtime.ts +163 -0
package/src/llm/remote_chat_context.test.ts +290 -0
package/src/llm/remote_chat_context.ts +114 -0
package/src/llm/tool_context.test.ts +407 -0
package/src/llm/tool_context.ts +343 -0
package/src/llm/tool_context.type.test.ts +115 -0
package/src/llm/utils.test.ts +670 -0
package/src/llm/utils.ts +336 -0
package/src/llm/zod-utils.test.ts +577 -0
package/src/llm/zod-utils.ts +153 -0
package/src/log.ts +83 -0
package/src/metrics/base.ts +168 -0
package/src/metrics/index.ts +15 -0
package/src/metrics/usage_collector.ts +46 -0
package/src/metrics/utils.ts +64 -0
package/src/plugin.ts +46 -0
package/src/stream/deferred_stream.test.ts +755 -0
package/src/stream/deferred_stream.ts +127 -0
package/src/stream/identity_transform.test.ts +179 -0
package/src/stream/identity_transform.ts +18 -0
package/src/stream/index.ts +7 -0
package/src/stream/merge_readable_streams.ts +40 -0
package/src/stream/stream_channel.test.ts +166 -0
package/src/stream/stream_channel.ts +44 -0
package/src/stt/index.ts +15 -0
package/src/stt/stream_adapter.ts +107 -0
package/src/stt/stt.ts +374 -0
package/src/telemetry/index.ts +28 -0
package/src/telemetry/logging.ts +55 -0
package/src/telemetry/otel_http_exporter.ts +195 -0
package/src/telemetry/pino_otel_transport.ts +265 -0
package/src/telemetry/trace_types.ts +95 -0
package/src/telemetry/traces.ts +612 -0
package/src/telemetry/utils.ts +61 -0
package/src/tokenize/basic/basic.ts +83 -0
package/src/tokenize/basic/hyphenator.ts +434 -0
package/src/tokenize/basic/index.ts +11 -0
package/src/tokenize/basic/paragraph.ts +43 -0
package/src/tokenize/basic/sentence.ts +89 -0
package/src/tokenize/basic/word.ts +27 -0
package/src/tokenize/index.ts +16 -0
package/src/tokenize/token_stream.ts +180 -0
package/src/tokenize/tokenizer.test.ts +255 -0
package/src/tokenize/tokenizer.ts +152 -0
package/src/transcription.ts +307 -0
package/src/tts/index.ts +12 -0
package/src/tts/stream_adapter.ts +110 -0
package/src/tts/tts.ts +598 -0
package/src/types.ts +66 -0
package/src/utils/ws_transport.test.ts +282 -0
package/src/utils/ws_transport.ts +22 -0
package/src/utils.test.ts +651 -0
package/src/utils.ts +871 -0
package/src/vad.ts +262 -0
package/src/version.ts +5 -0
package/src/voice/agent.test.ts +80 -0
package/src/voice/agent.ts +418 -0
package/src/voice/agent_activity.ts +2375 -0
package/src/voice/agent_session.ts +866 -0
package/src/voice/audio_recognition.ts +877 -0
package/src/voice/avatar/datastream_io.ts +247 -0
package/src/voice/avatar/index.ts +4 -0
package/src/voice/background_audio.ts +491 -0
package/src/voice/events.ts +261 -0
package/src/voice/generation.ts +946 -0
package/src/voice/generation_tools.test.ts +268 -0
package/src/voice/index.ts +12 -0
package/src/voice/interruption_detection.test.ts +151 -0
package/src/voice/io.ts +347 -0
package/src/voice/recorder_io/index.ts +4 -0
package/src/voice/recorder_io/recorder_io.ts +690 -0
package/src/voice/report.ts +100 -0
package/src/voice/room_io/_input.ts +162 -0
package/src/voice/room_io/_output.ts +439 -0
package/src/voice/room_io/index.ts +5 -0
package/src/voice/room_io/room_io.ts +518 -0
package/src/voice/run_context.ts +34 -0
package/src/voice/speech_handle.ts +250 -0
package/src/voice/transcription/_utils.ts +25 -0
package/src/voice/transcription/index.ts +4 -0
package/src/voice/transcription/synchronizer.ts +477 -0
package/src/worker.ts +798 -0

package/dist/voice/agent_activity.js ADDED Viewed

@@ -0,0 +1,1780 @@
+import { Mutex } from "@livekit/mutex";
+import { ROOT_CONTEXT, trace } from "@opentelemetry/api";
+import { Heap } from "heap-js";
+import { AsyncLocalStorage } from "node:async_hooks";
+import { ReadableStream } from "node:stream/web";
+import { ChatMessage } from "../llm/chat_context.js";
+import {
+  LLM,
+  RealtimeModel
+} from "../llm/index.js";
+import { isSameToolChoice, isSameToolContext } from "../llm/tool_context.js";
+import { log } from "../log.js";
+import { DeferredReadableStream } from "../stream/deferred_stream.js";
+import { STT } from "../stt/stt.js";
+import { recordRealtimeMetrics, traceTypes, tracer } from "../telemetry/index.js";
+import { splitWords } from "../tokenize/basic/word.js";
+import { TTS } from "../tts/tts.js";
+import { Future, Task, cancelAndWait, waitFor } from "../utils.js";
+import { InterruptionEventType } from "../inference/interruption/interruption.js";
+import { VAD } from "../vad.js";
+import { StopResponse, asyncLocalStorage } from "./agent.js";
+import {} from "./agent_session.js";
+import {
+  AudioRecognition
+} from "./audio_recognition.js";
+import {
+  AgentSessionEventTypes,
+  createErrorEvent,
+  createFunctionToolsExecutedEvent,
+  createMetricsCollectedEvent,
+  createSpeechCreatedEvent,
+  createUserInputTranscribedEvent
+} from "./events.js";
+import {
+  performAudioForwarding,
+  performLLMInference,
+  performTTSInference,
+  performTextForwarding,
+  performToolExecutions,
+  removeInstructions,
+  updateInstructions
+} from "./generation.js";
+import { SpeechHandle } from "./speech_handle.js";
+const speechHandleStorage = new AsyncLocalStorage(); // read by AgentActivity.onMetricsCollected to look up the speech handle of the current async context
+class AgentActivity {
+  static REPLY_TASK_CANCEL_TIMEOUT = 5e3; // presumably milliseconds — TODO confirm against the code that reads it
+  started = false; // set to true by start()
+  audioRecognition; // created in start()
+  realtimeSession; // assigned in start() when the LLM is a RealtimeModel
+  realtimeSpans;
+  // realtimeSpans (above): maps response_id to OTEL span for metrics recording
+  turnDetectionMode; // resolved in the constructor
+  logger = log();
+  _draining = false;
+  _currentSpeech;
+  speechQueue;
+  // speechQueue entries (above): [priority, timestamp, speechHandle]
+  q_updated;
+  speechTasks = /* @__PURE__ */ new Set();
+  lock = new Mutex(); // held for the duration of start()
+  audioStream = new DeferredReadableStream(); // source is attached/detached via attachAudioInput()/detachAudioInput()
+  // default to null as None, which maps to the default provider tool choice value
+  toolChoice = null;
+  _preemptiveGeneration;
+  agent;
+  agentSession;
+  /** @internal */
+  _mainTask;
+  _userTurnCompletedTask;
+  /**
+   * Notify that agent started speaking.
+   * This enables interruption detection in AudioRecognition.
+   * @internal
+   */
+  notifyAgentSpeechStarted() {
+    var _a;
+    (_a = this.audioRecognition) == null ? void 0 : _a.onStartOfAgentSpeech();
+  }
+  /**
+   * Notify that agent stopped speaking.
+   * This disables interruption detection in AudioRecognition.
+   * @internal
+   */
+  notifyAgentSpeechEnded() {
+    var _a;
+    (_a = this.audioRecognition) == null ? void 0 : _a.onEndOfAgentSpeech();
+  }
+  constructor(agent, agentSession) {
+    this.agent = agent;
+    this.agentSession = agentSession;
+    this.speechQueue = new Heap(([p1, t1, _], [p2, t2, __]) => {
+      return p1 === p2 ? t1 - t2 : p2 - p1;
+    });
+    this.q_updated = new Future();
+    this.turnDetectionMode = typeof this.turnDetection === "string" ? this.turnDetection : void 0;
+    if (this.turnDetectionMode === "vad" && this.vad === void 0) {
+      this.logger.warn(
+        'turnDetection is set to "vad", but no VAD model is provided, ignoring the turnDdetection setting'
+      );
+      this.turnDetectionMode = void 0;
+    }
+    if (this.turnDetectionMode === "stt" && this.stt === void 0) {
+      this.logger.warn(
+        'turnDetection is set to "stt", but no STT model is provided, ignoring the turnDetection setting'
+      );
+      this.turnDetectionMode = void 0;
+    }
+    if (this.llm instanceof RealtimeModel) {
+      if (this.llm.capabilities.turnDetection && !this.allowInterruptions) {
+        this.logger.warn(
+          "the RealtimeModel uses a server-side turn detection, allowInterruptions cannot be false, disable turnDetection in the RealtimeModel and use VAD on the AgentSession instead"
+        );
+      }
+      if (this.turnDetectionMode === "realtime_llm" && !this.llm.capabilities.turnDetection) {
+        this.logger.warn(
+          'turnDetection is set to "realtime_llm", but the LLM is not a RealtimeModel or the server-side turn detection is not supported/enabled, ignoring the turnDetection setting'
+        );
+        this.turnDetectionMode = void 0;
+      }
+      if (this.turnDetectionMode === "stt") {
+        this.logger.warn(
+          'turnDetection is set to "stt", but the LLM is a RealtimeModel, ignoring the turnDetection setting'
+        );
+        this.turnDetectionMode = void 0;
+      }
+      if (this.turnDetectionMode && this.turnDetectionMode !== "realtime_llm" && this.llm.capabilities.turnDetection) {
+        this.logger.warn(
+          `turnDetection is set to "${this.turnDetectionMode}", but the LLM is a RealtimeModel and server-side turn detection enabled, ignoring the turnDetection setting`
+        );
+        this.turnDetectionMode = void 0;
+      }
+      if (!this.llm.capabilities.turnDetection && this.vad && this.turnDetectionMode === void 0) {
+        this.turnDetectionMode = "vad";
+      }
+    } else if (this.turnDetectionMode === "realtime_llm") {
+      this.logger.warn(
+        'turnDetection is set to "realtime_llm", but the LLM is not a RealtimeModel'
+      );
+      this.turnDetectionMode = void 0;
+    }
+    if (!this.vad && this.stt && this.llm instanceof LLM && this.allowInterruptions && this.turnDetectionMode === void 0) {
+      this.logger.warn(
+        "VAD is not set. Enabling VAD is recommended when using LLM and STT for more responsive interruption handling."
+      );
+    }
+  }
+  async start() {
+    const unlock = await this.lock.lock();
+    try {
+      const startSpan = tracer.startSpan({
+        name: "start_agent_activity",
+        attributes: { [traceTypes.ATTR_AGENT_LABEL]: this.agent.id },
+        context: ROOT_CONTEXT
+      });
+      this.agent._agentActivity = this;
+      if (this.llm instanceof RealtimeModel) {
+        this.realtimeSession = this.llm.session();
+        this.realtimeSpans = /* @__PURE__ */ new Map();
+        this.realtimeSession.on("generation_created", (ev) => this.onGenerationCreated(ev));
+        this.realtimeSession.on("input_speech_started", (ev) => this.onInputSpeechStarted(ev));
+        this.realtimeSession.on("input_speech_stopped", (ev) => this.onInputSpeechStopped(ev));
+        this.realtimeSession.on(
+          "input_audio_transcription_completed",
+          (ev) => this.onInputAudioTranscriptionCompleted(ev)
+        );
+        this.realtimeSession.on("metrics_collected", (ev) => this.onMetricsCollected(ev));
+        this.realtimeSession.on("error", (ev) => this.onError(ev));
+        removeInstructions(this.agent._chatCtx);
+        try {
+          await this.realtimeSession.updateInstructions(this.agent.instructions);
+        } catch (error) {
+          this.logger.error(error, "failed to update the instructions");
+        }
+        try {
+          await this.realtimeSession.updateChatCtx(this.agent.chatCtx);
+        } catch (error) {
+          this.logger.error(error, "failed to update the chat context");
+        }
+        try {
+          await this.realtimeSession.updateTools(this.tools);
+        } catch (error) {
+          this.logger.error(error, "failed to update the tools");
+        }
+        if (!this.llm.capabilities.audioOutput && !this.tts && this.agentSession.output.audio) {
+          this.logger.error(
+            "audio output is enabled but RealtimeModel has no audio modality and no TTS is set. Either enable audio modality in the RealtimeModel or set a TTS model."
+          );
+        }
+      } else if (this.llm instanceof LLM) {
+        try {
+          updateInstructions({
+            chatCtx: this.agent._chatCtx,
+            instructions: this.agent.instructions,
+            addIfMissing: true
+          });
+        } catch (error) {
+          this.logger.error("failed to update the instructions", error);
+        }
+      }
+      if (this.llm instanceof LLM) {
+        this.llm.on("metrics_collected", (ev) => this.onMetricsCollected(ev));
+        this.llm.on("error", (ev) => this.onError(ev));
+      }
+      if (this.stt instanceof STT) {
+        this.stt.on("metrics_collected", (ev) => this.onMetricsCollected(ev));
+        this.stt.on("error", (ev) => this.onError(ev));
+      }
+      if (this.tts instanceof TTS) {
+        this.tts.on("metrics_collected", (ev) => this.onMetricsCollected(ev));
+        this.tts.on("error", (ev) => this.onError(ev));
+      }
+      if (this.vad instanceof VAD) {
+        this.vad.on("metrics_collected", (ev) => this.onMetricsCollected(ev));
+      }
+      this.audioRecognition = new AudioRecognition({
+        recognitionHooks: this,
+        // Disable stt node if stt is not provided
+        stt: this.stt ? (...args) => this.agent.sttNode(...args) : void 0,
+        vad: this.vad,
+        interruptionDetector: this.agentSession.interruptionDetector,
+        turnDetector: typeof this.turnDetection === "string" ? void 0 : this.turnDetection,
+        turnDetectionMode: this.turnDetectionMode,
+        minEndpointingDelay: this.agentSession.options.minEndpointingDelay,
+        maxEndpointingDelay: this.agentSession.options.maxEndpointingDelay,
+        rootSpanContext: this.agentSession.rootSpanContext
+      });
+      this.audioRecognition.start();
+      this.started = true;
+      this._mainTask = Task.from(({ signal }) => this.mainTask(signal));
+      const onEnterTask = tracer.startActiveSpan(async () => this.agent.onEnter(), {
+        name: "on_enter",
+        context: trace.setSpan(ROOT_CONTEXT, startSpan),
+        attributes: { [traceTypes.ATTR_AGENT_LABEL]: this.agent.id }
+      });
+      this.createSpeechTask({
+        task: Task.from(() => onEnterTask),
+        name: "AgentActivity_onEnter"
+      });
+      startSpan.end();
+    } finally {
+      unlock();
+    }
+  }
+  get currentSpeech() {
+    return this._currentSpeech;
+  }
+  get vad() {
+    return this.agent.vad || this.agentSession.vad;
+  }
+  get stt() {
+    return this.agent.stt || this.agentSession.stt;
+  }
+  get llm() {
+    return this.agent.llm || this.agentSession.llm;
+  }
+  get tts() {
+    return this.agent.tts || this.agentSession.tts;
+  }
+  get tools() {
+    return this.agent.toolCtx;
+  }
+  get draining() {
+    return this._draining;
+  }
+  get realtimeLLMSession() {
+    return this.realtimeSession;
+  }
+  get allowInterruptions() {
+    return this.agentSession.options.allowInterruptions;
+  }
+  get turnDetection() {
+    return this.agentSession.turnDetection;
+  }
+  get toolCtx() {
+    return this.agent.toolCtx;
+  }
+  async updateChatCtx(chatCtx) {
+    chatCtx = chatCtx.copy({ toolCtx: this.toolCtx });
+    this.agent._chatCtx = chatCtx;
+    if (this.realtimeSession) {
+      removeInstructions(chatCtx);
+      this.realtimeSession.updateChatCtx(chatCtx);
+    } else {
+      updateInstructions({
+        chatCtx,
+        instructions: this.agent.instructions,
+        addIfMissing: true
+      });
+    }
+  }
+  updateOptions({ toolChoice }) {
+    if (toolChoice !== void 0) {
+      this.toolChoice = toolChoice;
+    }
+    if (this.realtimeSession) {
+      this.realtimeSession.updateOptions({ toolChoice: this.toolChoice });
+    }
+  }
+  attachAudioInput(audioStream) { // Sets `audioStream` as the activity's audio source and hands one tee branch to each consumer.
+    if (this.audioStream.isSourceSet) {
+      this.logger.debug("detaching existing audio input in agent activity");
+      this.audioStream.detachSource(); // drop the previous source before attaching the new one
+    }
+    this.audioStream.setSource(audioStream);
+    const [realtimeAudioStream, recognitionAudioStream] = this.audioStream.stream.tee(); // one branch per consumer
+    if (this.realtimeSession) {
+      this.realtimeSession.setInputAudioStream(realtimeAudioStream);
+    } // NOTE(review): without a realtime session this tee branch is never read — confirm it cannot buffer audio unboundedly
+    if (this.audioRecognition) {
+      this.audioRecognition.setInputAudioStream(recognitionAudioStream);
+    }
+  }
+  detachAudioInput() { // Detaches whatever source is currently set on the activity's deferred audio stream.
+    this.audioStream.detachSource();
+  }
+  commitUserTurn() {
+    if (!this.audioRecognition) {
+      throw new Error("AudioRecognition is not initialized");
+    }
+    const audioDetached = false;
+    this.audioRecognition.commitUserTurn(audioDetached);
+  }
+  clearUserTurn() {
+    var _a, _b;
+    (_a = this.audioRecognition) == null ? void 0 : _a.clearUserTurn();
+    (_b = this.realtimeSession) == null ? void 0 : _b.clearAudio();
+  }
+  say(text, options) {
+    const {
+      audio,
+      allowInterruptions: defaultAllowInterruptions,
+      addToChatCtx = true
+    } = options ?? {};
+    let allowInterruptions = defaultAllowInterruptions;
+    if (!audio && !this.tts && this.agentSession.output.audio && this.agentSession.output.audioEnabled) {
+      throw new Error("trying to generate speech from text without a TTS model");
+    }
+    if (this.llm instanceof RealtimeModel && this.llm.capabilities.turnDetection && allowInterruptions === false) {
+      this.logger.warn(
+        "the RealtimeModel uses a server-side turn detection, allowInterruptions cannot be false when using VoiceAgent.say(), disable turnDetection in the RealtimeModel and use VAD on the AgentTask/VoiceAgent instead"
+      );
+      allowInterruptions = true;
+    }
+    const handle = SpeechHandle.create({
+      allowInterruptions: allowInterruptions ?? this.allowInterruptions
+    });
+    this.agentSession.emit(
+      AgentSessionEventTypes.SpeechCreated,
+      createSpeechCreatedEvent({
+        userInitiated: true,
+        source: "say",
+        speechHandle: handle
+      })
+    );
+    const task = this.createSpeechTask({
+      task: Task.from(
+        (abortController) => this.ttsTask(handle, text, addToChatCtx, {}, abortController, audio)
+      ),
+      ownedSpeechHandle: handle,
+      name: "AgentActivity.say_tts"
+    });
+    task.finally(() => this.onPipelineReplyDone());
+    this.scheduleSpeech(handle, SpeechHandle.SPEECH_PRIORITY_NORMAL);
+    return handle;
+  }
+  // -- Metrics and errors --
+  onMetricsCollected = (ev) => {
+    const speechHandle = speechHandleStorage.getStore();
+    if (speechHandle && (ev.type === "llm_metrics" || ev.type === "tts_metrics")) {
+      ev.speechId = speechHandle.id;
+    }
+    if (ev.type === "realtime_model_metrics" && this.realtimeSpans) {
+      const span = this.realtimeSpans.get(ev.requestId);
+      if (span) {
+        recordRealtimeMetrics(span, ev);
+        this.realtimeSpans.delete(ev.requestId);
+      }
+    }
+    this.agentSession.emit(
+      AgentSessionEventTypes.MetricsCollected,
+      createMetricsCollectedEvent({ metrics: ev })
+    );
+  };
+  onError(ev) {
+    if (ev.type === "realtime_model_error") {
+      const errorEvent = createErrorEvent(ev.error, this.llm);
+      this.agentSession.emit(AgentSessionEventTypes.Error, errorEvent);
+    } else if (ev.type === "stt_error") {
+      const errorEvent = createErrorEvent(ev.error, this.stt);
+      this.agentSession.emit(AgentSessionEventTypes.Error, errorEvent);
+    } else if (ev.type === "tts_error") {
+      const errorEvent = createErrorEvent(ev.error, this.tts);
+      this.agentSession.emit(AgentSessionEventTypes.Error, errorEvent);
+    } else if (ev.type === "llm_error") {
+      const errorEvent = createErrorEvent(ev.error, this.llm);
+      this.agentSession.emit(AgentSessionEventTypes.Error, errorEvent);
+    }
+    this.agentSession._onError(ev);
+  }
+  // -- Realtime Session events --
+  onInputSpeechStarted(_ev) {
+    this.logger.info("onInputSpeechStarted");
+    if (!this.vad) {
+      this.agentSession._updateUserState("speaking");
+    }
+    try {
+      this.interrupt();
+    } catch (error) {
+      this.logger.error(
+        "RealtimeAPI input_speech_started, but current speech is not interruptable, this should never happen!",
+        error
+      );
+    }
+  }
+  onInputSpeechStopped(ev) {
+    this.logger.info(ev, "onInputSpeechStopped");
+    if (!this.vad) {
+      this.agentSession._updateUserState("listening");
+    }
+    if (ev.userTranscriptionEnabled) {
+      this.agentSession.emit(
+        AgentSessionEventTypes.UserInputTranscribed,
+        createUserInputTranscribedEvent({
+          isFinal: false,
+          transcript: ""
+        })
+      );
+    }
+  }
+  onInputAudioTranscriptionCompleted(ev) {
+    this.agentSession.emit(
+      AgentSessionEventTypes.UserInputTranscribed,
+      createUserInputTranscribedEvent({
+        transcript: ev.transcript,
+        isFinal: ev.isFinal
+      })
+    );
+    if (ev.isFinal) {
+      const message = ChatMessage.create({
+        role: "user",
+        content: ev.transcript,
+        id: ev.itemId
+      });
+      this.agent._chatCtx.items.push(message);
+      this.agentSession._conversationItemAdded(message);
+    }
+  }
+  onGenerationCreated(ev) {
+    if (ev.userInitiated) {
+      return;
+    }
+    if (this.draining) {
+      this.logger.warn("skipping new realtime generation, the agent is draining");
+      return;
+    }
+    const handle = SpeechHandle.create({
+      allowInterruptions: this.allowInterruptions
+    });
+    this.agentSession.emit(
+      AgentSessionEventTypes.SpeechCreated,
+      createSpeechCreatedEvent({
+        userInitiated: false,
+        source: "generate_reply",
+        speechHandle: handle
+      })
+    );
+    this.logger.info({ speech_id: handle.id }, "Creating speech handle");
+    this.createSpeechTask({
+      task: Task.from(
+        (abortController) => this.realtimeGenerationTask(handle, ev, {}, abortController)
+      ),
+      ownedSpeechHandle: handle,
+      name: "AgentActivity.realtimeGeneration"
+    });
+    this.scheduleSpeech(handle, SpeechHandle.SPEECH_PRIORITY_NORMAL);
+  }
+  // recognition hooks
+  onStartOfSpeech(_ev) { // Recognition hook: marks the user as speaking on the session; the event itself is unused.
+    this.agentSession._updateUserState("speaking");
+  }
+  onEndOfSpeech(ev) {
+    let speechEndTime = Date.now();
+    if (ev) {
+      speechEndTime = speechEndTime - ev.silenceDuration;
+    }
+    this.agentSession._updateUserState("listening", speechEndTime);
+  }
+  onVADInferenceDone(ev) {
+    var _a, _b;
+    if (this.turnDetection === "manual" || this.turnDetection === "realtime_llm") {
+      return;
+    }
+    if (this.llm instanceof RealtimeModel && this.llm.capabilities.turnDetection) {
+      return;
+    }
+    if (ev.speechDuration < this.agentSession.options.minInterruptionDuration) {
+      return;
+    }
+    if (this.stt && this.agentSession.options.minInterruptionWords > 0 && this.audioRecognition) {
+      const text = this.audioRecognition.currentTranscript;
+      const normalizedText = text ?? "";
+      const wordCount = splitWords(normalizedText, true).length;
+      if (wordCount < this.agentSession.options.minInterruptionWords) {
+        return;
+      }
+    }
+    (_a = this.realtimeSession) == null ? void 0 : _a.startUserActivity();
+    if (this._currentSpeech && !this._currentSpeech.interrupted && this._currentSpeech.allowInterruptions) {
+      this.logger.info({ "speech id": this._currentSpeech.id }, "speech interrupted by VAD");
+      (_b = this.realtimeSession) == null ? void 0 : _b.interrupt();
+      this._currentSpeech.interrupt();
+    }
+  }
+  onInterruption(ev) {
+    var _a, _b;
+    if (ev.type !== InterruptionEventType.INTERRUPTION) {
+      return;
+    }
+    this.logger.info(
+      {
+        probability: ev.probability,
+        detectionDelay: ev.detectionDelay,
+        totalDuration: ev.totalDuration
+      },
+      "adaptive interruption detected"
+    );
+    if (this.turnDetection === "manual" || this.turnDetection === "realtime_llm") {
+      return;
+    }
+    if (this.llm instanceof RealtimeModel && this.llm.capabilities.turnDetection) {
+      return;
+    }
+    (_a = this.realtimeSession) == null ? void 0 : _a.startUserActivity();
+    if (this._currentSpeech && !this._currentSpeech.interrupted && this._currentSpeech.allowInterruptions) {
+      this.logger.info(
+        { "speech id": this._currentSpeech.id },
+        "speech interrupted by adaptive interruption detector"
+      );
+      (_b = this.realtimeSession) == null ? void 0 : _b.interrupt();
+      this._currentSpeech.interrupt();
+    }
+  }
+  onInterimTranscript(ev) {
+    if (this.llm instanceof RealtimeModel && this.llm.capabilities.userTranscription) {
+      return;
+    }
+    this.agentSession.emit(
+      AgentSessionEventTypes.UserInputTranscribed,
+      createUserInputTranscribedEvent({
+        transcript: ev.alternatives[0].text,
+        isFinal: false,
+        language: ev.alternatives[0].language
+        // TODO(AJS-106): add multi participant support
+      })
+    );
+  }
+  onFinalTranscript(ev) {
+    if (this.llm instanceof RealtimeModel && this.llm.capabilities.userTranscription) {
+      return;
+    }
+    this.agentSession.emit(
+      AgentSessionEventTypes.UserInputTranscribed,
+      createUserInputTranscribedEvent({
+        transcript: ev.alternatives[0].text,
+        isFinal: true,
+        language: ev.alternatives[0].language
+        // TODO(AJS-106): add multi participant support
+      })
+    );
+  }
+  onPreemptiveGeneration(info) {
+    if (!this.agentSession.options.preemptiveGeneration || this.draining || this._currentSpeech !== void 0 && !this._currentSpeech.interrupted || !(this.llm instanceof LLM)) {
+      return;
+    }
+    this.cancelPreemptiveGeneration();
+    this.logger.info(
+      {
+        newTranscript: info.newTranscript,
+        transcriptConfidence: info.transcriptConfidence
+      },
+      "starting preemptive generation"
+    );
+    const userMessage = ChatMessage.create({
+      role: "user",
+      content: info.newTranscript
+    });
+    const chatCtx = this.agent.chatCtx.copy();
+    const speechHandle = this.generateReply({
+      userMessage,
+      chatCtx,
+      scheduleSpeech: false
+    });
+    this._preemptiveGeneration = {
+      speechHandle,
+      userMessage,
+      info,
+      chatCtx: chatCtx.copy(),
+      tools: { ...this.tools },
+      toolChoice: this.toolChoice,
+      createdAt: Date.now()
+    };
+  }
+  cancelPreemptiveGeneration() {
+    if (this._preemptiveGeneration !== void 0) {
+      this._preemptiveGeneration.speechHandle._cancel();
+      this._preemptiveGeneration = void 0;
+    }
+  }
+  createSpeechTask(options) {
+    const { task, ownedSpeechHandle } = options;
+    this.speechTasks.add(task);
+    task.addDoneCallback(() => {
+      this.speechTasks.delete(task);
+    });
+    if (ownedSpeechHandle) {
+      ownedSpeechHandle._tasks.push(task);
+      task.addDoneCallback(() => {
+        if (ownedSpeechHandle._tasks.every((t) => t.done)) {
+          ownedSpeechHandle._markDone();
+        }
+      });
+    }
+    task.addDoneCallback(() => {
+      this.wakeupMainTask();
+    });
+    return task.result;
+  }
+  async onEndOfTurn(info) {
+    if (this.draining) {
+      this.cancelPreemptiveGeneration();
+      this.logger.warn({ user_input: info.newTranscript }, "skipping user input, task is draining");
+      return true;
+    }
+    if (this.stt && this.turnDetection !== "manual" && this._currentSpeech && this._currentSpeech.allowInterruptions && !this._currentSpeech.interrupted && this.agentSession.options.minInterruptionWords > 0) {
+      const wordCount = splitWords(info.newTranscript, true).length;
+      if (wordCount < this.agentSession.options.minInterruptionWords) {
+        this.cancelPreemptiveGeneration();
+        this.logger.info(
+          {
+            wordCount,
+            minInterruptionWords: this.agentSession.options.minInterruptionWords
+          },
+          "skipping user input, word count below minimum interruption threshold"
+        );
+        return false;
+      }
+    }
+    const oldTask = this._userTurnCompletedTask;
+    this._userTurnCompletedTask = this.createSpeechTask({
+      task: Task.from(() => this.userTurnCompleted(info, oldTask)),
+      name: "AgentActivity.userTurnCompleted"
+    });
+    return true;
+  }
+  retrieveChatCtx() {
+    return this.agentSession.chatCtx;
+  }
+  async mainTask(signal) {
+    const abortFuture = new Future();
+    const abortHandler = () => {
+      abortFuture.resolve();
+      signal.removeEventListener("abort", abortHandler);
+    };
+    signal.addEventListener("abort", abortHandler);
+    while (true) {
+      await Promise.race([this.q_updated.await, abortFuture.await]);
+      if (signal.aborted) break;
+      while (this.speechQueue.size() > 0) {
+        if (signal.aborted) break;
+        const heapItem = this.speechQueue.pop();
+        if (!heapItem) {
+          throw new Error("Speech queue is empty");
+        }
+        const speechHandle = heapItem[2];
+        this._currentSpeech = speechHandle;
+        speechHandle._authorizeGeneration();
+        await speechHandle._waitForGeneration();
+        this._currentSpeech = void 0;
+      }
+      if (this.draining && this.speechTasks.size === 0) {
+        this.logger.info("mainTask: draining and no more speech tasks");
+        break;
+      }
+      this.q_updated = new Future();
+    }
+    this.logger.info("AgentActivity mainTask: exiting");
+  }
+  wakeupMainTask() {
+    this.q_updated.resolve();
+  }
+  generateReply(options) {
+    var _a;
+    const {
+      userMessage,
+      chatCtx,
+      instructions: defaultInstructions,
+      toolChoice: defaultToolChoice,
+      allowInterruptions: defaultAllowInterruptions,
+      scheduleSpeech = true
+    } = options;
+    let instructions = defaultInstructions;
+    let toolChoice = defaultToolChoice;
+    let allowInterruptions = defaultAllowInterruptions;
+    if (this.llm instanceof RealtimeModel && this.llm.capabilities.turnDetection && allowInterruptions === false) {
+      this.logger.warn(
+        "the RealtimeModel uses a server-side turn detection, allowInterruptions cannot be false when using VoiceAgent.generateReply(), disable turnDetection in the RealtimeModel and use VAD on the AgentTask/VoiceAgent instead"
+      );
+      allowInterruptions = true;
+    }
+    if (this.llm === void 0) {
+      throw new Error("trying to generate reply without an LLM model");
+    }
+    const functionCall = (_a = asyncLocalStorage.getStore()) == null ? void 0 : _a.functionCall;
+    if (toolChoice === void 0 && functionCall !== void 0) {
+      toolChoice = "none";
+    }
+    const handle = SpeechHandle.create({
+      allowInterruptions: allowInterruptions ?? this.allowInterruptions
+    });
+    this.agentSession.emit(
+      AgentSessionEventTypes.SpeechCreated,
+      createSpeechCreatedEvent({
+        userInitiated: true,
+        source: "generate_reply",
+        speechHandle: handle
+      })
+    );
+    this.logger.info({ speech_id: handle.id }, "Creating speech handle");
+    if (this.llm instanceof RealtimeModel) {
+      this.createSpeechTask({
+        task: Task.from(
+          (abortController) => this.realtimeReplyTask({
+            speechHandle: handle,
+            // TODO(brian): support llm.ChatMessage for the realtime model
+            userInput: userMessage == null ? void 0 : userMessage.textContent,
+            instructions,
+            modelSettings: {
+              // isGiven(toolChoice) = toolChoice !== undefined
+              toolChoice: toOaiToolChoice(toolChoice !== void 0 ? toolChoice : this.toolChoice)
+            },
+            abortController
+          })
+        ),
+        ownedSpeechHandle: handle,
+        name: "AgentActivity.realtimeReply"
+      });
+    } else if (this.llm instanceof LLM) {
+      if (instructions) {
+        instructions = `${this.agent.instructions}
+${instructions}`;
+      }
+      const task = this.createSpeechTask({
+        task: Task.from(
+          (abortController) => this.pipelineReplyTask(
+            handle,
+            chatCtx ?? this.agent.chatCtx,
+            this.agent.toolCtx,
+            {
+              toolChoice: toOaiToolChoice(toolChoice !== void 0 ? toolChoice : this.toolChoice)
+            },
+            abortController,
+            instructions ? `${this.agent.instructions}
+${instructions}` : instructions,
+            userMessage
+          )
+        ),
+        ownedSpeechHandle: handle,
+        name: "AgentActivity.pipelineReply"
+      });
+      task.finally(() => this.onPipelineReplyDone());
+    }
+    if (scheduleSpeech) {
+      this.scheduleSpeech(handle, SpeechHandle.SPEECH_PRIORITY_NORMAL);
+    }
+    return handle;
+  }
+  interrupt() {
+    var _a;
+    const future = new Future();
+    const currentSpeech = this._currentSpeech;
+    currentSpeech == null ? void 0 : currentSpeech.interrupt();
+    for (const [_, __, speech] of this.speechQueue) {
+      speech.interrupt();
+    }
+    (_a = this.realtimeSession) == null ? void 0 : _a.interrupt();
+    if (currentSpeech === void 0) {
+      future.resolve();
+    } else {
+      currentSpeech.addDoneCallback(() => {
+        if (future.done) return;
+        future.resolve();
+      });
+    }
+    return future;
+  }
+  onPipelineReplyDone() {
+    if (!this.speechQueue.peek() && (!this._currentSpeech || this._currentSpeech.done())) {
+      this.agentSession._updateAgentState("listening");
+    }
+  }
+  async userTurnCompleted(info, oldTask) {
+    var _a, _b;
+    if (oldTask) {
+      await oldTask;
+    }
+    if (this.llm instanceof RealtimeModel) {
+      if (this.llm.capabilities.turnDetection) {
+        return;
+      }
+      (_a = this.realtimeSession) == null ? void 0 : _a.commitAudio();
+    }
+    if (this._currentSpeech) {
+      if (!this._currentSpeech.allowInterruptions) {
+        this.logger.warn(
+          { user_input: info.newTranscript },
+          "skipping user input, current speech generation cannot be interrupted"
+        );
+        return;
+      }
+      this.logger.info(
+        { "speech id": this._currentSpeech.id },
+        "speech interrupted, new user turn detected"
+      );
+      this._currentSpeech.interrupt();
+      (_b = this.realtimeSession) == null ? void 0 : _b.interrupt();
+    }
+    let userMessage = ChatMessage.create({
+      role: "user",
+      content: info.newTranscript
+    });
+    const chatCtx = this.agent.chatCtx.copy();
+    const startTime = Date.now();
+    try {
+      await this.agent.onUserTurnCompleted(chatCtx, userMessage);
+    } catch (e) {
+      if (e instanceof StopResponse) {
+        return;
+      }
+      this.logger.error({ error: e }, "error occurred during onUserTurnCompleted");
+    }
+    const callbackDuration = Date.now() - startTime;
+    if (this.llm instanceof RealtimeModel) {
+      userMessage = void 0;
+    } else if (this.llm === void 0) {
+      return;
+    }
+    let speechHandle;
+    if (this._preemptiveGeneration !== void 0) {
+      const preemptive = this._preemptiveGeneration;
+      if (preemptive.info.newTranscript === (userMessage == null ? void 0 : userMessage.textContent) && preemptive.chatCtx.isEquivalent(chatCtx) && isSameToolContext(preemptive.tools, this.tools) && isSameToolChoice(preemptive.toolChoice, this.toolChoice)) {
+        speechHandle = preemptive.speechHandle;
+        this.scheduleSpeech(speechHandle, SpeechHandle.SPEECH_PRIORITY_NORMAL);
+        this.logger.debug(
+          {
+            preemptiveLeadTime: Date.now() - preemptive.createdAt
+          },
+          "using preemptive generation"
+        );
+      } else {
+        this.logger.warn(
+          "preemptive generation enabled but chat context or tools have changed after `onUserTurnCompleted`"
+        );
+        preemptive.speechHandle._cancel();
+      }
+      this._preemptiveGeneration = void 0;
+    }
+    if (speechHandle === void 0) {
+      speechHandle = this.generateReply({ userMessage, chatCtx });
+    }
+    const eouMetrics = {
+      type: "eou_metrics",
+      timestamp: Date.now(),
+      endOfUtteranceDelayMs: info.endOfUtteranceDelay,
+      transcriptionDelayMs: info.transcriptionDelay,
+      onUserTurnCompletedDelayMs: callbackDuration,
+      lastSpeakingTimeMs: info.stoppedSpeakingAt ?? 0,
+      speechId: speechHandle.id
+    };
+    this.agentSession.emit(
+      AgentSessionEventTypes.MetricsCollected,
+      createMetricsCollectedEvent({ metrics: eouMetrics })
+    );
+  }
+  async ttsTask(speechHandle, text, addToChatCtx, modelSettings, replyAbortController, audio) {
+    speechHandleStorage.enterWith(speechHandle);
+    const transcriptionOutput = this.agentSession.output.transcriptionEnabled ? this.agentSession.output.transcription : null;
+    const audioOutput = this.agentSession.output.audioEnabled ? this.agentSession.output.audio : null;
+    await speechHandle.waitIfNotInterrupted([speechHandle._waitForAuthorization()]);
+    if (speechHandle.interrupted) {
+      return;
+    }
+    let baseStream;
+    if (text instanceof ReadableStream) {
+      baseStream = text;
+    } else {
+      baseStream = new ReadableStream({
+        start(controller) {
+          controller.enqueue(text);
+          controller.close();
+        }
+      });
+    }
+    const [textSource, audioSource] = baseStream.tee();
+    const tasks = [];
+    const trNode = await this.agent.transcriptionNode(textSource, {});
+    let textOut = null;
+    if (trNode) {
+      const [textForwardTask, _textOut] = performTextForwarding(
+        trNode,
+        replyAbortController,
+        transcriptionOutput
+      );
+      textOut = _textOut;
+      tasks.push(textForwardTask);
+    }
+    const onFirstFrame = () => {
+      this.agentSession._updateAgentState("speaking");
+    };
+    if (!audioOutput) {
+      if (textOut) {
+        textOut.firstTextFut.await.finally(onFirstFrame);
+      }
+    } else {
+      let audioOut = null;
+      if (!audio) {
+        const [ttsTask, ttsStream] = performTTSInference(
+          (...args) => this.agent.ttsNode(...args),
+          audioSource,
+          modelSettings,
+          replyAbortController
+        );
+        tasks.push(ttsTask);
+        const [forwardTask, _audioOut] = performAudioForwarding(
+          ttsStream,
+          audioOutput,
+          replyAbortController
+        );
+        tasks.push(forwardTask);
+        audioOut = _audioOut;
+      } else {
+        const [forwardTask, _audioOut] = performAudioForwarding(
+          audio,
+          audioOutput,
+          replyAbortController
+        );
+        tasks.push(forwardTask);
+        audioOut = _audioOut;
+      }
+      audioOut.firstFrameFut.await.finally(onFirstFrame);
+    }
+    await speechHandle.waitIfNotInterrupted(tasks.map((task) => task.result));
+    if (audioOutput) {
+      await speechHandle.waitIfNotInterrupted([audioOutput.waitForPlayout()]);
+    }
+    if (speechHandle.interrupted) {
+      replyAbortController.abort();
+      await cancelAndWait(tasks, AgentActivity.REPLY_TASK_CANCEL_TIMEOUT);
+      if (audioOutput) {
+        audioOutput.clearBuffer();
+        await audioOutput.waitForPlayout();
+      }
+    }
+    if (addToChatCtx) {
+      const message = ChatMessage.create({
+        role: "assistant",
+        content: (textOut == null ? void 0 : textOut.text) || "",
+        interrupted: speechHandle.interrupted
+      });
+      this.agent._chatCtx.insert(message);
+      this.agentSession._conversationItemAdded(message);
+    }
+    if (this.agentSession.agentState === "speaking") {
+      this.agentSession._updateAgentState("listening");
+    }
+  }
+  _pipelineReplyTaskImpl = async ({
+    speechHandle,
+    chatCtx,
+    toolCtx,
+    modelSettings,
+    replyAbortController,
+    instructions,
+    newMessage,
+    toolsMessages,
+    span
+  }) => {
+    var _a, _b, _c;
+    span.setAttribute(traceTypes.ATTR_SPEECH_ID, speechHandle.id);
+    if (instructions) {
+      span.setAttribute(traceTypes.ATTR_INSTRUCTIONS, instructions);
+    }
+    if (newMessage) {
+      span.setAttribute(traceTypes.ATTR_USER_INPUT, newMessage.textContent || "");
+    }
+    speechHandleStorage.enterWith(speechHandle);
+    const audioOutput = this.agentSession.output.audioEnabled ? this.agentSession.output.audio : null;
+    const transcriptionOutput = this.agentSession.output.transcriptionEnabled ? this.agentSession.output.transcription : null;
+    chatCtx = chatCtx.copy();
+    if (newMessage) {
+      chatCtx.insert(newMessage);
+    }
+    if (instructions) {
+      try {
+        updateInstructions({
+          chatCtx,
+          instructions,
+          addIfMissing: true
+        });
+      } catch (e) {
+        this.logger.error({ error: e }, "error occurred during updateInstructions");
+      }
+    }
+    const tasks = [];
+    const [llmTask, llmGenData] = performLLMInference(
+      // preserve  `this` context in llmNode
+      (...args) => this.agent.llmNode(...args),
+      chatCtx,
+      toolCtx,
+      modelSettings,
+      replyAbortController
+    );
+    tasks.push(llmTask);
+    const [ttsTextInput, llmOutput] = llmGenData.textStream.tee();
+    let ttsTask = null;
+    let ttsStream = null;
+    if (audioOutput) {
+      [ttsTask, ttsStream] = performTTSInference(
+        (...args) => this.agent.ttsNode(...args),
+        ttsTextInput,
+        modelSettings,
+        replyAbortController
+      );
+      tasks.push(ttsTask);
+    }
+    await speechHandle.waitIfNotInterrupted([speechHandle._waitForScheduled()]);
+    if (newMessage && speechHandle.scheduled) {
+      this.agent._chatCtx.insert(newMessage);
+      this.agentSession._conversationItemAdded(newMessage);
+    }
+    if (speechHandle.interrupted) {
+      replyAbortController.abort();
+      await cancelAndWait(tasks, AgentActivity.REPLY_TASK_CANCEL_TIMEOUT);
+      return;
+    }
+    this.agentSession._updateAgentState("thinking");
+    await speechHandle.waitIfNotInterrupted([speechHandle._waitForAuthorization()]);
+    speechHandle._clearAuthorization();
+    const replyStartedAt = Date.now();
+    const trNodeResult = await this.agent.transcriptionNode(llmOutput, modelSettings);
+    let textOut = null;
+    if (trNodeResult) {
+      const [textForwardTask, _textOut] = performTextForwarding(
+        trNodeResult,
+        replyAbortController,
+        transcriptionOutput
+      );
+      tasks.push(textForwardTask);
+      textOut = _textOut;
+    }
+    const onFirstFrame = () => {
+      this.agentSession._updateAgentState("speaking");
+    };
+    let audioOut = null;
+    if (audioOutput) {
+      if (ttsStream) {
+        const [forwardTask, _audioOut] = performAudioForwarding(
+          ttsStream,
+          audioOutput,
+          replyAbortController
+        );
+        audioOut = _audioOut;
+        tasks.push(forwardTask);
+        audioOut.firstFrameFut.await.finally(onFirstFrame);
+      } else {
+        throw Error("ttsStream is null when audioOutput is enabled");
+      }
+    } else {
+      textOut == null ? void 0 : textOut.firstTextFut.await.finally(onFirstFrame);
+    }
+    const onToolExecutionStarted = (_) => {
+    };
+    const onToolExecutionCompleted = (_) => {
+    };
+    const [executeToolsTask, toolOutput] = performToolExecutions({
+      session: this.agentSession,
+      speechHandle,
+      toolCtx,
+      toolChoice: modelSettings.toolChoice,
+      toolCallStream: llmGenData.toolCallStream,
+      controller: replyAbortController,
+      onToolExecutionStarted,
+      onToolExecutionCompleted
+    });
+    await speechHandle.waitIfNotInterrupted(tasks.map((task) => task.result));
+    if (audioOutput) {
+      await speechHandle.waitIfNotInterrupted([audioOutput.waitForPlayout()]);
+    }
+    if (toolsMessages) {
+      for (const msg of toolsMessages) {
+        msg.createdAt = replyStartedAt;
+      }
+      this.agent._chatCtx.insert(toolsMessages);
+      this.agentSession._toolItemsAdded(toolsMessages);
+    }
+    if (speechHandle.interrupted) {
+      this.logger.debug(
+        { speech_id: speechHandle.id },
+        "Aborting all pipeline reply tasks due to interruption"
+      );
+      if (audioOutput) {
+        audioOutput.clearBuffer();
+      }
+      replyAbortController.abort();
+      await Promise.allSettled(
+        tasks.map((task) => task.cancelAndWait(AgentActivity.REPLY_TASK_CANCEL_TIMEOUT))
+      );
+      let forwardedText = (textOut == null ? void 0 : textOut.text) || "";
+      if (audioOutput) {
+        const playbackEv = await audioOutput.waitForPlayout();
+        if (audioOut == null ? void 0 : audioOut.firstFrameFut.done) {
+          this.logger.info(
+            { speech_id: speechHandle.id, playbackPosition: playbackEv.playbackPosition },
+            "playout interrupted"
+          );
+          if (playbackEv.synchronizedTranscript) {
+            forwardedText = playbackEv.synchronizedTranscript;
+          }
+        } else {
+          forwardedText = "";
+        }
+      }
+      if (forwardedText) {
+        const message = ChatMessage.create({
+          role: "assistant",
+          content: forwardedText,
+          id: llmGenData.id,
+          interrupted: true,
+          createdAt: replyStartedAt
+        });
+        chatCtx.insert(message);
+        this.agent._chatCtx.insert(message);
+        this.agentSession._conversationItemAdded(message);
+      }
+      if (this.agentSession.agentState === "speaking") {
+        this.agentSession._updateAgentState("listening");
+      }
+      this.logger.info(
+        { speech_id: speechHandle.id, message: forwardedText },
+        "playout completed with interrupt"
+      );
+      speechHandle._markGenerationDone();
+      await executeToolsTask.cancelAndWait(AgentActivity.REPLY_TASK_CANCEL_TIMEOUT);
+      return;
+    }
+    if (textOut && textOut.text) {
+      const message = ChatMessage.create({
+        role: "assistant",
+        id: llmGenData.id,
+        interrupted: false,
+        createdAt: replyStartedAt,
+        content: textOut.text
+      });
+      chatCtx.insert(message);
+      this.agent._chatCtx.insert(message);
+      this.agentSession._conversationItemAdded(message);
+      this.logger.info(
+        { speech_id: speechHandle.id, message: textOut.text },
+        "playout completed without interruption"
+      );
+    }
+    if (toolOutput.output.length > 0) {
+      this.agentSession._updateAgentState("thinking");
+    } else if (this.agentSession.agentState === "speaking") {
+      this.agentSession._updateAgentState("listening");
+    }
+    speechHandle._markGenerationDone();
+    await executeToolsTask.result;
+    if (toolOutput.output.length === 0) return;
+    const { maxToolSteps } = this.agentSession.options;
+    if (speechHandle.numSteps >= maxToolSteps) {
+      this.logger.warn(
+        { speech_id: speechHandle.id, max_tool_steps: maxToolSteps },
+        "maximum number of function calls steps reached"
+      );
+      return;
+    }
+    const functionToolsExecutedEvent = createFunctionToolsExecutedEvent({
+      functionCalls: [],
+      functionCallOutputs: []
+    });
+    let shouldGenerateToolReply = false;
+    let newAgentTask = null;
+    let ignoreTaskSwitch = false;
+    for (const sanitizedOut of toolOutput.output) {
+      if (sanitizedOut.toolCallOutput !== void 0) {
+        functionToolsExecutedEvent.functionCalls.push(sanitizedOut.toolCall);
+        functionToolsExecutedEvent.functionCallOutputs.push(sanitizedOut.toolCallOutput);
+        if (sanitizedOut.replyRequired) {
+          shouldGenerateToolReply = true;
+        }
+      }
+      if (newAgentTask !== null && sanitizedOut.agentTask !== void 0) {
+        this.logger.error("expected to receive only one agent task from the tool executions");
+        ignoreTaskSwitch = true;
+      }
+      newAgentTask = sanitizedOut.agentTask ?? null;
+      this.logger.debug(
+        {
+          speechId: speechHandle.id,
+          name: (_a = sanitizedOut.toolCall) == null ? void 0 : _a.name,
+          args: sanitizedOut.toolCall.args,
+          output: (_b = sanitizedOut.toolCallOutput) == null ? void 0 : _b.output,
+          isError: (_c = sanitizedOut.toolCallOutput) == null ? void 0 : _c.isError
+        },
+        "Tool call execution finished"
+      );
+    }
+    this.agentSession.emit(
+      AgentSessionEventTypes.FunctionToolsExecuted,
+      functionToolsExecutedEvent
+    );
+    let draining = this.draining;
+    if (!ignoreTaskSwitch && newAgentTask !== null) {
+      this.agentSession.updateAgent(newAgentTask);
+      draining = true;
+    }
+    const toolMessages = [
+      ...functionToolsExecutedEvent.functionCalls,
+      ...functionToolsExecutedEvent.functionCallOutputs
+    ];
+    if (shouldGenerateToolReply) {
+      chatCtx.insert(toolMessages);
+      const handle = SpeechHandle.create({
+        allowInterruptions: speechHandle.allowInterruptions,
+        stepIndex: speechHandle._stepIndex + 1,
+        parent: speechHandle
+      });
+      this.agentSession.emit(
+        AgentSessionEventTypes.SpeechCreated,
+        createSpeechCreatedEvent({
+          userInitiated: false,
+          source: "tool_response",
+          speechHandle: handle
+        })
+      );
+      const respondToolChoice = draining || modelSettings.toolChoice === "none" ? "none" : "auto";
+      const toolResponseTask = this.createSpeechTask({
+        task: Task.from(
+          () => this.pipelineReplyTask(
+            handle,
+            chatCtx,
+            toolCtx,
+            { toolChoice: respondToolChoice },
+            replyAbortController,
+            instructions,
+            void 0,
+            toolMessages
+          )
+        ),
+        ownedSpeechHandle: handle,
+        name: "AgentActivity.pipelineReply"
+      });
+      toolResponseTask.finally(() => this.onPipelineReplyDone());
+      this.scheduleSpeech(handle, SpeechHandle.SPEECH_PRIORITY_NORMAL, true);
+    } else if (functionToolsExecutedEvent.functionCallOutputs.length > 0) {
+      for (const msg of toolMessages) {
+        msg.createdAt = replyStartedAt;
+      }
+      this.agent._chatCtx.insert(toolMessages);
+      this.agentSession._toolItemsAdded(toolMessages);
+    }
+  };
+  pipelineReplyTask = async (speechHandle, chatCtx, toolCtx, modelSettings, replyAbortController, instructions, newMessage, toolsMessages) => tracer.startActiveSpan(
+    async (span) => this._pipelineReplyTaskImpl({
+      speechHandle,
+      chatCtx,
+      toolCtx,
+      modelSettings,
+      replyAbortController,
+      instructions,
+      newMessage,
+      toolsMessages,
+      span
+    }),
+    {
+      name: "agent_turn",
+      context: this.agentSession.rootSpanContext
+    }
+  );
+  async realtimeGenerationTask(speechHandle, ev, modelSettings, replyAbortController) {
+    return tracer.startActiveSpan(
+      async (span) => this._realtimeGenerationTaskImpl({
+        speechHandle,
+        ev,
+        modelSettings,
+        replyAbortController,
+        span
+      }),
+      {
+        name: "agent_turn",
+        context: this.agentSession.rootSpanContext
+      }
+    );
+  }
+  async _realtimeGenerationTaskImpl({
+    speechHandle,
+    ev,
+    modelSettings,
+    replyAbortController,
+    span
+  }) {
+    var _a, _b, _c;
+    span.setAttribute(traceTypes.ATTR_SPEECH_ID, speechHandle.id);
+    speechHandleStorage.enterWith(speechHandle);
+    if (!this.realtimeSession) {
+      throw new Error("realtime session is not initialized");
+    }
+    if (!(this.llm instanceof RealtimeModel)) {
+      throw new Error("llm is not a realtime model");
+    }
+    span.setAttribute(traceTypes.ATTR_GEN_AI_REQUEST_MODEL, this.llm.model);
+    if (this.realtimeSpans && ev.responseId) {
+      this.realtimeSpans.set(ev.responseId, span);
+    }
+    this.logger.debug(
+      { speech_id: speechHandle.id, stepIndex: speechHandle.numSteps },
+      "realtime generation started"
+    );
+    const audioOutput = this.agentSession.output.audioEnabled ? this.agentSession.output.audio : null;
+    const textOutput = this.agentSession.output.transcriptionEnabled ? this.agentSession.output.transcription : null;
+    const toolCtx = this.realtimeSession.tools;
+    await speechHandle.waitIfNotInterrupted([speechHandle._waitForAuthorization()]);
+    speechHandle._clearAuthorization();
+    if (speechHandle.interrupted) {
+      return;
+    }
+    const onFirstFrame = () => {
+      this.agentSession._updateAgentState("speaking");
+    };
+    const readMessages = async (abortController, outputs) => {
+      replyAbortController.signal.addEventListener("abort", () => abortController.abort(), {
+        once: true
+      });
+      const forwardTasks = [];
+      try {
+        for await (const msg of ev.messageStream) {
+          if (forwardTasks.length > 0) {
+            this.logger.warn(
+              "expected to receive only one message generation from the realtime API"
+            );
+            break;
+          }
+          const msgModalities = msg.modalities ? await msg.modalities : void 0;
+          let ttsTextInput = null;
+          let trTextInput;
+          if (msgModalities && !msgModalities.includes("audio") && this.tts) {
+            if (this.llm instanceof RealtimeModel && this.llm.capabilities.audioOutput) {
+              this.logger.warn(
+                "text response received from realtime API, falling back to use a TTS model."
+              );
+            }
+            const [_ttsTextInput, _trTextInput] = msg.textStream.tee();
+            ttsTextInput = _ttsTextInput;
+            trTextInput = _trTextInput;
+          } else {
+            trTextInput = msg.textStream;
+          }
+          const trNodeResult = await this.agent.transcriptionNode(trTextInput, modelSettings);
+          let textOut = null;
+          if (trNodeResult) {
+            const [textForwardTask, _textOut] = performTextForwarding(
+              trNodeResult,
+              abortController,
+              textOutput
+            );
+            forwardTasks.push(textForwardTask);
+            textOut = _textOut;
+          }
+          let audioOut = null;
+          if (audioOutput) {
+            let realtimeAudioResult = null;
+            if (ttsTextInput) {
+              const [ttsTask, ttsStream] = performTTSInference(
+                (...args) => this.agent.ttsNode(...args),
+                ttsTextInput,
+                modelSettings,
+                abortController
+              );
+              tasks.push(ttsTask);
+              realtimeAudioResult = ttsStream;
+            } else if (msgModalities && msgModalities.includes("audio")) {
+              realtimeAudioResult = await this.agent.realtimeAudioOutputNode(
+                msg.audioStream,
+                modelSettings
+              );
+            } else if (this.llm instanceof RealtimeModel && this.llm.capabilities.audioOutput) {
+              this.logger.error(
+                "Text message received from Realtime API with audio modality. This usually happens when text chat context is synced to the API. Try to add a TTS model as fallback or use text modality with TTS instead."
+              );
+            } else {
+              this.logger.warn(
+                "audio output is enabled but neither tts nor realtime audio is available"
+              );
+            }
+            if (realtimeAudioResult) {
+              const [forwardTask, _audioOut] = performAudioForwarding(
+                realtimeAudioResult,
+                audioOutput,
+                abortController
+              );
+              forwardTasks.push(forwardTask);
+              audioOut = _audioOut;
+              audioOut.firstFrameFut.await.finally(onFirstFrame);
+            }
+          } else if (textOut) {
+            textOut.firstTextFut.await.finally(onFirstFrame);
+          }
+          outputs.push([msg.messageId, textOut, audioOut, msgModalities]);
+        }
+        await waitFor(forwardTasks);
+      } catch (error) {
+        this.logger.error(error, "error reading messages from the realtime API");
+      } finally {
+        await cancelAndWait(forwardTasks, AgentActivity.REPLY_TASK_CANCEL_TIMEOUT);
+      }
+    };
+    const messageOutputs = [];
+    const tasks = [
+      Task.from(
+        (controller) => readMessages(controller, messageOutputs),
+        void 0,
+        "AgentActivity.realtime_generation.read_messages"
+      )
+    ];
+    const [toolCallStream, toolCallStreamForTracing] = ev.functionStream.tee();
+    const toolCalls = [];
+    const readToolStreamTask = async (controller, stream) => {
+      const reader = stream.getReader();
+      try {
+        while (!controller.signal.aborted) {
+          const { done, value } = await reader.read();
+          if (done) break;
+          this.logger.debug({ tool_call: value }, "received tool call from the realtime API");
+          toolCalls.push(value);
+        }
+      } finally {
+        reader.releaseLock();
+      }
+    };
+    tasks.push(
+      Task.from(
+        (controller) => readToolStreamTask(controller, toolCallStreamForTracing),
+        replyAbortController,
+        "AgentActivity.realtime_generation.read_tool_stream"
+      )
+    );
+    const onToolExecutionStarted = (f) => {
+      speechHandle._itemAdded([f]);
+      this.agent._chatCtx.items.push(f);
+      this.agentSession._toolItemsAdded([f]);
+    };
+    const onToolExecutionCompleted = (out) => {
+      if (out.toolCallOutput) {
+        speechHandle._itemAdded([out.toolCallOutput]);
+      }
+    };
+    const [executeToolsTask, toolOutput] = performToolExecutions({
+      session: this.agentSession,
+      speechHandle,
+      toolCtx,
+      toolCallStream,
+      toolChoice: modelSettings.toolChoice,
+      controller: replyAbortController,
+      onToolExecutionStarted,
+      onToolExecutionCompleted
+    });
+    await speechHandle.waitIfNotInterrupted(tasks.map((task) => task.result));
+    if (audioOutput) {
+      await speechHandle.waitIfNotInterrupted([audioOutput.waitForPlayout()]);
+      this.agentSession._updateAgentState("listening");
+    }
+    if (speechHandle.interrupted) {
+      this.logger.debug(
+        { speech_id: speechHandle.id },
+        "Aborting all realtime generation tasks due to interruption"
+      );
+      replyAbortController.abort();
+      await cancelAndWait(tasks, AgentActivity.REPLY_TASK_CANCEL_TIMEOUT);
+      if (messageOutputs.length > 0) {
+        const [msgId, textOut, audioOut, msgModalities] = messageOutputs[0];
+        let forwardedText = (textOut == null ? void 0 : textOut.text) || "";
+        if (audioOutput) {
+          audioOutput.clearBuffer();
+          const playbackEv = await audioOutput.waitForPlayout();
+          let playbackPosition = playbackEv.playbackPosition;
+          if (audioOut == null ? void 0 : audioOut.firstFrameFut.done) {
+            this.logger.info(
+              { speech_id: speechHandle.id, playbackPosition: playbackEv.playbackPosition },
+              "playout interrupted"
+            );
+            if (playbackEv.synchronizedTranscript) {
+              forwardedText = playbackEv.synchronizedTranscript;
+            }
+          } else {
+            forwardedText = "";
+            playbackPosition = 0;
+          }
+          this.realtimeSession.truncate({
+            messageId: msgId,
+            audioEndMs: Math.floor(playbackPosition),
+            modalities: msgModalities,
+            audioTranscript: forwardedText
+          });
+        }
+        if (forwardedText) {
+          const message = ChatMessage.create({
+            role: "assistant",
+            content: forwardedText,
+            id: msgId,
+            interrupted: true
+          });
+          this.agent._chatCtx.insert(message);
+          speechHandle._itemAdded([message]);
+          this.agentSession._conversationItemAdded(message);
+        }
+        this.logger.info(
+          { speech_id: speechHandle.id, message: forwardedText },
+          "playout completed with interrupt"
+        );
+      }
+      speechHandle._markGenerationDone();
+      await executeToolsTask.cancelAndWait(AgentActivity.REPLY_TASK_CANCEL_TIMEOUT);
+      return;
+    }
+    if (messageOutputs.length > 0) {
+      const [msgId, textOut, _, __] = messageOutputs[0];
+      const message = ChatMessage.create({
+        role: "assistant",
+        content: (textOut == null ? void 0 : textOut.text) || "",
+        id: msgId,
+        interrupted: false
+      });
+      this.agent._chatCtx.insert(message);
+      speechHandle._itemAdded([message]);
+      this.agentSession._conversationItemAdded(message);
+    }
+    speechHandle._markGenerationDone();
+    toolOutput.firstToolStartedFuture.await.finally(() => {
+      this.agentSession._updateAgentState("thinking");
+    });
+    await executeToolsTask.result;
+    if (toolOutput.output.length === 0) {
+      if (!speechHandle.interrupted) {
+        this.agentSession._updateAgentState("listening");
+      }
+      return;
+    }
+    const { maxToolSteps } = this.agentSession.options;
+    if (speechHandle.numSteps >= maxToolSteps) {
+      this.logger.warn(
+        { speech_id: speechHandle.id, max_tool_steps: maxToolSteps },
+        "maximum number of function calls steps reached"
+      );
+      return;
+    }
+    const functionToolsExecutedEvent = createFunctionToolsExecutedEvent({
+      functionCalls: [],
+      functionCallOutputs: []
+    });
+    let shouldGenerateToolReply = false;
+    let newAgentTask = null;
+    let ignoreTaskSwitch = false;
+    for (const sanitizedOut of toolOutput.output) {
+      if (sanitizedOut.toolCallOutput !== void 0) {
+        functionToolsExecutedEvent.functionCallOutputs.push(sanitizedOut.toolCallOutput);
+        if (sanitizedOut.replyRequired) {
+          shouldGenerateToolReply = true;
+        }
+      }
+      if (newAgentTask !== null && sanitizedOut.agentTask !== void 0) {
+        this.logger.error("expected to receive only one agent task from the tool executions");
+        ignoreTaskSwitch = true;
+      }
+      newAgentTask = sanitizedOut.agentTask ?? null;
+      this.logger.debug(
+        {
+          speechId: speechHandle.id,
+          name: (_a = sanitizedOut.toolCall) == null ? void 0 : _a.name,
+          args: sanitizedOut.toolCall.args,
+          output: (_b = sanitizedOut.toolCallOutput) == null ? void 0 : _b.output,
+          isError: (_c = sanitizedOut.toolCallOutput) == null ? void 0 : _c.isError
+        },
+        "Tool call execution finished"
+      );
+    }
+    this.agentSession.emit(
+      AgentSessionEventTypes.FunctionToolsExecuted,
+      functionToolsExecutedEvent
+    );
+    let draining = this.draining;
+    if (!ignoreTaskSwitch && newAgentTask !== null) {
+      this.agentSession.updateAgent(newAgentTask);
+      draining = true;
+    }
+    if (functionToolsExecutedEvent.functionCallOutputs.length > 0) {
+      while (this.currentSpeech || this.speechQueue.size() > 0) {
+        if (this.currentSpeech && !this.currentSpeech.done() && this.currentSpeech !== speechHandle) {
+          await this.currentSpeech.waitForPlayout();
+        } else {
+          await new Promise((resolve) => setImmediate(resolve));
+        }
+      }
+      const chatCtx = this.realtimeSession.chatCtx.copy();
+      chatCtx.items.push(...functionToolsExecutedEvent.functionCallOutputs);
+      this.agentSession._toolItemsAdded(
+        functionToolsExecutedEvent.functionCallOutputs
+      );
+      try {
+        await this.realtimeSession.updateChatCtx(chatCtx);
+      } catch (error) {
+        this.logger.warn(
+          { error },
+          "failed to update chat context before generating the function calls results"
+        );
+      }
+    }
+    if (!shouldGenerateToolReply || this.llm.capabilities.autoToolReplyGeneration) {
+      return;
+    }
+    this.realtimeSession.interrupt();
+    const replySpeechHandle = SpeechHandle.create({
+      allowInterruptions: speechHandle.allowInterruptions,
+      stepIndex: speechHandle.numSteps + 1,
+      parent: speechHandle
+    });
+    this.agentSession.emit(
+      AgentSessionEventTypes.SpeechCreated,
+      createSpeechCreatedEvent({
+        userInitiated: false,
+        source: "tool_response",
+        speechHandle: replySpeechHandle
+      })
+    );
+    const toolChoice = draining || modelSettings.toolChoice === "none" ? "none" : "auto";
+    this.createSpeechTask({
+      task: Task.from(
+        (abortController) => this.realtimeReplyTask({
+          speechHandle: replySpeechHandle,
+          modelSettings: { toolChoice },
+          abortController
+        })
+      ),
+      ownedSpeechHandle: replySpeechHandle,
+      name: "AgentActivity.realtime_reply"
+    });
+    this.scheduleSpeech(replySpeechHandle, SpeechHandle.SPEECH_PRIORITY_NORMAL, true);
+  }
+  async realtimeReplyTask({
+    speechHandle,
+    modelSettings: { toolChoice },
+    userInput,
+    instructions,
+    abortController
+  }) {
+    speechHandleStorage.enterWith(speechHandle);
+    if (!this.realtimeSession) {
+      throw new Error("realtime session is not available");
+    }
+    await speechHandle.waitIfNotInterrupted([speechHandle._waitForAuthorization()]);
+    if (userInput) {
+      const chatCtx = this.realtimeSession.chatCtx.copy();
+      const message = chatCtx.addMessage({
+        role: "user",
+        content: userInput
+      });
+      await this.realtimeSession.updateChatCtx(chatCtx);
+      this.agent._chatCtx.insert(message);
+      this.agentSession._conversationItemAdded(message);
+    }
+    const originalToolChoice = this.toolChoice;
+    if (toolChoice !== void 0) {
+      this.realtimeSession.updateOptions({ toolChoice });
+    }
+    try {
+      const generationEvent = await this.realtimeSession.generateReply(instructions);
+      await this.realtimeGenerationTask(
+        speechHandle,
+        generationEvent,
+        { toolChoice },
+        abortController
+      );
+    } finally {
+      if (toolChoice !== void 0 && toolChoice !== originalToolChoice) {
+        this.realtimeSession.updateOptions({ toolChoice: originalToolChoice });
+      }
+    }
+  }
+  scheduleSpeech(speechHandle, priority, force = false) {
+    if (this.draining && !force) {
+      throw new Error("cannot schedule new speech, the agent is draining");
+    }
+    this.speechQueue.push([priority, Number(process.hrtime.bigint()), speechHandle]);
+    speechHandle._markScheduled();
+    this.wakeupMainTask();
+  }
+  async drain() {
+    return tracer.startActiveSpan(async (span) => this._drainImpl(span), {
+      name: "drain_agent_activity",
+      context: ROOT_CONTEXT
+    });
+  }
+  async _drainImpl(span) {
+    var _a;
+    span.setAttribute(traceTypes.ATTR_AGENT_LABEL, this.agent.id);
+    const unlock = await this.lock.lock();
+    try {
+      if (this._draining) return;
+      this.cancelPreemptiveGeneration();
+      const onExitTask = tracer.startActiveSpan(async () => this.agent.onExit(), {
+        name: "on_exit",
+        attributes: { [traceTypes.ATTR_AGENT_LABEL]: this.agent.id }
+      });
+      this.createSpeechTask({
+        task: Task.from(() => onExitTask),
+        name: "AgentActivity_onExit"
+      });
+      this.wakeupMainTask();
+      this._draining = true;
+      await ((_a = this._mainTask) == null ? void 0 : _a.result);
+    } finally {
+      unlock();
+    }
+  }
+  async close() {
+    var _a, _b, _c, _d;
+    const unlock = await this.lock.lock();
+    try {
+      if (!this._draining) {
+        this.logger.warn("task closing without draining");
+      }
+      this.cancelPreemptiveGeneration();
+      if (this.llm instanceof LLM) {
+        this.llm.off("metrics_collected", this.onMetricsCollected);
+      }
+      if (this.realtimeSession) {
+        this.realtimeSession.off("generation_created", this.onGenerationCreated);
+        this.realtimeSession.off("input_speech_started", this.onInputSpeechStarted);
+        this.realtimeSession.off("input_speech_stopped", this.onInputSpeechStopped);
+        this.realtimeSession.off(
+          "input_audio_transcription_completed",
+          this.onInputAudioTranscriptionCompleted
+        );
+        this.realtimeSession.off("metrics_collected", this.onMetricsCollected);
+      }
+      if (this.stt instanceof STT) {
+        this.stt.off("metrics_collected", this.onMetricsCollected);
+      }
+      if (this.tts instanceof TTS) {
+        this.tts.off("metrics_collected", this.onMetricsCollected);
+      }
+      if (this.vad instanceof VAD) {
+        this.vad.off("metrics_collected", this.onMetricsCollected);
+      }
+      this.detachAudioInput();
+      (_a = this.realtimeSpans) == null ? void 0 : _a.clear();
+      await ((_b = this.realtimeSession) == null ? void 0 : _b.close());
+      await ((_c = this.audioRecognition) == null ? void 0 : _c.close());
+      await ((_d = this._mainTask) == null ? void 0 : _d.cancelAndWait());
+    } finally {
+      unlock();
+    }
+  }
+}
+function toOaiToolChoice(toolChoice) {
+  return toolChoice !== null ? toolChoice : void 0;
+}
+export {
+  AgentActivity
+};
+//# sourceMappingURL=agent_activity.js.map