@livekit/agents 0.7.9 → 1.0.0-next.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/_exceptions.cjs +109 -0
- package/dist/_exceptions.cjs.map +1 -0
- package/dist/_exceptions.d.cts +64 -0
- package/dist/_exceptions.d.ts +64 -0
- package/dist/_exceptions.d.ts.map +1 -0
- package/dist/_exceptions.js +80 -0
- package/dist/_exceptions.js.map +1 -0
- package/dist/audio.cjs +10 -3
- package/dist/audio.cjs.map +1 -1
- package/dist/audio.d.cts +2 -0
- package/dist/audio.d.ts +2 -0
- package/dist/audio.d.ts.map +1 -1
- package/dist/audio.js +8 -2
- package/dist/audio.js.map +1 -1
- package/dist/cli.cjs +25 -0
- package/dist/cli.cjs.map +1 -1
- package/dist/cli.d.ts.map +1 -1
- package/dist/cli.js +25 -0
- package/dist/cli.js.map +1 -1
- package/dist/constants.cjs +6 -3
- package/dist/constants.cjs.map +1 -1
- package/dist/constants.d.cts +2 -1
- package/dist/constants.d.ts +2 -1
- package/dist/constants.d.ts.map +1 -1
- package/dist/constants.js +4 -2
- package/dist/constants.js.map +1 -1
- package/dist/http_server.cjs.map +1 -1
- package/dist/http_server.d.cts +1 -0
- package/dist/http_server.d.ts +1 -0
- package/dist/http_server.d.ts.map +1 -1
- package/dist/http_server.js.map +1 -1
- package/dist/index.cjs +27 -20
- package/dist/index.cjs.map +1 -1
- package/dist/index.d.cts +13 -10
- package/dist/index.d.ts +13 -10
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +15 -11
- package/dist/index.js.map +1 -1
- package/dist/inference_runner.cjs +0 -1
- package/dist/inference_runner.cjs.map +1 -1
- package/dist/inference_runner.d.cts +2 -3
- package/dist/inference_runner.d.ts +2 -3
- package/dist/inference_runner.d.ts.map +1 -1
- package/dist/inference_runner.js +0 -1
- package/dist/inference_runner.js.map +1 -1
- package/dist/ipc/inference_proc_executor.cjs +2 -2
- package/dist/ipc/inference_proc_executor.cjs.map +1 -1
- package/dist/ipc/inference_proc_executor.js +2 -2
- package/dist/ipc/inference_proc_executor.js.map +1 -1
- package/dist/ipc/job_executor.cjs.map +1 -1
- package/dist/ipc/job_executor.js.map +1 -1
- package/dist/ipc/job_proc_executor.cjs +1 -0
- package/dist/ipc/job_proc_executor.cjs.map +1 -1
- package/dist/ipc/job_proc_executor.js +1 -0
- package/dist/ipc/job_proc_executor.js.map +1 -1
- package/dist/ipc/job_proc_lazy_main.cjs +1 -1
- package/dist/ipc/job_proc_lazy_main.cjs.map +1 -1
- package/dist/ipc/job_proc_lazy_main.js +1 -1
- package/dist/ipc/job_proc_lazy_main.js.map +1 -1
- package/dist/ipc/supervised_proc.d.cts +1 -1
- package/dist/ipc/supervised_proc.d.ts +1 -1
- package/dist/ipc/supervised_proc.d.ts.map +1 -1
- package/dist/job.cjs +14 -2
- package/dist/job.cjs.map +1 -1
- package/dist/job.d.cts +8 -0
- package/dist/job.d.ts +8 -0
- package/dist/job.d.ts.map +1 -1
- package/dist/job.js +12 -1
- package/dist/job.js.map +1 -1
- package/dist/llm/chat_context.cjs +332 -82
- package/dist/llm/chat_context.cjs.map +1 -1
- package/dist/llm/chat_context.d.cts +152 -48
- package/dist/llm/chat_context.d.ts +152 -48
- package/dist/llm/chat_context.d.ts.map +1 -1
- package/dist/llm/chat_context.js +327 -81
- package/dist/llm/chat_context.js.map +1 -1
- package/dist/llm/chat_context.test.cjs +380 -0
- package/dist/llm/chat_context.test.cjs.map +1 -0
- package/dist/llm/chat_context.test.js +385 -0
- package/dist/llm/chat_context.test.js.map +1 -0
- package/dist/llm/index.cjs +37 -8
- package/dist/llm/index.cjs.map +1 -1
- package/dist/llm/index.d.cts +7 -3
- package/dist/llm/index.d.ts +7 -3
- package/dist/llm/index.d.ts.map +1 -1
- package/dist/llm/index.js +39 -9
- package/dist/llm/index.js.map +1 -1
- package/dist/llm/llm.cjs +98 -33
- package/dist/llm/llm.cjs.map +1 -1
- package/dist/llm/llm.d.cts +50 -24
- package/dist/llm/llm.d.ts +50 -24
- package/dist/llm/llm.d.ts.map +1 -1
- package/dist/llm/llm.js +99 -33
- package/dist/llm/llm.js.map +1 -1
- package/dist/llm/provider_format/google.cjs +128 -0
- package/dist/llm/provider_format/google.cjs.map +1 -0
- package/dist/llm/provider_format/google.d.cts +6 -0
- package/dist/llm/provider_format/google.d.ts +6 -0
- package/dist/llm/provider_format/google.d.ts.map +1 -0
- package/dist/llm/provider_format/google.js +104 -0
- package/dist/llm/provider_format/google.js.map +1 -0
- package/dist/llm/provider_format/google.test.cjs +676 -0
- package/dist/llm/provider_format/google.test.cjs.map +1 -0
- package/dist/llm/provider_format/google.test.js +675 -0
- package/dist/llm/provider_format/google.test.js.map +1 -0
- package/dist/llm/provider_format/index.cjs +40 -0
- package/dist/llm/provider_format/index.cjs.map +1 -0
- package/dist/llm/provider_format/index.d.cts +4 -0
- package/dist/llm/provider_format/index.d.ts +4 -0
- package/dist/llm/provider_format/index.d.ts.map +1 -0
- package/dist/llm/provider_format/index.js +16 -0
- package/dist/llm/provider_format/index.js.map +1 -0
- package/dist/llm/provider_format/openai.cjs +116 -0
- package/dist/llm/provider_format/openai.cjs.map +1 -0
- package/dist/llm/provider_format/openai.d.cts +3 -0
- package/dist/llm/provider_format/openai.d.ts +3 -0
- package/dist/llm/provider_format/openai.d.ts.map +1 -0
- package/dist/llm/provider_format/openai.js +92 -0
- package/dist/llm/provider_format/openai.js.map +1 -0
- package/dist/llm/provider_format/openai.test.cjs +490 -0
- package/dist/llm/provider_format/openai.test.cjs.map +1 -0
- package/dist/llm/provider_format/openai.test.js +489 -0
- package/dist/llm/provider_format/openai.test.js.map +1 -0
- package/dist/llm/provider_format/utils.cjs +146 -0
- package/dist/llm/provider_format/utils.cjs.map +1 -0
- package/dist/llm/provider_format/utils.d.cts +38 -0
- package/dist/llm/provider_format/utils.d.ts +38 -0
- package/dist/llm/provider_format/utils.d.ts.map +1 -0
- package/dist/llm/provider_format/utils.js +122 -0
- package/dist/llm/provider_format/utils.js.map +1 -0
- package/dist/llm/realtime.cjs +77 -0
- package/dist/llm/realtime.cjs.map +1 -0
- package/dist/llm/realtime.d.cts +98 -0
- package/dist/llm/realtime.d.ts +98 -0
- package/dist/llm/realtime.d.ts.map +1 -0
- package/dist/llm/realtime.js +52 -0
- package/dist/llm/realtime.js.map +1 -0
- package/dist/llm/remote_chat_context.cjs +112 -0
- package/dist/llm/remote_chat_context.cjs.map +1 -0
- package/dist/llm/remote_chat_context.d.cts +23 -0
- package/dist/llm/remote_chat_context.d.ts +23 -0
- package/dist/llm/remote_chat_context.d.ts.map +1 -0
- package/dist/llm/remote_chat_context.js +88 -0
- package/dist/llm/remote_chat_context.js.map +1 -0
- package/dist/llm/remote_chat_context.test.cjs +225 -0
- package/dist/llm/remote_chat_context.test.cjs.map +1 -0
- package/dist/llm/remote_chat_context.test.js +224 -0
- package/dist/llm/remote_chat_context.test.js.map +1 -0
- package/dist/llm/tool_context.cjs +111 -0
- package/dist/llm/tool_context.cjs.map +1 -0
- package/dist/llm/tool_context.d.cts +125 -0
- package/dist/llm/tool_context.d.ts +125 -0
- package/dist/llm/tool_context.d.ts.map +1 -0
- package/dist/llm/tool_context.js +80 -0
- package/dist/llm/tool_context.js.map +1 -0
- package/dist/llm/tool_context.test.cjs +162 -0
- package/dist/llm/tool_context.test.cjs.map +1 -0
- package/dist/llm/tool_context.test.js +161 -0
- package/dist/llm/tool_context.test.js.map +1 -0
- package/dist/llm/tool_context.type.test.cjs +92 -0
- package/dist/llm/tool_context.type.test.cjs.map +1 -0
- package/dist/llm/tool_context.type.test.js +91 -0
- package/dist/llm/tool_context.type.test.js.map +1 -0
- package/dist/llm/utils.cjs +260 -0
- package/dist/llm/utils.cjs.map +1 -0
- package/dist/llm/utils.d.cts +42 -0
- package/dist/llm/utils.d.ts +42 -0
- package/dist/llm/utils.d.ts.map +1 -0
- package/dist/llm/utils.js +223 -0
- package/dist/llm/utils.js.map +1 -0
- package/dist/llm/utils.test.cjs +513 -0
- package/dist/llm/utils.test.cjs.map +1 -0
- package/dist/llm/utils.test.js +490 -0
- package/dist/llm/utils.test.js.map +1 -0
- package/dist/metrics/base.cjs +0 -27
- package/dist/metrics/base.cjs.map +1 -1
- package/dist/metrics/base.d.cts +105 -63
- package/dist/metrics/base.d.ts +105 -63
- package/dist/metrics/base.d.ts.map +1 -1
- package/dist/metrics/base.js +0 -19
- package/dist/metrics/base.js.map +1 -1
- package/dist/metrics/index.cjs +0 -3
- package/dist/metrics/index.cjs.map +1 -1
- package/dist/metrics/index.d.cts +2 -3
- package/dist/metrics/index.d.ts +2 -3
- package/dist/metrics/index.d.ts.map +1 -1
- package/dist/metrics/index.js +0 -2
- package/dist/metrics/index.js.map +1 -1
- package/dist/metrics/usage_collector.cjs +17 -12
- package/dist/metrics/usage_collector.cjs.map +1 -1
- package/dist/metrics/usage_collector.d.cts +3 -2
- package/dist/metrics/usage_collector.d.ts +3 -2
- package/dist/metrics/usage_collector.d.ts.map +1 -1
- package/dist/metrics/usage_collector.js +17 -12
- package/dist/metrics/usage_collector.js.map +1 -1
- package/dist/metrics/utils.cjs +22 -59
- package/dist/metrics/utils.cjs.map +1 -1
- package/dist/metrics/utils.d.cts +1 -8
- package/dist/metrics/utils.d.ts +1 -8
- package/dist/metrics/utils.d.ts.map +1 -1
- package/dist/metrics/utils.js +22 -52
- package/dist/metrics/utils.js.map +1 -1
- package/dist/multimodal/index.cjs +0 -2
- package/dist/multimodal/index.cjs.map +1 -1
- package/dist/multimodal/index.d.cts +0 -1
- package/dist/multimodal/index.d.ts +0 -1
- package/dist/multimodal/index.d.ts.map +1 -1
- package/dist/multimodal/index.js +0 -1
- package/dist/multimodal/index.js.map +1 -1
- package/dist/plugin.cjs +24 -8
- package/dist/plugin.cjs.map +1 -1
- package/dist/plugin.d.cts +18 -4
- package/dist/plugin.d.ts +18 -4
- package/dist/plugin.d.ts.map +1 -1
- package/dist/plugin.js +22 -7
- package/dist/plugin.js.map +1 -1
- package/dist/stream/deferred_stream.cjs +98 -0
- package/dist/stream/deferred_stream.cjs.map +1 -0
- package/dist/stream/deferred_stream.d.cts +27 -0
- package/dist/stream/deferred_stream.d.ts +27 -0
- package/dist/stream/deferred_stream.d.ts.map +1 -0
- package/dist/stream/deferred_stream.js +73 -0
- package/dist/stream/deferred_stream.js.map +1 -0
- package/dist/stream/deferred_stream.test.cjs +527 -0
- package/dist/stream/deferred_stream.test.cjs.map +1 -0
- package/dist/stream/deferred_stream.test.js +526 -0
- package/dist/stream/deferred_stream.test.js.map +1 -0
- package/dist/stream/identity_transform.cjs +42 -0
- package/dist/stream/identity_transform.cjs.map +1 -0
- package/dist/stream/identity_transform.d.cts +6 -0
- package/dist/stream/identity_transform.d.ts +6 -0
- package/dist/stream/identity_transform.d.ts.map +1 -0
- package/dist/stream/identity_transform.js +18 -0
- package/dist/stream/identity_transform.js.map +1 -0
- package/dist/stream/identity_transform.test.cjs +125 -0
- package/dist/stream/identity_transform.test.cjs.map +1 -0
- package/dist/stream/identity_transform.test.js +124 -0
- package/dist/stream/identity_transform.test.js.map +1 -0
- package/dist/stream/index.cjs +38 -0
- package/dist/stream/index.cjs.map +1 -0
- package/dist/stream/index.d.cts +5 -0
- package/dist/stream/index.d.ts +5 -0
- package/dist/stream/index.d.ts.map +1 -0
- package/dist/stream/index.js +11 -0
- package/dist/stream/index.js.map +1 -0
- package/dist/stream/merge_readable_streams.cjs +59 -0
- package/dist/stream/merge_readable_streams.cjs.map +1 -0
- package/dist/stream/merge_readable_streams.d.cts +4 -0
- package/dist/stream/merge_readable_streams.d.ts +4 -0
- package/dist/stream/merge_readable_streams.d.ts.map +1 -0
- package/dist/stream/merge_readable_streams.js +35 -0
- package/dist/stream/merge_readable_streams.js.map +1 -0
- package/dist/stream/stream_channel.cjs +47 -0
- package/dist/stream/stream_channel.cjs.map +1 -0
- package/dist/stream/stream_channel.d.cts +9 -0
- package/dist/stream/stream_channel.d.ts +9 -0
- package/dist/stream/stream_channel.d.ts.map +1 -0
- package/dist/stream/stream_channel.js +23 -0
- package/dist/stream/stream_channel.js.map +1 -0
- package/dist/stream/stream_channel.test.cjs +97 -0
- package/dist/stream/stream_channel.test.cjs.map +1 -0
- package/dist/stream/stream_channel.test.js +96 -0
- package/dist/stream/stream_channel.test.js.map +1 -0
- package/dist/stt/stream_adapter.cjs +3 -4
- package/dist/stt/stream_adapter.cjs.map +1 -1
- package/dist/stt/stream_adapter.d.cts +1 -0
- package/dist/stt/stream_adapter.d.ts +1 -0
- package/dist/stt/stream_adapter.d.ts.map +1 -1
- package/dist/stt/stream_adapter.js +3 -4
- package/dist/stt/stream_adapter.js.map +1 -1
- package/dist/stt/stt.cjs +101 -10
- package/dist/stt/stt.cjs.map +1 -1
- package/dist/stt/stt.d.cts +26 -5
- package/dist/stt/stt.d.ts +26 -5
- package/dist/stt/stt.d.ts.map +1 -1
- package/dist/stt/stt.js +102 -11
- package/dist/stt/stt.js.map +1 -1
- package/dist/tokenize/basic/basic.cjs +10 -5
- package/dist/tokenize/basic/basic.cjs.map +1 -1
- package/dist/tokenize/basic/basic.d.cts +7 -1
- package/dist/tokenize/basic/basic.d.ts +7 -1
- package/dist/tokenize/basic/basic.d.ts.map +1 -1
- package/dist/tokenize/basic/basic.js +10 -5
- package/dist/tokenize/basic/basic.js.map +1 -1
- package/dist/tokenize/basic/sentence.cjs +14 -6
- package/dist/tokenize/basic/sentence.cjs.map +1 -1
- package/dist/tokenize/basic/sentence.d.cts +1 -1
- package/dist/tokenize/basic/sentence.d.ts +1 -1
- package/dist/tokenize/basic/sentence.d.ts.map +1 -1
- package/dist/tokenize/basic/sentence.js +14 -6
- package/dist/tokenize/basic/sentence.js.map +1 -1
- package/dist/tokenize/token_stream.cjs +5 -3
- package/dist/tokenize/token_stream.cjs.map +1 -1
- package/dist/tokenize/token_stream.d.cts +1 -0
- package/dist/tokenize/token_stream.d.ts +1 -0
- package/dist/tokenize/token_stream.d.ts.map +1 -1
- package/dist/tokenize/token_stream.js +6 -4
- package/dist/tokenize/token_stream.js.map +1 -1
- package/dist/transcription.cjs +1 -2
- package/dist/transcription.cjs.map +1 -1
- package/dist/transcription.d.ts.map +1 -1
- package/dist/transcription.js +2 -3
- package/dist/transcription.js.map +1 -1
- package/dist/tts/index.cjs +2 -4
- package/dist/tts/index.cjs.map +1 -1
- package/dist/tts/index.d.cts +1 -1
- package/dist/tts/index.d.ts +1 -1
- package/dist/tts/index.d.ts.map +1 -1
- package/dist/tts/index.js +1 -3
- package/dist/tts/index.js.map +1 -1
- package/dist/tts/stream_adapter.cjs +26 -13
- package/dist/tts/stream_adapter.cjs.map +1 -1
- package/dist/tts/stream_adapter.d.cts +1 -1
- package/dist/tts/stream_adapter.d.ts +1 -1
- package/dist/tts/stream_adapter.d.ts.map +1 -1
- package/dist/tts/stream_adapter.js +27 -14
- package/dist/tts/stream_adapter.js.map +1 -1
- package/dist/tts/tts.cjs +157 -25
- package/dist/tts/tts.cjs.map +1 -1
- package/dist/tts/tts.d.cts +29 -5
- package/dist/tts/tts.d.ts +29 -5
- package/dist/tts/tts.d.ts.map +1 -1
- package/dist/tts/tts.js +157 -24
- package/dist/tts/tts.js.map +1 -1
- package/dist/types.cjs +60 -0
- package/dist/types.cjs.map +1 -0
- package/dist/types.d.cts +13 -0
- package/dist/types.d.ts +13 -0
- package/dist/types.d.ts.map +1 -0
- package/dist/types.js +35 -0
- package/dist/types.js.map +1 -0
- package/dist/utils.cjs +281 -27
- package/dist/utils.cjs.map +1 -1
- package/dist/utils.d.cts +134 -9
- package/dist/utils.d.ts +134 -9
- package/dist/utils.d.ts.map +1 -1
- package/dist/utils.js +265 -26
- package/dist/utils.js.map +1 -1
- package/dist/utils.test.cjs +492 -0
- package/dist/utils.test.cjs.map +1 -0
- package/dist/utils.test.js +498 -0
- package/dist/utils.test.js.map +1 -0
- package/dist/vad.cjs +76 -20
- package/dist/vad.cjs.map +1 -1
- package/dist/vad.d.cts +25 -5
- package/dist/vad.d.ts +25 -5
- package/dist/vad.d.ts.map +1 -1
- package/dist/vad.js +76 -20
- package/dist/vad.js.map +1 -1
- package/dist/voice/agent.cjs +245 -0
- package/dist/voice/agent.cjs.map +1 -0
- package/dist/voice/agent.d.cts +78 -0
- package/dist/voice/agent.d.ts +78 -0
- package/dist/voice/agent.d.ts.map +1 -0
- package/dist/voice/agent.js +220 -0
- package/dist/voice/agent.js.map +1 -0
- package/dist/voice/agent.test.cjs +61 -0
- package/dist/voice/agent.test.cjs.map +1 -0
- package/dist/voice/agent.test.js +60 -0
- package/dist/voice/agent.test.js.map +1 -0
- package/dist/voice/agent_activity.cjs +1453 -0
- package/dist/voice/agent_activity.cjs.map +1 -0
- package/dist/voice/agent_activity.d.cts +94 -0
- package/dist/voice/agent_activity.d.ts +94 -0
- package/dist/voice/agent_activity.d.ts.map +1 -0
- package/dist/voice/agent_activity.js +1449 -0
- package/dist/voice/agent_activity.js.map +1 -0
- package/dist/voice/agent_session.cjs +312 -0
- package/dist/voice/agent_session.cjs.map +1 -0
- package/dist/voice/agent_session.d.cts +121 -0
- package/dist/voice/agent_session.d.ts +121 -0
- package/dist/voice/agent_session.d.ts.map +1 -0
- package/dist/voice/agent_session.js +295 -0
- package/dist/voice/agent_session.js.map +1 -0
- package/dist/voice/audio_recognition.cjs +375 -0
- package/dist/voice/audio_recognition.cjs.map +1 -0
- package/dist/voice/audio_recognition.d.cts +80 -0
- package/dist/voice/audio_recognition.d.ts +80 -0
- package/dist/voice/audio_recognition.d.ts.map +1 -0
- package/dist/voice/audio_recognition.js +351 -0
- package/dist/voice/audio_recognition.js.map +1 -0
- package/dist/voice/events.cjs +145 -0
- package/dist/voice/events.cjs.map +1 -0
- package/dist/voice/events.d.cts +124 -0
- package/dist/voice/events.d.ts +124 -0
- package/dist/voice/events.d.ts.map +1 -0
- package/dist/voice/events.js +110 -0
- package/dist/voice/events.js.map +1 -0
- package/dist/voice/generation.cjs +700 -0
- package/dist/voice/generation.cjs.map +1 -0
- package/dist/voice/generation.d.cts +115 -0
- package/dist/voice/generation.d.ts +115 -0
- package/dist/voice/generation.d.ts.map +1 -0
- package/dist/voice/generation.js +672 -0
- package/dist/voice/generation.js.map +1 -0
- package/dist/voice/index.cjs +40 -0
- package/dist/voice/index.cjs.map +1 -0
- package/dist/voice/index.d.cts +5 -0
- package/dist/voice/index.d.ts +5 -0
- package/dist/voice/index.d.ts.map +1 -0
- package/dist/voice/index.js +11 -0
- package/dist/voice/index.js.map +1 -0
- package/dist/voice/io.cjs +245 -0
- package/dist/voice/io.cjs.map +1 -0
- package/dist/voice/io.d.cts +101 -0
- package/dist/voice/io.d.ts +101 -0
- package/dist/voice/io.d.ts.map +1 -0
- package/dist/voice/io.js +217 -0
- package/dist/voice/io.js.map +1 -0
- package/dist/voice/room_io/_input.cjs +121 -0
- package/dist/voice/room_io/_input.cjs.map +1 -0
- package/dist/voice/room_io/_input.d.cts +24 -0
- package/dist/voice/room_io/_input.d.ts +24 -0
- package/dist/voice/room_io/_input.d.ts.map +1 -0
- package/dist/voice/room_io/_input.js +102 -0
- package/dist/voice/room_io/_input.js.map +1 -0
- package/dist/voice/room_io/_output.cjs +358 -0
- package/dist/voice/room_io/_output.cjs.map +1 -0
- package/dist/voice/room_io/_output.d.cts +75 -0
- package/dist/voice/room_io/_output.d.ts +75 -0
- package/dist/voice/room_io/_output.d.ts.map +1 -0
- package/dist/voice/room_io/_output.js +342 -0
- package/dist/voice/room_io/_output.js.map +1 -0
- package/dist/voice/room_io/index.cjs +25 -0
- package/dist/voice/room_io/index.cjs.map +1 -0
- package/dist/voice/room_io/index.d.cts +3 -0
- package/dist/voice/room_io/index.d.ts +3 -0
- package/dist/voice/room_io/index.d.ts.map +1 -0
- package/dist/voice/room_io/index.js +3 -0
- package/dist/voice/room_io/index.js.map +1 -0
- package/dist/voice/room_io/room_io.cjs +370 -0
- package/dist/voice/room_io/room_io.cjs.map +1 -0
- package/dist/voice/room_io/room_io.d.cts +73 -0
- package/dist/voice/room_io/room_io.d.ts +73 -0
- package/dist/voice/room_io/room_io.d.ts.map +1 -0
- package/dist/voice/room_io/room_io.js +361 -0
- package/dist/voice/room_io/room_io.js.map +1 -0
- package/dist/{pipeline/index.cjs → voice/run_context.cjs} +16 -11
- package/dist/voice/run_context.cjs.map +1 -0
- package/dist/voice/run_context.d.cts +12 -0
- package/dist/voice/run_context.d.ts +12 -0
- package/dist/voice/run_context.d.ts.map +1 -0
- package/dist/voice/run_context.js +14 -0
- package/dist/voice/run_context.js.map +1 -0
- package/dist/voice/speech_handle.cjs +105 -0
- package/dist/voice/speech_handle.cjs.map +1 -0
- package/dist/voice/speech_handle.d.cts +46 -0
- package/dist/voice/speech_handle.d.ts +46 -0
- package/dist/voice/speech_handle.d.ts.map +1 -0
- package/dist/voice/speech_handle.js +81 -0
- package/dist/voice/speech_handle.js.map +1 -0
- package/dist/voice/transcription/_utils.cjs +45 -0
- package/dist/voice/transcription/_utils.cjs.map +1 -0
- package/dist/voice/transcription/_utils.d.cts +3 -0
- package/dist/voice/transcription/_utils.d.ts +3 -0
- package/dist/voice/transcription/_utils.d.ts.map +1 -0
- package/dist/voice/transcription/_utils.js +21 -0
- package/dist/voice/transcription/_utils.js.map +1 -0
- package/dist/voice/transcription/index.cjs +23 -0
- package/dist/voice/transcription/index.cjs.map +1 -0
- package/dist/voice/transcription/index.d.cts +2 -0
- package/dist/voice/transcription/index.d.ts +2 -0
- package/dist/voice/transcription/index.d.ts.map +1 -0
- package/dist/voice/transcription/index.js +2 -0
- package/dist/voice/transcription/index.js.map +1 -0
- package/dist/voice/transcription/synchronizer.cjs +380 -0
- package/dist/voice/transcription/synchronizer.cjs.map +1 -0
- package/dist/voice/transcription/synchronizer.d.cts +86 -0
- package/dist/voice/transcription/synchronizer.d.ts +86 -0
- package/dist/voice/transcription/synchronizer.d.ts.map +1 -0
- package/dist/voice/transcription/synchronizer.js +355 -0
- package/dist/voice/transcription/synchronizer.js.map +1 -0
- package/dist/worker.cjs +22 -4
- package/dist/worker.cjs.map +1 -1
- package/dist/worker.d.cts +1 -1
- package/dist/worker.d.ts +1 -1
- package/dist/worker.d.ts.map +1 -1
- package/dist/worker.js +22 -4
- package/dist/worker.js.map +1 -1
- package/package.json +9 -2
- package/src/_exceptions.ts +137 -0
- package/src/audio.ts +12 -1
- package/src/cli.ts +37 -0
- package/src/constants.ts +2 -1
- package/src/http_server.ts +1 -0
- package/src/index.ts +13 -10
- package/src/inference_runner.ts +2 -3
- package/src/ipc/inference_proc_executor.ts +2 -2
- package/src/ipc/job_executor.ts +1 -1
- package/src/ipc/job_proc_executor.ts +1 -1
- package/src/ipc/job_proc_lazy_main.ts +1 -1
- package/src/job.ts +18 -0
- package/src/llm/__snapshots__/chat_context.test.ts.snap +527 -0
- package/src/llm/__snapshots__/tool_context.test.ts.snap +177 -0
- package/src/llm/__snapshots__/utils.test.ts.snap +65 -0
- package/src/llm/chat_context.test.ts +450 -0
- package/src/llm/chat_context.ts +501 -103
- package/src/llm/index.ts +53 -18
- package/src/llm/llm.ts +149 -50
- package/src/llm/provider_format/google.test.ts +772 -0
- package/src/llm/provider_format/google.ts +130 -0
- package/src/llm/provider_format/index.ts +23 -0
- package/src/llm/provider_format/openai.test.ts +581 -0
- package/src/llm/provider_format/openai.ts +118 -0
- package/src/llm/provider_format/utils.ts +183 -0
- package/src/llm/realtime.ts +151 -0
- package/src/llm/remote_chat_context.test.ts +290 -0
- package/src/llm/remote_chat_context.ts +114 -0
- package/src/llm/tool_context.test.ts +198 -0
- package/src/llm/tool_context.ts +259 -0
- package/src/llm/tool_context.type.test.ts +115 -0
- package/src/llm/utils.test.ts +670 -0
- package/src/llm/utils.ts +324 -0
- package/src/metrics/base.ts +110 -78
- package/src/metrics/index.ts +3 -9
- package/src/metrics/usage_collector.ts +19 -13
- package/src/metrics/utils.ts +24 -69
- package/src/multimodal/index.ts +0 -1
- package/src/plugin.ts +26 -8
- package/src/stream/deferred_stream.test.ts +755 -0
- package/src/stream/deferred_stream.ts +110 -0
- package/src/stream/identity_transform.test.ts +179 -0
- package/src/stream/identity_transform.ts +18 -0
- package/src/stream/index.ts +7 -0
- package/src/stream/merge_readable_streams.ts +40 -0
- package/src/stream/stream_channel.test.ts +129 -0
- package/src/stream/stream_channel.ts +32 -0
- package/src/stt/stream_adapter.ts +3 -5
- package/src/stt/stt.ts +135 -17
- package/src/tokenize/basic/basic.ts +13 -5
- package/src/tokenize/basic/sentence.ts +20 -6
- package/src/tokenize/token_stream.ts +7 -4
- package/src/transcription.ts +2 -3
- package/src/tts/index.ts +0 -1
- package/src/tts/stream_adapter.ts +42 -16
- package/src/tts/tts.ts +203 -21
- package/src/types.ts +42 -0
- package/src/utils.test.ts +658 -0
- package/src/utils.ts +375 -44
- package/src/vad.ts +90 -22
- package/src/voice/agent.test.ts +80 -0
- package/src/voice/agent.ts +332 -0
- package/src/voice/agent_activity.ts +1913 -0
- package/src/voice/agent_session.ts +460 -0
- package/src/voice/audio_recognition.ts +474 -0
- package/src/voice/events.ts +252 -0
- package/src/voice/generation.ts +881 -0
- package/src/voice/index.ts +7 -0
- package/src/voice/io.ts +304 -0
- package/src/voice/room_io/_input.ts +144 -0
- package/src/voice/room_io/_output.ts +436 -0
- package/src/voice/room_io/index.ts +5 -0
- package/src/voice/room_io/room_io.ts +495 -0
- package/src/voice/run_context.ts +20 -0
- package/src/voice/speech_handle.ts +104 -0
- package/src/voice/transcription/_utils.ts +25 -0
- package/src/voice/transcription/index.ts +4 -0
- package/src/voice/transcription/synchronizer.ts +478 -0
- package/src/worker.ts +22 -2
- package/dist/llm/function_context.cjs +0 -103
- package/dist/llm/function_context.cjs.map +0 -1
- package/dist/llm/function_context.d.cts +0 -47
- package/dist/llm/function_context.d.ts +0 -47
- package/dist/llm/function_context.d.ts.map +0 -1
- package/dist/llm/function_context.js +0 -78
- package/dist/llm/function_context.js.map +0 -1
- package/dist/llm/function_context.test.cjs +0 -218
- package/dist/llm/function_context.test.cjs.map +0 -1
- package/dist/llm/function_context.test.js +0 -217
- package/dist/llm/function_context.test.js.map +0 -1
- package/dist/multimodal/multimodal_agent.cjs +0 -486
- package/dist/multimodal/multimodal_agent.cjs.map +0 -1
- package/dist/multimodal/multimodal_agent.d.cts +0 -48
- package/dist/multimodal/multimodal_agent.d.ts +0 -48
- package/dist/multimodal/multimodal_agent.d.ts.map +0 -1
- package/dist/multimodal/multimodal_agent.js +0 -461
- package/dist/multimodal/multimodal_agent.js.map +0 -1
- package/dist/pipeline/agent_output.cjs +0 -197
- package/dist/pipeline/agent_output.cjs.map +0 -1
- package/dist/pipeline/agent_output.d.cts +0 -33
- package/dist/pipeline/agent_output.d.ts +0 -33
- package/dist/pipeline/agent_output.d.ts.map +0 -1
- package/dist/pipeline/agent_output.js +0 -172
- package/dist/pipeline/agent_output.js.map +0 -1
- package/dist/pipeline/agent_playout.cjs +0 -175
- package/dist/pipeline/agent_playout.cjs.map +0 -1
- package/dist/pipeline/agent_playout.d.cts +0 -40
- package/dist/pipeline/agent_playout.d.ts +0 -40
- package/dist/pipeline/agent_playout.d.ts.map +0 -1
- package/dist/pipeline/agent_playout.js +0 -139
- package/dist/pipeline/agent_playout.js.map +0 -1
- package/dist/pipeline/human_input.cjs +0 -171
- package/dist/pipeline/human_input.cjs.map +0 -1
- package/dist/pipeline/human_input.d.cts +0 -30
- package/dist/pipeline/human_input.d.ts +0 -30
- package/dist/pipeline/human_input.d.ts.map +0 -1
- package/dist/pipeline/human_input.js +0 -146
- package/dist/pipeline/human_input.js.map +0 -1
- package/dist/pipeline/index.cjs.map +0 -1
- package/dist/pipeline/index.d.cts +0 -2
- package/dist/pipeline/index.d.ts +0 -2
- package/dist/pipeline/index.d.ts.map +0 -1
- package/dist/pipeline/index.js +0 -11
- package/dist/pipeline/index.js.map +0 -1
- package/dist/pipeline/pipeline_agent.cjs +0 -859
- package/dist/pipeline/pipeline_agent.cjs.map +0 -1
- package/dist/pipeline/pipeline_agent.d.cts +0 -150
- package/dist/pipeline/pipeline_agent.d.ts +0 -150
- package/dist/pipeline/pipeline_agent.d.ts.map +0 -1
- package/dist/pipeline/pipeline_agent.js +0 -837
- package/dist/pipeline/pipeline_agent.js.map +0 -1
- package/dist/pipeline/speech_handle.cjs +0 -176
- package/dist/pipeline/speech_handle.cjs.map +0 -1
- package/dist/pipeline/speech_handle.d.cts +0 -37
- package/dist/pipeline/speech_handle.d.ts +0 -37
- package/dist/pipeline/speech_handle.d.ts.map +0 -1
- package/dist/pipeline/speech_handle.js +0 -152
- package/dist/pipeline/speech_handle.js.map +0 -1
- package/src/llm/function_context.test.ts +0 -248
- package/src/llm/function_context.ts +0 -142
- package/src/multimodal/multimodal_agent.ts +0 -592
- package/src/pipeline/agent_output.ts +0 -219
- package/src/pipeline/agent_playout.ts +0 -192
- package/src/pipeline/human_input.ts +0 -188
- package/src/pipeline/index.ts +0 -15
- package/src/pipeline/pipeline_agent.ts +0 -1197
- package/src/pipeline/speech_handle.ts +0 -201
|
@@ -1,219 +0,0 @@
|
|
|
1
|
-
// SPDX-FileCopyrightText: 2024 LiveKit, Inc.
|
|
2
|
-
//
|
|
3
|
-
// SPDX-License-Identifier: Apache-2.0
|
|
4
|
-
import type { AudioFrame } from '@livekit/rtc-node';
|
|
5
|
-
import { log } from '../log.js';
|
|
6
|
-
import type { TextAudioSynchronizer } from '../transcription.js';
|
|
7
|
-
import { SynthesizeStream, type TTS } from '../tts/index.js';
|
|
8
|
-
import { AsyncIterableQueue, CancellablePromise, Future, gracefullyCancel } from '../utils.js';
|
|
9
|
-
import type { AgentPlayout, PlayoutHandle } from './agent_playout.js';
|
|
10
|
-
|
|
11
|
-
/**
 * Text input accepted for synthesis: a plain string, a promise that resolves to a
 * string, or an async iterable yielding string chunks.
 */
export type SpeechSource = AsyncIterable<string> | string | Promise<string>;
|
|
12
|
-
|
|
13
|
-
/**
 * Handle for a single synthesis request.
 *
 * Bundles the speech id, the text source, the TTS instance, the synchronizer and the
 * queue of audio frames that is handed to the playout once {@link SynthesisHandle.play}
 * is called. The handle can be interrupted at any time through
 * {@link SynthesisHandle.interrupt}.
 */
export class SynthesisHandle {
  /** Symbol that may appear in `queue` in place of an audio frame. */
  static readonly FLUSH_SENTINEL = Symbol('FLUSH_SENTINEL');

  #speechId: string;
  /** Synthesized text; left unset by this class itself. */
  text?: string;
  ttsSource: SpeechSource;
  #agentPlayout: AgentPlayout;
  tts: TTS;
  /** Items passed to the playout: audio frames or the flush sentinel. */
  queue = new AsyncIterableQueue<AudioFrame | typeof SynthesisHandle.FLUSH_SENTINEL>();
  #playHandle?: PlayoutHandle;
  /** Resolved by `interrupt()`; its `done` flag backs the `interrupted` getter. */
  intFut = new Future();
  #logger = log();
  synchronizer: TextAudioSynchronizer;

  constructor(
    speechId: string,
    ttsSource: SpeechSource,
    agentPlayout: AgentPlayout,
    tts: TTS,
    synchronizer: TextAudioSynchronizer,
  ) {
    this.#speechId = speechId;
    this.#agentPlayout = agentPlayout;
    this.ttsSource = ttsSource;
    this.tts = tts;
    this.synchronizer = synchronizer;
  }

  /** Identifier of the speech this handle belongs to. */
  get speechId(): string {
    return this.#speechId;
  }

  /** Playout handle created by `play()`, or `undefined` before validation. */
  get playHandle(): PlayoutHandle | undefined {
    return this.#playHandle;
  }

  /** Whether `play()` has produced a playout handle. */
  get validated(): boolean {
    return Boolean(this.#playHandle);
  }

  /** Whether the interruption future has completed. */
  get interrupted(): boolean {
    return this.intFut.done;
  }

  /**
   * Validate the speech for playout.
   *
   * @returns the playout handle obtained from the agent playout
   * @throws Error if the synthesis has already been interrupted
   */
  play(): PlayoutHandle {
    if (this.interrupted) {
      throw new Error('synthesis was interrupted');
    }

    const playHandle = this.#agentPlayout.play(this.#speechId, this.queue, this.synchronizer);
    this.#playHandle = playHandle;
    return playHandle;
  }

  /** Interrupt the speech; does nothing when it was already interrupted. */
  interrupt() {
    if (!this.interrupted) {
      const scopedLogger = this.#logger.child({ speechId: this.#speechId });
      scopedLogger.debug('interrupting synthesis/playout');
      // A playout handle only exists once play() has been called.
      this.#playHandle?.interrupt();
      this.intFut.resolve();
    }
  }
}
|
|
78
|
-
|
|
79
|
-
/**
 * Creates {@link SynthesisHandle}s for speech sources and tracks the background
 * synthesis task started for each of them so they can be cancelled on close.
 */
export class AgentOutput {
  #agentPlayout: AgentPlayout;
  #tts: TTS;
  /** Synthesis tasks that have been started and have not settled yet. */
  #tasks: CancellablePromise<void>[] = [];

  constructor(agentPlayout: AgentPlayout, tts: TTS) {
    this.#agentPlayout = agentPlayout;
    this.#tts = tts;
  }

  /** The playout passed to the constructor. */
  get playout(): AgentPlayout {
    return this.#agentPlayout;
  }

  /** Cancel every tracked synthesis task and wait for all of them to settle. */
  async close() {
    this.#tasks.forEach((task) => task.cancel());
    await Promise.all(this.#tasks);
  }

  /**
   * Start synthesizing `ttsSource` and return a handle for the resulting speech.
   *
   * @param speechId - identifier forwarded to the created handle
   * @param ttsSource - text to synthesize (string, promise of a string, or async iterable)
   * @param synchronizer - synchronizer forwarded to the created handle
   * @returns the handle; the synthesis itself keeps running in the background
   */
  synthesize(
    speechId: string,
    ttsSource: SpeechSource,
    synchronizer: TextAudioSynchronizer,
  ): SynthesisHandle {
    const handle = new SynthesisHandle(
      speechId,
      ttsSource,
      this.#agentPlayout,
      this.#tts,
      synchronizer,
    );
    const task = this.#synthesize(handle);
    this.#tasks.push(task);
    task.finally(() => {
      // Remove exactly this task. `splice(index)` without a delete count would drop
      // every task registered after it as well, and an index of -1 would drop the
      // last tracked task instead of nothing.
      const index = this.#tasks.indexOf(task);
      if (index !== -1) {
        this.#tasks.splice(index, 1);
      }
    });
    return handle;
  }

  /**
   * Run the synthesis for `handle` until it either finishes or the handle is
   * interrupted.
   *
   * On interruption the inner task is cancelled; otherwise the text the task
   * resolves with is stored on `handle.text`.
   */
  #synthesize(handle: SynthesisHandle): CancellablePromise<void> {
    // eslint-disable-next-line @typescript-eslint/no-unused-vars
    return new CancellablePromise(async (resolve, _, onCancel) => {
      // Awaiting unwraps a Promise<string> source; strings and iterables pass through.
      const ttsSource = await handle.ttsSource;
      let task: CancellablePromise<string>;
      if (typeof ttsSource === 'string') {
        task = stringSynthesisTask(ttsSource, handle);
      } else {
        task = streamSynthesisTask(ttsSource, handle);
      }

      onCancel(() => {
        gracefullyCancel(task);
      });

      try {
        // Continue as soon as either the synthesis or the interruption future fulfills.
        await Promise.any([task, handle.intFut.await]);
      } finally {
        if (handle.intFut.done) {
          gracefullyCancel(task);
        } else {
          task.then((text) => {
            handle.text = text;
          });
        }
      }

      resolve();
    });
  }
}
|
|
147
|
-
|
|
148
|
-
/**
 * Synthesize one complete string.
 *
 * Pushes the whole text into a fresh TTS stream and into the handle's
 * synchronizer, then copies the produced audio frames into the handle's queue.
 * A flush sentinel is always appended to the queue at the end, including after
 * cancellation.
 *
 * @param text - text to synthesize
 * @param handle - synthesis handle providing the TTS, synchronizer and queue
 * @returns a cancellable promise resolving to `text`
 */
const stringSynthesisTask = (text: string, handle: SynthesisHandle): CancellablePromise<string> => {
  // eslint-disable-next-line @typescript-eslint/no-unused-vars
  return new CancellablePromise(async (resolve, _, onCancel) => {
    let stopRequested = false;
    onCancel(() => {
      stopRequested = true;
    });

    const synthesis = handle.tts.stream();
    synthesis.pushText(text);
    handle.synchronizer.pushText(text);
    handle.synchronizer.markTextSegmentEnd();
    synthesis.flush();
    synthesis.endInput();

    for await (const chunk of synthesis) {
      if (stopRequested) {
        break;
      }
      if (chunk === SynthesizeStream.END_OF_STREAM) {
        break;
      }
      handle.queue.put(chunk.frame);
    }
    handle.queue.put(SynthesisHandle.FLUSH_SENTINEL);

    resolve(text);
  });
};
|
|
173
|
-
|
|
174
|
-
/**
 * Synthesize text that arrives incrementally.
 *
 * Audio produced by the TTS stream is copied into the handle's queue by a
 * reader that runs concurrently (it is started without being awaited), while
 * this task feeds incoming text pieces to the synchronizer and the TTS stream.
 *
 * @param stream - asynchronous source of text pieces
 * @param handle - synthesis handle providing the TTS, synchronizer and queue
 * @returns a cancellable promise resolving to the concatenation of all text
 *          pieces read from `stream`
 */
const streamSynthesisTask = (
  stream: AsyncIterable<string>,
  handle: SynthesisHandle,
): CancellablePromise<string> => {
  // eslint-disable-next-line @typescript-eslint/no-unused-vars
  return new CancellablePromise(async (resolve, _, onCancel) => {
    let stopRequested = false;
    let collectedText = '';
    onCancel(() => {
      stopRequested = true;
    });

    const synthesis = handle.tts.stream();

    // Copies synthesized frames into the queue until cancelled or the stream
    // ends, then marks the end of the audio with a flush sentinel.
    const forwardAudio = async () => {
      for await (const chunk of synthesis) {
        if (stopRequested || chunk === SynthesizeStream.END_OF_STREAM) {
          break;
        }
        handle.queue.put(chunk.frame);
      }
      handle.queue.put(SynthesisHandle.FLUSH_SENTINEL);
    };
    forwardAudio();

    for await (const piece of stream) {
      // The piece is recorded before the cancellation check, so the returned
      // text includes the piece during which cancellation was noticed.
      collectedText += piece;
      if (stopRequested) {
        break;
      }
      handle.synchronizer.pushText(piece);
      synthesis.pushText(piece);
    }
    if (!stopRequested) {
      handle.synchronizer.markTextSegmentEnd();
    }

    // end the audio queue early if there is no actual text to turn into speech
    if (collectedText.trim().length === 0) {
      stopRequested = true;
      handle.queue.put(SynthesisHandle.FLUSH_SENTINEL);
    }
    synthesis.flush();
    synthesis.endInput();

    resolve(collectedText);
  });
};
|
|
@@ -1,192 +0,0 @@
|
|
|
1
|
-
// SPDX-FileCopyrightText: 2024 LiveKit, Inc.
|
|
2
|
-
//
|
|
3
|
-
// SPDX-License-Identifier: Apache-2.0
|
|
4
|
-
import type { AudioFrame, AudioSource } from '@livekit/rtc-node';
|
|
5
|
-
import type { TypedEventEmitter as TypedEmitter } from '@livekit/typed-emitter';
|
|
6
|
-
import EventEmitter from 'node:events';
|
|
7
|
-
import { log } from '../log.js';
|
|
8
|
-
import type { TextAudioSynchronizer } from '../transcription.js';
|
|
9
|
-
import { CancellablePromise, Future, gracefullyCancel } from '../utils.js';
|
|
10
|
-
import { SynthesisHandle } from './agent_output.js';
|
|
11
|
-
|
|
12
|
-
/** Events emitted by `AgentPlayout`. */
export enum AgentPlayoutEvent {
  /** Emitted when the first audio frame of a playout is about to be captured. */
  PLAYOUT_STARTED = 0,
  /** Emitted when a playout that had started playing finishes or is stopped. */
  PLAYOUT_STOPPED = 1,
}
|
|
16
|
-
|
|
17
|
-
/** Listener signatures for each `AgentPlayoutEvent`. */
export type AgentPlayoutCallbacks = {
  /** Called without arguments when a playout starts. */
  [AgentPlayoutEvent.PLAYOUT_STARTED]: () => void;
  /** Called when a playout stops; `interrupt` tells whether it was interrupted. */
  [AgentPlayoutEvent.PLAYOUT_STOPPED]: (interrupt: boolean) => void;
};
|
|
21
|
-
|
|
22
|
-
/**
 * Tracks the playout of one speech: how much audio has been pushed, whether
 * the playout was interrupted, and when it is done.
 */
export class PlayoutHandle {
  #speechId: string;
  #audioSource: AudioSource;
  /** Frames to play, terminated by `SynthesisHandle.FLUSH_SENTINEL`. */
  playoutSource: AsyncIterable<AudioFrame | typeof SynthesisHandle.FLUSH_SENTINEL>;
  /** Final played time; set by the playout once it has finished or was cancelled. */
  totalPlayedTime?: number;
  synchronizer: TextAudioSynchronizer;
  #interrupted = false;
  /** Total duration of the frames pushed to the audio source so far. */
  pushedDuration = 0;
  /** Resolved by `interrupt()`. */
  intFut = new Future();
  /** Resolved by the playout when it has finished. */
  doneFut = new Future();

  /**
   * @param speechId - identifier of the speech being played
   * @param audioSource - audio source whose queued duration is used to
   *                      estimate the played time
   * @param playoutSource - frames to play
   * @param synchronizer - synchronizer associated with this playout
   */
  constructor(
    speechId: string,
    audioSource: AudioSource,
    playoutSource: AsyncIterable<AudioFrame | typeof SynthesisHandle.FLUSH_SENTINEL>,
    synchronizer: TextAudioSynchronizer,
  ) {
    this.#speechId = speechId;
    this.#audioSource = audioSource;
    this.playoutSource = playoutSource;
    this.synchronizer = synchronizer;
  }

  /** Identifier of the speech being played. */
  get speechId(): string {
    return this.#speechId;
  }

  /** `true` once `interrupt()` has taken effect. */
  get interrupted(): boolean {
    return this.#interrupted;
  }

  /**
   * Played time of this playout, in the same unit as `pushedDuration`.
   *
   * Returns the recorded `totalPlayedTime` when there is one; otherwise
   * estimates it as the pushed duration minus what is still queued.
   */
  get timePlayed(): number {
    // `??` rather than `||`: a recorded total of 0 is a valid final value and
    // must not fall back to the live estimate.
    return this.totalPlayedTime ?? this.pushedDuration - this.#audioSource.queuedDuration;
  }

  /** `true` when the playout has finished or was interrupted. */
  get done(): boolean {
    return this.doneFut.done || this.#interrupted;
  }

  /** Interrupt the playout; does nothing if it is already done. */
  interrupt() {
    if (this.done) {
      return;
    }

    this.intFut.resolve();
    this.#interrupted = true;
  }

  /** @returns the future that is resolved when the playout has finished */
  join(): Future {
    return this.doneFut;
  }
}
|
|
74
|
-
|
|
75
|
-
/**
 * Plays synthesized audio frames on an audio source, one playout at a time,
 * and emits `AgentPlayoutEvent`s as playouts start and stop.
 */
export class AgentPlayout extends (EventEmitter as new () => TypedEmitter<AgentPlayoutCallbacks>) {
  #closed = false;
  #audioSource: AudioSource;
  #targetVolume = 1;
  /** The most recently started playout task, if any. */
  #playoutTask?: CancellablePromise<void>;
  #logger = log();

  /** @param audioSource - audio source the frames are captured to */
  constructor(audioSource: AudioSource) {
    super();
    this.#audioSource = audioSource;
  }

  get targetVolume(): number {
    return this.#targetVolume;
  }

  set targetVolume(vol: number) {
    this.#targetVolume = vol;
  }

  /**
   * Start a new playout; the previous playout task (if any) is cancelled first.
   *
   * @param speechId - identifier of the speech
   * @param playoutSource - frames to play, terminated by the flush sentinel
   * @param synchronizer - synchronizer notified about the audio being played
   * @returns the handle tracking the new playout
   * @throws Error if `close()` has been called
   */
  play(
    speechId: string,
    playoutSource: AsyncIterable<AudioFrame | typeof SynthesisHandle.FLUSH_SENTINEL>,
    synchronizer: TextAudioSynchronizer,
  ): PlayoutHandle {
    if (this.#closed) {
      throw new Error('source closed');
    }

    const handle = new PlayoutHandle(speechId, this.#audioSource, playoutSource, synchronizer);

    this.#playoutTask = this.#playout(handle, this.#playoutTask);
    return handle;
  }

  /**
   * Run the playout for `handle` after cancelling `oldTask`.
   *
   * The task finishes when all frames were played, when the handle is
   * interrupted, or when the task itself is cancelled.
   */
  #playout(handle: PlayoutHandle, oldTask?: CancellablePromise<void>): CancellablePromise<void> {
    // eslint-disable-next-line @typescript-eslint/no-unused-vars
    return new CancellablePromise(async (resolve, _, onCancel) => {
      // Declared before `cancel` is defined: the task can be cancelled while
      // it is still waiting for the previous playout below, and `cancel` must
      // not touch these bindings before they are initialized.
      let firstFrame = true;
      let captureTask: CancellablePromise<void> | undefined;
      let cancelRequested = false;

      // Finalizes the playout: stops capturing, records the played time and
      // resolves the handle's done future.
      const cancel = () => {
        captureTask?.cancel();
        handle.totalPlayedTime = handle.pushedDuration - this.#audioSource.queuedDuration;

        if (handle.interrupted || captureTask?.error) {
          handle.synchronizer.close(true);
          this.#audioSource.clearQueue(); // make sure to remove any queued frames
        }

        // Only report a stop if a start was reported.
        if (!firstFrame) {
          this.emit(AgentPlayoutEvent.PLAYOUT_STOPPED, handle.interrupted);
        }

        handle.doneFut.resolve();

        this.#logger
          .child({ speechId: handle.speechId, interrupted: handle.interrupted })
          .debug('playout finished');
      };

      onCancel(() => {
        cancelRequested = true;
        cancel();
      });

      if (oldTask) {
        await gracefullyCancel(oldTask);
      }

      if (cancelRequested) {
        // Cancelled before capturing began; `cancel()` has already finalized
        // the handle, so no audio must be started for it.
        resolve();
        return;
      }

      if (this.#audioSource.queuedDuration > 0) {
        // this should not happen, but log it just in case
        this.#logger
          .child({ speechId: handle.speechId, queuedDuration: this.#audioSource.queuedDuration })
          .warn('new playout while the source is still playing');
      }

      // eslint-disable-next-line @typescript-eslint/no-unused-vars
      captureTask = new CancellablePromise<void>(async (resolve, _, onCancel) => {
        let cancelled = false;
        onCancel(() => {
          cancelled = true;
        });

        for await (const frame of handle.playoutSource) {
          if (cancelled || frame === SynthesisHandle.FLUSH_SENTINEL) {
            break;
          }
          if (firstFrame) {
            this.#logger
              .child({ speechId: handle.speechId })
              .debug('started playing the first time');
            this.emit(AgentPlayoutEvent.PLAYOUT_STARTED);
            handle.synchronizer.segmentPlayoutStarted();
            firstFrame = false;
          }
          // Frame duration in milliseconds.
          handle.pushedDuration += (frame.samplesPerChannel / frame.sampleRate) * 1000;
          handle.synchronizer.pushAudio(frame);
          await this.#audioSource.captureFrame(frame);
        }

        await this.#audioSource.waitForPlayout();

        handle.synchronizer.close(false);
        resolve();
      });

      try {
        // Settles when capturing completes or the handle is interrupted.
        await Promise.any([captureTask, handle.intFut.await]);
      } finally {
        cancel();
        resolve();
      }
    });
  }

  /** Refuse further playouts and wait for the current playout task to finish. */
  async close() {
    this.#closed = true;
    await this.#playoutTask;
  }
}
|
|
@@ -1,188 +0,0 @@
|
|
|
1
|
-
// SPDX-FileCopyrightText: 2024 LiveKit, Inc.
|
|
2
|
-
//
|
|
3
|
-
// SPDX-License-Identifier: Apache-2.0
|
|
4
|
-
import type {
|
|
5
|
-
NoiseCancellationOptions,
|
|
6
|
-
RemoteAudioTrack,
|
|
7
|
-
RemoteParticipant,
|
|
8
|
-
RemoteTrackPublication,
|
|
9
|
-
Room,
|
|
10
|
-
} from '@livekit/rtc-node';
|
|
11
|
-
import { AudioStream, RoomEvent, TrackSource } from '@livekit/rtc-node';
|
|
12
|
-
import type { TypedEventEmitter as TypedEmitter } from '@livekit/typed-emitter';
|
|
13
|
-
import { EventEmitter } from 'node:events';
|
|
14
|
-
import { log } from '../log.js';
|
|
15
|
-
import type { STT, SpeechEvent } from '../stt/stt.js';
|
|
16
|
-
import { SpeechEventType } from '../stt/stt.js';
|
|
17
|
-
import { CancellablePromise, gracefullyCancel } from '../utils.js';
|
|
18
|
-
import type { VAD, VADEvent } from '../vad.js';
|
|
19
|
-
import { VADEventType } from '../vad.js';
|
|
20
|
-
|
|
21
|
-
/** Events emitted by `HumanInput`. */
export enum HumanInputEvent {
  /** Voice activity detection reported the start of speech. */
  START_OF_SPEECH = 0,
  /** Voice activity detection finished an inference. */
  VAD_INFERENCE_DONE = 1,
  /** Voice activity detection reported the end of speech. */
  END_OF_SPEECH = 2,
  /** Speech-to-text produced a final transcript. */
  FINAL_TRANSCRIPT = 3,
  /** Speech-to-text produced an interim transcript. */
  INTERIM_TRANSCRIPT = 4,
}
|
|
28
|
-
|
|
29
|
-
/** Listener signatures for each `HumanInputEvent`. */
export type HumanInputCallbacks = {
  /** Receives the VAD event that marked the start of speech. */
  [HumanInputEvent.START_OF_SPEECH]: (event: VADEvent) => void;
  /** Receives the VAD event carrying the inference result. */
  [HumanInputEvent.VAD_INFERENCE_DONE]: (event: VADEvent) => void;
  /** Receives the VAD event that marked the end of speech. */
  [HumanInputEvent.END_OF_SPEECH]: (event: VADEvent) => void;
  /** Receives the speech event carrying a final transcript. */
  [HumanInputEvent.FINAL_TRANSCRIPT]: (event: SpeechEvent) => void;
  /** Receives the speech event carrying an interim transcript. */
  [HumanInputEvent.INTERIM_TRANSCRIPT]: (event: SpeechEvent) => void;
};
|
|
36
|
-
|
|
37
|
-
/**
 * Listens to a participant's microphone track, runs voice activity detection
 * and speech-to-text on it, and re-emits the results as `HumanInputEvent`s.
 */
export class HumanInput extends (EventEmitter as new () => TypedEmitter<HumanInputCallbacks>) {
  #closed = false;
  #room: Room;
  #vad: VAD;
  #stt: STT;
  #participant: RemoteParticipant;
  /** Track currently being recognized, if any. */
  #subscribedTrack?: RemoteAudioTrack;
  /** Recognition task for `#subscribedTrack`. */
  #recognizeTask?: CancellablePromise<void>;
  #speaking = false;
  #speechProbability = 0;
  #logger = log();
  #noiseCancellation?: NoiseCancellationOptions;
  /**
   * Room listener, kept as a single function instance so that `close()` can
   * detach exactly the listeners this object registered.
   */
  #onTrackChange = (): void => {
    this.#subscribeToMicrophone();
  };

  /**
   * @param room - room whose track events trigger (re)subscription
   * @param vad - voice activity detector used on the microphone audio
   * @param stt - speech-to-text engine used on the microphone audio
   * @param participant - participant whose microphone is listened to
   * @param noiseCancellation - optional options forwarded to the audio stream
   */
  constructor(
    room: Room,
    vad: VAD,
    stt: STT,
    participant: RemoteParticipant,
    noiseCancellation?: NoiseCancellationOptions,
  ) {
    super();
    this.#room = room;
    this.#vad = vad;
    this.#stt = stt;
    this.#participant = participant;
    this.#noiseCancellation = noiseCancellation;

    this.#room.on(RoomEvent.TrackPublished, this.#onTrackChange);
    this.#room.on(RoomEvent.TrackSubscribed, this.#onTrackChange);
    this.#subscribeToMicrophone();
  }

  get participant(): RemoteParticipant {
    return this.#participant;
  }

  get subscribedTrack(): RemoteAudioTrack | undefined {
    return this.#subscribedTrack;
  }

  /**
   * Find the participant's microphone publication, subscribe to it if needed,
   * and start recognizing its track when the track is new.
   */
  #subscribeToMicrophone(): void {
    if (!this.#participant) {
      this.#logger.error('Participant is not set');
      return;
    }

    let microphonePublication: RemoteTrackPublication | undefined = undefined;
    for (const publication of this.#participant.trackPublications.values()) {
      if (publication.source === TrackSource.SOURCE_MICROPHONE) {
        microphonePublication = publication;
        break;
      }
    }
    if (!microphonePublication) {
      return;
    }

    if (!microphonePublication.subscribed) {
      microphonePublication.setSubscribed(true);
    }

    const track = microphonePublication.track;
    if (track && track !== this.#subscribedTrack) {
      this.#subscribedTrack = track;
      // A different track replaces the current one: stop recognizing the old one.
      if (this.#recognizeTask) {
        this.#recognizeTask.cancel();
      }

      const audioStreamOptions = {
        sampleRate: 16000,
        numChannels: 1,
        ...(this.#noiseCancellation ? { noiseCancellation: this.#noiseCancellation } : {}),
      };
      const audioStream = new AudioStream(track, audioStreamOptions);

      // eslint-disable-next-line @typescript-eslint/no-unused-vars
      this.#recognizeTask = new CancellablePromise(async (resolve, _, onCancel) => {
        let cancelled = false;
        onCancel(() => {
          cancelled = true;
        });

        const sttStream = this.#stt.stream();
        const vadStream = this.#vad.stream();

        // Feeds every audio frame to both the STT and the VAD stream.
        const audioStreamCo = async () => {
          for await (const ev of audioStream) {
            if (cancelled) return;
            sttStream.pushFrame(ev);
            vadStream.pushFrame(ev);
          }
        };

        // Tracks the speaking state and re-emits VAD events.
        const vadStreamCo = async () => {
          for await (const ev of vadStream) {
            if (cancelled) return;
            switch (ev.type) {
              case VADEventType.START_OF_SPEECH:
                this.#speaking = true;
                this.emit(HumanInputEvent.START_OF_SPEECH, ev);
                break;
              case VADEventType.INFERENCE_DONE:
                this.#speechProbability = ev.probability;
                this.emit(HumanInputEvent.VAD_INFERENCE_DONE, ev);
                break;
              case VADEventType.END_OF_SPEECH:
                this.#speaking = false;
                this.emit(HumanInputEvent.END_OF_SPEECH, ev);
                break;
            }
          }
        };

        // Re-emits final and interim transcripts; other STT events are ignored.
        const sttStreamCo = async () => {
          for await (const ev of sttStream) {
            if (cancelled) return;
            if (ev.type === SpeechEventType.FINAL_TRANSCRIPT) {
              this.emit(HumanInputEvent.FINAL_TRANSCRIPT, ev);
            } else if (ev.type === SpeechEventType.INTERIM_TRANSCRIPT) {
              this.emit(HumanInputEvent.INTERIM_TRANSCRIPT, ev);
            }
          }
        };

        await Promise.all([audioStreamCo(), vadStreamCo(), sttStreamCo()]);
        sttStream.close();
        vadStream.close();
        resolve();
      });
    }
  }

  /** Whether the last VAD start/end event indicated ongoing speech. */
  get speaking(): boolean {
    return this.#speaking;
  }

  /** Probability reported by the most recent VAD inference. */
  get speakingProbability(): number {
    return this.#speechProbability;
  }

  /**
   * Stop listening to the room and cancel the running recognition task.
   *
   * @throws Error if called more than once
   */
  async close() {
    if (this.#closed) {
      throw new Error('HumanInput already closed');
    }
    this.#closed = true;
    // Detach only the listeners registered by this instance; the room is
    // passed in from outside and other code may have its own listeners on it.
    this.#room.off(RoomEvent.TrackPublished, this.#onTrackChange);
    this.#room.off(RoomEvent.TrackSubscribed, this.#onTrackChange);
    this.#speaking = false;
    if (this.#recognizeTask) {
      await gracefullyCancel(this.#recognizeTask);
    }
  }
}
|
package/src/pipeline/index.ts
DELETED
|
@@ -1,15 +0,0 @@
|
|
|
1
|
-
// SPDX-FileCopyrightText: 2024 LiveKit, Inc.
|
|
2
|
-
//
|
|
3
|
-
// SPDX-License-Identifier: Apache-2.0
|
|
4
|
-
|
|
5
|
-
export {
|
|
6
|
-
type AgentState,
|
|
7
|
-
type BeforeTTSCallback,
|
|
8
|
-
type BeforeLLMCallback,
|
|
9
|
-
type VPACallbacks,
|
|
10
|
-
type AgentTranscriptionOptions,
|
|
11
|
-
type VPAOptions,
|
|
12
|
-
VPAEvent,
|
|
13
|
-
VoicePipelineAgent,
|
|
14
|
-
AgentCallContext,
|
|
15
|
-
} from './pipeline_agent.js';
|