@elizaos/plugin-local-inference 2.0.3-beta.2 → 2.0.3-beta.4
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +84 -10
- package/dist/actions/generate-media.d.ts.map +1 -0
- package/dist/actions/identify-speaker.d.ts.map +1 -0
- package/dist/actions/transcription-control.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/environment.d.ts +12 -0
- package/dist/adapters/capacitor-llama/environment.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/index.browser.d.ts +9 -0
- package/dist/adapters/capacitor-llama/index.browser.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/index.d.ts +18 -0
- package/dist/adapters/capacitor-llama/index.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/loader.d.ts +35 -0
- package/dist/adapters/capacitor-llama/loader.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/native-voice-capture.d.ts +70 -0
- package/dist/adapters/capacitor-llama/native-voice-capture.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/structured-output.d.ts +62 -0
- package/dist/adapters/capacitor-llama/structured-output.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/text-streaming.d.ts +24 -0
- package/dist/adapters/capacitor-llama/text-streaming.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/types.d.ts +338 -0
- package/dist/adapters/capacitor-llama/types.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/voice-turn.d.ts +86 -0
- package/dist/adapters/capacitor-llama/voice-turn.d.ts.map +1 -0
- package/dist/backends/apple-foundation.d.ts +56 -0
- package/dist/backends/apple-foundation.d.ts.map +1 -0
- package/dist/index.d.ts.map +1 -0
- package/dist/index.js +39647 -0
- package/dist/index.js.map +217 -0
- package/{src → dist}/local-inference-routes.d.ts +9 -0
- package/dist/local-inference-routes.d.ts.map +1 -0
- package/dist/provider.d.ts.map +1 -0
- package/{src → dist}/routes/compat-helpers.d.ts +1 -1
- package/dist/routes/compat-helpers.d.ts.map +1 -0
- package/dist/routes/family-member-route.d.ts.map +1 -0
- package/{src → dist}/routes/index.d.ts +1 -0
- package/dist/routes/index.d.ts.map +1 -0
- package/dist/routes/index.js +42040 -0
- package/dist/routes/index.js.map +236 -0
- package/{src → dist}/routes/live-diarization-route.d.ts +7 -0
- package/dist/routes/live-diarization-route.d.ts.map +1 -0
- package/dist/routes/local-inference-asr-route.d.ts.map +1 -0
- package/dist/routes/local-inference-asr-transcribe.d.ts.map +1 -0
- package/dist/routes/local-inference-compat-routes.d.ts.map +1 -0
- package/dist/routes/local-inference-tts-route.d.ts.map +1 -0
- package/dist/routes/native-pcm-turn-route.d.ts +3 -0
- package/dist/routes/native-pcm-turn-route.d.ts.map +1 -0
- package/dist/routes/transcript-audio-store.d.ts.map +1 -0
- package/{src → dist}/routes/transcripts-routes.d.ts +8 -0
- package/dist/routes/transcripts-routes.d.ts.map +1 -0
- package/dist/routes/voice-first-run-routes.d.ts.map +1 -0
- package/dist/routes/voice-models-routes.d.ts.map +1 -0
- package/dist/routes/voice-profile-plugin-routes.d.ts.map +1 -0
- package/dist/routes/voice-profiles-management-routes.d.ts.map +1 -0
- package/dist/routes/voice-speaker-profile-routes.d.ts.map +1 -0
- package/dist/runtime/embedding-manager-support.d.ts.map +1 -0
- package/dist/runtime/embedding-presets.d.ts.map +1 -0
- package/dist/runtime/embedding-warmup-policy.d.ts.map +1 -0
- package/{src → dist}/runtime/ensure-local-inference-handler.d.ts +8 -0
- package/dist/runtime/ensure-local-inference-handler.d.ts.map +1 -0
- package/{src → dist}/runtime/index.d.ts +1 -1
- package/dist/runtime/index.d.ts.map +1 -0
- package/dist/runtime/index.js +38768 -0
- package/dist/runtime/index.js.map +217 -0
- package/dist/runtime/mobile-local-inference-gate.d.ts +63 -0
- package/dist/runtime/mobile-local-inference-gate.d.ts.map +1 -0
- package/{src → dist}/runtime/voice-entity-binding.d.ts +10 -0
- package/dist/runtime/voice-entity-binding.d.ts.map +1 -0
- package/{src → dist}/services/active-model.d.ts +28 -0
- package/dist/services/active-model.d.ts.map +1 -0
- package/dist/services/asr-provenance.d.ts +5 -0
- package/dist/services/asr-provenance.d.ts.map +1 -0
- package/{src → dist}/services/assignments.d.ts +16 -3
- package/dist/services/assignments.d.ts.map +1 -0
- package/dist/services/backend-selector.d.ts +55 -0
- package/dist/services/backend-selector.d.ts.map +1 -0
- package/{src → dist}/services/backend.d.ts +110 -16
- package/dist/services/backend.d.ts.map +1 -0
- package/{src → dist}/services/bionic-host-loader.d.ts +21 -0
- package/dist/services/bionic-host-loader.d.ts.map +1 -0
- package/dist/services/bundled-models.d.ts.map +1 -0
- package/dist/services/cache-bridge.d.ts.map +1 -0
- package/dist/services/catalog.d.ts +10 -0
- package/dist/services/catalog.d.ts.map +1 -0
- package/dist/services/checkpoint-client.d.ts.map +1 -0
- package/dist/services/checkpoint-manager.d.ts +217 -0
- package/dist/services/checkpoint-manager.d.ts.map +1 -0
- package/dist/services/cloud-fallback.d.ts.map +1 -0
- package/dist/services/context-fit.d.ts +36 -0
- package/dist/services/context-fit.d.ts.map +1 -0
- package/dist/services/conversation-registry.d.ts.map +1 -0
- package/{src → dist}/services/desktop-fused-ffi-backend-runtime.d.ts +22 -6
- package/dist/services/desktop-fused-ffi-backend-runtime.d.ts.map +1 -0
- package/dist/services/device-bridge.d.ts.map +1 -0
- package/dist/services/device-resource-metrics.d.ts.map +1 -0
- package/{src → dist}/services/device-tier.d.ts +19 -1
- package/dist/services/device-tier.d.ts.map +1 -0
- package/{src → dist}/services/downloader.d.ts +16 -4
- package/dist/services/downloader.d.ts.map +1 -0
- package/{src → dist}/services/engine.d.ts +43 -4
- package/dist/services/engine.d.ts.map +1 -0
- package/dist/services/ensure-local-artifacts.d.ts +82 -0
- package/dist/services/ensure-local-artifacts.d.ts.map +1 -0
- package/dist/services/external-scanner.d.ts.map +1 -0
- package/dist/services/ffi-llm-mock.d.ts +90 -0
- package/dist/services/ffi-llm-mock.d.ts.map +1 -0
- package/dist/services/ffi-llm-streaming-abi.d.ts +318 -0
- package/dist/services/ffi-llm-streaming-abi.d.ts.map +1 -0
- package/{src → dist}/services/ffi-streaming-backend.d.ts +28 -7
- package/dist/services/ffi-streaming-backend.d.ts.map +1 -0
- package/{src → dist}/services/ffi-streaming-runner.d.ts +24 -0
- package/dist/services/ffi-streaming-runner.d.ts.map +1 -0
- package/dist/services/gpu-autotune.d.ts +150 -0
- package/dist/services/gpu-autotune.d.ts.map +1 -0
- package/dist/services/gpu-detect.d.ts.map +1 -0
- package/dist/services/handler-registry.d.ts.map +1 -0
- package/dist/services/hardware.d.ts.map +1 -0
- package/dist/services/image-description-runtime.d.ts.map +1 -0
- package/dist/services/imagegen/aosp-unavailable.d.ts.map +1 -0
- package/dist/services/imagegen/backend-selector.d.ts.map +1 -0
- package/dist/services/imagegen/coreml-unavailable.d.ts.map +1 -0
- package/dist/services/imagegen/errors.d.ts.map +1 -0
- package/dist/services/imagegen/index.d.ts.map +1 -0
- package/dist/services/imagegen/mflux.d.ts.map +1 -0
- package/{src → dist}/services/imagegen/sd-cpp.d.ts +1 -0
- package/dist/services/imagegen/sd-cpp.d.ts.map +1 -0
- package/dist/services/imagegen/tensorrt-unavailable.d.ts.map +1 -0
- package/dist/services/imagegen/types.d.ts.map +1 -0
- package/{src → dist}/services/index.d.ts +3 -1
- package/dist/services/index.d.ts.map +1 -0
- package/dist/services/index.js +39453 -0
- package/dist/services/index.js.map +227 -0
- package/dist/services/inference-capabilities.d.ts.map +1 -0
- package/dist/services/inference-telemetry.d.ts.map +1 -0
- package/dist/services/ios-llama-streaming.d.ts +119 -0
- package/dist/services/ios-llama-streaming.d.ts.map +1 -0
- package/dist/services/kv-spill.d.ts.map +1 -0
- package/dist/services/latency-trace.d.ts.map +1 -0
- package/dist/services/lib-target.d.ts +55 -0
- package/dist/services/lib-target.d.ts.map +1 -0
- package/dist/services/live-signals.d.ts +86 -0
- package/dist/services/live-signals.d.ts.map +1 -0
- package/dist/services/llama-server-metrics.d.ts +114 -0
- package/dist/services/llama-server-metrics.d.ts.map +1 -0
- package/dist/services/llm-streaming-binding.d.ts.map +1 -0
- package/dist/services/load-args.d.ts.map +1 -0
- package/dist/services/manifest/index.d.ts +4 -0
- package/dist/services/manifest/index.d.ts.map +1 -0
- package/{src → dist}/services/manifest/schema.d.ts +196 -6
- package/dist/services/manifest/schema.d.ts.map +1 -0
- package/{src → dist}/services/manifest/types.d.ts +3 -1
- package/dist/services/manifest/types.d.ts.map +1 -0
- package/dist/services/manifest/validator.d.ts.map +1 -0
- package/{src → dist}/services/memory-arbiter.d.ts +33 -3
- package/dist/services/memory-arbiter.d.ts.map +1 -0
- package/dist/services/memory-benchmark.d.ts +76 -0
- package/dist/services/memory-benchmark.d.ts.map +1 -0
- package/{src → dist}/services/memory-monitor.d.ts +6 -0
- package/dist/services/memory-monitor.d.ts.map +1 -0
- package/dist/services/memory-pressure.d.ts.map +1 -0
- package/dist/services/mtp-doctor.d.ts.map +1 -0
- package/dist/services/network-policy.d.ts.map +1 -0
- package/dist/services/paths.d.ts.map +1 -0
- package/dist/services/planner-skeleton.d.ts.map +1 -0
- package/dist/services/providers.d.ts.map +1 -0
- package/dist/services/ram-budget.d.ts.map +1 -0
- package/dist/services/readiness.d.ts.map +1 -0
- package/dist/services/recommendation.d.ts.map +1 -0
- package/{src → dist}/services/registry.d.ts +11 -13
- package/dist/services/registry.d.ts.map +1 -0
- package/{src → dist}/services/router-handler.d.ts +2 -2
- package/dist/services/router-handler.d.ts.map +1 -0
- package/{src → dist}/services/routing-policy.d.ts +32 -9
- package/dist/services/routing-policy.d.ts.map +1 -0
- package/dist/services/routing-preferences.d.ts.map +1 -0
- package/dist/services/runtime-target.d.ts.map +1 -0
- package/{src → dist}/services/service.d.ts +1 -1
- package/dist/services/service.d.ts.map +1 -0
- package/dist/services/session-pool.d.ts.map +1 -0
- package/dist/services/structured-output/deterministic-repair.d.ts.map +1 -0
- package/dist/services/structured-output/index.d.ts +2 -0
- package/dist/services/structured-output/index.d.ts.map +1 -0
- package/dist/services/structured-output.d.ts.map +1 -0
- package/dist/services/system-memory.d.ts.map +1 -0
- package/{src → dist}/services/types.d.ts +1 -1
- package/dist/services/types.d.ts.map +1 -0
- package/dist/services/verify-on-device.d.ts.map +1 -0
- package/dist/services/verify.d.ts.map +1 -0
- package/dist/services/vision/aosp-unavailable.d.ts.map +1 -0
- package/dist/services/vision/capacitor-llama.d.ts.map +1 -0
- package/dist/services/vision/cloud-fallback.d.ts.map +1 -0
- package/dist/services/vision/hash.d.ts.map +1 -0
- package/{src → dist}/services/vision/index.d.ts +1 -1
- package/dist/services/vision/index.d.ts.map +1 -0
- package/dist/services/vision/llama-server.d.ts.map +1 -0
- package/{src → dist}/services/vision/types.d.ts +13 -4
- package/dist/services/vision/types.d.ts.map +1 -0
- package/dist/services/vision/vast-fallback.d.ts.map +1 -0
- package/{src → dist}/services/vision-embedding-cache.d.ts +1 -1
- package/dist/services/vision-embedding-cache.d.ts.map +1 -0
- package/dist/services/voice/__test-helpers__/fake-ffi.d.ts +27 -0
- package/dist/services/voice/__test-helpers__/fake-ffi.d.ts.map +1 -0
- package/dist/services/voice/__test-helpers__/synthetic-speech.d.ts +66 -0
- package/dist/services/voice/__test-helpers__/synthetic-speech.d.ts.map +1 -0
- package/dist/services/voice/acoustic-speaker-attribution.d.ts +61 -0
- package/dist/services/voice/acoustic-speaker-attribution.d.ts.map +1 -0
- package/{src → dist}/services/voice/audio-frame-consumer.d.ts +82 -0
- package/dist/services/voice/audio-frame-consumer.d.ts.map +1 -0
- package/dist/services/voice/barge-in.d.ts.map +1 -0
- package/dist/services/voice/cancellation-coordinator.d.ts.map +1 -0
- package/dist/services/voice/checkpoint-manager.d.ts.map +1 -0
- package/dist/services/voice/checkpoint-policy.d.ts +178 -0
- package/dist/services/voice/checkpoint-policy.d.ts.map +1 -0
- package/dist/services/voice/corpus-augment.d.ts +111 -0
- package/dist/services/voice/corpus-augment.d.ts.map +1 -0
- package/dist/services/voice/corpus-generator.d.ts +134 -0
- package/dist/services/voice/corpus-generator.d.ts.map +1 -0
- package/dist/services/voice/diarization-error-rate.d.ts +40 -0
- package/dist/services/voice/diarization-error-rate.d.ts.map +1 -0
- package/dist/services/voice/e2e-harness.d.ts +297 -0
- package/dist/services/voice/e2e-harness.d.ts.map +1 -0
- package/dist/services/voice/eager-context-builder.d.ts.map +1 -0
- package/dist/services/voice/echo-delay.d.ts +67 -0
- package/dist/services/voice/echo-delay.d.ts.map +1 -0
- package/dist/services/voice/echo-metrics.d.ts +7 -0
- package/dist/services/voice/echo-metrics.d.ts.map +1 -0
- package/dist/services/voice/echo-reference-buffer.d.ts +65 -0
- package/dist/services/voice/echo-reference-buffer.d.ts.map +1 -0
- package/{src → dist}/services/voice/eliza1-eot-scorer.d.ts +8 -8
- package/dist/services/voice/eliza1-eot-scorer.d.ts.map +1 -0
- package/dist/services/voice/embedding-server.d.ts +37 -0
- package/dist/services/voice/embedding-server.d.ts.map +1 -0
- package/{src → dist}/services/voice/embedding.d.ts +2 -3
- package/dist/services/voice/embedding.d.ts.map +1 -0
- package/dist/services/voice/emotion-attribution.d.ts.map +1 -0
- package/{src → dist}/services/voice/engine-bridge.d.ts +8 -5
- package/dist/services/voice/engine-bridge.d.ts.map +1 -0
- package/{src → dist}/services/voice/eot-classifier-ggml.d.ts +22 -22
- package/dist/services/voice/eot-classifier-ggml.d.ts.map +1 -0
- package/{src → dist}/services/voice/eot-classifier.d.ts +9 -12
- package/dist/services/voice/eot-classifier.d.ts.map +1 -0
- package/{src → dist}/services/voice/errors.d.ts +1 -1
- package/dist/services/voice/errors.d.ts.map +1 -0
- package/{src → dist}/services/voice/expressive-tags.d.ts +5 -5
- package/dist/services/voice/expressive-tags.d.ts.map +1 -0
- package/{src → dist}/services/voice/ffi-bindings.d.ts +26 -4
- package/dist/services/voice/ffi-bindings.d.ts.map +1 -0
- package/dist/services/voice/first-line-cache.d.ts.map +1 -0
- package/{src → dist}/services/voice/fused-eot-scorer.d.ts +6 -6
- package/dist/services/voice/fused-eot-scorer.d.ts.map +1 -0
- package/{src → dist}/services/voice/index.d.ts +8 -3
- package/dist/services/voice/index.d.ts.map +1 -0
- package/dist/services/voice/kokoro/index.d.ts +24 -0
- package/dist/services/voice/kokoro/index.d.ts.map +1 -0
- package/{src → dist}/services/voice/kokoro/kokoro-backend.d.ts +15 -0
- package/dist/services/voice/kokoro/kokoro-backend.d.ts.map +1 -0
- package/{src → dist}/services/voice/kokoro/kokoro-engine-discovery.d.ts +1 -1
- package/dist/services/voice/kokoro/kokoro-engine-discovery.d.ts.map +1 -0
- package/{src → dist}/services/voice/kokoro/kokoro-ffi-runtime.d.ts +3 -3
- package/dist/services/voice/kokoro/kokoro-ffi-runtime.d.ts.map +1 -0
- package/dist/services/voice/kokoro/kokoro-runtime.d.ts.map +1 -0
- package/dist/services/voice/kokoro/phoneme-stream.d.ts +51 -0
- package/dist/services/voice/kokoro/phoneme-stream.d.ts.map +1 -0
- package/dist/services/voice/kokoro/phonemizer.d.ts.map +1 -0
- package/{src → dist}/services/voice/kokoro/pick-runtime.d.ts +1 -1
- package/dist/services/voice/kokoro/pick-runtime.d.ts.map +1 -0
- package/dist/services/voice/kokoro/runtime-selection.d.ts +31 -0
- package/dist/services/voice/kokoro/runtime-selection.d.ts.map +1 -0
- package/dist/services/voice/kokoro/types.d.ts.map +1 -0
- package/dist/services/voice/kokoro/voice-presets.d.ts.map +1 -0
- package/dist/services/voice/kokoro/voices.d.ts.map +1 -0
- package/dist/services/voice/lifecycle.d.ts.map +1 -0
- package/dist/services/voice/live-diarization-session.d.ts +196 -0
- package/dist/services/voice/live-diarization-session.d.ts.map +1 -0
- package/dist/services/voice/metric-math.d.ts +10 -0
- package/dist/services/voice/metric-math.d.ts.map +1 -0
- package/{src → dist}/services/voice/mic-source.d.ts +1 -1
- package/dist/services/voice/mic-source.d.ts.map +1 -0
- package/dist/services/voice/nlms-echo-canceller.d.ts +137 -0
- package/dist/services/voice/nlms-echo-canceller.d.ts.map +1 -0
- package/dist/services/voice/optimistic-policy.d.ts.map +1 -0
- package/dist/services/voice/optimistic-rollback.d.ts +151 -0
- package/dist/services/voice/optimistic-rollback.d.ts.map +1 -0
- package/{src → dist}/services/voice/partial-stabilizer.d.ts +1 -1
- package/dist/services/voice/partial-stabilizer.d.ts.map +1 -0
- package/dist/services/voice/phoneme-tokenizer.d.ts.map +1 -0
- package/dist/services/voice/phrase-cache.d.ts.map +1 -0
- package/dist/services/voice/phrase-chunker.d.ts.map +1 -0
- package/dist/services/voice/pipeline-impls.d.ts.map +1 -0
- package/dist/services/voice/pipeline.d.ts.map +1 -0
- package/dist/services/voice/prefill-client.d.ts.map +1 -0
- package/dist/services/voice/prefix-preserving-queue.d.ts.map +1 -0
- package/dist/services/voice/profile-store.d.ts.map +1 -0
- package/dist/services/voice/ring-buffer.d.ts.map +1 -0
- package/dist/services/voice/rollback-queue.d.ts.map +1 -0
- package/dist/services/voice/samantha-preset-placeholder.d.ts.map +1 -0
- package/dist/services/voice/samantha-preset-regenerator.d.ts.map +1 -0
- package/dist/services/voice/scheduler.d.ts.map +1 -0
- package/dist/services/voice/self-voice-imprint.d.ts +33 -0
- package/dist/services/voice/self-voice-imprint.d.ts.map +1 -0
- package/{src → dist}/services/voice/shared-resources.d.ts +14 -0
- package/dist/services/voice/shared-resources.d.ts.map +1 -0
- package/dist/services/voice/speaker/attribution-pipeline.d.ts.map +1 -0
- package/dist/services/voice/speaker/diarizer-fused.d.ts.map +1 -0
- package/dist/services/voice/speaker/diarizer.d.ts.map +1 -0
- package/dist/services/voice/speaker/encoder-fused.d.ts.map +1 -0
- package/dist/services/voice/speaker/encoder-ggml.d.ts.map +1 -0
- package/dist/services/voice/speaker/encoder.d.ts.map +1 -0
- package/dist/services/voice/speaker-imprint.d.ts.map +1 -0
- package/dist/services/voice/speaker-preset-cache.d.ts.map +1 -0
- package/dist/services/voice/streaming-asr/streaming-pipeline-adapter.d.ts +160 -0
- package/dist/services/voice/streaming-asr/streaming-pipeline-adapter.d.ts.map +1 -0
- package/dist/services/voice/system-audio-sink.d.ts.map +1 -0
- package/{src → dist}/services/voice/transcriber.d.ts +4 -4
- package/dist/services/voice/transcriber.d.ts.map +1 -0
- package/dist/services/voice/transcript-knowledge.d.ts.map +1 -0
- package/{src → dist}/services/voice/transcript-service.d.ts +20 -1
- package/dist/services/voice/transcript-service.d.ts.map +1 -0
- package/{src → dist}/services/voice/transcript-store.d.ts +12 -1
- package/dist/services/voice/transcript-store.d.ts.map +1 -0
- package/dist/services/voice/turn-controller.d.ts.map +1 -0
- package/{src → dist}/services/voice/types.d.ts +6 -6
- package/dist/services/voice/types.d.ts.map +1 -0
- package/{src → dist}/services/voice/vad.d.ts +6 -5
- package/dist/services/voice/vad.d.ts.map +1 -0
- package/dist/services/voice/voice-budget.d.ts.map +1 -0
- package/dist/services/voice/voice-emotion-classifier.d.ts.map +1 -0
- package/dist/services/voice/voice-preload-predictor.d.ts +76 -0
- package/dist/services/voice/voice-preload-predictor.d.ts.map +1 -0
- package/{src → dist}/services/voice/voice-preset-format.d.ts +2 -2
- package/dist/services/voice/voice-preset-format.d.ts.map +1 -0
- package/dist/services/voice/voice-profile-artifact.d.ts.map +1 -0
- package/dist/services/voice/voice-profile-routes.d.ts.map +1 -0
- package/dist/services/voice/voice-scenario.d.ts +131 -0
- package/dist/services/voice/voice-scenario.d.ts.map +1 -0
- package/dist/services/voice/voice-state-machine.d.ts.map +1 -0
- package/dist/services/voice/voice-workbench-report.d.ts +117 -0
- package/dist/services/voice/voice-workbench-report.d.ts.map +1 -0
- package/{src → dist}/services/voice/wake-word-ggml.d.ts +8 -9
- package/dist/services/voice/wake-word-ggml.d.ts.map +1 -0
- package/dist/services/voice/wake-word.d.ts.map +1 -0
- package/dist/services/voice/wav-codec.d.ts +11 -0
- package/dist/services/voice/wav-codec.d.ts.map +1 -0
- package/dist/services/voice/workbench-entrypoint.d.ts +42 -0
- package/dist/services/voice/workbench-entrypoint.d.ts.map +1 -0
- package/dist/services/voice/workbench-headless-runner.d.ts +102 -0
- package/dist/services/voice/workbench-headless-runner.d.ts.map +1 -0
- package/dist/services/voice/workbench-logic-services.d.ts +36 -0
- package/dist/services/voice/workbench-logic-services.d.ts.map +1 -0
- package/dist/services/voice/workbench-real-services.d.ts +17 -0
- package/dist/services/voice/workbench-real-services.d.ts.map +1 -0
- package/dist/services/voice/workbench-scenarios.d.ts +24 -0
- package/dist/services/voice/workbench-scenarios.d.ts.map +1 -0
- package/dist/services/voice/wrap-with-first-line-cache.d.ts.map +1 -0
- package/dist/services/voice-model-updater.d.ts.map +1 -0
- package/dist/services/voice-prewarm.d.ts.map +1 -0
- package/dist/voice-workbench.d.ts +18 -0
- package/dist/voice-workbench.d.ts.map +1 -0
- package/dist/voice-workbench.js +5259 -0
- package/dist/voice-workbench.js.map +34 -0
- package/package.json +28 -9
- package/registry-entry.json +137 -0
- package/src/adapters/capacitor-llama/__tests__/voice-turn.test.ts +293 -0
- package/src/adapters/capacitor-llama/environment.ts +1 -1
- package/src/adapters/capacitor-llama/index.ts +28 -4
- package/src/adapters/capacitor-llama/native-voice-capture.ts +140 -0
- package/src/adapters/capacitor-llama/text-streaming.ts +2 -2
- package/src/adapters/capacitor-llama/voice-turn.ts +178 -0
- package/src/backends/apple-foundation.ts +1 -1
- package/src/local-inference-routes.test.ts +57 -11
- package/src/local-inference-routes.ts +90 -8
- package/src/provider.ts +32 -3
- package/src/routes/compat-helpers.ts +2 -1
- package/src/routes/index.ts +1 -0
- package/src/routes/live-diarization-route.test.ts +134 -0
- package/src/routes/live-diarization-route.ts +79 -3
- package/src/routes/local-inference-asr-route.test.ts +43 -2
- package/src/routes/local-inference-asr-route.ts +7 -4
- package/src/routes/local-inference-asr-transcribe.test.ts +4 -4
- package/src/routes/local-inference-asr-transcribe.ts +1 -1
- package/src/routes/local-inference-compat-routes.test.ts +3 -3
- package/src/routes/local-inference-compat-routes.ts +23 -56
- package/src/routes/native-pcm-turn-route.test.ts +136 -0
- package/src/routes/native-pcm-turn-route.ts +121 -0
- package/src/routes/transcripts-routes.test.ts +51 -0
- package/src/routes/transcripts-routes.ts +35 -3
- package/src/runtime/bionic-wire-encoding.test.ts +147 -0
- package/src/runtime/ensure-local-inference-handler.test.ts +203 -5
- package/src/runtime/ensure-local-inference-handler.ts +203 -11
- package/src/runtime/index.ts +4 -1
- package/src/runtime/mobile-local-inference-gate.test.ts +85 -2
- package/src/runtime/mobile-local-inference-gate.ts +60 -5
- package/src/runtime/voice-entity-binding.transcript.test.ts +29 -0
- package/src/runtime/voice-entity-binding.ts +46 -6
- package/src/runtime/voice-speaker-entity-contract.test.ts +149 -0
- package/src/services/README.md +2 -2
- package/src/services/__tests__/backend-selector.precedence.test.ts +333 -0
- package/src/services/active-model-context-fit.test.ts +125 -0
- package/src/services/active-model.ts +211 -8
- package/src/services/asr-provenance.ts +68 -0
- package/src/services/assignment-validation.test.ts +118 -0
- package/src/services/assignments.test.ts +26 -0
- package/src/services/assignments.ts +52 -4
- package/src/services/backend.test.ts +84 -0
- package/src/services/backend.ts +198 -19
- package/src/services/bionic-host-loader.test.ts +94 -1
- package/src/services/bionic-host-loader.ts +72 -0
- package/src/services/cache-bridge.test.ts +7 -7
- package/src/services/catalog.test.ts +32 -11
- package/src/services/catalog.ts +6 -0
- package/src/services/cloud-fallback.ts +1 -1
- package/src/services/context-fit.test.ts +121 -0
- package/src/services/context-fit.ts +113 -0
- package/src/services/desktop-fused-ffi-backend-runtime.ts +99 -7
- package/src/services/device-tier.test.ts +89 -2
- package/src/services/device-tier.ts +103 -11
- package/src/services/downloader.test.ts +199 -58
- package/src/services/downloader.ts +141 -27
- package/src/services/engine-direct-bundle.test.ts +38 -6
- package/src/services/engine.ts +291 -104
- package/src/services/ensure-local-artifacts.ts +1 -1
- package/src/services/ffi-llm-streaming-abi.ts +6 -3
- package/src/services/ffi-streaming-backend.ts +44 -8
- package/src/services/ffi-streaming-runner.test.ts +163 -3
- package/src/services/ffi-streaming-runner.ts +54 -1
- package/src/services/ffi-unload-ordering.test.ts +5 -1
- package/src/services/fused-eliza1-no-regression.test.ts +144 -0
- package/src/services/hardware.test.ts +7 -2
- package/src/services/hardware.ts +28 -0
- package/src/services/imagegen/backend-selector.test.ts +190 -0
- package/src/services/imagegen/sd-cpp.ts +6 -9
- package/src/services/index.ts +18 -0
- package/src/services/ios-llama-streaming.ts +1 -1
- package/src/services/kv-spill.ts +6 -5
- package/src/services/lib-target.test.ts +145 -0
- package/src/services/lib-target.ts +102 -0
- package/src/services/live-signals.test.ts +132 -0
- package/src/services/live-signals.ts +177 -0
- package/src/services/llama-server-metrics.test.ts +168 -0
- package/src/services/manifest/eliza-1.manifest.v1.json +84 -2
- package/src/services/manifest/index.ts +6 -0
- package/src/services/manifest/manifest.test.ts +156 -54
- package/src/services/manifest/schema.ts +160 -52
- package/src/services/manifest/types.ts +6 -0
- package/src/services/manifest/validator.ts +91 -25
- package/src/services/memory-arbiter.test.ts +139 -0
- package/src/services/memory-arbiter.ts +81 -15
- package/src/services/memory-benchmark.test.ts +91 -0
- package/src/services/memory-benchmark.ts +354 -0
- package/src/services/memory-monitor.test.ts +24 -0
- package/src/services/memory-monitor.ts +12 -0
- package/src/services/mtp-doctor.ts +10 -2
- package/src/services/network-policy.ts +5 -5
- package/src/services/ram-budget-cache.test.ts +2 -1
- package/src/services/ram-budget.ts +0 -0
- package/src/services/recommendation.test.ts +216 -0
- package/src/services/registry.ts +25 -19
- package/src/services/required-kernels-gate.test.ts +64 -0
- package/src/services/router-handler.ts +43 -24
- package/src/services/routing-policy.test.ts +211 -23
- package/src/services/routing-policy.ts +92 -22
- package/src/services/service.test.ts +3 -3
- package/src/services/service.ts +22 -7
- package/src/services/transcription-priority.test.ts +2 -2
- package/src/services/types.ts +4 -0
- package/src/services/verify-on-device.test.ts +2 -2
- package/src/services/vision/hash.ts +1 -1
- package/src/services/vision/index.ts +2 -2
- package/src/services/vision/llama-server.ts +1 -1
- package/src/services/vision/types.ts +13 -4
- package/src/services/vision-embedding-cache.ts +1 -1
- package/src/services/voice/VOICE_WORKBENCH.md +71 -26
- package/src/services/voice/__fixtures__/voice-workbench-logic-baseline.json +180 -0
- package/src/services/voice/__test-helpers__/synthetic-speech.ts +72 -2
- package/src/services/voice/__tests__/eliza1-eot-scorer.test.ts +29 -29
- package/src/services/voice/__tests__/streaming-asr.test.ts +1 -1
- package/src/services/voice/acoustic-speaker-attribution.test.ts +165 -0
- package/src/services/voice/acoustic-speaker-attribution.ts +336 -0
- package/src/services/voice/asr-timed.real.test.ts +6 -8
- package/src/services/voice/audio-frame-consumer.test.ts +327 -1
- package/src/services/voice/audio-frame-consumer.ts +165 -5
- package/src/services/voice/barge-in.ts +2 -3
- package/src/services/voice/corpus-augment.test.ts +276 -0
- package/src/services/voice/corpus-augment.ts +451 -0
- package/src/services/voice/corpus-generator.test.ts +201 -0
- package/src/services/voice/corpus-generator.ts +413 -0
- package/src/services/voice/diarization-error-rate.greedy.test.ts +140 -0
- package/src/services/voice/diarization-error-rate.test.ts +100 -0
- package/src/services/voice/diarization-error-rate.ts +249 -0
- package/src/services/voice/e2e-harness.der.test.ts +94 -0
- package/src/services/voice/e2e-harness.respond-eot-entity.test.ts +277 -0
- package/src/services/voice/e2e-harness.security-echo.test.ts +103 -0
- package/src/services/voice/e2e-harness.test.ts +2 -2
- package/src/services/voice/e2e-harness.ts +175 -16
- package/src/services/voice/echo-delay.test.ts +118 -0
- package/src/services/voice/echo-delay.ts +135 -0
- package/src/services/voice/echo-metrics.test.ts +17 -0
- package/src/services/voice/echo-metrics.ts +20 -0
- package/src/services/voice/echo-reference-buffer.test.ts +86 -0
- package/src/services/voice/echo-reference-buffer.ts +165 -0
- package/src/services/voice/eliza1-eot-scorer.ts +22 -22
- package/src/services/voice/embedding.ts +2 -3
- package/src/services/voice/engine-bridge-transcript-join.test.ts +278 -0
- package/src/services/voice/engine-bridge.ts +151 -110
- package/src/services/voice/eot-classifier-ggml.ts +42 -39
- package/src/services/voice/eot-classifier.test.ts +98 -0
- package/src/services/voice/eot-classifier.ts +11 -122
- package/src/services/voice/errors.ts +2 -0
- package/src/services/voice/expressive-tags.asr.test.ts +77 -0
- package/src/services/voice/expressive-tags.test.ts +102 -0
- package/src/services/voice/expressive-tags.ts +8 -8
- package/src/services/voice/ffi-bindings.test.ts +10 -3
- package/src/services/voice/ffi-bindings.ts +177 -15
- package/src/services/voice/fused-eot-scorer.ts +17 -13
- package/src/services/voice/index.ts +33 -12
- package/src/services/voice/kokoro/__tests__/kokoro-backend.test.ts +112 -1
- package/src/services/voice/kokoro/__tests__/kokoro-engine-bridge.real.test.ts +88 -3
- package/src/services/voice/kokoro/__tests__/runtime-selection.test.ts +37 -201
- package/src/services/voice/kokoro/kokoro-backend.ts +16 -0
- package/src/services/voice/kokoro/kokoro-engine-discovery.ts +1 -1
- package/src/services/voice/kokoro/kokoro-ffi-runtime.ts +3 -3
- package/src/services/voice/kokoro/pick-runtime.ts +1 -1
- package/src/services/voice/kokoro/runtime-selection.ts +28 -201
- package/src/services/voice/live-diarization-session.echo.test.ts +232 -0
- package/src/services/voice/live-diarization-session.ts +335 -2
- package/src/services/voice/metric-math.test.ts +61 -0
- package/src/services/voice/metric-math.ts +25 -0
- package/src/services/voice/mic-source.ts +1 -1
- package/src/services/voice/nlms-echo-canceller.test.ts +244 -0
- package/src/services/voice/nlms-echo-canceller.ts +317 -0
- package/src/services/voice/optimistic-policy.power-source.test.ts +36 -0
- package/src/services/voice/partial-stabilizer.ts +1 -1
- package/src/services/voice/pipeline.ts +3 -4
- package/src/services/voice/research/VOICE_8785_ASSESSMENT.md +141 -0
- package/src/services/voice/research/VOICE_PIPELINE_RESEARCH_2026.md +117 -0
- package/src/services/voice/research/VOICE_VALIDATION_RUNBOOK.md +135 -0
- package/src/services/voice/samantha-preset-regenerator.wav.test.ts +90 -0
- package/src/services/voice/self-voice-imprint.test.ts +59 -0
- package/src/services/voice/self-voice-imprint.ts +102 -0
- package/src/services/voice/shared-resources.ts +23 -0
- package/src/services/voice/speaker/attribution-pipeline.test.ts +221 -0
- package/src/services/voice/speaker/attribution-pipeline.ts +85 -22
- package/src/services/voice/speaker/encoder-ggml.test.ts +59 -0
- package/src/services/voice/transcriber.asr-backend.test.ts +76 -0
- package/src/services/voice/transcriber.ts +4 -4
- package/src/services/voice/transcript-service.test.ts +58 -0
- package/src/services/voice/transcript-service.ts +64 -0
- package/src/services/voice/transcript-store.test.ts +36 -0
- package/src/services/voice/transcript-store.ts +32 -0
- package/src/services/voice/types.ts +7 -7
- package/src/services/voice/vad.test.ts +33 -15
- package/src/services/voice/vad.ts +25 -20
- package/src/services/voice/voice-budget.test.ts +0 -3
- package/src/services/voice/voice-budget.ts +6 -6
- package/src/services/voice/voice-duet.test.ts +1 -1
- package/src/services/voice/voice-hardening.fuzz.test.ts +116 -0
- package/src/services/voice/voice-preload-predictor.test.ts +130 -0
- package/src/services/voice/voice-preload-predictor.ts +113 -0
- package/src/services/voice/voice-preset-format.fuzz.test.ts +89 -0
- package/src/services/voice/voice-preset-format.test.ts +75 -0
- package/src/services/voice/voice-preset-format.ts +17 -4
- package/src/services/voice/voice-scenario.test.ts +159 -0
- package/src/services/voice/voice-scenario.ts +133 -7
- package/src/services/voice/voice-scenario.turn-helpers.test.ts +77 -0
- package/src/services/voice/voice-workbench-report.ts +58 -17
- package/src/services/voice/wake-word-ggml.ts +12 -13
- package/src/services/voice/wav-codec.fuzz.test.ts +59 -0
- package/src/services/voice/wav-codec.test.ts +32 -0
- package/src/services/voice/wav-codec.ts +101 -0
- package/src/services/voice/workbench-entrypoint.test.ts +55 -0
- package/src/services/voice/workbench-entrypoint.ts +88 -0
- package/src/services/voice/workbench-headless-runner.test.ts +162 -0
- package/src/services/voice/workbench-headless-runner.ts +396 -0
- package/src/services/voice/workbench-logic-services.test.ts +225 -0
- package/src/services/voice/workbench-logic-services.ts +184 -0
- package/src/services/voice/workbench-real-services.ts +629 -0
- package/src/services/voice/workbench-scenarios.ts +407 -0
- package/src/services/voice-prewarm.ts +1 -1
- package/src/voice-workbench.ts +71 -0
- package/src/actions/generate-media.d.ts.map +0 -1
- package/src/actions/identify-speaker.d.ts.map +0 -1
- package/src/actions/transcription-control.d.ts.map +0 -1
- package/src/index.d.ts.map +0 -1
- package/src/local-inference-routes.d.ts.map +0 -1
- package/src/provider.d.ts.map +0 -1
- package/src/routes/compat-helpers.d.ts.map +0 -1
- package/src/routes/family-member-route.d.ts.map +0 -1
- package/src/routes/index.d.ts.map +0 -1
- package/src/routes/live-diarization-route.d.ts.map +0 -1
- package/src/routes/local-inference-asr-route.d.ts.map +0 -1
- package/src/routes/local-inference-asr-transcribe.d.ts.map +0 -1
- package/src/routes/local-inference-compat-routes.d.ts.map +0 -1
- package/src/routes/local-inference-tts-route.d.ts.map +0 -1
- package/src/routes/transcript-audio-store.d.ts.map +0 -1
- package/src/routes/transcripts-routes.d.ts.map +0 -1
- package/src/routes/voice-first-run-routes.d.ts.map +0 -1
- package/src/routes/voice-models-routes.d.ts.map +0 -1
- package/src/routes/voice-profile-plugin-routes.d.ts.map +0 -1
- package/src/routes/voice-profiles-management-routes.d.ts.map +0 -1
- package/src/routes/voice-speaker-profile-routes.d.ts.map +0 -1
- package/src/runtime/embedding-manager-support.d.ts.map +0 -1
- package/src/runtime/embedding-presets.d.ts.map +0 -1
- package/src/runtime/embedding-warmup-policy.d.ts.map +0 -1
- package/src/runtime/ensure-local-inference-handler.d.ts.map +0 -1
- package/src/runtime/index.d.ts.map +0 -1
- package/src/runtime/mobile-local-inference-gate.d.ts +0 -31
- package/src/runtime/mobile-local-inference-gate.d.ts.map +0 -1
- package/src/runtime/voice-entity-binding.d.ts.map +0 -1
- package/src/services/active-model.d.ts.map +0 -1
- package/src/services/assignments.d.ts.map +0 -1
- package/src/services/backend.d.ts.map +0 -1
- package/src/services/bionic-host-loader.d.ts.map +0 -1
- package/src/services/bundled-models.d.ts.map +0 -1
- package/src/services/cache-bridge.d.ts.map +0 -1
- package/src/services/catalog.d.ts +0 -10
- package/src/services/catalog.d.ts.map +0 -1
- package/src/services/checkpoint-client.d.ts.map +0 -1
- package/src/services/cloud-fallback.d.ts.map +0 -1
- package/src/services/conversation-registry.d.ts.map +0 -1
- package/src/services/desktop-fused-ffi-backend-runtime.d.ts.map +0 -1
- package/src/services/device-bridge.d.ts.map +0 -1
- package/src/services/device-resource-metrics.d.ts.map +0 -1
- package/src/services/device-tier.d.ts.map +0 -1
- package/src/services/downloader.d.ts.map +0 -1
- package/src/services/engine.d.ts.map +0 -1
- package/src/services/external-scanner.d.ts.map +0 -1
- package/src/services/ffi-streaming-backend.d.ts.map +0 -1
- package/src/services/ffi-streaming-runner.d.ts.map +0 -1
- package/src/services/gpu-detect.d.ts.map +0 -1
- package/src/services/handler-registry.d.ts.map +0 -1
- package/src/services/hardware.d.ts.map +0 -1
- package/src/services/hf-search.d.ts +0 -26
- package/src/services/hf-search.d.ts.map +0 -1
- package/src/services/hf-search.test.ts +0 -69
- package/src/services/hf-search.ts +0 -420
- package/src/services/image-description-runtime.d.ts.map +0 -1
- package/src/services/imagegen/aosp-unavailable.d.ts.map +0 -1
- package/src/services/imagegen/backend-selector.d.ts.map +0 -1
- package/src/services/imagegen/coreml-unavailable.d.ts.map +0 -1
- package/src/services/imagegen/errors.d.ts.map +0 -1
- package/src/services/imagegen/index.d.ts.map +0 -1
- package/src/services/imagegen/mflux.d.ts.map +0 -1
- package/src/services/imagegen/sd-cpp.d.ts.map +0 -1
- package/src/services/imagegen/tensorrt-unavailable.d.ts.map +0 -1
- package/src/services/imagegen/types.d.ts.map +0 -1
- package/src/services/index.d.ts.map +0 -1
- package/src/services/inference-capabilities.d.ts.map +0 -1
- package/src/services/inference-telemetry.d.ts.map +0 -1
- package/src/services/kv-spill.d.ts.map +0 -1
- package/src/services/latency-trace.d.ts.map +0 -1
- package/src/services/llm-streaming-binding.d.ts.map +0 -1
- package/src/services/load-args.d.ts.map +0 -1
- package/src/services/manifest/index.d.ts +0 -4
- package/src/services/manifest/index.d.ts.map +0 -1
- package/src/services/manifest/schema.d.ts.map +0 -1
- package/src/services/manifest/types.d.ts.map +0 -1
- package/src/services/manifest/validator.d.ts.map +0 -1
- package/src/services/memory-arbiter.d.ts.map +0 -1
- package/src/services/memory-monitor.d.ts.map +0 -1
- package/src/services/memory-pressure.d.ts.map +0 -1
- package/src/services/mtp-doctor.d.ts.map +0 -1
- package/src/services/network-policy.d.ts.map +0 -1
- package/src/services/paths.d.ts.map +0 -1
- package/src/services/planner-skeleton.d.ts.map +0 -1
- package/src/services/providers.d.ts.map +0 -1
- package/src/services/ram-budget.d.ts.map +0 -1
- package/src/services/readiness.d.ts.map +0 -1
- package/src/services/recommendation.d.ts.map +0 -1
- package/src/services/registry.d.ts.map +0 -1
- package/src/services/router-handler.d.ts.map +0 -1
- package/src/services/routing-policy.d.ts.map +0 -1
- package/src/services/routing-preferences.d.ts.map +0 -1
- package/src/services/runtime-target.d.ts.map +0 -1
- package/src/services/service.d.ts.map +0 -1
- package/src/services/session-pool.d.ts.map +0 -1
- package/src/services/structured-output/deterministic-repair.d.ts.map +0 -1
- package/src/services/structured-output.d.ts.map +0 -1
- package/src/services/system-memory.d.ts.map +0 -1
- package/src/services/types.d.ts.map +0 -1
- package/src/services/verify-on-device.d.ts.map +0 -1
- package/src/services/verify.d.ts.map +0 -1
- package/src/services/vision/aosp-unavailable.d.ts.map +0 -1
- package/src/services/vision/capacitor-llama.d.ts.map +0 -1
- package/src/services/vision/cloud-fallback.d.ts.map +0 -1
- package/src/services/vision/hash.d.ts.map +0 -1
- package/src/services/vision/index.d.ts.map +0 -1
- package/src/services/vision/llama-server.d.ts.map +0 -1
- package/src/services/vision/types.d.ts.map +0 -1
- package/src/services/vision/vast-fallback.d.ts.map +0 -1
- package/src/services/vision-embedding-cache.d.ts.map +0 -1
- package/src/services/voice/audio-frame-consumer.d.ts.map +0 -1
- package/src/services/voice/barge-in.d.ts.map +0 -1
- package/src/services/voice/cancellation-coordinator.d.ts.map +0 -1
- package/src/services/voice/checkpoint-manager.d.ts.map +0 -1
- package/src/services/voice/eager-context-builder.d.ts.map +0 -1
- package/src/services/voice/eliza1-eot-scorer.d.ts.map +0 -1
- package/src/services/voice/embedding.d.ts.map +0 -1
- package/src/services/voice/emotion-attribution.d.ts.map +0 -1
- package/src/services/voice/engine-bridge.d.ts.map +0 -1
- package/src/services/voice/eot-classifier-ggml.d.ts.map +0 -1
- package/src/services/voice/eot-classifier.d.ts.map +0 -1
- package/src/services/voice/errors.d.ts.map +0 -1
- package/src/services/voice/expressive-tags.d.ts.map +0 -1
- package/src/services/voice/ffi-bindings.d.ts.map +0 -1
- package/src/services/voice/first-line-cache.d.ts.map +0 -1
- package/src/services/voice/fused-eot-scorer.d.ts.map +0 -1
- package/src/services/voice/index.d.ts.map +0 -1
- package/src/services/voice/kokoro/kokoro-backend.d.ts.map +0 -1
- package/src/services/voice/kokoro/kokoro-engine-discovery.d.ts.map +0 -1
- package/src/services/voice/kokoro/kokoro-ffi-runtime.d.ts.map +0 -1
- package/src/services/voice/kokoro/kokoro-runtime.d.ts.map +0 -1
- package/src/services/voice/kokoro/phonemizer.d.ts.map +0 -1
- package/src/services/voice/kokoro/pick-runtime.d.ts.map +0 -1
- package/src/services/voice/kokoro/runtime-selection.d.ts +0 -92
- package/src/services/voice/kokoro/runtime-selection.d.ts.map +0 -1
- package/src/services/voice/kokoro/types.d.ts.map +0 -1
- package/src/services/voice/kokoro/voice-presets.d.ts.map +0 -1
- package/src/services/voice/kokoro/voices.d.ts.map +0 -1
- package/src/services/voice/lifecycle.d.ts.map +0 -1
- package/src/services/voice/live-diarization-session.d.ts +0 -96
- package/src/services/voice/live-diarization-session.d.ts.map +0 -1
- package/src/services/voice/mic-source.d.ts.map +0 -1
- package/src/services/voice/optimistic-policy.d.ts.map +0 -1
- package/src/services/voice/partial-stabilizer.d.ts.map +0 -1
- package/src/services/voice/phoneme-tokenizer.d.ts.map +0 -1
- package/src/services/voice/phrase-cache.d.ts.map +0 -1
- package/src/services/voice/phrase-chunker.d.ts.map +0 -1
- package/src/services/voice/pipeline-impls.d.ts.map +0 -1
- package/src/services/voice/pipeline.d.ts.map +0 -1
- package/src/services/voice/prefill-client.d.ts.map +0 -1
- package/src/services/voice/prefix-preserving-queue.d.ts.map +0 -1
- package/src/services/voice/profile-store.d.ts.map +0 -1
- package/src/services/voice/ring-buffer.d.ts.map +0 -1
- package/src/services/voice/rollback-queue.d.ts.map +0 -1
- package/src/services/voice/samantha-preset-placeholder.d.ts.map +0 -1
- package/src/services/voice/samantha-preset-regenerator.d.ts.map +0 -1
- package/src/services/voice/scheduler.d.ts.map +0 -1
- package/src/services/voice/shared-resources.d.ts.map +0 -1
- package/src/services/voice/speaker/attribution-pipeline.d.ts.map +0 -1
- package/src/services/voice/speaker/diarizer-fused.d.ts.map +0 -1
- package/src/services/voice/speaker/diarizer.d.ts.map +0 -1
- package/src/services/voice/speaker/encoder-fused.d.ts.map +0 -1
- package/src/services/voice/speaker/encoder-ggml.d.ts.map +0 -1
- package/src/services/voice/speaker/encoder.d.ts.map +0 -1
- package/src/services/voice/speaker-imprint.d.ts.map +0 -1
- package/src/services/voice/speaker-preset-cache.d.ts.map +0 -1
- package/src/services/voice/system-audio-sink.d.ts.map +0 -1
- package/src/services/voice/transcriber.d.ts.map +0 -1
- package/src/services/voice/transcript-knowledge.d.ts.map +0 -1
- package/src/services/voice/transcript-service.d.ts.map +0 -1
- package/src/services/voice/transcript-store.d.ts.map +0 -1
- package/src/services/voice/turn-controller.d.ts.map +0 -1
- package/src/services/voice/types.d.ts.map +0 -1
- package/src/services/voice/vad.d.ts.map +0 -1
- package/src/services/voice/voice-budget.d.ts.map +0 -1
- package/src/services/voice/voice-emotion-classifier.d.ts.map +0 -1
- package/src/services/voice/voice-preset-format.d.ts.map +0 -1
- package/src/services/voice/voice-profile-artifact.d.ts.map +0 -1
- package/src/services/voice/voice-profile-routes.d.ts.map +0 -1
- package/src/services/voice/voice-settings.d.ts +0 -82
- package/src/services/voice/voice-settings.d.ts.map +0 -1
- package/src/services/voice/voice-settings.ts +0 -172
- package/src/services/voice/voice-state-machine.d.ts.map +0 -1
- package/src/services/voice/wake-word-ggml.d.ts.map +0 -1
- package/src/services/voice/wake-word.d.ts.map +0 -1
- package/src/services/voice/wrap-with-first-line-cache.d.ts.map +0 -1
- package/src/services/voice-model-updater.d.ts.map +0 -1
- package/src/services/voice-prewarm.d.ts.map +0 -1
- /package/{src → dist}/actions/generate-media.d.ts +0 -0
- /package/{src → dist}/actions/identify-speaker.d.ts +0 -0
- /package/{src → dist}/actions/transcription-control.d.ts +0 -0
- /package/{src → dist}/index.d.ts +0 -0
- /package/{src → dist}/provider.d.ts +0 -0
- /package/{src → dist}/routes/family-member-route.d.ts +0 -0
- /package/{src → dist}/routes/local-inference-asr-route.d.ts +0 -0
- /package/{src → dist}/routes/local-inference-asr-transcribe.d.ts +0 -0
- /package/{src → dist}/routes/local-inference-compat-routes.d.ts +0 -0
- /package/{src → dist}/routes/local-inference-tts-route.d.ts +0 -0
- /package/{src → dist}/routes/transcript-audio-store.d.ts +0 -0
- /package/{src → dist}/routes/voice-first-run-routes.d.ts +0 -0
- /package/{src → dist}/routes/voice-models-routes.d.ts +0 -0
- /package/{src → dist}/routes/voice-profile-plugin-routes.d.ts +0 -0
- /package/{src → dist}/routes/voice-profiles-management-routes.d.ts +0 -0
- /package/{src → dist}/routes/voice-speaker-profile-routes.d.ts +0 -0
- /package/{src → dist}/runtime/embedding-manager-support.d.ts +0 -0
- /package/{src → dist}/runtime/embedding-presets.d.ts +0 -0
- /package/{src → dist}/runtime/embedding-warmup-policy.d.ts +0 -0
- /package/{src → dist}/services/bundled-models.d.ts +0 -0
- /package/{src → dist}/services/cache-bridge.d.ts +0 -0
- /package/{src → dist}/services/checkpoint-client.d.ts +0 -0
- /package/{src → dist}/services/cloud-fallback.d.ts +0 -0
- /package/{src → dist}/services/conversation-registry.d.ts +0 -0
- /package/{src → dist}/services/device-bridge.d.ts +0 -0
- /package/{src → dist}/services/device-resource-metrics.d.ts +0 -0
- /package/{src → dist}/services/external-scanner.d.ts +0 -0
- /package/{src → dist}/services/gpu-detect.d.ts +0 -0
- /package/{src → dist}/services/handler-registry.d.ts +0 -0
- /package/{src → dist}/services/hardware.d.ts +0 -0
- /package/{src → dist}/services/image-description-runtime.d.ts +0 -0
- /package/{src → dist}/services/imagegen/aosp-unavailable.d.ts +0 -0
- /package/{src → dist}/services/imagegen/backend-selector.d.ts +0 -0
- /package/{src → dist}/services/imagegen/coreml-unavailable.d.ts +0 -0
- /package/{src → dist}/services/imagegen/errors.d.ts +0 -0
- /package/{src → dist}/services/imagegen/index.d.ts +0 -0
- /package/{src → dist}/services/imagegen/mflux.d.ts +0 -0
- /package/{src → dist}/services/imagegen/tensorrt-unavailable.d.ts +0 -0
- /package/{src → dist}/services/imagegen/types.d.ts +0 -0
- /package/{src → dist}/services/inference-capabilities.d.ts +0 -0
- /package/{src → dist}/services/inference-telemetry.d.ts +0 -0
- /package/{src → dist}/services/kv-spill.d.ts +0 -0
- /package/{src → dist}/services/latency-trace.d.ts +0 -0
- /package/{src → dist}/services/llm-streaming-binding.d.ts +0 -0
- /package/{src → dist}/services/load-args.d.ts +0 -0
- /package/{src → dist}/services/manifest/validator.d.ts +0 -0
- /package/{src → dist}/services/memory-pressure.d.ts +0 -0
- /package/{src → dist}/services/mtp-doctor.d.ts +0 -0
- /package/{src → dist}/services/network-policy.d.ts +0 -0
- /package/{src → dist}/services/paths.d.ts +0 -0
- /package/{src → dist}/services/planner-skeleton.d.ts +0 -0
- /package/{src → dist}/services/providers.d.ts +0 -0
- /package/{src → dist}/services/ram-budget.d.ts +0 -0
- /package/{src → dist}/services/readiness.d.ts +0 -0
- /package/{src → dist}/services/recommendation.d.ts +0 -0
- /package/{src → dist}/services/routing-preferences.d.ts +0 -0
- /package/{src → dist}/services/runtime-target.d.ts +0 -0
- /package/{src → dist}/services/session-pool.d.ts +0 -0
- /package/{src → dist}/services/structured-output/deterministic-repair.d.ts +0 -0
- /package/{src → dist}/services/structured-output.d.ts +0 -0
- /package/{src → dist}/services/system-memory.d.ts +0 -0
- /package/{src → dist}/services/verify-on-device.d.ts +0 -0
- /package/{src → dist}/services/verify.d.ts +0 -0
- /package/{src → dist}/services/vision/aosp-unavailable.d.ts +0 -0
- /package/{src → dist}/services/vision/capacitor-llama.d.ts +0 -0
- /package/{src → dist}/services/vision/cloud-fallback.d.ts +0 -0
- /package/{src → dist}/services/vision/hash.d.ts +0 -0
- /package/{src → dist}/services/vision/llama-server.d.ts +0 -0
- /package/{src → dist}/services/vision/vast-fallback.d.ts +0 -0
- /package/{src → dist}/services/voice/barge-in.d.ts +0 -0
- /package/{src → dist}/services/voice/cancellation-coordinator.d.ts +0 -0
- /package/{src → dist}/services/voice/checkpoint-manager.d.ts +0 -0
- /package/{src → dist}/services/voice/eager-context-builder.d.ts +0 -0
- /package/{src → dist}/services/voice/emotion-attribution.d.ts +0 -0
- /package/{src → dist}/services/voice/first-line-cache.d.ts +0 -0
- /package/{src → dist}/services/voice/kokoro/kokoro-runtime.d.ts +0 -0
- /package/{src → dist}/services/voice/kokoro/phonemizer.d.ts +0 -0
- /package/{src → dist}/services/voice/kokoro/types.d.ts +0 -0
- /package/{src → dist}/services/voice/kokoro/voice-presets.d.ts +0 -0
- /package/{src → dist}/services/voice/kokoro/voices.d.ts +0 -0
- /package/{src → dist}/services/voice/lifecycle.d.ts +0 -0
- /package/{src → dist}/services/voice/optimistic-policy.d.ts +0 -0
- /package/{src → dist}/services/voice/phoneme-tokenizer.d.ts +0 -0
- /package/{src → dist}/services/voice/phrase-cache.d.ts +0 -0
- /package/{src → dist}/services/voice/phrase-chunker.d.ts +0 -0
- /package/{src → dist}/services/voice/pipeline-impls.d.ts +0 -0
- /package/{src → dist}/services/voice/pipeline.d.ts +0 -0
- /package/{src → dist}/services/voice/prefill-client.d.ts +0 -0
- /package/{src → dist}/services/voice/prefix-preserving-queue.d.ts +0 -0
- /package/{src → dist}/services/voice/profile-store.d.ts +0 -0
- /package/{src → dist}/services/voice/ring-buffer.d.ts +0 -0
- /package/{src → dist}/services/voice/rollback-queue.d.ts +0 -0
- /package/{src → dist}/services/voice/samantha-preset-placeholder.d.ts +0 -0
- /package/{src → dist}/services/voice/samantha-preset-regenerator.d.ts +0 -0
- /package/{src → dist}/services/voice/scheduler.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker/attribution-pipeline.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker/diarizer-fused.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker/diarizer.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker/encoder-fused.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker/encoder-ggml.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker/encoder.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker-imprint.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker-preset-cache.d.ts +0 -0
- /package/{src → dist}/services/voice/system-audio-sink.d.ts +0 -0
- /package/{src → dist}/services/voice/transcript-knowledge.d.ts +0 -0
- /package/{src → dist}/services/voice/turn-controller.d.ts +0 -0
- /package/{src → dist}/services/voice/voice-budget.d.ts +0 -0
- /package/{src → dist}/services/voice/voice-emotion-classifier.d.ts +0 -0
- /package/{src → dist}/services/voice/voice-profile-artifact.d.ts +0 -0
- /package/{src → dist}/services/voice/voice-profile-routes.d.ts +0 -0
- /package/{src → dist}/services/voice/voice-state-machine.d.ts +0 -0
- /package/{src → dist}/services/voice/wake-word.d.ts +0 -0
- /package/{src → dist}/services/voice/wrap-with-first-line-cache.d.ts +0 -0
- /package/{src → dist}/services/voice-model-updater.d.ts +0 -0
- /package/{src → dist}/services/voice-prewarm.d.ts +0 -0
|
@@ -0,0 +1,98 @@
|
|
|
1
|
+
// Coverage for the pure end-of-turn decision helpers (#9147, "eot" matrix
|
|
2
|
+
// class). turnSignalFromProbability maps an EOT probability onto the
|
|
3
|
+
// agent/user/unknown next-speaker decision via the commit/tentative thresholds;
|
|
4
|
+
// these boundaries gate whether the agent speaks, so they are pinned here.
|
|
5
|
+
|
|
6
|
+
import { describe, expect, it } from "vitest";
|
|
7
|
+
import {
|
|
8
|
+
clampProbability,
|
|
9
|
+
EOT_MID_CLAUSE_THRESHOLD,
|
|
10
|
+
EOT_TENTATIVE_THRESHOLD,
|
|
11
|
+
LIVEKIT_TURN_DETECTOR_EN_REVISION,
|
|
12
|
+
LIVEKIT_TURN_DETECTOR_INTL_REVISION,
|
|
13
|
+
turnDetectorRevisionForTier,
|
|
14
|
+
turnSignalFromProbability,
|
|
15
|
+
} from "./eot-classifier";
|
|
16
|
+
|
|
17
|
+
describe("clampProbability", () => {
|
|
18
|
+
it("clamps to [0,1] and defaults non-finite input to 0.5", () => {
|
|
19
|
+
expect(clampProbability(-1)).toBe(0);
|
|
20
|
+
expect(clampProbability(2)).toBe(1);
|
|
21
|
+
expect(clampProbability(0.7)).toBe(0.7);
|
|
22
|
+
expect(clampProbability(Number.NaN)).toBe(0.5);
|
|
23
|
+
expect(clampProbability(Number.POSITIVE_INFINITY)).toBe(0.5);
|
|
24
|
+
});
|
|
25
|
+
});
|
|
26
|
+
|
|
27
|
+
describe("turnSignalFromProbability", () => {
|
|
28
|
+
const base = { transcript: "are we done", source: "heuristic" as const };
|
|
29
|
+
|
|
30
|
+
it("yields agent (speak) at/above the tentative threshold", () => {
|
|
31
|
+
const sig = turnSignalFromProbability({
|
|
32
|
+
...base,
|
|
33
|
+
probability: EOT_TENTATIVE_THRESHOLD,
|
|
34
|
+
});
|
|
35
|
+
expect(sig.nextSpeaker).toBe("agent");
|
|
36
|
+
expect(sig.agentShouldSpeak).toBe(true);
|
|
37
|
+
});
|
|
38
|
+
|
|
39
|
+
it("yields user (stay silent) below the mid-clause threshold", () => {
|
|
40
|
+
const sig = turnSignalFromProbability({
|
|
41
|
+
...base,
|
|
42
|
+
probability: EOT_MID_CLAUSE_THRESHOLD - 0.01,
|
|
43
|
+
});
|
|
44
|
+
expect(sig.nextSpeaker).toBe("user");
|
|
45
|
+
expect(sig.agentShouldSpeak).toBe(false);
|
|
46
|
+
});
|
|
47
|
+
|
|
48
|
+
it("yields unknown (null) in the mid-clause band", () => {
|
|
49
|
+
const sig = turnSignalFromProbability({
|
|
50
|
+
...base,
|
|
51
|
+
probability: EOT_MID_CLAUSE_THRESHOLD,
|
|
52
|
+
});
|
|
53
|
+
expect(sig.nextSpeaker).toBe("unknown");
|
|
54
|
+
expect(sig.agentShouldSpeak).toBeNull();
|
|
55
|
+
});
|
|
56
|
+
|
|
57
|
+
it("clamps a non-finite probability into the unknown band", () => {
|
|
58
|
+
const sig = turnSignalFromProbability({
|
|
59
|
+
...base,
|
|
60
|
+
probability: Number.NaN,
|
|
61
|
+
});
|
|
62
|
+
expect(sig.endOfTurnProbability).toBe(0.5);
|
|
63
|
+
expect(sig.nextSpeaker).toBe("unknown");
|
|
64
|
+
});
|
|
65
|
+
|
|
66
|
+
it("passes transcript through and includes model/latency only when supplied", () => {
|
|
67
|
+
const withOpts = turnSignalFromProbability({
|
|
68
|
+
...base,
|
|
69
|
+
probability: 0.9,
|
|
70
|
+
model: "eot-v2",
|
|
71
|
+
latencyMs: 12,
|
|
72
|
+
});
|
|
73
|
+
expect(withOpts.transcript).toBe("are we done");
|
|
74
|
+
expect(withOpts.model).toBe("eot-v2");
|
|
75
|
+
expect(withOpts.latencyMs).toBe(12);
|
|
76
|
+
|
|
77
|
+
const without = turnSignalFromProbability({ ...base, probability: 0.9 });
|
|
78
|
+
expect("model" in without).toBe(false);
|
|
79
|
+
expect("latencyMs" in without).toBe(false);
|
|
80
|
+
});
|
|
81
|
+
});
|
|
82
|
+
|
|
83
|
+
describe("turnDetectorRevisionForTier", () => {
|
|
84
|
+
it("maps the 2b entry tier to the English variant, others to multilingual", () => {
|
|
85
|
+
expect(turnDetectorRevisionForTier("2b")).toBe(
|
|
86
|
+
LIVEKIT_TURN_DETECTOR_EN_REVISION,
|
|
87
|
+
);
|
|
88
|
+
expect(turnDetectorRevisionForTier("eliza-1-2b")).toBe(
|
|
89
|
+
LIVEKIT_TURN_DETECTOR_EN_REVISION,
|
|
90
|
+
);
|
|
91
|
+
expect(turnDetectorRevisionForTier("4b")).toBe(
|
|
92
|
+
LIVEKIT_TURN_DETECTOR_INTL_REVISION,
|
|
93
|
+
);
|
|
94
|
+
expect(turnDetectorRevisionForTier("eliza-1-8b")).toBe(
|
|
95
|
+
LIVEKIT_TURN_DETECTOR_INTL_REVISION,
|
|
96
|
+
);
|
|
97
|
+
});
|
|
98
|
+
});
|
|
@@ -34,6 +34,7 @@
|
|
|
34
34
|
* suppress (via `BargeInCancelToken.signal` with reason `"turn-suppressed"`).
|
|
35
35
|
*/
|
|
36
36
|
|
|
37
|
+
import { scoreEndOfTurnHeuristic } from "@elizaos/shared/voice-eot";
|
|
37
38
|
import type {
|
|
38
39
|
Eliza1EotScoreResult,
|
|
39
40
|
Eliza1EotScorerOptions,
|
|
@@ -120,136 +121,24 @@ export function turnSignalFromProbability(args: {
|
|
|
120
121
|
// ---------------------------------------------------------------------------
|
|
121
122
|
|
|
122
123
|
/**
|
|
123
|
-
* Rules-of-thumb EOT classifier.
|
|
124
|
-
*
|
|
124
|
+
* Rules-of-thumb EOT classifier. Delegates to the single canonical heuristic in
|
|
125
|
+
* `@elizaos/shared/voice-eot` — the SAME scorer the UI shell capture path
|
|
126
|
+
* (`packages/ui/src/voice/end-of-turn.ts`) uses, so the two surfaces can never
|
|
127
|
+
* drift. The rules fire in priority order; the first match wins:
|
|
125
128
|
*
|
|
126
129
|
* Priority Signal P(done)
|
|
127
130
|
* -------- ------------------------------------------- -------
|
|
128
|
-
* 1
|
|
129
|
-
* 2
|
|
130
|
-
* 3
|
|
131
|
+
* 1 Trailing ellipsis ("…" / "..") 0.20
|
|
132
|
+
* 2 Sentence-final punctuation (. ! ?) 0.95
|
|
133
|
+
* 3 Question-tag words ("right?", "yeah", …) 0.85
|
|
131
134
|
* 4 Trailing conjunction (and/but/or/because/…) 0.15
|
|
132
135
|
* 5 Last word is a preposition or article 0.20
|
|
133
|
-
* 6
|
|
136
|
+
* 6 Short utterance (< 3 words, no trail-off) 0.70
|
|
137
|
+
* 7 No signal 0.50
|
|
134
138
|
*/
|
|
135
139
|
export class HeuristicEotClassifier implements EotClassifier {
|
|
136
|
-
/** Conjunctions that strongly suggest the user is mid-clause. */
|
|
137
|
-
private static readonly TRAILING_CONJUNCTIONS = new Set([
|
|
138
|
-
"and",
|
|
139
|
-
"but",
|
|
140
|
-
"or",
|
|
141
|
-
"nor",
|
|
142
|
-
"yet",
|
|
143
|
-
"so",
|
|
144
|
-
"because",
|
|
145
|
-
"although",
|
|
146
|
-
"though",
|
|
147
|
-
"while",
|
|
148
|
-
"whereas",
|
|
149
|
-
"if",
|
|
150
|
-
"unless",
|
|
151
|
-
"until",
|
|
152
|
-
"since",
|
|
153
|
-
"when",
|
|
154
|
-
"where",
|
|
155
|
-
"which",
|
|
156
|
-
"that",
|
|
157
|
-
"who",
|
|
158
|
-
"whom",
|
|
159
|
-
"whose",
|
|
160
|
-
]);
|
|
161
|
-
|
|
162
|
-
/** Prepositions and articles that suggest an incomplete NP follows. */
|
|
163
|
-
private static readonly TRAILING_INCOMPLETE = new Set([
|
|
164
|
-
"a",
|
|
165
|
-
"an",
|
|
166
|
-
"the",
|
|
167
|
-
"to",
|
|
168
|
-
"of",
|
|
169
|
-
"in",
|
|
170
|
-
"on",
|
|
171
|
-
"at",
|
|
172
|
-
"by",
|
|
173
|
-
"for",
|
|
174
|
-
"with",
|
|
175
|
-
"from",
|
|
176
|
-
"into",
|
|
177
|
-
"about",
|
|
178
|
-
"through",
|
|
179
|
-
"between",
|
|
180
|
-
"against",
|
|
181
|
-
"during",
|
|
182
|
-
"before",
|
|
183
|
-
"after",
|
|
184
|
-
"without",
|
|
185
|
-
"under",
|
|
186
|
-
"over",
|
|
187
|
-
"above",
|
|
188
|
-
"below",
|
|
189
|
-
"around",
|
|
190
|
-
"beside",
|
|
191
|
-
"beyond",
|
|
192
|
-
"like",
|
|
193
|
-
"near",
|
|
194
|
-
"past",
|
|
195
|
-
"via",
|
|
196
|
-
]);
|
|
197
|
-
|
|
198
|
-
/** Question-tag suffixes that end an utterance (case-insensitive). */
|
|
199
|
-
private static readonly QUESTION_TAGS = [
|
|
200
|
-
"right?",
|
|
201
|
-
"yeah?",
|
|
202
|
-
"ok?",
|
|
203
|
-
"okay?",
|
|
204
|
-
"right",
|
|
205
|
-
"yeah",
|
|
206
|
-
"correct?",
|
|
207
|
-
"correct",
|
|
208
|
-
"hm?",
|
|
209
|
-
"huh?",
|
|
210
|
-
"eh?",
|
|
211
|
-
];
|
|
212
|
-
|
|
213
140
|
score(partialTranscript: string): Promise<number> {
|
|
214
|
-
|
|
215
|
-
if (text.length === 0) return Promise.resolve(0.5);
|
|
216
|
-
|
|
217
|
-
// Rule 1 — sentence-final punctuation.
|
|
218
|
-
if (/[.!?]$/.test(text)) {
|
|
219
|
-
return Promise.resolve(0.95);
|
|
220
|
-
}
|
|
221
|
-
|
|
222
|
-
// Rule 2 — question-tag words at the end.
|
|
223
|
-
const lower = text.toLowerCase();
|
|
224
|
-
for (const tag of HeuristicEotClassifier.QUESTION_TAGS) {
|
|
225
|
-
if (lower.endsWith(tag)) return Promise.resolve(0.85);
|
|
226
|
-
}
|
|
227
|
-
|
|
228
|
-
// Split into words for word-level checks.
|
|
229
|
-
const words = text
|
|
230
|
-
.toLowerCase()
|
|
231
|
-
.replace(/[^a-z0-9'\s-]/gi, "")
|
|
232
|
-
.split(/\s+/)
|
|
233
|
-
.filter(Boolean);
|
|
234
|
-
if (words.length === 0) return Promise.resolve(0.5);
|
|
235
|
-
|
|
236
|
-
const lastWord = words[words.length - 1].replace(/[',;:-]+$/, "");
|
|
237
|
-
|
|
238
|
-
// Rule 3 — short utterance (< 3 words) → likely complete.
|
|
239
|
-
if (words.length < 3) return Promise.resolve(0.7);
|
|
240
|
-
|
|
241
|
-
// Rule 4 — trailing conjunction → mid-clause.
|
|
242
|
-
if (HeuristicEotClassifier.TRAILING_CONJUNCTIONS.has(lastWord)) {
|
|
243
|
-
return Promise.resolve(0.15);
|
|
244
|
-
}
|
|
245
|
-
|
|
246
|
-
// Rule 5 — trailing preposition or article → incomplete NP.
|
|
247
|
-
if (HeuristicEotClassifier.TRAILING_INCOMPLETE.has(lastWord)) {
|
|
248
|
-
return Promise.resolve(0.2);
|
|
249
|
-
}
|
|
250
|
-
|
|
251
|
-
// Rule 6 — no signal.
|
|
252
|
-
return Promise.resolve(0.5);
|
|
141
|
+
return Promise.resolve(scoreEndOfTurnHeuristic(partialTranscript));
|
|
253
142
|
}
|
|
254
143
|
|
|
255
144
|
async signal(partialTranscript: string): Promise<VoiceTurnSignal> {
|
|
@@ -18,7 +18,9 @@ export class VoiceStartupError extends Error {
|
|
|
18
18
|
| "missing-ffi"
|
|
19
19
|
| "missing-speaker-preset"
|
|
20
20
|
| "missing-bundle-root"
|
|
21
|
+
| "missing-asr-model"
|
|
21
22
|
| "missing-fused-build"
|
|
23
|
+
| "blocked-asr-provenance"
|
|
22
24
|
| "missing-turn-detector"
|
|
23
25
|
| "already-started"
|
|
24
26
|
| "not-started"
|
|
@@ -0,0 +1,77 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Unit coverage for the ASR-emotion → expressive-tag helpers (#9147 voice).
|
|
3
|
+
*
|
|
4
|
+
* normalizeAsrEmotionLabel / asrEmotionToTag / expressiveTagPromptClause are
|
|
5
|
+
* pure mappers between local ASR emotion labels and the TTS expressive-tag
|
|
6
|
+
* vocabulary; they were untested (the parse/strip helpers in the same file are
|
|
7
|
+
* covered separately). No GGUF / audio.
|
|
8
|
+
*/
|
|
9
|
+
|
|
10
|
+
import { describe, expect, it } from "vitest";
|
|
11
|
+
import {
|
|
12
|
+
asrEmotionToTag,
|
|
13
|
+
EXPRESSIVE_EMOTION_TAGS,
|
|
14
|
+
EXPRESSIVE_NONVERBAL_TAGS,
|
|
15
|
+
EXPRESSIVE_SINGING_TAG,
|
|
16
|
+
expressiveTagPromptClause,
|
|
17
|
+
normalizeAsrEmotionLabel,
|
|
18
|
+
} from "./expressive-tags";
|
|
19
|
+
|
|
20
|
+
describe("normalizeAsrEmotionLabel", () => {
|
|
21
|
+
it("returns null for empty/missing input", () => {
|
|
22
|
+
expect(normalizeAsrEmotionLabel(null)).toBeNull();
|
|
23
|
+
expect(normalizeAsrEmotionLabel(undefined)).toBeNull();
|
|
24
|
+
expect(normalizeAsrEmotionLabel("")).toBeNull();
|
|
25
|
+
});
|
|
26
|
+
|
|
27
|
+
it("passes through a canonical noun label (case/space-insensitive)", () => {
|
|
28
|
+
expect(normalizeAsrEmotionLabel("happiness")).toBe("happiness");
|
|
29
|
+
expect(normalizeAsrEmotionLabel(" HAPPINESS ")).toBe("happiness");
|
|
30
|
+
});
|
|
31
|
+
|
|
32
|
+
it("maps common adjective forms to noun labels", () => {
|
|
33
|
+
expect(normalizeAsrEmotionLabel("happy")).toBe("happiness");
|
|
34
|
+
expect(normalizeAsrEmotionLabel("sad")).toBe("sadness");
|
|
35
|
+
expect(normalizeAsrEmotionLabel("angry")).toBe("anger");
|
|
36
|
+
expect(normalizeAsrEmotionLabel("afraid")).toBe("fear");
|
|
37
|
+
expect(normalizeAsrEmotionLabel("scared")).toBe("fear");
|
|
38
|
+
expect(normalizeAsrEmotionLabel("surprised")).toBe("surprise");
|
|
39
|
+
expect(normalizeAsrEmotionLabel("disgusted")).toBe("disgust");
|
|
40
|
+
});
|
|
41
|
+
|
|
42
|
+
it("returns null for an unknown label", () => {
|
|
43
|
+
expect(normalizeAsrEmotionLabel("gibberish-xyz")).toBeNull();
|
|
44
|
+
});
|
|
45
|
+
});
|
|
46
|
+
|
|
47
|
+
describe("asrEmotionToTag", () => {
|
|
48
|
+
it("maps a recognized emotion to an expressive emotion tag", () => {
|
|
49
|
+
const tag = asrEmotionToTag("happy");
|
|
50
|
+
expect(tag).not.toBeNull();
|
|
51
|
+
expect(EXPRESSIVE_EMOTION_TAGS).toContain(tag);
|
|
52
|
+
});
|
|
53
|
+
|
|
54
|
+
it("returns null for null / unknown input", () => {
|
|
55
|
+
expect(asrEmotionToTag(null)).toBeNull();
|
|
56
|
+
expect(asrEmotionToTag("gibberish-xyz")).toBeNull();
|
|
57
|
+
});
|
|
58
|
+
});
|
|
59
|
+
|
|
60
|
+
describe("expressiveTagPromptClause", () => {
|
|
61
|
+
it("lists the emotion + nonverbal tags and excludes singing by default", () => {
|
|
62
|
+
const clause = expressiveTagPromptClause();
|
|
63
|
+
for (const tag of EXPRESSIVE_EMOTION_TAGS) {
|
|
64
|
+
expect(clause).toContain(`[${tag}]`);
|
|
65
|
+
}
|
|
66
|
+
for (const tag of EXPRESSIVE_NONVERBAL_TAGS) {
|
|
67
|
+
expect(clause).toContain(`[${tag}]`);
|
|
68
|
+
}
|
|
69
|
+
expect(clause).not.toContain(`[${EXPRESSIVE_SINGING_TAG}]`);
|
|
70
|
+
});
|
|
71
|
+
|
|
72
|
+
it("includes the singing tag only when singingAllowed", () => {
|
|
73
|
+
expect(expressiveTagPromptClause({ singingAllowed: true })).toContain(
|
|
74
|
+
`[${EXPRESSIVE_SINGING_TAG}]`,
|
|
75
|
+
);
|
|
76
|
+
});
|
|
77
|
+
});
|
|
@@ -0,0 +1,102 @@
|
|
|
1
|
+
import { describe, expect, it } from "vitest";
|
|
2
|
+
import {
|
|
3
|
+
emotionToEnum,
|
|
4
|
+
enumToEmotion,
|
|
5
|
+
isExpressiveEmotionEnum,
|
|
6
|
+
isExpressiveTag,
|
|
7
|
+
parseExpressiveTags,
|
|
8
|
+
stripExpressiveTags,
|
|
9
|
+
} from "./expressive-tags.js";
|
|
10
|
+
|
|
11
|
+
/**
|
|
12
|
+
* Inline expressive-tag parsing for the voice path (#9147). Tags are scoped:
|
|
13
|
+
* an emotion/`[singing]` tag starts a new segment; `[laughter]`/`[sigh]` are
|
|
14
|
+
* recorded non-verbals; unrecognized `[tokens]` are preserved as model text
|
|
15
|
+
* (and flagged) rather than silently consumed.
|
|
16
|
+
*/
|
|
17
|
+
|
|
18
|
+
describe("isExpressiveTag / isExpressiveEmotionEnum", () => {
|
|
19
|
+
it("recognizes vocabulary tags, case/space-insensitively", () => {
|
|
20
|
+
expect(isExpressiveTag("happy")).toBe(true);
|
|
21
|
+
expect(isExpressiveTag(" SINGING ")).toBe(true);
|
|
22
|
+
expect(isExpressiveTag("laughter")).toBe(true);
|
|
23
|
+
expect(isExpressiveTag("grumpy")).toBe(false);
|
|
24
|
+
});
|
|
25
|
+
|
|
26
|
+
it("treats none + emotions (but not singing) as enum values", () => {
|
|
27
|
+
expect(isExpressiveEmotionEnum("none")).toBe(true);
|
|
28
|
+
expect(isExpressiveEmotionEnum("excited")).toBe(true);
|
|
29
|
+
expect(isExpressiveEmotionEnum("singing")).toBe(false);
|
|
30
|
+
expect(isExpressiveEmotionEnum("grumpy")).toBe(false);
|
|
31
|
+
});
|
|
32
|
+
});
|
|
33
|
+
|
|
34
|
+
describe("parseExpressiveTags", () => {
|
|
35
|
+
it("returns one neutral segment for untagged text", () => {
|
|
36
|
+
const parsed = parseExpressiveTags("just a normal reply");
|
|
37
|
+
expect(parsed.hasTags).toBe(false);
|
|
38
|
+
expect(parsed.dominantEmotion).toBeNull();
|
|
39
|
+
expect(parsed.segments).toHaveLength(1);
|
|
40
|
+
expect(parsed.segments[0]).toMatchObject({
|
|
41
|
+
emotion: null,
|
|
42
|
+
singing: false,
|
|
43
|
+
cleanText: "just a normal reply",
|
|
44
|
+
});
|
|
45
|
+
});
|
|
46
|
+
|
|
47
|
+
it("segments on each scope-setting emotion tag", () => {
|
|
48
|
+
const parsed = parseExpressiveTags("[happy] hello [sad] world");
|
|
49
|
+
expect(parsed.segments.map((s) => [s.emotion, s.cleanText])).toEqual([
|
|
50
|
+
["happy", "hello"],
|
|
51
|
+
["sad", "world"],
|
|
52
|
+
]);
|
|
53
|
+
expect(parsed.dominantEmotion).toBe("happy");
|
|
54
|
+
expect(parsed.cleanText).toBe("hello world");
|
|
55
|
+
expect(parsed.hasTags).toBe(true);
|
|
56
|
+
});
|
|
57
|
+
|
|
58
|
+
it("allows a mid-sentence shift with a leading neutral segment", () => {
|
|
59
|
+
const parsed = parseExpressiveTags("that's [excited] amazing");
|
|
60
|
+
expect(parsed.segments.map((s) => [s.emotion, s.cleanText])).toEqual([
|
|
61
|
+
[null, "that's"],
|
|
62
|
+
["excited", "amazing"],
|
|
63
|
+
]);
|
|
64
|
+
expect(parsed.dominantEmotion).toBe("excited");
|
|
65
|
+
});
|
|
66
|
+
|
|
67
|
+
it("tracks singing scope and preserves non-verbals without segmenting", () => {
|
|
68
|
+
const singing = parseExpressiveTags("[singing] la la la");
|
|
69
|
+
expect(singing.anySinging).toBe(true);
|
|
70
|
+
expect(singing.segments[0]).toMatchObject({ singing: true, emotion: null });
|
|
71
|
+
|
|
72
|
+
const nonverbal = parseExpressiveTags("hello [laughter] there");
|
|
73
|
+
expect(nonverbal.segments).toHaveLength(1);
|
|
74
|
+
expect(nonverbal.segments[0].nonverbals).toEqual(["laughter"]);
|
|
75
|
+
expect(nonverbal.cleanText).toBe("hello there");
|
|
76
|
+
});
|
|
77
|
+
|
|
78
|
+
it("records unknown bracket tokens instead of treating them as tags", () => {
|
|
79
|
+
const parsed = parseExpressiveTags("this is [grumpy] text");
|
|
80
|
+
expect(parsed.unknownTags).toEqual(["[grumpy]"]);
|
|
81
|
+
expect(parsed.hasTags).toBe(false);
|
|
82
|
+
expect(parsed.cleanText).toBe("this is text");
|
|
83
|
+
});
|
|
84
|
+
});
|
|
85
|
+
|
|
86
|
+
describe("stripExpressiveTags", () => {
|
|
87
|
+
it("removes recognized tags but leaves unknown bracket tokens", () => {
|
|
88
|
+
expect(stripExpressiveTags("[happy] hi [sigh] there")).toBe("hi there");
|
|
89
|
+
expect(stripExpressiveTags("[grumpy] hi")).toBe("[grumpy] hi");
|
|
90
|
+
});
|
|
91
|
+
});
|
|
92
|
+
|
|
93
|
+
describe("emotionToEnum / enumToEmotion", () => {
|
|
94
|
+
it("round-trips an emotion and maps null ⇄ none", () => {
|
|
95
|
+
expect(emotionToEnum("happy")).toBe("happy");
|
|
96
|
+
expect(emotionToEnum(null)).toBe("none");
|
|
97
|
+
expect(enumToEmotion("none")).toBeNull();
|
|
98
|
+
expect(enumToEmotion("happy")).toBe("happy");
|
|
99
|
+
expect(enumToEmotion("singing")).toBeNull();
|
|
100
|
+
expect(enumToEmotion(undefined)).toBeNull();
|
|
101
|
+
});
|
|
102
|
+
});
|
|
@@ -308,7 +308,7 @@ export function enumToEmotion(
|
|
|
308
308
|
* as model-native emotion recognition unless that backend explicitly advertises
|
|
309
309
|
* such a field; callers should record heuristic attribution separately.
|
|
310
310
|
*/
|
|
311
|
-
export const
|
|
311
|
+
export const ASR_EMOTION_LABELS = [
|
|
312
312
|
"surprise",
|
|
313
313
|
"calm",
|
|
314
314
|
"happiness",
|
|
@@ -318,7 +318,7 @@ export const QWEN3_ASR_EMOTION_LABELS = [
|
|
|
318
318
|
"fear",
|
|
319
319
|
] as const;
|
|
320
320
|
|
|
321
|
-
export type
|
|
321
|
+
export type AsrEmotionLabel = (typeof ASR_EMOTION_LABELS)[number];
|
|
322
322
|
|
|
323
323
|
/**
|
|
324
324
|
* Explicit mapping from an ASR-perceived emotion label to the tag vocab the
|
|
@@ -328,7 +328,7 @@ export type Qwen3AsrEmotionLabel = (typeof QWEN3_ASR_EMOTION_LABELS)[number];
|
|
|
328
328
|
* `null` (counted as "no agreement" rather than forced).
|
|
329
329
|
*/
|
|
330
330
|
export const ASR_LABEL_TO_EMOTION_TAG: Readonly<
|
|
331
|
-
Record<
|
|
331
|
+
Record<AsrEmotionLabel, ExpressiveEmotion | null>
|
|
332
332
|
> = {
|
|
333
333
|
happiness: "happy",
|
|
334
334
|
sadness: "sad",
|
|
@@ -340,18 +340,18 @@ export const ASR_LABEL_TO_EMOTION_TAG: Readonly<
|
|
|
340
340
|
};
|
|
341
341
|
|
|
342
342
|
/** Normalize an arbitrary ASR-emitted emotion string (any casing, possibly an
|
|
343
|
-
* adjective form) to
|
|
343
|
+
* adjective form) to an `AsrEmotionLabel` if it matches, else `null`. */
|
|
344
344
|
export function normalizeAsrEmotionLabel(
|
|
345
345
|
raw: string | null | undefined,
|
|
346
|
-
):
|
|
346
|
+
): AsrEmotionLabel | null {
|
|
347
347
|
if (!raw) return null;
|
|
348
348
|
const v = raw.trim().toLowerCase();
|
|
349
349
|
// Direct hit.
|
|
350
|
-
if ((
|
|
351
|
-
return v as
|
|
350
|
+
if ((ASR_EMOTION_LABELS as readonly string[]).includes(v)) {
|
|
351
|
+
return v as AsrEmotionLabel;
|
|
352
352
|
}
|
|
353
353
|
// Common adjective forms → noun labels.
|
|
354
|
-
const ADJ: Record<string,
|
|
354
|
+
const ADJ: Record<string, AsrEmotionLabel> = {
|
|
355
355
|
happy: "happiness",
|
|
356
356
|
sad: "sadness",
|
|
357
357
|
angry: "anger",
|
|
@@ -187,9 +187,16 @@ const FFI_STUB_DIR = path.resolve(
|
|
|
187
187
|
);
|
|
188
188
|
const STUB_DYLIB = path.join(
|
|
189
189
|
FFI_STUB_DIR,
|
|
190
|
+
// Per-OS shared-library naming. Windows must load a PE `.dll` — attempting to
|
|
191
|
+
// `dlopen` the committed Linux `.so` fails with error 193 (ERROR_BAD_EXE_FORMAT)
|
|
192
|
+
// rather than skipping. No Windows stub is built/committed, so the `existsSync`
|
|
193
|
+
// guards below skip these integration tests on Windows (same as Linux before
|
|
194
|
+
// `make -C scripts/ffi-stub`), instead of hard-failing on a format mismatch.
|
|
190
195
|
process.platform === "darwin"
|
|
191
196
|
? "libelizainference_stub.dylib"
|
|
192
|
-
:
|
|
197
|
+
: process.platform === "win32"
|
|
198
|
+
? "libelizainference_stub.dll"
|
|
199
|
+
: "libelizainference_stub.so",
|
|
193
200
|
);
|
|
194
201
|
|
|
195
202
|
function bunOnPath(): string | null {
|
|
@@ -215,8 +222,8 @@ function bunOnPath(): string | null {
|
|
|
215
222
|
}
|
|
216
223
|
|
|
217
224
|
describe("ffi-bindings — pure unit (no Bun, no dylib)", () => {
|
|
218
|
-
it("ELIZA_INFERENCE_ABI_VERSION is
|
|
219
|
-
expect(ELIZA_INFERENCE_ABI_VERSION).toBe(
|
|
225
|
+
it("ELIZA_INFERENCE_ABI_VERSION is 13 (streaming vision describe)", () => {
|
|
226
|
+
expect(ELIZA_INFERENCE_ABI_VERSION).toBe(13);
|
|
220
227
|
});
|
|
221
228
|
|
|
222
229
|
it("loadElizaInferenceFfi throws VoiceLifecycleError when FFI is unavailable", () => {
|