@elizaos/plugin-local-inference 2.0.3-beta.2 → 2.0.3-beta.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +84 -10
- package/dist/actions/generate-media.d.ts.map +1 -0
- package/dist/actions/identify-speaker.d.ts.map +1 -0
- package/dist/actions/transcription-control.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/environment.d.ts +12 -0
- package/dist/adapters/capacitor-llama/environment.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/index.browser.d.ts +9 -0
- package/dist/adapters/capacitor-llama/index.browser.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/index.d.ts +18 -0
- package/dist/adapters/capacitor-llama/index.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/loader.d.ts +35 -0
- package/dist/adapters/capacitor-llama/loader.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/native-voice-capture.d.ts +70 -0
- package/dist/adapters/capacitor-llama/native-voice-capture.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/structured-output.d.ts +62 -0
- package/dist/adapters/capacitor-llama/structured-output.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/text-streaming.d.ts +24 -0
- package/dist/adapters/capacitor-llama/text-streaming.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/types.d.ts +338 -0
- package/dist/adapters/capacitor-llama/types.d.ts.map +1 -0
- package/dist/adapters/capacitor-llama/voice-turn.d.ts +86 -0
- package/dist/adapters/capacitor-llama/voice-turn.d.ts.map +1 -0
- package/dist/backends/apple-foundation.d.ts +56 -0
- package/dist/backends/apple-foundation.d.ts.map +1 -0
- package/dist/index.d.ts.map +1 -0
- package/dist/index.js +39647 -0
- package/dist/index.js.map +217 -0
- package/{src → dist}/local-inference-routes.d.ts +9 -0
- package/dist/local-inference-routes.d.ts.map +1 -0
- package/dist/provider.d.ts.map +1 -0
- package/{src → dist}/routes/compat-helpers.d.ts +1 -1
- package/dist/routes/compat-helpers.d.ts.map +1 -0
- package/dist/routes/family-member-route.d.ts.map +1 -0
- package/{src → dist}/routes/index.d.ts +1 -0
- package/dist/routes/index.d.ts.map +1 -0
- package/dist/routes/index.js +42040 -0
- package/dist/routes/index.js.map +236 -0
- package/{src → dist}/routes/live-diarization-route.d.ts +7 -0
- package/dist/routes/live-diarization-route.d.ts.map +1 -0
- package/dist/routes/local-inference-asr-route.d.ts.map +1 -0
- package/dist/routes/local-inference-asr-transcribe.d.ts.map +1 -0
- package/dist/routes/local-inference-compat-routes.d.ts.map +1 -0
- package/dist/routes/local-inference-tts-route.d.ts.map +1 -0
- package/dist/routes/native-pcm-turn-route.d.ts +3 -0
- package/dist/routes/native-pcm-turn-route.d.ts.map +1 -0
- package/dist/routes/transcript-audio-store.d.ts.map +1 -0
- package/{src → dist}/routes/transcripts-routes.d.ts +8 -0
- package/dist/routes/transcripts-routes.d.ts.map +1 -0
- package/dist/routes/voice-first-run-routes.d.ts.map +1 -0
- package/dist/routes/voice-models-routes.d.ts.map +1 -0
- package/dist/routes/voice-profile-plugin-routes.d.ts.map +1 -0
- package/dist/routes/voice-profiles-management-routes.d.ts.map +1 -0
- package/dist/routes/voice-speaker-profile-routes.d.ts.map +1 -0
- package/dist/runtime/embedding-manager-support.d.ts.map +1 -0
- package/dist/runtime/embedding-presets.d.ts.map +1 -0
- package/dist/runtime/embedding-warmup-policy.d.ts.map +1 -0
- package/{src → dist}/runtime/ensure-local-inference-handler.d.ts +8 -0
- package/dist/runtime/ensure-local-inference-handler.d.ts.map +1 -0
- package/{src → dist}/runtime/index.d.ts +1 -1
- package/dist/runtime/index.d.ts.map +1 -0
- package/dist/runtime/index.js +38768 -0
- package/dist/runtime/index.js.map +217 -0
- package/dist/runtime/mobile-local-inference-gate.d.ts +63 -0
- package/dist/runtime/mobile-local-inference-gate.d.ts.map +1 -0
- package/{src → dist}/runtime/voice-entity-binding.d.ts +10 -0
- package/dist/runtime/voice-entity-binding.d.ts.map +1 -0
- package/{src → dist}/services/active-model.d.ts +28 -0
- package/dist/services/active-model.d.ts.map +1 -0
- package/dist/services/asr-provenance.d.ts +5 -0
- package/dist/services/asr-provenance.d.ts.map +1 -0
- package/{src → dist}/services/assignments.d.ts +16 -3
- package/dist/services/assignments.d.ts.map +1 -0
- package/dist/services/backend-selector.d.ts +55 -0
- package/dist/services/backend-selector.d.ts.map +1 -0
- package/{src → dist}/services/backend.d.ts +110 -16
- package/dist/services/backend.d.ts.map +1 -0
- package/{src → dist}/services/bionic-host-loader.d.ts +21 -0
- package/dist/services/bionic-host-loader.d.ts.map +1 -0
- package/dist/services/bundled-models.d.ts.map +1 -0
- package/dist/services/cache-bridge.d.ts.map +1 -0
- package/dist/services/catalog.d.ts +10 -0
- package/dist/services/catalog.d.ts.map +1 -0
- package/dist/services/checkpoint-client.d.ts.map +1 -0
- package/dist/services/checkpoint-manager.d.ts +217 -0
- package/dist/services/checkpoint-manager.d.ts.map +1 -0
- package/dist/services/cloud-fallback.d.ts.map +1 -0
- package/dist/services/context-fit.d.ts +36 -0
- package/dist/services/context-fit.d.ts.map +1 -0
- package/dist/services/conversation-registry.d.ts.map +1 -0
- package/{src → dist}/services/desktop-fused-ffi-backend-runtime.d.ts +22 -6
- package/dist/services/desktop-fused-ffi-backend-runtime.d.ts.map +1 -0
- package/dist/services/device-bridge.d.ts.map +1 -0
- package/dist/services/device-resource-metrics.d.ts.map +1 -0
- package/{src → dist}/services/device-tier.d.ts +19 -1
- package/dist/services/device-tier.d.ts.map +1 -0
- package/{src → dist}/services/downloader.d.ts +16 -4
- package/dist/services/downloader.d.ts.map +1 -0
- package/{src → dist}/services/engine.d.ts +43 -4
- package/dist/services/engine.d.ts.map +1 -0
- package/dist/services/ensure-local-artifacts.d.ts +82 -0
- package/dist/services/ensure-local-artifacts.d.ts.map +1 -0
- package/dist/services/external-scanner.d.ts.map +1 -0
- package/dist/services/ffi-llm-mock.d.ts +90 -0
- package/dist/services/ffi-llm-mock.d.ts.map +1 -0
- package/dist/services/ffi-llm-streaming-abi.d.ts +318 -0
- package/dist/services/ffi-llm-streaming-abi.d.ts.map +1 -0
- package/{src → dist}/services/ffi-streaming-backend.d.ts +28 -7
- package/dist/services/ffi-streaming-backend.d.ts.map +1 -0
- package/{src → dist}/services/ffi-streaming-runner.d.ts +24 -0
- package/dist/services/ffi-streaming-runner.d.ts.map +1 -0
- package/dist/services/gpu-autotune.d.ts +150 -0
- package/dist/services/gpu-autotune.d.ts.map +1 -0
- package/dist/services/gpu-detect.d.ts.map +1 -0
- package/dist/services/handler-registry.d.ts.map +1 -0
- package/dist/services/hardware.d.ts.map +1 -0
- package/dist/services/image-description-runtime.d.ts.map +1 -0
- package/dist/services/imagegen/aosp-unavailable.d.ts.map +1 -0
- package/dist/services/imagegen/backend-selector.d.ts.map +1 -0
- package/dist/services/imagegen/coreml-unavailable.d.ts.map +1 -0
- package/dist/services/imagegen/errors.d.ts.map +1 -0
- package/dist/services/imagegen/index.d.ts.map +1 -0
- package/dist/services/imagegen/mflux.d.ts.map +1 -0
- package/{src → dist}/services/imagegen/sd-cpp.d.ts +1 -0
- package/dist/services/imagegen/sd-cpp.d.ts.map +1 -0
- package/dist/services/imagegen/tensorrt-unavailable.d.ts.map +1 -0
- package/dist/services/imagegen/types.d.ts.map +1 -0
- package/{src → dist}/services/index.d.ts +3 -1
- package/dist/services/index.d.ts.map +1 -0
- package/dist/services/index.js +39453 -0
- package/dist/services/index.js.map +227 -0
- package/dist/services/inference-capabilities.d.ts.map +1 -0
- package/dist/services/inference-telemetry.d.ts.map +1 -0
- package/dist/services/ios-llama-streaming.d.ts +119 -0
- package/dist/services/ios-llama-streaming.d.ts.map +1 -0
- package/dist/services/kv-spill.d.ts.map +1 -0
- package/dist/services/latency-trace.d.ts.map +1 -0
- package/dist/services/lib-target.d.ts +55 -0
- package/dist/services/lib-target.d.ts.map +1 -0
- package/dist/services/live-signals.d.ts +86 -0
- package/dist/services/live-signals.d.ts.map +1 -0
- package/dist/services/llama-server-metrics.d.ts +114 -0
- package/dist/services/llama-server-metrics.d.ts.map +1 -0
- package/dist/services/llm-streaming-binding.d.ts.map +1 -0
- package/dist/services/load-args.d.ts.map +1 -0
- package/dist/services/manifest/index.d.ts +4 -0
- package/dist/services/manifest/index.d.ts.map +1 -0
- package/{src → dist}/services/manifest/schema.d.ts +196 -6
- package/dist/services/manifest/schema.d.ts.map +1 -0
- package/{src → dist}/services/manifest/types.d.ts +3 -1
- package/dist/services/manifest/types.d.ts.map +1 -0
- package/dist/services/manifest/validator.d.ts.map +1 -0
- package/{src → dist}/services/memory-arbiter.d.ts +33 -3
- package/dist/services/memory-arbiter.d.ts.map +1 -0
- package/dist/services/memory-benchmark.d.ts +76 -0
- package/dist/services/memory-benchmark.d.ts.map +1 -0
- package/{src → dist}/services/memory-monitor.d.ts +6 -0
- package/dist/services/memory-monitor.d.ts.map +1 -0
- package/dist/services/memory-pressure.d.ts.map +1 -0
- package/dist/services/mtp-doctor.d.ts.map +1 -0
- package/dist/services/network-policy.d.ts.map +1 -0
- package/dist/services/paths.d.ts.map +1 -0
- package/dist/services/planner-skeleton.d.ts.map +1 -0
- package/dist/services/providers.d.ts.map +1 -0
- package/dist/services/ram-budget.d.ts.map +1 -0
- package/dist/services/readiness.d.ts.map +1 -0
- package/dist/services/recommendation.d.ts.map +1 -0
- package/{src → dist}/services/registry.d.ts +11 -13
- package/dist/services/registry.d.ts.map +1 -0
- package/{src → dist}/services/router-handler.d.ts +2 -2
- package/dist/services/router-handler.d.ts.map +1 -0
- package/{src → dist}/services/routing-policy.d.ts +32 -9
- package/dist/services/routing-policy.d.ts.map +1 -0
- package/dist/services/routing-preferences.d.ts.map +1 -0
- package/dist/services/runtime-target.d.ts.map +1 -0
- package/{src → dist}/services/service.d.ts +1 -1
- package/dist/services/service.d.ts.map +1 -0
- package/dist/services/session-pool.d.ts.map +1 -0
- package/dist/services/structured-output/deterministic-repair.d.ts.map +1 -0
- package/dist/services/structured-output/index.d.ts +2 -0
- package/dist/services/structured-output/index.d.ts.map +1 -0
- package/dist/services/structured-output.d.ts.map +1 -0
- package/dist/services/system-memory.d.ts.map +1 -0
- package/{src → dist}/services/types.d.ts +1 -1
- package/dist/services/types.d.ts.map +1 -0
- package/dist/services/verify-on-device.d.ts.map +1 -0
- package/dist/services/verify.d.ts.map +1 -0
- package/dist/services/vision/aosp-unavailable.d.ts.map +1 -0
- package/dist/services/vision/capacitor-llama.d.ts.map +1 -0
- package/dist/services/vision/cloud-fallback.d.ts.map +1 -0
- package/dist/services/vision/hash.d.ts.map +1 -0
- package/{src → dist}/services/vision/index.d.ts +1 -1
- package/dist/services/vision/index.d.ts.map +1 -0
- package/dist/services/vision/llama-server.d.ts.map +1 -0
- package/{src → dist}/services/vision/types.d.ts +13 -4
- package/dist/services/vision/types.d.ts.map +1 -0
- package/dist/services/vision/vast-fallback.d.ts.map +1 -0
- package/{src → dist}/services/vision-embedding-cache.d.ts +1 -1
- package/dist/services/vision-embedding-cache.d.ts.map +1 -0
- package/dist/services/voice/__test-helpers__/fake-ffi.d.ts +27 -0
- package/dist/services/voice/__test-helpers__/fake-ffi.d.ts.map +1 -0
- package/dist/services/voice/__test-helpers__/synthetic-speech.d.ts +66 -0
- package/dist/services/voice/__test-helpers__/synthetic-speech.d.ts.map +1 -0
- package/dist/services/voice/acoustic-speaker-attribution.d.ts +61 -0
- package/dist/services/voice/acoustic-speaker-attribution.d.ts.map +1 -0
- package/{src → dist}/services/voice/audio-frame-consumer.d.ts +82 -0
- package/dist/services/voice/audio-frame-consumer.d.ts.map +1 -0
- package/dist/services/voice/barge-in.d.ts.map +1 -0
- package/dist/services/voice/cancellation-coordinator.d.ts.map +1 -0
- package/dist/services/voice/checkpoint-manager.d.ts.map +1 -0
- package/dist/services/voice/checkpoint-policy.d.ts +178 -0
- package/dist/services/voice/checkpoint-policy.d.ts.map +1 -0
- package/dist/services/voice/corpus-augment.d.ts +111 -0
- package/dist/services/voice/corpus-augment.d.ts.map +1 -0
- package/dist/services/voice/corpus-generator.d.ts +134 -0
- package/dist/services/voice/corpus-generator.d.ts.map +1 -0
- package/dist/services/voice/diarization-error-rate.d.ts +40 -0
- package/dist/services/voice/diarization-error-rate.d.ts.map +1 -0
- package/dist/services/voice/e2e-harness.d.ts +297 -0
- package/dist/services/voice/e2e-harness.d.ts.map +1 -0
- package/dist/services/voice/eager-context-builder.d.ts.map +1 -0
- package/dist/services/voice/echo-delay.d.ts +67 -0
- package/dist/services/voice/echo-delay.d.ts.map +1 -0
- package/dist/services/voice/echo-metrics.d.ts +7 -0
- package/dist/services/voice/echo-metrics.d.ts.map +1 -0
- package/dist/services/voice/echo-reference-buffer.d.ts +65 -0
- package/dist/services/voice/echo-reference-buffer.d.ts.map +1 -0
- package/{src → dist}/services/voice/eliza1-eot-scorer.d.ts +8 -8
- package/dist/services/voice/eliza1-eot-scorer.d.ts.map +1 -0
- package/dist/services/voice/embedding-server.d.ts +37 -0
- package/dist/services/voice/embedding-server.d.ts.map +1 -0
- package/{src → dist}/services/voice/embedding.d.ts +2 -3
- package/dist/services/voice/embedding.d.ts.map +1 -0
- package/dist/services/voice/emotion-attribution.d.ts.map +1 -0
- package/{src → dist}/services/voice/engine-bridge.d.ts +8 -5
- package/dist/services/voice/engine-bridge.d.ts.map +1 -0
- package/{src → dist}/services/voice/eot-classifier-ggml.d.ts +22 -22
- package/dist/services/voice/eot-classifier-ggml.d.ts.map +1 -0
- package/{src → dist}/services/voice/eot-classifier.d.ts +9 -12
- package/dist/services/voice/eot-classifier.d.ts.map +1 -0
- package/{src → dist}/services/voice/errors.d.ts +1 -1
- package/dist/services/voice/errors.d.ts.map +1 -0
- package/{src → dist}/services/voice/expressive-tags.d.ts +5 -5
- package/dist/services/voice/expressive-tags.d.ts.map +1 -0
- package/{src → dist}/services/voice/ffi-bindings.d.ts +26 -4
- package/dist/services/voice/ffi-bindings.d.ts.map +1 -0
- package/dist/services/voice/first-line-cache.d.ts.map +1 -0
- package/{src → dist}/services/voice/fused-eot-scorer.d.ts +6 -6
- package/dist/services/voice/fused-eot-scorer.d.ts.map +1 -0
- package/{src → dist}/services/voice/index.d.ts +8 -3
- package/dist/services/voice/index.d.ts.map +1 -0
- package/dist/services/voice/kokoro/index.d.ts +24 -0
- package/dist/services/voice/kokoro/index.d.ts.map +1 -0
- package/{src → dist}/services/voice/kokoro/kokoro-backend.d.ts +15 -0
- package/dist/services/voice/kokoro/kokoro-backend.d.ts.map +1 -0
- package/{src → dist}/services/voice/kokoro/kokoro-engine-discovery.d.ts +1 -1
- package/dist/services/voice/kokoro/kokoro-engine-discovery.d.ts.map +1 -0
- package/{src → dist}/services/voice/kokoro/kokoro-ffi-runtime.d.ts +3 -3
- package/dist/services/voice/kokoro/kokoro-ffi-runtime.d.ts.map +1 -0
- package/dist/services/voice/kokoro/kokoro-runtime.d.ts.map +1 -0
- package/dist/services/voice/kokoro/phoneme-stream.d.ts +51 -0
- package/dist/services/voice/kokoro/phoneme-stream.d.ts.map +1 -0
- package/dist/services/voice/kokoro/phonemizer.d.ts.map +1 -0
- package/{src → dist}/services/voice/kokoro/pick-runtime.d.ts +1 -1
- package/dist/services/voice/kokoro/pick-runtime.d.ts.map +1 -0
- package/dist/services/voice/kokoro/runtime-selection.d.ts +31 -0
- package/dist/services/voice/kokoro/runtime-selection.d.ts.map +1 -0
- package/dist/services/voice/kokoro/types.d.ts.map +1 -0
- package/dist/services/voice/kokoro/voice-presets.d.ts.map +1 -0
- package/dist/services/voice/kokoro/voices.d.ts.map +1 -0
- package/dist/services/voice/lifecycle.d.ts.map +1 -0
- package/dist/services/voice/live-diarization-session.d.ts +196 -0
- package/dist/services/voice/live-diarization-session.d.ts.map +1 -0
- package/dist/services/voice/metric-math.d.ts +10 -0
- package/dist/services/voice/metric-math.d.ts.map +1 -0
- package/{src → dist}/services/voice/mic-source.d.ts +1 -1
- package/dist/services/voice/mic-source.d.ts.map +1 -0
- package/dist/services/voice/nlms-echo-canceller.d.ts +137 -0
- package/dist/services/voice/nlms-echo-canceller.d.ts.map +1 -0
- package/dist/services/voice/optimistic-policy.d.ts.map +1 -0
- package/dist/services/voice/optimistic-rollback.d.ts +151 -0
- package/dist/services/voice/optimistic-rollback.d.ts.map +1 -0
- package/{src → dist}/services/voice/partial-stabilizer.d.ts +1 -1
- package/dist/services/voice/partial-stabilizer.d.ts.map +1 -0
- package/dist/services/voice/phoneme-tokenizer.d.ts.map +1 -0
- package/dist/services/voice/phrase-cache.d.ts.map +1 -0
- package/dist/services/voice/phrase-chunker.d.ts.map +1 -0
- package/dist/services/voice/pipeline-impls.d.ts.map +1 -0
- package/dist/services/voice/pipeline.d.ts.map +1 -0
- package/dist/services/voice/prefill-client.d.ts.map +1 -0
- package/dist/services/voice/prefix-preserving-queue.d.ts.map +1 -0
- package/dist/services/voice/profile-store.d.ts.map +1 -0
- package/dist/services/voice/ring-buffer.d.ts.map +1 -0
- package/dist/services/voice/rollback-queue.d.ts.map +1 -0
- package/dist/services/voice/samantha-preset-placeholder.d.ts.map +1 -0
- package/dist/services/voice/samantha-preset-regenerator.d.ts.map +1 -0
- package/dist/services/voice/scheduler.d.ts.map +1 -0
- package/dist/services/voice/self-voice-imprint.d.ts +33 -0
- package/dist/services/voice/self-voice-imprint.d.ts.map +1 -0
- package/{src → dist}/services/voice/shared-resources.d.ts +14 -0
- package/dist/services/voice/shared-resources.d.ts.map +1 -0
- package/dist/services/voice/speaker/attribution-pipeline.d.ts.map +1 -0
- package/dist/services/voice/speaker/diarizer-fused.d.ts.map +1 -0
- package/dist/services/voice/speaker/diarizer.d.ts.map +1 -0
- package/dist/services/voice/speaker/encoder-fused.d.ts.map +1 -0
- package/dist/services/voice/speaker/encoder-ggml.d.ts.map +1 -0
- package/dist/services/voice/speaker/encoder.d.ts.map +1 -0
- package/dist/services/voice/speaker-imprint.d.ts.map +1 -0
- package/dist/services/voice/speaker-preset-cache.d.ts.map +1 -0
- package/dist/services/voice/streaming-asr/streaming-pipeline-adapter.d.ts +160 -0
- package/dist/services/voice/streaming-asr/streaming-pipeline-adapter.d.ts.map +1 -0
- package/dist/services/voice/system-audio-sink.d.ts.map +1 -0
- package/{src → dist}/services/voice/transcriber.d.ts +4 -4
- package/dist/services/voice/transcriber.d.ts.map +1 -0
- package/dist/services/voice/transcript-knowledge.d.ts.map +1 -0
- package/{src → dist}/services/voice/transcript-service.d.ts +20 -1
- package/dist/services/voice/transcript-service.d.ts.map +1 -0
- package/{src → dist}/services/voice/transcript-store.d.ts +12 -1
- package/dist/services/voice/transcript-store.d.ts.map +1 -0
- package/dist/services/voice/turn-controller.d.ts.map +1 -0
- package/{src → dist}/services/voice/types.d.ts +6 -6
- package/dist/services/voice/types.d.ts.map +1 -0
- package/{src → dist}/services/voice/vad.d.ts +6 -5
- package/dist/services/voice/vad.d.ts.map +1 -0
- package/dist/services/voice/voice-budget.d.ts.map +1 -0
- package/dist/services/voice/voice-emotion-classifier.d.ts.map +1 -0
- package/dist/services/voice/voice-preload-predictor.d.ts +76 -0
- package/dist/services/voice/voice-preload-predictor.d.ts.map +1 -0
- package/{src → dist}/services/voice/voice-preset-format.d.ts +2 -2
- package/dist/services/voice/voice-preset-format.d.ts.map +1 -0
- package/dist/services/voice/voice-profile-artifact.d.ts.map +1 -0
- package/dist/services/voice/voice-profile-routes.d.ts.map +1 -0
- package/dist/services/voice/voice-scenario.d.ts +131 -0
- package/dist/services/voice/voice-scenario.d.ts.map +1 -0
- package/dist/services/voice/voice-state-machine.d.ts.map +1 -0
- package/dist/services/voice/voice-workbench-report.d.ts +117 -0
- package/dist/services/voice/voice-workbench-report.d.ts.map +1 -0
- package/{src → dist}/services/voice/wake-word-ggml.d.ts +8 -9
- package/dist/services/voice/wake-word-ggml.d.ts.map +1 -0
- package/dist/services/voice/wake-word.d.ts.map +1 -0
- package/dist/services/voice/wav-codec.d.ts +11 -0
- package/dist/services/voice/wav-codec.d.ts.map +1 -0
- package/dist/services/voice/workbench-entrypoint.d.ts +42 -0
- package/dist/services/voice/workbench-entrypoint.d.ts.map +1 -0
- package/dist/services/voice/workbench-headless-runner.d.ts +102 -0
- package/dist/services/voice/workbench-headless-runner.d.ts.map +1 -0
- package/dist/services/voice/workbench-logic-services.d.ts +36 -0
- package/dist/services/voice/workbench-logic-services.d.ts.map +1 -0
- package/dist/services/voice/workbench-real-services.d.ts +17 -0
- package/dist/services/voice/workbench-real-services.d.ts.map +1 -0
- package/dist/services/voice/workbench-scenarios.d.ts +24 -0
- package/dist/services/voice/workbench-scenarios.d.ts.map +1 -0
- package/dist/services/voice/wrap-with-first-line-cache.d.ts.map +1 -0
- package/dist/services/voice-model-updater.d.ts.map +1 -0
- package/dist/services/voice-prewarm.d.ts.map +1 -0
- package/dist/voice-workbench.d.ts +18 -0
- package/dist/voice-workbench.d.ts.map +1 -0
- package/dist/voice-workbench.js +5259 -0
- package/dist/voice-workbench.js.map +34 -0
- package/package.json +28 -9
- package/registry-entry.json +137 -0
- package/src/adapters/capacitor-llama/__tests__/voice-turn.test.ts +293 -0
- package/src/adapters/capacitor-llama/environment.ts +1 -1
- package/src/adapters/capacitor-llama/index.ts +28 -4
- package/src/adapters/capacitor-llama/native-voice-capture.ts +140 -0
- package/src/adapters/capacitor-llama/text-streaming.ts +2 -2
- package/src/adapters/capacitor-llama/voice-turn.ts +178 -0
- package/src/backends/apple-foundation.ts +1 -1
- package/src/local-inference-routes.test.ts +57 -11
- package/src/local-inference-routes.ts +90 -8
- package/src/provider.ts +32 -3
- package/src/routes/compat-helpers.ts +2 -1
- package/src/routes/index.ts +1 -0
- package/src/routes/live-diarization-route.test.ts +134 -0
- package/src/routes/live-diarization-route.ts +79 -3
- package/src/routes/local-inference-asr-route.test.ts +43 -2
- package/src/routes/local-inference-asr-route.ts +7 -4
- package/src/routes/local-inference-asr-transcribe.test.ts +4 -4
- package/src/routes/local-inference-asr-transcribe.ts +1 -1
- package/src/routes/local-inference-compat-routes.test.ts +3 -3
- package/src/routes/local-inference-compat-routes.ts +23 -56
- package/src/routes/native-pcm-turn-route.test.ts +136 -0
- package/src/routes/native-pcm-turn-route.ts +121 -0
- package/src/routes/transcripts-routes.test.ts +51 -0
- package/src/routes/transcripts-routes.ts +35 -3
- package/src/runtime/bionic-wire-encoding.test.ts +147 -0
- package/src/runtime/ensure-local-inference-handler.test.ts +203 -5
- package/src/runtime/ensure-local-inference-handler.ts +203 -11
- package/src/runtime/index.ts +4 -1
- package/src/runtime/mobile-local-inference-gate.test.ts +85 -2
- package/src/runtime/mobile-local-inference-gate.ts +60 -5
- package/src/runtime/voice-entity-binding.transcript.test.ts +29 -0
- package/src/runtime/voice-entity-binding.ts +46 -6
- package/src/runtime/voice-speaker-entity-contract.test.ts +149 -0
- package/src/services/README.md +2 -2
- package/src/services/__tests__/backend-selector.precedence.test.ts +333 -0
- package/src/services/active-model-context-fit.test.ts +125 -0
- package/src/services/active-model.ts +211 -8
- package/src/services/asr-provenance.ts +68 -0
- package/src/services/assignment-validation.test.ts +118 -0
- package/src/services/assignments.test.ts +26 -0
- package/src/services/assignments.ts +52 -4
- package/src/services/backend.test.ts +84 -0
- package/src/services/backend.ts +198 -19
- package/src/services/bionic-host-loader.test.ts +94 -1
- package/src/services/bionic-host-loader.ts +72 -0
- package/src/services/cache-bridge.test.ts +7 -7
- package/src/services/catalog.test.ts +32 -11
- package/src/services/catalog.ts +6 -0
- package/src/services/cloud-fallback.ts +1 -1
- package/src/services/context-fit.test.ts +121 -0
- package/src/services/context-fit.ts +113 -0
- package/src/services/desktop-fused-ffi-backend-runtime.ts +99 -7
- package/src/services/device-tier.test.ts +89 -2
- package/src/services/device-tier.ts +103 -11
- package/src/services/downloader.test.ts +199 -58
- package/src/services/downloader.ts +141 -27
- package/src/services/engine-direct-bundle.test.ts +38 -6
- package/src/services/engine.ts +291 -104
- package/src/services/ensure-local-artifacts.ts +1 -1
- package/src/services/ffi-llm-streaming-abi.ts +6 -3
- package/src/services/ffi-streaming-backend.ts +44 -8
- package/src/services/ffi-streaming-runner.test.ts +163 -3
- package/src/services/ffi-streaming-runner.ts +54 -1
- package/src/services/ffi-unload-ordering.test.ts +5 -1
- package/src/services/fused-eliza1-no-regression.test.ts +144 -0
- package/src/services/hardware.test.ts +7 -2
- package/src/services/hardware.ts +28 -0
- package/src/services/imagegen/backend-selector.test.ts +190 -0
- package/src/services/imagegen/sd-cpp.ts +6 -9
- package/src/services/index.ts +18 -0
- package/src/services/ios-llama-streaming.ts +1 -1
- package/src/services/kv-spill.ts +6 -5
- package/src/services/lib-target.test.ts +145 -0
- package/src/services/lib-target.ts +102 -0
- package/src/services/live-signals.test.ts +132 -0
- package/src/services/live-signals.ts +177 -0
- package/src/services/llama-server-metrics.test.ts +168 -0
- package/src/services/manifest/eliza-1.manifest.v1.json +84 -2
- package/src/services/manifest/index.ts +6 -0
- package/src/services/manifest/manifest.test.ts +156 -54
- package/src/services/manifest/schema.ts +160 -52
- package/src/services/manifest/types.ts +6 -0
- package/src/services/manifest/validator.ts +91 -25
- package/src/services/memory-arbiter.test.ts +139 -0
- package/src/services/memory-arbiter.ts +81 -15
- package/src/services/memory-benchmark.test.ts +91 -0
- package/src/services/memory-benchmark.ts +354 -0
- package/src/services/memory-monitor.test.ts +24 -0
- package/src/services/memory-monitor.ts +12 -0
- package/src/services/mtp-doctor.ts +10 -2
- package/src/services/network-policy.ts +5 -5
- package/src/services/ram-budget-cache.test.ts +2 -1
- package/src/services/ram-budget.ts +0 -0
- package/src/services/recommendation.test.ts +216 -0
- package/src/services/registry.ts +25 -19
- package/src/services/required-kernels-gate.test.ts +64 -0
- package/src/services/router-handler.ts +43 -24
- package/src/services/routing-policy.test.ts +211 -23
- package/src/services/routing-policy.ts +92 -22
- package/src/services/service.test.ts +3 -3
- package/src/services/service.ts +22 -7
- package/src/services/transcription-priority.test.ts +2 -2
- package/src/services/types.ts +4 -0
- package/src/services/verify-on-device.test.ts +2 -2
- package/src/services/vision/hash.ts +1 -1
- package/src/services/vision/index.ts +2 -2
- package/src/services/vision/llama-server.ts +1 -1
- package/src/services/vision/types.ts +13 -4
- package/src/services/vision-embedding-cache.ts +1 -1
- package/src/services/voice/VOICE_WORKBENCH.md +71 -26
- package/src/services/voice/__fixtures__/voice-workbench-logic-baseline.json +180 -0
- package/src/services/voice/__test-helpers__/synthetic-speech.ts +72 -2
- package/src/services/voice/__tests__/eliza1-eot-scorer.test.ts +29 -29
- package/src/services/voice/__tests__/streaming-asr.test.ts +1 -1
- package/src/services/voice/acoustic-speaker-attribution.test.ts +165 -0
- package/src/services/voice/acoustic-speaker-attribution.ts +336 -0
- package/src/services/voice/asr-timed.real.test.ts +6 -8
- package/src/services/voice/audio-frame-consumer.test.ts +327 -1
- package/src/services/voice/audio-frame-consumer.ts +165 -5
- package/src/services/voice/barge-in.ts +2 -3
- package/src/services/voice/corpus-augment.test.ts +276 -0
- package/src/services/voice/corpus-augment.ts +451 -0
- package/src/services/voice/corpus-generator.test.ts +201 -0
- package/src/services/voice/corpus-generator.ts +413 -0
- package/src/services/voice/diarization-error-rate.greedy.test.ts +140 -0
- package/src/services/voice/diarization-error-rate.test.ts +100 -0
- package/src/services/voice/diarization-error-rate.ts +249 -0
- package/src/services/voice/e2e-harness.der.test.ts +94 -0
- package/src/services/voice/e2e-harness.respond-eot-entity.test.ts +277 -0
- package/src/services/voice/e2e-harness.security-echo.test.ts +103 -0
- package/src/services/voice/e2e-harness.test.ts +2 -2
- package/src/services/voice/e2e-harness.ts +175 -16
- package/src/services/voice/echo-delay.test.ts +118 -0
- package/src/services/voice/echo-delay.ts +135 -0
- package/src/services/voice/echo-metrics.test.ts +17 -0
- package/src/services/voice/echo-metrics.ts +20 -0
- package/src/services/voice/echo-reference-buffer.test.ts +86 -0
- package/src/services/voice/echo-reference-buffer.ts +165 -0
- package/src/services/voice/eliza1-eot-scorer.ts +22 -22
- package/src/services/voice/embedding.ts +2 -3
- package/src/services/voice/engine-bridge-transcript-join.test.ts +278 -0
- package/src/services/voice/engine-bridge.ts +151 -110
- package/src/services/voice/eot-classifier-ggml.ts +42 -39
- package/src/services/voice/eot-classifier.test.ts +98 -0
- package/src/services/voice/eot-classifier.ts +11 -122
- package/src/services/voice/errors.ts +2 -0
- package/src/services/voice/expressive-tags.asr.test.ts +77 -0
- package/src/services/voice/expressive-tags.test.ts +102 -0
- package/src/services/voice/expressive-tags.ts +8 -8
- package/src/services/voice/ffi-bindings.test.ts +10 -3
- package/src/services/voice/ffi-bindings.ts +177 -15
- package/src/services/voice/fused-eot-scorer.ts +17 -13
- package/src/services/voice/index.ts +33 -12
- package/src/services/voice/kokoro/__tests__/kokoro-backend.test.ts +112 -1
- package/src/services/voice/kokoro/__tests__/kokoro-engine-bridge.real.test.ts +88 -3
- package/src/services/voice/kokoro/__tests__/runtime-selection.test.ts +37 -201
- package/src/services/voice/kokoro/kokoro-backend.ts +16 -0
- package/src/services/voice/kokoro/kokoro-engine-discovery.ts +1 -1
- package/src/services/voice/kokoro/kokoro-ffi-runtime.ts +3 -3
- package/src/services/voice/kokoro/pick-runtime.ts +1 -1
- package/src/services/voice/kokoro/runtime-selection.ts +28 -201
- package/src/services/voice/live-diarization-session.echo.test.ts +232 -0
- package/src/services/voice/live-diarization-session.ts +335 -2
- package/src/services/voice/metric-math.test.ts +61 -0
- package/src/services/voice/metric-math.ts +25 -0
- package/src/services/voice/mic-source.ts +1 -1
- package/src/services/voice/nlms-echo-canceller.test.ts +244 -0
- package/src/services/voice/nlms-echo-canceller.ts +317 -0
- package/src/services/voice/optimistic-policy.power-source.test.ts +36 -0
- package/src/services/voice/partial-stabilizer.ts +1 -1
- package/src/services/voice/pipeline.ts +3 -4
- package/src/services/voice/research/VOICE_8785_ASSESSMENT.md +141 -0
- package/src/services/voice/research/VOICE_PIPELINE_RESEARCH_2026.md +117 -0
- package/src/services/voice/research/VOICE_VALIDATION_RUNBOOK.md +135 -0
- package/src/services/voice/samantha-preset-regenerator.wav.test.ts +90 -0
- package/src/services/voice/self-voice-imprint.test.ts +59 -0
- package/src/services/voice/self-voice-imprint.ts +102 -0
- package/src/services/voice/shared-resources.ts +23 -0
- package/src/services/voice/speaker/attribution-pipeline.test.ts +221 -0
- package/src/services/voice/speaker/attribution-pipeline.ts +85 -22
- package/src/services/voice/speaker/encoder-ggml.test.ts +59 -0
- package/src/services/voice/transcriber.asr-backend.test.ts +76 -0
- package/src/services/voice/transcriber.ts +4 -4
- package/src/services/voice/transcript-service.test.ts +58 -0
- package/src/services/voice/transcript-service.ts +64 -0
- package/src/services/voice/transcript-store.test.ts +36 -0
- package/src/services/voice/transcript-store.ts +32 -0
- package/src/services/voice/types.ts +7 -7
- package/src/services/voice/vad.test.ts +33 -15
- package/src/services/voice/vad.ts +25 -20
- package/src/services/voice/voice-budget.test.ts +0 -3
- package/src/services/voice/voice-budget.ts +6 -6
- package/src/services/voice/voice-duet.test.ts +1 -1
- package/src/services/voice/voice-hardening.fuzz.test.ts +116 -0
- package/src/services/voice/voice-preload-predictor.test.ts +130 -0
- package/src/services/voice/voice-preload-predictor.ts +113 -0
- package/src/services/voice/voice-preset-format.fuzz.test.ts +89 -0
- package/src/services/voice/voice-preset-format.test.ts +75 -0
- package/src/services/voice/voice-preset-format.ts +17 -4
- package/src/services/voice/voice-scenario.test.ts +159 -0
- package/src/services/voice/voice-scenario.ts +133 -7
- package/src/services/voice/voice-scenario.turn-helpers.test.ts +77 -0
- package/src/services/voice/voice-workbench-report.ts +58 -17
- package/src/services/voice/wake-word-ggml.ts +12 -13
- package/src/services/voice/wav-codec.fuzz.test.ts +59 -0
- package/src/services/voice/wav-codec.test.ts +32 -0
- package/src/services/voice/wav-codec.ts +101 -0
- package/src/services/voice/workbench-entrypoint.test.ts +55 -0
- package/src/services/voice/workbench-entrypoint.ts +88 -0
- package/src/services/voice/workbench-headless-runner.test.ts +162 -0
- package/src/services/voice/workbench-headless-runner.ts +396 -0
- package/src/services/voice/workbench-logic-services.test.ts +225 -0
- package/src/services/voice/workbench-logic-services.ts +184 -0
- package/src/services/voice/workbench-real-services.ts +629 -0
- package/src/services/voice/workbench-scenarios.ts +407 -0
- package/src/services/voice-prewarm.ts +1 -1
- package/src/voice-workbench.ts +71 -0
- package/src/actions/generate-media.d.ts.map +0 -1
- package/src/actions/identify-speaker.d.ts.map +0 -1
- package/src/actions/transcription-control.d.ts.map +0 -1
- package/src/index.d.ts.map +0 -1
- package/src/local-inference-routes.d.ts.map +0 -1
- package/src/provider.d.ts.map +0 -1
- package/src/routes/compat-helpers.d.ts.map +0 -1
- package/src/routes/family-member-route.d.ts.map +0 -1
- package/src/routes/index.d.ts.map +0 -1
- package/src/routes/live-diarization-route.d.ts.map +0 -1
- package/src/routes/local-inference-asr-route.d.ts.map +0 -1
- package/src/routes/local-inference-asr-transcribe.d.ts.map +0 -1
- package/src/routes/local-inference-compat-routes.d.ts.map +0 -1
- package/src/routes/local-inference-tts-route.d.ts.map +0 -1
- package/src/routes/transcript-audio-store.d.ts.map +0 -1
- package/src/routes/transcripts-routes.d.ts.map +0 -1
- package/src/routes/voice-first-run-routes.d.ts.map +0 -1
- package/src/routes/voice-models-routes.d.ts.map +0 -1
- package/src/routes/voice-profile-plugin-routes.d.ts.map +0 -1
- package/src/routes/voice-profiles-management-routes.d.ts.map +0 -1
- package/src/routes/voice-speaker-profile-routes.d.ts.map +0 -1
- package/src/runtime/embedding-manager-support.d.ts.map +0 -1
- package/src/runtime/embedding-presets.d.ts.map +0 -1
- package/src/runtime/embedding-warmup-policy.d.ts.map +0 -1
- package/src/runtime/ensure-local-inference-handler.d.ts.map +0 -1
- package/src/runtime/index.d.ts.map +0 -1
- package/src/runtime/mobile-local-inference-gate.d.ts +0 -31
- package/src/runtime/mobile-local-inference-gate.d.ts.map +0 -1
- package/src/runtime/voice-entity-binding.d.ts.map +0 -1
- package/src/services/active-model.d.ts.map +0 -1
- package/src/services/assignments.d.ts.map +0 -1
- package/src/services/backend.d.ts.map +0 -1
- package/src/services/bionic-host-loader.d.ts.map +0 -1
- package/src/services/bundled-models.d.ts.map +0 -1
- package/src/services/cache-bridge.d.ts.map +0 -1
- package/src/services/catalog.d.ts +0 -10
- package/src/services/catalog.d.ts.map +0 -1
- package/src/services/checkpoint-client.d.ts.map +0 -1
- package/src/services/cloud-fallback.d.ts.map +0 -1
- package/src/services/conversation-registry.d.ts.map +0 -1
- package/src/services/desktop-fused-ffi-backend-runtime.d.ts.map +0 -1
- package/src/services/device-bridge.d.ts.map +0 -1
- package/src/services/device-resource-metrics.d.ts.map +0 -1
- package/src/services/device-tier.d.ts.map +0 -1
- package/src/services/downloader.d.ts.map +0 -1
- package/src/services/engine.d.ts.map +0 -1
- package/src/services/external-scanner.d.ts.map +0 -1
- package/src/services/ffi-streaming-backend.d.ts.map +0 -1
- package/src/services/ffi-streaming-runner.d.ts.map +0 -1
- package/src/services/gpu-detect.d.ts.map +0 -1
- package/src/services/handler-registry.d.ts.map +0 -1
- package/src/services/hardware.d.ts.map +0 -1
- package/src/services/hf-search.d.ts +0 -26
- package/src/services/hf-search.d.ts.map +0 -1
- package/src/services/hf-search.test.ts +0 -69
- package/src/services/hf-search.ts +0 -420
- package/src/services/image-description-runtime.d.ts.map +0 -1
- package/src/services/imagegen/aosp-unavailable.d.ts.map +0 -1
- package/src/services/imagegen/backend-selector.d.ts.map +0 -1
- package/src/services/imagegen/coreml-unavailable.d.ts.map +0 -1
- package/src/services/imagegen/errors.d.ts.map +0 -1
- package/src/services/imagegen/index.d.ts.map +0 -1
- package/src/services/imagegen/mflux.d.ts.map +0 -1
- package/src/services/imagegen/sd-cpp.d.ts.map +0 -1
- package/src/services/imagegen/tensorrt-unavailable.d.ts.map +0 -1
- package/src/services/imagegen/types.d.ts.map +0 -1
- package/src/services/index.d.ts.map +0 -1
- package/src/services/inference-capabilities.d.ts.map +0 -1
- package/src/services/inference-telemetry.d.ts.map +0 -1
- package/src/services/kv-spill.d.ts.map +0 -1
- package/src/services/latency-trace.d.ts.map +0 -1
- package/src/services/llm-streaming-binding.d.ts.map +0 -1
- package/src/services/load-args.d.ts.map +0 -1
- package/src/services/manifest/index.d.ts +0 -4
- package/src/services/manifest/index.d.ts.map +0 -1
- package/src/services/manifest/schema.d.ts.map +0 -1
- package/src/services/manifest/types.d.ts.map +0 -1
- package/src/services/manifest/validator.d.ts.map +0 -1
- package/src/services/memory-arbiter.d.ts.map +0 -1
- package/src/services/memory-monitor.d.ts.map +0 -1
- package/src/services/memory-pressure.d.ts.map +0 -1
- package/src/services/mtp-doctor.d.ts.map +0 -1
- package/src/services/network-policy.d.ts.map +0 -1
- package/src/services/paths.d.ts.map +0 -1
- package/src/services/planner-skeleton.d.ts.map +0 -1
- package/src/services/providers.d.ts.map +0 -1
- package/src/services/ram-budget.d.ts.map +0 -1
- package/src/services/readiness.d.ts.map +0 -1
- package/src/services/recommendation.d.ts.map +0 -1
- package/src/services/registry.d.ts.map +0 -1
- package/src/services/router-handler.d.ts.map +0 -1
- package/src/services/routing-policy.d.ts.map +0 -1
- package/src/services/routing-preferences.d.ts.map +0 -1
- package/src/services/runtime-target.d.ts.map +0 -1
- package/src/services/service.d.ts.map +0 -1
- package/src/services/session-pool.d.ts.map +0 -1
- package/src/services/structured-output/deterministic-repair.d.ts.map +0 -1
- package/src/services/structured-output.d.ts.map +0 -1
- package/src/services/system-memory.d.ts.map +0 -1
- package/src/services/types.d.ts.map +0 -1
- package/src/services/verify-on-device.d.ts.map +0 -1
- package/src/services/verify.d.ts.map +0 -1
- package/src/services/vision/aosp-unavailable.d.ts.map +0 -1
- package/src/services/vision/capacitor-llama.d.ts.map +0 -1
- package/src/services/vision/cloud-fallback.d.ts.map +0 -1
- package/src/services/vision/hash.d.ts.map +0 -1
- package/src/services/vision/index.d.ts.map +0 -1
- package/src/services/vision/llama-server.d.ts.map +0 -1
- package/src/services/vision/types.d.ts.map +0 -1
- package/src/services/vision/vast-fallback.d.ts.map +0 -1
- package/src/services/vision-embedding-cache.d.ts.map +0 -1
- package/src/services/voice/audio-frame-consumer.d.ts.map +0 -1
- package/src/services/voice/barge-in.d.ts.map +0 -1
- package/src/services/voice/cancellation-coordinator.d.ts.map +0 -1
- package/src/services/voice/checkpoint-manager.d.ts.map +0 -1
- package/src/services/voice/eager-context-builder.d.ts.map +0 -1
- package/src/services/voice/eliza1-eot-scorer.d.ts.map +0 -1
- package/src/services/voice/embedding.d.ts.map +0 -1
- package/src/services/voice/emotion-attribution.d.ts.map +0 -1
- package/src/services/voice/engine-bridge.d.ts.map +0 -1
- package/src/services/voice/eot-classifier-ggml.d.ts.map +0 -1
- package/src/services/voice/eot-classifier.d.ts.map +0 -1
- package/src/services/voice/errors.d.ts.map +0 -1
- package/src/services/voice/expressive-tags.d.ts.map +0 -1
- package/src/services/voice/ffi-bindings.d.ts.map +0 -1
- package/src/services/voice/first-line-cache.d.ts.map +0 -1
- package/src/services/voice/fused-eot-scorer.d.ts.map +0 -1
- package/src/services/voice/index.d.ts.map +0 -1
- package/src/services/voice/kokoro/kokoro-backend.d.ts.map +0 -1
- package/src/services/voice/kokoro/kokoro-engine-discovery.d.ts.map +0 -1
- package/src/services/voice/kokoro/kokoro-ffi-runtime.d.ts.map +0 -1
- package/src/services/voice/kokoro/kokoro-runtime.d.ts.map +0 -1
- package/src/services/voice/kokoro/phonemizer.d.ts.map +0 -1
- package/src/services/voice/kokoro/pick-runtime.d.ts.map +0 -1
- package/src/services/voice/kokoro/runtime-selection.d.ts +0 -92
- package/src/services/voice/kokoro/runtime-selection.d.ts.map +0 -1
- package/src/services/voice/kokoro/types.d.ts.map +0 -1
- package/src/services/voice/kokoro/voice-presets.d.ts.map +0 -1
- package/src/services/voice/kokoro/voices.d.ts.map +0 -1
- package/src/services/voice/lifecycle.d.ts.map +0 -1
- package/src/services/voice/live-diarization-session.d.ts +0 -96
- package/src/services/voice/live-diarization-session.d.ts.map +0 -1
- package/src/services/voice/mic-source.d.ts.map +0 -1
- package/src/services/voice/optimistic-policy.d.ts.map +0 -1
- package/src/services/voice/partial-stabilizer.d.ts.map +0 -1
- package/src/services/voice/phoneme-tokenizer.d.ts.map +0 -1
- package/src/services/voice/phrase-cache.d.ts.map +0 -1
- package/src/services/voice/phrase-chunker.d.ts.map +0 -1
- package/src/services/voice/pipeline-impls.d.ts.map +0 -1
- package/src/services/voice/pipeline.d.ts.map +0 -1
- package/src/services/voice/prefill-client.d.ts.map +0 -1
- package/src/services/voice/prefix-preserving-queue.d.ts.map +0 -1
- package/src/services/voice/profile-store.d.ts.map +0 -1
- package/src/services/voice/ring-buffer.d.ts.map +0 -1
- package/src/services/voice/rollback-queue.d.ts.map +0 -1
- package/src/services/voice/samantha-preset-placeholder.d.ts.map +0 -1
- package/src/services/voice/samantha-preset-regenerator.d.ts.map +0 -1
- package/src/services/voice/scheduler.d.ts.map +0 -1
- package/src/services/voice/shared-resources.d.ts.map +0 -1
- package/src/services/voice/speaker/attribution-pipeline.d.ts.map +0 -1
- package/src/services/voice/speaker/diarizer-fused.d.ts.map +0 -1
- package/src/services/voice/speaker/diarizer.d.ts.map +0 -1
- package/src/services/voice/speaker/encoder-fused.d.ts.map +0 -1
- package/src/services/voice/speaker/encoder-ggml.d.ts.map +0 -1
- package/src/services/voice/speaker/encoder.d.ts.map +0 -1
- package/src/services/voice/speaker-imprint.d.ts.map +0 -1
- package/src/services/voice/speaker-preset-cache.d.ts.map +0 -1
- package/src/services/voice/system-audio-sink.d.ts.map +0 -1
- package/src/services/voice/transcriber.d.ts.map +0 -1
- package/src/services/voice/transcript-knowledge.d.ts.map +0 -1
- package/src/services/voice/transcript-service.d.ts.map +0 -1
- package/src/services/voice/transcript-store.d.ts.map +0 -1
- package/src/services/voice/turn-controller.d.ts.map +0 -1
- package/src/services/voice/types.d.ts.map +0 -1
- package/src/services/voice/vad.d.ts.map +0 -1
- package/src/services/voice/voice-budget.d.ts.map +0 -1
- package/src/services/voice/voice-emotion-classifier.d.ts.map +0 -1
- package/src/services/voice/voice-preset-format.d.ts.map +0 -1
- package/src/services/voice/voice-profile-artifact.d.ts.map +0 -1
- package/src/services/voice/voice-profile-routes.d.ts.map +0 -1
- package/src/services/voice/voice-settings.d.ts +0 -82
- package/src/services/voice/voice-settings.d.ts.map +0 -1
- package/src/services/voice/voice-settings.ts +0 -172
- package/src/services/voice/voice-state-machine.d.ts.map +0 -1
- package/src/services/voice/wake-word-ggml.d.ts.map +0 -1
- package/src/services/voice/wake-word.d.ts.map +0 -1
- package/src/services/voice/wrap-with-first-line-cache.d.ts.map +0 -1
- package/src/services/voice-model-updater.d.ts.map +0 -1
- package/src/services/voice-prewarm.d.ts.map +0 -1
- /package/{src → dist}/actions/generate-media.d.ts +0 -0
- /package/{src → dist}/actions/identify-speaker.d.ts +0 -0
- /package/{src → dist}/actions/transcription-control.d.ts +0 -0
- /package/{src → dist}/index.d.ts +0 -0
- /package/{src → dist}/provider.d.ts +0 -0
- /package/{src → dist}/routes/family-member-route.d.ts +0 -0
- /package/{src → dist}/routes/local-inference-asr-route.d.ts +0 -0
- /package/{src → dist}/routes/local-inference-asr-transcribe.d.ts +0 -0
- /package/{src → dist}/routes/local-inference-compat-routes.d.ts +0 -0
- /package/{src → dist}/routes/local-inference-tts-route.d.ts +0 -0
- /package/{src → dist}/routes/transcript-audio-store.d.ts +0 -0
- /package/{src → dist}/routes/voice-first-run-routes.d.ts +0 -0
- /package/{src → dist}/routes/voice-models-routes.d.ts +0 -0
- /package/{src → dist}/routes/voice-profile-plugin-routes.d.ts +0 -0
- /package/{src → dist}/routes/voice-profiles-management-routes.d.ts +0 -0
- /package/{src → dist}/routes/voice-speaker-profile-routes.d.ts +0 -0
- /package/{src → dist}/runtime/embedding-manager-support.d.ts +0 -0
- /package/{src → dist}/runtime/embedding-presets.d.ts +0 -0
- /package/{src → dist}/runtime/embedding-warmup-policy.d.ts +0 -0
- /package/{src → dist}/services/bundled-models.d.ts +0 -0
- /package/{src → dist}/services/cache-bridge.d.ts +0 -0
- /package/{src → dist}/services/checkpoint-client.d.ts +0 -0
- /package/{src → dist}/services/cloud-fallback.d.ts +0 -0
- /package/{src → dist}/services/conversation-registry.d.ts +0 -0
- /package/{src → dist}/services/device-bridge.d.ts +0 -0
- /package/{src → dist}/services/device-resource-metrics.d.ts +0 -0
- /package/{src → dist}/services/external-scanner.d.ts +0 -0
- /package/{src → dist}/services/gpu-detect.d.ts +0 -0
- /package/{src → dist}/services/handler-registry.d.ts +0 -0
- /package/{src → dist}/services/hardware.d.ts +0 -0
- /package/{src → dist}/services/image-description-runtime.d.ts +0 -0
- /package/{src → dist}/services/imagegen/aosp-unavailable.d.ts +0 -0
- /package/{src → dist}/services/imagegen/backend-selector.d.ts +0 -0
- /package/{src → dist}/services/imagegen/coreml-unavailable.d.ts +0 -0
- /package/{src → dist}/services/imagegen/errors.d.ts +0 -0
- /package/{src → dist}/services/imagegen/index.d.ts +0 -0
- /package/{src → dist}/services/imagegen/mflux.d.ts +0 -0
- /package/{src → dist}/services/imagegen/tensorrt-unavailable.d.ts +0 -0
- /package/{src → dist}/services/imagegen/types.d.ts +0 -0
- /package/{src → dist}/services/inference-capabilities.d.ts +0 -0
- /package/{src → dist}/services/inference-telemetry.d.ts +0 -0
- /package/{src → dist}/services/kv-spill.d.ts +0 -0
- /package/{src → dist}/services/latency-trace.d.ts +0 -0
- /package/{src → dist}/services/llm-streaming-binding.d.ts +0 -0
- /package/{src → dist}/services/load-args.d.ts +0 -0
- /package/{src → dist}/services/manifest/validator.d.ts +0 -0
- /package/{src → dist}/services/memory-pressure.d.ts +0 -0
- /package/{src → dist}/services/mtp-doctor.d.ts +0 -0
- /package/{src → dist}/services/network-policy.d.ts +0 -0
- /package/{src → dist}/services/paths.d.ts +0 -0
- /package/{src → dist}/services/planner-skeleton.d.ts +0 -0
- /package/{src → dist}/services/providers.d.ts +0 -0
- /package/{src → dist}/services/ram-budget.d.ts +0 -0
- /package/{src → dist}/services/readiness.d.ts +0 -0
- /package/{src → dist}/services/recommendation.d.ts +0 -0
- /package/{src → dist}/services/routing-preferences.d.ts +0 -0
- /package/{src → dist}/services/runtime-target.d.ts +0 -0
- /package/{src → dist}/services/session-pool.d.ts +0 -0
- /package/{src → dist}/services/structured-output/deterministic-repair.d.ts +0 -0
- /package/{src → dist}/services/structured-output.d.ts +0 -0
- /package/{src → dist}/services/system-memory.d.ts +0 -0
- /package/{src → dist}/services/verify-on-device.d.ts +0 -0
- /package/{src → dist}/services/verify.d.ts +0 -0
- /package/{src → dist}/services/vision/aosp-unavailable.d.ts +0 -0
- /package/{src → dist}/services/vision/capacitor-llama.d.ts +0 -0
- /package/{src → dist}/services/vision/cloud-fallback.d.ts +0 -0
- /package/{src → dist}/services/vision/hash.d.ts +0 -0
- /package/{src → dist}/services/vision/llama-server.d.ts +0 -0
- /package/{src → dist}/services/vision/vast-fallback.d.ts +0 -0
- /package/{src → dist}/services/voice/barge-in.d.ts +0 -0
- /package/{src → dist}/services/voice/cancellation-coordinator.d.ts +0 -0
- /package/{src → dist}/services/voice/checkpoint-manager.d.ts +0 -0
- /package/{src → dist}/services/voice/eager-context-builder.d.ts +0 -0
- /package/{src → dist}/services/voice/emotion-attribution.d.ts +0 -0
- /package/{src → dist}/services/voice/first-line-cache.d.ts +0 -0
- /package/{src → dist}/services/voice/kokoro/kokoro-runtime.d.ts +0 -0
- /package/{src → dist}/services/voice/kokoro/phonemizer.d.ts +0 -0
- /package/{src → dist}/services/voice/kokoro/types.d.ts +0 -0
- /package/{src → dist}/services/voice/kokoro/voice-presets.d.ts +0 -0
- /package/{src → dist}/services/voice/kokoro/voices.d.ts +0 -0
- /package/{src → dist}/services/voice/lifecycle.d.ts +0 -0
- /package/{src → dist}/services/voice/optimistic-policy.d.ts +0 -0
- /package/{src → dist}/services/voice/phoneme-tokenizer.d.ts +0 -0
- /package/{src → dist}/services/voice/phrase-cache.d.ts +0 -0
- /package/{src → dist}/services/voice/phrase-chunker.d.ts +0 -0
- /package/{src → dist}/services/voice/pipeline-impls.d.ts +0 -0
- /package/{src → dist}/services/voice/pipeline.d.ts +0 -0
- /package/{src → dist}/services/voice/prefill-client.d.ts +0 -0
- /package/{src → dist}/services/voice/prefix-preserving-queue.d.ts +0 -0
- /package/{src → dist}/services/voice/profile-store.d.ts +0 -0
- /package/{src → dist}/services/voice/ring-buffer.d.ts +0 -0
- /package/{src → dist}/services/voice/rollback-queue.d.ts +0 -0
- /package/{src → dist}/services/voice/samantha-preset-placeholder.d.ts +0 -0
- /package/{src → dist}/services/voice/samantha-preset-regenerator.d.ts +0 -0
- /package/{src → dist}/services/voice/scheduler.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker/attribution-pipeline.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker/diarizer-fused.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker/diarizer.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker/encoder-fused.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker/encoder-ggml.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker/encoder.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker-imprint.d.ts +0 -0
- /package/{src → dist}/services/voice/speaker-preset-cache.d.ts +0 -0
- /package/{src → dist}/services/voice/system-audio-sink.d.ts +0 -0
- /package/{src → dist}/services/voice/transcript-knowledge.d.ts +0 -0
- /package/{src → dist}/services/voice/turn-controller.d.ts +0 -0
- /package/{src → dist}/services/voice/voice-budget.d.ts +0 -0
- /package/{src → dist}/services/voice/voice-emotion-classifier.d.ts +0 -0
- /package/{src → dist}/services/voice/voice-profile-artifact.d.ts +0 -0
- /package/{src → dist}/services/voice/voice-profile-routes.d.ts +0 -0
- /package/{src → dist}/services/voice/voice-state-machine.d.ts +0 -0
- /package/{src → dist}/services/voice/wake-word.d.ts +0 -0
- /package/{src → dist}/services/voice/wrap-with-first-line-cache.d.ts +0 -0
- /package/{src → dist}/services/voice-model-updater.d.ts +0 -0
- /package/{src → dist}/services/voice-prewarm.d.ts +0 -0
|
@@ -0,0 +1,396 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Voice Workbench headless runner (#8785).
|
|
3
|
+
*
|
|
4
|
+
* Drives a {@link VoiceScenario} + its generated corpus through the real voice
|
|
5
|
+
* services WITHOUT a browser, scores every turn with the shared scorers
|
|
6
|
+
* (`e2e-harness.ts`), and emits one {@link VoiceWorkbenchScenarioRun} the report
|
|
7
|
+
* layer (`voice-workbench-report.ts`) aggregates. The services are injected
|
|
8
|
+
* through {@link VoiceWorkbenchServices} so:
|
|
9
|
+
* - a provisioned local backend wires the real ASR / diarization / EOT /
|
|
10
|
+
* respond / entity / TTS path,
|
|
11
|
+
* - a mock returns ground-truth-derived observations for the CI plumbing lane,
|
|
12
|
+
* - and an ABSENT backend (`services === null`) or absent corpus
|
|
13
|
+
* (`corpus === null`) yields a `skipped` run — never a `pass` (honesty
|
|
14
|
+
* contract).
|
|
15
|
+
*
|
|
16
|
+
* Pure orchestration: it slices the corpus per turn, asks the services to
|
|
17
|
+
* observe the turn, and maps observations onto scorer inputs. No model loading
|
|
18
|
+
* here, so it is unit-testable with a fake services adapter.
|
|
19
|
+
*/
|
|
20
|
+
|
|
21
|
+
import { mkdirSync, writeFileSync } from "node:fs";
|
|
22
|
+
import path from "node:path";
|
|
23
|
+
import type {
|
|
24
|
+
CorpusGroundTruth,
|
|
25
|
+
CorpusTurnLabel,
|
|
26
|
+
GeneratedVoiceCorpus,
|
|
27
|
+
} from "./corpus-generator";
|
|
28
|
+
import {
|
|
29
|
+
type DiarizationTurnSample,
|
|
30
|
+
scoreDiarizationTimeline,
|
|
31
|
+
scoreEchoRejection,
|
|
32
|
+
scoreEntityExtraction,
|
|
33
|
+
scoreEotDecision,
|
|
34
|
+
scoreFirstResponseLatency,
|
|
35
|
+
scoreOwnerSecurity,
|
|
36
|
+
scoreRespondDecision,
|
|
37
|
+
scoreTtsAsrRoundTrip,
|
|
38
|
+
scoreVoiceEntityMatch,
|
|
39
|
+
type VoiceE2eCaseResult,
|
|
40
|
+
} from "./e2e-harness";
|
|
41
|
+
import type { VoiceScenario } from "./voice-scenario";
|
|
42
|
+
import type {
|
|
43
|
+
VoiceAudioArtifact,
|
|
44
|
+
VoiceWorkbenchScenarioRun,
|
|
45
|
+
} from "./voice-workbench-report";
|
|
46
|
+
import { encodeMonoPcm16Wav } from "./wav-codec";
|
|
47
|
+
|
|
48
|
+
/** What the real (or mock) services observed for one turn of audio. */
|
|
49
|
+
export interface VoiceTurnObservation {
|
|
50
|
+
/** ASR hypothesis transcript for the turn's audio. */
|
|
51
|
+
hypothesisTranscript: string;
|
|
52
|
+
/** Diarized speaker label, or null when the diarizer missed the turn. */
|
|
53
|
+
predictedSpeakerLabel: string | null;
|
|
54
|
+
/** The EOT classifier decided end-of-turn at this turn's boundary. */
|
|
55
|
+
eotDecided: boolean;
|
|
56
|
+
/** EOT decision latency (ms) from the true boundary, when measured. */
|
|
57
|
+
eotLatencyMs?: number;
|
|
58
|
+
/** The agent decided to respond to this turn. */
|
|
59
|
+
responded: boolean;
|
|
60
|
+
/** Entities inferred from this turn's transcript (name/partner extraction). */
|
|
61
|
+
inferredEntities: string[];
|
|
62
|
+
/** Voice→entity match: the entity the recognized voice resolved to (or null). */
|
|
63
|
+
matchedEntityId: string | null;
|
|
64
|
+
/** First-audio latency (ms) of the agent's spoken reply, when it replied. */
|
|
65
|
+
firstAudioMs?: number;
|
|
66
|
+
/** The system judged this turn to be the device owner (owner-security). */
|
|
67
|
+
predictedOwner?: boolean;
|
|
68
|
+
}
|
|
69
|
+
|
|
70
|
+
export interface VoiceWorkbenchServices {
|
|
71
|
+
/**
|
|
72
|
+
* Optional one-shot hook before a scenario's turns are scored. Real services
|
|
73
|
+
* use this to enroll speaker centroids from the generated corpus; mock
|
|
74
|
+
* services can omit it.
|
|
75
|
+
*/
|
|
76
|
+
prepareScenario?(args: {
|
|
77
|
+
scenario: VoiceScenario;
|
|
78
|
+
corpus: GeneratedVoiceCorpus;
|
|
79
|
+
}): Promise<void> | void;
|
|
80
|
+
/**
|
|
81
|
+
* Feed one turn's audio slice through the real services and report what was
|
|
82
|
+
* observed. The `label` carries the turn's ground truth (so a mock can echo
|
|
83
|
+
* it); the real adapter ignores it and measures.
|
|
84
|
+
*/
|
|
85
|
+
observeTurn(args: {
|
|
86
|
+
turnIndex: number;
|
|
87
|
+
audio: Float32Array;
|
|
88
|
+
sampleRate: number;
|
|
89
|
+
label: CorpusTurnLabel;
|
|
90
|
+
/** Scenario-level ground truth (participants, owner set, agents). */
|
|
91
|
+
groundTruth: CorpusGroundTruth;
|
|
92
|
+
}): Promise<VoiceTurnObservation>;
|
|
93
|
+
}
|
|
94
|
+
|
|
95
|
+
/**
|
|
96
|
+
* Where to write per-run `.wav` artifacts. When present, the runner encodes the
|
|
97
|
+
* full corpus + each consumed per-turn slice to disk under `dir` and records the
|
|
98
|
+
* paths (relative to `relativeTo`) on the run's `audioArtifacts`. Absent ⇒ no IO.
|
|
99
|
+
*/
|
|
100
|
+
export interface VoiceAudioCaptureSink {
|
|
101
|
+
/** Directory the `.wav` files are written into (created recursively). */
|
|
102
|
+
dir: string;
|
|
103
|
+
/** Artifact paths are recorded relative to this dir (the scenario run dir). */
|
|
104
|
+
relativeTo: string;
|
|
105
|
+
}
|
|
106
|
+
|
|
107
|
+
export interface RunVoiceScenarioHeadlessArgs {
|
|
108
|
+
scenario: VoiceScenario;
|
|
109
|
+
/** The generated/loaded corpus; null when its artifacts are absent. */
|
|
110
|
+
corpus: GeneratedVoiceCorpus | null;
|
|
111
|
+
/** The voice services; null when no backend is provisioned. */
|
|
112
|
+
services: VoiceWorkbenchServices | null;
|
|
113
|
+
/** When set, write the run's audio as `.wav` artifacts and record their paths. */
|
|
114
|
+
captureAudio?: VoiceAudioCaptureSink;
|
|
115
|
+
}
|
|
116
|
+
|
|
117
|
+
/** Encode `pcm` to `<dir>/<fileName>` and return a relative-path artifact. */
|
|
118
|
+
function writeAudioArtifact(args: {
|
|
119
|
+
sink: VoiceAudioCaptureSink;
|
|
120
|
+
fileName: string;
|
|
121
|
+
pcm: Float32Array;
|
|
122
|
+
sampleRate: number;
|
|
123
|
+
turnIndex: number;
|
|
124
|
+
kind: VoiceAudioArtifact["kind"];
|
|
125
|
+
speakerLabel?: string;
|
|
126
|
+
}): VoiceAudioArtifact {
|
|
127
|
+
const absolutePath = path.join(args.sink.dir, args.fileName);
|
|
128
|
+
writeFileSync(absolutePath, encodeMonoPcm16Wav(args.pcm, args.sampleRate));
|
|
129
|
+
const relativePath = path
|
|
130
|
+
.relative(args.sink.relativeTo, absolutePath)
|
|
131
|
+
.split(path.sep)
|
|
132
|
+
.join("/");
|
|
133
|
+
return {
|
|
134
|
+
turnIndex: args.turnIndex,
|
|
135
|
+
kind: args.kind,
|
|
136
|
+
path: relativePath,
|
|
137
|
+
sampleRate: args.sampleRate,
|
|
138
|
+
durationMs: Math.round((args.pcm.length / args.sampleRate) * 1000),
|
|
139
|
+
...(args.speakerLabel !== undefined
|
|
140
|
+
? { speakerLabel: args.speakerLabel }
|
|
141
|
+
: {}),
|
|
142
|
+
};
|
|
143
|
+
}
|
|
144
|
+
|
|
145
|
+
function skipped(
|
|
146
|
+
scenario: VoiceScenario,
|
|
147
|
+
skipReason: string,
|
|
148
|
+
): VoiceWorkbenchScenarioRun {
|
|
149
|
+
return {
|
|
150
|
+
scenarioId: scenario.id,
|
|
151
|
+
classes: scenario.classes,
|
|
152
|
+
status: "skipped",
|
|
153
|
+
cases: [],
|
|
154
|
+
skipReason,
|
|
155
|
+
};
|
|
156
|
+
}
|
|
157
|
+
|
|
158
|
+
/**
|
|
159
|
+
* Run one scenario headless and score it. Returns a `skipped` run (never a
|
|
160
|
+
* pass) when the corpus or the backend is absent.
|
|
161
|
+
*/
|
|
162
|
+
export async function runVoiceScenarioHeadless(
|
|
163
|
+
args: RunVoiceScenarioHeadlessArgs,
|
|
164
|
+
): Promise<VoiceWorkbenchScenarioRun> {
|
|
165
|
+
const { scenario, corpus, services, captureAudio } = args;
|
|
166
|
+
if (!corpus) return skipped(scenario, "corpus artifacts absent");
|
|
167
|
+
if (!services) return skipped(scenario, "no voice backend provisioned");
|
|
168
|
+
|
|
169
|
+
const assertions = scenario.assertions ?? {};
|
|
170
|
+
const cases: VoiceE2eCaseResult[] = [];
|
|
171
|
+
await services.prepareScenario?.({ scenario, corpus });
|
|
172
|
+
|
|
173
|
+
// When a capture sink is active, write the full corpus once + each per-turn
|
|
174
|
+
// slice as `.wav` artifacts and record their (run-dir-relative) paths.
|
|
175
|
+
const audioArtifacts: VoiceAudioArtifact[] = [];
|
|
176
|
+
if (captureAudio) {
|
|
177
|
+
mkdirSync(captureAudio.dir, { recursive: true });
|
|
178
|
+
audioArtifacts.push(
|
|
179
|
+
writeAudioArtifact({
|
|
180
|
+
sink: captureAudio,
|
|
181
|
+
fileName: "corpus.wav",
|
|
182
|
+
pcm: corpus.pcm,
|
|
183
|
+
sampleRate: corpus.sampleRate,
|
|
184
|
+
turnIndex: 0,
|
|
185
|
+
kind: "generated",
|
|
186
|
+
}),
|
|
187
|
+
);
|
|
188
|
+
}
|
|
189
|
+
|
|
190
|
+
const eotSamples: Array<{
|
|
191
|
+
decided: boolean;
|
|
192
|
+
expected: boolean;
|
|
193
|
+
latencyMs?: number;
|
|
194
|
+
}> = [];
|
|
195
|
+
const diarTurns: DiarizationTurnSample[] = [];
|
|
196
|
+
const respondSamples: Array<{ responded: boolean; expectRespond: boolean }> =
|
|
197
|
+
[];
|
|
198
|
+
const voiceEntitySamples: Array<{
|
|
199
|
+
matchedEntityId: string | null;
|
|
200
|
+
expectedEntityId: string;
|
|
201
|
+
}> = [];
|
|
202
|
+
const inferredEntities: string[] = [];
|
|
203
|
+
const expectedEntities: string[] = [];
|
|
204
|
+
const echoSamples: Array<{ isAgentEcho: boolean; responded: boolean }> = [];
|
|
205
|
+
const ownerSamples: Array<{
|
|
206
|
+
predictedOwner: boolean;
|
|
207
|
+
expectedOwner: boolean;
|
|
208
|
+
}> = [];
|
|
209
|
+
const wantsOwnerScoring = scenario.classes.includes("owner-security");
|
|
210
|
+
|
|
211
|
+
for (const label of corpus.groundTruth.turns) {
|
|
212
|
+
const audio = corpus.pcm.subarray(
|
|
213
|
+
label.segmentStartSample,
|
|
214
|
+
label.segmentEndSample,
|
|
215
|
+
);
|
|
216
|
+
if (captureAudio) {
|
|
217
|
+
audioArtifacts.push(
|
|
218
|
+
writeAudioArtifact({
|
|
219
|
+
sink: captureAudio,
|
|
220
|
+
fileName: `turn-${label.index}.wav`,
|
|
221
|
+
pcm: audio,
|
|
222
|
+
sampleRate: corpus.sampleRate,
|
|
223
|
+
turnIndex: label.index,
|
|
224
|
+
kind: "consumed",
|
|
225
|
+
speakerLabel: label.speaker,
|
|
226
|
+
}),
|
|
227
|
+
);
|
|
228
|
+
}
|
|
229
|
+
const obs = await services.observeTurn({
|
|
230
|
+
turnIndex: label.index,
|
|
231
|
+
audio,
|
|
232
|
+
sampleRate: corpus.sampleRate,
|
|
233
|
+
label,
|
|
234
|
+
groundTruth: corpus.groundTruth,
|
|
235
|
+
});
|
|
236
|
+
|
|
237
|
+
// WER — one round-trip case per turn (referenceTranscript vs ASR hypothesis).
|
|
238
|
+
cases.push(
|
|
239
|
+
scoreTtsAsrRoundTrip({
|
|
240
|
+
referenceText: label.referenceTranscript,
|
|
241
|
+
hypothesisText: obs.hypothesisTranscript,
|
|
242
|
+
...(assertions.maxWer !== undefined
|
|
243
|
+
? { maxWer: assertions.maxWer }
|
|
244
|
+
: {}),
|
|
245
|
+
}),
|
|
246
|
+
);
|
|
247
|
+
|
|
248
|
+
// EOT — some corpus segments deliberately stop mid-utterance so the
|
|
249
|
+
// classifier can be scored for false triggers.
|
|
250
|
+
eotSamples.push({
|
|
251
|
+
decided: obs.eotDecided,
|
|
252
|
+
expected: label.expectEndOfTurn ?? true,
|
|
253
|
+
...(obs.eotLatencyMs !== undefined
|
|
254
|
+
? { latencyMs: obs.eotLatencyMs }
|
|
255
|
+
: {}),
|
|
256
|
+
});
|
|
257
|
+
// Diarization scores REAL speaker turns only — an agent-echo turn is the
|
|
258
|
+
// agent's own voice bleeding back, not a speaker to attribute, so it is
|
|
259
|
+
// handled by the echo-rejection scorer instead.
|
|
260
|
+
if (!label.isAgentEcho) {
|
|
261
|
+
diarTurns.push({
|
|
262
|
+
predictedLabel: obs.predictedSpeakerLabel,
|
|
263
|
+
expectedLabel: label.speaker,
|
|
264
|
+
startMs: (label.speechStartSample / corpus.sampleRate) * 1000,
|
|
265
|
+
endMs: (label.speechEndSample / corpus.sampleRate) * 1000,
|
|
266
|
+
});
|
|
267
|
+
}
|
|
268
|
+
respondSamples.push({
|
|
269
|
+
responded: obs.responded,
|
|
270
|
+
expectRespond: label.expectRespond,
|
|
271
|
+
});
|
|
272
|
+
if (label.entityId) {
|
|
273
|
+
voiceEntitySamples.push({
|
|
274
|
+
matchedEntityId: obs.matchedEntityId,
|
|
275
|
+
expectedEntityId: label.entityId,
|
|
276
|
+
});
|
|
277
|
+
}
|
|
278
|
+
if (label.expectedEntity) expectedEntities.push(label.expectedEntity);
|
|
279
|
+
inferredEntities.push(...obs.inferredEntities);
|
|
280
|
+
|
|
281
|
+
if (label.isAgentEcho) {
|
|
282
|
+
echoSamples.push({ isAgentEcho: true, responded: obs.responded });
|
|
283
|
+
}
|
|
284
|
+
if (wantsOwnerScoring && typeof obs.predictedOwner === "boolean") {
|
|
285
|
+
ownerSamples.push({
|
|
286
|
+
predictedOwner: obs.predictedOwner,
|
|
287
|
+
expectedOwner: label.isOwner === true,
|
|
288
|
+
});
|
|
289
|
+
}
|
|
290
|
+
|
|
291
|
+
if (obs.responded && typeof obs.firstAudioMs === "number") {
|
|
292
|
+
cases.push(
|
|
293
|
+
scoreFirstResponseLatency({
|
|
294
|
+
turnStartedAtMs: 0,
|
|
295
|
+
ttsFirstAudioAtMs: obs.firstAudioMs,
|
|
296
|
+
...(assertions.maxFirstAudioMs !== undefined
|
|
297
|
+
? { maxFirstAudioMs: assertions.maxFirstAudioMs }
|
|
298
|
+
: {}),
|
|
299
|
+
}),
|
|
300
|
+
);
|
|
301
|
+
}
|
|
302
|
+
}
|
|
303
|
+
|
|
304
|
+
cases.push(
|
|
305
|
+
scoreEotDecision(eotSamples, {
|
|
306
|
+
...(assertions.maxEotFalseTriggerRate !== undefined
|
|
307
|
+
? { maxFalseTriggerRate: assertions.maxEotFalseTriggerRate }
|
|
308
|
+
: {}),
|
|
309
|
+
}),
|
|
310
|
+
);
|
|
311
|
+
if (diarTurns.length > 0) {
|
|
312
|
+
cases.push(
|
|
313
|
+
scoreDiarizationTimeline(diarTurns, {
|
|
314
|
+
...(assertions.maxDer !== undefined
|
|
315
|
+
? { maxDer: assertions.maxDer }
|
|
316
|
+
: {}),
|
|
317
|
+
}),
|
|
318
|
+
);
|
|
319
|
+
}
|
|
320
|
+
cases.push(
|
|
321
|
+
scoreRespondDecision(respondSamples, {
|
|
322
|
+
...(assertions.minRespondAccuracy !== undefined
|
|
323
|
+
? { minAccuracy: assertions.minRespondAccuracy }
|
|
324
|
+
: {}),
|
|
325
|
+
}),
|
|
326
|
+
);
|
|
327
|
+
// Entity extraction + voice→entity match only when the scenario asserts them.
|
|
328
|
+
if (expectedEntities.length > 0 || inferredEntities.length > 0) {
|
|
329
|
+
cases.push(
|
|
330
|
+
scoreEntityExtraction({
|
|
331
|
+
expected: expectedEntities,
|
|
332
|
+
inferred: inferredEntities,
|
|
333
|
+
}),
|
|
334
|
+
);
|
|
335
|
+
}
|
|
336
|
+
if (voiceEntitySamples.length > 0) {
|
|
337
|
+
cases.push(
|
|
338
|
+
scoreVoiceEntityMatch(voiceEntitySamples, {
|
|
339
|
+
...(assertions.minVoiceEntityMatchRate !== undefined
|
|
340
|
+
? { minMatchRate: assertions.minVoiceEntityMatchRate }
|
|
341
|
+
: {}),
|
|
342
|
+
}),
|
|
343
|
+
);
|
|
344
|
+
}
|
|
345
|
+
if (echoSamples.length > 0) {
|
|
346
|
+
cases.push(
|
|
347
|
+
scoreEchoRejection(echoSamples, {
|
|
348
|
+
...(assertions.minEchoRejectionRate !== undefined
|
|
349
|
+
? { minRejectionRate: assertions.minEchoRejectionRate }
|
|
350
|
+
: {}),
|
|
351
|
+
}),
|
|
352
|
+
);
|
|
353
|
+
}
|
|
354
|
+
if (ownerSamples.length > 0) {
|
|
355
|
+
cases.push(
|
|
356
|
+
scoreOwnerSecurity(ownerSamples, {
|
|
357
|
+
...(assertions.minOwnerAccuracy !== undefined
|
|
358
|
+
? { minAccuracy: assertions.minOwnerAccuracy }
|
|
359
|
+
: {}),
|
|
360
|
+
}),
|
|
361
|
+
);
|
|
362
|
+
}
|
|
363
|
+
|
|
364
|
+
return {
|
|
365
|
+
scenarioId: scenario.id,
|
|
366
|
+
classes: scenario.classes,
|
|
367
|
+
status: "ran",
|
|
368
|
+
cases,
|
|
369
|
+
...(audioArtifacts.length > 0 ? { audioArtifacts } : {}),
|
|
370
|
+
};
|
|
371
|
+
}
|
|
372
|
+
|
|
373
|
+
export interface RunVoiceWorkbenchArgs {
|
|
374
|
+
scenarios: ReadonlyArray<{
|
|
375
|
+
scenario: VoiceScenario;
|
|
376
|
+
corpus: GeneratedVoiceCorpus | null;
|
|
377
|
+
}>;
|
|
378
|
+
services: VoiceWorkbenchServices | null;
|
|
379
|
+
}
|
|
380
|
+
|
|
381
|
+
/** Run a matrix of scenarios headless, returning one run per scenario. */
|
|
382
|
+
export async function runVoiceWorkbenchHeadless(
|
|
383
|
+
args: RunVoiceWorkbenchArgs,
|
|
384
|
+
): Promise<VoiceWorkbenchScenarioRun[]> {
|
|
385
|
+
const runs: VoiceWorkbenchScenarioRun[] = [];
|
|
386
|
+
for (const entry of args.scenarios) {
|
|
387
|
+
runs.push(
|
|
388
|
+
await runVoiceScenarioHeadless({
|
|
389
|
+
scenario: entry.scenario,
|
|
390
|
+
corpus: entry.corpus,
|
|
391
|
+
services: args.services,
|
|
392
|
+
}),
|
|
393
|
+
);
|
|
394
|
+
}
|
|
395
|
+
return runs;
|
|
396
|
+
}
|
|
@@ -0,0 +1,225 @@
|
|
|
1
|
+
import { describe, expect, it } from "vitest";
|
|
2
|
+
import { generateVoiceCorpus } from "./corpus-generator";
|
|
3
|
+
import type { VoiceScenario } from "./voice-scenario";
|
|
4
|
+
import { buildVoiceWorkbenchReport } from "./voice-workbench-report";
|
|
5
|
+
import { runVoiceScenarioHeadless } from "./workbench-headless-runner";
|
|
6
|
+
import { realDecisionLogicServices } from "./workbench-logic-services";
|
|
7
|
+
import { VOICE_WORKBENCH_SCENARIOS } from "./workbench-scenarios";
|
|
8
|
+
|
|
9
|
+
describe("realDecisionLogicServices over the built-in scenario matrix", () => {
|
|
10
|
+
it("every built-in scenario PASSES against the real decision logic", async () => {
|
|
11
|
+
const services = realDecisionLogicServices();
|
|
12
|
+
const runs = [];
|
|
13
|
+
for (const scenario of VOICE_WORKBENCH_SCENARIOS) {
|
|
14
|
+
const corpus = await generateVoiceCorpus(scenario);
|
|
15
|
+
runs.push(await runVoiceScenarioHeadless({ scenario, corpus, services }));
|
|
16
|
+
}
|
|
17
|
+
const report = buildVoiceWorkbenchReport(runs);
|
|
18
|
+
const failures = report.scenarios.filter((s) => s.verdict === "fail");
|
|
19
|
+
expect(
|
|
20
|
+
failures,
|
|
21
|
+
`failing scenarios: ${JSON.stringify(failures, null, 2)}`,
|
|
22
|
+
).toEqual([]);
|
|
23
|
+
expect(report.overall).toBe("pass");
|
|
24
|
+
expect(report.scenariosRan).toBe(VOICE_WORKBENCH_SCENARIOS.length);
|
|
25
|
+
});
|
|
26
|
+
|
|
27
|
+
it("attributes the multi-speaker scenarios from AUDIO, scoring DER 0", async () => {
|
|
28
|
+
// The real diarization gate: blind acoustic clustering must partition the
|
|
29
|
+
// distinct voices correctly — proving `predictedSpeakerLabel` is derived,
|
|
30
|
+
// not copied from the ground-truth label (#9427).
|
|
31
|
+
const services = realDecisionLogicServices();
|
|
32
|
+
for (const id of ["multi-voice-greeting", "multi-speaker-name-capture"]) {
|
|
33
|
+
const scenario = VOICE_WORKBENCH_SCENARIOS.find((s) => s.id === id);
|
|
34
|
+
if (!scenario) throw new Error(`scenario ${id} missing`);
|
|
35
|
+
const corpus = await generateVoiceCorpus(scenario);
|
|
36
|
+
const run = await runVoiceScenarioHeadless({
|
|
37
|
+
scenario,
|
|
38
|
+
corpus,
|
|
39
|
+
services,
|
|
40
|
+
});
|
|
41
|
+
const diar = run.cases.find((c) => c.kind === "diarization");
|
|
42
|
+
expect(diar, `${id} has a diarization case`).toBeDefined();
|
|
43
|
+
expect(diar?.kind === "diarization" && diar.der).toBe(0);
|
|
44
|
+
expect(diar?.passed).toBe(true);
|
|
45
|
+
}
|
|
46
|
+
});
|
|
47
|
+
|
|
48
|
+
it("the DER gate FAILS on a real misattribution — not a tautology (#9427)", async () => {
|
|
49
|
+
// Two participants, SAME words so their speech regions are the same length.
|
|
50
|
+
const scenario: VoiceScenario = {
|
|
51
|
+
id: "diar-divergence-probe",
|
|
52
|
+
classes: ["diarization", "multi-speaker"],
|
|
53
|
+
participants: [
|
|
54
|
+
{ label: "alice", entityId: "entity-alice" },
|
|
55
|
+
{ label: "bob", entityId: "entity-bob" },
|
|
56
|
+
],
|
|
57
|
+
turns: [
|
|
58
|
+
{
|
|
59
|
+
speaker: "alice",
|
|
60
|
+
text: "eliza what time is it now",
|
|
61
|
+
expectRespond: true,
|
|
62
|
+
},
|
|
63
|
+
{
|
|
64
|
+
speaker: "bob",
|
|
65
|
+
text: "eliza what time is it now",
|
|
66
|
+
expectRespond: true,
|
|
67
|
+
},
|
|
68
|
+
],
|
|
69
|
+
assertions: { maxDer: 0.2 },
|
|
70
|
+
};
|
|
71
|
+
const corpus = await generateVoiceCorpus(scenario);
|
|
72
|
+
|
|
73
|
+
// Honest: the two distinct voices cluster apart → DER 0, gate passes.
|
|
74
|
+
const honest = await runVoiceScenarioHeadless({
|
|
75
|
+
scenario,
|
|
76
|
+
corpus,
|
|
77
|
+
services: realDecisionLogicServices(),
|
|
78
|
+
});
|
|
79
|
+
const honestDer = honest.cases.find((c) => c.kind === "diarization");
|
|
80
|
+
expect(honestDer?.der).toBe(0);
|
|
81
|
+
expect(honestDer?.passed).toBe(true);
|
|
82
|
+
|
|
83
|
+
// Tamper ONLY the audio: overwrite bob's speech with alice's voice. Ground
|
|
84
|
+
// truth still labels the turns alice/bob, so a tautological gate would keep
|
|
85
|
+
// passing — but the real acoustic clusterer hears one voice, merges the
|
|
86
|
+
// turns, and the DER gate trips.
|
|
87
|
+
const [aliceTurn, bobTurn] = corpus.groundTruth.turns;
|
|
88
|
+
const tamperedPcm = corpus.pcm.slice();
|
|
89
|
+
tamperedPcm.set(
|
|
90
|
+
corpus.pcm.subarray(
|
|
91
|
+
aliceTurn.speechStartSample,
|
|
92
|
+
aliceTurn.speechEndSample,
|
|
93
|
+
),
|
|
94
|
+
bobTurn.speechStartSample,
|
|
95
|
+
);
|
|
96
|
+
const tampered = await runVoiceScenarioHeadless({
|
|
97
|
+
scenario,
|
|
98
|
+
corpus: { ...corpus, pcm: tamperedPcm },
|
|
99
|
+
services: realDecisionLogicServices(),
|
|
100
|
+
});
|
|
101
|
+
const tamperedDer = tampered.cases.find((c) => c.kind === "diarization");
|
|
102
|
+
expect(tamperedDer?.der).toBeGreaterThan(0.2);
|
|
103
|
+
expect(tamperedDer?.passed).toBe(false);
|
|
104
|
+
});
|
|
105
|
+
|
|
106
|
+
it("genuinely SUPPRESSES a confident bystander (not just echoing ground truth)", async () => {
|
|
107
|
+
const scenario = VOICE_WORKBENCH_SCENARIOS.find(
|
|
108
|
+
(s) => s.id === "respond-vs-bystander",
|
|
109
|
+
);
|
|
110
|
+
if (!scenario) throw new Error("scenario missing");
|
|
111
|
+
const corpus = await generateVoiceCorpus(scenario);
|
|
112
|
+
const services = realDecisionLogicServices();
|
|
113
|
+
const responded: boolean[] = [];
|
|
114
|
+
for (const label of corpus.groundTruth.turns) {
|
|
115
|
+
const obs = await services.observeTurn({
|
|
116
|
+
turnIndex: label.index,
|
|
117
|
+
audio: corpus.pcm.subarray(
|
|
118
|
+
label.segmentStartSample,
|
|
119
|
+
label.segmentEndSample,
|
|
120
|
+
),
|
|
121
|
+
sampleRate: corpus.sampleRate,
|
|
122
|
+
label,
|
|
123
|
+
groundTruth: corpus.groundTruth,
|
|
124
|
+
});
|
|
125
|
+
responded.push(obs.responded);
|
|
126
|
+
}
|
|
127
|
+
// alice (owner) → respond, bob (bystander) → silent, alice → respond.
|
|
128
|
+
expect(responded).toEqual([true, false, true]);
|
|
129
|
+
});
|
|
130
|
+
|
|
131
|
+
it("genuinely REJECTS the agent's own echoed reply via word-overlap", async () => {
|
|
132
|
+
const scenario = VOICE_WORKBENCH_SCENARIOS.find(
|
|
133
|
+
(s) => s.id === "echo-self-trigger",
|
|
134
|
+
);
|
|
135
|
+
if (!scenario) throw new Error("scenario missing");
|
|
136
|
+
const corpus = await generateVoiceCorpus(scenario);
|
|
137
|
+
const services = realDecisionLogicServices();
|
|
138
|
+
const responded: boolean[] = [];
|
|
139
|
+
for (const label of corpus.groundTruth.turns) {
|
|
140
|
+
const obs = await services.observeTurn({
|
|
141
|
+
turnIndex: label.index,
|
|
142
|
+
audio: corpus.pcm.subarray(
|
|
143
|
+
label.segmentStartSample,
|
|
144
|
+
label.segmentEndSample,
|
|
145
|
+
),
|
|
146
|
+
sampleRate: corpus.sampleRate,
|
|
147
|
+
label,
|
|
148
|
+
groundTruth: corpus.groundTruth,
|
|
149
|
+
});
|
|
150
|
+
responded.push(obs.responded);
|
|
151
|
+
}
|
|
152
|
+
// real reply (respond) → echoed reply (suppressed) → thanks (respond).
|
|
153
|
+
expect(responded).toEqual([true, false, true]);
|
|
154
|
+
});
|
|
155
|
+
|
|
156
|
+
it("genuinely HOLDS on a mid-utterance pause (EOT gate), then commits", async () => {
|
|
157
|
+
const scenario = VOICE_WORKBENCH_SCENARIOS.find(
|
|
158
|
+
(s) => s.id === "pauses-midutterance",
|
|
159
|
+
);
|
|
160
|
+
if (!scenario) throw new Error("scenario missing");
|
|
161
|
+
const corpus = await generateVoiceCorpus(scenario);
|
|
162
|
+
const services = realDecisionLogicServices();
|
|
163
|
+
const decided: boolean[] = [];
|
|
164
|
+
const responded: boolean[] = [];
|
|
165
|
+
for (const label of corpus.groundTruth.turns) {
|
|
166
|
+
const obs = await services.observeTurn({
|
|
167
|
+
turnIndex: label.index,
|
|
168
|
+
audio: corpus.pcm.subarray(
|
|
169
|
+
label.segmentStartSample,
|
|
170
|
+
label.segmentEndSample,
|
|
171
|
+
),
|
|
172
|
+
sampleRate: corpus.sampleRate,
|
|
173
|
+
label,
|
|
174
|
+
groundTruth: corpus.groundTruth,
|
|
175
|
+
});
|
|
176
|
+
decided.push(obs.eotDecided);
|
|
177
|
+
responded.push(obs.responded);
|
|
178
|
+
}
|
|
179
|
+
// "...schedule a meeting with" trails off → not end-of-turn, no response;
|
|
180
|
+
// "Bob tomorrow at noon" completes → end-of-turn, respond.
|
|
181
|
+
expect(decided).toEqual([false, true]);
|
|
182
|
+
expect(responded).toEqual([false, true]);
|
|
183
|
+
});
|
|
184
|
+
|
|
185
|
+
it("resets reply state between scenarios (no cross-scenario echo leak)", async () => {
|
|
186
|
+
const services = realDecisionLogicServices();
|
|
187
|
+
const echo = VOICE_WORKBENCH_SCENARIOS.find(
|
|
188
|
+
(s) => s.id === "echo-self-trigger",
|
|
189
|
+
);
|
|
190
|
+
const greeting = VOICE_WORKBENCH_SCENARIOS.find(
|
|
191
|
+
(s) => s.id === "multi-voice-greeting",
|
|
192
|
+
);
|
|
193
|
+
if (!echo || !greeting) throw new Error("scenarios missing");
|
|
194
|
+
// Run echo scenario first (populates lastAgentReply), then greeting.
|
|
195
|
+
for (const scenario of [echo, greeting]) {
|
|
196
|
+
const corpus = await generateVoiceCorpus(scenario);
|
|
197
|
+
for (const label of corpus.groundTruth.turns) {
|
|
198
|
+
await services.observeTurn({
|
|
199
|
+
turnIndex: label.index,
|
|
200
|
+
audio: corpus.pcm.subarray(
|
|
201
|
+
label.segmentStartSample,
|
|
202
|
+
label.segmentEndSample,
|
|
203
|
+
),
|
|
204
|
+
sampleRate: corpus.sampleRate,
|
|
205
|
+
label,
|
|
206
|
+
groundTruth: corpus.groundTruth,
|
|
207
|
+
});
|
|
208
|
+
}
|
|
209
|
+
}
|
|
210
|
+
// Greeting's first turn must still be answered (no stale reply suppressing it).
|
|
211
|
+
const corpus = await generateVoiceCorpus(greeting);
|
|
212
|
+
const first = corpus.groundTruth.turns[0];
|
|
213
|
+
const obs = await services.observeTurn({
|
|
214
|
+
turnIndex: 0,
|
|
215
|
+
audio: corpus.pcm.subarray(
|
|
216
|
+
first.segmentStartSample,
|
|
217
|
+
first.segmentEndSample,
|
|
218
|
+
),
|
|
219
|
+
sampleRate: corpus.sampleRate,
|
|
220
|
+
label: first,
|
|
221
|
+
groundTruth: corpus.groundTruth,
|
|
222
|
+
});
|
|
223
|
+
expect(obs.responded).toBe(true);
|
|
224
|
+
});
|
|
225
|
+
});
|