@elizaos/plugin-local-inference 2.0.0-beta.1 → 2.0.11-beta.7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +21 -0
- package/README.md +83 -0
- package/package.json +81 -15
- package/src/actions/generate-media.d.ts +59 -0
- package/src/actions/generate-media.d.ts.map +1 -0
- package/src/actions/generate-media.ts +647 -0
- package/src/actions/identify-speaker.d.ts +23 -0
- package/src/actions/identify-speaker.d.ts.map +1 -0
- package/src/actions/identify-speaker.ts +171 -0
- package/src/adapters/capacitor-llama/__tests__/compat-behavior.test.ts +218 -0
- package/src/adapters/capacitor-llama/__tests__/index.test.ts +68 -0
- package/src/adapters/capacitor-llama/__tests__/structured-output.test.ts +215 -0
- package/src/adapters/capacitor-llama/__tests__/text-streaming.test.ts +174 -0
- package/src/adapters/capacitor-llama/environment.ts +71 -0
- package/src/adapters/capacitor-llama/index.browser.ts +83 -0
- package/src/adapters/capacitor-llama/index.ts +807 -0
- package/src/adapters/capacitor-llama/loader.ts +109 -0
- package/src/adapters/capacitor-llama/structured-output.ts +165 -0
- package/src/adapters/capacitor-llama/text-streaming.ts +227 -0
- package/src/adapters/capacitor-llama/types.ts +374 -0
- package/src/backends/apple-foundation.ts +127 -0
- package/src/index.d.ts +7 -0
- package/src/index.d.ts.map +1 -0
- package/src/index.ts +54 -0
- package/src/local-inference-routes.d.ts +38 -0
- package/src/local-inference-routes.d.ts.map +1 -0
- package/src/local-inference-routes.test.ts +344 -0
- package/src/local-inference-routes.ts +1543 -0
- package/src/provider.d.ts +21 -0
- package/src/provider.d.ts.map +1 -0
- package/src/provider.ts +1171 -0
- package/src/routes/compat-helpers.d.ts +18 -0
- package/src/routes/compat-helpers.d.ts.map +1 -0
- package/src/routes/compat-helpers.ts +274 -0
- package/src/routes/family-member-route.d.ts +62 -0
- package/src/routes/family-member-route.d.ts.map +1 -0
- package/src/routes/family-member-route.ts +353 -0
- package/src/routes/index.d.ts +19 -0
- package/src/routes/index.d.ts.map +1 -0
- package/src/routes/index.ts +60 -0
- package/src/routes/live-diarization-route.d.ts +26 -0
- package/src/routes/live-diarization-route.d.ts.map +1 -0
- package/src/routes/live-diarization-route.test.ts +213 -0
- package/src/routes/live-diarization-route.ts +122 -0
- package/src/routes/local-inference-asr-route.d.ts +4 -0
- package/src/routes/local-inference-asr-route.d.ts.map +1 -0
- package/src/routes/local-inference-asr-route.test.ts +190 -0
- package/src/routes/local-inference-asr-route.ts +213 -0
- package/src/routes/local-inference-compat-routes.d.ts +16 -0
- package/src/routes/local-inference-compat-routes.d.ts.map +1 -0
- package/src/routes/local-inference-compat-routes.test.ts +423 -0
- package/src/routes/local-inference-compat-routes.ts +782 -0
- package/src/routes/local-inference-tts-route.d.ts +7 -0
- package/src/routes/local-inference-tts-route.d.ts.map +1 -0
- package/src/routes/local-inference-tts-route.test.ts +179 -0
- package/src/routes/local-inference-tts-route.ts +230 -0
- package/src/routes/voice-first-run-routes.d.ts +62 -0
- package/src/routes/voice-first-run-routes.d.ts.map +1 -0
- package/src/routes/voice-first-run-routes.ts +524 -0
- package/src/routes/voice-models-routes.d.ts +62 -0
- package/src/routes/voice-models-routes.d.ts.map +1 -0
- package/src/routes/voice-models-routes.ts +554 -0
- package/src/routes/voice-profile-plugin-routes.d.ts +19 -0
- package/src/routes/voice-profile-plugin-routes.d.ts.map +1 -0
- package/src/routes/voice-profile-plugin-routes.ts +138 -0
- package/src/routes/voice-profiles-management-routes.d.ts +52 -0
- package/src/routes/voice-profiles-management-routes.d.ts.map +1 -0
- package/src/routes/voice-profiles-management-routes.ts +476 -0
- package/src/routes/voice-speaker-profile-routes.d.ts +57 -0
- package/src/routes/voice-speaker-profile-routes.d.ts.map +1 -0
- package/src/routes/voice-speaker-profile-routes.ts +199 -0
- package/src/runtime/aosp-llama-loader-selection.test.ts +80 -0
- package/src/runtime/capacitor-llama.d.ts +25 -0
- package/src/runtime/embedding-manager-support.d.ts +77 -0
- package/src/runtime/embedding-manager-support.d.ts.map +1 -0
- package/src/runtime/embedding-manager-support.ts +497 -0
- package/src/runtime/embedding-presets.d.ts +16 -0
- package/src/runtime/embedding-presets.d.ts.map +1 -0
- package/src/runtime/embedding-presets.ts +81 -0
- package/src/runtime/embedding-warmup-policy.d.ts +14 -0
- package/src/runtime/embedding-warmup-policy.d.ts.map +1 -0
- package/src/runtime/embedding-warmup-policy.test.ts +53 -0
- package/src/runtime/embedding-warmup-policy.ts +48 -0
- package/src/runtime/ensure-local-inference-handler.d.ts +53 -0
- package/src/runtime/ensure-local-inference-handler.d.ts.map +1 -0
- package/src/runtime/ensure-local-inference-handler.test.ts +528 -0
- package/src/runtime/ensure-local-inference-handler.ts +1398 -0
- package/src/runtime/index.d.ts +14 -0
- package/src/runtime/index.d.ts.map +1 -0
- package/src/runtime/index.ts +27 -0
- package/src/runtime/mobile-local-inference-gate.d.ts +31 -0
- package/src/runtime/mobile-local-inference-gate.d.ts.map +1 -0
- package/src/runtime/mobile-local-inference-gate.test.ts +69 -0
- package/src/runtime/mobile-local-inference-gate.ts +44 -0
- package/src/runtime/voice-entity-binding.d.ts +103 -0
- package/src/runtime/voice-entity-binding.d.ts.map +1 -0
- package/src/runtime/voice-entity-binding.transcript.test.ts +69 -0
- package/src/runtime/voice-entity-binding.ts +328 -0
- package/src/services/README.md +71 -0
- package/src/services/__tests__/backend-selector.test.ts +101 -0
- package/src/services/__tests__/checkpoint-manager.test.ts +376 -0
- package/src/services/__tests__/gpu-autotune.test.ts +400 -0
- package/src/services/__tests__/llm-streaming-binding.test.ts +85 -0
- package/src/services/__tests__/planner-grammar.test.ts +372 -0
- package/src/services/__tests__/runtime-target.test.ts +176 -0
- package/src/services/active-model-switch-rollback.test.ts +183 -0
- package/src/services/active-model.d.ts +282 -0
- package/src/services/active-model.d.ts.map +1 -0
- package/src/services/active-model.ts +1213 -0
- package/src/services/asr/errors.d.ts +21 -0
- package/src/services/asr/errors.d.ts.map +1 -0
- package/src/services/asr/errors.ts +50 -0
- package/src/services/asr/hash.d.ts +28 -0
- package/src/services/asr/hash.d.ts.map +1 -0
- package/src/services/asr/hash.ts +49 -0
- package/src/services/asr/index.d.ts +76 -0
- package/src/services/asr/index.d.ts.map +1 -0
- package/src/services/asr/index.ts +178 -0
- package/src/services/asr/types.d.ts +91 -0
- package/src/services/asr/types.d.ts.map +1 -0
- package/src/services/asr/types.ts +95 -0
- package/src/services/assignments.d.ts +71 -0
- package/src/services/assignments.d.ts.map +1 -0
- package/src/services/assignments.test.ts +80 -0
- package/src/services/assignments.ts +230 -0
- package/src/services/backend-selector.ts +95 -0
- package/src/services/backend.d.ts +346 -0
- package/src/services/backend.d.ts.map +1 -0
- package/src/services/backend.ts +612 -0
- package/src/services/bundled-models.d.ts +34 -0
- package/src/services/bundled-models.d.ts.map +1 -0
- package/src/services/bundled-models.ts +129 -0
- package/src/services/cache-bridge.d.ts +206 -0
- package/src/services/cache-bridge.d.ts.map +1 -0
- package/src/services/cache-bridge.test.ts +516 -0
- package/src/services/cache-bridge.ts +423 -0
- package/src/services/catalog.d.ts +10 -0
- package/src/services/catalog.d.ts.map +1 -0
- package/src/services/catalog.test.ts +240 -0
- package/src/services/catalog.ts +27 -0
- package/src/services/checkpoint-client.d.ts +109 -0
- package/src/services/checkpoint-client.d.ts.map +1 -0
- package/src/services/checkpoint-client.ts +258 -0
- package/src/services/checkpoint-manager.ts +474 -0
- package/src/services/cloud-fallback.d.ts +102 -0
- package/src/services/cloud-fallback.d.ts.map +1 -0
- package/src/services/cloud-fallback.ts +230 -0
- package/src/services/conversation-registry.d.ts +142 -0
- package/src/services/conversation-registry.d.ts.map +1 -0
- package/src/services/conversation-registry.test.ts +235 -0
- package/src/services/conversation-registry.ts +264 -0
- package/src/services/desktop-fused-ffi-backend-runtime.d.ts +92 -0
- package/src/services/desktop-fused-ffi-backend-runtime.d.ts.map +1 -0
- package/src/services/desktop-fused-ffi-backend-runtime.ts +333 -0
- package/src/services/device-bridge.d.ts +188 -0
- package/src/services/device-bridge.d.ts.map +1 -0
- package/src/services/device-bridge.ts +1237 -0
- package/src/services/device-resource-metrics.d.ts +149 -0
- package/src/services/device-resource-metrics.d.ts.map +1 -0
- package/src/services/device-resource-metrics.test.ts +98 -0
- package/src/services/device-resource-metrics.ts +346 -0
- package/src/services/device-tier.d.ts +115 -0
- package/src/services/device-tier.d.ts.map +1 -0
- package/src/services/device-tier.test.ts +371 -0
- package/src/services/device-tier.ts +410 -0
- package/src/services/downloader.d.ts +82 -0
- package/src/services/downloader.d.ts.map +1 -0
- package/src/services/downloader.test.ts +724 -0
- package/src/services/downloader.ts +899 -0
- package/src/services/engine-direct-bundle.test.ts +58 -0
- package/src/services/engine-streaming.test.ts +80 -0
- package/src/services/engine.d.ts +534 -0
- package/src/services/engine.d.ts.map +1 -0
- package/src/services/engine.ts +1891 -0
- package/src/services/ensure-local-artifacts.integration.test.ts +273 -0
- package/src/services/ensure-local-artifacts.test.ts +368 -0
- package/src/services/ensure-local-artifacts.ts +351 -0
- package/src/services/external-scanner.d.ts +17 -0
- package/src/services/external-scanner.d.ts.map +1 -0
- package/src/services/external-scanner.ts +312 -0
- package/src/services/ffi-llm-mock.ts +354 -0
- package/src/services/ffi-llm-streaming-abi.ts +442 -0
- package/src/services/ffi-streaming-backend.d.ts +180 -0
- package/src/services/ffi-streaming-backend.d.ts.map +1 -0
- package/src/services/ffi-streaming-backend.ts +382 -0
- package/src/services/ffi-streaming-runner.d.ts +122 -0
- package/src/services/ffi-streaming-runner.d.ts.map +1 -0
- package/src/services/ffi-streaming-runner.test.ts +60 -0
- package/src/services/ffi-streaming-runner.ts +354 -0
- package/src/services/ffi-unload-ordering.test.ts +162 -0
- package/src/services/gpu-autotune.ts +534 -0
- package/src/services/gpu-detect.ts +139 -0
- package/src/services/handler-registry.d.ts +72 -0
- package/src/services/handler-registry.d.ts.map +1 -0
- package/src/services/handler-registry.ts +240 -0
- package/src/services/hardware.d.ts +63 -0
- package/src/services/hardware.d.ts.map +1 -0
- package/src/services/hardware.test.ts +183 -0
- package/src/services/hardware.ts +404 -0
- package/src/services/hf-search.d.ts +26 -0
- package/src/services/hf-search.d.ts.map +1 -0
- package/src/services/hf-search.test.ts +69 -0
- package/src/services/hf-search.ts +420 -0
- package/src/services/image-description-runtime.d.ts +14 -0
- package/src/services/image-description-runtime.d.ts.map +1 -0
- package/src/services/image-description-runtime.test.ts +61 -0
- package/src/services/image-description-runtime.ts +118 -0
- package/src/services/imagegen/aosp-unavailable.d.ts +134 -0
- package/src/services/imagegen/aosp-unavailable.d.ts.map +1 -0
- package/src/services/imagegen/aosp-unavailable.ts +229 -0
- package/src/services/imagegen/backend-selector.d.ts +118 -0
- package/src/services/imagegen/backend-selector.d.ts.map +1 -0
- package/src/services/imagegen/backend-selector.ts +281 -0
- package/src/services/imagegen/coreml-unavailable.d.ts +105 -0
- package/src/services/imagegen/coreml-unavailable.d.ts.map +1 -0
- package/src/services/imagegen/coreml-unavailable.ts +237 -0
- package/src/services/imagegen/errors.d.ts +16 -0
- package/src/services/imagegen/errors.d.ts.map +1 -0
- package/src/services/imagegen/errors.ts +40 -0
- package/src/services/imagegen/index.d.ts +58 -0
- package/src/services/imagegen/index.d.ts.map +1 -0
- package/src/services/imagegen/index.ts +144 -0
- package/src/services/imagegen/mflux.d.ts +74 -0
- package/src/services/imagegen/mflux.d.ts.map +1 -0
- package/src/services/imagegen/mflux.ts +313 -0
- package/src/services/imagegen/sd-cpp.d.ts +180 -0
- package/src/services/imagegen/sd-cpp.d.ts.map +1 -0
- package/src/services/imagegen/sd-cpp.ts +718 -0
- package/src/services/imagegen/tensorrt-unavailable.d.ts +83 -0
- package/src/services/imagegen/tensorrt-unavailable.d.ts.map +1 -0
- package/src/services/imagegen/tensorrt-unavailable.ts +295 -0
- package/src/services/imagegen/types.d.ts +181 -0
- package/src/services/imagegen/types.d.ts.map +1 -0
- package/src/services/imagegen/types.ts +193 -0
- package/src/services/index.d.ts +30 -0
- package/src/services/index.d.ts.map +1 -0
- package/src/services/index.ts +225 -0
- package/src/services/inference-capabilities.d.ts +132 -0
- package/src/services/inference-capabilities.d.ts.map +1 -0
- package/src/services/inference-capabilities.test.ts +75 -0
- package/src/services/inference-capabilities.ts +204 -0
- package/src/services/inference-telemetry.d.ts +59 -0
- package/src/services/inference-telemetry.d.ts.map +1 -0
- package/src/services/inference-telemetry.ts +143 -0
- package/src/services/ios-llama-streaming.ts +248 -0
- package/src/services/kv-spill.d.ts +189 -0
- package/src/services/kv-spill.d.ts.map +1 -0
- package/src/services/kv-spill.test.ts +222 -0
- package/src/services/kv-spill.ts +356 -0
- package/src/services/latency-trace.d.ts +346 -0
- package/src/services/latency-trace.d.ts.map +1 -0
- package/src/services/latency-trace.test.ts +266 -0
- package/src/services/latency-trace.ts +844 -0
- package/src/services/llama-server-metrics.ts +304 -0
- package/src/services/llm-streaming-binding.d.ts +96 -0
- package/src/services/llm-streaming-binding.d.ts.map +1 -0
- package/src/services/llm-streaming-binding.ts +136 -0
- package/src/services/load-args.d.ts +82 -0
- package/src/services/load-args.d.ts.map +1 -0
- package/src/services/load-args.ts +81 -0
- package/src/services/manifest/eliza-1.manifest.v1.json +708 -0
- package/src/services/manifest/index.d.ts +4 -0
- package/src/services/manifest/index.d.ts.map +1 -0
- package/src/services/manifest/index.ts +66 -0
- package/src/services/manifest/manifest.test.ts +693 -0
- package/src/services/manifest/schema.d.ts +715 -0
- package/src/services/manifest/schema.d.ts.map +1 -0
- package/src/services/manifest/schema.ts +655 -0
- package/src/services/manifest/types.d.ts +30 -0
- package/src/services/manifest/types.d.ts.map +1 -0
- package/src/services/manifest/types.ts +55 -0
- package/src/services/manifest/validator.d.ts +66 -0
- package/src/services/manifest/validator.d.ts.map +1 -0
- package/src/services/manifest/validator.ts +569 -0
- package/src/services/memory-arbiter.d.ts +343 -0
- package/src/services/memory-arbiter.d.ts.map +1 -0
- package/src/services/memory-arbiter.test.ts +419 -0
- package/src/services/memory-arbiter.ts +1000 -0
- package/src/services/memory-monitor.d.ts +119 -0
- package/src/services/memory-monitor.d.ts.map +1 -0
- package/src/services/memory-monitor.test.ts +208 -0
- package/src/services/memory-monitor.ts +296 -0
- package/src/services/memory-pressure.d.ts +127 -0
- package/src/services/memory-pressure.d.ts.map +1 -0
- package/src/services/memory-pressure.ts +413 -0
- package/src/services/mtp-doctor.d.ts +13 -0
- package/src/services/mtp-doctor.d.ts.map +1 -0
- package/src/services/mtp-doctor.ts +78 -0
- package/src/services/network-policy.d.ts +127 -0
- package/src/services/network-policy.d.ts.map +1 -0
- package/src/services/network-policy.ts +346 -0
- package/src/services/paths.d.ts +6 -0
- package/src/services/paths.d.ts.map +1 -0
- package/src/services/paths.ts +25 -0
- package/src/services/planner-skeleton.d.ts +124 -0
- package/src/services/planner-skeleton.d.ts.map +1 -0
- package/src/services/planner-skeleton.ts +175 -0
- package/src/services/providers.d.ts +38 -0
- package/src/services/providers.d.ts.map +1 -0
- package/src/services/providers.ts +507 -0
- package/src/services/ram-budget-cache.test.ts +163 -0
- package/src/services/ram-budget.d.ts +110 -0
- package/src/services/ram-budget.d.ts.map +1 -0
- package/src/services/ram-budget.ts +0 -0
- package/src/services/readiness.d.ts +9 -0
- package/src/services/readiness.d.ts.map +1 -0
- package/src/services/readiness.test.ts +87 -0
- package/src/services/readiness.ts +238 -0
- package/src/services/recommendation.d.ts +111 -0
- package/src/services/recommendation.d.ts.map +1 -0
- package/src/services/recommendation.ts +672 -0
- package/src/services/registry.d.ts +35 -0
- package/src/services/registry.d.ts.map +1 -0
- package/src/services/registry.ts +151 -0
- package/src/services/router-handler.d.ts +92 -0
- package/src/services/router-handler.d.ts.map +1 -0
- package/src/services/router-handler.test.ts +45 -0
- package/src/services/router-handler.ts +376 -0
- package/src/services/routing-policy.d.ts +55 -0
- package/src/services/routing-policy.d.ts.map +1 -0
- package/src/services/routing-policy.ts +228 -0
- package/src/services/routing-preferences.d.ts +8 -0
- package/src/services/routing-preferences.d.ts.map +1 -0
- package/src/services/routing-preferences.ts +15 -0
- package/src/services/runtime-target.d.ts +98 -0
- package/src/services/runtime-target.d.ts.map +1 -0
- package/src/services/runtime-target.ts +154 -0
- package/src/services/service.d.ts +128 -0
- package/src/services/service.d.ts.map +1 -0
- package/src/services/service.test.ts +223 -0
- package/src/services/service.ts +735 -0
- package/src/services/session-pool.d.ts +72 -0
- package/src/services/session-pool.d.ts.map +1 -0
- package/src/services/session-pool.ts +153 -0
- package/src/services/structured-output/deterministic-repair.d.ts +23 -0
- package/src/services/structured-output/deterministic-repair.d.ts.map +1 -0
- package/src/services/structured-output/deterministic-repair.test.ts +169 -0
- package/src/services/structured-output/deterministic-repair.ts +443 -0
- package/src/services/structured-output/index.ts +4 -0
- package/src/services/structured-output.d.ts +311 -0
- package/src/services/structured-output.d.ts.map +1 -0
- package/src/services/structured-output.test.ts +483 -0
- package/src/services/structured-output.ts +712 -0
- package/src/services/transcription-priority.test.ts +211 -0
- package/src/services/tts/errors.ts +46 -0
- package/src/services/tts/index.ts +214 -0
- package/src/services/tts/tts-audio-cache.ts +235 -0
- package/src/services/tts/types.ts +157 -0
- package/src/services/types.d.ts +19 -0
- package/src/services/types.d.ts.map +1 -0
- package/src/services/types.ts +55 -0
- package/src/services/verify-on-device.d.ts +34 -0
- package/src/services/verify-on-device.d.ts.map +1 -0
- package/src/services/verify-on-device.test.ts +87 -0
- package/src/services/verify-on-device.ts +127 -0
- package/src/services/verify.d.ts +8 -0
- package/src/services/verify.d.ts.map +1 -0
- package/src/services/verify.ts +13 -0
- package/src/services/vision/aosp-unavailable.d.ts +115 -0
- package/src/services/vision/aosp-unavailable.d.ts.map +1 -0
- package/src/services/vision/aosp-unavailable.ts +163 -0
- package/src/services/vision/capacitor-llama.d.ts +99 -0
- package/src/services/vision/capacitor-llama.d.ts.map +1 -0
- package/src/services/vision/capacitor-llama.ts +255 -0
- package/src/services/vision/cloud-fallback.d.ts +47 -0
- package/src/services/vision/cloud-fallback.d.ts.map +1 -0
- package/src/services/vision/cloud-fallback.test.ts +243 -0
- package/src/services/vision/cloud-fallback.ts +268 -0
- package/src/services/vision/fallback-chain.test.ts +86 -0
- package/src/services/vision/hash.d.ts +71 -0
- package/src/services/vision/hash.d.ts.map +1 -0
- package/src/services/vision/hash.ts +157 -0
- package/src/services/vision/index.d.ts +95 -0
- package/src/services/vision/index.d.ts.map +1 -0
- package/src/services/vision/index.ts +251 -0
- package/src/services/vision/llama-server.d.ts +73 -0
- package/src/services/vision/llama-server.d.ts.map +1 -0
- package/src/services/vision/llama-server.ts +177 -0
- package/src/services/vision/types.d.ts +153 -0
- package/src/services/vision/types.d.ts.map +1 -0
- package/src/services/vision/types.ts +154 -0
- package/src/services/vision/vast-fallback.d.ts +18 -0
- package/src/services/vision/vast-fallback.d.ts.map +1 -0
- package/src/services/vision/vast-fallback.ts +127 -0
- package/src/services/vision-embedding-cache.d.ts +98 -0
- package/src/services/vision-embedding-cache.d.ts.map +1 -0
- package/src/services/vision-embedding-cache.ts +189 -0
- package/src/services/voice/VOICE_WORKBENCH.md +88 -0
- package/src/services/voice/__test-helpers__/fake-ffi.ts +92 -0
- package/src/services/voice/__test-helpers__/synthetic-speech.ts +124 -0
- package/src/services/voice/__tests__/checkpoint-manager.test.ts +241 -0
- package/src/services/voice/__tests__/checkpoint-policy.test.ts +270 -0
- package/src/services/voice/__tests__/eager-context-builder.test.ts +257 -0
- package/src/services/voice/__tests__/eliza1-eot-scorer.test.ts +288 -0
- package/src/services/voice/__tests__/eot-classifier.test.ts +431 -0
- package/src/services/voice/__tests__/optimistic-rollback.test.ts +312 -0
- package/src/services/voice/__tests__/prefill-client.test.ts +266 -0
- package/src/services/voice/__tests__/prefix-preserving-queue.test.ts +208 -0
- package/src/services/voice/__tests__/streaming-asr.test.ts +450 -0
- package/src/services/voice/__tests__/streaming-transcriber.test.ts +339 -0
- package/src/services/voice/__tests__/turn-detector-resolver.test.ts +197 -0
- package/src/services/voice/__tests__/voice-state-machine-prefill.test.ts +275 -0
- package/src/services/voice/__tests__/voice-state-machine.test.ts +354 -0
- package/src/services/voice/audio-frame-consumer.d.ts +212 -0
- package/src/services/voice/audio-frame-consumer.d.ts.map +1 -0
- package/src/services/voice/audio-frame-consumer.test.ts +343 -0
- package/src/services/voice/audio-frame-consumer.ts +491 -0
- package/src/services/voice/barge-in.d.ts +112 -0
- package/src/services/voice/barge-in.d.ts.map +1 -0
- package/src/services/voice/barge-in.test.ts +244 -0
- package/src/services/voice/barge-in.ts +336 -0
- package/src/services/voice/cancellation-coordinator.d.ts +127 -0
- package/src/services/voice/cancellation-coordinator.d.ts.map +1 -0
- package/src/services/voice/cancellation-coordinator.test.ts +196 -0
- package/src/services/voice/cancellation-coordinator.ts +269 -0
- package/src/services/voice/checkpoint-manager.d.ts +199 -0
- package/src/services/voice/checkpoint-manager.d.ts.map +1 -0
- package/src/services/voice/checkpoint-manager.ts +401 -0
- package/src/services/voice/checkpoint-policy.ts +336 -0
- package/src/services/voice/composite-eot-classifier.test.ts +59 -0
- package/src/services/voice/e2e-harness.test.ts +182 -0
- package/src/services/voice/e2e-harness.ts +743 -0
- package/src/services/voice/eager-context-builder.d.ts +170 -0
- package/src/services/voice/eager-context-builder.d.ts.map +1 -0
- package/src/services/voice/eager-context-builder.ts +262 -0
- package/src/services/voice/eliza1-eot-scorer.d.ts +124 -0
- package/src/services/voice/eliza1-eot-scorer.d.ts.map +1 -0
- package/src/services/voice/eliza1-eot-scorer.ts +242 -0
- package/src/services/voice/embedding-server.ts +200 -0
- package/src/services/voice/embedding.d.ts +133 -0
- package/src/services/voice/embedding.d.ts.map +1 -0
- package/src/services/voice/embedding.test.ts +148 -0
- package/src/services/voice/embedding.ts +244 -0
- package/src/services/voice/emotion-attribution.d.ts +68 -0
- package/src/services/voice/emotion-attribution.d.ts.map +1 -0
- package/src/services/voice/emotion-attribution.test.ts +129 -0
- package/src/services/voice/emotion-attribution.ts +361 -0
- package/src/services/voice/engine-bridge-cancellation.test.ts +422 -0
- package/src/services/voice/engine-bridge.d.ts +746 -0
- package/src/services/voice/engine-bridge.d.ts.map +1 -0
- package/src/services/voice/engine-bridge.test.ts +384 -0
- package/src/services/voice/engine-bridge.ts +2226 -0
- package/src/services/voice/eot-classifier-ggml.d.ts +179 -0
- package/src/services/voice/eot-classifier-ggml.d.ts.map +1 -0
- package/src/services/voice/eot-classifier-ggml.ts +566 -0
- package/src/services/voice/eot-classifier.d.ts +214 -0
- package/src/services/voice/eot-classifier.d.ts.map +1 -0
- package/src/services/voice/eot-classifier.ts +533 -0
- package/src/services/voice/errors.d.ts +20 -0
- package/src/services/voice/errors.d.ts.map +1 -0
- package/src/services/voice/errors.ts +32 -0
- package/src/services/voice/expressive-tags.d.ts +158 -0
- package/src/services/voice/expressive-tags.d.ts.map +1 -0
- package/src/services/voice/expressive-tags.ts +405 -0
- package/src/services/voice/ffi-bindings.d.ts +636 -0
- package/src/services/voice/ffi-bindings.d.ts.map +1 -0
- package/src/services/voice/ffi-bindings.test.ts +671 -0
- package/src/services/voice/ffi-bindings.ts +3050 -0
- package/src/services/voice/first-line-cache.d.ts +181 -0
- package/src/services/voice/first-line-cache.d.ts.map +1 -0
- package/src/services/voice/first-line-cache.ts +725 -0
- package/src/services/voice/fused-eot-scorer.d.ts +51 -0
- package/src/services/voice/fused-eot-scorer.d.ts.map +1 -0
- package/src/services/voice/fused-eot-scorer.ts +135 -0
- package/src/services/voice/index.d.ts +91 -0
- package/src/services/voice/index.d.ts.map +1 -0
- package/src/services/voice/index.ts +481 -0
- package/src/services/voice/kokoro/__tests__/kokoro-backend.test.ts +151 -0
- package/src/services/voice/kokoro/__tests__/kokoro-engine-bridge.real.test.ts +151 -0
- package/src/services/voice/kokoro/__tests__/kokoro-engine-bridge.test.ts +60 -0
- package/src/services/voice/kokoro/__tests__/kokoro-engine-discovery.test.ts +277 -0
- package/src/services/voice/kokoro/__tests__/kokoro-ffi-runtime.test.ts +235 -0
- package/src/services/voice/kokoro/__tests__/kokoro-runtime.test.ts +95 -0
- package/src/services/voice/kokoro/__tests__/phonemizer.test.ts +53 -0
- package/src/services/voice/kokoro/__tests__/runtime-selection.test.ts +231 -0
- package/src/services/voice/kokoro/__tests__/voices.test.ts +57 -0
- package/src/services/voice/kokoro/index.ts +79 -0
- package/src/services/voice/kokoro/kokoro-backend.d.ts +72 -0
- package/src/services/voice/kokoro/kokoro-backend.d.ts.map +1 -0
- package/src/services/voice/kokoro/kokoro-backend.ts +207 -0
- package/src/services/voice/kokoro/kokoro-engine-discovery.d.ts +58 -0
- package/src/services/voice/kokoro/kokoro-engine-discovery.d.ts.map +1 -0
- package/src/services/voice/kokoro/kokoro-engine-discovery.ts +177 -0
- package/src/services/voice/kokoro/kokoro-ffi-runtime.d.ts +75 -0
- package/src/services/voice/kokoro/kokoro-ffi-runtime.d.ts.map +1 -0
- package/src/services/voice/kokoro/kokoro-ffi-runtime.ts +233 -0
- package/src/services/voice/kokoro/kokoro-runtime.d.ts +100 -0
- package/src/services/voice/kokoro/kokoro-runtime.d.ts.map +1 -0
- package/src/services/voice/kokoro/kokoro-runtime.ts +170 -0
- package/src/services/voice/kokoro/phoneme-stream.ts +123 -0
- package/src/services/voice/kokoro/phonemizer.d.ts +50 -0
- package/src/services/voice/kokoro/phonemizer.d.ts.map +1 -0
- package/src/services/voice/kokoro/phonemizer.ts +344 -0
- package/src/services/voice/kokoro/pick-runtime.d.ts +61 -0
- package/src/services/voice/kokoro/pick-runtime.d.ts.map +1 -0
- package/src/services/voice/kokoro/pick-runtime.test.ts +91 -0
- package/src/services/voice/kokoro/pick-runtime.ts +130 -0
- package/src/services/voice/kokoro/runtime-selection.d.ts +92 -0
- package/src/services/voice/kokoro/runtime-selection.d.ts.map +1 -0
- package/src/services/voice/kokoro/runtime-selection.ts +237 -0
- package/src/services/voice/kokoro/types.d.ts +82 -0
- package/src/services/voice/kokoro/types.d.ts.map +1 -0
- package/src/services/voice/kokoro/types.ts +95 -0
- package/src/services/voice/kokoro/voice-presets.d.ts +23 -0
- package/src/services/voice/kokoro/voice-presets.d.ts.map +1 -0
- package/src/services/voice/kokoro/voice-presets.ts +129 -0
- package/src/services/voice/kokoro/voices.d.ts +30 -0
- package/src/services/voice/kokoro/voices.d.ts.map +1 -0
- package/src/services/voice/kokoro/voices.ts +64 -0
- package/src/services/voice/lifecycle.d.ts +135 -0
- package/src/services/voice/lifecycle.d.ts.map +1 -0
- package/src/services/voice/lifecycle.test.ts +315 -0
- package/src/services/voice/lifecycle.ts +301 -0
- package/src/services/voice/live-diarization-session.d.ts +96 -0
- package/src/services/voice/live-diarization-session.d.ts.map +1 -0
- package/src/services/voice/live-diarization-session.ts +289 -0
- package/src/services/voice/mic-source.d.ts +136 -0
- package/src/services/voice/mic-source.d.ts.map +1 -0
- package/src/services/voice/mic-source.test.ts +210 -0
- package/src/services/voice/mic-source.ts +503 -0
- package/src/services/voice/optimistic-policy.d.ts +109 -0
- package/src/services/voice/optimistic-policy.d.ts.map +1 -0
- package/src/services/voice/optimistic-policy.test.ts +101 -0
- package/src/services/voice/optimistic-policy.ts +192 -0
- package/src/services/voice/optimistic-rollback.ts +343 -0
- package/src/services/voice/partial-stabilizer.d.ts +73 -0
- package/src/services/voice/partial-stabilizer.d.ts.map +1 -0
- package/src/services/voice/partial-stabilizer.test.ts +68 -0
- package/src/services/voice/partial-stabilizer.ts +140 -0
- package/src/services/voice/phoneme-tokenizer.d.ts +49 -0
- package/src/services/voice/phoneme-tokenizer.d.ts.map +1 -0
- package/src/services/voice/phoneme-tokenizer.ts +158 -0
- package/src/services/voice/phrase-cache.d.ts +76 -0
- package/src/services/voice/phrase-cache.d.ts.map +1 -0
- package/src/services/voice/phrase-cache.test.ts +242 -0
- package/src/services/voice/phrase-cache.ts +186 -0
- package/src/services/voice/phrase-chunker.d.ts +62 -0
- package/src/services/voice/phrase-chunker.d.ts.map +1 -0
- package/src/services/voice/phrase-chunker.test.ts +239 -0
- package/src/services/voice/phrase-chunker.ts +281 -0
- package/src/services/voice/pipeline-impls.d.ts +151 -0
- package/src/services/voice/pipeline-impls.d.ts.map +1 -0
- package/src/services/voice/pipeline-impls.l6.test.ts +110 -0
- package/src/services/voice/pipeline-impls.test.ts +292 -0
- package/src/services/voice/pipeline-impls.ts +315 -0
- package/src/services/voice/pipeline.d.ts +216 -0
- package/src/services/voice/pipeline.d.ts.map +1 -0
- package/src/services/voice/pipeline.ts +505 -0
- package/src/services/voice/prefill-client.d.ts +123 -0
- package/src/services/voice/prefill-client.d.ts.map +1 -0
- package/src/services/voice/prefill-client.ts +316 -0
- package/src/services/voice/prefix-preserving-queue.d.ts +113 -0
- package/src/services/voice/prefix-preserving-queue.d.ts.map +1 -0
- package/src/services/voice/prefix-preserving-queue.ts +162 -0
- package/src/services/voice/profile-store.d.ts +248 -0
- package/src/services/voice/profile-store.d.ts.map +1 -0
- package/src/services/voice/profile-store.ts +887 -0
- package/src/services/voice/ring-buffer.d.ts +40 -0
- package/src/services/voice/ring-buffer.d.ts.map +1 -0
- package/src/services/voice/ring-buffer.ts +105 -0
- package/src/services/voice/rollback-queue.d.ts +24 -0
- package/src/services/voice/rollback-queue.d.ts.map +1 -0
- package/src/services/voice/rollback-queue.ts +74 -0
- package/src/services/voice/samantha-preset-placeholder.d.ts +67 -0
- package/src/services/voice/samantha-preset-placeholder.d.ts.map +1 -0
- package/src/services/voice/samantha-preset-placeholder.test.ts +97 -0
- package/src/services/voice/samantha-preset-placeholder.ts +148 -0
- package/src/services/voice/samantha-preset-regenerator.d.ts +87 -0
- package/src/services/voice/samantha-preset-regenerator.d.ts.map +1 -0
- package/src/services/voice/samantha-preset-regenerator.ts +393 -0
- package/src/services/voice/scheduler.d.ts +146 -0
- package/src/services/voice/scheduler.d.ts.map +1 -0
- package/src/services/voice/scheduler.t2.test.ts +141 -0
- package/src/services/voice/scheduler.ts +927 -0
- package/src/services/voice/shared-resources.d.ts +190 -0
- package/src/services/voice/shared-resources.d.ts.map +1 -0
- package/src/services/voice/shared-resources.ts +320 -0
- package/src/services/voice/speaker/attribution-pipeline.d.ts +74 -0
- package/src/services/voice/speaker/attribution-pipeline.d.ts.map +1 -0
- package/src/services/voice/speaker/attribution-pipeline.ts +386 -0
- package/src/services/voice/speaker/diarizer-fused.d.ts +59 -0
- package/src/services/voice/speaker/diarizer-fused.d.ts.map +1 -0
- package/src/services/voice/speaker/diarizer-fused.real.test.ts +100 -0
- package/src/services/voice/speaker/diarizer-fused.ts +154 -0
- package/src/services/voice/speaker/diarizer.d.ts +75 -0
- package/src/services/voice/speaker/diarizer.d.ts.map +1 -0
- package/src/services/voice/speaker/diarizer.ts +218 -0
- package/src/services/voice/speaker/encoder-fused.d.ts +60 -0
- package/src/services/voice/speaker/encoder-fused.d.ts.map +1 -0
- package/src/services/voice/speaker/encoder-fused.real.test.ts +113 -0
- package/src/services/voice/speaker/encoder-fused.ts +138 -0
- package/src/services/voice/speaker/encoder-ggml.d.ts +33 -0
- package/src/services/voice/speaker/encoder-ggml.d.ts.map +1 -0
- package/src/services/voice/speaker/encoder-ggml.ts +79 -0
- package/src/services/voice/speaker/encoder.d.ts +37 -0
- package/src/services/voice/speaker/encoder.d.ts.map +1 -0
- package/src/services/voice/speaker/encoder.ts +105 -0
- package/src/services/voice/speaker-imprint.d.ts +83 -0
- package/src/services/voice/speaker-imprint.d.ts.map +1 -0
- package/src/services/voice/speaker-imprint.test.ts +185 -0
- package/src/services/voice/speaker-imprint.ts +312 -0
- package/src/services/voice/speaker-preset-cache.d.ts +77 -0
- package/src/services/voice/speaker-preset-cache.d.ts.map +1 -0
- package/src/services/voice/speaker-preset-cache.test.ts +154 -0
- package/src/services/voice/speaker-preset-cache.ts +195 -0
- package/src/services/voice/streaming-asr/streaming-pipeline-adapter.ts +292 -0
- package/src/services/voice/system-audio-sink.d.ts +73 -0
- package/src/services/voice/system-audio-sink.d.ts.map +1 -0
- package/src/services/voice/system-audio-sink.test.ts +29 -0
- package/src/services/voice/system-audio-sink.ts +366 -0
- package/src/services/voice/transcriber.d.ts +244 -0
- package/src/services/voice/transcriber.d.ts.map +1 -0
- package/src/services/voice/transcriber.test.ts +392 -0
- package/src/services/voice/transcriber.ts +704 -0
- package/src/services/voice/turn-controller.d.ts +183 -0
- package/src/services/voice/turn-controller.d.ts.map +1 -0
- package/src/services/voice/turn-controller.test.ts +575 -0
- package/src/services/voice/turn-controller.ts +596 -0
- package/src/services/voice/types.d.ts +643 -0
- package/src/services/voice/types.d.ts.map +1 -0
- package/src/services/voice/types.ts +699 -0
- package/src/services/voice/vad.d.ts +282 -0
- package/src/services/voice/vad.d.ts.map +1 -0
- package/src/services/voice/vad.test.ts +480 -0
- package/src/services/voice/vad.ts +827 -0
- package/src/services/voice/vad.v1-v4.test.ts +222 -0
- package/src/services/voice/voice-budget.d.ts +241 -0
- package/src/services/voice/voice-budget.d.ts.map +1 -0
- package/src/services/voice/voice-budget.test.ts +420 -0
- package/src/services/voice/voice-budget.ts +656 -0
- package/src/services/voice/voice-duet.test.ts +375 -0
- package/src/services/voice/voice-emotion-classifier.d.ts +95 -0
- package/src/services/voice/voice-emotion-classifier.d.ts.map +1 -0
- package/src/services/voice/voice-emotion-classifier.test.ts +210 -0
- package/src/services/voice/voice-emotion-classifier.ts +273 -0
- package/src/services/voice/voice-preset-format.d.ts +158 -0
- package/src/services/voice/voice-preset-format.d.ts.map +1 -0
- package/src/services/voice/voice-preset-format.ts +700 -0
- package/src/services/voice/voice-preset-generator.test.ts +89 -0
- package/src/services/voice/voice-profile-artifact.d.ts +116 -0
- package/src/services/voice/voice-profile-artifact.d.ts.map +1 -0
- package/src/services/voice/voice-profile-artifact.test.ts +138 -0
- package/src/services/voice/voice-profile-artifact.ts +518 -0
- package/src/services/voice/voice-profile-routes.d.ts +83 -0
- package/src/services/voice/voice-profile-routes.d.ts.map +1 -0
- package/src/services/voice/voice-profile-routes.test.ts +429 -0
- package/src/services/voice/voice-profile-routes.ts +425 -0
- package/src/services/voice/voice-scenario.ts +154 -0
- package/src/services/voice/voice-settings.d.ts +82 -0
- package/src/services/voice/voice-settings.d.ts.map +1 -0
- package/src/services/voice/voice-settings.ts +172 -0
- package/src/services/voice/voice-state-machine.d.ts +364 -0
- package/src/services/voice/voice-state-machine.d.ts.map +1 -0
- package/src/services/voice/voice-state-machine.ts +727 -0
- package/src/services/voice/voice-workbench-report.test.ts +168 -0
- package/src/services/voice/voice-workbench-report.ts +326 -0
- package/src/services/voice/voice-workbench.test.ts +158 -0
- package/src/services/voice/voice.test.ts +1070 -0
- package/src/services/voice/wake-word-ggml.d.ts +101 -0
- package/src/services/voice/wake-word-ggml.d.ts.map +1 -0
- package/src/services/voice/wake-word-ggml.ts +320 -0
- package/src/services/voice/wake-word.d.ts +255 -0
- package/src/services/voice/wake-word.d.ts.map +1 -0
- package/src/services/voice/wake-word.test.ts +298 -0
- package/src/services/voice/wake-word.ts +554 -0
- package/src/services/voice/wrap-with-first-line-cache.d.ts +70 -0
- package/src/services/voice/wrap-with-first-line-cache.d.ts.map +1 -0
- package/src/services/voice/wrap-with-first-line-cache.ts +267 -0
- package/src/services/voice-model-updater.d.ts +240 -0
- package/src/services/voice-model-updater.d.ts.map +1 -0
- package/src/services/voice-model-updater.ts +724 -0
- package/src/services/voice-prewarm.d.ts +3 -0
- package/src/services/voice-prewarm.d.ts.map +1 -0
- package/src/services/voice-prewarm.ts +51 -0
- package/dist/index.d.ts +0 -37
- package/dist/index.js +0 -1098
|
@@ -0,0 +1,336 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Voice checkpoint policy — thin VAD-event → checkpoint-op translator that
|
|
3
|
+
* sits between the voice loop (turn-controller / pipeline / vad) and the
|
|
4
|
+
* `GatedCheckpointManager` (`../checkpoint-manager.ts`).
|
|
5
|
+
*
|
|
6
|
+
* Why a separate policy module?
|
|
7
|
+
*
|
|
8
|
+
* - The constraint envelope on this scaffold explicitly forbids editing
|
|
9
|
+
* `turn-controller.ts`, `pipeline.ts`, `pipeline-impls.ts`, `vad.ts`,
|
|
10
|
+
* `scheduler.ts`, `phrase-chunker.ts`, `barge-in.ts`, `transcriber.ts`,
|
|
11
|
+
* and anything under `voice/kokoro/` / `voice/streaming-asr/`. Those
|
|
12
|
+
* files are owned by other agents.
|
|
13
|
+
* - But the upstream merge for `--ctx-checkpoints` lands "any week now,"
|
|
14
|
+
* and the JS-side rollback policy is what the merge unlocks. So the
|
|
15
|
+
* policy lives here as a free-standing module that the turn controller
|
|
16
|
+
* can pick up in a follow-up PR by injecting it into its VAD handler
|
|
17
|
+
* and calling `onSpeechPause` / `onSpeechResume` / `onSpeechEndCommit`
|
|
18
|
+
* / `onHardStop` at the matching transitions.
|
|
19
|
+
* - The wiring required in `turn-controller.ts` is documented in the
|
|
20
|
+
* `WIRING-INSTRUCTIONS` section at the end of this header comment and in
|
|
21
|
+
* `docs/eliza-1-ctx-checkpoints-integration.md`. We intentionally do
|
|
22
|
+
* NOT apply the wiring here — that is a follow-up PR scoped to the
|
|
23
|
+
* turn-controller owner.
|
|
24
|
+
*
|
|
25
|
+
* Policy summary (one C1 per turn, named `pre-speculative-T<turnId>`):
|
|
26
|
+
*
|
|
27
|
+
* - `onSpeechPause(turnId)` — VAD reports the user stopped speaking but
|
|
28
|
+
* hangover hasn't elapsed. Save C1 and let the caller kick the
|
|
29
|
+
* speculative drafter. If the save fails the policy logs and continues
|
|
30
|
+
* (callers MUST treat speculative work as best-effort).
|
|
31
|
+
*
|
|
32
|
+
* - `onSpeechResume(turnId)` — VAD fires `speech-active` within the
|
|
33
|
+
* rollback window. If we previously kicked a speculative draft (the
|
|
34
|
+
* caller flips `speculativeFired=true` to tell us), restore C1 so the
|
|
35
|
+
* KV state is rolled back to the pre-draft point. Otherwise no-op.
|
|
36
|
+
*
|
|
37
|
+
* - `onSpeechEndCommit(turnId)` — VAD's hangover elapsed; the pause was a
|
|
38
|
+
* real turn boundary. The speculative draft is promoted. Erase C1: we
|
|
39
|
+
* no longer need a rollback target for this turn.
|
|
40
|
+
*
|
|
41
|
+
* - `onHardStop(turnId)` — caller-initiated cancellation (e.g. user
|
|
42
|
+
* pressed mute, app backgrounded). If C1 exists, prefer restoring to
|
|
43
|
+
* it so the KV cache is in a known-clean state for the next turn; if
|
|
44
|
+
* C1 isn't around, fall back to `cancel` (the gated manager will
|
|
45
|
+
* either issue `DELETE /slots/<id>` or invoke the SSE-disconnect
|
|
46
|
+
* callback depending on the gate).
|
|
47
|
+
*
|
|
48
|
+
* All four hooks are idempotent and survive a missing C1 by no-op'ing.
|
|
49
|
+
* Errors from the underlying manager are caught and reported through the
|
|
50
|
+
* `events.onError` sink — the policy NEVER throws back into the voice
|
|
51
|
+
* loop, because a failing checkpoint endpoint must not be able to break
|
|
52
|
+
* audio.
|
|
53
|
+
*
|
|
54
|
+
* The policy holds no state of its own beyond the per-turn name; the
|
|
55
|
+
* `GatedCheckpointManager` owns the registry, the REST client, and the
|
|
56
|
+
* capability cache.
|
|
57
|
+
*
|
|
58
|
+
* --- WIRING-INSTRUCTIONS (turn-controller.ts) -----------------------------
|
|
59
|
+
*
|
|
60
|
+
* The turn-controller owner adds (after the upstream merge lands):
|
|
61
|
+
*
|
|
62
|
+
* 1. Construct a `GatedCheckpointManager` once at session start and
|
|
63
|
+
* pass it into a `CheckpointPolicy` instance (one per slot).
|
|
64
|
+
* 2. In the VAD `speech-pause` handler, immediately after the pause
|
|
65
|
+
* hangover timer is armed:
|
|
66
|
+
*
|
|
67
|
+
* await policy.onSpeechPause(this.turnId, this.slotId);
|
|
68
|
+
* // ...kick speculative drafter against the partial transcript
|
|
69
|
+
*
|
|
70
|
+
* 3. In the VAD `speech-active` handler (only when arriving within the
|
|
71
|
+
* rollback window — the controller already tracks this):
|
|
72
|
+
*
|
|
73
|
+
* await policy.onSpeechResume(this.turnId, this.slotId, {
|
|
74
|
+
* speculativeFired: this.speculativeFired,
|
|
75
|
+
* });
|
|
76
|
+
* // ...abort the speculative drafter
|
|
77
|
+
*
|
|
78
|
+
* 4. In the `speech-end` → SPEAKING transition (after the verifier
|
|
79
|
+
* promotes the draft):
|
|
80
|
+
*
|
|
81
|
+
* await policy.onSpeechEndCommit(this.turnId, this.slotId);
|
|
82
|
+
*
|
|
83
|
+
* 5. In the `dispose()` path and any other hard-stop site (mute, app
|
|
84
|
+
* background, error shutdown, barge-in mid-SPEAKING):
|
|
85
|
+
*
|
|
86
|
+
* await policy.onHardStop(this.turnId, this.slotId, () => {
|
|
87
|
+
* this.speculativeAbort?.abort(); // SSE-disconnect callback
|
|
88
|
+
* });
|
|
89
|
+
*
|
|
90
|
+
* 6. Feature flag: pass `useCtxCheckpoints` through to the
|
|
91
|
+
* `GatedCheckpointManager` constructor; when off the policy still
|
|
92
|
+
* runs but every call is a logged no-op.
|
|
93
|
+
*
|
|
94
|
+
* The turn-controller must NOT call `mgr.save/restore/erase/cancel`
|
|
95
|
+
* directly — those names are reserved for the policy so the gated/no-op
|
|
96
|
+
* branching stays in one place. The `policy.events.onError` sink lets the
|
|
97
|
+
* controller forward checkpoint failures into its existing voice-loop
|
|
98
|
+
* telemetry without coupling to the REST error type.
|
|
99
|
+
*/
|
|
100
|
+
|
|
101
|
+
import { logger } from "@elizaos/core";
|
|
102
|
+
import type {
|
|
103
|
+
CheckpointHandle,
|
|
104
|
+
GatedCheckpointManager,
|
|
105
|
+
SseDisconnectFn,
|
|
106
|
+
} from "../checkpoint-manager";
|
|
107
|
+
|
|
108
|
+
/**
 * Observer hooks exposed by the checkpoint policy. Failures are handed to
 * `onError` instead of being rethrown, so the voice loop can forward them
 * to its telemetry and tests can assert on the sink directly.
 */
export interface CheckpointPolicyEvents {
  /** Receives the failing operation, the caught error, and the turn id. */
  onError?(
    op: "save" | "restore" | "erase" | "cancel",
    error: unknown,
    turnId: string,
  ): void;
  /**
   * Fired after a save succeeds. Callers may stash the handle in their
   * per-turn state if they would rather not rely on the name-based lookup
   * when the matching restore happens.
   */
  onSaved?(turnId: string, handle: CheckpointHandle): void;
  /** Fired after a restore succeeds. */
  onRestored?(turnId: string, handle: CheckpointHandle): void;
  /** Fired when the policy skips an operation (registry miss, gate off). */
  onNoop?(
    op: "save" | "restore" | "erase" | "cancel",
    turnId: string,
    reason: "gate-off" | "registry-miss" | "no-speculative",
  ): void;
}
|
|
133
|
+
|
|
134
|
+
/** Constructor options for `CheckpointPolicy`. */
export interface CheckpointPolicyOptions {
  /** The gated checkpoint manager; the caller owns it (one per session). */
  manager: GatedCheckpointManager;
  /** Optional sink for errors and observability callbacks. */
  events?: CheckpointPolicyEvents;
}
|
|
140
|
+
|
|
141
|
+
/**
 * Context passed as the third argument of `onSpeechResume`. It tells the
 * policy whether a speculative draft actually fired; when
 * `speculativeFired` is `false` the resume is a no-op, because without a
 * draft there is nothing to roll back.
 */
export interface SpeechResumeContext {
  speculativeFired: boolean;
}
|
|
148
|
+
|
|
149
|
+
/**
 * Voice checkpoint policy: maps voice-loop transitions (pause, resume,
 * end-of-speech commit, hard stop) onto save / restore / erase / cancel
 * calls on a `GatedCheckpointManager`.
 *
 * The policy is stateless with respect to checkpoints — it only holds the
 * manager and the event sink, and the `turnId` argument scopes every
 * operation. Failures raised by the manager (or by the SSE-disconnect
 * callback) are caught, reported through `events.onError`, and logged;
 * they are never rethrown to the caller.
 */
export class CheckpointPolicy {
  private readonly manager: GatedCheckpointManager;
  private readonly events: CheckpointPolicyEvents;

  /**
   * @param opts Manager to drive plus an optional event sink. When no
   *   sink is supplied an empty one is used, so every callback is skipped.
   */
  constructor(opts: CheckpointPolicyOptions) {
    this.manager = opts.manager;
    this.events = opts.events ?? {};
  }

  /**
   * VAD `speech-pause`: save the per-turn checkpoint (C1) so a rollback
   * target exists. Kicking the speculative drafter is the caller's job.
   *
   * @param turnId Turn identifier; determines the checkpoint name.
   * @param slotId Slot passed through to the manager.
   */
  async onSpeechPause(turnId: string, slotId: number): Promise<void> {
    const name = checkpointNameFor(turnId);
    if (!this.manager.isFeatureFlagOn()) {
      this.events.onNoop?.("save", turnId, "gate-off");
      logger.debug(
        `[checkpoint-policy] onSpeechPause(${turnId}) — gate off, skipping save`,
      );
      return;
    }
    try {
      const handle = await this.manager.save(slotId, name);
      if (handle === null) {
        // Gate flipped on but capability check declined — manager logs.
        this.events.onNoop?.("save", turnId, "gate-off");
        return;
      }
      this.events.onSaved?.(turnId, handle);
    } catch (error) {
      this.events.onError?.("save", error, turnId);
      logger.warn(
        { error, turnId, slotId },
        "[checkpoint-policy] save failed; speculative draft will run without rollback target",
      );
    }
  }

  /**
   * VAD `speech-active` inside the rollback window: restore C1, but only
   * when the caller reports that a speculative draft fired. Without a
   * draft there is nothing to undo, so the restore round trip is skipped.
   *
   * @param turnId Turn identifier; determines the checkpoint name.
   * @param slotId Slot passed through to the manager.
   * @param ctx Carries the `speculativeFired` flag.
   */
  async onSpeechResume(
    turnId: string,
    slotId: number,
    ctx: SpeechResumeContext,
  ): Promise<void> {
    if (!ctx.speculativeFired) {
      this.events.onNoop?.("restore", turnId, "no-speculative");
      logger.debug(
        `[checkpoint-policy] onSpeechResume(${turnId}) — no speculative draft fired; skipping restore`,
      );
      return;
    }
    const name = checkpointNameFor(turnId);
    if (!this.manager.isFeatureFlagOn()) {
      this.events.onNoop?.("restore", turnId, "gate-off");
      logger.debug(
        `[checkpoint-policy] onSpeechResume(${turnId}) — gate off, skipping restore`,
      );
      return;
    }
    try {
      const ok = await this.manager.restore(slotId, name);
      if (!ok) {
        this.events.onNoop?.("restore", turnId, "registry-miss");
        logger.warn(
          { turnId, slotId, name },
          "[checkpoint-policy] restore returned false (handle not found / expired); KV cache may be dirty until next pause",
        );
        return;
      }
      // Only notify when the manager can still hand back the handle.
      const handle = this.manager.getNamedHandle(name);
      if (handle) this.events.onRestored?.(turnId, handle);
    } catch (error) {
      this.events.onError?.("restore", error, turnId);
      logger.warn(
        { error, turnId, slotId },
        "[checkpoint-policy] restore failed; KV cache may contain speculative writes",
      );
    }
  }

  /**
   * End-of-speech commit: the pause turned out to be a real turn
   * boundary, so C1 is no longer needed and is erased.
   *
   * @param turnId Turn identifier; determines the checkpoint name.
   * @param slotId Slot passed through to the manager.
   */
  async onSpeechEndCommit(turnId: string, slotId: number): Promise<void> {
    const name = checkpointNameFor(turnId);
    if (!this.manager.isFeatureFlagOn()) {
      this.events.onNoop?.("erase", turnId, "gate-off");
      logger.debug(
        `[checkpoint-policy] onSpeechEndCommit(${turnId}) — gate off, skipping erase`,
      );
      return;
    }
    try {
      await this.manager.erase(slotId, name);
    } catch (error) {
      this.events.onError?.("erase", error, turnId);
      logger.warn(
        { error, turnId, slotId },
        "[checkpoint-policy] erase failed; registry entry remains until TTL eviction",
      );
    }
  }

  /**
   * Hard stop (caller-initiated cancellation). Prefers rolling back to C1
   * when the manager still has it; whenever the rollback did not happen
   * (no handle, `restore` resolved `false`, or `restore` threw) it falls
   * back to `manager.cancel`. With the gate off it invokes
   * `sseDisconnect` directly.
   *
   * @param turnId Turn identifier; determines the checkpoint name.
   * @param slotId Slot passed through to the manager / disconnect callback.
   * @param sseDisconnect The voice loop's abort hook, forwarded to
   *   `manager.cancel` and called directly when the gate is off.
   */
  async onHardStop(
    turnId: string,
    slotId: number,
    sseDisconnect: SseDisconnectFn,
  ): Promise<void> {
    const name = checkpointNameFor(turnId);
    if (!this.manager.isFeatureFlagOn()) {
      // Guard the caller-supplied callback: a throwing abort hook must be
      // reported through the sink, not propagated into the voice loop.
      try {
        sseDisconnect(slotId);
      } catch (error) {
        this.events.onError?.("cancel", error, turnId);
        logger.warn(
          { error, turnId, slotId },
          "[checkpoint-policy] SSE-disconnect callback threw during gate-off hard stop",
        );
      }
      this.events.onNoop?.("cancel", turnId, "gate-off");
      return;
    }
    const existing = this.manager.getNamedHandle(name);
    if (existing) {
      try {
        const ok = await this.manager.restore(slotId, name);
        if (ok) {
          this.events.onRestored?.(turnId, existing);
        } else {
          this.events.onNoop?.("restore", turnId, "registry-miss");
          logger.warn(
            { turnId, slotId, name },
            "[checkpoint-policy] hard-stop restore returned false; falling back to cancel",
          );
        }
        // Also erase: the registry slot serves no further purpose after
        // a hard stop, and leaving it pinned through TTL eviction is
        // wasteful.
        try {
          await this.manager.erase(slotId, name);
        } catch (eraseError) {
          this.events.onError?.("erase", eraseError, turnId);
        }
        // Only a successful rollback ends the hard stop here; a `false`
        // result means nothing was rolled back, so continue to cancel.
        if (ok) return;
      } catch (error) {
        this.events.onError?.("restore", error, turnId);
        logger.warn(
          { error, turnId, slotId },
          "[checkpoint-policy] hard-stop restore failed; falling back to cancel",
        );
      }
    }
    try {
      await this.manager.cancel(slotId, sseDisconnect);
    } catch (error) {
      this.events.onError?.("cancel", error, turnId);
      logger.warn(
        { error, turnId, slotId },
        "[checkpoint-policy] cancel failed; voice loop SSE-disconnect already invoked",
      );
    }
  }
}
|
|
319
|
+
|
|
320
|
+
/**
 * Builds the per-turn checkpoint name, `pre-speculative-T<turnId>`.
 *
 * This format is the one thing code outside the policy depends on:
 * looking a name up through `GatedCheckpointManager.getNamedHandle`
 * (e.g. `'pre-speculative-T123'`) yields the handle the policy used.
 * Treat the format as stable; if it ever changes, audit every consumer
 * of `getNamedHandle`.
 *
 * @param turnId Turn identifier from the voice loop.
 * @returns The checkpoint name, with every character of `turnId` outside
 *   `[A-Za-z0-9._-]` replaced by `_`.
 */
export function checkpointNameFor(turnId: string): string {
  // Defensive sanitization: the original author notes that the gated
  // manager's REST filename validation allows only `[A-Za-z0-9._-]`, so
  // anything else (colons, slashes, ...) is mapped to an underscore.
  const sanitizedTurnId = turnId.replace(/[^A-Za-z0-9._-]/g, "_");
  return `pre-speculative-T${sanitizedTurnId}`;
}
|
|
@@ -0,0 +1,59 @@
|
|
|
1
|
+
import { describe, expect, it, vi } from "vitest";
|
|
2
|
+
import { CompositeEotClassifier } from "./eot-classifier";
|
|
3
|
+
import type { FfiEotScorer } from "./fused-eot-scorer";
|
|
4
|
+
|
|
5
|
+
/**
 * Creates a stand-in fused scorer whose `score` spy always resolves to the
 * given model probability. Returns both the scorer (cast to
 * `FfiEotScorer`) and the spy so tests can assert on call counts.
 */
function mockScorer(probability: number) {
  const score = vi.fn(async () => {
    return { probability, latencyMs: 3, promptTokens: 5 };
  });
  const stub = { modelLabel: "mock-eot", score };
  return { scorer: stub as unknown as FfiEotScorer, score };
}
|
|
15
|
+
|
|
16
|
+
describe("CompositeEotClassifier", () => {
  it("trusts the heuristic and skips the model when it is confident — sentence-final punctuation", async () => {
    const { scorer, score } = mockScorer(0.0);
    const classifier = new CompositeEotClassifier({ model: scorer });
    // Terminal punctuation: the heuristic answers 0.95 with confidence 0.9,
    // which clears the cutoff, so the model must never be consulted.
    const result = await classifier.score("Hello there.");
    expect(result).toBeCloseTo(0.95, 5);
    expect(score).not.toHaveBeenCalled();
  });

  it("trusts the heuristic and skips the model when it is confident — trailing conjunction", async () => {
    const { scorer, score } = mockScorer(0.99);
    const classifier = new CompositeEotClassifier({ model: scorer });
    // A dangling "and": the heuristic answers 0.15 with confidence 0.7.
    const result = await classifier.score("I want to go and");
    expect(result).toBeCloseTo(0.15, 5);
    expect(score).not.toHaveBeenCalled();
  });

  it("defers to the model in the ambiguous middle (no syntactic signal)", async () => {
    const { scorer, score } = mockScorer(0.82);
    const classifier = new CompositeEotClassifier({ model: scorer });
    // Five words, no punctuation, ending on a pronoun: heuristic 0.5 with
    // confidence 0, so the blended value is exactly the model probability.
    const result = await classifier.score("tell me more about it");
    expect(result).toBeCloseTo(0.82, 5);
    expect(score).toHaveBeenCalledTimes(1);
  });

  it("blends model + heuristic for a mid-confidence heuristic (short utterance)", async () => {
    const { scorer, score } = mockScorer(0.2);
    const classifier = new CompositeEotClassifier({ model: scorer });
    // Two words: heuristic 0.7 with confidence 0.4 (below the cutoff), so
    // the model runs and the blend is 0.2·(1−0.4) + 0.7·0.4 = 0.40.
    const result = await classifier.score("okay sure");
    expect(result).toBeCloseTo(0.4, 5);
    expect(score).toHaveBeenCalledTimes(1);
  });

  it("signal() reports the model source only when the model contributed", async () => {
    const { scorer } = mockScorer(0.6);
    const classifier = new CompositeEotClassifier({ model: scorer });

    const confident = await classifier.signal("Done.");
    expect(confident.source).toBe("heuristic");

    const ambiguous = await classifier.signal("tell me more about it");
    expect(ambiguous.source).toBe("eliza-1-drafter");
    expect(ambiguous.model).toContain("mock-eot");
  });
});
|
|
@@ -0,0 +1,182 @@
|
|
|
1
|
+
import { describe, expect, it } from "vitest";
|
|
2
|
+
import {
|
|
3
|
+
assertRequiredVoiceArtifacts,
|
|
4
|
+
scoreBargeInInterruption,
|
|
5
|
+
scoreFirstResponseLatency,
|
|
6
|
+
scoreOptimisticRollbackRestart,
|
|
7
|
+
scorePauseContinuation,
|
|
8
|
+
scoreTtsAsrRoundTrip,
|
|
9
|
+
summarizeVoiceE2e,
|
|
10
|
+
VoiceE2eHarnessError,
|
|
11
|
+
wordErrorRate,
|
|
12
|
+
} from "./e2e-harness";
|
|
13
|
+
|
|
14
|
+
describe("voice E2E harness WER scoring", () => {
  it("normalizes punctuation and computes word error rate", () => {
    // Case and punctuation differences alone must score as zero errors.
    const punctuationOnlyDiff = wordErrorRate(
      "Hello, local voice!",
      "hello local voice",
    );
    expect(punctuationOnlyDiff).toBe(0);

    // The second string is missing one of the first string's three words.
    const oneWordMissing = wordErrorRate("alpha beta gamma", "alpha gamma");
    expect(oneWordMissing).toBeCloseTo(1 / 3, 4);
  });

  it("scores TTS -> ASR roundtrip against a WER threshold", () => {
    const passing = scoreTtsAsrRoundTrip({
      referenceText: "Eliza local voice smoke.",
      hypothesisText: "eliza local voice smoke",
      maxWer: 0,
    });
    expect(passing.passed).toBe(true);
    expect(passing.wer).toBe(0);

    // Two of four reference words are absent, exceeding the 0.25 ceiling.
    const failing = scoreTtsAsrRoundTrip({
      referenceText: "one two three four",
      hypothesisText: "one four",
      maxWer: 0.25,
    });
    expect(failing.passed).toBe(false);
    expect(failing.wer).toBe(0.5);
  });
});
|
|
41
|
+
|
|
42
|
+
describe("voice E2E harness artifact validation", () => {
  it("fails clearly when a required model artifact is missing", () => {
    // Probe that only reports the bundle root as present, so the ASR model
    // path inside it looks missing.
    const bundleOnlyProbe = {
      exists: (candidate) => candidate.endsWith(".bundle"),
      size: () => null,
      readMagic: () => null,
    };
    const validate = () =>
      assertRequiredVoiceArtifacts(
        [
          { kind: "bundle-root", path: "/models/eliza-1-0_8b.bundle" },
          {
            kind: "asr-model",
            path: "/models/eliza-1-0_8b.bundle/asr/eliza-1-asr.gguf",
            magic: "GGUF",
          },
        ],
        bundleOnlyProbe,
      );
    expect(validate).toThrow(/asr-model.*not found/);
  });

  it("rejects a tiny or non-GGUF model instead of accepting a placeholder", () => {
    try {
      // The file "exists" but is 12 bytes with the wrong magic.
      assertRequiredVoiceArtifacts(
        [
          {
            kind: "tts-model",
            path: "/tmp/placeholder.gguf",
            minBytes: 1024,
            magic: "GGUF",
          },
        ],
        {
          exists: () => true,
          size: () => 12,
          readMagic: () => "NOPE",
        },
      );
      // Reaching this line means validation wrongly accepted the artifact;
      // the catch below then fails on the instance check.
      throw new Error("expected artifact validation to fail");
    } catch (error) {
      expect(error).toBeInstanceOf(VoiceE2eHarnessError);
      expect((error as VoiceE2eHarnessError).code).toBe("missing-artifact");
      expect(String((error as Error).message)).toContain("too small");
    }
  });
});
|
|
88
|
+
|
|
89
|
+
describe("voice E2E harness barge-in scoring", () => {
  it("passes when TTS, LLM, and audio drain cancel inside the budget", () => {
    const outcome = scoreBargeInInterruption({
      voiceDetectedAtMs: 1000,
      ttsCancelledAtMs: 1060,
      llmCancelledAtMs: 1100,
      audioDrainedAtMs: 1030,
      maxCancelMs: 250,
    });
    expect(outcome.passed).toBe(true);
    // 100 ms matches the latest of the three timestamps (the LLM cancel at
    // 1100) measured from voice detection at 1000.
    expect(outcome.bargeInCancelMs).toBe(100);
  });

  it("does not pass a missing LLM cancel measurement by default", () => {
    const scoreWithoutLlmCancel = () =>
      scoreBargeInInterruption({
        voiceDetectedAtMs: 1000,
        ttsCancelledAtMs: 1030,
      });
    expect(scoreWithoutLlmCancel).toThrow(/llmCancelledAtMs/);
  });
});
|
|
111
|
+
|
|
112
|
+
describe("voice E2E harness pause and rollback scoring", () => {
  it("scores user continuation within the 4s pause window", () => {
    const outcome = scorePauseContinuation({
      speechPauseAtMs: 1000,
      speculativeStartedAtMs: 1200,
      continuationAtMs: 4700,
      speculativeAbortedAtMs: 4740,
      finalRestartedAtMs: 4900,
    });
    expect(outcome.passed).toBe(true);
    // Gap between the pause (1000) and the continuation (4700).
    expect(outcome.continuationGapMs).toBe(3700);
  });

  it("fails when the partial response committed before the user continued", () => {
    // The commit at 2500 precedes the continuation at 3000.
    const outcome = scorePauseContinuation({
      speechPauseAtMs: 1000,
      speculativeStartedAtMs: 1100,
      committedBeforeContinuationAtMs: 2500,
      continuationAtMs: 3000,
      speculativeAbortedAtMs: 3020,
      finalRestartedAtMs: 3100,
    });
    expect(outcome.passed).toBe(false);
  });

  it("scores optimistic rollback restore and restart timing", () => {
    const outcome = scoreOptimisticRollbackRestart({
      speechPauseAtMs: 1000,
      checkpointSavedAtMs: 1025,
      speculativeStartedAtMs: 1030,
      continuationAtMs: 1300,
      speculativeAbortedAtMs: 1315,
      checkpointRestoredAtMs: 1370,
      restartedAtMs: 1460,
    });
    expect(outcome.passed).toBe(true);
    // 1370 − 1300 and 1460 − 1370 respectively.
    expect(outcome.restoreAfterContinuationMs).toBe(70);
    expect(outcome.restartAfterRestoreMs).toBe(90);
  });
});
|
|
152
|
+
|
|
153
|
+
describe("voice E2E harness latency summary", () => {
  it("scores first response latency from a real timestamp set", () => {
    const outcome = scoreFirstResponseLatency({
      turnStartedAtMs: 100,
      asrFinalAtMs: 420,
      llmFirstTokenAtMs: 700,
      ttsFirstAudioAtMs: 980,
      audioFirstPlayedAtMs: 1005,
      maxFirstAudioMs: 1000,
    });
    expect(outcome.passed).toBe(true);
    // Both values are offsets from the turn start at 100.
    expect(outcome.firstAudioMs).toBe(880);
    expect(outcome.firstPlayedMs).toBe(905);
  });

  it("summarizes all case pass/fail flags", () => {
    const roundTripCase = scoreTtsAsrRoundTrip({
      referenceText: "hello",
      hypothesisText: "hello",
    });
    const latencyCase = scoreFirstResponseLatency({
      turnStartedAtMs: 0,
      ttsFirstAudioAtMs: 400,
    });

    const summary = summarizeVoiceE2e([roundTripCase, latencyCase]);
    expect(summary.passed).toBe(true);
    expect(summary.cases).toHaveLength(2);
  });
});
|