@elizaos/plugin-local-inference 2.0.0-beta.1 → 2.0.11-beta.7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +21 -0
- package/README.md +83 -0
- package/package.json +81 -15
- package/src/actions/generate-media.d.ts +59 -0
- package/src/actions/generate-media.d.ts.map +1 -0
- package/src/actions/generate-media.ts +647 -0
- package/src/actions/identify-speaker.d.ts +23 -0
- package/src/actions/identify-speaker.d.ts.map +1 -0
- package/src/actions/identify-speaker.ts +171 -0
- package/src/adapters/capacitor-llama/__tests__/compat-behavior.test.ts +218 -0
- package/src/adapters/capacitor-llama/__tests__/index.test.ts +68 -0
- package/src/adapters/capacitor-llama/__tests__/structured-output.test.ts +215 -0
- package/src/adapters/capacitor-llama/__tests__/text-streaming.test.ts +174 -0
- package/src/adapters/capacitor-llama/environment.ts +71 -0
- package/src/adapters/capacitor-llama/index.browser.ts +83 -0
- package/src/adapters/capacitor-llama/index.ts +807 -0
- package/src/adapters/capacitor-llama/loader.ts +109 -0
- package/src/adapters/capacitor-llama/structured-output.ts +165 -0
- package/src/adapters/capacitor-llama/text-streaming.ts +227 -0
- package/src/adapters/capacitor-llama/types.ts +374 -0
- package/src/backends/apple-foundation.ts +127 -0
- package/src/index.d.ts +7 -0
- package/src/index.d.ts.map +1 -0
- package/src/index.ts +54 -0
- package/src/local-inference-routes.d.ts +38 -0
- package/src/local-inference-routes.d.ts.map +1 -0
- package/src/local-inference-routes.test.ts +344 -0
- package/src/local-inference-routes.ts +1543 -0
- package/src/provider.d.ts +21 -0
- package/src/provider.d.ts.map +1 -0
- package/src/provider.ts +1171 -0
- package/src/routes/compat-helpers.d.ts +18 -0
- package/src/routes/compat-helpers.d.ts.map +1 -0
- package/src/routes/compat-helpers.ts +274 -0
- package/src/routes/family-member-route.d.ts +62 -0
- package/src/routes/family-member-route.d.ts.map +1 -0
- package/src/routes/family-member-route.ts +353 -0
- package/src/routes/index.d.ts +19 -0
- package/src/routes/index.d.ts.map +1 -0
- package/src/routes/index.ts +60 -0
- package/src/routes/live-diarization-route.d.ts +26 -0
- package/src/routes/live-diarization-route.d.ts.map +1 -0
- package/src/routes/live-diarization-route.test.ts +213 -0
- package/src/routes/live-diarization-route.ts +122 -0
- package/src/routes/local-inference-asr-route.d.ts +4 -0
- package/src/routes/local-inference-asr-route.d.ts.map +1 -0
- package/src/routes/local-inference-asr-route.test.ts +190 -0
- package/src/routes/local-inference-asr-route.ts +213 -0
- package/src/routes/local-inference-compat-routes.d.ts +16 -0
- package/src/routes/local-inference-compat-routes.d.ts.map +1 -0
- package/src/routes/local-inference-compat-routes.test.ts +423 -0
- package/src/routes/local-inference-compat-routes.ts +782 -0
- package/src/routes/local-inference-tts-route.d.ts +7 -0
- package/src/routes/local-inference-tts-route.d.ts.map +1 -0
- package/src/routes/local-inference-tts-route.test.ts +179 -0
- package/src/routes/local-inference-tts-route.ts +230 -0
- package/src/routes/voice-first-run-routes.d.ts +62 -0
- package/src/routes/voice-first-run-routes.d.ts.map +1 -0
- package/src/routes/voice-first-run-routes.ts +524 -0
- package/src/routes/voice-models-routes.d.ts +62 -0
- package/src/routes/voice-models-routes.d.ts.map +1 -0
- package/src/routes/voice-models-routes.ts +554 -0
- package/src/routes/voice-profile-plugin-routes.d.ts +19 -0
- package/src/routes/voice-profile-plugin-routes.d.ts.map +1 -0
- package/src/routes/voice-profile-plugin-routes.ts +138 -0
- package/src/routes/voice-profiles-management-routes.d.ts +52 -0
- package/src/routes/voice-profiles-management-routes.d.ts.map +1 -0
- package/src/routes/voice-profiles-management-routes.ts +476 -0
- package/src/routes/voice-speaker-profile-routes.d.ts +57 -0
- package/src/routes/voice-speaker-profile-routes.d.ts.map +1 -0
- package/src/routes/voice-speaker-profile-routes.ts +199 -0
- package/src/runtime/aosp-llama-loader-selection.test.ts +80 -0
- package/src/runtime/capacitor-llama.d.ts +25 -0
- package/src/runtime/embedding-manager-support.d.ts +77 -0
- package/src/runtime/embedding-manager-support.d.ts.map +1 -0
- package/src/runtime/embedding-manager-support.ts +497 -0
- package/src/runtime/embedding-presets.d.ts +16 -0
- package/src/runtime/embedding-presets.d.ts.map +1 -0
- package/src/runtime/embedding-presets.ts +81 -0
- package/src/runtime/embedding-warmup-policy.d.ts +14 -0
- package/src/runtime/embedding-warmup-policy.d.ts.map +1 -0
- package/src/runtime/embedding-warmup-policy.test.ts +53 -0
- package/src/runtime/embedding-warmup-policy.ts +48 -0
- package/src/runtime/ensure-local-inference-handler.d.ts +53 -0
- package/src/runtime/ensure-local-inference-handler.d.ts.map +1 -0
- package/src/runtime/ensure-local-inference-handler.test.ts +528 -0
- package/src/runtime/ensure-local-inference-handler.ts +1398 -0
- package/src/runtime/index.d.ts +14 -0
- package/src/runtime/index.d.ts.map +1 -0
- package/src/runtime/index.ts +27 -0
- package/src/runtime/mobile-local-inference-gate.d.ts +31 -0
- package/src/runtime/mobile-local-inference-gate.d.ts.map +1 -0
- package/src/runtime/mobile-local-inference-gate.test.ts +69 -0
- package/src/runtime/mobile-local-inference-gate.ts +44 -0
- package/src/runtime/voice-entity-binding.d.ts +103 -0
- package/src/runtime/voice-entity-binding.d.ts.map +1 -0
- package/src/runtime/voice-entity-binding.transcript.test.ts +69 -0
- package/src/runtime/voice-entity-binding.ts +328 -0
- package/src/services/README.md +71 -0
- package/src/services/__tests__/backend-selector.test.ts +101 -0
- package/src/services/__tests__/checkpoint-manager.test.ts +376 -0
- package/src/services/__tests__/gpu-autotune.test.ts +400 -0
- package/src/services/__tests__/llm-streaming-binding.test.ts +85 -0
- package/src/services/__tests__/planner-grammar.test.ts +372 -0
- package/src/services/__tests__/runtime-target.test.ts +176 -0
- package/src/services/active-model-switch-rollback.test.ts +183 -0
- package/src/services/active-model.d.ts +282 -0
- package/src/services/active-model.d.ts.map +1 -0
- package/src/services/active-model.ts +1213 -0
- package/src/services/asr/errors.d.ts +21 -0
- package/src/services/asr/errors.d.ts.map +1 -0
- package/src/services/asr/errors.ts +50 -0
- package/src/services/asr/hash.d.ts +28 -0
- package/src/services/asr/hash.d.ts.map +1 -0
- package/src/services/asr/hash.ts +49 -0
- package/src/services/asr/index.d.ts +76 -0
- package/src/services/asr/index.d.ts.map +1 -0
- package/src/services/asr/index.ts +178 -0
- package/src/services/asr/types.d.ts +91 -0
- package/src/services/asr/types.d.ts.map +1 -0
- package/src/services/asr/types.ts +95 -0
- package/src/services/assignments.d.ts +71 -0
- package/src/services/assignments.d.ts.map +1 -0
- package/src/services/assignments.test.ts +80 -0
- package/src/services/assignments.ts +230 -0
- package/src/services/backend-selector.ts +95 -0
- package/src/services/backend.d.ts +346 -0
- package/src/services/backend.d.ts.map +1 -0
- package/src/services/backend.ts +612 -0
- package/src/services/bundled-models.d.ts +34 -0
- package/src/services/bundled-models.d.ts.map +1 -0
- package/src/services/bundled-models.ts +129 -0
- package/src/services/cache-bridge.d.ts +206 -0
- package/src/services/cache-bridge.d.ts.map +1 -0
- package/src/services/cache-bridge.test.ts +516 -0
- package/src/services/cache-bridge.ts +423 -0
- package/src/services/catalog.d.ts +10 -0
- package/src/services/catalog.d.ts.map +1 -0
- package/src/services/catalog.test.ts +240 -0
- package/src/services/catalog.ts +27 -0
- package/src/services/checkpoint-client.d.ts +109 -0
- package/src/services/checkpoint-client.d.ts.map +1 -0
- package/src/services/checkpoint-client.ts +258 -0
- package/src/services/checkpoint-manager.ts +474 -0
- package/src/services/cloud-fallback.d.ts +102 -0
- package/src/services/cloud-fallback.d.ts.map +1 -0
- package/src/services/cloud-fallback.ts +230 -0
- package/src/services/conversation-registry.d.ts +142 -0
- package/src/services/conversation-registry.d.ts.map +1 -0
- package/src/services/conversation-registry.test.ts +235 -0
- package/src/services/conversation-registry.ts +264 -0
- package/src/services/desktop-fused-ffi-backend-runtime.d.ts +92 -0
- package/src/services/desktop-fused-ffi-backend-runtime.d.ts.map +1 -0
- package/src/services/desktop-fused-ffi-backend-runtime.ts +333 -0
- package/src/services/device-bridge.d.ts +188 -0
- package/src/services/device-bridge.d.ts.map +1 -0
- package/src/services/device-bridge.ts +1237 -0
- package/src/services/device-resource-metrics.d.ts +149 -0
- package/src/services/device-resource-metrics.d.ts.map +1 -0
- package/src/services/device-resource-metrics.test.ts +98 -0
- package/src/services/device-resource-metrics.ts +346 -0
- package/src/services/device-tier.d.ts +115 -0
- package/src/services/device-tier.d.ts.map +1 -0
- package/src/services/device-tier.test.ts +371 -0
- package/src/services/device-tier.ts +410 -0
- package/src/services/downloader.d.ts +82 -0
- package/src/services/downloader.d.ts.map +1 -0
- package/src/services/downloader.test.ts +724 -0
- package/src/services/downloader.ts +899 -0
- package/src/services/engine-direct-bundle.test.ts +58 -0
- package/src/services/engine-streaming.test.ts +80 -0
- package/src/services/engine.d.ts +534 -0
- package/src/services/engine.d.ts.map +1 -0
- package/src/services/engine.ts +1891 -0
- package/src/services/ensure-local-artifacts.integration.test.ts +273 -0
- package/src/services/ensure-local-artifacts.test.ts +368 -0
- package/src/services/ensure-local-artifacts.ts +351 -0
- package/src/services/external-scanner.d.ts +17 -0
- package/src/services/external-scanner.d.ts.map +1 -0
- package/src/services/external-scanner.ts +312 -0
- package/src/services/ffi-llm-mock.ts +354 -0
- package/src/services/ffi-llm-streaming-abi.ts +442 -0
- package/src/services/ffi-streaming-backend.d.ts +180 -0
- package/src/services/ffi-streaming-backend.d.ts.map +1 -0
- package/src/services/ffi-streaming-backend.ts +382 -0
- package/src/services/ffi-streaming-runner.d.ts +122 -0
- package/src/services/ffi-streaming-runner.d.ts.map +1 -0
- package/src/services/ffi-streaming-runner.test.ts +60 -0
- package/src/services/ffi-streaming-runner.ts +354 -0
- package/src/services/ffi-unload-ordering.test.ts +162 -0
- package/src/services/gpu-autotune.ts +534 -0
- package/src/services/gpu-detect.ts +139 -0
- package/src/services/handler-registry.d.ts +72 -0
- package/src/services/handler-registry.d.ts.map +1 -0
- package/src/services/handler-registry.ts +240 -0
- package/src/services/hardware.d.ts +63 -0
- package/src/services/hardware.d.ts.map +1 -0
- package/src/services/hardware.test.ts +183 -0
- package/src/services/hardware.ts +404 -0
- package/src/services/hf-search.d.ts +26 -0
- package/src/services/hf-search.d.ts.map +1 -0
- package/src/services/hf-search.test.ts +69 -0
- package/src/services/hf-search.ts +420 -0
- package/src/services/image-description-runtime.d.ts +14 -0
- package/src/services/image-description-runtime.d.ts.map +1 -0
- package/src/services/image-description-runtime.test.ts +61 -0
- package/src/services/image-description-runtime.ts +118 -0
- package/src/services/imagegen/aosp-unavailable.d.ts +134 -0
- package/src/services/imagegen/aosp-unavailable.d.ts.map +1 -0
- package/src/services/imagegen/aosp-unavailable.ts +229 -0
- package/src/services/imagegen/backend-selector.d.ts +118 -0
- package/src/services/imagegen/backend-selector.d.ts.map +1 -0
- package/src/services/imagegen/backend-selector.ts +281 -0
- package/src/services/imagegen/coreml-unavailable.d.ts +105 -0
- package/src/services/imagegen/coreml-unavailable.d.ts.map +1 -0
- package/src/services/imagegen/coreml-unavailable.ts +237 -0
- package/src/services/imagegen/errors.d.ts +16 -0
- package/src/services/imagegen/errors.d.ts.map +1 -0
- package/src/services/imagegen/errors.ts +40 -0
- package/src/services/imagegen/index.d.ts +58 -0
- package/src/services/imagegen/index.d.ts.map +1 -0
- package/src/services/imagegen/index.ts +144 -0
- package/src/services/imagegen/mflux.d.ts +74 -0
- package/src/services/imagegen/mflux.d.ts.map +1 -0
- package/src/services/imagegen/mflux.ts +313 -0
- package/src/services/imagegen/sd-cpp.d.ts +180 -0
- package/src/services/imagegen/sd-cpp.d.ts.map +1 -0
- package/src/services/imagegen/sd-cpp.ts +718 -0
- package/src/services/imagegen/tensorrt-unavailable.d.ts +83 -0
- package/src/services/imagegen/tensorrt-unavailable.d.ts.map +1 -0
- package/src/services/imagegen/tensorrt-unavailable.ts +295 -0
- package/src/services/imagegen/types.d.ts +181 -0
- package/src/services/imagegen/types.d.ts.map +1 -0
- package/src/services/imagegen/types.ts +193 -0
- package/src/services/index.d.ts +30 -0
- package/src/services/index.d.ts.map +1 -0
- package/src/services/index.ts +225 -0
- package/src/services/inference-capabilities.d.ts +132 -0
- package/src/services/inference-capabilities.d.ts.map +1 -0
- package/src/services/inference-capabilities.test.ts +75 -0
- package/src/services/inference-capabilities.ts +204 -0
- package/src/services/inference-telemetry.d.ts +59 -0
- package/src/services/inference-telemetry.d.ts.map +1 -0
- package/src/services/inference-telemetry.ts +143 -0
- package/src/services/ios-llama-streaming.ts +248 -0
- package/src/services/kv-spill.d.ts +189 -0
- package/src/services/kv-spill.d.ts.map +1 -0
- package/src/services/kv-spill.test.ts +222 -0
- package/src/services/kv-spill.ts +356 -0
- package/src/services/latency-trace.d.ts +346 -0
- package/src/services/latency-trace.d.ts.map +1 -0
- package/src/services/latency-trace.test.ts +266 -0
- package/src/services/latency-trace.ts +844 -0
- package/src/services/llama-server-metrics.ts +304 -0
- package/src/services/llm-streaming-binding.d.ts +96 -0
- package/src/services/llm-streaming-binding.d.ts.map +1 -0
- package/src/services/llm-streaming-binding.ts +136 -0
- package/src/services/load-args.d.ts +82 -0
- package/src/services/load-args.d.ts.map +1 -0
- package/src/services/load-args.ts +81 -0
- package/src/services/manifest/eliza-1.manifest.v1.json +708 -0
- package/src/services/manifest/index.d.ts +4 -0
- package/src/services/manifest/index.d.ts.map +1 -0
- package/src/services/manifest/index.ts +66 -0
- package/src/services/manifest/manifest.test.ts +693 -0
- package/src/services/manifest/schema.d.ts +715 -0
- package/src/services/manifest/schema.d.ts.map +1 -0
- package/src/services/manifest/schema.ts +655 -0
- package/src/services/manifest/types.d.ts +30 -0
- package/src/services/manifest/types.d.ts.map +1 -0
- package/src/services/manifest/types.ts +55 -0
- package/src/services/manifest/validator.d.ts +66 -0
- package/src/services/manifest/validator.d.ts.map +1 -0
- package/src/services/manifest/validator.ts +569 -0
- package/src/services/memory-arbiter.d.ts +343 -0
- package/src/services/memory-arbiter.d.ts.map +1 -0
- package/src/services/memory-arbiter.test.ts +419 -0
- package/src/services/memory-arbiter.ts +1000 -0
- package/src/services/memory-monitor.d.ts +119 -0
- package/src/services/memory-monitor.d.ts.map +1 -0
- package/src/services/memory-monitor.test.ts +208 -0
- package/src/services/memory-monitor.ts +296 -0
- package/src/services/memory-pressure.d.ts +127 -0
- package/src/services/memory-pressure.d.ts.map +1 -0
- package/src/services/memory-pressure.ts +413 -0
- package/src/services/mtp-doctor.d.ts +13 -0
- package/src/services/mtp-doctor.d.ts.map +1 -0
- package/src/services/mtp-doctor.ts +78 -0
- package/src/services/network-policy.d.ts +127 -0
- package/src/services/network-policy.d.ts.map +1 -0
- package/src/services/network-policy.ts +346 -0
- package/src/services/paths.d.ts +6 -0
- package/src/services/paths.d.ts.map +1 -0
- package/src/services/paths.ts +25 -0
- package/src/services/planner-skeleton.d.ts +124 -0
- package/src/services/planner-skeleton.d.ts.map +1 -0
- package/src/services/planner-skeleton.ts +175 -0
- package/src/services/providers.d.ts +38 -0
- package/src/services/providers.d.ts.map +1 -0
- package/src/services/providers.ts +507 -0
- package/src/services/ram-budget-cache.test.ts +163 -0
- package/src/services/ram-budget.d.ts +110 -0
- package/src/services/ram-budget.d.ts.map +1 -0
- package/src/services/ram-budget.ts +0 -0
- package/src/services/readiness.d.ts +9 -0
- package/src/services/readiness.d.ts.map +1 -0
- package/src/services/readiness.test.ts +87 -0
- package/src/services/readiness.ts +238 -0
- package/src/services/recommendation.d.ts +111 -0
- package/src/services/recommendation.d.ts.map +1 -0
- package/src/services/recommendation.ts +672 -0
- package/src/services/registry.d.ts +35 -0
- package/src/services/registry.d.ts.map +1 -0
- package/src/services/registry.ts +151 -0
- package/src/services/router-handler.d.ts +92 -0
- package/src/services/router-handler.d.ts.map +1 -0
- package/src/services/router-handler.test.ts +45 -0
- package/src/services/router-handler.ts +376 -0
- package/src/services/routing-policy.d.ts +55 -0
- package/src/services/routing-policy.d.ts.map +1 -0
- package/src/services/routing-policy.ts +228 -0
- package/src/services/routing-preferences.d.ts +8 -0
- package/src/services/routing-preferences.d.ts.map +1 -0
- package/src/services/routing-preferences.ts +15 -0
- package/src/services/runtime-target.d.ts +98 -0
- package/src/services/runtime-target.d.ts.map +1 -0
- package/src/services/runtime-target.ts +154 -0
- package/src/services/service.d.ts +128 -0
- package/src/services/service.d.ts.map +1 -0
- package/src/services/service.test.ts +223 -0
- package/src/services/service.ts +735 -0
- package/src/services/session-pool.d.ts +72 -0
- package/src/services/session-pool.d.ts.map +1 -0
- package/src/services/session-pool.ts +153 -0
- package/src/services/structured-output/deterministic-repair.d.ts +23 -0
- package/src/services/structured-output/deterministic-repair.d.ts.map +1 -0
- package/src/services/structured-output/deterministic-repair.test.ts +169 -0
- package/src/services/structured-output/deterministic-repair.ts +443 -0
- package/src/services/structured-output/index.ts +4 -0
- package/src/services/structured-output.d.ts +311 -0
- package/src/services/structured-output.d.ts.map +1 -0
- package/src/services/structured-output.test.ts +483 -0
- package/src/services/structured-output.ts +712 -0
- package/src/services/transcription-priority.test.ts +211 -0
- package/src/services/tts/errors.ts +46 -0
- package/src/services/tts/index.ts +214 -0
- package/src/services/tts/tts-audio-cache.ts +235 -0
- package/src/services/tts/types.ts +157 -0
- package/src/services/types.d.ts +19 -0
- package/src/services/types.d.ts.map +1 -0
- package/src/services/types.ts +55 -0
- package/src/services/verify-on-device.d.ts +34 -0
- package/src/services/verify-on-device.d.ts.map +1 -0
- package/src/services/verify-on-device.test.ts +87 -0
- package/src/services/verify-on-device.ts +127 -0
- package/src/services/verify.d.ts +8 -0
- package/src/services/verify.d.ts.map +1 -0
- package/src/services/verify.ts +13 -0
- package/src/services/vision/aosp-unavailable.d.ts +115 -0
- package/src/services/vision/aosp-unavailable.d.ts.map +1 -0
- package/src/services/vision/aosp-unavailable.ts +163 -0
- package/src/services/vision/capacitor-llama.d.ts +99 -0
- package/src/services/vision/capacitor-llama.d.ts.map +1 -0
- package/src/services/vision/capacitor-llama.ts +255 -0
- package/src/services/vision/cloud-fallback.d.ts +47 -0
- package/src/services/vision/cloud-fallback.d.ts.map +1 -0
- package/src/services/vision/cloud-fallback.test.ts +243 -0
- package/src/services/vision/cloud-fallback.ts +268 -0
- package/src/services/vision/fallback-chain.test.ts +86 -0
- package/src/services/vision/hash.d.ts +71 -0
- package/src/services/vision/hash.d.ts.map +1 -0
- package/src/services/vision/hash.ts +157 -0
- package/src/services/vision/index.d.ts +95 -0
- package/src/services/vision/index.d.ts.map +1 -0
- package/src/services/vision/index.ts +251 -0
- package/src/services/vision/llama-server.d.ts +73 -0
- package/src/services/vision/llama-server.d.ts.map +1 -0
- package/src/services/vision/llama-server.ts +177 -0
- package/src/services/vision/types.d.ts +153 -0
- package/src/services/vision/types.d.ts.map +1 -0
- package/src/services/vision/types.ts +154 -0
- package/src/services/vision/vast-fallback.d.ts +18 -0
- package/src/services/vision/vast-fallback.d.ts.map +1 -0
- package/src/services/vision/vast-fallback.ts +127 -0
- package/src/services/vision-embedding-cache.d.ts +98 -0
- package/src/services/vision-embedding-cache.d.ts.map +1 -0
- package/src/services/vision-embedding-cache.ts +189 -0
- package/src/services/voice/VOICE_WORKBENCH.md +88 -0
- package/src/services/voice/__test-helpers__/fake-ffi.ts +92 -0
- package/src/services/voice/__test-helpers__/synthetic-speech.ts +124 -0
- package/src/services/voice/__tests__/checkpoint-manager.test.ts +241 -0
- package/src/services/voice/__tests__/checkpoint-policy.test.ts +270 -0
- package/src/services/voice/__tests__/eager-context-builder.test.ts +257 -0
- package/src/services/voice/__tests__/eliza1-eot-scorer.test.ts +288 -0
- package/src/services/voice/__tests__/eot-classifier.test.ts +431 -0
- package/src/services/voice/__tests__/optimistic-rollback.test.ts +312 -0
- package/src/services/voice/__tests__/prefill-client.test.ts +266 -0
- package/src/services/voice/__tests__/prefix-preserving-queue.test.ts +208 -0
- package/src/services/voice/__tests__/streaming-asr.test.ts +450 -0
- package/src/services/voice/__tests__/streaming-transcriber.test.ts +339 -0
- package/src/services/voice/__tests__/turn-detector-resolver.test.ts +197 -0
- package/src/services/voice/__tests__/voice-state-machine-prefill.test.ts +275 -0
- package/src/services/voice/__tests__/voice-state-machine.test.ts +354 -0
- package/src/services/voice/audio-frame-consumer.d.ts +212 -0
- package/src/services/voice/audio-frame-consumer.d.ts.map +1 -0
- package/src/services/voice/audio-frame-consumer.test.ts +343 -0
- package/src/services/voice/audio-frame-consumer.ts +491 -0
- package/src/services/voice/barge-in.d.ts +112 -0
- package/src/services/voice/barge-in.d.ts.map +1 -0
- package/src/services/voice/barge-in.test.ts +244 -0
- package/src/services/voice/barge-in.ts +336 -0
- package/src/services/voice/cancellation-coordinator.d.ts +127 -0
- package/src/services/voice/cancellation-coordinator.d.ts.map +1 -0
- package/src/services/voice/cancellation-coordinator.test.ts +196 -0
- package/src/services/voice/cancellation-coordinator.ts +269 -0
- package/src/services/voice/checkpoint-manager.d.ts +199 -0
- package/src/services/voice/checkpoint-manager.d.ts.map +1 -0
- package/src/services/voice/checkpoint-manager.ts +401 -0
- package/src/services/voice/checkpoint-policy.ts +336 -0
- package/src/services/voice/composite-eot-classifier.test.ts +59 -0
- package/src/services/voice/e2e-harness.test.ts +182 -0
- package/src/services/voice/e2e-harness.ts +743 -0
- package/src/services/voice/eager-context-builder.d.ts +170 -0
- package/src/services/voice/eager-context-builder.d.ts.map +1 -0
- package/src/services/voice/eager-context-builder.ts +262 -0
- package/src/services/voice/eliza1-eot-scorer.d.ts +124 -0
- package/src/services/voice/eliza1-eot-scorer.d.ts.map +1 -0
- package/src/services/voice/eliza1-eot-scorer.ts +242 -0
- package/src/services/voice/embedding-server.ts +200 -0
- package/src/services/voice/embedding.d.ts +133 -0
- package/src/services/voice/embedding.d.ts.map +1 -0
- package/src/services/voice/embedding.test.ts +148 -0
- package/src/services/voice/embedding.ts +244 -0
- package/src/services/voice/emotion-attribution.d.ts +68 -0
- package/src/services/voice/emotion-attribution.d.ts.map +1 -0
- package/src/services/voice/emotion-attribution.test.ts +129 -0
- package/src/services/voice/emotion-attribution.ts +361 -0
- package/src/services/voice/engine-bridge-cancellation.test.ts +422 -0
- package/src/services/voice/engine-bridge.d.ts +746 -0
- package/src/services/voice/engine-bridge.d.ts.map +1 -0
- package/src/services/voice/engine-bridge.test.ts +384 -0
- package/src/services/voice/engine-bridge.ts +2226 -0
- package/src/services/voice/eot-classifier-ggml.d.ts +179 -0
- package/src/services/voice/eot-classifier-ggml.d.ts.map +1 -0
- package/src/services/voice/eot-classifier-ggml.ts +566 -0
- package/src/services/voice/eot-classifier.d.ts +214 -0
- package/src/services/voice/eot-classifier.d.ts.map +1 -0
- package/src/services/voice/eot-classifier.ts +533 -0
- package/src/services/voice/errors.d.ts +20 -0
- package/src/services/voice/errors.d.ts.map +1 -0
- package/src/services/voice/errors.ts +32 -0
- package/src/services/voice/expressive-tags.d.ts +158 -0
- package/src/services/voice/expressive-tags.d.ts.map +1 -0
- package/src/services/voice/expressive-tags.ts +405 -0
- package/src/services/voice/ffi-bindings.d.ts +636 -0
- package/src/services/voice/ffi-bindings.d.ts.map +1 -0
- package/src/services/voice/ffi-bindings.test.ts +671 -0
- package/src/services/voice/ffi-bindings.ts +3050 -0
- package/src/services/voice/first-line-cache.d.ts +181 -0
- package/src/services/voice/first-line-cache.d.ts.map +1 -0
- package/src/services/voice/first-line-cache.ts +725 -0
- package/src/services/voice/fused-eot-scorer.d.ts +51 -0
- package/src/services/voice/fused-eot-scorer.d.ts.map +1 -0
- package/src/services/voice/fused-eot-scorer.ts +135 -0
- package/src/services/voice/index.d.ts +91 -0
- package/src/services/voice/index.d.ts.map +1 -0
- package/src/services/voice/index.ts +481 -0
- package/src/services/voice/kokoro/__tests__/kokoro-backend.test.ts +151 -0
- package/src/services/voice/kokoro/__tests__/kokoro-engine-bridge.real.test.ts +151 -0
- package/src/services/voice/kokoro/__tests__/kokoro-engine-bridge.test.ts +60 -0
- package/src/services/voice/kokoro/__tests__/kokoro-engine-discovery.test.ts +277 -0
- package/src/services/voice/kokoro/__tests__/kokoro-ffi-runtime.test.ts +235 -0
- package/src/services/voice/kokoro/__tests__/kokoro-runtime.test.ts +95 -0
- package/src/services/voice/kokoro/__tests__/phonemizer.test.ts +53 -0
- package/src/services/voice/kokoro/__tests__/runtime-selection.test.ts +231 -0
- package/src/services/voice/kokoro/__tests__/voices.test.ts +57 -0
- package/src/services/voice/kokoro/index.ts +79 -0
- package/src/services/voice/kokoro/kokoro-backend.d.ts +72 -0
- package/src/services/voice/kokoro/kokoro-backend.d.ts.map +1 -0
- package/src/services/voice/kokoro/kokoro-backend.ts +207 -0
- package/src/services/voice/kokoro/kokoro-engine-discovery.d.ts +58 -0
- package/src/services/voice/kokoro/kokoro-engine-discovery.d.ts.map +1 -0
- package/src/services/voice/kokoro/kokoro-engine-discovery.ts +177 -0
- package/src/services/voice/kokoro/kokoro-ffi-runtime.d.ts +75 -0
- package/src/services/voice/kokoro/kokoro-ffi-runtime.d.ts.map +1 -0
- package/src/services/voice/kokoro/kokoro-ffi-runtime.ts +233 -0
- package/src/services/voice/kokoro/kokoro-runtime.d.ts +100 -0
- package/src/services/voice/kokoro/kokoro-runtime.d.ts.map +1 -0
- package/src/services/voice/kokoro/kokoro-runtime.ts +170 -0
- package/src/services/voice/kokoro/phoneme-stream.ts +123 -0
- package/src/services/voice/kokoro/phonemizer.d.ts +50 -0
- package/src/services/voice/kokoro/phonemizer.d.ts.map +1 -0
- package/src/services/voice/kokoro/phonemizer.ts +344 -0
- package/src/services/voice/kokoro/pick-runtime.d.ts +61 -0
- package/src/services/voice/kokoro/pick-runtime.d.ts.map +1 -0
- package/src/services/voice/kokoro/pick-runtime.test.ts +91 -0
- package/src/services/voice/kokoro/pick-runtime.ts +130 -0
- package/src/services/voice/kokoro/runtime-selection.d.ts +92 -0
- package/src/services/voice/kokoro/runtime-selection.d.ts.map +1 -0
- package/src/services/voice/kokoro/runtime-selection.ts +237 -0
- package/src/services/voice/kokoro/types.d.ts +82 -0
- package/src/services/voice/kokoro/types.d.ts.map +1 -0
- package/src/services/voice/kokoro/types.ts +95 -0
- package/src/services/voice/kokoro/voice-presets.d.ts +23 -0
- package/src/services/voice/kokoro/voice-presets.d.ts.map +1 -0
- package/src/services/voice/kokoro/voice-presets.ts +129 -0
- package/src/services/voice/kokoro/voices.d.ts +30 -0
- package/src/services/voice/kokoro/voices.d.ts.map +1 -0
- package/src/services/voice/kokoro/voices.ts +64 -0
- package/src/services/voice/lifecycle.d.ts +135 -0
- package/src/services/voice/lifecycle.d.ts.map +1 -0
- package/src/services/voice/lifecycle.test.ts +315 -0
- package/src/services/voice/lifecycle.ts +301 -0
- package/src/services/voice/live-diarization-session.d.ts +96 -0
- package/src/services/voice/live-diarization-session.d.ts.map +1 -0
- package/src/services/voice/live-diarization-session.ts +289 -0
- package/src/services/voice/mic-source.d.ts +136 -0
- package/src/services/voice/mic-source.d.ts.map +1 -0
- package/src/services/voice/mic-source.test.ts +210 -0
- package/src/services/voice/mic-source.ts +503 -0
- package/src/services/voice/optimistic-policy.d.ts +109 -0
- package/src/services/voice/optimistic-policy.d.ts.map +1 -0
- package/src/services/voice/optimistic-policy.test.ts +101 -0
- package/src/services/voice/optimistic-policy.ts +192 -0
- package/src/services/voice/optimistic-rollback.ts +343 -0
- package/src/services/voice/partial-stabilizer.d.ts +73 -0
- package/src/services/voice/partial-stabilizer.d.ts.map +1 -0
- package/src/services/voice/partial-stabilizer.test.ts +68 -0
- package/src/services/voice/partial-stabilizer.ts +140 -0
- package/src/services/voice/phoneme-tokenizer.d.ts +49 -0
- package/src/services/voice/phoneme-tokenizer.d.ts.map +1 -0
- package/src/services/voice/phoneme-tokenizer.ts +158 -0
- package/src/services/voice/phrase-cache.d.ts +76 -0
- package/src/services/voice/phrase-cache.d.ts.map +1 -0
- package/src/services/voice/phrase-cache.test.ts +242 -0
- package/src/services/voice/phrase-cache.ts +186 -0
- package/src/services/voice/phrase-chunker.d.ts +62 -0
- package/src/services/voice/phrase-chunker.d.ts.map +1 -0
- package/src/services/voice/phrase-chunker.test.ts +239 -0
- package/src/services/voice/phrase-chunker.ts +281 -0
- package/src/services/voice/pipeline-impls.d.ts +151 -0
- package/src/services/voice/pipeline-impls.d.ts.map +1 -0
- package/src/services/voice/pipeline-impls.l6.test.ts +110 -0
- package/src/services/voice/pipeline-impls.test.ts +292 -0
- package/src/services/voice/pipeline-impls.ts +315 -0
- package/src/services/voice/pipeline.d.ts +216 -0
- package/src/services/voice/pipeline.d.ts.map +1 -0
- package/src/services/voice/pipeline.ts +505 -0
- package/src/services/voice/prefill-client.d.ts +123 -0
- package/src/services/voice/prefill-client.d.ts.map +1 -0
- package/src/services/voice/prefill-client.ts +316 -0
- package/src/services/voice/prefix-preserving-queue.d.ts +113 -0
- package/src/services/voice/prefix-preserving-queue.d.ts.map +1 -0
- package/src/services/voice/prefix-preserving-queue.ts +162 -0
- package/src/services/voice/profile-store.d.ts +248 -0
- package/src/services/voice/profile-store.d.ts.map +1 -0
- package/src/services/voice/profile-store.ts +887 -0
- package/src/services/voice/ring-buffer.d.ts +40 -0
- package/src/services/voice/ring-buffer.d.ts.map +1 -0
- package/src/services/voice/ring-buffer.ts +105 -0
- package/src/services/voice/rollback-queue.d.ts +24 -0
- package/src/services/voice/rollback-queue.d.ts.map +1 -0
- package/src/services/voice/rollback-queue.ts +74 -0
- package/src/services/voice/samantha-preset-placeholder.d.ts +67 -0
- package/src/services/voice/samantha-preset-placeholder.d.ts.map +1 -0
- package/src/services/voice/samantha-preset-placeholder.test.ts +97 -0
- package/src/services/voice/samantha-preset-placeholder.ts +148 -0
- package/src/services/voice/samantha-preset-regenerator.d.ts +87 -0
- package/src/services/voice/samantha-preset-regenerator.d.ts.map +1 -0
- package/src/services/voice/samantha-preset-regenerator.ts +393 -0
- package/src/services/voice/scheduler.d.ts +146 -0
- package/src/services/voice/scheduler.d.ts.map +1 -0
- package/src/services/voice/scheduler.t2.test.ts +141 -0
- package/src/services/voice/scheduler.ts +927 -0
- package/src/services/voice/shared-resources.d.ts +190 -0
- package/src/services/voice/shared-resources.d.ts.map +1 -0
- package/src/services/voice/shared-resources.ts +320 -0
- package/src/services/voice/speaker/attribution-pipeline.d.ts +74 -0
- package/src/services/voice/speaker/attribution-pipeline.d.ts.map +1 -0
- package/src/services/voice/speaker/attribution-pipeline.ts +386 -0
- package/src/services/voice/speaker/diarizer-fused.d.ts +59 -0
- package/src/services/voice/speaker/diarizer-fused.d.ts.map +1 -0
- package/src/services/voice/speaker/diarizer-fused.real.test.ts +100 -0
- package/src/services/voice/speaker/diarizer-fused.ts +154 -0
- package/src/services/voice/speaker/diarizer.d.ts +75 -0
- package/src/services/voice/speaker/diarizer.d.ts.map +1 -0
- package/src/services/voice/speaker/diarizer.ts +218 -0
- package/src/services/voice/speaker/encoder-fused.d.ts +60 -0
- package/src/services/voice/speaker/encoder-fused.d.ts.map +1 -0
- package/src/services/voice/speaker/encoder-fused.real.test.ts +113 -0
- package/src/services/voice/speaker/encoder-fused.ts +138 -0
- package/src/services/voice/speaker/encoder-ggml.d.ts +33 -0
- package/src/services/voice/speaker/encoder-ggml.d.ts.map +1 -0
- package/src/services/voice/speaker/encoder-ggml.ts +79 -0
- package/src/services/voice/speaker/encoder.d.ts +37 -0
- package/src/services/voice/speaker/encoder.d.ts.map +1 -0
- package/src/services/voice/speaker/encoder.ts +105 -0
- package/src/services/voice/speaker-imprint.d.ts +83 -0
- package/src/services/voice/speaker-imprint.d.ts.map +1 -0
- package/src/services/voice/speaker-imprint.test.ts +185 -0
- package/src/services/voice/speaker-imprint.ts +312 -0
- package/src/services/voice/speaker-preset-cache.d.ts +77 -0
- package/src/services/voice/speaker-preset-cache.d.ts.map +1 -0
- package/src/services/voice/speaker-preset-cache.test.ts +154 -0
- package/src/services/voice/speaker-preset-cache.ts +195 -0
- package/src/services/voice/streaming-asr/streaming-pipeline-adapter.ts +292 -0
- package/src/services/voice/system-audio-sink.d.ts +73 -0
- package/src/services/voice/system-audio-sink.d.ts.map +1 -0
- package/src/services/voice/system-audio-sink.test.ts +29 -0
- package/src/services/voice/system-audio-sink.ts +366 -0
- package/src/services/voice/transcriber.d.ts +244 -0
- package/src/services/voice/transcriber.d.ts.map +1 -0
- package/src/services/voice/transcriber.test.ts +392 -0
- package/src/services/voice/transcriber.ts +704 -0
- package/src/services/voice/turn-controller.d.ts +183 -0
- package/src/services/voice/turn-controller.d.ts.map +1 -0
- package/src/services/voice/turn-controller.test.ts +575 -0
- package/src/services/voice/turn-controller.ts +596 -0
- package/src/services/voice/types.d.ts +643 -0
- package/src/services/voice/types.d.ts.map +1 -0
- package/src/services/voice/types.ts +699 -0
- package/src/services/voice/vad.d.ts +282 -0
- package/src/services/voice/vad.d.ts.map +1 -0
- package/src/services/voice/vad.test.ts +480 -0
- package/src/services/voice/vad.ts +827 -0
- package/src/services/voice/vad.v1-v4.test.ts +222 -0
- package/src/services/voice/voice-budget.d.ts +241 -0
- package/src/services/voice/voice-budget.d.ts.map +1 -0
- package/src/services/voice/voice-budget.test.ts +420 -0
- package/src/services/voice/voice-budget.ts +656 -0
- package/src/services/voice/voice-duet.test.ts +375 -0
- package/src/services/voice/voice-emotion-classifier.d.ts +95 -0
- package/src/services/voice/voice-emotion-classifier.d.ts.map +1 -0
- package/src/services/voice/voice-emotion-classifier.test.ts +210 -0
- package/src/services/voice/voice-emotion-classifier.ts +273 -0
- package/src/services/voice/voice-preset-format.d.ts +158 -0
- package/src/services/voice/voice-preset-format.d.ts.map +1 -0
- package/src/services/voice/voice-preset-format.ts +700 -0
- package/src/services/voice/voice-preset-generator.test.ts +89 -0
- package/src/services/voice/voice-profile-artifact.d.ts +116 -0
- package/src/services/voice/voice-profile-artifact.d.ts.map +1 -0
- package/src/services/voice/voice-profile-artifact.test.ts +138 -0
- package/src/services/voice/voice-profile-artifact.ts +518 -0
- package/src/services/voice/voice-profile-routes.d.ts +83 -0
- package/src/services/voice/voice-profile-routes.d.ts.map +1 -0
- package/src/services/voice/voice-profile-routes.test.ts +429 -0
- package/src/services/voice/voice-profile-routes.ts +425 -0
- package/src/services/voice/voice-scenario.ts +154 -0
- package/src/services/voice/voice-settings.d.ts +82 -0
- package/src/services/voice/voice-settings.d.ts.map +1 -0
- package/src/services/voice/voice-settings.ts +172 -0
- package/src/services/voice/voice-state-machine.d.ts +364 -0
- package/src/services/voice/voice-state-machine.d.ts.map +1 -0
- package/src/services/voice/voice-state-machine.ts +727 -0
- package/src/services/voice/voice-workbench-report.test.ts +168 -0
- package/src/services/voice/voice-workbench-report.ts +326 -0
- package/src/services/voice/voice-workbench.test.ts +158 -0
- package/src/services/voice/voice.test.ts +1070 -0
- package/src/services/voice/wake-word-ggml.d.ts +101 -0
- package/src/services/voice/wake-word-ggml.d.ts.map +1 -0
- package/src/services/voice/wake-word-ggml.ts +320 -0
- package/src/services/voice/wake-word.d.ts +255 -0
- package/src/services/voice/wake-word.d.ts.map +1 -0
- package/src/services/voice/wake-word.test.ts +298 -0
- package/src/services/voice/wake-word.ts +554 -0
- package/src/services/voice/wrap-with-first-line-cache.d.ts +70 -0
- package/src/services/voice/wrap-with-first-line-cache.d.ts.map +1 -0
- package/src/services/voice/wrap-with-first-line-cache.ts +267 -0
- package/src/services/voice-model-updater.d.ts +240 -0
- package/src/services/voice-model-updater.d.ts.map +1 -0
- package/src/services/voice-model-updater.ts +724 -0
- package/src/services/voice-prewarm.d.ts +3 -0
- package/src/services/voice-prewarm.d.ts.map +1 -0
- package/src/services/voice-prewarm.ts +51 -0
- package/dist/index.d.ts +0 -37
- package/dist/index.js +0 -1098
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"registry.d.ts","sourceRoot":"","sources":["registry.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;GAYG;AAMH,OAAO,KAAK,EAAE,cAAc,EAAE,MAAM,SAAS,CAAC;AAmC9C;;;;GAIG;AACH,wBAAsB,mBAAmB,IAAI,OAAO,CAAC,cAAc,EAAE,CAAC,CAerE;AAED,wEAAwE;AACxE,wBAAsB,gBAAgB,CAAC,KAAK,EAAE,cAAc,GAAG,OAAO,CAAC,IAAI,CAAC,CAyB3E;AAED,gEAAgE;AAChE,wBAAsB,eAAe,CAAC,EAAE,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC,CAM/D;AAED;;;;;GAKG;AACH,wBAAsB,gBAAgB,CAAC,EAAE,EAAE,MAAM,GAAG,OAAO,CAAC;IAC3D,OAAO,EAAE,OAAO,CAAC;IACjB,MAAM,CAAC,EAAE,UAAU,GAAG,WAAW,CAAC;CAClC,CAAC,CA6BD"}
|
|
@@ -0,0 +1,151 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* On-disk registry of installed models.
|
|
3
|
+
*
|
|
4
|
+
* Two sources feed the registry:
|
|
5
|
+
* 1. Eliza-owned downloads (source: "eliza-download") — written on
|
|
6
|
+
* successful completion by the downloader.
|
|
7
|
+
* 2. External scans (source: "external-scan") — merged in at read time
|
|
8
|
+
* from `scanExternalModels()`. These are never persisted to the
|
|
9
|
+
* registry file; a rescan runs whenever we read.
|
|
10
|
+
*
|
|
11
|
+
* The JSON file only holds Eliza-owned entries. That way, if a user
|
|
12
|
+
* cleans up LM Studio models we don't show stale ghosts.
|
|
13
|
+
*/
|
|
14
|
+
|
|
15
|
+
import fs from "node:fs/promises";
|
|
16
|
+
import path from "node:path";
|
|
17
|
+
import { scanExternalModels } from "./external-scanner";
|
|
18
|
+
import { isWithinElizaRoot, localInferenceRoot, registryPath } from "./paths";
|
|
19
|
+
import type { InstalledModel } from "./types";
|
|
20
|
+
|
|
21
|
+
interface RegistryFile {
|
|
22
|
+
version: 1;
|
|
23
|
+
models: InstalledModel[];
|
|
24
|
+
}
|
|
25
|
+
|
|
26
|
+
async function ensureRootDir(): Promise<void> {
|
|
27
|
+
await fs.mkdir(localInferenceRoot(), { recursive: true });
|
|
28
|
+
}
|
|
29
|
+
|
|
30
|
+
async function readElizaOwned(): Promise<InstalledModel[]> {
|
|
31
|
+
try {
|
|
32
|
+
const raw = await fs.readFile(registryPath(), "utf8");
|
|
33
|
+
const parsed = JSON.parse(raw) as RegistryFile;
|
|
34
|
+
if (parsed?.version !== 1 || !Array.isArray(parsed.models)) {
|
|
35
|
+
return [];
|
|
36
|
+
}
|
|
37
|
+
return parsed.models.filter(
|
|
38
|
+
(m): m is InstalledModel =>
|
|
39
|
+
m && typeof m === "object" && m.source === "eliza-download",
|
|
40
|
+
);
|
|
41
|
+
} catch {
|
|
42
|
+
return [];
|
|
43
|
+
}
|
|
44
|
+
}
|
|
45
|
+
|
|
46
|
+
async function writeElizaOwned(models: InstalledModel[]): Promise<void> {
|
|
47
|
+
await ensureRootDir();
|
|
48
|
+
const tmp = `${registryPath()}.tmp`;
|
|
49
|
+
const payload: RegistryFile = { version: 1, models };
|
|
50
|
+
await fs.writeFile(tmp, JSON.stringify(payload, null, 2), "utf8");
|
|
51
|
+
await fs.rename(tmp, registryPath());
|
|
52
|
+
}
|
|
53
|
+
|
|
54
|
+
/**
|
|
55
|
+
* Return all models currently usable: persisted Eliza downloads plus a
|
|
56
|
+
* fresh external-tool scan. External duplicates of Eliza-owned files are
|
|
57
|
+
* filtered out by path.
|
|
58
|
+
*/
|
|
59
|
+
export async function listInstalledModels(): Promise<InstalledModel[]> {
|
|
60
|
+
const [ownedRaw, external] = await Promise.all([
|
|
61
|
+
readElizaOwned(),
|
|
62
|
+
scanExternalModels(),
|
|
63
|
+
]);
|
|
64
|
+
const owned = ownedRaw;
|
|
65
|
+
|
|
66
|
+
// Filter out Eliza-owned files that also survived a reboot of the local
|
|
67
|
+
// file and got re-detected by the scanner.
|
|
68
|
+
const ownedPaths = new Set(owned.map((m) => path.resolve(m.path)));
|
|
69
|
+
const dedupedExternal = external.filter(
|
|
70
|
+
(m) => !ownedPaths.has(path.resolve(m.path)),
|
|
71
|
+
);
|
|
72
|
+
|
|
73
|
+
return [...owned, ...dedupedExternal];
|
|
74
|
+
}
|
|
75
|
+
|
|
76
|
+
/** Add or update a Eliza-owned entry. External entries are rejected. */
|
|
77
|
+
export async function upsertElizaModel(model: InstalledModel): Promise<void> {
|
|
78
|
+
if (model.source !== "eliza-download") {
|
|
79
|
+
throw new Error(
|
|
80
|
+
"[local-inference] registry only accepts Eliza-owned models",
|
|
81
|
+
);
|
|
82
|
+
}
|
|
83
|
+
if (!isWithinElizaRoot(model.path)) {
|
|
84
|
+
throw new Error(
|
|
85
|
+
"[local-inference] Eliza-owned models must live under the local-inference root",
|
|
86
|
+
);
|
|
87
|
+
}
|
|
88
|
+
if (model.bundleRoot && !isWithinElizaRoot(model.bundleRoot)) {
|
|
89
|
+
throw new Error(
|
|
90
|
+
"[local-inference] Eliza-owned bundle roots must live under the local-inference root",
|
|
91
|
+
);
|
|
92
|
+
}
|
|
93
|
+
if (model.manifestPath && !isWithinElizaRoot(model.manifestPath)) {
|
|
94
|
+
throw new Error(
|
|
95
|
+
"[local-inference] Eliza-owned manifests must live under the local-inference root",
|
|
96
|
+
);
|
|
97
|
+
}
|
|
98
|
+
const owned = await readElizaOwned();
|
|
99
|
+
const withoutCurrent = owned.filter((m) => m.id !== model.id);
|
|
100
|
+
withoutCurrent.push(model);
|
|
101
|
+
await writeElizaOwned(withoutCurrent);
|
|
102
|
+
}
|
|
103
|
+
|
|
104
|
+
/** Mark an existing Eliza-owned model as most-recently-used. */
|
|
105
|
+
export async function touchElizaModel(id: string): Promise<void> {
|
|
106
|
+
const owned = await readElizaOwned();
|
|
107
|
+
const target = owned.find((m) => m.id === id);
|
|
108
|
+
if (!target) return;
|
|
109
|
+
target.lastUsedAt = new Date().toISOString();
|
|
110
|
+
await writeElizaOwned(owned);
|
|
111
|
+
}
|
|
112
|
+
|
|
113
|
+
/**
|
|
114
|
+
* Delete a Eliza-owned model from the registry and from disk.
|
|
115
|
+
*
|
|
116
|
+
* Refuses if the model was discovered from another tool — Eliza must not
|
|
117
|
+
* touch files it doesn't own. Callers surface that refusal as a 4xx.
|
|
118
|
+
*/
|
|
119
|
+
export async function removeElizaModel(id: string): Promise<{
|
|
120
|
+
removed: boolean;
|
|
121
|
+
reason?: "external" | "not-found";
|
|
122
|
+
}> {
|
|
123
|
+
const owned = await readElizaOwned();
|
|
124
|
+
const target = owned.find((m) => m.id === id);
|
|
125
|
+
if (!target) {
|
|
126
|
+
// Check whether it's a known external entry so we can return a
|
|
127
|
+
// helpful error message instead of 404.
|
|
128
|
+
const external = await scanExternalModels();
|
|
129
|
+
if (external.some((m) => m.id === id)) {
|
|
130
|
+
return { removed: false, reason: "external" };
|
|
131
|
+
}
|
|
132
|
+
return { removed: false, reason: "not-found" };
|
|
133
|
+
}
|
|
134
|
+
|
|
135
|
+
if (!isWithinElizaRoot(target.path)) {
|
|
136
|
+
return { removed: false, reason: "external" };
|
|
137
|
+
}
|
|
138
|
+
|
|
139
|
+
const removePath =
|
|
140
|
+
target.bundleRoot && isWithinElizaRoot(target.bundleRoot)
|
|
141
|
+
? target.bundleRoot
|
|
142
|
+
: target.path;
|
|
143
|
+
try {
|
|
144
|
+
await fs.rm(removePath, { recursive: true, force: true });
|
|
145
|
+
} catch {
|
|
146
|
+
// If the file was already gone we still want to clear the registry entry.
|
|
147
|
+
}
|
|
148
|
+
|
|
149
|
+
await writeElizaOwned(owned.filter((m) => m.id !== id));
|
|
150
|
+
return { removed: true };
|
|
151
|
+
}
|
|
@@ -0,0 +1,92 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Top-priority router handler.
|
|
3
|
+
*
|
|
4
|
+
* Registers a model handler for every `AgentModelSlot` at priority
|
|
5
|
+
* `Number.MAX_SAFE_INTEGER`, which guarantees the runtime dispatches to
|
|
6
|
+
* us first. At dispatch time we:
|
|
7
|
+
*
|
|
8
|
+
* 1. Read the user's per-slot policy + preferred-provider choice from
|
|
9
|
+
* `routing-preferences.ts`.
|
|
10
|
+
* 2. Ask the `policyEngine` to pick a provider from the handler
|
|
11
|
+
* registry's current set (excluding ourselves).
|
|
12
|
+
* 3. Invoke that provider's original handler directly — bypassing
|
|
13
|
+
* `runtime.useModel` which would recurse into us.
|
|
14
|
+
* 4. Record the observed latency so later "fastest" picks have data.
|
|
15
|
+
* 5. On handler failure: retry the next eligible provider in priority
|
|
16
|
+
* order until exhausted (except in `manual` mode with an explicit
|
|
17
|
+
* preferred provider — that throws verbatim).
|
|
18
|
+
*
|
|
19
|
+
* If no other handler exists we throw a clear error rather than return
|
|
20
|
+
* garbage — the caller is meant to see "no provider configured" so they
|
|
21
|
+
* know to set one up.
|
|
22
|
+
*
|
|
23
|
+
* Because the router sits at the top of the priority stack, the user's
|
|
24
|
+
* preference is always authoritative regardless of what plugins register
|
|
25
|
+
* at lower priorities. This is the mechanism that unifies cloud + local
|
|
26
|
+
* + device-bridge routing from one settings panel.
|
|
27
|
+
*
|
|
28
|
+
* ## TTS routing precedence (`TEXT_TO_SPEECH` slot)
|
|
29
|
+
*
|
|
30
|
+
* The default per-slot policy is `prefer-local` (see
|
|
31
|
+
* `DEFAULT_ROUTING_POLICY` in `routing-preferences.ts`), which the
|
|
32
|
+
* policyEngine implements by short-circuiting to whichever candidate
|
|
33
|
+
* has provider `eliza-local-inference` / `capacitor-llama` /
|
|
34
|
+
* `eliza-device-bridge`. So even though `plugin-elizacloud` registers
|
|
35
|
+
* its TTS handler at plugin priority 50 (higher than the default 0 of
|
|
36
|
+
* direct providers like ElevenLabs / OpenAI / Groq / Edge-TTS), the
|
|
37
|
+
* router prefers local first when local is registered AND
|
|
38
|
+
* `local-inference` has a TTS-capable handler.
|
|
39
|
+
*
|
|
40
|
+
* Documented routing precedence for `TEXT_TO_SPEECH`:
|
|
41
|
+
*
|
|
42
|
+
* 1. **Local (`eliza-local-inference`)** — tier-aware Eliza-1 voice,
|
|
43
|
+
* using the ordered `ELIZA_1_VOICE_BACKENDS` policy in
|
|
44
|
+
* `@elizaos/shared/local-inference/catalog` (OmniVoice first where
|
|
45
|
+
* bundled, Kokoro fallback where bundled). Always preferred when
|
|
46
|
+
* available.
|
|
47
|
+
* 2. **Eliza Cloud (`elizacloud`)** — managed cloud proxy. Picked when
|
|
48
|
+
* local is unavailable. Throws `CloudTtsUnavailableError` when
|
|
49
|
+
* cloud isn't connected, which the loop above catches and falls
|
|
50
|
+
* through to step 3.
|
|
51
|
+
* 3. **ElevenLabs (`elevenlabs`)** — direct API key path.
|
|
52
|
+
* 4. **OpenAI (`openai`)** — direct API key path.
|
|
53
|
+
* 5. **Groq (`groq`)** — direct API key path.
|
|
54
|
+
* 6. **Edge-TTS (`edge-tts`)** — free Microsoft Edge endpoint, no key.
|
|
55
|
+
*
|
|
56
|
+
* Same precedence applies to `TRANSCRIPTION`, with the local side using
|
|
57
|
+
* Qwen3-ASR via the fused libelizainference (no whisper.cpp; see
|
|
58
|
+
* `plugin-local-inference/native/AGENTS.md` §1).
|
|
59
|
+
*
|
|
60
|
+
* Users can override this per slot via the routing-preferences settings
|
|
61
|
+
* panel (`prefer-local` ↔ `manual` + explicit `preferredProvider`).
|
|
62
|
+
*/
|
|
63
|
+
import type { AgentRuntime } from "@elizaos/core";
|
|
64
|
+
import type { HandlerRegistration } from "./handler-registry";
|
|
65
|
+
import { type AgentModelSlot } from "./types";
|
|
66
|
+
export declare const ROUTER_PROVIDER = "eliza-router";
|
|
67
|
+
declare function modelTypeToSlot(modelType: string): AgentModelSlot | null;
|
|
68
|
+
export declare function filterUnavailableLocalInferenceCandidates(candidates: HandlerRegistration[], localInferenceAvailable: boolean, forceLocalInference: boolean): HandlerRegistration[];
|
|
69
|
+
export declare function filterUnavailableLocalInference(slot: AgentModelSlot, policy: string, preferredProvider: string | null, candidates: HandlerRegistration[]): Promise<HandlerRegistration[]>;
|
|
70
|
+
/**
|
|
71
|
+
* Install the router as the top-priority handler for every slot.
|
|
72
|
+
*
|
|
73
|
+
* Idempotent per-runtime via the handler-registry's "last write wins"
|
|
74
|
+
* behaviour — re-registering our handlers just refreshes them in place.
|
|
75
|
+
* Called from `ensure-local-inference-handler.ts` after `handlerRegistry`
|
|
76
|
+
* has been installed on the runtime.
|
|
77
|
+
*/
|
|
78
|
+
export interface RouterInstallOptions {
|
|
79
|
+
skipSlots?: readonly AgentModelSlot[];
|
|
80
|
+
}
|
|
81
|
+
export declare function installRouterHandler(runtime: AgentRuntime, options?: RouterInstallOptions): void;
|
|
82
|
+
/** Public helper — useful for diagnostics endpoints. */
|
|
83
|
+
export declare function describeCurrentRouting(): Array<{
|
|
84
|
+
slot: AgentModelSlot;
|
|
85
|
+
modelType: string;
|
|
86
|
+
candidates: Array<{
|
|
87
|
+
provider: string;
|
|
88
|
+
priority: number;
|
|
89
|
+
}>;
|
|
90
|
+
}>;
|
|
91
|
+
export { modelTypeToSlot };
|
|
92
|
+
//# sourceMappingURL=router-handler.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"router-handler.d.ts","sourceRoot":"","sources":["router-handler.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA6DG;AAEH,OAAO,KAAK,EAAE,YAAY,EAAiB,MAAM,eAAe,CAAC;AAQjE,OAAO,KAAK,EAAE,mBAAmB,EAAE,MAAM,oBAAoB,CAAC;AAO9D,OAAO,EAAqB,KAAK,cAAc,EAAE,MAAM,SAAS,CAAC;AAEjE,eAAO,MAAM,eAAe,iBAAiB,CAAC;AA0C9C,iBAAS,eAAe,CAAC,SAAS,EAAE,MAAM,GAAG,cAAc,GAAG,IAAI,CAKjE;AA0CD,wBAAgB,yCAAyC,CACxD,UAAU,EAAE,mBAAmB,EAAE,EACjC,uBAAuB,EAAE,OAAO,EAChC,mBAAmB,EAAE,OAAO,GAC1B,mBAAmB,EAAE,CAQvB;AAED,wBAAsB,+BAA+B,CACpD,IAAI,EAAE,cAAc,EACpB,MAAM,EAAE,MAAM,EACd,iBAAiB,EAAE,MAAM,GAAG,IAAI,EAChC,UAAU,EAAE,mBAAmB,EAAE,GAC/B,OAAO,CAAC,mBAAmB,EAAE,CAAC,CAsBhC;AAsGD;;;;;;;GAOG;AACH,MAAM,WAAW,oBAAoB;IACpC,SAAS,CAAC,EAAE,SAAS,cAAc,EAAE,CAAC;CACtC;AAED,wBAAgB,oBAAoB,CACnC,OAAO,EAAE,YAAY,EACrB,OAAO,GAAE,oBAAyB,GAChC,IAAI,CAuBN;AAED,wDAAwD;AACxD,wBAAgB,sBAAsB,IAAI,KAAK,CAAC;IAC/C,IAAI,EAAE,cAAc,CAAC;IACrB,SAAS,EAAE,MAAM,CAAC;IAClB,UAAU,EAAE,KAAK,CAAC;QACjB,QAAQ,EAAE,MAAM,CAAC;QACjB,QAAQ,EAAE,MAAM,CAAC;KACjB,CAAC,CAAC;CACH,CAAC,CAWD;AAID,OAAO,EAAE,eAAe,EAAE,CAAC"}
|
|
@@ -0,0 +1,45 @@
|
|
|
1
|
+
import { type AgentRuntime, ModelType } from "@elizaos/core";
|
|
2
|
+
import { describe, expect, it, vi } from "vitest";
|
|
3
|
+
import { installRouterHandler, ROUTER_PROVIDER } from "./router-handler";
|
|
4
|
+
|
|
5
|
+
describe("installRouterHandler", () => {
|
|
6
|
+
it("does not register router handlers for skipped slots", () => {
|
|
7
|
+
const registrations: Array<{
|
|
8
|
+
modelType: string;
|
|
9
|
+
provider: string;
|
|
10
|
+
priority?: number;
|
|
11
|
+
}> = [];
|
|
12
|
+
const runtime = {
|
|
13
|
+
registerModel: vi.fn(
|
|
14
|
+
(
|
|
15
|
+
modelType: string,
|
|
16
|
+
_handler: unknown,
|
|
17
|
+
provider: string,
|
|
18
|
+
priority?: number,
|
|
19
|
+
) => {
|
|
20
|
+
registrations.push({ modelType, provider, priority });
|
|
21
|
+
},
|
|
22
|
+
),
|
|
23
|
+
} as unknown as AgentRuntime;
|
|
24
|
+
|
|
25
|
+
installRouterHandler(runtime, { skipSlots: ["TEXT_EMBEDDING"] });
|
|
26
|
+
|
|
27
|
+
expect(registrations).toEqual(
|
|
28
|
+
expect.arrayContaining([
|
|
29
|
+
expect.objectContaining({
|
|
30
|
+
modelType: ModelType.TEXT_SMALL,
|
|
31
|
+
provider: ROUTER_PROVIDER,
|
|
32
|
+
}),
|
|
33
|
+
expect.objectContaining({
|
|
34
|
+
modelType: ModelType.TEXT_LARGE,
|
|
35
|
+
provider: ROUTER_PROVIDER,
|
|
36
|
+
}),
|
|
37
|
+
]),
|
|
38
|
+
);
|
|
39
|
+
expect(
|
|
40
|
+
registrations.some(
|
|
41
|
+
(registration) => registration.modelType === ModelType.TEXT_EMBEDDING,
|
|
42
|
+
),
|
|
43
|
+
).toBe(false);
|
|
44
|
+
});
|
|
45
|
+
});
|
|
@@ -0,0 +1,376 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Top-priority router handler.
|
|
3
|
+
*
|
|
4
|
+
* Registers a model handler for every `AgentModelSlot` at priority
|
|
5
|
+
* `Number.MAX_SAFE_INTEGER`, which guarantees the runtime dispatches to
|
|
6
|
+
* us first. At dispatch time we:
|
|
7
|
+
*
|
|
8
|
+
* 1. Read the user's per-slot policy + preferred-provider choice from
|
|
9
|
+
* `routing-preferences.ts`.
|
|
10
|
+
* 2. Ask the `policyEngine` to pick a provider from the handler
|
|
11
|
+
* registry's current set (excluding ourselves).
|
|
12
|
+
* 3. Invoke that provider's original handler directly — bypassing
|
|
13
|
+
* `runtime.useModel` which would recurse into us.
|
|
14
|
+
* 4. Record the observed latency so later "fastest" picks have data.
|
|
15
|
+
* 5. On handler failure: retry the next eligible provider in priority
|
|
16
|
+
* order until exhausted (except in `manual` mode with an explicit
|
|
17
|
+
* preferred provider — that throws verbatim).
|
|
18
|
+
*
|
|
19
|
+
* If no other handler exists we throw a clear error rather than return
|
|
20
|
+
* garbage — the caller is meant to see "no provider configured" so they
|
|
21
|
+
* know to set one up.
|
|
22
|
+
*
|
|
23
|
+
* Because the router sits at the top of the priority stack, the user's
|
|
24
|
+
* preference is always authoritative regardless of what plugins register
|
|
25
|
+
* at lower priorities. This is the mechanism that unifies cloud + local
|
|
26
|
+
* + device-bridge routing from one settings panel.
|
|
27
|
+
*
|
|
28
|
+
* ## TTS routing precedence (`TEXT_TO_SPEECH` slot)
|
|
29
|
+
*
|
|
30
|
+
* The default per-slot policy is `prefer-local` (see
|
|
31
|
+
* `DEFAULT_ROUTING_POLICY` in `routing-preferences.ts`), which the
|
|
32
|
+
* policyEngine implements by short-circuiting to whichever candidate
|
|
33
|
+
* has provider `eliza-local-inference` / `capacitor-llama` /
|
|
34
|
+
* `eliza-device-bridge`. So even though `plugin-elizacloud` registers
|
|
35
|
+
* its TTS handler at plugin priority 50 (higher than the default 0 of
|
|
36
|
+
* direct providers like ElevenLabs / OpenAI / Groq / Edge-TTS), the
|
|
37
|
+
* router prefers local first when local is registered AND
|
|
38
|
+
* `local-inference` has a TTS-capable handler.
|
|
39
|
+
*
|
|
40
|
+
* Documented routing precedence for `TEXT_TO_SPEECH`:
|
|
41
|
+
*
|
|
42
|
+
* 1. **Local (`eliza-local-inference`)** — tier-aware Eliza-1 voice,
|
|
43
|
+
* using the ordered `ELIZA_1_VOICE_BACKENDS` policy in
|
|
44
|
+
* `@elizaos/shared/local-inference/catalog` (OmniVoice first where
|
|
45
|
+
* bundled, Kokoro fallback where bundled). Always preferred when
|
|
46
|
+
* available.
|
|
47
|
+
* 2. **Eliza Cloud (`elizacloud`)** — managed cloud proxy. Picked when
|
|
48
|
+
* local is unavailable. Throws `CloudTtsUnavailableError` when
|
|
49
|
+
* cloud isn't connected, which the loop above catches and falls
|
|
50
|
+
* through to step 3.
|
|
51
|
+
* 3. **ElevenLabs (`elevenlabs`)** — direct API key path.
|
|
52
|
+
* 4. **OpenAI (`openai`)** — direct API key path.
|
|
53
|
+
* 5. **Groq (`groq`)** — direct API key path.
|
|
54
|
+
* 6. **Edge-TTS (`edge-tts`)** — free Microsoft Edge endpoint, no key.
|
|
55
|
+
*
|
|
56
|
+
* Same precedence applies to `TRANSCRIPTION`, with the local side using
|
|
57
|
+
* Qwen3-ASR via the fused libelizainference (no whisper.cpp; see
|
|
58
|
+
* `plugin-local-inference/native/AGENTS.md` §1).
|
|
59
|
+
*
|
|
60
|
+
* Users can override this per slot via the routing-preferences settings
|
|
61
|
+
* panel (`prefer-local` ↔ `manual` + explicit `preferredProvider`).
|
|
62
|
+
*/
|
|
63
|
+
|
|
64
|
+
import type { AgentRuntime, IAgentRuntime } from "@elizaos/core";
|
|
65
|
+
import {
|
|
66
|
+
logger,
|
|
67
|
+
ModelType,
|
|
68
|
+
NoModelProviderConfiguredError,
|
|
69
|
+
} from "@elizaos/core";
|
|
70
|
+
import { readEffectiveAssignments } from "./assignments";
|
|
71
|
+
import { localInferenceEngine } from "./engine";
|
|
72
|
+
import type { HandlerRegistration } from "./handler-registry";
|
|
73
|
+
import { handlerRegistry } from "./handler-registry";
|
|
74
|
+
import { policyEngine } from "./routing-policy";
|
|
75
|
+
import {
|
|
76
|
+
DEFAULT_ROUTING_POLICY,
|
|
77
|
+
readRoutingPreferences,
|
|
78
|
+
} from "./routing-preferences";
|
|
79
|
+
import { AGENT_MODEL_SLOTS, type AgentModelSlot } from "./types";
|
|
80
|
+
|
|
81
|
+
export const ROUTER_PROVIDER = "eliza-router";
|
|
82
|
+
/**
|
|
83
|
+
* Max safe integer keeps us at the top even if a plugin registers with
|
|
84
|
+
* a very high priority. If someone deliberately wants to outrank us,
|
|
85
|
+
* they can register with Infinity — unlikely in practice.
|
|
86
|
+
*/
|
|
87
|
+
const ROUTER_PRIORITY = Number.MAX_SAFE_INTEGER;
|
|
88
|
+
|
|
89
|
+
function readBooleanEnv(name: string): boolean {
|
|
90
|
+
const value =
|
|
91
|
+
typeof process !== "undefined" ? process.env[name]?.trim() : undefined;
|
|
92
|
+
if (!value) {
|
|
93
|
+
return false;
|
|
94
|
+
}
|
|
95
|
+
return value === "1" || value.toLowerCase() === "true";
|
|
96
|
+
}
|
|
97
|
+
|
|
98
|
+
/**
|
|
99
|
+
* Runtime's registerModel type, narrowed for our use. The core signature
|
|
100
|
+
* lets the handler return any model type; for routing we only care that
|
|
101
|
+
* we can call it and await a result.
|
|
102
|
+
*/
|
|
103
|
+
type AnyHandler = (
|
|
104
|
+
runtime: IAgentRuntime,
|
|
105
|
+
params: Record<string, unknown>,
|
|
106
|
+
) => Promise<unknown>;
|
|
107
|
+
|
|
108
|
+
function slotToModelType(slot: AgentModelSlot): string | undefined {
|
|
109
|
+
switch (slot) {
|
|
110
|
+
case "TEXT_SMALL":
|
|
111
|
+
return ModelType.TEXT_SMALL;
|
|
112
|
+
case "TEXT_LARGE":
|
|
113
|
+
return ModelType.TEXT_LARGE;
|
|
114
|
+
case "TEXT_EMBEDDING":
|
|
115
|
+
return ModelType.TEXT_EMBEDDING;
|
|
116
|
+
case "TEXT_TO_SPEECH":
|
|
117
|
+
return ModelType.TEXT_TO_SPEECH;
|
|
118
|
+
case "TRANSCRIPTION":
|
|
119
|
+
return ModelType.TRANSCRIPTION;
|
|
120
|
+
}
|
|
121
|
+
}
|
|
122
|
+
|
|
123
|
+
function modelTypeToSlot(modelType: string): AgentModelSlot | null {
|
|
124
|
+
for (const slot of AGENT_MODEL_SLOTS) {
|
|
125
|
+
if (slotToModelType(slot) === modelType) return slot;
|
|
126
|
+
}
|
|
127
|
+
return null;
|
|
128
|
+
}
|
|
129
|
+
|
|
130
|
+
function shouldForceLocalInference(
|
|
131
|
+
policy: string,
|
|
132
|
+
preferredProvider: string | null,
|
|
133
|
+
): boolean {
|
|
134
|
+
return policy === "manual" && preferredProvider === "eliza-local-inference";
|
|
135
|
+
}
|
|
136
|
+
|
|
137
|
+
function getRuntimeModelCandidates(
|
|
138
|
+
runtime: IAgentRuntime,
|
|
139
|
+
modelType: string,
|
|
140
|
+
): HandlerRegistration[] {
|
|
141
|
+
const models = (runtime as { models?: unknown }).models;
|
|
142
|
+
if (!(models instanceof Map)) return [];
|
|
143
|
+
const registrations = models.get(modelType);
|
|
144
|
+
if (!Array.isArray(registrations)) return [];
|
|
145
|
+
return registrations
|
|
146
|
+
.filter(
|
|
147
|
+
(
|
|
148
|
+
entry,
|
|
149
|
+
): entry is {
|
|
150
|
+
provider: string;
|
|
151
|
+
priority?: number;
|
|
152
|
+
handler: HandlerRegistration["handler"];
|
|
153
|
+
} =>
|
|
154
|
+
entry &&
|
|
155
|
+
typeof entry === "object" &&
|
|
156
|
+
typeof (entry as { provider?: unknown }).provider === "string" &&
|
|
157
|
+
(entry as { provider: string }).provider !== ROUTER_PROVIDER &&
|
|
158
|
+
typeof (entry as { handler?: unknown }).handler === "function",
|
|
159
|
+
)
|
|
160
|
+
.map((entry) => ({
|
|
161
|
+
modelType,
|
|
162
|
+
provider: entry.provider,
|
|
163
|
+
priority: typeof entry.priority === "number" ? entry.priority : 0,
|
|
164
|
+
registeredAt: "runtime-introspection",
|
|
165
|
+
handler: entry.handler,
|
|
166
|
+
}))
|
|
167
|
+
.sort((a, b) => b.priority - a.priority);
|
|
168
|
+
}
|
|
169
|
+
|
|
170
|
+
export function filterUnavailableLocalInferenceCandidates(
|
|
171
|
+
candidates: HandlerRegistration[],
|
|
172
|
+
localInferenceAvailable: boolean,
|
|
173
|
+
forceLocalInference: boolean,
|
|
174
|
+
): HandlerRegistration[] {
|
|
175
|
+
if (forceLocalInference || localInferenceAvailable) {
|
|
176
|
+
return candidates;
|
|
177
|
+
}
|
|
178
|
+
|
|
179
|
+
return candidates.filter(
|
|
180
|
+
(candidate) => candidate.provider !== "eliza-local-inference",
|
|
181
|
+
);
|
|
182
|
+
}
|
|
183
|
+
|
|
184
|
+
export async function filterUnavailableLocalInference(
|
|
185
|
+
slot: AgentModelSlot,
|
|
186
|
+
policy: string,
|
|
187
|
+
preferredProvider: string | null,
|
|
188
|
+
candidates: HandlerRegistration[],
|
|
189
|
+
): Promise<HandlerRegistration[]> {
|
|
190
|
+
// Voice slots (TTS / STT) are self-sufficient — their handlers call
|
|
191
|
+
// ensureActiveBundleVoiceReady() internally which loads the voice model
|
|
192
|
+
// on-demand. Don't gate them behind text model availability; the text
|
|
193
|
+
// model assignment check only makes sense for text generation slots.
|
|
194
|
+
if (slot === "TEXT_TO_SPEECH" || slot === "TRANSCRIPTION") {
|
|
195
|
+
return candidates;
|
|
196
|
+
}
|
|
197
|
+
|
|
198
|
+
const hasLocalInference = candidates.some(
|
|
199
|
+
(candidate) => candidate.provider === "eliza-local-inference",
|
|
200
|
+
);
|
|
201
|
+
if (!hasLocalInference) {
|
|
202
|
+
return candidates;
|
|
203
|
+
}
|
|
204
|
+
|
|
205
|
+
const assignments = await readEffectiveAssignments();
|
|
206
|
+
return filterUnavailableLocalInferenceCandidates(
|
|
207
|
+
candidates,
|
|
208
|
+
Boolean(assignments[slot]) || localInferenceEngine.hasLoadedModel(),
|
|
209
|
+
shouldForceLocalInference(policy, preferredProvider),
|
|
210
|
+
);
|
|
211
|
+
}
|
|
212
|
+
|
|
213
|
+
function makeRouterHandler(slot: AgentModelSlot): AnyHandler {
|
|
214
|
+
return async (runtime, params) => {
|
|
215
|
+
const modelType = slotToModelType(slot);
|
|
216
|
+
if (!modelType) {
|
|
217
|
+
throw new Error(`[router] Unknown agent slot: ${slot}`);
|
|
218
|
+
}
|
|
219
|
+
|
|
220
|
+
// Global local-only override: ELIZA_LOCAL_ONLY=1 pins every slot to
|
|
221
|
+
// manual + eliza-local-inference, disabling cloud fallback entirely.
|
|
222
|
+
const globalLocalOnly = readBooleanEnv("ELIZA_LOCAL_ONLY");
|
|
223
|
+
|
|
224
|
+
// Read the user's policy for this slot. Absent = local-first fallback.
|
|
225
|
+
const prefs = await readRoutingPreferences();
|
|
226
|
+
const policy = globalLocalOnly
|
|
227
|
+
? "manual"
|
|
228
|
+
: (prefs.policy[slot] ?? DEFAULT_ROUTING_POLICY);
|
|
229
|
+
const preferred = globalLocalOnly
|
|
230
|
+
? "eliza-local-inference"
|
|
231
|
+
: (prefs.preferredProvider[slot] ?? null);
|
|
232
|
+
|
|
233
|
+
// Ask the policy engine which handler to dispatch to. For automatic
|
|
234
|
+
// policies, honor the documented fallback behaviour: if the selected
|
|
235
|
+
// provider throws, try the next eligible provider instead of surfacing a
|
|
236
|
+
// local/model-specific failure while cloud providers are available.
|
|
237
|
+
const registeredCandidates = handlerRegistry.getForTypeExcluding(
|
|
238
|
+
modelType,
|
|
239
|
+
ROUTER_PROVIDER,
|
|
240
|
+
);
|
|
241
|
+
const candidates = await filterUnavailableLocalInference(
|
|
242
|
+
slot,
|
|
243
|
+
policy,
|
|
244
|
+
preferred,
|
|
245
|
+
registeredCandidates.length > 0
|
|
246
|
+
? registeredCandidates
|
|
247
|
+
: getRuntimeModelCandidates(runtime, modelType),
|
|
248
|
+
);
|
|
249
|
+
const failedProviders = new Set<string>();
|
|
250
|
+
let lastError: unknown = null;
|
|
251
|
+
|
|
252
|
+
while (true) {
|
|
253
|
+
const remaining = candidates.filter(
|
|
254
|
+
(candidate) => !failedProviders.has(candidate.provider),
|
|
255
|
+
);
|
|
256
|
+
const pick = policyEngine.pickProvider({
|
|
257
|
+
modelType,
|
|
258
|
+
policy,
|
|
259
|
+
preferredProvider: preferred,
|
|
260
|
+
candidates: remaining,
|
|
261
|
+
selfProvider: ROUTER_PROVIDER,
|
|
262
|
+
});
|
|
263
|
+
|
|
264
|
+
if (!pick) {
|
|
265
|
+
if (lastError) {
|
|
266
|
+
throw lastError;
|
|
267
|
+
}
|
|
268
|
+
throw new NoModelProviderConfiguredError(
|
|
269
|
+
`[router] No provider registered for ${slot}. Configure a cloud provider, enable local inference, or pair a device.`,
|
|
270
|
+
);
|
|
271
|
+
}
|
|
272
|
+
|
|
273
|
+
policyEngine.recordPick(pick.provider, modelType);
|
|
274
|
+
const start = Date.now();
|
|
275
|
+
try {
|
|
276
|
+
const result = await pick.handler(runtime, params);
|
|
277
|
+
policyEngine.recordLatency(
|
|
278
|
+
pick.provider,
|
|
279
|
+
modelType,
|
|
280
|
+
Date.now() - start,
|
|
281
|
+
);
|
|
282
|
+
return result;
|
|
283
|
+
} catch (err) {
|
|
284
|
+
// Record the timing even on failure so "fastest" doesn't silently
|
|
285
|
+
// prefer providers that error out fast.
|
|
286
|
+
policyEngine.recordLatency(
|
|
287
|
+
pick.provider,
|
|
288
|
+
modelType,
|
|
289
|
+
Date.now() - start,
|
|
290
|
+
);
|
|
291
|
+
|
|
292
|
+
const manualPreferred =
|
|
293
|
+
policy === "manual" &&
|
|
294
|
+
preferred !== null &&
|
|
295
|
+
pick.provider === preferred;
|
|
296
|
+
const hasAlternative = remaining.some(
|
|
297
|
+
(candidate) => candidate.provider !== pick.provider,
|
|
298
|
+
);
|
|
299
|
+
if (manualPreferred || !hasAlternative) {
|
|
300
|
+
throw err;
|
|
301
|
+
}
|
|
302
|
+
|
|
303
|
+
failedProviders.add(pick.provider);
|
|
304
|
+
lastError = err;
|
|
305
|
+
logger.info(
|
|
306
|
+
`[router] Provider ${pick.provider} failed for ${slot}; trying fallback provider (${err instanceof Error ? err.message : String(err)})`,
|
|
307
|
+
);
|
|
308
|
+
}
|
|
309
|
+
}
|
|
310
|
+
};
|
|
311
|
+
}
|
|
312
|
+
|
|
313
|
+
/**
|
|
314
|
+
* Install the router as the top-priority handler for every slot.
|
|
315
|
+
*
|
|
316
|
+
* Idempotent per-runtime via the handler-registry's "last write wins"
|
|
317
|
+
* behaviour — re-registering our handlers just refreshes them in place.
|
|
318
|
+
* Called from `ensure-local-inference-handler.ts` after `handlerRegistry`
|
|
319
|
+
* has been installed on the runtime.
|
|
320
|
+
*/
|
|
321
|
+
export interface RouterInstallOptions {
|
|
322
|
+
skipSlots?: readonly AgentModelSlot[];
|
|
323
|
+
}
|
|
324
|
+
|
|
325
|
+
export function installRouterHandler(
|
|
326
|
+
runtime: AgentRuntime,
|
|
327
|
+
options: RouterInstallOptions = {},
|
|
328
|
+
): void {
|
|
329
|
+
const rt = runtime as AgentRuntime & {
|
|
330
|
+
registerModel?: (
|
|
331
|
+
modelType: string,
|
|
332
|
+
handler: AnyHandler,
|
|
333
|
+
provider: string,
|
|
334
|
+
priority?: number,
|
|
335
|
+
) => void;
|
|
336
|
+
};
|
|
337
|
+
if (typeof rt.registerModel !== "function") return;
|
|
338
|
+
|
|
339
|
+
const skippedSlots = new Set(options.skipSlots ?? []);
|
|
340
|
+
for (const slot of AGENT_MODEL_SLOTS) {
|
|
341
|
+
if (skippedSlots.has(slot)) continue;
|
|
342
|
+
const modelType = slotToModelType(slot);
|
|
343
|
+
if (!modelType) continue;
|
|
344
|
+
rt.registerModel(
|
|
345
|
+
modelType,
|
|
346
|
+
makeRouterHandler(slot),
|
|
347
|
+
ROUTER_PROVIDER,
|
|
348
|
+
ROUTER_PRIORITY,
|
|
349
|
+
);
|
|
350
|
+
}
|
|
351
|
+
}
|
|
352
|
+
|
|
353
|
+
/** Public helper — useful for diagnostics endpoints. */
|
|
354
|
+
export function describeCurrentRouting(): Array<{
|
|
355
|
+
slot: AgentModelSlot;
|
|
356
|
+
modelType: string;
|
|
357
|
+
candidates: Array<{
|
|
358
|
+
provider: string;
|
|
359
|
+
priority: number;
|
|
360
|
+
}>;
|
|
361
|
+
}> {
|
|
362
|
+
const out: ReturnType<typeof describeCurrentRouting> = [];
|
|
363
|
+
for (const slot of AGENT_MODEL_SLOTS) {
|
|
364
|
+
const modelType = slotToModelType(slot);
|
|
365
|
+
if (!modelType) continue;
|
|
366
|
+
const candidates = handlerRegistry
|
|
367
|
+
.getForTypeExcluding(modelType, ROUTER_PROVIDER)
|
|
368
|
+
.map((c) => ({ provider: c.provider, priority: c.priority }));
|
|
369
|
+
out.push({ slot, modelType, candidates });
|
|
370
|
+
}
|
|
371
|
+
return out;
|
|
372
|
+
}
|
|
373
|
+
|
|
374
|
+
// Re-export so the handler registry can tell whether it's looking at a
|
|
375
|
+
// recursive router registration when filtering.
|
|
376
|
+
export { modelTypeToSlot };
|