@elizaos/plugin-local-inference 2.0.0-beta.1 → 2.0.11-beta.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (676)
  1. package/LICENSE +21 -0
  2. package/README.md +83 -0
  3. package/package.json +81 -15
  4. package/src/actions/generate-media.d.ts +59 -0
  5. package/src/actions/generate-media.d.ts.map +1 -0
  6. package/src/actions/generate-media.ts +647 -0
  7. package/src/actions/identify-speaker.d.ts +23 -0
  8. package/src/actions/identify-speaker.d.ts.map +1 -0
  9. package/src/actions/identify-speaker.ts +171 -0
  10. package/src/adapters/capacitor-llama/__tests__/compat-behavior.test.ts +218 -0
  11. package/src/adapters/capacitor-llama/__tests__/index.test.ts +68 -0
  12. package/src/adapters/capacitor-llama/__tests__/structured-output.test.ts +215 -0
  13. package/src/adapters/capacitor-llama/__tests__/text-streaming.test.ts +174 -0
  14. package/src/adapters/capacitor-llama/environment.ts +71 -0
  15. package/src/adapters/capacitor-llama/index.browser.ts +83 -0
  16. package/src/adapters/capacitor-llama/index.ts +807 -0
  17. package/src/adapters/capacitor-llama/loader.ts +109 -0
  18. package/src/adapters/capacitor-llama/structured-output.ts +165 -0
  19. package/src/adapters/capacitor-llama/text-streaming.ts +227 -0
  20. package/src/adapters/capacitor-llama/types.ts +374 -0
  21. package/src/backends/apple-foundation.ts +127 -0
  22. package/src/index.d.ts +7 -0
  23. package/src/index.d.ts.map +1 -0
  24. package/src/index.ts +54 -0
  25. package/src/local-inference-routes.d.ts +38 -0
  26. package/src/local-inference-routes.d.ts.map +1 -0
  27. package/src/local-inference-routes.test.ts +344 -0
  28. package/src/local-inference-routes.ts +1543 -0
  29. package/src/provider.d.ts +21 -0
  30. package/src/provider.d.ts.map +1 -0
  31. package/src/provider.ts +1171 -0
  32. package/src/routes/compat-helpers.d.ts +18 -0
  33. package/src/routes/compat-helpers.d.ts.map +1 -0
  34. package/src/routes/compat-helpers.ts +274 -0
  35. package/src/routes/family-member-route.d.ts +62 -0
  36. package/src/routes/family-member-route.d.ts.map +1 -0
  37. package/src/routes/family-member-route.ts +353 -0
  38. package/src/routes/index.d.ts +19 -0
  39. package/src/routes/index.d.ts.map +1 -0
  40. package/src/routes/index.ts +60 -0
  41. package/src/routes/live-diarization-route.d.ts +26 -0
  42. package/src/routes/live-diarization-route.d.ts.map +1 -0
  43. package/src/routes/live-diarization-route.test.ts +213 -0
  44. package/src/routes/live-diarization-route.ts +122 -0
  45. package/src/routes/local-inference-asr-route.d.ts +4 -0
  46. package/src/routes/local-inference-asr-route.d.ts.map +1 -0
  47. package/src/routes/local-inference-asr-route.test.ts +190 -0
  48. package/src/routes/local-inference-asr-route.ts +213 -0
  49. package/src/routes/local-inference-compat-routes.d.ts +16 -0
  50. package/src/routes/local-inference-compat-routes.d.ts.map +1 -0
  51. package/src/routes/local-inference-compat-routes.test.ts +423 -0
  52. package/src/routes/local-inference-compat-routes.ts +782 -0
  53. package/src/routes/local-inference-tts-route.d.ts +7 -0
  54. package/src/routes/local-inference-tts-route.d.ts.map +1 -0
  55. package/src/routes/local-inference-tts-route.test.ts +179 -0
  56. package/src/routes/local-inference-tts-route.ts +230 -0
  57. package/src/routes/voice-first-run-routes.d.ts +62 -0
  58. package/src/routes/voice-first-run-routes.d.ts.map +1 -0
  59. package/src/routes/voice-first-run-routes.ts +524 -0
  60. package/src/routes/voice-models-routes.d.ts +62 -0
  61. package/src/routes/voice-models-routes.d.ts.map +1 -0
  62. package/src/routes/voice-models-routes.ts +554 -0
  63. package/src/routes/voice-profile-plugin-routes.d.ts +19 -0
  64. package/src/routes/voice-profile-plugin-routes.d.ts.map +1 -0
  65. package/src/routes/voice-profile-plugin-routes.ts +138 -0
  66. package/src/routes/voice-profiles-management-routes.d.ts +52 -0
  67. package/src/routes/voice-profiles-management-routes.d.ts.map +1 -0
  68. package/src/routes/voice-profiles-management-routes.ts +476 -0
  69. package/src/routes/voice-speaker-profile-routes.d.ts +57 -0
  70. package/src/routes/voice-speaker-profile-routes.d.ts.map +1 -0
  71. package/src/routes/voice-speaker-profile-routes.ts +199 -0
  72. package/src/runtime/aosp-llama-loader-selection.test.ts +80 -0
  73. package/src/runtime/capacitor-llama.d.ts +25 -0
  74. package/src/runtime/embedding-manager-support.d.ts +77 -0
  75. package/src/runtime/embedding-manager-support.d.ts.map +1 -0
  76. package/src/runtime/embedding-manager-support.ts +497 -0
  77. package/src/runtime/embedding-presets.d.ts +16 -0
  78. package/src/runtime/embedding-presets.d.ts.map +1 -0
  79. package/src/runtime/embedding-presets.ts +81 -0
  80. package/src/runtime/embedding-warmup-policy.d.ts +14 -0
  81. package/src/runtime/embedding-warmup-policy.d.ts.map +1 -0
  82. package/src/runtime/embedding-warmup-policy.test.ts +53 -0
  83. package/src/runtime/embedding-warmup-policy.ts +48 -0
  84. package/src/runtime/ensure-local-inference-handler.d.ts +53 -0
  85. package/src/runtime/ensure-local-inference-handler.d.ts.map +1 -0
  86. package/src/runtime/ensure-local-inference-handler.test.ts +528 -0
  87. package/src/runtime/ensure-local-inference-handler.ts +1398 -0
  88. package/src/runtime/index.d.ts +14 -0
  89. package/src/runtime/index.d.ts.map +1 -0
  90. package/src/runtime/index.ts +27 -0
  91. package/src/runtime/mobile-local-inference-gate.d.ts +31 -0
  92. package/src/runtime/mobile-local-inference-gate.d.ts.map +1 -0
  93. package/src/runtime/mobile-local-inference-gate.test.ts +69 -0
  94. package/src/runtime/mobile-local-inference-gate.ts +44 -0
  95. package/src/runtime/voice-entity-binding.d.ts +103 -0
  96. package/src/runtime/voice-entity-binding.d.ts.map +1 -0
  97. package/src/runtime/voice-entity-binding.transcript.test.ts +69 -0
  98. package/src/runtime/voice-entity-binding.ts +328 -0
  99. package/src/services/README.md +71 -0
  100. package/src/services/__tests__/backend-selector.test.ts +101 -0
  101. package/src/services/__tests__/checkpoint-manager.test.ts +376 -0
  102. package/src/services/__tests__/gpu-autotune.test.ts +400 -0
  103. package/src/services/__tests__/llm-streaming-binding.test.ts +85 -0
  104. package/src/services/__tests__/planner-grammar.test.ts +372 -0
  105. package/src/services/__tests__/runtime-target.test.ts +176 -0
  106. package/src/services/active-model-switch-rollback.test.ts +183 -0
  107. package/src/services/active-model.d.ts +282 -0
  108. package/src/services/active-model.d.ts.map +1 -0
  109. package/src/services/active-model.ts +1213 -0
  110. package/src/services/asr/errors.d.ts +21 -0
  111. package/src/services/asr/errors.d.ts.map +1 -0
  112. package/src/services/asr/errors.ts +50 -0
  113. package/src/services/asr/hash.d.ts +28 -0
  114. package/src/services/asr/hash.d.ts.map +1 -0
  115. package/src/services/asr/hash.ts +49 -0
  116. package/src/services/asr/index.d.ts +76 -0
  117. package/src/services/asr/index.d.ts.map +1 -0
  118. package/src/services/asr/index.ts +178 -0
  119. package/src/services/asr/types.d.ts +91 -0
  120. package/src/services/asr/types.d.ts.map +1 -0
  121. package/src/services/asr/types.ts +95 -0
  122. package/src/services/assignments.d.ts +71 -0
  123. package/src/services/assignments.d.ts.map +1 -0
  124. package/src/services/assignments.test.ts +80 -0
  125. package/src/services/assignments.ts +230 -0
  126. package/src/services/backend-selector.ts +95 -0
  127. package/src/services/backend.d.ts +346 -0
  128. package/src/services/backend.d.ts.map +1 -0
  129. package/src/services/backend.ts +612 -0
  130. package/src/services/bundled-models.d.ts +34 -0
  131. package/src/services/bundled-models.d.ts.map +1 -0
  132. package/src/services/bundled-models.ts +129 -0
  133. package/src/services/cache-bridge.d.ts +206 -0
  134. package/src/services/cache-bridge.d.ts.map +1 -0
  135. package/src/services/cache-bridge.test.ts +516 -0
  136. package/src/services/cache-bridge.ts +423 -0
  137. package/src/services/catalog.d.ts +10 -0
  138. package/src/services/catalog.d.ts.map +1 -0
  139. package/src/services/catalog.test.ts +240 -0
  140. package/src/services/catalog.ts +27 -0
  141. package/src/services/checkpoint-client.d.ts +109 -0
  142. package/src/services/checkpoint-client.d.ts.map +1 -0
  143. package/src/services/checkpoint-client.ts +258 -0
  144. package/src/services/checkpoint-manager.ts +474 -0
  145. package/src/services/cloud-fallback.d.ts +102 -0
  146. package/src/services/cloud-fallback.d.ts.map +1 -0
  147. package/src/services/cloud-fallback.ts +230 -0
  148. package/src/services/conversation-registry.d.ts +142 -0
  149. package/src/services/conversation-registry.d.ts.map +1 -0
  150. package/src/services/conversation-registry.test.ts +235 -0
  151. package/src/services/conversation-registry.ts +264 -0
  152. package/src/services/desktop-fused-ffi-backend-runtime.d.ts +92 -0
  153. package/src/services/desktop-fused-ffi-backend-runtime.d.ts.map +1 -0
  154. package/src/services/desktop-fused-ffi-backend-runtime.ts +333 -0
  155. package/src/services/device-bridge.d.ts +188 -0
  156. package/src/services/device-bridge.d.ts.map +1 -0
  157. package/src/services/device-bridge.ts +1237 -0
  158. package/src/services/device-resource-metrics.d.ts +149 -0
  159. package/src/services/device-resource-metrics.d.ts.map +1 -0
  160. package/src/services/device-resource-metrics.test.ts +98 -0
  161. package/src/services/device-resource-metrics.ts +346 -0
  162. package/src/services/device-tier.d.ts +115 -0
  163. package/src/services/device-tier.d.ts.map +1 -0
  164. package/src/services/device-tier.test.ts +371 -0
  165. package/src/services/device-tier.ts +410 -0
  166. package/src/services/downloader.d.ts +82 -0
  167. package/src/services/downloader.d.ts.map +1 -0
  168. package/src/services/downloader.test.ts +724 -0
  169. package/src/services/downloader.ts +899 -0
  170. package/src/services/engine-direct-bundle.test.ts +58 -0
  171. package/src/services/engine-streaming.test.ts +80 -0
  172. package/src/services/engine.d.ts +534 -0
  173. package/src/services/engine.d.ts.map +1 -0
  174. package/src/services/engine.ts +1891 -0
  175. package/src/services/ensure-local-artifacts.integration.test.ts +273 -0
  176. package/src/services/ensure-local-artifacts.test.ts +368 -0
  177. package/src/services/ensure-local-artifacts.ts +351 -0
  178. package/src/services/external-scanner.d.ts +17 -0
  179. package/src/services/external-scanner.d.ts.map +1 -0
  180. package/src/services/external-scanner.ts +312 -0
  181. package/src/services/ffi-llm-mock.ts +354 -0
  182. package/src/services/ffi-llm-streaming-abi.ts +442 -0
  183. package/src/services/ffi-streaming-backend.d.ts +180 -0
  184. package/src/services/ffi-streaming-backend.d.ts.map +1 -0
  185. package/src/services/ffi-streaming-backend.ts +382 -0
  186. package/src/services/ffi-streaming-runner.d.ts +122 -0
  187. package/src/services/ffi-streaming-runner.d.ts.map +1 -0
  188. package/src/services/ffi-streaming-runner.test.ts +60 -0
  189. package/src/services/ffi-streaming-runner.ts +354 -0
  190. package/src/services/ffi-unload-ordering.test.ts +162 -0
  191. package/src/services/gpu-autotune.ts +534 -0
  192. package/src/services/gpu-detect.ts +139 -0
  193. package/src/services/handler-registry.d.ts +72 -0
  194. package/src/services/handler-registry.d.ts.map +1 -0
  195. package/src/services/handler-registry.ts +240 -0
  196. package/src/services/hardware.d.ts +63 -0
  197. package/src/services/hardware.d.ts.map +1 -0
  198. package/src/services/hardware.test.ts +183 -0
  199. package/src/services/hardware.ts +404 -0
  200. package/src/services/hf-search.d.ts +26 -0
  201. package/src/services/hf-search.d.ts.map +1 -0
  202. package/src/services/hf-search.test.ts +69 -0
  203. package/src/services/hf-search.ts +420 -0
  204. package/src/services/image-description-runtime.d.ts +14 -0
  205. package/src/services/image-description-runtime.d.ts.map +1 -0
  206. package/src/services/image-description-runtime.test.ts +61 -0
  207. package/src/services/image-description-runtime.ts +118 -0
  208. package/src/services/imagegen/aosp-unavailable.d.ts +134 -0
  209. package/src/services/imagegen/aosp-unavailable.d.ts.map +1 -0
  210. package/src/services/imagegen/aosp-unavailable.ts +229 -0
  211. package/src/services/imagegen/backend-selector.d.ts +118 -0
  212. package/src/services/imagegen/backend-selector.d.ts.map +1 -0
  213. package/src/services/imagegen/backend-selector.ts +281 -0
  214. package/src/services/imagegen/coreml-unavailable.d.ts +105 -0
  215. package/src/services/imagegen/coreml-unavailable.d.ts.map +1 -0
  216. package/src/services/imagegen/coreml-unavailable.ts +237 -0
  217. package/src/services/imagegen/errors.d.ts +16 -0
  218. package/src/services/imagegen/errors.d.ts.map +1 -0
  219. package/src/services/imagegen/errors.ts +40 -0
  220. package/src/services/imagegen/index.d.ts +58 -0
  221. package/src/services/imagegen/index.d.ts.map +1 -0
  222. package/src/services/imagegen/index.ts +144 -0
  223. package/src/services/imagegen/mflux.d.ts +74 -0
  224. package/src/services/imagegen/mflux.d.ts.map +1 -0
  225. package/src/services/imagegen/mflux.ts +313 -0
  226. package/src/services/imagegen/sd-cpp.d.ts +180 -0
  227. package/src/services/imagegen/sd-cpp.d.ts.map +1 -0
  228. package/src/services/imagegen/sd-cpp.ts +718 -0
  229. package/src/services/imagegen/tensorrt-unavailable.d.ts +83 -0
  230. package/src/services/imagegen/tensorrt-unavailable.d.ts.map +1 -0
  231. package/src/services/imagegen/tensorrt-unavailable.ts +295 -0
  232. package/src/services/imagegen/types.d.ts +181 -0
  233. package/src/services/imagegen/types.d.ts.map +1 -0
  234. package/src/services/imagegen/types.ts +193 -0
  235. package/src/services/index.d.ts +30 -0
  236. package/src/services/index.d.ts.map +1 -0
  237. package/src/services/index.ts +225 -0
  238. package/src/services/inference-capabilities.d.ts +132 -0
  239. package/src/services/inference-capabilities.d.ts.map +1 -0
  240. package/src/services/inference-capabilities.test.ts +75 -0
  241. package/src/services/inference-capabilities.ts +204 -0
  242. package/src/services/inference-telemetry.d.ts +59 -0
  243. package/src/services/inference-telemetry.d.ts.map +1 -0
  244. package/src/services/inference-telemetry.ts +143 -0
  245. package/src/services/ios-llama-streaming.ts +248 -0
  246. package/src/services/kv-spill.d.ts +189 -0
  247. package/src/services/kv-spill.d.ts.map +1 -0
  248. package/src/services/kv-spill.test.ts +222 -0
  249. package/src/services/kv-spill.ts +356 -0
  250. package/src/services/latency-trace.d.ts +346 -0
  251. package/src/services/latency-trace.d.ts.map +1 -0
  252. package/src/services/latency-trace.test.ts +266 -0
  253. package/src/services/latency-trace.ts +844 -0
  254. package/src/services/llama-server-metrics.ts +304 -0
  255. package/src/services/llm-streaming-binding.d.ts +96 -0
  256. package/src/services/llm-streaming-binding.d.ts.map +1 -0
  257. package/src/services/llm-streaming-binding.ts +136 -0
  258. package/src/services/load-args.d.ts +82 -0
  259. package/src/services/load-args.d.ts.map +1 -0
  260. package/src/services/load-args.ts +81 -0
  261. package/src/services/manifest/eliza-1.manifest.v1.json +708 -0
  262. package/src/services/manifest/index.d.ts +4 -0
  263. package/src/services/manifest/index.d.ts.map +1 -0
  264. package/src/services/manifest/index.ts +66 -0
  265. package/src/services/manifest/manifest.test.ts +693 -0
  266. package/src/services/manifest/schema.d.ts +715 -0
  267. package/src/services/manifest/schema.d.ts.map +1 -0
  268. package/src/services/manifest/schema.ts +655 -0
  269. package/src/services/manifest/types.d.ts +30 -0
  270. package/src/services/manifest/types.d.ts.map +1 -0
  271. package/src/services/manifest/types.ts +55 -0
  272. package/src/services/manifest/validator.d.ts +66 -0
  273. package/src/services/manifest/validator.d.ts.map +1 -0
  274. package/src/services/manifest/validator.ts +569 -0
  275. package/src/services/memory-arbiter.d.ts +343 -0
  276. package/src/services/memory-arbiter.d.ts.map +1 -0
  277. package/src/services/memory-arbiter.test.ts +419 -0
  278. package/src/services/memory-arbiter.ts +1000 -0
  279. package/src/services/memory-monitor.d.ts +119 -0
  280. package/src/services/memory-monitor.d.ts.map +1 -0
  281. package/src/services/memory-monitor.test.ts +208 -0
  282. package/src/services/memory-monitor.ts +296 -0
  283. package/src/services/memory-pressure.d.ts +127 -0
  284. package/src/services/memory-pressure.d.ts.map +1 -0
  285. package/src/services/memory-pressure.ts +413 -0
  286. package/src/services/mtp-doctor.d.ts +13 -0
  287. package/src/services/mtp-doctor.d.ts.map +1 -0
  288. package/src/services/mtp-doctor.ts +78 -0
  289. package/src/services/network-policy.d.ts +127 -0
  290. package/src/services/network-policy.d.ts.map +1 -0
  291. package/src/services/network-policy.ts +346 -0
  292. package/src/services/paths.d.ts +6 -0
  293. package/src/services/paths.d.ts.map +1 -0
  294. package/src/services/paths.ts +25 -0
  295. package/src/services/planner-skeleton.d.ts +124 -0
  296. package/src/services/planner-skeleton.d.ts.map +1 -0
  297. package/src/services/planner-skeleton.ts +175 -0
  298. package/src/services/providers.d.ts +38 -0
  299. package/src/services/providers.d.ts.map +1 -0
  300. package/src/services/providers.ts +507 -0
  301. package/src/services/ram-budget-cache.test.ts +163 -0
  302. package/src/services/ram-budget.d.ts +110 -0
  303. package/src/services/ram-budget.d.ts.map +1 -0
  304. package/src/services/ram-budget.ts +0 -0
  305. package/src/services/readiness.d.ts +9 -0
  306. package/src/services/readiness.d.ts.map +1 -0
  307. package/src/services/readiness.test.ts +87 -0
  308. package/src/services/readiness.ts +238 -0
  309. package/src/services/recommendation.d.ts +111 -0
  310. package/src/services/recommendation.d.ts.map +1 -0
  311. package/src/services/recommendation.ts +672 -0
  312. package/src/services/registry.d.ts +35 -0
  313. package/src/services/registry.d.ts.map +1 -0
  314. package/src/services/registry.ts +151 -0
  315. package/src/services/router-handler.d.ts +92 -0
  316. package/src/services/router-handler.d.ts.map +1 -0
  317. package/src/services/router-handler.test.ts +45 -0
  318. package/src/services/router-handler.ts +376 -0
  319. package/src/services/routing-policy.d.ts +55 -0
  320. package/src/services/routing-policy.d.ts.map +1 -0
  321. package/src/services/routing-policy.ts +228 -0
  322. package/src/services/routing-preferences.d.ts +8 -0
  323. package/src/services/routing-preferences.d.ts.map +1 -0
  324. package/src/services/routing-preferences.ts +15 -0
  325. package/src/services/runtime-target.d.ts +98 -0
  326. package/src/services/runtime-target.d.ts.map +1 -0
  327. package/src/services/runtime-target.ts +154 -0
  328. package/src/services/service.d.ts +128 -0
  329. package/src/services/service.d.ts.map +1 -0
  330. package/src/services/service.test.ts +223 -0
  331. package/src/services/service.ts +735 -0
  332. package/src/services/session-pool.d.ts +72 -0
  333. package/src/services/session-pool.d.ts.map +1 -0
  334. package/src/services/session-pool.ts +153 -0
  335. package/src/services/structured-output/deterministic-repair.d.ts +23 -0
  336. package/src/services/structured-output/deterministic-repair.d.ts.map +1 -0
  337. package/src/services/structured-output/deterministic-repair.test.ts +169 -0
  338. package/src/services/structured-output/deterministic-repair.ts +443 -0
  339. package/src/services/structured-output/index.ts +4 -0
  340. package/src/services/structured-output.d.ts +311 -0
  341. package/src/services/structured-output.d.ts.map +1 -0
  342. package/src/services/structured-output.test.ts +483 -0
  343. package/src/services/structured-output.ts +712 -0
  344. package/src/services/transcription-priority.test.ts +211 -0
  345. package/src/services/tts/errors.ts +46 -0
  346. package/src/services/tts/index.ts +214 -0
  347. package/src/services/tts/tts-audio-cache.ts +235 -0
  348. package/src/services/tts/types.ts +157 -0
  349. package/src/services/types.d.ts +19 -0
  350. package/src/services/types.d.ts.map +1 -0
  351. package/src/services/types.ts +55 -0
  352. package/src/services/verify-on-device.d.ts +34 -0
  353. package/src/services/verify-on-device.d.ts.map +1 -0
  354. package/src/services/verify-on-device.test.ts +87 -0
  355. package/src/services/verify-on-device.ts +127 -0
  356. package/src/services/verify.d.ts +8 -0
  357. package/src/services/verify.d.ts.map +1 -0
  358. package/src/services/verify.ts +13 -0
  359. package/src/services/vision/aosp-unavailable.d.ts +115 -0
  360. package/src/services/vision/aosp-unavailable.d.ts.map +1 -0
  361. package/src/services/vision/aosp-unavailable.ts +163 -0
  362. package/src/services/vision/capacitor-llama.d.ts +99 -0
  363. package/src/services/vision/capacitor-llama.d.ts.map +1 -0
  364. package/src/services/vision/capacitor-llama.ts +255 -0
  365. package/src/services/vision/cloud-fallback.d.ts +47 -0
  366. package/src/services/vision/cloud-fallback.d.ts.map +1 -0
  367. package/src/services/vision/cloud-fallback.test.ts +243 -0
  368. package/src/services/vision/cloud-fallback.ts +268 -0
  369. package/src/services/vision/fallback-chain.test.ts +86 -0
  370. package/src/services/vision/hash.d.ts +71 -0
  371. package/src/services/vision/hash.d.ts.map +1 -0
  372. package/src/services/vision/hash.ts +157 -0
  373. package/src/services/vision/index.d.ts +95 -0
  374. package/src/services/vision/index.d.ts.map +1 -0
  375. package/src/services/vision/index.ts +251 -0
  376. package/src/services/vision/llama-server.d.ts +73 -0
  377. package/src/services/vision/llama-server.d.ts.map +1 -0
  378. package/src/services/vision/llama-server.ts +177 -0
  379. package/src/services/vision/types.d.ts +153 -0
  380. package/src/services/vision/types.d.ts.map +1 -0
  381. package/src/services/vision/types.ts +154 -0
  382. package/src/services/vision/vast-fallback.d.ts +18 -0
  383. package/src/services/vision/vast-fallback.d.ts.map +1 -0
  384. package/src/services/vision/vast-fallback.ts +127 -0
  385. package/src/services/vision-embedding-cache.d.ts +98 -0
  386. package/src/services/vision-embedding-cache.d.ts.map +1 -0
  387. package/src/services/vision-embedding-cache.ts +189 -0
  388. package/src/services/voice/VOICE_WORKBENCH.md +88 -0
  389. package/src/services/voice/__test-helpers__/fake-ffi.ts +92 -0
  390. package/src/services/voice/__test-helpers__/synthetic-speech.ts +124 -0
  391. package/src/services/voice/__tests__/checkpoint-manager.test.ts +241 -0
  392. package/src/services/voice/__tests__/checkpoint-policy.test.ts +270 -0
  393. package/src/services/voice/__tests__/eager-context-builder.test.ts +257 -0
  394. package/src/services/voice/__tests__/eliza1-eot-scorer.test.ts +288 -0
  395. package/src/services/voice/__tests__/eot-classifier.test.ts +431 -0
  396. package/src/services/voice/__tests__/optimistic-rollback.test.ts +312 -0
  397. package/src/services/voice/__tests__/prefill-client.test.ts +266 -0
  398. package/src/services/voice/__tests__/prefix-preserving-queue.test.ts +208 -0
  399. package/src/services/voice/__tests__/streaming-asr.test.ts +450 -0
  400. package/src/services/voice/__tests__/streaming-transcriber.test.ts +339 -0
  401. package/src/services/voice/__tests__/turn-detector-resolver.test.ts +197 -0
  402. package/src/services/voice/__tests__/voice-state-machine-prefill.test.ts +275 -0
  403. package/src/services/voice/__tests__/voice-state-machine.test.ts +354 -0
  404. package/src/services/voice/audio-frame-consumer.d.ts +212 -0
  405. package/src/services/voice/audio-frame-consumer.d.ts.map +1 -0
  406. package/src/services/voice/audio-frame-consumer.test.ts +343 -0
  407. package/src/services/voice/audio-frame-consumer.ts +491 -0
  408. package/src/services/voice/barge-in.d.ts +112 -0
  409. package/src/services/voice/barge-in.d.ts.map +1 -0
  410. package/src/services/voice/barge-in.test.ts +244 -0
  411. package/src/services/voice/barge-in.ts +336 -0
  412. package/src/services/voice/cancellation-coordinator.d.ts +127 -0
  413. package/src/services/voice/cancellation-coordinator.d.ts.map +1 -0
  414. package/src/services/voice/cancellation-coordinator.test.ts +196 -0
  415. package/src/services/voice/cancellation-coordinator.ts +269 -0
  416. package/src/services/voice/checkpoint-manager.d.ts +199 -0
  417. package/src/services/voice/checkpoint-manager.d.ts.map +1 -0
  418. package/src/services/voice/checkpoint-manager.ts +401 -0
  419. package/src/services/voice/checkpoint-policy.ts +336 -0
  420. package/src/services/voice/composite-eot-classifier.test.ts +59 -0
  421. package/src/services/voice/e2e-harness.test.ts +182 -0
  422. package/src/services/voice/e2e-harness.ts +743 -0
  423. package/src/services/voice/eager-context-builder.d.ts +170 -0
  424. package/src/services/voice/eager-context-builder.d.ts.map +1 -0
  425. package/src/services/voice/eager-context-builder.ts +262 -0
  426. package/src/services/voice/eliza1-eot-scorer.d.ts +124 -0
  427. package/src/services/voice/eliza1-eot-scorer.d.ts.map +1 -0
  428. package/src/services/voice/eliza1-eot-scorer.ts +242 -0
  429. package/src/services/voice/embedding-server.ts +200 -0
  430. package/src/services/voice/embedding.d.ts +133 -0
  431. package/src/services/voice/embedding.d.ts.map +1 -0
  432. package/src/services/voice/embedding.test.ts +148 -0
  433. package/src/services/voice/embedding.ts +244 -0
  434. package/src/services/voice/emotion-attribution.d.ts +68 -0
  435. package/src/services/voice/emotion-attribution.d.ts.map +1 -0
  436. package/src/services/voice/emotion-attribution.test.ts +129 -0
  437. package/src/services/voice/emotion-attribution.ts +361 -0
  438. package/src/services/voice/engine-bridge-cancellation.test.ts +422 -0
  439. package/src/services/voice/engine-bridge.d.ts +746 -0
  440. package/src/services/voice/engine-bridge.d.ts.map +1 -0
  441. package/src/services/voice/engine-bridge.test.ts +384 -0
  442. package/src/services/voice/engine-bridge.ts +2226 -0
  443. package/src/services/voice/eot-classifier-ggml.d.ts +179 -0
  444. package/src/services/voice/eot-classifier-ggml.d.ts.map +1 -0
  445. package/src/services/voice/eot-classifier-ggml.ts +566 -0
  446. package/src/services/voice/eot-classifier.d.ts +214 -0
  447. package/src/services/voice/eot-classifier.d.ts.map +1 -0
  448. package/src/services/voice/eot-classifier.ts +533 -0
  449. package/src/services/voice/errors.d.ts +20 -0
  450. package/src/services/voice/errors.d.ts.map +1 -0
  451. package/src/services/voice/errors.ts +32 -0
  452. package/src/services/voice/expressive-tags.d.ts +158 -0
  453. package/src/services/voice/expressive-tags.d.ts.map +1 -0
  454. package/src/services/voice/expressive-tags.ts +405 -0
  455. package/src/services/voice/ffi-bindings.d.ts +636 -0
  456. package/src/services/voice/ffi-bindings.d.ts.map +1 -0
  457. package/src/services/voice/ffi-bindings.test.ts +671 -0
  458. package/src/services/voice/ffi-bindings.ts +3050 -0
  459. package/src/services/voice/first-line-cache.d.ts +181 -0
  460. package/src/services/voice/first-line-cache.d.ts.map +1 -0
  461. package/src/services/voice/first-line-cache.ts +725 -0
  462. package/src/services/voice/fused-eot-scorer.d.ts +51 -0
  463. package/src/services/voice/fused-eot-scorer.d.ts.map +1 -0
  464. package/src/services/voice/fused-eot-scorer.ts +135 -0
  465. package/src/services/voice/index.d.ts +91 -0
  466. package/src/services/voice/index.d.ts.map +1 -0
  467. package/src/services/voice/index.ts +481 -0
  468. package/src/services/voice/kokoro/__tests__/kokoro-backend.test.ts +151 -0
  469. package/src/services/voice/kokoro/__tests__/kokoro-engine-bridge.real.test.ts +151 -0
  470. package/src/services/voice/kokoro/__tests__/kokoro-engine-bridge.test.ts +60 -0
  471. package/src/services/voice/kokoro/__tests__/kokoro-engine-discovery.test.ts +277 -0
  472. package/src/services/voice/kokoro/__tests__/kokoro-ffi-runtime.test.ts +235 -0
  473. package/src/services/voice/kokoro/__tests__/kokoro-runtime.test.ts +95 -0
  474. package/src/services/voice/kokoro/__tests__/phonemizer.test.ts +53 -0
  475. package/src/services/voice/kokoro/__tests__/runtime-selection.test.ts +231 -0
  476. package/src/services/voice/kokoro/__tests__/voices.test.ts +57 -0
  477. package/src/services/voice/kokoro/index.ts +79 -0
  478. package/src/services/voice/kokoro/kokoro-backend.d.ts +72 -0
  479. package/src/services/voice/kokoro/kokoro-backend.d.ts.map +1 -0
  480. package/src/services/voice/kokoro/kokoro-backend.ts +207 -0
  481. package/src/services/voice/kokoro/kokoro-engine-discovery.d.ts +58 -0
  482. package/src/services/voice/kokoro/kokoro-engine-discovery.d.ts.map +1 -0
  483. package/src/services/voice/kokoro/kokoro-engine-discovery.ts +177 -0
  484. package/src/services/voice/kokoro/kokoro-ffi-runtime.d.ts +75 -0
  485. package/src/services/voice/kokoro/kokoro-ffi-runtime.d.ts.map +1 -0
  486. package/src/services/voice/kokoro/kokoro-ffi-runtime.ts +233 -0
  487. package/src/services/voice/kokoro/kokoro-runtime.d.ts +100 -0
  488. package/src/services/voice/kokoro/kokoro-runtime.d.ts.map +1 -0
  489. package/src/services/voice/kokoro/kokoro-runtime.ts +170 -0
  490. package/src/services/voice/kokoro/phoneme-stream.ts +123 -0
  491. package/src/services/voice/kokoro/phonemizer.d.ts +50 -0
  492. package/src/services/voice/kokoro/phonemizer.d.ts.map +1 -0
  493. package/src/services/voice/kokoro/phonemizer.ts +344 -0
  494. package/src/services/voice/kokoro/pick-runtime.d.ts +61 -0
  495. package/src/services/voice/kokoro/pick-runtime.d.ts.map +1 -0
  496. package/src/services/voice/kokoro/pick-runtime.test.ts +91 -0
  497. package/src/services/voice/kokoro/pick-runtime.ts +130 -0
  498. package/src/services/voice/kokoro/runtime-selection.d.ts +92 -0
  499. package/src/services/voice/kokoro/runtime-selection.d.ts.map +1 -0
  500. package/src/services/voice/kokoro/runtime-selection.ts +237 -0
  501. package/src/services/voice/kokoro/types.d.ts +82 -0
  502. package/src/services/voice/kokoro/types.d.ts.map +1 -0
  503. package/src/services/voice/kokoro/types.ts +95 -0
  504. package/src/services/voice/kokoro/voice-presets.d.ts +23 -0
  505. package/src/services/voice/kokoro/voice-presets.d.ts.map +1 -0
  506. package/src/services/voice/kokoro/voice-presets.ts +129 -0
  507. package/src/services/voice/kokoro/voices.d.ts +30 -0
  508. package/src/services/voice/kokoro/voices.d.ts.map +1 -0
  509. package/src/services/voice/kokoro/voices.ts +64 -0
  510. package/src/services/voice/lifecycle.d.ts +135 -0
  511. package/src/services/voice/lifecycle.d.ts.map +1 -0
  512. package/src/services/voice/lifecycle.test.ts +315 -0
  513. package/src/services/voice/lifecycle.ts +301 -0
  514. package/src/services/voice/live-diarization-session.d.ts +96 -0
  515. package/src/services/voice/live-diarization-session.d.ts.map +1 -0
  516. package/src/services/voice/live-diarization-session.ts +289 -0
  517. package/src/services/voice/mic-source.d.ts +136 -0
  518. package/src/services/voice/mic-source.d.ts.map +1 -0
  519. package/src/services/voice/mic-source.test.ts +210 -0
  520. package/src/services/voice/mic-source.ts +503 -0
  521. package/src/services/voice/optimistic-policy.d.ts +109 -0
  522. package/src/services/voice/optimistic-policy.d.ts.map +1 -0
  523. package/src/services/voice/optimistic-policy.test.ts +101 -0
  524. package/src/services/voice/optimistic-policy.ts +192 -0
  525. package/src/services/voice/optimistic-rollback.ts +343 -0
  526. package/src/services/voice/partial-stabilizer.d.ts +73 -0
  527. package/src/services/voice/partial-stabilizer.d.ts.map +1 -0
  528. package/src/services/voice/partial-stabilizer.test.ts +68 -0
  529. package/src/services/voice/partial-stabilizer.ts +140 -0
  530. package/src/services/voice/phoneme-tokenizer.d.ts +49 -0
  531. package/src/services/voice/phoneme-tokenizer.d.ts.map +1 -0
  532. package/src/services/voice/phoneme-tokenizer.ts +158 -0
  533. package/src/services/voice/phrase-cache.d.ts +76 -0
  534. package/src/services/voice/phrase-cache.d.ts.map +1 -0
  535. package/src/services/voice/phrase-cache.test.ts +242 -0
  536. package/src/services/voice/phrase-cache.ts +186 -0
  537. package/src/services/voice/phrase-chunker.d.ts +62 -0
  538. package/src/services/voice/phrase-chunker.d.ts.map +1 -0
  539. package/src/services/voice/phrase-chunker.test.ts +239 -0
  540. package/src/services/voice/phrase-chunker.ts +281 -0
  541. package/src/services/voice/pipeline-impls.d.ts +151 -0
  542. package/src/services/voice/pipeline-impls.d.ts.map +1 -0
  543. package/src/services/voice/pipeline-impls.l6.test.ts +110 -0
  544. package/src/services/voice/pipeline-impls.test.ts +292 -0
  545. package/src/services/voice/pipeline-impls.ts +315 -0
  546. package/src/services/voice/pipeline.d.ts +216 -0
  547. package/src/services/voice/pipeline.d.ts.map +1 -0
  548. package/src/services/voice/pipeline.ts +505 -0
  549. package/src/services/voice/prefill-client.d.ts +123 -0
  550. package/src/services/voice/prefill-client.d.ts.map +1 -0
  551. package/src/services/voice/prefill-client.ts +316 -0
  552. package/src/services/voice/prefix-preserving-queue.d.ts +113 -0
  553. package/src/services/voice/prefix-preserving-queue.d.ts.map +1 -0
  554. package/src/services/voice/prefix-preserving-queue.ts +162 -0
  555. package/src/services/voice/profile-store.d.ts +248 -0
  556. package/src/services/voice/profile-store.d.ts.map +1 -0
  557. package/src/services/voice/profile-store.ts +887 -0
  558. package/src/services/voice/ring-buffer.d.ts +40 -0
  559. package/src/services/voice/ring-buffer.d.ts.map +1 -0
  560. package/src/services/voice/ring-buffer.ts +105 -0
  561. package/src/services/voice/rollback-queue.d.ts +24 -0
  562. package/src/services/voice/rollback-queue.d.ts.map +1 -0
  563. package/src/services/voice/rollback-queue.ts +74 -0
  564. package/src/services/voice/samantha-preset-placeholder.d.ts +67 -0
  565. package/src/services/voice/samantha-preset-placeholder.d.ts.map +1 -0
  566. package/src/services/voice/samantha-preset-placeholder.test.ts +97 -0
  567. package/src/services/voice/samantha-preset-placeholder.ts +148 -0
  568. package/src/services/voice/samantha-preset-regenerator.d.ts +87 -0
  569. package/src/services/voice/samantha-preset-regenerator.d.ts.map +1 -0
  570. package/src/services/voice/samantha-preset-regenerator.ts +393 -0
  571. package/src/services/voice/scheduler.d.ts +146 -0
  572. package/src/services/voice/scheduler.d.ts.map +1 -0
  573. package/src/services/voice/scheduler.t2.test.ts +141 -0
  574. package/src/services/voice/scheduler.ts +927 -0
  575. package/src/services/voice/shared-resources.d.ts +190 -0
  576. package/src/services/voice/shared-resources.d.ts.map +1 -0
  577. package/src/services/voice/shared-resources.ts +320 -0
  578. package/src/services/voice/speaker/attribution-pipeline.d.ts +74 -0
  579. package/src/services/voice/speaker/attribution-pipeline.d.ts.map +1 -0
  580. package/src/services/voice/speaker/attribution-pipeline.ts +386 -0
  581. package/src/services/voice/speaker/diarizer-fused.d.ts +59 -0
  582. package/src/services/voice/speaker/diarizer-fused.d.ts.map +1 -0
  583. package/src/services/voice/speaker/diarizer-fused.real.test.ts +100 -0
  584. package/src/services/voice/speaker/diarizer-fused.ts +154 -0
  585. package/src/services/voice/speaker/diarizer.d.ts +75 -0
  586. package/src/services/voice/speaker/diarizer.d.ts.map +1 -0
  587. package/src/services/voice/speaker/diarizer.ts +218 -0
  588. package/src/services/voice/speaker/encoder-fused.d.ts +60 -0
  589. package/src/services/voice/speaker/encoder-fused.d.ts.map +1 -0
  590. package/src/services/voice/speaker/encoder-fused.real.test.ts +113 -0
  591. package/src/services/voice/speaker/encoder-fused.ts +138 -0
  592. package/src/services/voice/speaker/encoder-ggml.d.ts +33 -0
  593. package/src/services/voice/speaker/encoder-ggml.d.ts.map +1 -0
  594. package/src/services/voice/speaker/encoder-ggml.ts +79 -0
  595. package/src/services/voice/speaker/encoder.d.ts +37 -0
  596. package/src/services/voice/speaker/encoder.d.ts.map +1 -0
  597. package/src/services/voice/speaker/encoder.ts +105 -0
  598. package/src/services/voice/speaker-imprint.d.ts +83 -0
  599. package/src/services/voice/speaker-imprint.d.ts.map +1 -0
  600. package/src/services/voice/speaker-imprint.test.ts +185 -0
  601. package/src/services/voice/speaker-imprint.ts +312 -0
  602. package/src/services/voice/speaker-preset-cache.d.ts +77 -0
  603. package/src/services/voice/speaker-preset-cache.d.ts.map +1 -0
  604. package/src/services/voice/speaker-preset-cache.test.ts +154 -0
  605. package/src/services/voice/speaker-preset-cache.ts +195 -0
  606. package/src/services/voice/streaming-asr/streaming-pipeline-adapter.ts +292 -0
  607. package/src/services/voice/system-audio-sink.d.ts +73 -0
  608. package/src/services/voice/system-audio-sink.d.ts.map +1 -0
  609. package/src/services/voice/system-audio-sink.test.ts +29 -0
  610. package/src/services/voice/system-audio-sink.ts +366 -0
  611. package/src/services/voice/transcriber.d.ts +244 -0
  612. package/src/services/voice/transcriber.d.ts.map +1 -0
  613. package/src/services/voice/transcriber.test.ts +392 -0
  614. package/src/services/voice/transcriber.ts +704 -0
  615. package/src/services/voice/turn-controller.d.ts +183 -0
  616. package/src/services/voice/turn-controller.d.ts.map +1 -0
  617. package/src/services/voice/turn-controller.test.ts +575 -0
  618. package/src/services/voice/turn-controller.ts +596 -0
  619. package/src/services/voice/types.d.ts +643 -0
  620. package/src/services/voice/types.d.ts.map +1 -0
  621. package/src/services/voice/types.ts +699 -0
  622. package/src/services/voice/vad.d.ts +282 -0
  623. package/src/services/voice/vad.d.ts.map +1 -0
  624. package/src/services/voice/vad.test.ts +480 -0
  625. package/src/services/voice/vad.ts +827 -0
  626. package/src/services/voice/vad.v1-v4.test.ts +222 -0
  627. package/src/services/voice/voice-budget.d.ts +241 -0
  628. package/src/services/voice/voice-budget.d.ts.map +1 -0
  629. package/src/services/voice/voice-budget.test.ts +420 -0
  630. package/src/services/voice/voice-budget.ts +656 -0
  631. package/src/services/voice/voice-duet.test.ts +375 -0
  632. package/src/services/voice/voice-emotion-classifier.d.ts +95 -0
  633. package/src/services/voice/voice-emotion-classifier.d.ts.map +1 -0
  634. package/src/services/voice/voice-emotion-classifier.test.ts +210 -0
  635. package/src/services/voice/voice-emotion-classifier.ts +273 -0
  636. package/src/services/voice/voice-preset-format.d.ts +158 -0
  637. package/src/services/voice/voice-preset-format.d.ts.map +1 -0
  638. package/src/services/voice/voice-preset-format.ts +700 -0
  639. package/src/services/voice/voice-preset-generator.test.ts +89 -0
  640. package/src/services/voice/voice-profile-artifact.d.ts +116 -0
  641. package/src/services/voice/voice-profile-artifact.d.ts.map +1 -0
  642. package/src/services/voice/voice-profile-artifact.test.ts +138 -0
  643. package/src/services/voice/voice-profile-artifact.ts +518 -0
  644. package/src/services/voice/voice-profile-routes.d.ts +83 -0
  645. package/src/services/voice/voice-profile-routes.d.ts.map +1 -0
  646. package/src/services/voice/voice-profile-routes.test.ts +429 -0
  647. package/src/services/voice/voice-profile-routes.ts +425 -0
  648. package/src/services/voice/voice-scenario.ts +154 -0
  649. package/src/services/voice/voice-settings.d.ts +82 -0
  650. package/src/services/voice/voice-settings.d.ts.map +1 -0
  651. package/src/services/voice/voice-settings.ts +172 -0
  652. package/src/services/voice/voice-state-machine.d.ts +364 -0
  653. package/src/services/voice/voice-state-machine.d.ts.map +1 -0
  654. package/src/services/voice/voice-state-machine.ts +727 -0
  655. package/src/services/voice/voice-workbench-report.test.ts +168 -0
  656. package/src/services/voice/voice-workbench-report.ts +326 -0
  657. package/src/services/voice/voice-workbench.test.ts +158 -0
  658. package/src/services/voice/voice.test.ts +1070 -0
  659. package/src/services/voice/wake-word-ggml.d.ts +101 -0
  660. package/src/services/voice/wake-word-ggml.d.ts.map +1 -0
  661. package/src/services/voice/wake-word-ggml.ts +320 -0
  662. package/src/services/voice/wake-word.d.ts +255 -0
  663. package/src/services/voice/wake-word.d.ts.map +1 -0
  664. package/src/services/voice/wake-word.test.ts +298 -0
  665. package/src/services/voice/wake-word.ts +554 -0
  666. package/src/services/voice/wrap-with-first-line-cache.d.ts +70 -0
  667. package/src/services/voice/wrap-with-first-line-cache.d.ts.map +1 -0
  668. package/src/services/voice/wrap-with-first-line-cache.ts +267 -0
  669. package/src/services/voice-model-updater.d.ts +240 -0
  670. package/src/services/voice-model-updater.d.ts.map +1 -0
  671. package/src/services/voice-model-updater.ts +724 -0
  672. package/src/services/voice-prewarm.d.ts +3 -0
  673. package/src/services/voice-prewarm.d.ts.map +1 -0
  674. package/src/services/voice-prewarm.ts +51 -0
  675. package/dist/index.d.ts +0 -37
  676. package/dist/index.js +0 -1098
@@ -0,0 +1,328 @@
1
+ /**
2
+ * Voice ⇄ entity binding seam (producer + round-trip consumer).
3
+ *
4
+ * Producer (`emitVoiceTurnObserved`): emit `VOICE_TURN_OBSERVED` so a
5
+ * merge-engine owner (plugin-lifeops) can fold the recognized voice turn
6
+ * into the entity/relationship graph. The voice-profile store is owned
7
+ * here; the entity graph is owned there; the only shared surface is the
8
+ * core event seam — neither plugin imports the other.
9
+ *
10
+ * Consumer (`handleVoiceEntityBound`): when the merge engine reports a
11
+ * binding via `VOICE_ENTITY_BOUND`, persist the resulting `entityId` onto
12
+ * every profile in that imprint cluster (`VoiceProfileStore.bindEntity`).
13
+ * This is the runtime path that was missing in issue #8234 — without it a
14
+ * profile's `entityId` stayed `null` and recognized speakers never reached
15
+ * the relationship graph.
16
+ */
17
+
18
+ import crypto from "node:crypto";
19
+ import path from "node:path";
20
+ import {
21
+ EventType,
22
+ type IAgentRuntime,
23
+ logger,
24
+ resolveStateDir,
25
+ type VoiceEntityBoundPayload,
26
+ } from "@elizaos/core";
27
+ import type {
28
+ VoiceNextSpeaker,
29
+ VoiceTurnSignal,
30
+ } from "../services/voice/eot-classifier.js";
31
+ import { VoiceProfileStore } from "../services/voice/profile-store.js";
32
+ import type { VoiceAttributionOutput } from "../services/voice/speaker/attribution-pipeline.js";
33
+
34
+ // ---------------------------------------------------------------------------
35
+ // Store wiring (injectable for tests, mirrors the route handlers)
36
+ // ---------------------------------------------------------------------------
37
+
38
+ let storeOverride: VoiceProfileStore | null = null;
39
+
40
+ export function setVoiceEntityBindingStore(
41
+ store: VoiceProfileStore | null,
42
+ ): void {
43
+ storeOverride = store;
44
+ }
45
+
46
+ export async function getVoiceProfileStore(): Promise<VoiceProfileStore> {
47
+ if (storeOverride) return storeOverride;
48
+ const store = new VoiceProfileStore({
49
+ rootDir: path.join(resolveStateDir(), "voice-profiles"),
50
+ });
51
+ await store.init();
52
+ return store;
53
+ }
54
+
55
+ // ---------------------------------------------------------------------------
56
+ // Producer
57
+ // ---------------------------------------------------------------------------
58
+
59
+ export interface EmitVoiceTurnObservedArgs {
60
+ /** Stable utterance id; a random one is minted when omitted. */
61
+ turnId?: string;
62
+ /** Recognized text (drives name/partner-claim extraction downstream). */
63
+ text: string;
64
+ /** Imprint cluster id from the voice-profile store. */
65
+ imprintClusterId: string;
66
+ /** Confidence of the imprint match (0..1). */
67
+ matchConfidence: number;
68
+ /** Entity the imprint already resolved to, or `null`/omitted when unbound. */
69
+ matchedEntityId?: string | null;
70
+ /** True when the OWNER spoke this turn. */
71
+ isOwner?: boolean;
72
+ /** ISO timestamp; defaults to now. */
73
+ observedAt?: string;
74
+ }
75
+
76
+ /**
77
+ * Emit `VOICE_TURN_OBSERVED`. No-op in effect when no merge-engine plugin
78
+ * is loaded (the event simply has no handler). `emitEvent` awaits every
79
+ * handler, so by the time this resolves the binding round-trip (including
80
+ * `VOICE_ENTITY_BOUND` → profile persist) has completed.
81
+ */
82
+ export async function emitVoiceTurnObserved(
83
+ runtime: IAgentRuntime,
84
+ args: EmitVoiceTurnObservedArgs,
85
+ ): Promise<void> {
86
+ await runtime.emitEvent(EventType.VOICE_TURN_OBSERVED, {
87
+ runtime,
88
+ turnId: args.turnId ?? `vturn_${crypto.randomUUID()}`,
89
+ text: args.text,
90
+ imprintClusterId: args.imprintClusterId,
91
+ matchConfidence: args.matchConfidence,
92
+ matchedEntityId: args.matchedEntityId ?? null,
93
+ observedAt: args.observedAt ?? new Date().toISOString(),
94
+ ...(args.isOwner !== undefined ? { isOwner: args.isOwner } : {}),
95
+ });
96
+ }
97
+
98
+ // ---------------------------------------------------------------------------
99
+ // Live-turn attribution → VOICE_TURN_OBSERVED + voiceTurnSignal (gating)
100
+ // ---------------------------------------------------------------------------
101
+
102
+ /** Server SUPPRESS threshold for EOT — below this reads as "user still talking". */
103
+ const SERVER_EOT_SUPPRESS_THRESHOLD = 0.4;
104
+ /** Only a CONFIDENT bystander attribution is allowed to silence a turn. */
105
+ const BYSTANDER_SUPPRESS_CONFIDENCE = 0.7;
106
+
107
+ export interface HandleLiveVoiceAttributionOptions {
108
+ /**
109
+ * Entity id the agent treats as the device owner / primary enrolled
110
+ * speaker. A turn attributed to this entity is always allowed to speak.
111
+ */
112
+ ownerEntityId?: string | null;
113
+ /**
114
+ * Entity ids the agent answers to without a wake word (owner + enrolled
115
+ * household members). A confident bystander is anyone attributed to an
116
+ * entity NOT in this set.
117
+ */
118
+ knownSpeakerEntityIds?: readonly string[];
119
+ /**
120
+ * The EOT-based turn signal the turn-controller already computed for this
121
+ * turn (from `eot-classifier` / `turn-controller`). The speaker decision is
122
+ * folded into it. When omitted, a neutral base is synthesized from
123
+ * `endOfTurnProbability` (default 0.5 — "unknown", fail open).
124
+ */
125
+ baseSignal?: VoiceTurnSignal;
126
+ /** P(turn complete) when no `baseSignal` is supplied (default 0.5). */
127
+ endOfTurnProbability?: number;
128
+ /** True when a wake word fired within the recent listen window. */
129
+ wakeWordActive?: boolean;
130
+ /**
131
+ * The ASR transcript for this turn, joined from the streaming-ASR path. When
132
+ * provided it rides on `VOICE_TURN_OBSERVED` (and the turn signal) so the
133
+ * merge engine's name/partner extraction (`VoiceObserver.ingestTurn`) runs
134
+ * from LIVE audio — previously this was hardcoded `""`, so live recognition
135
+ * could identify *who* spoke but never *what* they said (#8786). Diarization-
136
+ * only callers (audio-frame path) leave it unset; the in-process voice engine
137
+ * (which has both ASR + diarization) passes the real transcript.
138
+ */
139
+ transcript?: string;
140
+ }
141
+
142
+ /**
143
+ * Resolve owner / enrolled state for the attributed primary speaker.
144
+ *
145
+ * `isOwner` is `entityId === ownerEntityId`; "enrolled" is owner OR an entity
146
+ * id present in `knownSpeakerEntityIds`. An unbound speaker (`entityId == null`)
147
+ * is neither — it can never be a "confident bystander" (fail open).
148
+ */
149
+ function resolveSpeakerStanding(
150
+ output: VoiceAttributionOutput,
151
+ opts: HandleLiveVoiceAttributionOptions,
152
+ ): {
153
+ entityId: string | null;
154
+ confidence: number;
155
+ isOwner: boolean;
156
+ enrolled: boolean;
157
+ } {
158
+ const speaker = output.primarySpeaker;
159
+ const entityId = speaker?.entityId ?? output.observation?.entityId ?? null;
160
+ const confidence = speaker?.confidence ?? output.observation?.confidence ?? 0;
161
+ const ownerEntityId = opts.ownerEntityId ?? null;
162
+ const isOwner = entityId !== null && entityId === ownerEntityId;
163
+ const known = new Set<string>(opts.knownSpeakerEntityIds ?? []);
164
+ const enrolled = isOwner || (entityId !== null && known.has(entityId));
165
+ return { entityId, confidence, isOwner, enrolled };
166
+ }
167
+
168
+ /**
169
+ * Compose the EOT base signal with the live speaker decision.
170
+ *
171
+ * Mirrors `packages/ui/src/voice/voice-turn-signal.ts buildVoiceTurnSignal`
172
+ * (the transcript-only producer) on the audio-frame side: a CONFIDENT bystander
173
+ * who did NOT say the wake word is cross-talk → suppress. A wake word is an
174
+ * explicit address → always speak. Uncertain attribution never silences a real
175
+ * turn. The server gate `core.voice_turn_signal` reads the returned object.
176
+ */
177
+ function foldSpeakerIntoSignal(
178
+ base: VoiceTurnSignal,
179
+ standing: {
180
+ entityId: string | null;
181
+ confidence: number;
182
+ isOwner: boolean;
183
+ enrolled: boolean;
184
+ },
185
+ opts: HandleLiveVoiceAttributionOptions,
186
+ ): VoiceTurnSignal {
187
+ let agentShouldSpeak = base.agentShouldSpeak !== false;
188
+
189
+ const confidentBystander =
190
+ !standing.enrolled &&
191
+ standing.entityId !== null &&
192
+ standing.confidence >= BYSTANDER_SUPPRESS_CONFIDENCE;
193
+ if (agentShouldSpeak && opts.wakeWordActive !== true && confidentBystander) {
194
+ agentShouldSpeak = false;
195
+ }
196
+
197
+ // Wake word overrides bystander doubt — the user deliberately summoned us.
198
+ if (opts.wakeWordActive === true) agentShouldSpeak = true;
199
+
200
+ const eot = base.endOfTurnProbability;
201
+ const nextSpeaker: VoiceNextSpeaker = !agentShouldSpeak
202
+ ? "user"
203
+ : eot < SERVER_EOT_SUPPRESS_THRESHOLD
204
+ ? "user"
205
+ : "agent";
206
+
207
+ const source = opts.wakeWordActive
208
+ ? "voice-bridge+wakeword"
209
+ : "voice-bridge+diarization";
210
+
211
+ return {
212
+ endOfTurnProbability: eot,
213
+ nextSpeaker,
214
+ agentShouldSpeak,
215
+ source: "custom",
216
+ transcript: base.transcript,
217
+ ...(base.model ? { model: base.model } : {}),
218
+ ...(base.latencyMs !== undefined ? { latencyMs: base.latencyMs } : {}),
219
+ // Stash the human-readable provenance so traces show the fold source even
220
+ // though the typed `source` enum stays "custom".
221
+ metadata: { provenance: source },
222
+ } as VoiceTurnSignal & { metadata: { provenance: string } };
223
+ }
224
+
225
+ /**
226
+ * Handle a live per-turn attribution result. This is the single automatic seam
227
+ * the engine bridge calls from its `onAttribution` path: any caller that wires a
228
+ * `profileStore` gets diarization-driven gating for free.
229
+ *
230
+ * 1. Emits `VOICE_TURN_OBSERVED` when the turn produced a profile observation
231
+ * (so the merge engine can fold the recognized speaker into the entity
232
+ * graph and round-trip the binding back onto the profile).
233
+ * 2. Composes the EOT-based turn signal with the speaker decision and stamps it
234
+ * onto `output.turn.metadata.voiceTurnSignal`, which the chat-view producer
235
+ * forwards to the server gate verbatim.
236
+ *
237
+ * Returns the composed signal (also written onto the turn metadata in place).
238
+ * Never throws on the emit path — observation emission is best-effort and is
239
+ * logged, never propagated, so a failed emit never crashes a voice turn.
240
+ */
241
+ export async function handleLiveVoiceAttribution(
242
+ runtime: IAgentRuntime,
243
+ output: VoiceAttributionOutput,
244
+ opts: HandleLiveVoiceAttributionOptions = {},
245
+ ): Promise<VoiceTurnSignal> {
246
+ const standing = resolveSpeakerStanding(output, opts);
247
+ // Carry the real ASR transcript when the caller joined it (in-process engine);
248
+ // fall back to a base-signal transcript, else "" for diarization-only callers.
249
+ const transcript = opts.transcript ?? opts.baseSignal?.transcript ?? "";
250
+
251
+ if (output.observation) {
252
+ const obs = output.observation;
253
+ try {
254
+ await emitVoiceTurnObserved(runtime, {
255
+ turnId: output.turnId,
256
+ text: transcript,
257
+ imprintClusterId: obs.imprintClusterId,
258
+ matchConfidence: obs.confidence,
259
+ matchedEntityId: obs.entityId,
260
+ isOwner: standing.isOwner,
261
+ });
262
+ } catch (err) {
263
+ logger.warn(
264
+ {
265
+ turnId: output.turnId,
266
+ imprintClusterId: obs.imprintClusterId,
267
+ error: err instanceof Error ? err.message : String(err),
268
+ },
269
+ "[local-inference] VOICE_TURN_OBSERVED emit failed during live attribution",
270
+ );
271
+ }
272
+ }
273
+
274
+ const base: VoiceTurnSignal = opts.baseSignal ?? {
275
+ endOfTurnProbability: opts.endOfTurnProbability ?? 0.5,
276
+ nextSpeaker: "unknown",
277
+ agentShouldSpeak: null,
278
+ source: "custom",
279
+ transcript,
280
+ };
281
+
282
+ const signal = foldSpeakerIntoSignal(base, standing, opts);
283
+
284
+ const turn = output.turn;
285
+ turn.metadata = { ...(turn.metadata ?? {}), voiceTurnSignal: signal };
286
+
287
+ return signal;
288
+ }
289
+
290
+ // ---------------------------------------------------------------------------
291
+ // Consumer
292
+ // ---------------------------------------------------------------------------
293
+
294
+ /**
295
+ * Handler for `VOICE_ENTITY_BOUND`. Persists `entityId` onto every profile
296
+ * in the cluster that is not already bound to it. Returns nothing (the
297
+ * `EventHandler` contract); the bound count is logged.
298
+ */
299
+ export async function handleVoiceEntityBound(
300
+ payload: VoiceEntityBoundPayload,
301
+ ): Promise<void> {
302
+ const store = await getVoiceProfileStore();
303
+ const records = await store.list();
304
+ const targets = records.filter(
305
+ (r) =>
306
+ r.imprintClusterId === payload.imprintClusterId &&
307
+ r.entityId !== payload.entityId,
308
+ );
309
+ let bound = 0;
310
+ for (const record of targets) {
311
+ const updated = await store.bindEntity({
312
+ profileId: record.profileId,
313
+ entityId: payload.entityId,
314
+ ...(payload.displayName ? { label: payload.displayName } : {}),
315
+ });
316
+ if (updated) bound += 1;
317
+ }
318
+ if (bound > 0) {
319
+ logger.info(
320
+ {
321
+ imprintClusterId: payload.imprintClusterId,
322
+ entityId: payload.entityId,
323
+ bound,
324
+ },
325
+ "[local-inference] persisted voice→entity binding onto profile(s)",
326
+ );
327
+ }
328
+ }
@@ -0,0 +1,71 @@
1
+ # `services/local-inference/` (app-core, server-side)
2
+
3
+ This is the **server-side** local-inference service used by the agent
4
+ runtime (`@elizaos/app-core`). It owns:
5
+
6
+ - KV-cache slot management (`cache-bridge.ts`, `mtp-cache-flow.test.ts`).
7
+ - llama-server lifecycle (`ffi-streaming-backend.ts`, `mtp-doctor.ts`,
8
+ `llama-server-metrics.ts`, `session-pool.ts`).
9
+ - Conversation registry (`conversation-registry.ts`).
10
+ - Backend dispatch (`backend.ts`, `engine.ts`, `handler-registry.ts`,
11
+ `router-handler.ts`, `service.ts`).
12
+ - Provider snapshot, hardware probe, model catalog, recommendation, and
13
+ download orchestration (`providers.ts`, `hardware.ts`, `catalog.ts`,
14
+ `recommendation.ts`, `downloader.ts`, `assignments.ts`,
15
+ `bundled-models.ts`, `external-scanner.ts`, `hf-search.ts`,
16
+ `registry.ts`, `paths.ts`, `routing-policy.ts`).
17
+
18
+ ## Server / client split
19
+
20
+ The UI client mirror lives in
21
+ [`packages/ui/src/services/local-inference/`](../../../../ui/src/services/local-inference/README.md).
22
+ That mirror exists because UI code (panels, hooks, the iOS/Android local
23
+ agent kernel) needs access to the **catalog**, **recommendation**, and
24
+ the **type contract** for status payloads, but must not pull in the
25
+ server runtime (KV cache, llama-server lifecycle, conversation
26
+ registry).
27
+
28
+ Some files are byte-identical between the two trees and have identical
29
+ semantics. Those have been extracted to `@elizaos/shared/local-inference`
30
+ and the local files in this directory are thin re-exports:
31
+
32
+ - `paths.ts` — re-exports `localInferenceRoot` etc. from
33
+ `@elizaos/shared`.
34
+ - `routing-preferences.ts` — re-exports `readRoutingPreferences` etc.
35
+ from `@elizaos/shared`.
36
+ - `verify.ts` — re-exports `verifyInstalledModel` etc. from
37
+ `@elizaos/shared`.
38
+ - `types.ts` — re-exports `AgentModelSlot`, `InstalledModel`,
39
+ `ModelAssignments`, `TextGenerationSlot`, and `AGENT_MODEL_SLOTS` from
40
+ `@elizaos/shared`. Server-only types (MTP kernel metadata,
41
+ `LocalRuntimeOptimizations`, `loadedCacheTypeK`/`...V`/`GpuLayers`,
42
+ etc.) remain declared in this file because the UI public client has
43
+ no consumer for them.
44
+
45
+ ## What stays a twin (and why)
46
+
47
+ These files exist in both `packages/app-core` and `packages/ui` and are
48
+ intentionally **not** bundled:
49
+
50
+ - `catalog.ts` — server adds `contextLength`, `optimizations.requiresKernel`,
51
+ and MTP drafter variants that the UI public catalog does not surface.
52
+ - `recommendation.ts` — server has kernel-availability filtering
53
+ (`recommendation.test.ts` covers MTP gating) that depends on
54
+ server-only `LocalRuntimeOptimizations.requiresKernel`.
55
+ - `active-model.ts` — server resolves load args against the loader's
56
+ KV-cache type / GPU-layer overrides (server-only types).
57
+ - `device-bridge.ts` — server forwards `promptCacheKey` from the runtime
58
+ cache plan.
59
+ - `ffi-streaming-backend.ts` — server owns the full llama-server lifecycle, the
60
+ in-process binding fallback, and metrics scraping.
61
+ - `mtp-doctor.ts` — uses tokenizer parity catalog metadata that only
62
+ the server catalog declares.
63
+ - `engine.ts`, `handler-registry.ts`, `hardware.ts`, `index.ts`,
64
+ `providers.ts`, `router-handler.ts`, `service.ts` — server-side
65
+ superset; the UI mirror keeps a slim subset of the same surface for
66
+ type-only / catalog-only consumers.
67
+
68
+ If a twin pair becomes byte-identical with identical semantics, extract
69
+ it to `packages/shared/src/local-inference/` and replace both copies
70
+ with a thin re-export, the same way `paths.ts` / `verify.ts` /
71
+ `routing-preferences.ts` were handled.
@@ -0,0 +1,101 @@
1
+ import { describe, expect, it } from "vitest";
2
+
3
+ import { readBackendEnvOverride, selectBackend } from "../backend-selector";
4
+
5
+ describe("selectBackend", () => {
6
+ it("forces ffi-streaming on mobile when FFI is supported", () => {
7
+ expect(
8
+ selectBackend({
9
+ platform: "mobile",
10
+ ffiSupported: true,
11
+ }),
12
+ ).toBe("ffi-streaming");
13
+ });
14
+
15
+ it("throws on mobile when FFI is missing", () => {
16
+ expect(() =>
17
+ selectBackend({
18
+ platform: "mobile",
19
+ ffiSupported: false,
20
+ }),
21
+ ).toThrow(/streaming-LLM FFI symbols/);
22
+ });
23
+
24
+ it("desktop defaults to ffi-streaming when FFI is supported", () => {
25
+ expect(
26
+ selectBackend({
27
+ platform: "desktop",
28
+ ffiSupported: true,
29
+ }),
30
+ ).toBe("ffi-streaming");
31
+ });
32
+
33
+ it("throws on desktop when FFI symbols are absent", () => {
34
+ expect(() =>
35
+ selectBackend({
36
+ platform: "desktop",
37
+ ffiSupported: false,
38
+ }),
39
+ ).toThrow(/streaming-LLM FFI symbols/);
40
+ });
41
+
42
+ it("envOverride=ffi wins on desktop when supported", () => {
43
+ expect(
44
+ selectBackend({
45
+ platform: "desktop",
46
+ ffiSupported: true,
47
+ envOverride: "ffi",
48
+ }),
49
+ ).toBe("ffi-streaming");
50
+ });
51
+
52
+ it("envOverride=ffi without ffiSupported throws", () => {
53
+ expect(() =>
54
+ selectBackend({
55
+ platform: "desktop",
56
+ ffiSupported: false,
57
+ envOverride: "ffi",
58
+ }),
59
+ ).toThrow(/does not export the streaming-LLM symbols/);
60
+ });
61
+
62
+ it("envOverride=auto on desktop with FFI keeps the new default (ffi-streaming)", () => {
63
+ expect(
64
+ selectBackend({
65
+ platform: "desktop",
66
+ ffiSupported: true,
67
+ envOverride: "auto",
68
+ }),
69
+ ).toBe("ffi-streaming");
70
+ });
71
+ });
72
+
73
+ describe("readBackendEnvOverride", () => {
74
+ it("returns auto for explicit auto", () => {
75
+ expect(readBackendEnvOverride({ ELIZA_INFERENCE_BACKEND: "auto" })).toBe(
76
+ "auto",
77
+ );
78
+ });
79
+
80
+ it("normalizes ffi aliases and ignores server aliases", () => {
81
+ expect(readBackendEnvOverride({ ELIZA_INFERENCE_BACKEND: "FFI" })).toBe(
82
+ "ffi",
83
+ );
84
+ expect(
85
+ readBackendEnvOverride({ ELIZA_INFERENCE_BACKEND: "ffi-streaming" }),
86
+ ).toBe("ffi");
87
+ expect(
88
+ readBackendEnvOverride({ ELIZA_INFERENCE_BACKEND: "http-server" }),
89
+ ).toBeNull();
90
+ expect(readBackendEnvOverride({ ELIZA_INFERENCE_BACKEND: "server" })).toBe(
91
+ null,
92
+ );
93
+ });
94
+
95
+ it("returns null for unset / unknown", () => {
96
+ expect(readBackendEnvOverride({})).toBeNull();
97
+ expect(
98
+ readBackendEnvOverride({ ELIZA_INFERENCE_BACKEND: "foo" }),
99
+ ).toBeNull();
100
+ });
101
+ });