@elizaos/plugin-local-inference 2.0.0-beta.1 → 2.0.11-beta.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (676):
  1. package/LICENSE +21 -0
  2. package/README.md +83 -0
  3. package/package.json +81 -15
  4. package/src/actions/generate-media.d.ts +59 -0
  5. package/src/actions/generate-media.d.ts.map +1 -0
  6. package/src/actions/generate-media.ts +647 -0
  7. package/src/actions/identify-speaker.d.ts +23 -0
  8. package/src/actions/identify-speaker.d.ts.map +1 -0
  9. package/src/actions/identify-speaker.ts +171 -0
  10. package/src/adapters/capacitor-llama/__tests__/compat-behavior.test.ts +218 -0
  11. package/src/adapters/capacitor-llama/__tests__/index.test.ts +68 -0
  12. package/src/adapters/capacitor-llama/__tests__/structured-output.test.ts +215 -0
  13. package/src/adapters/capacitor-llama/__tests__/text-streaming.test.ts +174 -0
  14. package/src/adapters/capacitor-llama/environment.ts +71 -0
  15. package/src/adapters/capacitor-llama/index.browser.ts +83 -0
  16. package/src/adapters/capacitor-llama/index.ts +807 -0
  17. package/src/adapters/capacitor-llama/loader.ts +109 -0
  18. package/src/adapters/capacitor-llama/structured-output.ts +165 -0
  19. package/src/adapters/capacitor-llama/text-streaming.ts +227 -0
  20. package/src/adapters/capacitor-llama/types.ts +374 -0
  21. package/src/backends/apple-foundation.ts +127 -0
  22. package/src/index.d.ts +7 -0
  23. package/src/index.d.ts.map +1 -0
  24. package/src/index.ts +54 -0
  25. package/src/local-inference-routes.d.ts +38 -0
  26. package/src/local-inference-routes.d.ts.map +1 -0
  27. package/src/local-inference-routes.test.ts +344 -0
  28. package/src/local-inference-routes.ts +1543 -0
  29. package/src/provider.d.ts +21 -0
  30. package/src/provider.d.ts.map +1 -0
  31. package/src/provider.ts +1171 -0
  32. package/src/routes/compat-helpers.d.ts +18 -0
  33. package/src/routes/compat-helpers.d.ts.map +1 -0
  34. package/src/routes/compat-helpers.ts +274 -0
  35. package/src/routes/family-member-route.d.ts +62 -0
  36. package/src/routes/family-member-route.d.ts.map +1 -0
  37. package/src/routes/family-member-route.ts +353 -0
  38. package/src/routes/index.d.ts +19 -0
  39. package/src/routes/index.d.ts.map +1 -0
  40. package/src/routes/index.ts +60 -0
  41. package/src/routes/live-diarization-route.d.ts +26 -0
  42. package/src/routes/live-diarization-route.d.ts.map +1 -0
  43. package/src/routes/live-diarization-route.test.ts +213 -0
  44. package/src/routes/live-diarization-route.ts +122 -0
  45. package/src/routes/local-inference-asr-route.d.ts +4 -0
  46. package/src/routes/local-inference-asr-route.d.ts.map +1 -0
  47. package/src/routes/local-inference-asr-route.test.ts +190 -0
  48. package/src/routes/local-inference-asr-route.ts +213 -0
  49. package/src/routes/local-inference-compat-routes.d.ts +16 -0
  50. package/src/routes/local-inference-compat-routes.d.ts.map +1 -0
  51. package/src/routes/local-inference-compat-routes.test.ts +423 -0
  52. package/src/routes/local-inference-compat-routes.ts +782 -0
  53. package/src/routes/local-inference-tts-route.d.ts +7 -0
  54. package/src/routes/local-inference-tts-route.d.ts.map +1 -0
  55. package/src/routes/local-inference-tts-route.test.ts +179 -0
  56. package/src/routes/local-inference-tts-route.ts +230 -0
  57. package/src/routes/voice-first-run-routes.d.ts +62 -0
  58. package/src/routes/voice-first-run-routes.d.ts.map +1 -0
  59. package/src/routes/voice-first-run-routes.ts +524 -0
  60. package/src/routes/voice-models-routes.d.ts +62 -0
  61. package/src/routes/voice-models-routes.d.ts.map +1 -0
  62. package/src/routes/voice-models-routes.ts +554 -0
  63. package/src/routes/voice-profile-plugin-routes.d.ts +19 -0
  64. package/src/routes/voice-profile-plugin-routes.d.ts.map +1 -0
  65. package/src/routes/voice-profile-plugin-routes.ts +138 -0
  66. package/src/routes/voice-profiles-management-routes.d.ts +52 -0
  67. package/src/routes/voice-profiles-management-routes.d.ts.map +1 -0
  68. package/src/routes/voice-profiles-management-routes.ts +476 -0
  69. package/src/routes/voice-speaker-profile-routes.d.ts +57 -0
  70. package/src/routes/voice-speaker-profile-routes.d.ts.map +1 -0
  71. package/src/routes/voice-speaker-profile-routes.ts +199 -0
  72. package/src/runtime/aosp-llama-loader-selection.test.ts +80 -0
  73. package/src/runtime/capacitor-llama.d.ts +25 -0
  74. package/src/runtime/embedding-manager-support.d.ts +77 -0
  75. package/src/runtime/embedding-manager-support.d.ts.map +1 -0
  76. package/src/runtime/embedding-manager-support.ts +497 -0
  77. package/src/runtime/embedding-presets.d.ts +16 -0
  78. package/src/runtime/embedding-presets.d.ts.map +1 -0
  79. package/src/runtime/embedding-presets.ts +81 -0
  80. package/src/runtime/embedding-warmup-policy.d.ts +14 -0
  81. package/src/runtime/embedding-warmup-policy.d.ts.map +1 -0
  82. package/src/runtime/embedding-warmup-policy.test.ts +53 -0
  83. package/src/runtime/embedding-warmup-policy.ts +48 -0
  84. package/src/runtime/ensure-local-inference-handler.d.ts +53 -0
  85. package/src/runtime/ensure-local-inference-handler.d.ts.map +1 -0
  86. package/src/runtime/ensure-local-inference-handler.test.ts +528 -0
  87. package/src/runtime/ensure-local-inference-handler.ts +1398 -0
  88. package/src/runtime/index.d.ts +14 -0
  89. package/src/runtime/index.d.ts.map +1 -0
  90. package/src/runtime/index.ts +27 -0
  91. package/src/runtime/mobile-local-inference-gate.d.ts +31 -0
  92. package/src/runtime/mobile-local-inference-gate.d.ts.map +1 -0
  93. package/src/runtime/mobile-local-inference-gate.test.ts +69 -0
  94. package/src/runtime/mobile-local-inference-gate.ts +44 -0
  95. package/src/runtime/voice-entity-binding.d.ts +103 -0
  96. package/src/runtime/voice-entity-binding.d.ts.map +1 -0
  97. package/src/runtime/voice-entity-binding.transcript.test.ts +69 -0
  98. package/src/runtime/voice-entity-binding.ts +328 -0
  99. package/src/services/README.md +71 -0
  100. package/src/services/__tests__/backend-selector.test.ts +101 -0
  101. package/src/services/__tests__/checkpoint-manager.test.ts +376 -0
  102. package/src/services/__tests__/gpu-autotune.test.ts +400 -0
  103. package/src/services/__tests__/llm-streaming-binding.test.ts +85 -0
  104. package/src/services/__tests__/planner-grammar.test.ts +372 -0
  105. package/src/services/__tests__/runtime-target.test.ts +176 -0
  106. package/src/services/active-model-switch-rollback.test.ts +183 -0
  107. package/src/services/active-model.d.ts +282 -0
  108. package/src/services/active-model.d.ts.map +1 -0
  109. package/src/services/active-model.ts +1213 -0
  110. package/src/services/asr/errors.d.ts +21 -0
  111. package/src/services/asr/errors.d.ts.map +1 -0
  112. package/src/services/asr/errors.ts +50 -0
  113. package/src/services/asr/hash.d.ts +28 -0
  114. package/src/services/asr/hash.d.ts.map +1 -0
  115. package/src/services/asr/hash.ts +49 -0
  116. package/src/services/asr/index.d.ts +76 -0
  117. package/src/services/asr/index.d.ts.map +1 -0
  118. package/src/services/asr/index.ts +178 -0
  119. package/src/services/asr/types.d.ts +91 -0
  120. package/src/services/asr/types.d.ts.map +1 -0
  121. package/src/services/asr/types.ts +95 -0
  122. package/src/services/assignments.d.ts +71 -0
  123. package/src/services/assignments.d.ts.map +1 -0
  124. package/src/services/assignments.test.ts +80 -0
  125. package/src/services/assignments.ts +230 -0
  126. package/src/services/backend-selector.ts +95 -0
  127. package/src/services/backend.d.ts +346 -0
  128. package/src/services/backend.d.ts.map +1 -0
  129. package/src/services/backend.ts +612 -0
  130. package/src/services/bundled-models.d.ts +34 -0
  131. package/src/services/bundled-models.d.ts.map +1 -0
  132. package/src/services/bundled-models.ts +129 -0
  133. package/src/services/cache-bridge.d.ts +206 -0
  134. package/src/services/cache-bridge.d.ts.map +1 -0
  135. package/src/services/cache-bridge.test.ts +516 -0
  136. package/src/services/cache-bridge.ts +423 -0
  137. package/src/services/catalog.d.ts +10 -0
  138. package/src/services/catalog.d.ts.map +1 -0
  139. package/src/services/catalog.test.ts +240 -0
  140. package/src/services/catalog.ts +27 -0
  141. package/src/services/checkpoint-client.d.ts +109 -0
  142. package/src/services/checkpoint-client.d.ts.map +1 -0
  143. package/src/services/checkpoint-client.ts +258 -0
  144. package/src/services/checkpoint-manager.ts +474 -0
  145. package/src/services/cloud-fallback.d.ts +102 -0
  146. package/src/services/cloud-fallback.d.ts.map +1 -0
  147. package/src/services/cloud-fallback.ts +230 -0
  148. package/src/services/conversation-registry.d.ts +142 -0
  149. package/src/services/conversation-registry.d.ts.map +1 -0
  150. package/src/services/conversation-registry.test.ts +235 -0
  151. package/src/services/conversation-registry.ts +264 -0
  152. package/src/services/desktop-fused-ffi-backend-runtime.d.ts +92 -0
  153. package/src/services/desktop-fused-ffi-backend-runtime.d.ts.map +1 -0
  154. package/src/services/desktop-fused-ffi-backend-runtime.ts +333 -0
  155. package/src/services/device-bridge.d.ts +188 -0
  156. package/src/services/device-bridge.d.ts.map +1 -0
  157. package/src/services/device-bridge.ts +1237 -0
  158. package/src/services/device-resource-metrics.d.ts +149 -0
  159. package/src/services/device-resource-metrics.d.ts.map +1 -0
  160. package/src/services/device-resource-metrics.test.ts +98 -0
  161. package/src/services/device-resource-metrics.ts +346 -0
  162. package/src/services/device-tier.d.ts +115 -0
  163. package/src/services/device-tier.d.ts.map +1 -0
  164. package/src/services/device-tier.test.ts +371 -0
  165. package/src/services/device-tier.ts +410 -0
  166. package/src/services/downloader.d.ts +82 -0
  167. package/src/services/downloader.d.ts.map +1 -0
  168. package/src/services/downloader.test.ts +724 -0
  169. package/src/services/downloader.ts +899 -0
  170. package/src/services/engine-direct-bundle.test.ts +58 -0
  171. package/src/services/engine-streaming.test.ts +80 -0
  172. package/src/services/engine.d.ts +534 -0
  173. package/src/services/engine.d.ts.map +1 -0
  174. package/src/services/engine.ts +1891 -0
  175. package/src/services/ensure-local-artifacts.integration.test.ts +273 -0
  176. package/src/services/ensure-local-artifacts.test.ts +368 -0
  177. package/src/services/ensure-local-artifacts.ts +351 -0
  178. package/src/services/external-scanner.d.ts +17 -0
  179. package/src/services/external-scanner.d.ts.map +1 -0
  180. package/src/services/external-scanner.ts +312 -0
  181. package/src/services/ffi-llm-mock.ts +354 -0
  182. package/src/services/ffi-llm-streaming-abi.ts +442 -0
  183. package/src/services/ffi-streaming-backend.d.ts +180 -0
  184. package/src/services/ffi-streaming-backend.d.ts.map +1 -0
  185. package/src/services/ffi-streaming-backend.ts +382 -0
  186. package/src/services/ffi-streaming-runner.d.ts +122 -0
  187. package/src/services/ffi-streaming-runner.d.ts.map +1 -0
  188. package/src/services/ffi-streaming-runner.test.ts +60 -0
  189. package/src/services/ffi-streaming-runner.ts +354 -0
  190. package/src/services/ffi-unload-ordering.test.ts +162 -0
  191. package/src/services/gpu-autotune.ts +534 -0
  192. package/src/services/gpu-detect.ts +139 -0
  193. package/src/services/handler-registry.d.ts +72 -0
  194. package/src/services/handler-registry.d.ts.map +1 -0
  195. package/src/services/handler-registry.ts +240 -0
  196. package/src/services/hardware.d.ts +63 -0
  197. package/src/services/hardware.d.ts.map +1 -0
  198. package/src/services/hardware.test.ts +183 -0
  199. package/src/services/hardware.ts +404 -0
  200. package/src/services/hf-search.d.ts +26 -0
  201. package/src/services/hf-search.d.ts.map +1 -0
  202. package/src/services/hf-search.test.ts +69 -0
  203. package/src/services/hf-search.ts +420 -0
  204. package/src/services/image-description-runtime.d.ts +14 -0
  205. package/src/services/image-description-runtime.d.ts.map +1 -0
  206. package/src/services/image-description-runtime.test.ts +61 -0
  207. package/src/services/image-description-runtime.ts +118 -0
  208. package/src/services/imagegen/aosp-unavailable.d.ts +134 -0
  209. package/src/services/imagegen/aosp-unavailable.d.ts.map +1 -0
  210. package/src/services/imagegen/aosp-unavailable.ts +229 -0
  211. package/src/services/imagegen/backend-selector.d.ts +118 -0
  212. package/src/services/imagegen/backend-selector.d.ts.map +1 -0
  213. package/src/services/imagegen/backend-selector.ts +281 -0
  214. package/src/services/imagegen/coreml-unavailable.d.ts +105 -0
  215. package/src/services/imagegen/coreml-unavailable.d.ts.map +1 -0
  216. package/src/services/imagegen/coreml-unavailable.ts +237 -0
  217. package/src/services/imagegen/errors.d.ts +16 -0
  218. package/src/services/imagegen/errors.d.ts.map +1 -0
  219. package/src/services/imagegen/errors.ts +40 -0
  220. package/src/services/imagegen/index.d.ts +58 -0
  221. package/src/services/imagegen/index.d.ts.map +1 -0
  222. package/src/services/imagegen/index.ts +144 -0
  223. package/src/services/imagegen/mflux.d.ts +74 -0
  224. package/src/services/imagegen/mflux.d.ts.map +1 -0
  225. package/src/services/imagegen/mflux.ts +313 -0
  226. package/src/services/imagegen/sd-cpp.d.ts +180 -0
  227. package/src/services/imagegen/sd-cpp.d.ts.map +1 -0
  228. package/src/services/imagegen/sd-cpp.ts +718 -0
  229. package/src/services/imagegen/tensorrt-unavailable.d.ts +83 -0
  230. package/src/services/imagegen/tensorrt-unavailable.d.ts.map +1 -0
  231. package/src/services/imagegen/tensorrt-unavailable.ts +295 -0
  232. package/src/services/imagegen/types.d.ts +181 -0
  233. package/src/services/imagegen/types.d.ts.map +1 -0
  234. package/src/services/imagegen/types.ts +193 -0
  235. package/src/services/index.d.ts +30 -0
  236. package/src/services/index.d.ts.map +1 -0
  237. package/src/services/index.ts +225 -0
  238. package/src/services/inference-capabilities.d.ts +132 -0
  239. package/src/services/inference-capabilities.d.ts.map +1 -0
  240. package/src/services/inference-capabilities.test.ts +75 -0
  241. package/src/services/inference-capabilities.ts +204 -0
  242. package/src/services/inference-telemetry.d.ts +59 -0
  243. package/src/services/inference-telemetry.d.ts.map +1 -0
  244. package/src/services/inference-telemetry.ts +143 -0
  245. package/src/services/ios-llama-streaming.ts +248 -0
  246. package/src/services/kv-spill.d.ts +189 -0
  247. package/src/services/kv-spill.d.ts.map +1 -0
  248. package/src/services/kv-spill.test.ts +222 -0
  249. package/src/services/kv-spill.ts +356 -0
  250. package/src/services/latency-trace.d.ts +346 -0
  251. package/src/services/latency-trace.d.ts.map +1 -0
  252. package/src/services/latency-trace.test.ts +266 -0
  253. package/src/services/latency-trace.ts +844 -0
  254. package/src/services/llama-server-metrics.ts +304 -0
  255. package/src/services/llm-streaming-binding.d.ts +96 -0
  256. package/src/services/llm-streaming-binding.d.ts.map +1 -0
  257. package/src/services/llm-streaming-binding.ts +136 -0
  258. package/src/services/load-args.d.ts +82 -0
  259. package/src/services/load-args.d.ts.map +1 -0
  260. package/src/services/load-args.ts +81 -0
  261. package/src/services/manifest/eliza-1.manifest.v1.json +708 -0
  262. package/src/services/manifest/index.d.ts +4 -0
  263. package/src/services/manifest/index.d.ts.map +1 -0
  264. package/src/services/manifest/index.ts +66 -0
  265. package/src/services/manifest/manifest.test.ts +693 -0
  266. package/src/services/manifest/schema.d.ts +715 -0
  267. package/src/services/manifest/schema.d.ts.map +1 -0
  268. package/src/services/manifest/schema.ts +655 -0
  269. package/src/services/manifest/types.d.ts +30 -0
  270. package/src/services/manifest/types.d.ts.map +1 -0
  271. package/src/services/manifest/types.ts +55 -0
  272. package/src/services/manifest/validator.d.ts +66 -0
  273. package/src/services/manifest/validator.d.ts.map +1 -0
  274. package/src/services/manifest/validator.ts +569 -0
  275. package/src/services/memory-arbiter.d.ts +343 -0
  276. package/src/services/memory-arbiter.d.ts.map +1 -0
  277. package/src/services/memory-arbiter.test.ts +419 -0
  278. package/src/services/memory-arbiter.ts +1000 -0
  279. package/src/services/memory-monitor.d.ts +119 -0
  280. package/src/services/memory-monitor.d.ts.map +1 -0
  281. package/src/services/memory-monitor.test.ts +208 -0
  282. package/src/services/memory-monitor.ts +296 -0
  283. package/src/services/memory-pressure.d.ts +127 -0
  284. package/src/services/memory-pressure.d.ts.map +1 -0
  285. package/src/services/memory-pressure.ts +413 -0
  286. package/src/services/mtp-doctor.d.ts +13 -0
  287. package/src/services/mtp-doctor.d.ts.map +1 -0
  288. package/src/services/mtp-doctor.ts +78 -0
  289. package/src/services/network-policy.d.ts +127 -0
  290. package/src/services/network-policy.d.ts.map +1 -0
  291. package/src/services/network-policy.ts +346 -0
  292. package/src/services/paths.d.ts +6 -0
  293. package/src/services/paths.d.ts.map +1 -0
  294. package/src/services/paths.ts +25 -0
  295. package/src/services/planner-skeleton.d.ts +124 -0
  296. package/src/services/planner-skeleton.d.ts.map +1 -0
  297. package/src/services/planner-skeleton.ts +175 -0
  298. package/src/services/providers.d.ts +38 -0
  299. package/src/services/providers.d.ts.map +1 -0
  300. package/src/services/providers.ts +507 -0
  301. package/src/services/ram-budget-cache.test.ts +163 -0
  302. package/src/services/ram-budget.d.ts +110 -0
  303. package/src/services/ram-budget.d.ts.map +1 -0
  304. package/src/services/ram-budget.ts +0 -0
  305. package/src/services/readiness.d.ts +9 -0
  306. package/src/services/readiness.d.ts.map +1 -0
  307. package/src/services/readiness.test.ts +87 -0
  308. package/src/services/readiness.ts +238 -0
  309. package/src/services/recommendation.d.ts +111 -0
  310. package/src/services/recommendation.d.ts.map +1 -0
  311. package/src/services/recommendation.ts +672 -0
  312. package/src/services/registry.d.ts +35 -0
  313. package/src/services/registry.d.ts.map +1 -0
  314. package/src/services/registry.ts +151 -0
  315. package/src/services/router-handler.d.ts +92 -0
  316. package/src/services/router-handler.d.ts.map +1 -0
  317. package/src/services/router-handler.test.ts +45 -0
  318. package/src/services/router-handler.ts +376 -0
  319. package/src/services/routing-policy.d.ts +55 -0
  320. package/src/services/routing-policy.d.ts.map +1 -0
  321. package/src/services/routing-policy.ts +228 -0
  322. package/src/services/routing-preferences.d.ts +8 -0
  323. package/src/services/routing-preferences.d.ts.map +1 -0
  324. package/src/services/routing-preferences.ts +15 -0
  325. package/src/services/runtime-target.d.ts +98 -0
  326. package/src/services/runtime-target.d.ts.map +1 -0
  327. package/src/services/runtime-target.ts +154 -0
  328. package/src/services/service.d.ts +128 -0
  329. package/src/services/service.d.ts.map +1 -0
  330. package/src/services/service.test.ts +223 -0
  331. package/src/services/service.ts +735 -0
  332. package/src/services/session-pool.d.ts +72 -0
  333. package/src/services/session-pool.d.ts.map +1 -0
  334. package/src/services/session-pool.ts +153 -0
  335. package/src/services/structured-output/deterministic-repair.d.ts +23 -0
  336. package/src/services/structured-output/deterministic-repair.d.ts.map +1 -0
  337. package/src/services/structured-output/deterministic-repair.test.ts +169 -0
  338. package/src/services/structured-output/deterministic-repair.ts +443 -0
  339. package/src/services/structured-output/index.ts +4 -0
  340. package/src/services/structured-output.d.ts +311 -0
  341. package/src/services/structured-output.d.ts.map +1 -0
  342. package/src/services/structured-output.test.ts +483 -0
  343. package/src/services/structured-output.ts +712 -0
  344. package/src/services/transcription-priority.test.ts +211 -0
  345. package/src/services/tts/errors.ts +46 -0
  346. package/src/services/tts/index.ts +214 -0
  347. package/src/services/tts/tts-audio-cache.ts +235 -0
  348. package/src/services/tts/types.ts +157 -0
  349. package/src/services/types.d.ts +19 -0
  350. package/src/services/types.d.ts.map +1 -0
  351. package/src/services/types.ts +55 -0
  352. package/src/services/verify-on-device.d.ts +34 -0
  353. package/src/services/verify-on-device.d.ts.map +1 -0
  354. package/src/services/verify-on-device.test.ts +87 -0
  355. package/src/services/verify-on-device.ts +127 -0
  356. package/src/services/verify.d.ts +8 -0
  357. package/src/services/verify.d.ts.map +1 -0
  358. package/src/services/verify.ts +13 -0
  359. package/src/services/vision/aosp-unavailable.d.ts +115 -0
  360. package/src/services/vision/aosp-unavailable.d.ts.map +1 -0
  361. package/src/services/vision/aosp-unavailable.ts +163 -0
  362. package/src/services/vision/capacitor-llama.d.ts +99 -0
  363. package/src/services/vision/capacitor-llama.d.ts.map +1 -0
  364. package/src/services/vision/capacitor-llama.ts +255 -0
  365. package/src/services/vision/cloud-fallback.d.ts +47 -0
  366. package/src/services/vision/cloud-fallback.d.ts.map +1 -0
  367. package/src/services/vision/cloud-fallback.test.ts +243 -0
  368. package/src/services/vision/cloud-fallback.ts +268 -0
  369. package/src/services/vision/fallback-chain.test.ts +86 -0
  370. package/src/services/vision/hash.d.ts +71 -0
  371. package/src/services/vision/hash.d.ts.map +1 -0
  372. package/src/services/vision/hash.ts +157 -0
  373. package/src/services/vision/index.d.ts +95 -0
  374. package/src/services/vision/index.d.ts.map +1 -0
  375. package/src/services/vision/index.ts +251 -0
  376. package/src/services/vision/llama-server.d.ts +73 -0
  377. package/src/services/vision/llama-server.d.ts.map +1 -0
  378. package/src/services/vision/llama-server.ts +177 -0
  379. package/src/services/vision/types.d.ts +153 -0
  380. package/src/services/vision/types.d.ts.map +1 -0
  381. package/src/services/vision/types.ts +154 -0
  382. package/src/services/vision/vast-fallback.d.ts +18 -0
  383. package/src/services/vision/vast-fallback.d.ts.map +1 -0
  384. package/src/services/vision/vast-fallback.ts +127 -0
  385. package/src/services/vision-embedding-cache.d.ts +98 -0
  386. package/src/services/vision-embedding-cache.d.ts.map +1 -0
  387. package/src/services/vision-embedding-cache.ts +189 -0
  388. package/src/services/voice/VOICE_WORKBENCH.md +88 -0
  389. package/src/services/voice/__test-helpers__/fake-ffi.ts +92 -0
  390. package/src/services/voice/__test-helpers__/synthetic-speech.ts +124 -0
  391. package/src/services/voice/__tests__/checkpoint-manager.test.ts +241 -0
  392. package/src/services/voice/__tests__/checkpoint-policy.test.ts +270 -0
  393. package/src/services/voice/__tests__/eager-context-builder.test.ts +257 -0
  394. package/src/services/voice/__tests__/eliza1-eot-scorer.test.ts +288 -0
  395. package/src/services/voice/__tests__/eot-classifier.test.ts +431 -0
  396. package/src/services/voice/__tests__/optimistic-rollback.test.ts +312 -0
  397. package/src/services/voice/__tests__/prefill-client.test.ts +266 -0
  398. package/src/services/voice/__tests__/prefix-preserving-queue.test.ts +208 -0
  399. package/src/services/voice/__tests__/streaming-asr.test.ts +450 -0
  400. package/src/services/voice/__tests__/streaming-transcriber.test.ts +339 -0
  401. package/src/services/voice/__tests__/turn-detector-resolver.test.ts +197 -0
  402. package/src/services/voice/__tests__/voice-state-machine-prefill.test.ts +275 -0
  403. package/src/services/voice/__tests__/voice-state-machine.test.ts +354 -0
  404. package/src/services/voice/audio-frame-consumer.d.ts +212 -0
  405. package/src/services/voice/audio-frame-consumer.d.ts.map +1 -0
  406. package/src/services/voice/audio-frame-consumer.test.ts +343 -0
  407. package/src/services/voice/audio-frame-consumer.ts +491 -0
  408. package/src/services/voice/barge-in.d.ts +112 -0
  409. package/src/services/voice/barge-in.d.ts.map +1 -0
  410. package/src/services/voice/barge-in.test.ts +244 -0
  411. package/src/services/voice/barge-in.ts +336 -0
  412. package/src/services/voice/cancellation-coordinator.d.ts +127 -0
  413. package/src/services/voice/cancellation-coordinator.d.ts.map +1 -0
  414. package/src/services/voice/cancellation-coordinator.test.ts +196 -0
  415. package/src/services/voice/cancellation-coordinator.ts +269 -0
  416. package/src/services/voice/checkpoint-manager.d.ts +199 -0
  417. package/src/services/voice/checkpoint-manager.d.ts.map +1 -0
  418. package/src/services/voice/checkpoint-manager.ts +401 -0
  419. package/src/services/voice/checkpoint-policy.ts +336 -0
  420. package/src/services/voice/composite-eot-classifier.test.ts +59 -0
  421. package/src/services/voice/e2e-harness.test.ts +182 -0
  422. package/src/services/voice/e2e-harness.ts +743 -0
  423. package/src/services/voice/eager-context-builder.d.ts +170 -0
  424. package/src/services/voice/eager-context-builder.d.ts.map +1 -0
  425. package/src/services/voice/eager-context-builder.ts +262 -0
  426. package/src/services/voice/eliza1-eot-scorer.d.ts +124 -0
  427. package/src/services/voice/eliza1-eot-scorer.d.ts.map +1 -0
  428. package/src/services/voice/eliza1-eot-scorer.ts +242 -0
  429. package/src/services/voice/embedding-server.ts +200 -0
  430. package/src/services/voice/embedding.d.ts +133 -0
  431. package/src/services/voice/embedding.d.ts.map +1 -0
  432. package/src/services/voice/embedding.test.ts +148 -0
  433. package/src/services/voice/embedding.ts +244 -0
  434. package/src/services/voice/emotion-attribution.d.ts +68 -0
  435. package/src/services/voice/emotion-attribution.d.ts.map +1 -0
  436. package/src/services/voice/emotion-attribution.test.ts +129 -0
  437. package/src/services/voice/emotion-attribution.ts +361 -0
  438. package/src/services/voice/engine-bridge-cancellation.test.ts +422 -0
  439. package/src/services/voice/engine-bridge.d.ts +746 -0
  440. package/src/services/voice/engine-bridge.d.ts.map +1 -0
  441. package/src/services/voice/engine-bridge.test.ts +384 -0
  442. package/src/services/voice/engine-bridge.ts +2226 -0
  443. package/src/services/voice/eot-classifier-ggml.d.ts +179 -0
  444. package/src/services/voice/eot-classifier-ggml.d.ts.map +1 -0
  445. package/src/services/voice/eot-classifier-ggml.ts +566 -0
  446. package/src/services/voice/eot-classifier.d.ts +214 -0
  447. package/src/services/voice/eot-classifier.d.ts.map +1 -0
  448. package/src/services/voice/eot-classifier.ts +533 -0
  449. package/src/services/voice/errors.d.ts +20 -0
  450. package/src/services/voice/errors.d.ts.map +1 -0
  451. package/src/services/voice/errors.ts +32 -0
  452. package/src/services/voice/expressive-tags.d.ts +158 -0
  453. package/src/services/voice/expressive-tags.d.ts.map +1 -0
  454. package/src/services/voice/expressive-tags.ts +405 -0
  455. package/src/services/voice/ffi-bindings.d.ts +636 -0
  456. package/src/services/voice/ffi-bindings.d.ts.map +1 -0
  457. package/src/services/voice/ffi-bindings.test.ts +671 -0
  458. package/src/services/voice/ffi-bindings.ts +3050 -0
  459. package/src/services/voice/first-line-cache.d.ts +181 -0
  460. package/src/services/voice/first-line-cache.d.ts.map +1 -0
  461. package/src/services/voice/first-line-cache.ts +725 -0
  462. package/src/services/voice/fused-eot-scorer.d.ts +51 -0
  463. package/src/services/voice/fused-eot-scorer.d.ts.map +1 -0
  464. package/src/services/voice/fused-eot-scorer.ts +135 -0
  465. package/src/services/voice/index.d.ts +91 -0
  466. package/src/services/voice/index.d.ts.map +1 -0
  467. package/src/services/voice/index.ts +481 -0
  468. package/src/services/voice/kokoro/__tests__/kokoro-backend.test.ts +151 -0
  469. package/src/services/voice/kokoro/__tests__/kokoro-engine-bridge.real.test.ts +151 -0
  470. package/src/services/voice/kokoro/__tests__/kokoro-engine-bridge.test.ts +60 -0
  471. package/src/services/voice/kokoro/__tests__/kokoro-engine-discovery.test.ts +277 -0
  472. package/src/services/voice/kokoro/__tests__/kokoro-ffi-runtime.test.ts +235 -0
  473. package/src/services/voice/kokoro/__tests__/kokoro-runtime.test.ts +95 -0
  474. package/src/services/voice/kokoro/__tests__/phonemizer.test.ts +53 -0
  475. package/src/services/voice/kokoro/__tests__/runtime-selection.test.ts +231 -0
  476. package/src/services/voice/kokoro/__tests__/voices.test.ts +57 -0
  477. package/src/services/voice/kokoro/index.ts +79 -0
  478. package/src/services/voice/kokoro/kokoro-backend.d.ts +72 -0
  479. package/src/services/voice/kokoro/kokoro-backend.d.ts.map +1 -0
  480. package/src/services/voice/kokoro/kokoro-backend.ts +207 -0
  481. package/src/services/voice/kokoro/kokoro-engine-discovery.d.ts +58 -0
  482. package/src/services/voice/kokoro/kokoro-engine-discovery.d.ts.map +1 -0
  483. package/src/services/voice/kokoro/kokoro-engine-discovery.ts +177 -0
  484. package/src/services/voice/kokoro/kokoro-ffi-runtime.d.ts +75 -0
  485. package/src/services/voice/kokoro/kokoro-ffi-runtime.d.ts.map +1 -0
  486. package/src/services/voice/kokoro/kokoro-ffi-runtime.ts +233 -0
  487. package/src/services/voice/kokoro/kokoro-runtime.d.ts +100 -0
  488. package/src/services/voice/kokoro/kokoro-runtime.d.ts.map +1 -0
  489. package/src/services/voice/kokoro/kokoro-runtime.ts +170 -0
  490. package/src/services/voice/kokoro/phoneme-stream.ts +123 -0
  491. package/src/services/voice/kokoro/phonemizer.d.ts +50 -0
  492. package/src/services/voice/kokoro/phonemizer.d.ts.map +1 -0
  493. package/src/services/voice/kokoro/phonemizer.ts +344 -0
  494. package/src/services/voice/kokoro/pick-runtime.d.ts +61 -0
  495. package/src/services/voice/kokoro/pick-runtime.d.ts.map +1 -0
  496. package/src/services/voice/kokoro/pick-runtime.test.ts +91 -0
  497. package/src/services/voice/kokoro/pick-runtime.ts +130 -0
  498. package/src/services/voice/kokoro/runtime-selection.d.ts +92 -0
  499. package/src/services/voice/kokoro/runtime-selection.d.ts.map +1 -0
  500. package/src/services/voice/kokoro/runtime-selection.ts +237 -0
  501. package/src/services/voice/kokoro/types.d.ts +82 -0
  502. package/src/services/voice/kokoro/types.d.ts.map +1 -0
  503. package/src/services/voice/kokoro/types.ts +95 -0
  504. package/src/services/voice/kokoro/voice-presets.d.ts +23 -0
  505. package/src/services/voice/kokoro/voice-presets.d.ts.map +1 -0
  506. package/src/services/voice/kokoro/voice-presets.ts +129 -0
  507. package/src/services/voice/kokoro/voices.d.ts +30 -0
  508. package/src/services/voice/kokoro/voices.d.ts.map +1 -0
  509. package/src/services/voice/kokoro/voices.ts +64 -0
  510. package/src/services/voice/lifecycle.d.ts +135 -0
  511. package/src/services/voice/lifecycle.d.ts.map +1 -0
  512. package/src/services/voice/lifecycle.test.ts +315 -0
  513. package/src/services/voice/lifecycle.ts +301 -0
  514. package/src/services/voice/live-diarization-session.d.ts +96 -0
  515. package/src/services/voice/live-diarization-session.d.ts.map +1 -0
  516. package/src/services/voice/live-diarization-session.ts +289 -0
  517. package/src/services/voice/mic-source.d.ts +136 -0
  518. package/src/services/voice/mic-source.d.ts.map +1 -0
  519. package/src/services/voice/mic-source.test.ts +210 -0
  520. package/src/services/voice/mic-source.ts +503 -0
  521. package/src/services/voice/optimistic-policy.d.ts +109 -0
  522. package/src/services/voice/optimistic-policy.d.ts.map +1 -0
  523. package/src/services/voice/optimistic-policy.test.ts +101 -0
  524. package/src/services/voice/optimistic-policy.ts +192 -0
  525. package/src/services/voice/optimistic-rollback.ts +343 -0
  526. package/src/services/voice/partial-stabilizer.d.ts +73 -0
  527. package/src/services/voice/partial-stabilizer.d.ts.map +1 -0
  528. package/src/services/voice/partial-stabilizer.test.ts +68 -0
  529. package/src/services/voice/partial-stabilizer.ts +140 -0
  530. package/src/services/voice/phoneme-tokenizer.d.ts +49 -0
  531. package/src/services/voice/phoneme-tokenizer.d.ts.map +1 -0
  532. package/src/services/voice/phoneme-tokenizer.ts +158 -0
  533. package/src/services/voice/phrase-cache.d.ts +76 -0
  534. package/src/services/voice/phrase-cache.d.ts.map +1 -0
  535. package/src/services/voice/phrase-cache.test.ts +242 -0
  536. package/src/services/voice/phrase-cache.ts +186 -0
  537. package/src/services/voice/phrase-chunker.d.ts +62 -0
  538. package/src/services/voice/phrase-chunker.d.ts.map +1 -0
  539. package/src/services/voice/phrase-chunker.test.ts +239 -0
  540. package/src/services/voice/phrase-chunker.ts +281 -0
  541. package/src/services/voice/pipeline-impls.d.ts +151 -0
  542. package/src/services/voice/pipeline-impls.d.ts.map +1 -0
  543. package/src/services/voice/pipeline-impls.l6.test.ts +110 -0
  544. package/src/services/voice/pipeline-impls.test.ts +292 -0
  545. package/src/services/voice/pipeline-impls.ts +315 -0
  546. package/src/services/voice/pipeline.d.ts +216 -0
  547. package/src/services/voice/pipeline.d.ts.map +1 -0
  548. package/src/services/voice/pipeline.ts +505 -0
  549. package/src/services/voice/prefill-client.d.ts +123 -0
  550. package/src/services/voice/prefill-client.d.ts.map +1 -0
  551. package/src/services/voice/prefill-client.ts +316 -0
  552. package/src/services/voice/prefix-preserving-queue.d.ts +113 -0
  553. package/src/services/voice/prefix-preserving-queue.d.ts.map +1 -0
  554. package/src/services/voice/prefix-preserving-queue.ts +162 -0
  555. package/src/services/voice/profile-store.d.ts +248 -0
  556. package/src/services/voice/profile-store.d.ts.map +1 -0
  557. package/src/services/voice/profile-store.ts +887 -0
  558. package/src/services/voice/ring-buffer.d.ts +40 -0
  559. package/src/services/voice/ring-buffer.d.ts.map +1 -0
  560. package/src/services/voice/ring-buffer.ts +105 -0
  561. package/src/services/voice/rollback-queue.d.ts +24 -0
  562. package/src/services/voice/rollback-queue.d.ts.map +1 -0
  563. package/src/services/voice/rollback-queue.ts +74 -0
  564. package/src/services/voice/samantha-preset-placeholder.d.ts +67 -0
  565. package/src/services/voice/samantha-preset-placeholder.d.ts.map +1 -0
  566. package/src/services/voice/samantha-preset-placeholder.test.ts +97 -0
  567. package/src/services/voice/samantha-preset-placeholder.ts +148 -0
  568. package/src/services/voice/samantha-preset-regenerator.d.ts +87 -0
  569. package/src/services/voice/samantha-preset-regenerator.d.ts.map +1 -0
  570. package/src/services/voice/samantha-preset-regenerator.ts +393 -0
  571. package/src/services/voice/scheduler.d.ts +146 -0
  572. package/src/services/voice/scheduler.d.ts.map +1 -0
  573. package/src/services/voice/scheduler.t2.test.ts +141 -0
  574. package/src/services/voice/scheduler.ts +927 -0
  575. package/src/services/voice/shared-resources.d.ts +190 -0
  576. package/src/services/voice/shared-resources.d.ts.map +1 -0
  577. package/src/services/voice/shared-resources.ts +320 -0
  578. package/src/services/voice/speaker/attribution-pipeline.d.ts +74 -0
  579. package/src/services/voice/speaker/attribution-pipeline.d.ts.map +1 -0
  580. package/src/services/voice/speaker/attribution-pipeline.ts +386 -0
  581. package/src/services/voice/speaker/diarizer-fused.d.ts +59 -0
  582. package/src/services/voice/speaker/diarizer-fused.d.ts.map +1 -0
  583. package/src/services/voice/speaker/diarizer-fused.real.test.ts +100 -0
  584. package/src/services/voice/speaker/diarizer-fused.ts +154 -0
  585. package/src/services/voice/speaker/diarizer.d.ts +75 -0
  586. package/src/services/voice/speaker/diarizer.d.ts.map +1 -0
  587. package/src/services/voice/speaker/diarizer.ts +218 -0
  588. package/src/services/voice/speaker/encoder-fused.d.ts +60 -0
  589. package/src/services/voice/speaker/encoder-fused.d.ts.map +1 -0
  590. package/src/services/voice/speaker/encoder-fused.real.test.ts +113 -0
  591. package/src/services/voice/speaker/encoder-fused.ts +138 -0
  592. package/src/services/voice/speaker/encoder-ggml.d.ts +33 -0
  593. package/src/services/voice/speaker/encoder-ggml.d.ts.map +1 -0
  594. package/src/services/voice/speaker/encoder-ggml.ts +79 -0
  595. package/src/services/voice/speaker/encoder.d.ts +37 -0
  596. package/src/services/voice/speaker/encoder.d.ts.map +1 -0
  597. package/src/services/voice/speaker/encoder.ts +105 -0
  598. package/src/services/voice/speaker-imprint.d.ts +83 -0
  599. package/src/services/voice/speaker-imprint.d.ts.map +1 -0
  600. package/src/services/voice/speaker-imprint.test.ts +185 -0
  601. package/src/services/voice/speaker-imprint.ts +312 -0
  602. package/src/services/voice/speaker-preset-cache.d.ts +77 -0
  603. package/src/services/voice/speaker-preset-cache.d.ts.map +1 -0
  604. package/src/services/voice/speaker-preset-cache.test.ts +154 -0
  605. package/src/services/voice/speaker-preset-cache.ts +195 -0
  606. package/src/services/voice/streaming-asr/streaming-pipeline-adapter.ts +292 -0
  607. package/src/services/voice/system-audio-sink.d.ts +73 -0
  608. package/src/services/voice/system-audio-sink.d.ts.map +1 -0
  609. package/src/services/voice/system-audio-sink.test.ts +29 -0
  610. package/src/services/voice/system-audio-sink.ts +366 -0
  611. package/src/services/voice/transcriber.d.ts +244 -0
  612. package/src/services/voice/transcriber.d.ts.map +1 -0
  613. package/src/services/voice/transcriber.test.ts +392 -0
  614. package/src/services/voice/transcriber.ts +704 -0
  615. package/src/services/voice/turn-controller.d.ts +183 -0
  616. package/src/services/voice/turn-controller.d.ts.map +1 -0
  617. package/src/services/voice/turn-controller.test.ts +575 -0
  618. package/src/services/voice/turn-controller.ts +596 -0
  619. package/src/services/voice/types.d.ts +643 -0
  620. package/src/services/voice/types.d.ts.map +1 -0
  621. package/src/services/voice/types.ts +699 -0
  622. package/src/services/voice/vad.d.ts +282 -0
  623. package/src/services/voice/vad.d.ts.map +1 -0
  624. package/src/services/voice/vad.test.ts +480 -0
  625. package/src/services/voice/vad.ts +827 -0
  626. package/src/services/voice/vad.v1-v4.test.ts +222 -0
  627. package/src/services/voice/voice-budget.d.ts +241 -0
  628. package/src/services/voice/voice-budget.d.ts.map +1 -0
  629. package/src/services/voice/voice-budget.test.ts +420 -0
  630. package/src/services/voice/voice-budget.ts +656 -0
  631. package/src/services/voice/voice-duet.test.ts +375 -0
  632. package/src/services/voice/voice-emotion-classifier.d.ts +95 -0
  633. package/src/services/voice/voice-emotion-classifier.d.ts.map +1 -0
  634. package/src/services/voice/voice-emotion-classifier.test.ts +210 -0
  635. package/src/services/voice/voice-emotion-classifier.ts +273 -0
  636. package/src/services/voice/voice-preset-format.d.ts +158 -0
  637. package/src/services/voice/voice-preset-format.d.ts.map +1 -0
  638. package/src/services/voice/voice-preset-format.ts +700 -0
  639. package/src/services/voice/voice-preset-generator.test.ts +89 -0
  640. package/src/services/voice/voice-profile-artifact.d.ts +116 -0
  641. package/src/services/voice/voice-profile-artifact.d.ts.map +1 -0
  642. package/src/services/voice/voice-profile-artifact.test.ts +138 -0
  643. package/src/services/voice/voice-profile-artifact.ts +518 -0
  644. package/src/services/voice/voice-profile-routes.d.ts +83 -0
  645. package/src/services/voice/voice-profile-routes.d.ts.map +1 -0
  646. package/src/services/voice/voice-profile-routes.test.ts +429 -0
  647. package/src/services/voice/voice-profile-routes.ts +425 -0
  648. package/src/services/voice/voice-scenario.ts +154 -0
  649. package/src/services/voice/voice-settings.d.ts +82 -0
  650. package/src/services/voice/voice-settings.d.ts.map +1 -0
  651. package/src/services/voice/voice-settings.ts +172 -0
  652. package/src/services/voice/voice-state-machine.d.ts +364 -0
  653. package/src/services/voice/voice-state-machine.d.ts.map +1 -0
  654. package/src/services/voice/voice-state-machine.ts +727 -0
  655. package/src/services/voice/voice-workbench-report.test.ts +168 -0
  656. package/src/services/voice/voice-workbench-report.ts +326 -0
  657. package/src/services/voice/voice-workbench.test.ts +158 -0
  658. package/src/services/voice/voice.test.ts +1070 -0
  659. package/src/services/voice/wake-word-ggml.d.ts +101 -0
  660. package/src/services/voice/wake-word-ggml.d.ts.map +1 -0
  661. package/src/services/voice/wake-word-ggml.ts +320 -0
  662. package/src/services/voice/wake-word.d.ts +255 -0
  663. package/src/services/voice/wake-word.d.ts.map +1 -0
  664. package/src/services/voice/wake-word.test.ts +298 -0
  665. package/src/services/voice/wake-word.ts +554 -0
  666. package/src/services/voice/wrap-with-first-line-cache.d.ts +70 -0
  667. package/src/services/voice/wrap-with-first-line-cache.d.ts.map +1 -0
  668. package/src/services/voice/wrap-with-first-line-cache.ts +267 -0
  669. package/src/services/voice-model-updater.d.ts +240 -0
  670. package/src/services/voice-model-updater.d.ts.map +1 -0
  671. package/src/services/voice-model-updater.ts +724 -0
  672. package/src/services/voice-prewarm.d.ts +3 -0
  673. package/src/services/voice-prewarm.d.ts.map +1 -0
  674. package/src/services/voice-prewarm.ts +51 -0
  675. package/dist/index.d.ts +0 -37
  676. package/dist/index.js +0 -1098
@@ -0,0 +1,807 @@
1
+ /**
2
+ * Local-AI plugin backed by the Capacitor-llama adapter.
3
+ *
4
+ * This is the unified replacement for the legacy capacitor-llama adapter.
5
+ * It registers a `Plugin` that handles `ModelType.TEXT_SMALL/LARGE/EMBEDDING`
6
+ * via `CapacitorLlamaContext` — a single contract that resolves to
7
+ * `llama-cpp-capacitor` on mobile and the desktop bun:ffi adapter on
8
+ * desktop. Both load THE vendored llama.cpp at
9
+ * `plugins/plugin-local-inference/native/llama.cpp/` (Wave 2's cross-compiles).
10
+ *
11
+ * `capacitor-llama` is NEVER imported here.
12
+ */
13
+
14
+ import fs from "node:fs";
15
+ import path, { basename } from "node:path";
16
+ import type {
17
+ DetokenizeTextParams,
18
+ EventPayload,
19
+ GenerateTextParams,
20
+ ImageDescriptionParams,
21
+ ImageDescriptionResult,
22
+ JSONSchema,
23
+ ModelTypeName,
24
+ TextEmbeddingParams,
25
+ TextStreamResult,
26
+ TextToSpeechParams,
27
+ TokenizeTextParams,
28
+ TokenUsage,
29
+ ToolChoice,
30
+ ToolDefinition,
31
+ TranscriptionParams,
32
+ } from "@elizaos/core";
33
+ import {
34
+ EventType,
35
+ type IAgentRuntime,
36
+ logger,
37
+ ModelType,
38
+ type Plugin,
39
+ resolveStateDir,
40
+ } from "@elizaos/core";
41
+ import {
42
+ createLocalInferenceModelHandlers,
43
+ isLocalInferenceUnavailableError,
44
+ } from "../..";
45
+ import { type Config, validateConfig } from "./environment";
46
+ import { initCapacitorLlama } from "./loader";
47
+ import {
48
+ applyStructuredPlan,
49
+ extractToolCalls,
50
+ planStructuredRequest,
51
+ type ToolCallResult,
52
+ } from "./structured-output";
53
+ import { streamCapacitorPrompt } from "./text-streaming";
54
+ import {
55
+ type CapacitorLlamaCompletionParams,
56
+ type CapacitorLlamaContext,
57
+ type EmbeddingModelSpec,
58
+ MODEL_SPECS,
59
+ type ModelSpec,
60
+ } from "./types";
61
+
62
/** System prompt substituted whenever a request carries no non-empty one. */
const DEFAULT_LOCAL_SYSTEM_PROMPT = "Respond to the current request only.";

/** A loaded llama context paired with the system prompt it was created for. */
type ContextEntry = {
  ctx: CapacitorLlamaContext;
  systemPrompt: string;
};

/** Result of a non-streaming local completion. */
type LocalGenerationResult = {
  text: string;
  toolCalls: ToolCallResult[];
  finishReason: string | undefined;
};

/** Text-generation params plus the model slot the request targets. */
type LocalGenerateTextParams = GenerateTextParams & {
  modelType?: ModelTypeName;
};

/** Either a completed generation or a streaming handle. */
type LocalGenerationOutput = LocalGenerationResult | TextStreamResult;

/**
 * Outcome of trying the local-inference route: `handled: true` carries the
 * produced value, `handled: false` tells the caller to use its own path.
 */
type LocalInferenceRouteResult<T> =
  | { handled: true; value: T }
  | { handled: false };
84
+
85
/**
 * Type guard: a value counts as a stream result when it is a non-null object
 * exposing all of `textStream`, `text`, `usage` and `finishReason`.
 */
function isStreamResult(
  value: LocalGenerationOutput,
): value is TextStreamResult {
  if (typeof value !== "object" || value === null) return false;
  const requiredKeys = ["textStream", "text", "usage", "finishReason"];
  return requiredKeys.every((key) => key in value);
}

/**
 * Shape returned to callers that asked for tools / structured output: typed as
 * a string intersected with the structured fields.
 */
type LocalNativeTextModelResult = string & {
  text: string;
  toolCalls: ToolCallResult[];
  finishReason?: string;
};
103
+
104
/**
 * Reads `key` from `value` when `value` is a non-null object; every other
 * input (primitives, null, undefined, functions) yields `undefined`.
 */
function getObjectField(value: unknown, key: string): unknown {
  const isObjectLike = typeof value === "object" && value !== null;
  return isObjectLike ? (value as Record<string, unknown>)[key] : undefined;
}
108
+
109
/**
 * Pulls the text to embed out of the handler params.
 *
 * @param params A raw string, a params object, or null.
 * @returns The string itself, the object's string `text` field, or `null`
 *   when neither is available.
 */
function extractEmbeddingText(
  params: TextEmbeddingParams | string | null,
): string | null {
  const raw: unknown = params;
  if (typeof raw === "string") return raw;
  if (typeof raw !== "object" || raw === null) return null;
  const candidate = (raw as Record<string, unknown>).text;
  return typeof candidate === "string" ? candidate : null;
}
116
+
117
/**
 * Returns the trimmed embedding text.
 *
 * @throws Error when no text is present or it is empty after trimming.
 */
function getRequiredEmbeddingText(
  params: TextEmbeddingParams | string | null,
): string {
  const trimmed = extractEmbeddingText(params)?.trim();
  if (trimmed) return trimmed;
  throw new Error("Embedding text must be a non-empty string");
}
126
+
127
/**
 * Flattens a chat message's content to plain text.
 *
 * Strings pass through unchanged. For arrays, each object part contributes its
 * string `text` (preferred) or string `content`; empty contributions are
 * dropped and the rest are joined with newlines. Anything else yields "".
 */
function stringifyMessageContent(
  content: NonNullable<GenerateTextParams["messages"]>[number]["content"],
): string {
  if (typeof content === "string") return content;
  if (!Array.isArray(content)) return "";

  const pieces: string[] = [];
  for (const part of content) {
    if (!part || typeof part !== "object") continue;
    const fields = part as Record<string, unknown>;
    let piece = "";
    if (typeof fields.text === "string") {
      piece = fields.text;
    } else if (typeof fields.content === "string") {
      piece = fields.content;
    }
    if (piece) pieces.push(piece);
  }
  return pieces.join("\n");
}
145
+
146
/**
 * Renders the request into the single prompt string sent to the model.
 *
 * With a non-empty `messages` list, each message becomes `role: content` (or
 * just `role:` when the content flattens to nothing), one per line. Otherwise
 * the prompt is a `system:` line (falling back to the default system prompt)
 * followed by a `user:` line holding `params.prompt`.
 */
function renderCompletionPrompt(params: GenerateTextParams): string {
  const messages = params.messages;
  if (messages && messages.length > 0) {
    const lines: string[] = [];
    for (const message of messages) {
      const body = stringifyMessageContent(message.content);
      lines.push(body ? `${message.role}: ${body}` : `${message.role}:`);
    }
    return lines.join("\n");
  }

  const systemText = params.system?.trim() || DEFAULT_LOCAL_SYSTEM_PROMPT;
  const userText = params.prompt ?? "";
  return `system: ${systemText}\nuser: ${userText}`;
}
160
+
161
/**
 * Reduces a tool-choice value to a plain label.
 *
 * @returns The string itself, an object's string `name`, the nested
 *   `function.name` of a `{ type: "function" }` choice, or `undefined`.
 */
function getToolChoiceLabel(
  toolChoice: ToolChoice | undefined,
): string | undefined {
  const raw: unknown = toolChoice;
  if (typeof raw === "string") return raw;
  if (typeof raw !== "object" || raw === null) return undefined;

  const choice = raw as Record<string, unknown>;
  if (typeof choice.name === "string") return choice.name;

  if (choice.type !== "function") return undefined;
  const fn = choice.function;
  if (!fn) return undefined;
  const fnName = (fn as { name?: unknown }).name;
  return typeof fnName === "string" ? fnName : undefined;
}
180
+
181
/** Token accounting in the shape used for MODEL_USED events. */
type NormalizedUsage = {
  promptTokens: number;
  completionTokens: number;
  totalTokens: number;
  /** Set when the counts are heuristics rather than tokenizer output. */
  estimated?: boolean;
};

/** Rough token estimate: one token per four characters, rounded up. */
function estimateTokenCount(text: string): number {
  return text.length === 0 ? 0 : Math.ceil(text.length / 4);
}

/**
 * Turns an arbitrary response into text for size estimation.
 *
 * `JSON.stringify` returns `undefined` (not a string) for `undefined`,
 * functions and symbols, and throws for BigInt / circular structures, so
 * every path here is forced to end in a real string.
 */
function responseToEstimateText(response: unknown): string {
  if (typeof response === "string") return response;
  // No response at all means no completion text to count.
  if (response === undefined) return "";
  try {
    return JSON.stringify(response) ?? String(response);
  } catch {
    return String(response);
  }
}

/**
 * Estimates token usage for a prompt/response pair.
 *
 * @param prompt Prompt text that was sent.
 * @param response Model output; non-strings are JSON-serialized first.
 * @returns Estimated counts, always flagged `estimated: true`.
 */
function estimateUsage(prompt: string, response: unknown): NormalizedUsage {
  const promptTokens = estimateTokenCount(prompt);
  const completionTokens = estimateTokenCount(responseToEstimateText(response));
  return {
    promptTokens,
    completionTokens,
    totalTokens: promptTokens + completionTokens,
    estimated: true,
  };
}
212
+
213
/** Copies the three token counts, dropping the `estimated` marker. */
function normalizedToTokenUsage(usage: NormalizedUsage): TokenUsage {
  const { promptTokens, completionTokens, totalTokens } = usage;
  return { promptTokens, completionTokens, totalTokens };
}
220
+
221
/**
 * Estimated usage for an embedding call: the input text counts as prompt
 * tokens and there are no completion tokens.
 */
function estimateEmbeddingUsage(text: string): NormalizedUsage {
  const inputTokens = estimateTokenCount(text);
  const usage: NormalizedUsage = {
    promptTokens: inputTokens,
    completionTokens: 0,
    totalTokens: inputTokens,
    estimated: true,
  };
  return usage;
}
230
+
231
/**
 * Removes every closed `<think>…</think>` section, plus one newline directly
 * after it. Text without an opening tag is returned untouched; an unclosed
 * tag is left in place.
 */
function stripThinkTags(text: string): string {
  if (!text.includes("<think>")) {
    return text;
  }
  return text.replace(/<think>[\s\S]*?<\/think>\n?/g, "");
}
236
+
237
/**
 * Whether the caller expects the structured (text + tool calls) result rather
 * than a bare string: true when tools are supplied, a response schema or tool
 * choice is set, or the response format is `{ type: "json_object" }`.
 */
function wantsNativeShape(params: GenerateTextParams): boolean {
  const hasTools = (params.tools?.length ?? 0) > 0;
  const format = params.responseFormat;
  const wantsJsonObject =
    typeof format === "object" &&
    format !== null &&
    format.type === "json_object";
  return (
    hasTools ||
    Boolean(params.responseSchema) ||
    Boolean(params.toolChoice) ||
    wantsJsonObject
  );
}
250
+
251
/**
 * Decides whether an error from the local-inference route should trigger the
 * fallback path: only "unavailable" errors qualify, and when such an error
 * carries a `reason` it must be `backend_unavailable` or
 * `capability_unavailable`.
 */
function shouldFallbackFromLocalInference(error: unknown): boolean {
  if (!isLocalInferenceUnavailableError(error)) return false;
  if (!("reason" in error)) return true;
  return (
    error.reason === "backend_unavailable" ||
    error.reason === "capability_unavailable"
  );
}
260
+
261
/**
 * Attempts to serve a model call through the local-inference handlers.
 *
 * @returns `{ handled: true, value }` on success; `{ handled: false }` when no
 *   handler is registered for `modelType` or the handler failed with an error
 *   that qualifies for fallback. Any other error is rethrown.
 */
async function tryLocalInferenceModel<T>(
  runtime: IAgentRuntime,
  modelType: ModelTypeName,
  params: unknown,
): Promise<LocalInferenceRouteResult<T>> {
  const handlerKey = modelType as keyof typeof localInferenceModelHandlers;
  const handler = localInferenceModelHandlers[handlerKey];
  if (typeof handler !== "function") return { handled: false };

  let value: unknown;
  try {
    value = await handler(runtime, params as never);
  } catch (error) {
    if (!shouldFallbackFromLocalInference(error)) throw error;
    const reason =
      isLocalInferenceUnavailableError(error) && "reason" in error
        ? error.reason
        : "unknown";
    logger.debug(
      { modelType, reason },
      "[plugin-local-ai] Local-inference route unavailable; falling back to legacy compatibility path.",
    );
    return { handled: false };
  }
  return { handled: true, value: value as T };
}
292
+
293
/**
 * Packs a generation result into the structured return shape. `finishReason`
 * is only present on the output when it is truthy on the input.
 */
function buildNativeResult(
  result: LocalGenerationResult,
): LocalNativeTextModelResult {
  const { text, toolCalls, finishReason } = result;
  const shaped: {
    text: string;
    toolCalls: ToolCallResult[];
    finishReason?: string;
  } = { text, toolCalls };
  if (finishReason) {
    shaped.finishReason = finishReason;
  }
  return shaped as unknown as LocalNativeTextModelResult;
}
303
+
304
/**
 * Resolves the model name reported for a model type: the runtime setting when
 * truthy, otherwise the validated config value. Embedding and large map to
 * their own settings; everything else uses the small-model setting.
 */
function getLocalModelLabel(
  runtime: IAgentRuntime,
  type: ModelTypeName,
): string {
  const defaults = validateConfig();
  const settingKey =
    type === ModelType.TEXT_EMBEDDING
      ? "LOCAL_EMBEDDING_MODEL"
      : type === ModelType.TEXT_LARGE
        ? "LOCAL_LARGE_MODEL"
        : "LOCAL_SMALL_MODEL";
  return String(runtime.getSetting(settingKey) || defaults[settingKey]);
}
324
+
325
/**
 * Emits a fire-and-forget MODEL_USED event describing one local model call.
 *
 * The emit is intentionally not awaited. A rejection from it is caught and
 * logged so a failing listener cannot surface as an unhandled promise
 * rejection in the host process.
 *
 * @param runtime Runtime whose event bus receives the event.
 * @param type Model type that served the request.
 * @param model Model label, reported as both `model` and `modelName`.
 * @param usage Token counts; `estimated` is mirrored into the payload.
 */
function emitModelUsed(
  runtime: IAgentRuntime,
  type: ModelTypeName,
  model: string,
  usage: NormalizedUsage,
): void {
  const payload = {
    runtime,
    source: "local-ai",
    provider: "local-ai",
    type,
    model,
    modelName: model,
    tokens: {
      prompt: usage.promptTokens,
      completion: usage.completionTokens,
      total: usage.totalTokens,
      ...(usage.estimated ? { estimated: true } : {}),
    },
    ...(usage.estimated ? { usageEstimated: true } : {}),
  } as EventPayload;

  // Promise.resolve tolerates emitters that return a non-promise value.
  void Promise.resolve(
    runtime.emitEvent(EventType.MODEL_USED as string, payload),
  ).catch((err: unknown) => {
    logger.warn(
      { err: err instanceof Error ? err.message : String(err) },
      "[plugin-local-ai] Failed to emit MODEL_USED event",
    );
  });
}
350
+
351
/**
 * Singleton manager. Holds one Capacitor context per `ModelType` (small,
 * large, embedding), plus the resolved environment configuration and model
 * paths. The KV cache survives between turns inside `CapacitorLlamaContext`
 * because we reuse the same handle.
 */
class LocalAIManager {
  private static instance: LocalAIManager | null = null;
  /** Cached context for every text model type other than TEXT_LARGE. */
  private smallCtx: ContextEntry | null = null;
  /** Cached context for `ModelType.TEXT_LARGE` (the "medium" slot). */
  private mediumCtx: ContextEntry | null = null;
  private embeddingCtx: CapacitorLlamaContext | null = null;
  private modelPath!: string;
  private mediumModelPath!: string;
  private embeddingModelPath!: string;
  private cacheDir!: string;
  private activeModelConfig: ModelSpec;
  private embeddingModelConfig: EmbeddingModelSpec;
  private config: Config | null = null;
  private environmentInitialized = false;
  /** In-flight environment initialization, shared by concurrent callers. */
  private environmentInitializingPromise: Promise<void> | null = null;
  private modelsDir!: string;

  private constructor() {
    this.config = validateConfig();
    this._setupCacheDir();
    this.activeModelConfig = MODEL_SPECS.small;
    this.embeddingModelConfig = MODEL_SPECS.embedding;
  }

  /**
   * Resolves the models directory (config, then `MODELS_DIR` env, then
   * `<state dir>/models`) and creates it when missing.
   */
  private _setupModelsDir(): void {
    const modelsDirEnv =
      this.config?.MODELS_DIR?.trim() || process.env.MODELS_DIR?.trim();
    this.modelsDir = modelsDirEnv
      ? path.resolve(modelsDirEnv)
      : path.join(resolveStateDir(), "models");
    if (!fs.existsSync(this.modelsDir)) {
      fs.mkdirSync(this.modelsDir, { recursive: true });
    }
    logger.info({ modelsDir: this.modelsDir }, "Models directory ready");
  }

  /**
   * Resolves the cache directory (config, then `CACHE_DIR` env, then
   * `<state dir>/cache`) and creates it when missing.
   */
  private _setupCacheDir(): void {
    const cacheDirEnv =
      this.config?.CACHE_DIR?.trim() || process.env.CACHE_DIR?.trim();
    this.cacheDir = cacheDirEnv
      ? path.resolve(cacheDirEnv)
      : path.join(resolveStateDir(), "cache");
    if (!fs.existsSync(this.cacheDir)) {
      fs.mkdirSync(this.cacheDir, { recursive: true });
    }
    logger.info({ cacheDir: this.cacheDir }, "Cache directory ready");
  }

  /** Returns the process-wide manager, creating it on first use. */
  public static getInstance(): LocalAIManager {
    if (!LocalAIManager.instance) {
      LocalAIManager.instance = new LocalAIManager();
    }
    return LocalAIManager.instance;
  }

  /**
   * Validates configuration and resolves the three model file paths.
   *
   * Runs at most once on success; concurrent callers share the in-flight
   * promise. If initialization fails, the cached promise is cleared so the
   * next call retries instead of replaying the same rejection forever.
   */
  public async initializeEnvironment(): Promise<void> {
    if (this.environmentInitialized) return;
    if (!this.environmentInitializingPromise) {
      this.environmentInitializingPromise = (async () => {
        const config = await validateConfig();
        this.config = config;
        this._setupModelsDir();
        this.modelPath = path.join(this.modelsDir, config.LOCAL_SMALL_MODEL);
        this.mediumModelPath = path.join(
          this.modelsDir,
          config.LOCAL_LARGE_MODEL,
        );
        this.embeddingModelPath = path.join(
          this.modelsDir,
          config.LOCAL_EMBEDDING_MODEL,
        );
        logger.info(
          {
            small: basename(this.modelPath),
            medium: basename(this.mediumModelPath),
            embedding: basename(this.embeddingModelPath),
          },
          "Model paths resolved",
        );
        this.environmentInitialized = true;
      })().catch((err: unknown) => {
        // Drop the failed attempt so a later call can try again.
        this.environmentInitializingPromise = null;
        throw err;
      });
    }
    await this.environmentInitializingPromise;
  }

  /** Spec of the text model slot that was resolved most recently. */
  public getActiveModelConfig(): ModelSpec {
    return this.activeModelConfig;
  }

  /**
   * Returns the context for the slot serving `modelType`, loading it when
   * absent. A cached context is reused only when it was created for the same
   * system prompt; otherwise it is released and a fresh one is loaded.
   */
  private async resolveCtx(
    modelType: ModelTypeName,
    systemPrompt: string,
  ): Promise<ContextEntry> {
    const slot = modelType === ModelType.TEXT_LARGE ? "medium" : "small";
    const spec = slot === "medium" ? MODEL_SPECS.medium : MODEL_SPECS.small;
    const existing = slot === "medium" ? this.mediumCtx : this.smallCtx;
    if (existing && existing.systemPrompt === systemPrompt) {
      this.activeModelConfig = spec;
      return existing;
    }
    if (existing) {
      // System prompt changed — release the cached context.
      try {
        await existing.ctx.release();
      } catch (err) {
        logger.warn(
          { err: err instanceof Error ? err.message : String(err) },
          "[plugin-local-ai] Failed releasing stale context",
        );
      }
      if (slot === "medium") this.mediumCtx = null;
      else this.smallCtx = null;
    }

    const modelPath = slot === "medium" ? this.mediumModelPath : this.modelPath;
    const ctx = await initCapacitorLlama({
      model: modelPath,
      n_ctx: spec.contextSize,
      n_gpu_layers: 999,
      use_mmap: true,
    });
    const entry: ContextEntry = { ctx, systemPrompt };
    if (slot === "medium") this.mediumCtx = entry;
    else this.smallCtx = entry;
    this.activeModelConfig = spec;
    return entry;
  }

  /** Prepares the environment and loads the context for `modelType`. */
  async initialize(
    modelType: ModelTypeName = ModelType.TEXT_SMALL,
  ): Promise<void> {
    await this.initializeEnvironment();
    await this.resolveCtx(modelType, DEFAULT_LOCAL_SYSTEM_PROMPT);
  }

  /** Loads the embedding context once; later calls are no-ops. */
  public async initializeEmbedding(): Promise<void> {
    await this.initializeEnvironment();
    if (this.embeddingCtx) return;
    this.embeddingCtx = await initCapacitorLlama({
      model: this.embeddingModelPath,
      n_ctx: this.embeddingModelConfig.contextSize,
      n_gpu_layers: 0,
      embedding: true,
      pooling_type: "mean",
    });
  }

  /**
   * Embeds `text` with the embedding context.
   *
   * @throws Error when the embedding context is still missing after init.
   */
  async generateEmbedding(text: string): Promise<number[]> {
    await this.initializeEmbedding();
    if (!this.embeddingCtx) {
      throw new Error("Failed to initialize embedding context");
    }
    const result = await this.embeddingCtx.embedding(text, {
      embd_normalize: 2,
    });
    return result.embedding;
  }

  /**
   * Runs one text generation.
   *
   * Structured plans (`tools`, `schema`, `json_object`) always use a single
   * blocking completion; tool calls are extracted only for the `tools` plan.
   * Unstructured requests stream when `stream === true` or an
   * `onStreamChunk` callback is supplied, and otherwise complete in one call.
   *
   * @returns A streaming handle, or the think-tag-stripped text with tool
   *   calls and a finish reason (`"stop"` when the model reported
   *   `stopped_eos`).
   */
  async generateText(
    params: LocalGenerateTextParams,
  ): Promise<LocalGenerationOutput> {
    await this.initializeEnvironment();
    const modelType = params.modelType ?? ModelType.TEXT_SMALL;
    const systemPrompt = params.system?.trim() || DEFAULT_LOCAL_SYSTEM_PROMPT;
    const entry = await this.resolveCtx(modelType, systemPrompt);
    const toolChoiceLabel = getToolChoiceLabel(params.toolChoice);
    const plan = planStructuredRequest({
      tools: params.tools as readonly ToolDefinition[] | undefined,
      responseSchema: params.responseSchema as JSONSchema | undefined,
      responseFormat: params.responseFormat,
      toolChoice: toolChoiceLabel,
    });

    const baseParams: CapacitorLlamaCompletionParams = {
      prompt: renderCompletionPrompt({ ...params, system: systemPrompt }),
      n_predict: params.maxTokens ?? 8192,
      temperature: params.temperature ?? 0.7,
      top_p: params.topP ?? 0.9,
      ...(typeof params.topK === "number" ? { top_k: params.topK } : {}),
      ...(typeof params.minP === "number" ? { min_p: params.minP } : {}),
      ...(typeof params.seed === "number" ? { seed: params.seed } : {}),
      penalty_repeat: params.repetitionPenalty ?? 1.2,
      penalty_freq: params.frequencyPenalty ?? 0.7,
      penalty_present: params.presencePenalty ?? 0.7,
      stop: params.stopSequences ?? [],
    };
    const fullParams = applyStructuredPlan(baseParams, plan);

    const isStructured =
      plan.kind === "tools" ||
      plan.kind === "schema" ||
      plan.kind === "json_object";

    if (!isStructured) {
      const streamParams = params as GenerateTextParams & {
        onStreamChunk?: unknown;
      };
      const wantsStreaming =
        params.stream === true ||
        typeof streamParams.onStreamChunk === "function";

      if (wantsStreaming) {
        return streamCapacitorPrompt({
          ctx: entry.ctx,
          params: fullParams,
          estimateUsage: (p, fullText) =>
            normalizedToTokenUsage(estimateUsage(p, fullText)),
          onChunk:
            typeof streamParams.onStreamChunk === "function"
              ? (delta) => streamParams.onStreamChunk?.(delta)
              : undefined,
          postProcess: stripThinkTags,
        });
      }
    }

    const result = await entry.ctx.completion(fullParams);
    const toolCalls: ToolCallResult[] =
      plan.kind === "tools" ? extractToolCalls(result) : [];
    const text = stripThinkTags(result.content || result.text);
    return {
      text,
      toolCalls,
      finishReason: result.stopped_eos ? "stop" : undefined,
    };
  }
}
597
+
598
/**
 * Reports usage for a finished generation and shapes the handler's return
 * value.
 *
 * Streaming results are returned as-is; their usage event is emitted once the
 * stream's `usage` promise resolves, and a rejection of that promise is logged
 * rather than left unhandled. Non-streaming results emit an estimated usage
 * event immediately and return either the structured result (when the caller
 * asked for tools / structured output) or the plain text.
 *
 * @param runtime Runtime used for settings lookup and event emission.
 * @param modelType Model type that served the request.
 * @param params The caller's original generation params.
 * @param result Output of the generation.
 */
function finalizeTextResult(
  runtime: IAgentRuntime,
  modelType: ModelTypeName,
  params: GenerateTextParams,
  result: LocalGenerationOutput,
): string | LocalNativeTextModelResult | TextStreamResult {
  const modelLabel = getLocalModelLabel(runtime, modelType);

  if (isStreamResult(result)) {
    void Promise.resolve(result.usage)
      .then((usage) => {
        if (!usage) return;
        emitModelUsed(runtime, modelType, modelLabel, {
          promptTokens: usage.promptTokens,
          completionTokens: usage.completionTokens,
          totalTokens: usage.totalTokens,
          estimated: true,
        });
      })
      .catch((err: unknown) => {
        logger.warn(
          { err: err instanceof Error ? err.message : String(err) },
          "[plugin-local-ai] Failed to report streaming usage",
        );
      });
    return result;
  }

  // Message-only requests have no `prompt`; estimate from the rendered
  // messages (what is actually sent) instead of reporting zero prompt tokens.
  const hasMessages = Boolean(params.messages && params.messages.length > 0);
  const promptForEstimate =
    params.prompt || (hasMessages ? renderCompletionPrompt(params) : "");

  emitModelUsed(
    runtime,
    modelType,
    modelLabel,
    estimateUsage(promptForEstimate, result.text),
  );
  return wantsNativeShape(params) ? buildNativeResult(result) : result.text;
}
626
+
627
// Handlers for the local-inference route; tried before the adapter's own path.
const localInferenceModelHandlers = createLocalInferenceModelHandlers();

// Shared manager instance, created when this module is first loaded.
const localAIManager = LocalAIManager.getInstance();
629
+
630
/**
 * Plugin definition registered under the name "local-ai".
 *
 * `init` prepares the shared `localAIManager` environment and logs which of
 * the configured model files are present on disk.
 *
 * Every `models` handler offers the request to `tryLocalInferenceModel` and
 * returns its value when it reports `handled` (the text-generation handlers
 * only do so when `wantsNativeShape(params)` is false). Unhandled text and
 * embedding requests fall back to `localAIManager`; every other model type
 * throws an error that points at @elizaos/plugin-local-inference.
 */
export const localAiPlugin: Plugin = {
  name: "local-ai",
  description:
    "Local AI plugin using Eliza-1 GGUF models via the canonical Capacitor-llama adapter (mobile + desktop FFI; no node-llama-cpp).",

  /**
   * Initializes the manager environment, resolves the models directory and
   * logs whether the small / large / embedding model files exist.
   *
   * @param _config - Plugin configuration; not read by this hook.
   * @param _runtime - Agent runtime; not read by this hook.
   */
  async init(
    _config: Record<string, unknown> | undefined,
    _runtime: IAgentRuntime,
  ) {
    logger.info("Initializing Local AI plugin (Capacitor-llama backend)");
    await localAIManager.initializeEnvironment();

    const settings = validateConfig();
    // An explicitly configured directory wins; otherwise use "<state dir>/models".
    const modelsDir =
      settings.MODELS_DIR || path.join(resolveStateDir(), "models");

    // A missing directory is only reported, never treated as a failure here.
    const modelsDirPresent = fs.existsSync(modelsDir);
    if (!modelsDirPresent) {
      logger.warn(
        { modelsDir },
        "Models directory missing; will be created on first download",
      );
    }

    // Resolve all three paths first, then probe the filesystem for each.
    const modelFiles = {
      small: path.join(modelsDir, settings.LOCAL_SMALL_MODEL),
      large: path.join(modelsDir, settings.LOCAL_LARGE_MODEL),
      embedding: path.join(modelsDir, settings.LOCAL_EMBEDDING_MODEL),
    };
    const modelsExist = {
      small: fs.existsSync(modelFiles.small),
      large: fs.existsSync(modelFiles.large),
      embedding: fs.existsSync(modelFiles.embedding),
    };

    logger.info(modelsExist, "Local AI model file presence");
    logger.info("Local AI plugin initialized");
  },

  models: {
    /** Small-model text generation: routed handler first, manager fallback second. */
    [ModelType.TEXT_SMALL]: async (
      runtime: IAgentRuntime,
      params: GenerateTextParams,
    ) => {
      const modelType = ModelType.TEXT_SMALL;

      // Routing is skipped entirely when the caller wants the native shape.
      if (!wantsNativeShape(params)) {
        const delegated = await tryLocalInferenceModel<string>(
          runtime,
          modelType,
          params,
        );
        if (delegated.handled) return delegated.value;
      }

      await localAIManager.initializeEnvironment();
      const generated = await localAIManager.generateText({
        ...params,
        modelType,
      });
      return finalizeTextResult(runtime, modelType, params, generated);
    },

    /** Large-model text generation: routed handler first, manager fallback second. */
    [ModelType.TEXT_LARGE]: async (
      runtime: IAgentRuntime,
      params: GenerateTextParams,
    ) => {
      const modelType = ModelType.TEXT_LARGE;

      // Routing is skipped entirely when the caller wants the native shape.
      if (!wantsNativeShape(params)) {
        const delegated = await tryLocalInferenceModel<string>(
          runtime,
          modelType,
          params,
        );
        if (delegated.handled) return delegated.value;
      }

      await localAIManager.initializeEnvironment();
      const generated = await localAIManager.generateText({
        ...params,
        modelType,
      });
      return finalizeTextResult(runtime, modelType, params, generated);
    },

    /**
     * Text embedding. The input text is extracted up front, before routing is
     * attempted; the manager fallback also emits a model-usage event.
     */
    [ModelType.TEXT_EMBEDDING]: async (
      runtime: IAgentRuntime,
      params: TextEmbeddingParams | string | null,
    ) => {
      const inputText = getRequiredEmbeddingText(params);

      const delegated = await tryLocalInferenceModel<number[]>(
        runtime,
        ModelType.TEXT_EMBEDDING,
        params,
      );
      if (delegated.handled) return delegated.value;

      const vector = await localAIManager.generateEmbedding(inputText);
      const modelLabel = getLocalModelLabel(runtime, ModelType.TEXT_EMBEDDING);
      const usage = estimateEmbeddingUsage(inputText);
      emitModelUsed(runtime, ModelType.TEXT_EMBEDDING, modelLabel, usage);
      return vector;
    },

    /** Tokenization: routed handler only; throws when it does not handle the call. */
    [ModelType.TEXT_TOKENIZER_ENCODE]: async (
      runtime: IAgentRuntime,
      params: TokenizeTextParams,
    ) => {
      const delegated = await tryLocalInferenceModel<number[]>(
        runtime,
        ModelType.TEXT_TOKENIZER_ENCODE,
        params,
      );
      if (!delegated.handled) {
        throw new Error(
          "plugin-local-ai tokenizer has been migrated to @elizaos/plugin-local-inference. " +
            "Enable an Eliza-1 bundle and route via plugin-local-inference for tokenization.",
        );
      }
      return delegated.value;
    },

    /** Detokenization: routed handler only; throws when it does not handle the call. */
    [ModelType.TEXT_TOKENIZER_DECODE]: async (
      runtime: IAgentRuntime,
      params: DetokenizeTextParams,
    ) => {
      const delegated = await tryLocalInferenceModel<string>(
        runtime,
        ModelType.TEXT_TOKENIZER_DECODE,
        params,
      );
      if (!delegated.handled) {
        throw new Error(
          "plugin-local-ai detokenizer has been migrated to @elizaos/plugin-local-inference. " +
            "Enable an Eliza-1 bundle and route via plugin-local-inference for detokenization.",
        );
      }
      return delegated.value;
    },

    /** Image description: routed handler only; throws when it does not handle the call. */
    [ModelType.IMAGE_DESCRIPTION]: async (
      runtime: IAgentRuntime,
      params: ImageDescriptionParams | string,
    ) => {
      const delegated = await tryLocalInferenceModel<ImageDescriptionResult>(
        runtime,
        ModelType.IMAGE_DESCRIPTION,
        params,
      );
      if (!delegated.handled) {
        throw new Error(
          "plugin-local-ai image description has been migrated to @elizaos/plugin-local-inference.",
        );
      }
      return delegated.value;
    },

    /** Transcription: routed handler only; throws when it does not handle the call. */
    [ModelType.TRANSCRIPTION]: async (
      runtime: IAgentRuntime,
      params: TranscriptionParams | Buffer | string,
    ) => {
      const delegated = await tryLocalInferenceModel<string>(
        runtime,
        ModelType.TRANSCRIPTION,
        params,
      );
      if (!delegated.handled) {
        throw new Error(
          "plugin-local-ai transcription has been migrated to @elizaos/plugin-local-inference.",
        );
      }
      return delegated.value;
    },

    /** Text-to-speech: routed handler only; throws when it does not handle the call. */
    [ModelType.TEXT_TO_SPEECH]: async (
      runtime: IAgentRuntime,
      params: TextToSpeechParams | string,
    ) => {
      const delegated = await tryLocalInferenceModel<Uint8Array>(
        runtime,
        ModelType.TEXT_TO_SPEECH,
        params,
      );
      if (!delegated.handled) {
        throw new Error(
          "plugin-local-ai TTS has been migrated to @elizaos/plugin-local-inference.",
        );
      }
      return delegated.value;
    },
  },
};

export default localAiPlugin;