@elizaos/plugin-local-inference 2.0.0-beta.1 → 2.0.3-beta.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (893)
  1. package/LICENSE +21 -0
  2. package/README.md +157 -0
  3. package/dist/actions/generate-media.d.ts +59 -0
  4. package/dist/actions/generate-media.d.ts.map +1 -0
  5. package/dist/actions/identify-speaker.d.ts +23 -0
  6. package/dist/actions/identify-speaker.d.ts.map +1 -0
  7. package/dist/actions/transcription-control.d.ts +29 -0
  8. package/dist/actions/transcription-control.d.ts.map +1 -0
  9. package/dist/adapters/capacitor-llama/environment.d.ts +12 -0
  10. package/dist/adapters/capacitor-llama/environment.d.ts.map +1 -0
  11. package/dist/adapters/capacitor-llama/index.browser.d.ts +9 -0
  12. package/dist/adapters/capacitor-llama/index.browser.d.ts.map +1 -0
  13. package/dist/adapters/capacitor-llama/index.d.ts +18 -0
  14. package/dist/adapters/capacitor-llama/index.d.ts.map +1 -0
  15. package/dist/adapters/capacitor-llama/loader.d.ts +35 -0
  16. package/dist/adapters/capacitor-llama/loader.d.ts.map +1 -0
  17. package/dist/adapters/capacitor-llama/native-voice-capture.d.ts +70 -0
  18. package/dist/adapters/capacitor-llama/native-voice-capture.d.ts.map +1 -0
  19. package/dist/adapters/capacitor-llama/structured-output.d.ts +62 -0
  20. package/dist/adapters/capacitor-llama/structured-output.d.ts.map +1 -0
  21. package/dist/adapters/capacitor-llama/text-streaming.d.ts +24 -0
  22. package/dist/adapters/capacitor-llama/text-streaming.d.ts.map +1 -0
  23. package/dist/adapters/capacitor-llama/types.d.ts +338 -0
  24. package/dist/adapters/capacitor-llama/types.d.ts.map +1 -0
  25. package/dist/adapters/capacitor-llama/voice-turn.d.ts +86 -0
  26. package/dist/adapters/capacitor-llama/voice-turn.d.ts.map +1 -0
  27. package/dist/backends/apple-foundation.d.ts +56 -0
  28. package/dist/backends/apple-foundation.d.ts.map +1 -0
  29. package/dist/index.d.ts +8 -37
  30. package/dist/index.d.ts.map +1 -0
  31. package/dist/index.js +38979 -430
  32. package/dist/index.js.map +217 -0
  33. package/dist/local-inference-routes.d.ts +47 -0
  34. package/dist/local-inference-routes.d.ts.map +1 -0
  35. package/dist/provider.d.ts +21 -0
  36. package/dist/provider.d.ts.map +1 -0
  37. package/dist/routes/compat-helpers.d.ts +18 -0
  38. package/dist/routes/compat-helpers.d.ts.map +1 -0
  39. package/dist/routes/family-member-route.d.ts +62 -0
  40. package/dist/routes/family-member-route.d.ts.map +1 -0
  41. package/dist/routes/index.d.ts +20 -0
  42. package/dist/routes/index.d.ts.map +1 -0
  43. package/dist/routes/index.js +42040 -0
  44. package/dist/routes/index.js.map +236 -0
  45. package/dist/routes/live-diarization-route.d.ts +33 -0
  46. package/dist/routes/live-diarization-route.d.ts.map +1 -0
  47. package/dist/routes/local-inference-asr-route.d.ts +4 -0
  48. package/dist/routes/local-inference-asr-route.d.ts.map +1 -0
  49. package/dist/routes/local-inference-asr-transcribe.d.ts +20 -0
  50. package/dist/routes/local-inference-asr-transcribe.d.ts.map +1 -0
  51. package/dist/routes/local-inference-compat-routes.d.ts +16 -0
  52. package/dist/routes/local-inference-compat-routes.d.ts.map +1 -0
  53. package/dist/routes/local-inference-tts-route.d.ts +7 -0
  54. package/dist/routes/local-inference-tts-route.d.ts.map +1 -0
  55. package/dist/routes/native-pcm-turn-route.d.ts +3 -0
  56. package/dist/routes/native-pcm-turn-route.d.ts.map +1 -0
  57. package/dist/routes/transcript-audio-store.d.ts +15 -0
  58. package/dist/routes/transcript-audio-store.d.ts.map +1 -0
  59. package/dist/routes/transcripts-routes.d.ts +44 -0
  60. package/dist/routes/transcripts-routes.d.ts.map +1 -0
  61. package/dist/routes/voice-first-run-routes.d.ts +62 -0
  62. package/dist/routes/voice-first-run-routes.d.ts.map +1 -0
  63. package/dist/routes/voice-models-routes.d.ts +62 -0
  64. package/dist/routes/voice-models-routes.d.ts.map +1 -0
  65. package/dist/routes/voice-profile-plugin-routes.d.ts +19 -0
  66. package/dist/routes/voice-profile-plugin-routes.d.ts.map +1 -0
  67. package/dist/routes/voice-profiles-management-routes.d.ts +52 -0
  68. package/dist/routes/voice-profiles-management-routes.d.ts.map +1 -0
  69. package/dist/routes/voice-speaker-profile-routes.d.ts +57 -0
  70. package/dist/routes/voice-speaker-profile-routes.d.ts.map +1 -0
  71. package/dist/runtime/embedding-manager-support.d.ts +77 -0
  72. package/dist/runtime/embedding-manager-support.d.ts.map +1 -0
  73. package/dist/runtime/embedding-presets.d.ts +16 -0
  74. package/dist/runtime/embedding-presets.d.ts.map +1 -0
  75. package/dist/runtime/embedding-warmup-policy.d.ts +14 -0
  76. package/dist/runtime/embedding-warmup-policy.d.ts.map +1 -0
  77. package/dist/runtime/ensure-local-inference-handler.d.ts +70 -0
  78. package/dist/runtime/ensure-local-inference-handler.d.ts.map +1 -0
  79. package/dist/runtime/index.d.ts +15 -0
  80. package/dist/runtime/index.d.ts.map +1 -0
  81. package/dist/runtime/index.js +38768 -0
  82. package/dist/runtime/index.js.map +217 -0
  83. package/dist/runtime/mobile-local-inference-gate.d.ts +63 -0
  84. package/dist/runtime/mobile-local-inference-gate.d.ts.map +1 -0
  85. package/dist/runtime/voice-entity-binding.d.ts +113 -0
  86. package/dist/runtime/voice-entity-binding.d.ts.map +1 -0
  87. package/dist/services/active-model.d.ts +310 -0
  88. package/dist/services/active-model.d.ts.map +1 -0
  89. package/dist/services/asr-provenance.d.ts +5 -0
  90. package/dist/services/asr-provenance.d.ts.map +1 -0
  91. package/dist/services/assignments.d.ts +84 -0
  92. package/dist/services/assignments.d.ts.map +1 -0
  93. package/dist/services/backend-selector.d.ts +55 -0
  94. package/dist/services/backend-selector.d.ts.map +1 -0
  95. package/dist/services/backend.d.ts +440 -0
  96. package/dist/services/backend.d.ts.map +1 -0
  97. package/dist/services/bionic-host-loader.d.ts +67 -0
  98. package/dist/services/bionic-host-loader.d.ts.map +1 -0
  99. package/dist/services/bundled-models.d.ts +34 -0
  100. package/dist/services/bundled-models.d.ts.map +1 -0
  101. package/dist/services/cache-bridge.d.ts +206 -0
  102. package/dist/services/cache-bridge.d.ts.map +1 -0
  103. package/dist/services/catalog.d.ts +10 -0
  104. package/dist/services/catalog.d.ts.map +1 -0
  105. package/dist/services/checkpoint-client.d.ts +109 -0
  106. package/dist/services/checkpoint-client.d.ts.map +1 -0
  107. package/dist/services/checkpoint-manager.d.ts +217 -0
  108. package/dist/services/checkpoint-manager.d.ts.map +1 -0
  109. package/dist/services/cloud-fallback.d.ts +102 -0
  110. package/dist/services/cloud-fallback.d.ts.map +1 -0
  111. package/dist/services/context-fit.d.ts +36 -0
  112. package/dist/services/context-fit.d.ts.map +1 -0
  113. package/dist/services/conversation-registry.d.ts +142 -0
  114. package/dist/services/conversation-registry.d.ts.map +1 -0
  115. package/dist/services/desktop-fused-ffi-backend-runtime.d.ts +111 -0
  116. package/dist/services/desktop-fused-ffi-backend-runtime.d.ts.map +1 -0
  117. package/dist/services/device-bridge.d.ts +188 -0
  118. package/dist/services/device-bridge.d.ts.map +1 -0
  119. package/dist/services/device-resource-metrics.d.ts +149 -0
  120. package/dist/services/device-resource-metrics.d.ts.map +1 -0
  121. package/dist/services/device-tier.d.ts +133 -0
  122. package/dist/services/device-tier.d.ts.map +1 -0
  123. package/dist/services/downloader.d.ts +94 -0
  124. package/dist/services/downloader.d.ts.map +1 -0
  125. package/dist/services/engine.d.ts +579 -0
  126. package/dist/services/engine.d.ts.map +1 -0
  127. package/dist/services/ensure-local-artifacts.d.ts +82 -0
  128. package/dist/services/ensure-local-artifacts.d.ts.map +1 -0
  129. package/dist/services/external-scanner.d.ts +17 -0
  130. package/dist/services/external-scanner.d.ts.map +1 -0
  131. package/dist/services/ffi-llm-mock.d.ts +90 -0
  132. package/dist/services/ffi-llm-mock.d.ts.map +1 -0
  133. package/dist/services/ffi-llm-streaming-abi.d.ts +318 -0
  134. package/dist/services/ffi-llm-streaming-abi.d.ts.map +1 -0
  135. package/dist/services/ffi-streaming-backend.d.ts +201 -0
  136. package/dist/services/ffi-streaming-backend.d.ts.map +1 -0
  137. package/dist/services/ffi-streaming-runner.d.ts +146 -0
  138. package/dist/services/ffi-streaming-runner.d.ts.map +1 -0
  139. package/dist/services/gpu-autotune.d.ts +150 -0
  140. package/dist/services/gpu-autotune.d.ts.map +1 -0
  141. package/dist/services/gpu-detect.d.ts +56 -0
  142. package/dist/services/gpu-detect.d.ts.map +1 -0
  143. package/dist/services/handler-registry.d.ts +72 -0
  144. package/dist/services/handler-registry.d.ts.map +1 -0
  145. package/dist/services/hardware.d.ts +63 -0
  146. package/dist/services/hardware.d.ts.map +1 -0
  147. package/dist/services/image-description-runtime.d.ts +14 -0
  148. package/dist/services/image-description-runtime.d.ts.map +1 -0
  149. package/dist/services/imagegen/aosp-unavailable.d.ts +134 -0
  150. package/dist/services/imagegen/aosp-unavailable.d.ts.map +1 -0
  151. package/dist/services/imagegen/backend-selector.d.ts +118 -0
  152. package/dist/services/imagegen/backend-selector.d.ts.map +1 -0
  153. package/dist/services/imagegen/coreml-unavailable.d.ts +105 -0
  154. package/dist/services/imagegen/coreml-unavailable.d.ts.map +1 -0
  155. package/dist/services/imagegen/errors.d.ts +16 -0
  156. package/dist/services/imagegen/errors.d.ts.map +1 -0
  157. package/dist/services/imagegen/index.d.ts +58 -0
  158. package/dist/services/imagegen/index.d.ts.map +1 -0
  159. package/dist/services/imagegen/mflux.d.ts +74 -0
  160. package/dist/services/imagegen/mflux.d.ts.map +1 -0
  161. package/dist/services/imagegen/sd-cpp.d.ts +181 -0
  162. package/dist/services/imagegen/sd-cpp.d.ts.map +1 -0
  163. package/dist/services/imagegen/tensorrt-unavailable.d.ts +83 -0
  164. package/dist/services/imagegen/tensorrt-unavailable.d.ts.map +1 -0
  165. package/dist/services/imagegen/types.d.ts +181 -0
  166. package/dist/services/imagegen/types.d.ts.map +1 -0
  167. package/dist/services/index.d.ts +31 -0
  168. package/dist/services/index.d.ts.map +1 -0
  169. package/dist/services/index.js +39453 -0
  170. package/dist/services/index.js.map +227 -0
  171. package/dist/services/inference-capabilities.d.ts +132 -0
  172. package/dist/services/inference-capabilities.d.ts.map +1 -0
  173. package/dist/services/inference-telemetry.d.ts +59 -0
  174. package/dist/services/inference-telemetry.d.ts.map +1 -0
  175. package/dist/services/ios-llama-streaming.d.ts +119 -0
  176. package/dist/services/ios-llama-streaming.d.ts.map +1 -0
  177. package/dist/services/kv-spill.d.ts +189 -0
  178. package/dist/services/kv-spill.d.ts.map +1 -0
  179. package/dist/services/latency-trace.d.ts +346 -0
  180. package/dist/services/latency-trace.d.ts.map +1 -0
  181. package/dist/services/lib-target.d.ts +55 -0
  182. package/dist/services/lib-target.d.ts.map +1 -0
  183. package/dist/services/live-signals.d.ts +86 -0
  184. package/dist/services/live-signals.d.ts.map +1 -0
  185. package/dist/services/llama-server-metrics.d.ts +114 -0
  186. package/dist/services/llama-server-metrics.d.ts.map +1 -0
  187. package/dist/services/llm-streaming-binding.d.ts +96 -0
  188. package/dist/services/llm-streaming-binding.d.ts.map +1 -0
  189. package/dist/services/load-args.d.ts +82 -0
  190. package/dist/services/load-args.d.ts.map +1 -0
  191. package/dist/services/manifest/index.d.ts +4 -0
  192. package/dist/services/manifest/index.d.ts.map +1 -0
  193. package/dist/services/manifest/schema.d.ts +903 -0
  194. package/dist/services/manifest/schema.d.ts.map +1 -0
  195. package/dist/services/manifest/types.d.ts +32 -0
  196. package/dist/services/manifest/types.d.ts.map +1 -0
  197. package/dist/services/manifest/validator.d.ts +66 -0
  198. package/dist/services/manifest/validator.d.ts.map +1 -0
  199. package/dist/services/memory-arbiter.d.ts +348 -0
  200. package/dist/services/memory-arbiter.d.ts.map +1 -0
  201. package/dist/services/memory-benchmark.d.ts +76 -0
  202. package/dist/services/memory-benchmark.d.ts.map +1 -0
  203. package/dist/services/memory-monitor.d.ts +128 -0
  204. package/dist/services/memory-monitor.d.ts.map +1 -0
  205. package/dist/services/memory-pressure.d.ts +130 -0
  206. package/dist/services/memory-pressure.d.ts.map +1 -0
  207. package/dist/services/mtp-doctor.d.ts +13 -0
  208. package/dist/services/mtp-doctor.d.ts.map +1 -0
  209. package/dist/services/network-policy.d.ts +127 -0
  210. package/dist/services/network-policy.d.ts.map +1 -0
  211. package/dist/services/paths.d.ts +6 -0
  212. package/dist/services/paths.d.ts.map +1 -0
  213. package/dist/services/planner-skeleton.d.ts +124 -0
  214. package/dist/services/planner-skeleton.d.ts.map +1 -0
  215. package/dist/services/providers.d.ts +38 -0
  216. package/dist/services/providers.d.ts.map +1 -0
  217. package/dist/services/ram-budget.d.ts +110 -0
  218. package/dist/services/ram-budget.d.ts.map +1 -0
  219. package/dist/services/readiness.d.ts +9 -0
  220. package/dist/services/readiness.d.ts.map +1 -0
  221. package/dist/services/recommendation.d.ts +111 -0
  222. package/dist/services/recommendation.d.ts.map +1 -0
  223. package/dist/services/registry.d.ts +33 -0
  224. package/dist/services/registry.d.ts.map +1 -0
  225. package/dist/services/router-handler.d.ts +92 -0
  226. package/dist/services/router-handler.d.ts.map +1 -0
  227. package/dist/services/routing-policy.d.ts +92 -0
  228. package/dist/services/routing-policy.d.ts.map +1 -0
  229. package/dist/services/routing-preferences.d.ts +8 -0
  230. package/dist/services/routing-preferences.d.ts.map +1 -0
  231. package/dist/services/runtime-target.d.ts +98 -0
  232. package/dist/services/runtime-target.d.ts.map +1 -0
  233. package/dist/services/service.d.ts +128 -0
  234. package/dist/services/service.d.ts.map +1 -0
  235. package/dist/services/session-pool.d.ts +72 -0
  236. package/dist/services/session-pool.d.ts.map +1 -0
  237. package/dist/services/structured-output/deterministic-repair.d.ts +23 -0
  238. package/dist/services/structured-output/deterministic-repair.d.ts.map +1 -0
  239. package/dist/services/structured-output/index.d.ts +2 -0
  240. package/dist/services/structured-output/index.d.ts.map +1 -0
  241. package/dist/services/structured-output.d.ts +311 -0
  242. package/dist/services/structured-output.d.ts.map +1 -0
  243. package/dist/services/system-memory.d.ts +33 -0
  244. package/dist/services/system-memory.d.ts.map +1 -0
  245. package/dist/services/types.d.ts +19 -0
  246. package/dist/services/types.d.ts.map +1 -0
  247. package/dist/services/verify-on-device.d.ts +34 -0
  248. package/dist/services/verify-on-device.d.ts.map +1 -0
  249. package/dist/services/verify.d.ts +8 -0
  250. package/dist/services/verify.d.ts.map +1 -0
  251. package/dist/services/vision/aosp-unavailable.d.ts +115 -0
  252. package/dist/services/vision/aosp-unavailable.d.ts.map +1 -0
  253. package/dist/services/vision/capacitor-llama.d.ts +99 -0
  254. package/dist/services/vision/capacitor-llama.d.ts.map +1 -0
  255. package/dist/services/vision/cloud-fallback.d.ts +47 -0
  256. package/dist/services/vision/cloud-fallback.d.ts.map +1 -0
  257. package/dist/services/vision/hash.d.ts +71 -0
  258. package/dist/services/vision/hash.d.ts.map +1 -0
  259. package/dist/services/vision/index.d.ts +95 -0
  260. package/dist/services/vision/index.d.ts.map +1 -0
  261. package/dist/services/vision/llama-server.d.ts +73 -0
  262. package/dist/services/vision/llama-server.d.ts.map +1 -0
  263. package/dist/services/vision/types.d.ts +162 -0
  264. package/dist/services/vision/types.d.ts.map +1 -0
  265. package/dist/services/vision/vast-fallback.d.ts +18 -0
  266. package/dist/services/vision/vast-fallback.d.ts.map +1 -0
  267. package/dist/services/vision-embedding-cache.d.ts +98 -0
  268. package/dist/services/vision-embedding-cache.d.ts.map +1 -0
  269. package/dist/services/voice/__test-helpers__/fake-ffi.d.ts +27 -0
  270. package/dist/services/voice/__test-helpers__/fake-ffi.d.ts.map +1 -0
  271. package/dist/services/voice/__test-helpers__/synthetic-speech.d.ts +66 -0
  272. package/dist/services/voice/__test-helpers__/synthetic-speech.d.ts.map +1 -0
  273. package/dist/services/voice/acoustic-speaker-attribution.d.ts +61 -0
  274. package/dist/services/voice/acoustic-speaker-attribution.d.ts.map +1 -0
  275. package/dist/services/voice/audio-frame-consumer.d.ts +294 -0
  276. package/dist/services/voice/audio-frame-consumer.d.ts.map +1 -0
  277. package/dist/services/voice/barge-in.d.ts +112 -0
  278. package/dist/services/voice/barge-in.d.ts.map +1 -0
  279. package/dist/services/voice/cancellation-coordinator.d.ts +127 -0
  280. package/dist/services/voice/cancellation-coordinator.d.ts.map +1 -0
  281. package/dist/services/voice/checkpoint-manager.d.ts +199 -0
  282. package/dist/services/voice/checkpoint-manager.d.ts.map +1 -0
  283. package/dist/services/voice/checkpoint-policy.d.ts +178 -0
  284. package/dist/services/voice/checkpoint-policy.d.ts.map +1 -0
  285. package/dist/services/voice/corpus-augment.d.ts +111 -0
  286. package/dist/services/voice/corpus-augment.d.ts.map +1 -0
  287. package/dist/services/voice/corpus-generator.d.ts +134 -0
  288. package/dist/services/voice/corpus-generator.d.ts.map +1 -0
  289. package/dist/services/voice/diarization-error-rate.d.ts +40 -0
  290. package/dist/services/voice/diarization-error-rate.d.ts.map +1 -0
  291. package/dist/services/voice/e2e-harness.d.ts +297 -0
  292. package/dist/services/voice/e2e-harness.d.ts.map +1 -0
  293. package/dist/services/voice/eager-context-builder.d.ts +170 -0
  294. package/dist/services/voice/eager-context-builder.d.ts.map +1 -0
  295. package/dist/services/voice/echo-delay.d.ts +67 -0
  296. package/dist/services/voice/echo-delay.d.ts.map +1 -0
  297. package/dist/services/voice/echo-metrics.d.ts +7 -0
  298. package/dist/services/voice/echo-metrics.d.ts.map +1 -0
  299. package/dist/services/voice/echo-reference-buffer.d.ts +65 -0
  300. package/dist/services/voice/echo-reference-buffer.d.ts.map +1 -0
  301. package/dist/services/voice/eliza1-eot-scorer.d.ts +124 -0
  302. package/dist/services/voice/eliza1-eot-scorer.d.ts.map +1 -0
  303. package/dist/services/voice/embedding-server.d.ts +37 -0
  304. package/dist/services/voice/embedding-server.d.ts.map +1 -0
  305. package/dist/services/voice/embedding.d.ts +132 -0
  306. package/dist/services/voice/embedding.d.ts.map +1 -0
  307. package/dist/services/voice/emotion-attribution.d.ts +68 -0
  308. package/dist/services/voice/emotion-attribution.d.ts.map +1 -0
  309. package/dist/services/voice/engine-bridge.d.ts +762 -0
  310. package/dist/services/voice/engine-bridge.d.ts.map +1 -0
  311. package/dist/services/voice/eot-classifier-ggml.d.ts +179 -0
  312. package/dist/services/voice/eot-classifier-ggml.d.ts.map +1 -0
  313. package/dist/services/voice/eot-classifier.d.ts +211 -0
  314. package/dist/services/voice/eot-classifier.d.ts.map +1 -0
  315. package/dist/services/voice/errors.d.ts +20 -0
  316. package/dist/services/voice/errors.d.ts.map +1 -0
  317. package/dist/services/voice/expressive-tags.d.ts +158 -0
  318. package/dist/services/voice/expressive-tags.d.ts.map +1 -0
  319. package/dist/services/voice/ffi-bindings.d.ts +696 -0
  320. package/dist/services/voice/ffi-bindings.d.ts.map +1 -0
  321. package/dist/services/voice/first-line-cache.d.ts +181 -0
  322. package/dist/services/voice/first-line-cache.d.ts.map +1 -0
  323. package/dist/services/voice/fused-eot-scorer.d.ts +51 -0
  324. package/dist/services/voice/fused-eot-scorer.d.ts.map +1 -0
  325. package/dist/services/voice/index.d.ts +96 -0
  326. package/dist/services/voice/index.d.ts.map +1 -0
  327. package/dist/services/voice/kokoro/index.d.ts +24 -0
  328. package/dist/services/voice/kokoro/index.d.ts.map +1 -0
  329. package/dist/services/voice/kokoro/kokoro-backend.d.ts +87 -0
  330. package/dist/services/voice/kokoro/kokoro-backend.d.ts.map +1 -0
  331. package/dist/services/voice/kokoro/kokoro-engine-discovery.d.ts +58 -0
  332. package/dist/services/voice/kokoro/kokoro-engine-discovery.d.ts.map +1 -0
  333. package/dist/services/voice/kokoro/kokoro-ffi-runtime.d.ts +75 -0
  334. package/dist/services/voice/kokoro/kokoro-ffi-runtime.d.ts.map +1 -0
  335. package/dist/services/voice/kokoro/kokoro-runtime.d.ts +100 -0
  336. package/dist/services/voice/kokoro/kokoro-runtime.d.ts.map +1 -0
  337. package/dist/services/voice/kokoro/phoneme-stream.d.ts +51 -0
  338. package/dist/services/voice/kokoro/phoneme-stream.d.ts.map +1 -0
  339. package/dist/services/voice/kokoro/phonemizer.d.ts +50 -0
  340. package/dist/services/voice/kokoro/phonemizer.d.ts.map +1 -0
  341. package/dist/services/voice/kokoro/pick-runtime.d.ts +61 -0
  342. package/dist/services/voice/kokoro/pick-runtime.d.ts.map +1 -0
  343. package/dist/services/voice/kokoro/runtime-selection.d.ts +31 -0
  344. package/dist/services/voice/kokoro/runtime-selection.d.ts.map +1 -0
  345. package/dist/services/voice/kokoro/types.d.ts +82 -0
  346. package/dist/services/voice/kokoro/types.d.ts.map +1 -0
  347. package/dist/services/voice/kokoro/voice-presets.d.ts +23 -0
  348. package/dist/services/voice/kokoro/voice-presets.d.ts.map +1 -0
  349. package/dist/services/voice/kokoro/voices.d.ts +30 -0
  350. package/dist/services/voice/kokoro/voices.d.ts.map +1 -0
  351. package/dist/services/voice/lifecycle.d.ts +135 -0
  352. package/dist/services/voice/lifecycle.d.ts.map +1 -0
  353. package/dist/services/voice/live-diarization-session.d.ts +196 -0
  354. package/dist/services/voice/live-diarization-session.d.ts.map +1 -0
  355. package/dist/services/voice/metric-math.d.ts +10 -0
  356. package/dist/services/voice/metric-math.d.ts.map +1 -0
  357. package/dist/services/voice/mic-source.d.ts +136 -0
  358. package/dist/services/voice/mic-source.d.ts.map +1 -0
  359. package/dist/services/voice/nlms-echo-canceller.d.ts +137 -0
  360. package/dist/services/voice/nlms-echo-canceller.d.ts.map +1 -0
  361. package/dist/services/voice/optimistic-policy.d.ts +109 -0
  362. package/dist/services/voice/optimistic-policy.d.ts.map +1 -0
  363. package/dist/services/voice/optimistic-rollback.d.ts +151 -0
  364. package/dist/services/voice/optimistic-rollback.d.ts.map +1 -0
  365. package/dist/services/voice/partial-stabilizer.d.ts +73 -0
  366. package/dist/services/voice/partial-stabilizer.d.ts.map +1 -0
  367. package/dist/services/voice/phoneme-tokenizer.d.ts +49 -0
  368. package/dist/services/voice/phoneme-tokenizer.d.ts.map +1 -0
  369. package/dist/services/voice/phrase-cache.d.ts +76 -0
  370. package/dist/services/voice/phrase-cache.d.ts.map +1 -0
  371. package/dist/services/voice/phrase-chunker.d.ts +62 -0
  372. package/dist/services/voice/phrase-chunker.d.ts.map +1 -0
  373. package/dist/services/voice/pipeline-impls.d.ts +151 -0
  374. package/dist/services/voice/pipeline-impls.d.ts.map +1 -0
  375. package/dist/services/voice/pipeline.d.ts +216 -0
  376. package/dist/services/voice/pipeline.d.ts.map +1 -0
  377. package/dist/services/voice/prefill-client.d.ts +123 -0
  378. package/dist/services/voice/prefill-client.d.ts.map +1 -0
  379. package/dist/services/voice/prefix-preserving-queue.d.ts +113 -0
  380. package/dist/services/voice/prefix-preserving-queue.d.ts.map +1 -0
  381. package/dist/services/voice/profile-store.d.ts +248 -0
  382. package/dist/services/voice/profile-store.d.ts.map +1 -0
  383. package/dist/services/voice/ring-buffer.d.ts +40 -0
  384. package/dist/services/voice/ring-buffer.d.ts.map +1 -0
  385. package/dist/services/voice/rollback-queue.d.ts +24 -0
  386. package/dist/services/voice/rollback-queue.d.ts.map +1 -0
  387. package/dist/services/voice/samantha-preset-placeholder.d.ts +67 -0
  388. package/dist/services/voice/samantha-preset-placeholder.d.ts.map +1 -0
  389. package/dist/services/voice/samantha-preset-regenerator.d.ts +87 -0
  390. package/dist/services/voice/samantha-preset-regenerator.d.ts.map +1 -0
  391. package/dist/services/voice/scheduler.d.ts +146 -0
  392. package/dist/services/voice/scheduler.d.ts.map +1 -0
  393. package/dist/services/voice/self-voice-imprint.d.ts +33 -0
  394. package/dist/services/voice/self-voice-imprint.d.ts.map +1 -0
  395. package/dist/services/voice/shared-resources.d.ts +204 -0
  396. package/dist/services/voice/shared-resources.d.ts.map +1 -0
  397. package/dist/services/voice/speaker/attribution-pipeline.d.ts +74 -0
  398. package/dist/services/voice/speaker/attribution-pipeline.d.ts.map +1 -0
  399. package/dist/services/voice/speaker/diarizer-fused.d.ts +59 -0
  400. package/dist/services/voice/speaker/diarizer-fused.d.ts.map +1 -0
  401. package/dist/services/voice/speaker/diarizer.d.ts +75 -0
  402. package/dist/services/voice/speaker/diarizer.d.ts.map +1 -0
  403. package/dist/services/voice/speaker/encoder-fused.d.ts +60 -0
  404. package/dist/services/voice/speaker/encoder-fused.d.ts.map +1 -0
  405. package/dist/services/voice/speaker/encoder-ggml.d.ts +33 -0
  406. package/dist/services/voice/speaker/encoder-ggml.d.ts.map +1 -0
  407. package/dist/services/voice/speaker/encoder.d.ts +37 -0
  408. package/dist/services/voice/speaker/encoder.d.ts.map +1 -0
  409. package/dist/services/voice/speaker-imprint.d.ts +83 -0
  410. package/dist/services/voice/speaker-imprint.d.ts.map +1 -0
  411. package/dist/services/voice/speaker-preset-cache.d.ts +77 -0
  412. package/dist/services/voice/speaker-preset-cache.d.ts.map +1 -0
  413. package/dist/services/voice/streaming-asr/streaming-pipeline-adapter.d.ts +160 -0
  414. package/dist/services/voice/streaming-asr/streaming-pipeline-adapter.d.ts.map +1 -0
  415. package/dist/services/voice/system-audio-sink.d.ts +73 -0
  416. package/dist/services/voice/system-audio-sink.d.ts.map +1 -0
  417. package/dist/services/voice/transcriber.d.ts +244 -0
  418. package/dist/services/voice/transcriber.d.ts.map +1 -0
  419. package/dist/services/voice/transcript-knowledge.d.ts +37 -0
  420. package/dist/services/voice/transcript-knowledge.d.ts.map +1 -0
  421. package/dist/services/voice/transcript-service.d.ts +60 -0
  422. package/dist/services/voice/transcript-service.d.ts.map +1 -0
  423. package/dist/services/voice/transcript-store.d.ts +64 -0
  424. package/dist/services/voice/transcript-store.d.ts.map +1 -0
  425. package/dist/services/voice/turn-controller.d.ts +183 -0
  426. package/dist/services/voice/turn-controller.d.ts.map +1 -0
  427. package/dist/services/voice/types.d.ts +643 -0
  428. package/dist/services/voice/types.d.ts.map +1 -0
  429. package/dist/services/voice/vad.d.ts +283 -0
  430. package/dist/services/voice/vad.d.ts.map +1 -0
  431. package/dist/services/voice/voice-budget.d.ts +241 -0
  432. package/dist/services/voice/voice-budget.d.ts.map +1 -0
  433. package/dist/services/voice/voice-emotion-classifier.d.ts +95 -0
  434. package/dist/services/voice/voice-emotion-classifier.d.ts.map +1 -0
  435. package/dist/services/voice/voice-preload-predictor.d.ts +76 -0
  436. package/dist/services/voice/voice-preload-predictor.d.ts.map +1 -0
  437. package/dist/services/voice/voice-preset-format.d.ts +158 -0
  438. package/dist/services/voice/voice-preset-format.d.ts.map +1 -0
  439. package/dist/services/voice/voice-profile-artifact.d.ts +116 -0
  440. package/dist/services/voice/voice-profile-artifact.d.ts.map +1 -0
  441. package/dist/services/voice/voice-profile-routes.d.ts +83 -0
  442. package/dist/services/voice/voice-profile-routes.d.ts.map +1 -0
  443. package/dist/services/voice/voice-scenario.d.ts +131 -0
  444. package/dist/services/voice/voice-scenario.d.ts.map +1 -0
  445. package/dist/services/voice/voice-state-machine.d.ts +364 -0
  446. package/dist/services/voice/voice-state-machine.d.ts.map +1 -0
  447. package/dist/services/voice/voice-workbench-report.d.ts +117 -0
  448. package/dist/services/voice/voice-workbench-report.d.ts.map +1 -0
  449. package/dist/services/voice/wake-word-ggml.d.ts +100 -0
  450. package/dist/services/voice/wake-word-ggml.d.ts.map +1 -0
  451. package/dist/services/voice/wake-word.d.ts +255 -0
  452. package/dist/services/voice/wake-word.d.ts.map +1 -0
  453. package/dist/services/voice/wav-codec.d.ts +11 -0
  454. package/dist/services/voice/wav-codec.d.ts.map +1 -0
  455. package/dist/services/voice/workbench-entrypoint.d.ts +42 -0
  456. package/dist/services/voice/workbench-entrypoint.d.ts.map +1 -0
  457. package/dist/services/voice/workbench-headless-runner.d.ts +102 -0
  458. package/dist/services/voice/workbench-headless-runner.d.ts.map +1 -0
  459. package/dist/services/voice/workbench-logic-services.d.ts +36 -0
  460. package/dist/services/voice/workbench-logic-services.d.ts.map +1 -0
  461. package/dist/services/voice/workbench-real-services.d.ts +17 -0
  462. package/dist/services/voice/workbench-real-services.d.ts.map +1 -0
  463. package/dist/services/voice/workbench-scenarios.d.ts +24 -0
  464. package/dist/services/voice/workbench-scenarios.d.ts.map +1 -0
  465. package/dist/services/voice/wrap-with-first-line-cache.d.ts +70 -0
  466. package/dist/services/voice/wrap-with-first-line-cache.d.ts.map +1 -0
  467. package/dist/services/voice-model-updater.d.ts +240 -0
  468. package/dist/services/voice-model-updater.d.ts.map +1 -0
  469. package/dist/services/voice-prewarm.d.ts +3 -0
  470. package/dist/services/voice-prewarm.d.ts.map +1 -0
  471. package/dist/voice-workbench.d.ts +18 -0
  472. package/dist/voice-workbench.d.ts.map +1 -0
  473. package/dist/voice-workbench.js +5259 -0
  474. package/dist/voice-workbench.js.map +34 -0
  475. package/package.json +101 -15
  476. package/registry-entry.json +137 -0
  477. package/src/actions/generate-media.ts +647 -0
  478. package/src/actions/identify-speaker.ts +171 -0
  479. package/src/actions/transcription-control.test.ts +100 -0
  480. package/src/actions/transcription-control.ts +127 -0
  481. package/src/adapters/capacitor-llama/__tests__/compat-behavior.test.ts +218 -0
  482. package/src/adapters/capacitor-llama/__tests__/index.test.ts +68 -0
  483. package/src/adapters/capacitor-llama/__tests__/structured-output.test.ts +215 -0
  484. package/src/adapters/capacitor-llama/__tests__/text-streaming.test.ts +174 -0
  485. package/src/adapters/capacitor-llama/__tests__/voice-turn.test.ts +293 -0
  486. package/src/adapters/capacitor-llama/environment.ts +71 -0
  487. package/src/adapters/capacitor-llama/index.browser.ts +83 -0
  488. package/src/adapters/capacitor-llama/index.ts +831 -0
  489. package/src/adapters/capacitor-llama/loader.ts +109 -0
  490. package/src/adapters/capacitor-llama/native-voice-capture.ts +140 -0
  491. package/src/adapters/capacitor-llama/structured-output.ts +165 -0
  492. package/src/adapters/capacitor-llama/text-streaming.ts +227 -0
  493. package/src/adapters/capacitor-llama/types.ts +374 -0
  494. package/src/adapters/capacitor-llama/voice-turn.ts +178 -0
  495. package/src/backends/apple-foundation.ts +127 -0
  496. package/src/index.ts +62 -0
  497. package/src/local-inference-routes.test.ts +390 -0
  498. package/src/local-inference-routes.ts +1625 -0
  499. package/src/provider.ts +1111 -0
  500. package/src/routes/compat-helpers.ts +275 -0
  501. package/src/routes/family-member-route.ts +353 -0
  502. package/src/routes/index.ts +61 -0
  503. package/src/routes/live-diarization-route.test.ts +347 -0
  504. package/src/routes/live-diarization-route.ts +198 -0
  505. package/src/routes/local-inference-asr-route.test.ts +246 -0
  506. package/src/routes/local-inference-asr-route.ts +166 -0
  507. package/src/routes/local-inference-asr-transcribe.test.ts +118 -0
  508. package/src/routes/local-inference-asr-transcribe.ts +97 -0
  509. package/src/routes/local-inference-compat-routes.test.ts +485 -0
  510. package/src/routes/local-inference-compat-routes.ts +775 -0
  511. package/src/routes/local-inference-tts-route.test.ts +179 -0
  512. package/src/routes/local-inference-tts-route.ts +230 -0
  513. package/src/routes/native-pcm-turn-route.test.ts +136 -0
  514. package/src/routes/native-pcm-turn-route.ts +121 -0
  515. package/src/routes/transcript-audio-store.ts +27 -0
  516. package/src/routes/transcripts-routes.test.ts +195 -0
  517. package/src/routes/transcripts-routes.ts +191 -0
  518. package/src/routes/voice-first-run-routes.ts +524 -0
  519. package/src/routes/voice-models-routes.ts +554 -0
  520. package/src/routes/voice-profile-plugin-routes.ts +138 -0
  521. package/src/routes/voice-profiles-management-routes.ts +476 -0
  522. package/src/routes/voice-speaker-profile-routes.ts +199 -0
  523. package/src/runtime/aosp-llama-loader-selection.test.ts +80 -0
  524. package/src/runtime/bionic-wire-encoding.test.ts +147 -0
  525. package/src/runtime/capacitor-llama.d.ts +25 -0
  526. package/src/runtime/embedding-manager-support.ts +497 -0
  527. package/src/runtime/embedding-presets.ts +81 -0
  528. package/src/runtime/embedding-warmup-policy.test.ts +53 -0
  529. package/src/runtime/embedding-warmup-policy.ts +48 -0
  530. package/src/runtime/ensure-local-inference-handler.test.ts +726 -0
  531. package/src/runtime/ensure-local-inference-handler.ts +1640 -0
  532. package/src/runtime/index.ts +36 -0
  533. package/src/runtime/mobile-local-inference-gate.test.ts +152 -0
  534. package/src/runtime/mobile-local-inference-gate.ts +99 -0
  535. package/src/runtime/voice-entity-binding.transcript.test.ts +98 -0
  536. package/src/runtime/voice-entity-binding.ts +368 -0
  537. package/src/runtime/voice-speaker-entity-contract.test.ts +149 -0
  538. package/src/services/README.md +71 -0
  539. package/src/services/__tests__/backend-selector.precedence.test.ts +333 -0
  540. package/src/services/__tests__/backend-selector.test.ts +101 -0
  541. package/src/services/__tests__/checkpoint-manager.test.ts +376 -0
  542. package/src/services/__tests__/gpu-autotune.test.ts +400 -0
  543. package/src/services/__tests__/llm-streaming-binding.test.ts +85 -0
  544. package/src/services/__tests__/planner-grammar.test.ts +372 -0
  545. package/src/services/__tests__/runtime-target.test.ts +176 -0
  546. package/src/services/active-model-context-fit.test.ts +125 -0
  547. package/src/services/active-model-switch-rollback.test.ts +183 -0
  548. package/src/services/active-model.ts +1416 -0
  549. package/src/services/asr-provenance.ts +68 -0
  550. package/src/services/assignment-validation.test.ts +118 -0
  551. package/src/services/assignments.test.ts +106 -0
  552. package/src/services/assignments.ts +278 -0
  553. package/src/services/backend-selector.ts +95 -0
  554. package/src/services/backend.test.ts +84 -0
  555. package/src/services/backend.ts +791 -0
  556. package/src/services/bionic-host-loader.test.ts +226 -0
  557. package/src/services/bionic-host-loader.ts +252 -0
  558. package/src/services/bundled-models.ts +129 -0
  559. package/src/services/cache-bridge.test.ts +516 -0
  560. package/src/services/cache-bridge.ts +423 -0
  561. package/src/services/catalog.test.ts +259 -0
  562. package/src/services/catalog.ts +33 -0
  563. package/src/services/checkpoint-client.ts +258 -0
  564. package/src/services/checkpoint-manager.ts +474 -0
  565. package/src/services/cloud-fallback.ts +230 -0
  566. package/src/services/context-fit.test.ts +121 -0
  567. package/src/services/context-fit.ts +113 -0
  568. package/src/services/conversation-registry.test.ts +235 -0
  569. package/src/services/conversation-registry.ts +264 -0
  570. package/src/services/desktop-fused-ffi-backend-runtime.ts +431 -0
  571. package/src/services/device-bridge.ts +1237 -0
  572. package/src/services/device-resource-metrics.test.ts +98 -0
  573. package/src/services/device-resource-metrics.ts +346 -0
  574. package/src/services/device-tier.test.ts +458 -0
  575. package/src/services/device-tier.ts +502 -0
  576. package/src/services/downloader.test.ts +888 -0
  577. package/src/services/downloader.ts +1039 -0
  578. package/src/services/engine-direct-bundle.test.ts +90 -0
  579. package/src/services/engine-streaming.test.ts +80 -0
  580. package/src/services/engine.ts +2096 -0
  581. package/src/services/ensure-local-artifacts.integration.test.ts +273 -0
  582. package/src/services/ensure-local-artifacts.test.ts +368 -0
  583. package/src/services/ensure-local-artifacts.ts +351 -0
  584. package/src/services/external-scanner.ts +312 -0
  585. package/src/services/ffi-llm-mock.ts +354 -0
  586. package/src/services/ffi-llm-streaming-abi.ts +445 -0
  587. package/src/services/ffi-streaming-backend.ts +418 -0
  588. package/src/services/ffi-streaming-runner.test.ts +220 -0
  589. package/src/services/ffi-streaming-runner.ts +407 -0
  590. package/src/services/ffi-unload-ordering.test.ts +166 -0
  591. package/src/services/fused-eliza1-no-regression.test.ts +144 -0
  592. package/src/services/gpu-autotune.ts +534 -0
  593. package/src/services/gpu-detect.ts +139 -0
  594. package/src/services/handler-registry.ts +240 -0
  595. package/src/services/hardware.test.ts +236 -0
  596. package/src/services/hardware.ts +438 -0
  597. package/src/services/image-description-runtime.test.ts +61 -0
  598. package/src/services/image-description-runtime.ts +118 -0
  599. package/src/services/imagegen/aosp-unavailable.ts +229 -0
  600. package/src/services/imagegen/backend-selector.test.ts +190 -0
  601. package/src/services/imagegen/backend-selector.ts +277 -0
  602. package/src/services/imagegen/coreml-unavailable.ts +237 -0
  603. package/src/services/imagegen/errors.ts +40 -0
  604. package/src/services/imagegen/index.ts +144 -0
  605. package/src/services/imagegen/mflux.ts +313 -0
  606. package/src/services/imagegen/sd-cpp.ts +715 -0
  607. package/src/services/imagegen/tensorrt-unavailable.ts +295 -0
  608. package/src/services/imagegen/types.ts +193 -0
  609. package/src/services/index.ts +229 -0
  610. package/src/services/inference-capabilities.test.ts +75 -0
  611. package/src/services/inference-capabilities.ts +204 -0
  612. package/src/services/inference-telemetry.ts +143 -0
  613. package/src/services/ios-llama-streaming.ts +248 -0
  614. package/src/services/kv-spill.test.ts +222 -0
  615. package/src/services/kv-spill.ts +357 -0
  616. package/src/services/latency-trace.test.ts +266 -0
  617. package/src/services/latency-trace.ts +844 -0
  618. package/src/services/lib-target.test.ts +145 -0
  619. package/src/services/lib-target.ts +102 -0
  620. package/src/services/live-signals.test.ts +132 -0
  621. package/src/services/live-signals.ts +177 -0
  622. package/src/services/llama-server-metrics.test.ts +168 -0
  623. package/src/services/llama-server-metrics.ts +304 -0
  624. package/src/services/llm-streaming-binding.ts +136 -0
  625. package/src/services/load-args.ts +81 -0
  626. package/src/services/manifest/eliza-1.manifest.v1.json +790 -0
  627. package/src/services/manifest/index.ts +72 -0
  628. package/src/services/manifest/manifest.test.ts +791 -0
  629. package/src/services/manifest/schema.ts +761 -0
  630. package/src/services/manifest/types.ts +61 -0
  631. package/src/services/manifest/validator.ts +633 -0
  632. package/src/services/memory-arbiter.test.ts +558 -0
  633. package/src/services/memory-arbiter.ts +991 -0
  634. package/src/services/memory-benchmark.test.ts +91 -0
  635. package/src/services/memory-benchmark.ts +354 -0
  636. package/src/services/memory-monitor.test.ts +232 -0
  637. package/src/services/memory-monitor.ts +309 -0
  638. package/src/services/memory-pressure.ts +414 -0
  639. package/src/services/mtp-doctor.ts +86 -0
  640. package/src/services/network-policy.ts +346 -0
  641. package/src/services/paths.ts +25 -0
  642. package/src/services/planner-skeleton.ts +175 -0
  643. package/src/services/providers.ts +507 -0
  644. package/src/services/ram-budget-cache.test.ts +164 -0
  645. package/src/services/ram-budget.ts +309 -0
  646. package/src/services/readiness.test.ts +87 -0
  647. package/src/services/readiness.ts +238 -0
  648. package/src/services/recommendation.test.ts +216 -0
  649. package/src/services/recommendation.ts +671 -0
  650. package/src/services/registry.ts +157 -0
  651. package/src/services/required-kernels-gate.test.ts +64 -0
  652. package/src/services/router-handler.test.ts +45 -0
  653. package/src/services/router-handler.ts +426 -0
  654. package/src/services/routing-policy.test.ts +352 -0
  655. package/src/services/routing-policy.ts +367 -0
  656. package/src/services/routing-preferences.ts +17 -0
  657. package/src/services/runtime-target.ts +154 -0
  658. package/src/services/service.test.ts +223 -0
  659. package/src/services/service.ts +750 -0
  660. package/src/services/session-pool.ts +153 -0
  661. package/src/services/structured-output/deterministic-repair.test.ts +169 -0
  662. package/src/services/structured-output/deterministic-repair.ts +443 -0
  663. package/src/services/structured-output/index.ts +4 -0
  664. package/src/services/structured-output.test.ts +483 -0
  665. package/src/services/structured-output.ts +712 -0
  666. package/src/services/system-memory.test.ts +47 -0
  667. package/src/services/system-memory.ts +67 -0
  668. package/src/services/transcription-priority.test.ts +211 -0
  669. package/src/services/types.ts +59 -0
  670. package/src/services/verify-on-device.test.ts +87 -0
  671. package/src/services/verify-on-device.ts +127 -0
  672. package/src/services/verify.ts +13 -0
  673. package/src/services/vision/aosp-unavailable.ts +163 -0
  674. package/src/services/vision/capacitor-llama.ts +255 -0
  675. package/src/services/vision/cloud-fallback.test.ts +243 -0
  676. package/src/services/vision/cloud-fallback.ts +268 -0
  677. package/src/services/vision/fallback-chain.test.ts +86 -0
  678. package/src/services/vision/hash.ts +157 -0
  679. package/src/services/vision/index.ts +251 -0
  680. package/src/services/vision/llama-server.ts +177 -0
  681. package/src/services/vision/types.ts +163 -0
  682. package/src/services/vision/vast-fallback.ts +127 -0
  683. package/src/services/vision-embedding-cache.ts +189 -0
  684. package/src/services/voice/VOICE_WORKBENCH.md +133 -0
  685. package/src/services/voice/__fixtures__/voice-workbench-logic-baseline.json +180 -0
  686. package/src/services/voice/__test-helpers__/fake-ffi.ts +94 -0
  687. package/src/services/voice/__test-helpers__/synthetic-speech.ts +194 -0
  688. package/src/services/voice/__tests__/checkpoint-manager.test.ts +241 -0
  689. package/src/services/voice/__tests__/checkpoint-policy.test.ts +270 -0
  690. package/src/services/voice/__tests__/eager-context-builder.test.ts +257 -0
  691. package/src/services/voice/__tests__/eliza1-eot-scorer.test.ts +288 -0
  692. package/src/services/voice/__tests__/eot-classifier.test.ts +431 -0
  693. package/src/services/voice/__tests__/optimistic-rollback.test.ts +312 -0
  694. package/src/services/voice/__tests__/prefill-client.test.ts +266 -0
  695. package/src/services/voice/__tests__/prefix-preserving-queue.test.ts +208 -0
  696. package/src/services/voice/__tests__/streaming-asr.test.ts +450 -0
  697. package/src/services/voice/__tests__/streaming-transcriber.test.ts +339 -0
  698. package/src/services/voice/__tests__/turn-detector-resolver.test.ts +195 -0
  699. package/src/services/voice/__tests__/voice-state-machine-prefill.test.ts +275 -0
  700. package/src/services/voice/__tests__/voice-state-machine.test.ts +354 -0
  701. package/src/services/voice/acoustic-speaker-attribution.test.ts +165 -0
  702. package/src/services/voice/acoustic-speaker-attribution.ts +336 -0
  703. package/src/services/voice/asr-timed.real.test.ts +139 -0
  704. package/src/services/voice/audio-frame-consumer.test.ts +669 -0
  705. package/src/services/voice/audio-frame-consumer.ts +651 -0
  706. package/src/services/voice/barge-in.test.ts +244 -0
  707. package/src/services/voice/barge-in.ts +335 -0
  708. package/src/services/voice/cancellation-coordinator.test.ts +196 -0
  709. package/src/services/voice/cancellation-coordinator.ts +269 -0
  710. package/src/services/voice/checkpoint-manager.ts +401 -0
  711. package/src/services/voice/checkpoint-policy.ts +336 -0
  712. package/src/services/voice/composite-eot-classifier.test.ts +59 -0
  713. package/src/services/voice/corpus-augment.test.ts +276 -0
  714. package/src/services/voice/corpus-augment.ts +451 -0
  715. package/src/services/voice/corpus-generator.test.ts +201 -0
  716. package/src/services/voice/corpus-generator.ts +413 -0
  717. package/src/services/voice/diarization-error-rate.greedy.test.ts +140 -0
  718. package/src/services/voice/diarization-error-rate.test.ts +100 -0
  719. package/src/services/voice/diarization-error-rate.ts +249 -0
  720. package/src/services/voice/e2e-harness.der.test.ts +94 -0
  721. package/src/services/voice/e2e-harness.respond-eot-entity.test.ts +277 -0
  722. package/src/services/voice/e2e-harness.security-echo.test.ts +103 -0
  723. package/src/services/voice/e2e-harness.test.ts +182 -0
  724. package/src/services/voice/e2e-harness.ts +902 -0
  725. package/src/services/voice/eager-context-builder.ts +262 -0
  726. package/src/services/voice/echo-delay.test.ts +118 -0
  727. package/src/services/voice/echo-delay.ts +135 -0
  728. package/src/services/voice/echo-metrics.test.ts +17 -0
  729. package/src/services/voice/echo-metrics.ts +20 -0
  730. package/src/services/voice/echo-reference-buffer.test.ts +86 -0
  731. package/src/services/voice/echo-reference-buffer.ts +165 -0
  732. package/src/services/voice/eliza1-eot-scorer.ts +242 -0
  733. package/src/services/voice/embedding-server.ts +200 -0
  734. package/src/services/voice/embedding.test.ts +131 -0
  735. package/src/services/voice/embedding.ts +242 -0
  736. package/src/services/voice/emotion-attribution.test.ts +129 -0
  737. package/src/services/voice/emotion-attribution.ts +361 -0
  738. package/src/services/voice/engine-bridge-cancellation.test.ts +422 -0
  739. package/src/services/voice/engine-bridge-transcript-join.test.ts +278 -0
  740. package/src/services/voice/engine-bridge.test.ts +384 -0
  741. package/src/services/voice/engine-bridge.ts +2343 -0
  742. package/src/services/voice/eot-classifier-ggml.ts +569 -0
  743. package/src/services/voice/eot-classifier.test.ts +98 -0
  744. package/src/services/voice/eot-classifier.ts +422 -0
  745. package/src/services/voice/errors.ts +34 -0
  746. package/src/services/voice/expressive-tags.asr.test.ts +77 -0
  747. package/src/services/voice/expressive-tags.test.ts +102 -0
  748. package/src/services/voice/expressive-tags.ts +405 -0
  749. package/src/services/voice/ffi-bindings.test.ts +735 -0
  750. package/src/services/voice/ffi-bindings.ts +3387 -0
  751. package/src/services/voice/first-line-cache.ts +725 -0
  752. package/src/services/voice/fused-eot-scorer.ts +139 -0
  753. package/src/services/voice/index.ts +502 -0
  754. package/src/services/voice/kokoro/__tests__/kokoro-backend.test.ts +262 -0
  755. package/src/services/voice/kokoro/__tests__/kokoro-engine-bridge.real.test.ts +236 -0
  756. package/src/services/voice/kokoro/__tests__/kokoro-engine-bridge.test.ts +60 -0
  757. package/src/services/voice/kokoro/__tests__/kokoro-engine-discovery.test.ts +277 -0
  758. package/src/services/voice/kokoro/__tests__/kokoro-ffi-runtime.test.ts +235 -0
  759. package/src/services/voice/kokoro/__tests__/kokoro-runtime.test.ts +95 -0
  760. package/src/services/voice/kokoro/__tests__/phonemizer.test.ts +53 -0
  761. package/src/services/voice/kokoro/__tests__/runtime-selection.test.ts +67 -0
  762. package/src/services/voice/kokoro/__tests__/voices.test.ts +57 -0
  763. package/src/services/voice/kokoro/index.ts +79 -0
  764. package/src/services/voice/kokoro/kokoro-backend.ts +223 -0
  765. package/src/services/voice/kokoro/kokoro-engine-discovery.ts +177 -0
  766. package/src/services/voice/kokoro/kokoro-ffi-runtime.ts +233 -0
  767. package/src/services/voice/kokoro/kokoro-runtime.ts +170 -0
  768. package/src/services/voice/kokoro/phoneme-stream.ts +123 -0
  769. package/src/services/voice/kokoro/phonemizer.ts +344 -0
  770. package/src/services/voice/kokoro/pick-runtime.test.ts +91 -0
  771. package/src/services/voice/kokoro/pick-runtime.ts +130 -0
  772. package/src/services/voice/kokoro/runtime-selection.ts +64 -0
  773. package/src/services/voice/kokoro/types.ts +95 -0
  774. package/src/services/voice/kokoro/voice-presets.ts +129 -0
  775. package/src/services/voice/kokoro/voices.ts +64 -0
  776. package/src/services/voice/lifecycle.test.ts +315 -0
  777. package/src/services/voice/lifecycle.ts +301 -0
  778. package/src/services/voice/live-diarization-session.echo.test.ts +232 -0
  779. package/src/services/voice/live-diarization-session.ts +622 -0
  780. package/src/services/voice/metric-math.test.ts +61 -0
  781. package/src/services/voice/metric-math.ts +25 -0
  782. package/src/services/voice/mic-source.test.ts +210 -0
  783. package/src/services/voice/mic-source.ts +503 -0
  784. package/src/services/voice/nlms-echo-canceller.test.ts +244 -0
  785. package/src/services/voice/nlms-echo-canceller.ts +317 -0
  786. package/src/services/voice/optimistic-policy.power-source.test.ts +36 -0
  787. package/src/services/voice/optimistic-policy.test.ts +101 -0
  788. package/src/services/voice/optimistic-policy.ts +192 -0
  789. package/src/services/voice/optimistic-rollback.ts +343 -0
  790. package/src/services/voice/partial-stabilizer.test.ts +68 -0
  791. package/src/services/voice/partial-stabilizer.ts +140 -0
  792. package/src/services/voice/phoneme-tokenizer.ts +158 -0
  793. package/src/services/voice/phrase-cache.test.ts +242 -0
  794. package/src/services/voice/phrase-cache.ts +186 -0
  795. package/src/services/voice/phrase-chunker.test.ts +239 -0
  796. package/src/services/voice/phrase-chunker.ts +281 -0
  797. package/src/services/voice/pipeline-impls.l6.test.ts +110 -0
  798. package/src/services/voice/pipeline-impls.test.ts +292 -0
  799. package/src/services/voice/pipeline-impls.ts +315 -0
  800. package/src/services/voice/pipeline.ts +504 -0
  801. package/src/services/voice/prefill-client.ts +316 -0
  802. package/src/services/voice/prefix-preserving-queue.ts +162 -0
  803. package/src/services/voice/profile-store.ts +887 -0
  804. package/src/services/voice/real-audio-decode.test.ts +148 -0
  805. package/src/services/voice/research/VOICE_8785_ASSESSMENT.md +141 -0
  806. package/src/services/voice/research/VOICE_PIPELINE_RESEARCH_2026.md +117 -0
  807. package/src/services/voice/research/VOICE_VALIDATION_RUNBOOK.md +135 -0
  808. package/src/services/voice/ring-buffer.test.ts +129 -0
  809. package/src/services/voice/ring-buffer.ts +123 -0
  810. package/src/services/voice/rollback-queue.ts +74 -0
  811. package/src/services/voice/samantha-preset-placeholder.test.ts +97 -0
  812. package/src/services/voice/samantha-preset-placeholder.ts +148 -0
  813. package/src/services/voice/samantha-preset-regenerator.ts +393 -0
  814. package/src/services/voice/samantha-preset-regenerator.wav.test.ts +90 -0
  815. package/src/services/voice/scheduler.t2.test.ts +141 -0
  816. package/src/services/voice/scheduler.ts +927 -0
  817. package/src/services/voice/self-voice-imprint.test.ts +59 -0
  818. package/src/services/voice/self-voice-imprint.ts +102 -0
  819. package/src/services/voice/shared-resources.ts +343 -0
  820. package/src/services/voice/speaker/attribution-pipeline.test.ts +221 -0
  821. package/src/services/voice/speaker/attribution-pipeline.ts +449 -0
  822. package/src/services/voice/speaker/diarizer-fused.real.test.ts +100 -0
  823. package/src/services/voice/speaker/diarizer-fused.ts +154 -0
  824. package/src/services/voice/speaker/diarizer.ts +218 -0
  825. package/src/services/voice/speaker/encoder-fused.real.test.ts +113 -0
  826. package/src/services/voice/speaker/encoder-fused.ts +138 -0
  827. package/src/services/voice/speaker/encoder-ggml.test.ts +59 -0
  828. package/src/services/voice/speaker/encoder-ggml.ts +79 -0
  829. package/src/services/voice/speaker/encoder.ts +105 -0
  830. package/src/services/voice/speaker-imprint.test.ts +185 -0
  831. package/src/services/voice/speaker-imprint.ts +312 -0
  832. package/src/services/voice/speaker-preset-cache.test.ts +154 -0
  833. package/src/services/voice/speaker-preset-cache.ts +195 -0
  834. package/src/services/voice/streaming-asr/streaming-pipeline-adapter.ts +292 -0
  835. package/src/services/voice/system-audio-sink.test.ts +29 -0
  836. package/src/services/voice/system-audio-sink.ts +366 -0
  837. package/src/services/voice/transcriber.asr-backend.test.ts +76 -0
  838. package/src/services/voice/transcriber.test.ts +392 -0
  839. package/src/services/voice/transcriber.ts +704 -0
  840. package/src/services/voice/transcript-knowledge.test.ts +68 -0
  841. package/src/services/voice/transcript-knowledge.ts +75 -0
  842. package/src/services/voice/transcript-service.test.ts +195 -0
  843. package/src/services/voice/transcript-service.ts +205 -0
  844. package/src/services/voice/transcript-store.test.ts +189 -0
  845. package/src/services/voice/transcript-store.ts +164 -0
  846. package/src/services/voice/turn-controller.test.ts +575 -0
  847. package/src/services/voice/turn-controller.ts +596 -0
  848. package/src/services/voice/types.ts +699 -0
  849. package/src/services/voice/vad.test.ts +498 -0
  850. package/src/services/voice/vad.ts +832 -0
  851. package/src/services/voice/vad.v1-v4.test.ts +222 -0
  852. package/src/services/voice/voice-budget.test.ts +415 -0
  853. package/src/services/voice/voice-budget.ts +635 -0
  854. package/src/services/voice/voice-duet.test.ts +375 -0
  855. package/src/services/voice/voice-emotion-classifier.test.ts +210 -0
  856. package/src/services/voice/voice-emotion-classifier.ts +273 -0
  857. package/src/services/voice/voice-hardening.fuzz.test.ts +116 -0
  858. package/src/services/voice/voice-preload-predictor.test.ts +130 -0
  859. package/src/services/voice/voice-preload-predictor.ts +113 -0
  860. package/src/services/voice/voice-preset-format.fuzz.test.ts +89 -0
  861. package/src/services/voice/voice-preset-format.test.ts +75 -0
  862. package/src/services/voice/voice-preset-format.ts +713 -0
  863. package/src/services/voice/voice-preset-generator.test.ts +89 -0
  864. package/src/services/voice/voice-profile-artifact.test.ts +138 -0
  865. package/src/services/voice/voice-profile-artifact.ts +518 -0
  866. package/src/services/voice/voice-profile-routes.test.ts +429 -0
  867. package/src/services/voice/voice-profile-routes.ts +425 -0
  868. package/src/services/voice/voice-scenario.test.ts +159 -0
  869. package/src/services/voice/voice-scenario.ts +280 -0
  870. package/src/services/voice/voice-scenario.turn-helpers.test.ts +77 -0
  871. package/src/services/voice/voice-state-machine.ts +727 -0
  872. package/src/services/voice/voice-workbench-report.test.ts +168 -0
  873. package/src/services/voice/voice-workbench-report.ts +367 -0
  874. package/src/services/voice/voice-workbench.test.ts +158 -0
  875. package/src/services/voice/voice.test.ts +1070 -0
  876. package/src/services/voice/wake-word-ggml.ts +319 -0
  877. package/src/services/voice/wake-word.test.ts +298 -0
  878. package/src/services/voice/wake-word.ts +554 -0
  879. package/src/services/voice/wav-codec.fuzz.test.ts +59 -0
  880. package/src/services/voice/wav-codec.test.ts +32 -0
  881. package/src/services/voice/wav-codec.ts +101 -0
  882. package/src/services/voice/workbench-entrypoint.test.ts +55 -0
  883. package/src/services/voice/workbench-entrypoint.ts +88 -0
  884. package/src/services/voice/workbench-headless-runner.test.ts +162 -0
  885. package/src/services/voice/workbench-headless-runner.ts +396 -0
  886. package/src/services/voice/workbench-logic-services.test.ts +225 -0
  887. package/src/services/voice/workbench-logic-services.ts +184 -0
  888. package/src/services/voice/workbench-real-services.ts +629 -0
  889. package/src/services/voice/workbench-scenarios.ts +407 -0
  890. package/src/services/voice/wrap-with-first-line-cache.ts +267 -0
  891. package/src/services/voice-model-updater.ts +724 -0
  892. package/src/services/voice-prewarm.ts +51 -0
  893. package/src/voice-workbench.ts +71 -0
@@ -0,0 +1,715 @@
1
+ /**
2
+ * stable-diffusion.cpp image-gen backend (WS3) — Linux + Windows
3
+ * (CPU/CUDA/Vulkan), and Android NDK builds reuse the same binary via
4
+ * `plugin-aosp-local-inference`'s JNI bridge.
5
+ *
6
+ * Why a child-process backend (and not a Node binding):
7
+ *
8
+ * - stable-diffusion.cpp ships a single CLI binary (`sd`) per build
9
+ * flavour (CPU / CUDA / Vulkan / Metal). Linking it as a Node addon
10
+ * would require maintaining a parallel build matrix to llama.cpp;
11
+ * we instead reuse the same binary shipped by the bundle installer.
12
+ * - The CLI is stable across versions for monolithic SD checkpoints
13
+ * (`--model …` / `--prompt …` / `-o …`) and split diffusion assets
14
+ * (`--diffusion-model …` plus companion encoders / VAE), so contract
15
+ * drift is unlikely.
16
+ * - Diffusion runs in seconds, not milliseconds; the subprocess
17
+ * spawn cost is negligible relative to inference time.
18
+ *
19
+ * Binary resolution order:
20
+ *
21
+ * 1. `opts.binaryPath` (test injection, explicit override).
22
+ * 2. `process.env.SD_CPP_BIN` (operator override).
23
+ * 3. `${MODELS_DIR}/bin/sd` (default install path; the bundle drops
24
+ * the binary here on first activation of an image-gen tier).
25
+ *
26
+ * Availability is checked at load time by spawning the binary with
27
+ * `--version`. CUDA loads also require explicit capability evidence from
28
+ * an adjacent manifest, `--help`, or `--version`; a Linux NVIDIA GPU alone
29
+ * is not evidence that the installed binary was compiled with CUDA.
30
+ *
31
+ * Accelerator flags (from `ImageGenLoadArgs.accelerator`):
32
+ *
33
+ * - `"cuda"` → no extra flag; relies on the CUDA-built binary.
34
+ * - `"vulkan"` → `--backend vulkan0` (works on AMD + Intel + NV Vulkan paths).
35
+ * - `"cpu"` → `--backend cpu --params-backend cpu` (forces CPU).
36
+ * - `"auto"` → no extra flag; the binary's own auto-detection runs.
37
+ *
38
+ * GPU validation status (this host has no GPU):
39
+ * The contract here is binary surface only. CUDA / Vulkan smoke tests
40
+ * run on real hardware as part of the WS5 e2e gate; documented at the
41
+ * bottom of `__tests__/imagegen-handler.test.ts`.
42
+ *
43
+ * Publishing pipeline (per platform):
44
+ *
45
+ * Linux x86_64 (CUDA):
46
+ * git clone https://github.com/leejet/stable-diffusion.cpp && cd stable-diffusion.cpp \
47
+ * && cmake -B build -DSD_CUDA=ON -DCMAKE_BUILD_TYPE=Release \
48
+ * && cmake --build build --config Release -j
49
+ * Strip + tar; sign: not required (Linux). Drop into
50
+ * releases.elizaos.ai/sd-cpp/<version>/linux-x86_64-cuda/sd.tar.zst.
51
+ * Linux x86_64 (Vulkan):
52
+ * cmake -B build -DSD_VULKAN=ON -DCMAKE_BUILD_TYPE=Release && cmake --build build -j
53
+ * Linux x86_64 (CPU):
54
+ * cmake -B build -DCMAKE_BUILD_TYPE=Release && cmake --build build -j
55
+ * Windows x86_64 (CUDA):
56
+ * Same cmake invocation under MSVC 2022; produces sd.exe. Sign with the
57
+ * Eliza Labs EV cert (signtool sign /tr ...); submit to Microsoft
58
+ * SmartScreen if a new cert. Drop into releases.elizaos.ai/sd-cpp/
59
+ * <version>/windows-x86_64-cuda/sd.exe.
60
+ * Windows x86_64 (Vulkan, CPU): mirror the CUDA build with the matching
61
+ * cmake -DSD_VULKAN=ON / -DCMAKE_BUILD_TYPE=Release flags.
62
+ * Android (arm64-v8a JNI): cross-compile through the NDK against the
63
+ * same upstream; not consumed directly here — `plugin-aosp-local-inference`
64
+ * wraps it as `libstable-diffusion-jni.so` and the AOSP backend (see
65
+ * `aosp-unavailable.ts`) calls into it via the eliza-llama-shim FFI surface.
66
+ * macOS (Metal): cmake -B build -DSD_METAL=ON; codesign with the Eliza
67
+ * Labs Developer ID Application cert and notarize via `xcrun notarytool
68
+ * submit ...`; staple. Drop into releases.elizaos.ai/sd-cpp/<version>/
69
+ * darwin-{arm64,x86_64}/sd. macOS Apple Silicon prefers `mflux` over
70
+ * sd-cpp (see `mflux.ts`), but sd-cpp Metal is the fallback.
71
+ * Linux riscv64 (CPU): unavailable as a shipped binary. Cross-compile via
72
+ * `zig cc --target=riscv64-linux-musl` (same toolchain
73
+ * packages/app-core/scripts/aosp/compile-libllama.mjs uses; see also
74
+ * `native/build-omnivoice.mjs` for the omnivoice / ggml precedent).
75
+ * There is no Node/host build script for sd-cpp in this repo — sd-cpp
76
+ * is a child-process backend wrapping a precompiled `sd` binary
77
+ * fetched from releases.elizaos.ai. Wiring riscv64 is a CDN-side
78
+ * artifact addition (drop a `releases.elizaos.ai/sd-cpp/<version>/
79
+ * linux-riscv64-cpu/sd` build); no build-matrix entry needs to land
80
+ * here. Until then, the riscv64 binary-resolution attempt simply
81
+ * surfaces the same `ImageGenBackendUnavailableError("sd-cpp", ...)`
82
+ * it surfaces today on any host where the bundle installer did not
83
+ * stage `sd` — i.e. image-gen is silently disabled on riscv64
84
+ * (acceptable: the eliza-1 phone tier does not require image-gen).
85
+ */
86
+
87
+ import { execFile, spawn } from "node:child_process";
88
+ import { existsSync, promises as fs, mkdtempSync } from "node:fs";
89
+ import { tmpdir } from "node:os";
90
+ import { basename, dirname, join } from "node:path";
91
+ import { ImageGenBackendUnavailableError } from "./errors";
92
+ import type {
93
+ ImageGenBackend,
94
+ ImageGenLoadArgs,
95
+ ImageGenRequest,
96
+ ImageGenResult,
97
+ } from "./types";
98
+
99
+ /**
100
+ * Optional test seam describing the spawn call shape and the subset of the child handle (stdout/stderr streams, exit/close/error listeners, optional kill) an injected implementation must provide. Production code uses Node's `child_process.spawn`;
101
+ * tests inject a fake to drive deterministic outputs without forking.
102
+ */
103
+ export type SdCppSpawnLike = (
104
+ command: string,
105
+ args: readonly string[],
106
+ options?: { signal?: AbortSignal; cwd?: string },
107
+ ) => {
108
+ stdout: AsyncIterable<Buffer> | NodeJS.ReadableStream | null; // may be null; consumers must handle the absent-stream case
109
+ stderr: AsyncIterable<Buffer> | NodeJS.ReadableStream | null; // may be null, same as stdout
110
+ on(event: "exit", listener: (code: number | null) => void): unknown;
111
+ on(event: "close", listener: (code: number | null) => void): unknown;
112
+ on(event: "error", listener: (err: Error) => void): unknown;
113
+ kill?(signal?: NodeJS.Signals): void; // optional: an injected fake may omit it
114
+ };
115
+
116
+ export interface SdCppBackendOptions { // options accepted by `loadSdCppImageGenBackend`
117
+ loadArgs: ImageGenLoadArgs; // load-time arguments; the loader reads `accelerator` and `modelPath` from it
118
+ /** Catalog key — copied into `ImageGenResult.metadata.model`. */
119
+ modelKey: string;
120
+ /** Override the binary path (first entry in the resolution order documented in the file header). Useful for tests. */
121
+ binaryPath?: string;
122
+ /**
123
+ * Override the on-disk output directory. Defaults to a fresh
124
+ * `sdcpp-`-prefixed dir created under `os.tmpdir()`. Tests can pin this so the deterministic
125
+ * fixture is read from a known path.
126
+ */
127
+ outputDir?: string;
128
+ /** Spawn implementation. Defaults to Node's `child_process.spawn`. */
129
+ spawnImpl?: SdCppSpawnLike;
130
+ /**
131
+ * For tests: instead of running the binary, write `fakeImageBytes`
132
+ * to the output file and return it. When set, the load-time binary smoke-check and
133
+ * the model-file existence check are skipped. NOTE(review): the binary path is still resolved at load time.
134
+ */
135
+ fakeImageBytes?: Uint8Array;
136
+ /**
137
+ * For tests: override `Date.now` (the default clock when omitted) so timing assertions are stable.
138
+ */
139
+ now?: () => number;
140
+ }
141
+
142
+ const DEFAULT_BIN = "sd"; // file name of the stable-diffusion.cpp CLI binary; NOTE(review): presumably the default-install fallback name — its use is outside this view
143
+
144
/**
 * Load (or in this case, "smoke-check") the sd-cpp backend. The binary
 * lives out-of-process; "loading" is verifying it exists and runs.
 * The actual model weights are passed per-call as either `--model <path>`
 * or `--diffusion-model <path>`, so the same binary serves multiple
 * GGUFs without an explicit unload step.
 *
 * @param opts Backend options; see `SdCppBackendOptions`.
 * @returns A backend whose `generate()` writes one PNG per call into the
 *   output directory and returns its bytes.
 * @throws ImageGenBackendUnavailableError when the binary cannot be run,
 *   lacks the requested accelerator, or the model file is missing (all
 *   skipped when `opts.fakeImageBytes` is set).
 */
export async function loadSdCppImageGenBackend(
  opts: SdCppBackendOptions,
): Promise<ImageGenBackend> {
  const binary = resolveBinaryPath(opts.binaryPath);
  const now = opts.now ?? Date.now;

  if (!opts.fakeImageBytes) {
    // Smoke-check: run `--version` so we fail fast instead of waiting
    // for the first real generate.
    await assertBinaryAvailable(
      binary,
      opts.loadArgs.accelerator,
      opts.spawnImpl,
    );
  }

  // Ensure the model file exists. Caller resolves the path through
  // the bundle installer; we just gate on its presence so a missing
  // weight surfaces here instead of from the binary stderr.
  if (!opts.fakeImageBytes && !existsSync(opts.loadArgs.modelPath)) {
    throw new ImageGenBackendUnavailableError(
      "sd-cpp",
      "model_missing",
      `[imagegen/sd-cpp] model not found: ${opts.loadArgs.modelPath}`,
    );
  }

  // Only a directory created here is ours to delete wholesale. A
  // caller-supplied directory may hold unrelated files, so for it we
  // track (and later remove) just the files this backend wrote.
  const ownsOutputDir = opts.outputDir == null;
  const outputDir = opts.outputDir ?? mkdtempSync(join(tmpdir(), "sdcpp-"));
  const writtenPaths = new Set<string>();
  let disposed = false;

  return {
    id: "sd-cpp",
    supports(req) {
      // sd-cpp accepts any reasonable WxH (rounded to /8). Reject
      // obviously bad inputs so the selector keeps walking.
      const w = req.width ?? 512;
      const h = req.height ?? 512;
      // NaN / Infinity slip through plain range comparisons, so check
      // finiteness explicitly.
      if (!Number.isFinite(w) || !Number.isFinite(h)) return false;
      if (w <= 0 || h <= 0) return false;
      if (w > 4096 || h > 4096) return false;
      return true;
    },
    async generate(req): Promise<ImageGenResult> {
      if (disposed) {
        throw new ImageGenBackendUnavailableError(
          "sd-cpp",
          "subprocess_failed",
          "[imagegen/sd-cpp] generate called after dispose()",
        );
      }
      if (!req.prompt.trim()) {
        throw new ImageGenBackendUnavailableError(
          "sd-cpp",
          "unsupported_request",
          "[imagegen/sd-cpp] prompt is empty",
        );
      }
      const seed = resolveSeed(req.seed);
      const width = req.width ?? 512;
      const height = req.height ?? 512;
      const steps = req.steps ?? 20;
      const guidanceScale = req.guidanceScale ?? 7.5;
      const outputPath = join(outputDir, `out-${seed}-${now()}.png`);
      writtenPaths.add(outputPath);
      const startMs = now();

      if (opts.fakeImageBytes) {
        // Test path: skip the subprocess entirely. The deterministic
        // in-memory bytes are what `__tests__/imagegen-handler.test.ts` uses.
        await fs.writeFile(outputPath, opts.fakeImageBytes);
        const elapsed = Math.max(1, now() - startMs);
        if (req.onProgressChunk)
          req.onProgressChunk({ step: steps, total: steps });
        return {
          image: opts.fakeImageBytes,
          mime: "image/png",
          seed,
          metadata: {
            model: opts.modelKey,
            prompt: req.prompt,
            steps,
            guidanceScale,
            inferenceTimeMs: elapsed,
          },
        };
      }

      const args = buildArgs({
        modelPath: opts.loadArgs.modelPath,
        splitDiffusionModel: opts.loadArgs.splitDiffusionModel,
        vae: opts.loadArgs.vae,
        llm: opts.loadArgs.llm,
        prompt: req.prompt,
        negativePrompt: req.negativePrompt,
        width,
        height,
        steps,
        guidanceScale,
        seed,
        scheduler: req.scheduler,
        output: outputPath,
        accelerator: opts.loadArgs.accelerator,
      });

      await runSdCpp(binary, args, {
        signal: req.signal,
        spawnImpl: opts.spawnImpl,
        onProgressChunk: req.onProgressChunk,
        totalSteps: steps,
      });

      const bytes = new Uint8Array(await fs.readFile(outputPath));
      // The result is always labelled `image/png`, so refuse anything
      // that does not start with the PNG signature rather than returning
      // mislabelled bytes.
      assertPngOutput(bytes, "sd-cpp", "subprocess_failed");
      const elapsed = Math.max(1, now() - startMs);
      return {
        image: bytes,
        mime: "image/png",
        seed,
        metadata: {
          model: opts.modelKey,
          prompt: req.prompt,
          steps,
          guidanceScale,
          inferenceTimeMs: elapsed,
        },
      };
    },
    async dispose() {
      if (disposed) return;
      disposed = true;
      // Best-effort scratch cleanup; failures (e.g. already removed)
      // never fail dispose.
      if (ownsOutputDir) {
        await fs
          .rm(outputDir, { recursive: true, force: true })
          .catch(() => {});
        return;
      }
      // Caller-owned directory: remove only the files we produced.
      await Promise.all(
        [...writtenPaths].map((path) =>
          fs.rm(path, { force: true }).catch(() => {}),
        ),
      );
    },
  };
}
289
+
290
/**
 * Pick the sd-cpp binary to run. Precedence: explicit `override`, then a
 * non-blank `SD_CPP_BIN` environment variable (trimmed), then `DEFAULT_BIN`.
 */
function resolveBinaryPath(override?: string): string {
  if (override) {
    return override;
  }
  const fromEnv = process.env.SD_CPP_BIN?.trim();
  return fromEnv ? fromEnv : DEFAULT_BIN;
}
296
+
297
/**
 * Verify that `binary` can be executed and, for GPU accelerators, that it
 * shows evidence of supporting the requested one.
 *
 * @throws ImageGenBackendUnavailableError with code `binary_missing` when
 *   `--version` cannot be run, `binary_version_mismatch` when it exits
 *   non-zero, or `<accelerator>_binary_missing` when a requested
 *   cuda/vulkan/metal accelerator is not among the probed capabilities.
 */
async function assertBinaryAvailable(
  binary: string,
  accelerator?: ImageGenLoadArgs["accelerator"],
  spawnImpl?: SdCppSpawnLike,
): Promise<void> {
  let version: SdCppCommandResult;
  try {
    version = await runCollect(binary, ["--version"], spawnImpl);
  } catch (err) {
    // Already-classified failures pass through untouched.
    if (err instanceof ImageGenBackendUnavailableError) throw err;
    const message = err instanceof Error ? err.message : String(err);
    throw new ImageGenBackendUnavailableError(
      "sd-cpp",
      "binary_missing",
      `[imagegen/sd-cpp] cannot run '${binary} --version': ${message}. Set SD_CPP_BIN or install the bundle's image-gen binary.`,
      { cause: err },
    );
  }

  if (version.code !== 0) {
    throw new ImageGenBackendUnavailableError(
      "sd-cpp",
      "binary_version_mismatch",
      `[imagegen/sd-cpp] '${binary} --version' exited with code ${version.code}`,
    );
  }

  // Only GPU accelerators need proof; `auto` / `cpu` / unset are accepted as-is.
  if (
    accelerator !== "cuda" &&
    accelerator !== "vulkan" &&
    accelerator !== "metal"
  ) {
    return;
  }

  const capabilities = await probeSdCppCapabilitiesFromBinary(
    binary,
    version,
    spawnImpl,
  );
  if (capabilities.accelerators.includes(accelerator)) {
    return;
  }
  throw new ImageGenBackendUnavailableError(
    "sd-cpp",
    `${accelerator}_binary_missing`,
    `[imagegen/sd-cpp] '${binary}' is available but does not prove ${accelerator.toUpperCase()} support via manifest, --help, or --version. Falling back from sd-cpp ${accelerator}; install a stable-diffusion.cpp ${accelerator.toUpperCase()} build or set SD_CPP_BIN to one.`,
  );
}
341
+
342
/** Captured outcome of a short-lived sd-cpp invocation such as `--version`. */
interface SdCppCommandResult {
  /** Exit code reported for the process; `null` when none was reported. */
  code: number | null;
  /** Everything the process wrote to stdout, decoded as text. */
  stdout: string;
  /** Everything the process wrote to stderr, decoded as text. */
  stderr: string;
}
347
+
348
/**
 * Run `binary` with `args` and collect its exit code, stdout and stderr.
 *
 * Without `spawnImpl` this uses `execFile`: a numeric exit code (including
 * non-zero) resolves, any other failure (for example a spawn error whose
 * `code` is not a number) rejects. With `spawnImpl` the injected spawner
 * is driven manually and the promise resolves on the first `close`/`exit`.
 */
function runCollect(
  binary: string,
  args: readonly string[],
  spawnImpl?: SdCppSpawnLike,
): Promise<SdCppCommandResult> {
  if (spawnImpl) {
    return new Promise<SdCppCommandResult>((resolve, reject) => {
      const child = defaultSpawn(spawnImpl)(binary, args);
      let capturedOut = "";
      let capturedErr = "";
      let done = false;
      const settle = (code: number | null) => {
        if (done) return;
        done = true;
        // Defer one macrotask so output chunks already queued are appended
        // before the buffers are read.
        setTimeout(
          () => resolve({ code, stdout: capturedOut, stderr: capturedErr }),
          0,
        );
      };
      collectOutput(child.stdout, (chunk) => {
        capturedOut += chunk;
      });
      collectOutput(child.stderr, (chunk) => {
        capturedErr += chunk;
      });
      child.on("error", (err: Error) => reject(err));
      if (typeof (child as { on?: unknown }).on === "function") {
        try {
          child.on("close", settle);
        } catch {
          // Test doubles may only implement the narrower SdCppSpawnLike
          // exit/error event set. The exit listener below still resolves.
        }
      }
      child.on("exit", settle);
    });
  }

  return new Promise<SdCppCommandResult>((resolve, reject) => {
    execFile(binary, [...args], (error, stdout, stderr) => {
      let code: number | null = 0;
      if (error) {
        const rawCode = (error as { code?: unknown }).code;
        code = typeof rawCode === "number" ? rawCode : null;
      }
      if (error && code === null) {
        reject(error);
        return;
      }
      resolve({
        code,
        stdout: String(stdout),
        stderr: String(stderr),
      });
    });
  });
}
402
+
403
/**
 * Forward every chunk of `stream` to `append` as UTF-8 text.
 *
 * Event-emitter style streams (anything with an `on` method) are consumed
 * through `"data"` events; everything else is treated as an async iterable
 * and drained in the background. A `null` stream is a no-op.
 *
 * Capture is best-effort: if the async iterable fails mid-stream the chunks
 * received so far are kept and the failure is swallowed here, so it cannot
 * surface as an unhandled promise rejection. Process-level failures are
 * reported through the child's own `error` / `exit` events.
 *
 * @param stream Child stdout/stderr, or `null` when unavailable.
 * @param append Receives each decoded chunk in arrival order.
 */
function collectOutput(
  stream: AsyncIterable<Buffer> | NodeJS.ReadableStream | null,
  append: (chunk: string) => void,
): void {
  if (!stream) return;
  if (typeof (stream as NodeJS.ReadableStream).on === "function") {
    (stream as NodeJS.ReadableStream).on("data", (chunk: Buffer | string) => {
      append(typeof chunk === "string" ? chunk : chunk.toString("utf8"));
    });
    return;
  }
  const drain = async (): Promise<void> => {
    for await (const chunk of stream as AsyncIterable<Buffer>) {
      append(chunk.toString("utf8"));
    }
  };
  void drain().catch(() => {
    // Deliberately ignored: see the best-effort note in the doc comment.
  });
}
420
+
421
/** Any concrete accelerator value accepted by `ImageGenLoadArgs` (unset excluded). */
type SdCppAccelerator = Exclude<
  ImageGenLoadArgs["accelerator"],
  null | undefined
>;
422
+
423
/** Result of probing an sd-cpp binary for its version and accelerator support. */
export interface SdCppCapabilities {
  /** First non-blank line of the `--version` output, or `null` if there was none. */
  version: string | null;
  /** Accelerators the binary is considered to support. */
  accelerators: readonly SdCppAccelerator[];
  /** De-duplicated labels naming the sources that proved an accelerator. */
  evidence: readonly string[];
}
428
+
429
/**
 * Determine which accelerators an sd-cpp binary supports.
 *
 * Sources consulted: an optional sidecar manifest next to the binary and
 * the text of `--version` / `--help` (stdout and stderr). `auto` and `cpu`
 * are always reported. A failing `--help` is tolerated and treated as
 * empty output.
 *
 * `evidence` lists each source that contributed at least one accelerator:
 * `"manifest"` and/or `"help_or_version"`. The latter is recorded for any
 * accelerator proven by text (CUDA, Vulkan or Metal), so the field agrees
 * with the `accelerators` list.
 *
 * @param binary Path or name of the sd-cpp executable.
 * @param versionResult A previously captured `--version` result; when
 *   omitted the command is run here (and its failure propagates).
 * @param spawnImpl Optional spawn override used for the probe commands.
 */
export async function probeSdCppCapabilitiesFromBinary(
  binary: string,
  versionResult?: SdCppCommandResult,
  spawnImpl?: SdCppSpawnLike,
): Promise<SdCppCapabilities> {
  const version =
    versionResult ?? (await runCollect(binary, ["--version"], spawnImpl));
  const help = await runCollect(binary, ["--help"], spawnImpl).catch(
    () => null,
  );
  const manifest = await readSdCppCapabilityManifest(binary);
  const textEvidence = [
    version.stdout,
    version.stderr,
    help?.stdout ?? "",
    help?.stderr ?? "",
  ].join("\n");

  const accelerators = new Set<SdCppAccelerator>(["auto", "cpu"]);
  const evidence = new Set<string>();

  for (const accelerator of manifest.accelerators) {
    accelerators.add(accelerator);
    evidence.add("manifest");
  }

  const textProbes: ReadonlyArray<
    readonly [SdCppAccelerator, (text: string) => boolean]
  > = [
    ["cuda", hasPositiveCudaEvidence],
    ["vulkan", hasPositiveVulkanEvidence],
    ["metal", hasPositiveMetalEvidence],
  ];
  for (const [accelerator, hasEvidence] of textProbes) {
    if (!hasEvidence(textEvidence)) continue;
    accelerators.add(accelerator);
    evidence.add("help_or_version");
  }

  return {
    version: parseVersionLine(version.stdout, version.stderr),
    accelerators: [...accelerators],
    evidence: [...evidence],
  };
}
464
+
465
/**
 * Look for a JSON sidecar manifest near `binary` and extract the
 * accelerators it mentions. Candidates are tried in order and the first
 * one that reads and parses wins; if none does, the result is empty.
 */
async function readSdCppCapabilityManifest(
  binary: string,
): Promise<{ accelerators: SdCppAccelerator[] }> {
  const binaryDir = dirname(binary);
  const uniqueCandidates = new Set<string>([
    `${binary}.json`,
    `${binary}.manifest.json`,
    join(binaryDir, `${basename(binary)}.manifest.json`),
    join(binaryDir, "sd-cpp.manifest.json"),
    join(binaryDir, "manifest.json"),
  ]);

  for (const manifestPath of uniqueCandidates) {
    try {
      const raw = await fs.readFile(manifestPath, "utf8");
      const parsed: unknown = JSON.parse(raw);
      return { accelerators: extractAccelerators(parsed) };
    } catch {
      // Missing or malformed sidecar manifests are non-fatal; help/version
      // can still prove capability, and the caller will reject CUDA if not.
    }
  }
  return { accelerators: [] };
}
486
+
487
/**
 * Walk an arbitrary parsed-JSON value and collect every accelerator it
 * names: either as a string value anywhere in the tree (case-insensitive)
 * or as an object key whose value is exactly `true`.
 */
function extractAccelerators(value: unknown): SdCppAccelerator[] {
  const seen = new Set<SdCppAccelerator>();

  function walk(node: unknown): void {
    if (typeof node === "string") {
      const lowered = node.toLowerCase();
      if (isSdCppAccelerator(lowered)) seen.add(lowered);
    } else if (Array.isArray(node)) {
      for (const element of node) walk(element);
    } else if (node !== null && typeof node === "object") {
      for (const [rawKey, child] of Object.entries(node)) {
        const key = rawKey.toLowerCase();
        if (child === true && isSdCppAccelerator(key)) {
          seen.add(key);
        }
        walk(child);
      }
    }
  }

  walk(value);
  return Array.from(seen);
}
511
+
512
/** Type guard for the accelerator names a manifest may declare (`auto` is not one of them). */
function isSdCppAccelerator(value: string): value is SdCppAccelerator {
  switch (value) {
    case "cuda":
    case "vulkan":
    case "metal":
    case "cpu":
      return true;
    default:
      return false;
  }
}
520
+
521
/**
 * Decide whether `--help` / `--version` text proves a CUDA build.
 *
 * Returns `false` if any line negates CUDA (a whole word such as
 * "without", "no", "not", "disabled" or "unsupported" followed within
 * 40 characters by "cuda"). Otherwise returns `true` only when a
 * CUDA-specific token (`sd_cuda`, `ggml_cuda`, `cublas`, `cudart`)
 * appears as a standalone token.
 *
 * The negation words are matched as whole tokens (letters/digits on either
 * side disqualify a match), so words that merely contain "no" — "denoise",
 * "now", "node" — do not veto genuine CUDA evidence. `_` counts as a
 * separator, which keeps flags like `NO_CUDA` recognised as negations.
 */
function hasPositiveCudaEvidence(text: string): boolean {
  const lower = text.toLowerCase();
  const negated =
    /(?:^|[^a-z0-9])(?:without|no|not|disabled?|unsupported)(?![a-z0-9])[^\n]{0,40}cuda/;
  if (negated.test(lower)) {
    return false;
  }
  return /(^|[^a-z0-9])(sd_cuda|ggml_cuda|cublas|cudart)([^a-z0-9]|$)/.test(
    lower,
  );
}
534
+
535
/**
 * Decide whether `--help` / `--version` text proves a Vulkan build.
 *
 * A line counts as evidence when it mentions `sd_vulkan`, `ggml_vulkan` or
 * `vulkan` as a whole word and does not negate it. A mention is negated
 * when a whole-word "without", "no", "not", "disable(d)" or "unsupported"
 * precedes "vulkan" within 40 characters of the same clause (the gap may
 * not cross `,`, `;`, `:` or `|`). This keeps a message such as
 * "built without Vulkan support" from being read as proof of support.
 */
function hasPositiveVulkanEvidence(text: string): boolean {
  const mention = /\b(sd_vulkan|ggml_vulkan|vulkan)\b/i;
  const negated =
    /(?:^|[^a-z0-9])(?:without|no|not|disabled?|unsupported)(?![a-z0-9])[^\n,;:|]{0,40}vulkan/i;
  return text
    .split(/\r?\n/)
    .some((line) => mention.test(line) && !negated.test(line));
}
538
+
539
/**
 * Decide whether `--help` / `--version` text proves a Metal build.
 *
 * A line counts as evidence when it mentions `sd_metal`, `ggml_metal` or
 * `metal` as a whole word and does not negate it. A mention is negated
 * when a whole-word "without", "no", "not", "disable(d)" or "unsupported"
 * precedes "metal" within 40 characters of the same clause (the gap may
 * not cross `,`, `;`, `:` or `|`). This keeps a message such as
 * "compiled without Metal" from being read as proof of support.
 */
function hasPositiveMetalEvidence(text: string): boolean {
  const mention = /\b(sd_metal|ggml_metal|metal)\b/i;
  const negated =
    /(?:^|[^a-z0-9])(?:without|no|not|disabled?|unsupported)(?![a-z0-9])[^\n,;:|]{0,40}metal/i;
  return text
    .split(/\r?\n/)
    .some((line) => mention.test(line) && !negated.test(line));
}
542
+
543
/**
 * Extract the version banner from `--version` output.
 *
 * stdout is preferred; stderr is used when stdout is empty or contains
 * only whitespace (some builds print the banner to stderr and a bare
 * newline to stdout).
 *
 * @returns The first non-blank line, trimmed, or `null` when both streams
 *   are blank.
 */
function parseVersionLine(stdout: string, stderr: string): string | null {
  const text = stdout.trim() || stderr.trim();
  if (!text) return null;
  // `text` is trimmed and non-empty, so its first line is the first
  // non-blank line; it can still carry trailing whitespace.
  const [firstLine] = text.split(/\r?\n/);
  return firstLine?.trim() ?? null;
}
549
+
550
/**
 * Run one sd-cpp generation and resolve when the process exits with code 0.
 *
 * Both output pipes are always consumed: a child whose stdout/stderr pipe
 * is never read can block once the OS pipe buffer fills, which would hang
 * the generation. stdout is discarded; stderr is scanned for `step: N/M`
 * progress lines (forwarded to `opts.onProgressChunk` when provided) and
 * its tail is kept for diagnostics.
 *
 * @param binary Executable to run.
 * @param args Command-line arguments, typically from `buildArgs`.
 * @param opts.signal Abort signal forwarded to the spawn implementation.
 * @param opts.spawnImpl Optional spawn override (test seam).
 * @param opts.onProgressChunk Optional progress callback.
 * @param opts.totalSteps Fallback total when a progress line reports 0.
 * @throws ImageGenBackendUnavailableError (`subprocess_failed`) on a
 *   non-zero or `null` exit code; when stderr output was captured, its
 *   tail is attached as the error's `cause`. Spawn errors are rethrown
 *   unchanged.
 */
async function runSdCpp(
  binary: string,
  args: readonly string[],
  opts: {
    signal?: AbortSignal;
    spawnImpl?: SdCppSpawnLike;
    onProgressChunk?: ImageGenRequest["onProgressChunk"];
    totalSteps: number;
  },
): Promise<void> {
  // Upper bound on retained stderr so a chatty binary cannot grow memory.
  const stderrTailLimit = 4096;

  await new Promise<void>((resolve, reject) => {
    const proc = defaultSpawn(opts.spawnImpl)(binary, args, {
      signal: opts.signal,
    });
    const { stdout, stderr } = proc;

    // Drain stdout so the child never blocks writing to a full pipe.
    // Non-emitter streams (test doubles) are left alone.
    if (stdout && typeof (stdout as NodeJS.ReadableStream).on === "function") {
      (stdout as NodeJS.ReadableStream).on("data", () => {});
    }

    // stable-diffusion.cpp prints `step: N/M` lines to stderr at each
    // denoise iteration. Tail the stream, keep the last few KB for error
    // reporting, and forward progress when the caller asked for it.
    // Tolerate non-stream stderr (the test spawn may pass null) —
    // progress is best-effort.
    let stderrTail = "";
    let leftover = "";
    if (stderr && typeof (stderr as NodeJS.ReadableStream).on === "function") {
      (stderr as NodeJS.ReadableStream).on("data", (chunk: Buffer | string) => {
        const piece =
          typeof chunk === "string" ? chunk : chunk.toString("utf8");
        stderrTail = (stderrTail + piece).slice(-stderrTailLimit);
        if (!opts.onProgressChunk) return;
        const lines = (leftover + piece).split(/\r?\n/);
        // The last element is an incomplete line; carry it over.
        leftover = lines.pop() ?? "";
        for (const line of lines) {
          const m = line.match(/step:\s*(\d+)\s*\/\s*(\d+)/i);
          if (!m) continue;
          const step = Number(m[1]);
          const total = Number(m[2]) || opts.totalSteps;
          opts.onProgressChunk?.({ step, total });
        }
      });
    }

    proc.on("error", (err: Error) => reject(err));
    proc.on("exit", (code: number | null) => {
      if (code === 0) {
        resolve();
        return;
      }
      const diagnostics = stderrTail.trim();
      reject(
        new ImageGenBackendUnavailableError(
          "sd-cpp",
          "subprocess_failed",
          `[imagegen/sd-cpp] binary exited with code ${code}`,
          diagnostics ? { cause: new Error(diagnostics) } : undefined,
        ),
      );
    });
  });
}
606
+
607
/**
 * Translate a generation request into the sd-cpp command line.
 *
 * Required flags come first in a fixed order, followed by the optional
 * `--vae`, `--llm`, `--negative-prompt` and `--sampling-method` flags
 * (each emitted only for a non-empty value) and finally any backend
 * selection implied by `accelerator`.
 */
export function buildArgs(input: {
  modelPath: string;
  splitDiffusionModel?: boolean;
  vae?: string;
  llm?: string;
  prompt: string;
  negativePrompt?: string;
  width: number;
  height: number;
  steps: number;
  guidanceScale: number;
  seed: number;
  scheduler?: string;
  output: string;
  accelerator?: ImageGenLoadArgs["accelerator"];
}): string[] {
  const modelFlag = input.splitDiffusionModel ? "--diffusion-model" : "--model";
  const argv: string[] = [modelFlag, input.modelPath];
  argv.push("--prompt", input.prompt);
  argv.push("--width", String(input.width));
  argv.push("--height", String(input.height));
  argv.push("--steps", String(input.steps));
  argv.push("--cfg-scale", String(input.guidanceScale));
  argv.push("--seed", String(input.seed));
  argv.push("-o", input.output);

  const optionalFlags: ReadonlyArray<readonly [string, string | undefined]> = [
    ["--vae", input.vae],
    ["--llm", input.llm],
    ["--negative-prompt", input.negativePrompt],
    ["--sampling-method", input.scheduler],
  ];
  for (const [flag, value] of optionalFlags) {
    if (value) argv.push(flag, value);
  }

  switch (input.accelerator) {
    case "vulkan":
      argv.push("--backend", "vulkan0");
      break;
    case "cpu":
      argv.push("--backend", "cpu", "--params-backend", "cpu");
      break;
    default:
      // `auto` / `cuda` / `metal` rely on the binary build's defaults.
      break;
  }
  return argv;
}
661
+
662
/**
 * Draw a random non-negative integer below `0x7fffffff`, so the value fits
 * the int32 seed sd-cpp stores.
 */
export function pickSeed(): number {
  const exclusiveUpperBound = 0x7fffffff;
  const scaled = Math.random() * exclusiveUpperBound;
  return Math.floor(scaled);
}
666
+
667
/**
 * Resolve a caller-supplied seed or pick a random one.
 *
 * A supplied seed is used when it is a finite, non-negative number; any
 * fractional part is dropped because the value is passed to the binary as
 * an integer `--seed`. `undefined`, negative, `NaN` and infinite values
 * fall back to `pickSeed()`.
 *
 * @param seed Seed requested by the caller, if any.
 * @returns A non-negative integer seed.
 */
export function resolveSeed(seed: number | undefined): number {
  if (typeof seed === "number" && Number.isFinite(seed) && seed >= 0) {
    return Math.trunc(seed);
  }
  return pickSeed();
}
671
+
672
/** The eight-byte magic number that opens every PNG file. */
export const PNG_SIGNATURE = [
  0x89, // high-bit byte
  0x50, // 'P'
  0x4e, // 'N'
  0x47, // 'G'
  0x0d, // CR
  0x0a, // LF
  0x1a, // SUB
  0x0a, // LF
] as const;
675
+
676
/**
 * Throw unless `bytes` starts with the PNG magic number.
 *
 * @param bytes Raw output to validate.
 * @param label Backend name; used as the error's backend id and inside the
 *   `[imagegen/<label>]` message prefix.
 * @param errorCode Code attached to the thrown error.
 * @throws ImageGenBackendUnavailableError when `bytes` is shorter than the
 *   signature or any signature byte differs.
 */
export function assertPngOutput(
  bytes: Uint8Array,
  label: string,
  errorCode: ConstructorParameters<typeof ImageGenBackendUnavailableError>[1],
): void {
  let problem: string | null = null;
  if (bytes.length < PNG_SIGNATURE.length) {
    problem = `[imagegen/${label}] output too short (${bytes.length} bytes); not a PNG`;
  } else if (PNG_SIGNATURE.some((expected, index) => bytes[index] !== expected)) {
    problem = `[imagegen/${label}] output missing PNG signature`;
  }
  if (problem !== null) {
    throw new ImageGenBackendUnavailableError(label, errorCode, problem);
  }
}
702
+
703
/**
 * Return the spawn function to use: the injected `spawnImpl` when given,
 * otherwise an adapter around Node's `spawn` exposed through the narrower
 * `SdCppSpawnLike` shape shared by the subprocess backends. Keeping the
 * adaptation here spares call sites their own `as unknown as` escape.
 */
export function defaultSpawn(
  spawnImpl: SdCppSpawnLike | undefined,
): SdCppSpawnLike {
  const viaNode: SdCppSpawnLike = function nodeSpawn(command, args, options) {
    // `spawn` takes a mutable array, so hand it a copy of the readonly args.
    return spawn(command, [...args], options);
  };
  return spawnImpl ? spawnImpl : viaNode;
}