agent-orcha 0.0.5 → 0.0.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (404)
  1. package/README.md +250 -1275
  2. package/dist/lib/agents/agent-executor.d.ts +4 -2
  3. package/dist/lib/agents/agent-executor.d.ts.map +1 -1
  4. package/dist/lib/agents/agent-executor.js +85 -53
  5. package/dist/lib/agents/agent-executor.js.map +1 -1
  6. package/dist/lib/agents/agent-loader.d.ts +3 -0
  7. package/dist/lib/agents/agent-loader.d.ts.map +1 -1
  8. package/dist/lib/agents/agent-loader.js +10 -1
  9. package/dist/lib/agents/agent-loader.js.map +1 -1
  10. package/dist/lib/agents/react-loop.d.ts.map +1 -1
  11. package/dist/lib/agents/react-loop.js +207 -142
  12. package/dist/lib/agents/react-loop.js.map +1 -1
  13. package/dist/lib/agents/types.d.ts +181 -18
  14. package/dist/lib/agents/types.d.ts.map +1 -1
  15. package/dist/lib/agents/types.js +18 -2
  16. package/dist/lib/agents/types.js.map +1 -1
  17. package/dist/lib/functions/function-loader.d.ts +2 -0
  18. package/dist/lib/functions/function-loader.d.ts.map +1 -1
  19. package/dist/lib/functions/function-loader.js +10 -0
  20. package/dist/lib/functions/function-loader.js.map +1 -1
  21. package/dist/lib/functions/simple-function-wrapper.js +3 -3
  22. package/dist/lib/functions/simple-function-wrapper.js.map +1 -1
  23. package/dist/lib/integrations/email.d.ts +38 -0
  24. package/dist/lib/integrations/email.d.ts.map +1 -0
  25. package/dist/lib/integrations/email.js +249 -0
  26. package/dist/lib/integrations/email.js.map +1 -0
  27. package/dist/lib/integrations/integration-manager.d.ts +5 -0
  28. package/dist/lib/integrations/integration-manager.d.ts.map +1 -1
  29. package/dist/lib/integrations/integration-manager.js +53 -3
  30. package/dist/lib/integrations/integration-manager.js.map +1 -1
  31. package/dist/lib/integrations/types.d.ts +187 -4
  32. package/dist/lib/integrations/types.d.ts.map +1 -1
  33. package/dist/lib/integrations/types.js +24 -1
  34. package/dist/lib/integrations/types.js.map +1 -1
  35. package/dist/lib/knowledge/knowledge-store.d.ts +7 -1
  36. package/dist/lib/knowledge/knowledge-store.d.ts.map +1 -1
  37. package/dist/lib/knowledge/knowledge-store.js +96 -8
  38. package/dist/lib/knowledge/knowledge-store.js.map +1 -1
  39. package/dist/lib/knowledge/loaders/file-loaders.d.ts +8 -3
  40. package/dist/lib/knowledge/loaders/file-loaders.d.ts.map +1 -1
  41. package/dist/lib/knowledge/loaders/file-loaders.js +96 -75
  42. package/dist/lib/knowledge/loaders/file-loaders.js.map +1 -1
  43. package/dist/lib/knowledge/loaders/web-loader.d.ts +12 -3
  44. package/dist/lib/knowledge/loaders/web-loader.d.ts.map +1 -1
  45. package/dist/lib/knowledge/loaders/web-loader.js +56 -22
  46. package/dist/lib/knowledge/loaders/web-loader.js.map +1 -1
  47. package/dist/lib/knowledge/sqlite-store.d.ts.map +1 -1
  48. package/dist/lib/knowledge/sqlite-store.js +19 -10
  49. package/dist/lib/knowledge/sqlite-store.js.map +1 -1
  50. package/dist/lib/knowledge/types.d.ts +69 -33
  51. package/dist/lib/knowledge/types.d.ts.map +1 -1
  52. package/dist/lib/knowledge/types.js +18 -3
  53. package/dist/lib/knowledge/types.js.map +1 -1
  54. package/dist/lib/llm/index.d.ts +1 -1
  55. package/dist/lib/llm/index.d.ts.map +1 -1
  56. package/dist/lib/llm/index.js +1 -1
  57. package/dist/lib/llm/index.js.map +1 -1
  58. package/dist/lib/llm/llm-call-logger.d.ts +3 -1
  59. package/dist/lib/llm/llm-call-logger.d.ts.map +1 -1
  60. package/dist/lib/llm/llm-call-logger.js +31 -26
  61. package/dist/lib/llm/llm-call-logger.js.map +1 -1
  62. package/dist/lib/llm/llm-config.d.ts +59 -8
  63. package/dist/lib/llm/llm-config.d.ts.map +1 -1
  64. package/dist/lib/llm/llm-config.js +163 -17
  65. package/dist/lib/llm/llm-config.js.map +1 -1
  66. package/dist/lib/llm/llm-factory.d.ts +1 -2
  67. package/dist/lib/llm/llm-factory.d.ts.map +1 -1
  68. package/dist/lib/llm/llm-factory.js +44 -8
  69. package/dist/lib/llm/llm-factory.js.map +1 -1
  70. package/dist/lib/llm/providers/anthropic-chat-model.d.ts +5 -1
  71. package/dist/lib/llm/providers/anthropic-chat-model.d.ts.map +1 -1
  72. package/dist/lib/llm/providers/anthropic-chat-model.js +118 -42
  73. package/dist/lib/llm/providers/anthropic-chat-model.js.map +1 -1
  74. package/dist/lib/llm/providers/gemini-chat-model.d.ts +3 -2
  75. package/dist/lib/llm/providers/gemini-chat-model.d.ts.map +1 -1
  76. package/dist/lib/llm/providers/gemini-chat-model.js +83 -24
  77. package/dist/lib/llm/providers/gemini-chat-model.js.map +1 -1
  78. package/dist/lib/llm/providers/openai-chat-model.d.ts +20 -1
  79. package/dist/lib/llm/providers/openai-chat-model.d.ts.map +1 -1
  80. package/dist/lib/llm/providers/openai-chat-model.js +265 -32
  81. package/dist/lib/llm/providers/openai-chat-model.js.map +1 -1
  82. package/dist/lib/llm/providers/openai-embeddings.d.ts.map +1 -1
  83. package/dist/lib/llm/providers/openai-embeddings.js +41 -10
  84. package/dist/lib/llm/providers/openai-embeddings.js.map +1 -1
  85. package/dist/lib/local-llm/binary-manager.d.ts +66 -0
  86. package/dist/lib/local-llm/binary-manager.d.ts.map +1 -0
  87. package/dist/lib/local-llm/binary-manager.js +441 -0
  88. package/dist/lib/local-llm/binary-manager.js.map +1 -0
  89. package/dist/lib/local-llm/engine-interface.d.ts +47 -0
  90. package/dist/lib/local-llm/engine-interface.d.ts.map +1 -0
  91. package/dist/lib/local-llm/engine-interface.js +2 -0
  92. package/dist/lib/local-llm/engine-interface.js.map +1 -0
  93. package/dist/lib/local-llm/engine-registry.d.ts +20 -0
  94. package/dist/lib/local-llm/engine-registry.d.ts.map +1 -0
  95. package/dist/lib/local-llm/engine-registry.js +56 -0
  96. package/dist/lib/local-llm/engine-registry.js.map +1 -0
  97. package/dist/lib/local-llm/engines/llama-cpp-engine.d.ts +31 -0
  98. package/dist/lib/local-llm/engines/llama-cpp-engine.d.ts.map +1 -0
  99. package/dist/lib/local-llm/engines/llama-cpp-engine.js +164 -0
  100. package/dist/lib/local-llm/engines/llama-cpp-engine.js.map +1 -0
  101. package/dist/lib/local-llm/engines/mlx-serve-engine.d.ts +31 -0
  102. package/dist/lib/local-llm/engines/mlx-serve-engine.d.ts.map +1 -0
  103. package/dist/lib/local-llm/engines/mlx-serve-engine.js +161 -0
  104. package/dist/lib/local-llm/engines/mlx-serve-engine.js.map +1 -0
  105. package/dist/lib/local-llm/gguf-reader.d.ts +20 -0
  106. package/dist/lib/local-llm/gguf-reader.d.ts.map +1 -0
  107. package/dist/lib/local-llm/gguf-reader.js +190 -0
  108. package/dist/lib/local-llm/gguf-reader.js.map +1 -0
  109. package/dist/lib/local-llm/index.d.ts +9 -0
  110. package/dist/lib/local-llm/index.d.ts.map +1 -0
  111. package/dist/lib/local-llm/index.js +6 -0
  112. package/dist/lib/local-llm/index.js.map +1 -0
  113. package/dist/lib/local-llm/llama-server-process.d.ts +42 -0
  114. package/dist/lib/local-llm/llama-server-process.d.ts.map +1 -0
  115. package/dist/lib/local-llm/llama-server-process.js +237 -0
  116. package/dist/lib/local-llm/llama-server-process.js.map +1 -0
  117. package/dist/lib/local-llm/mlx-binary-manager.d.ts +33 -0
  118. package/dist/lib/local-llm/mlx-binary-manager.d.ts.map +1 -0
  119. package/dist/lib/local-llm/mlx-binary-manager.js +211 -0
  120. package/dist/lib/local-llm/mlx-binary-manager.js.map +1 -0
  121. package/dist/lib/local-llm/mlx-server-process.d.ts +26 -0
  122. package/dist/lib/local-llm/mlx-server-process.d.ts.map +1 -0
  123. package/dist/lib/local-llm/mlx-server-process.js +210 -0
  124. package/dist/lib/local-llm/mlx-server-process.js.map +1 -0
  125. package/dist/lib/local-llm/model-manager.d.ts +33 -0
  126. package/dist/lib/local-llm/model-manager.d.ts.map +1 -0
  127. package/dist/lib/local-llm/model-manager.js +591 -0
  128. package/dist/lib/local-llm/model-manager.js.map +1 -0
  129. package/dist/lib/local-llm/types.d.ts +51 -0
  130. package/dist/lib/local-llm/types.d.ts.map +1 -0
  131. package/dist/lib/local-llm/types.js +2 -0
  132. package/dist/lib/local-llm/types.js.map +1 -0
  133. package/dist/lib/logger.d.ts +2 -0
  134. package/dist/lib/logger.d.ts.map +1 -1
  135. package/dist/lib/logger.js +68 -6
  136. package/dist/lib/logger.js.map +1 -1
  137. package/dist/lib/mcp/mcp-client.d.ts.map +1 -1
  138. package/dist/lib/mcp/mcp-client.js +5 -3
  139. package/dist/lib/mcp/mcp-client.js.map +1 -1
  140. package/dist/lib/mcp/types.d.ts +0 -9
  141. package/dist/lib/mcp/types.d.ts.map +1 -1
  142. package/dist/lib/mcp/types.js +1 -2
  143. package/dist/lib/mcp/types.js.map +1 -1
  144. package/dist/lib/memory/memory-manager.d.ts +1 -0
  145. package/dist/lib/memory/memory-manager.d.ts.map +1 -1
  146. package/dist/lib/memory/memory-manager.js +9 -0
  147. package/dist/lib/memory/memory-manager.js.map +1 -1
  148. package/dist/lib/orchestrator.d.ts +11 -8
  149. package/dist/lib/orchestrator.d.ts.map +1 -1
  150. package/dist/lib/orchestrator.js +246 -5
  151. package/dist/lib/orchestrator.js.map +1 -1
  152. package/dist/lib/sandbox/cdp-client.d.ts +15 -0
  153. package/dist/lib/sandbox/cdp-client.d.ts.map +1 -0
  154. package/dist/lib/sandbox/cdp-client.js +139 -0
  155. package/dist/lib/sandbox/cdp-client.js.map +1 -0
  156. package/dist/lib/sandbox/html-to-markdown.d.ts +9 -1
  157. package/dist/lib/sandbox/html-to-markdown.d.ts.map +1 -1
  158. package/dist/lib/sandbox/html-to-markdown.js +67 -10
  159. package/dist/lib/sandbox/html-to-markdown.js.map +1 -1
  160. package/dist/lib/sandbox/index.d.ts +6 -0
  161. package/dist/lib/sandbox/index.d.ts.map +1 -1
  162. package/dist/lib/sandbox/index.js +5 -0
  163. package/dist/lib/sandbox/index.js.map +1 -1
  164. package/dist/lib/sandbox/page-readiness.d.ts +37 -0
  165. package/dist/lib/sandbox/page-readiness.d.ts.map +1 -0
  166. package/dist/lib/sandbox/page-readiness.js +268 -0
  167. package/dist/lib/sandbox/page-readiness.js.map +1 -0
  168. package/dist/lib/sandbox/sandbox-browser.d.ts +4 -0
  169. package/dist/lib/sandbox/sandbox-browser.d.ts.map +1 -0
  170. package/dist/lib/sandbox/sandbox-browser.js +316 -0
  171. package/dist/lib/sandbox/sandbox-browser.js.map +1 -0
  172. package/dist/lib/sandbox/sandbox-container.d.ts +39 -0
  173. package/dist/lib/sandbox/sandbox-container.d.ts.map +1 -0
  174. package/dist/lib/sandbox/sandbox-container.js +176 -0
  175. package/dist/lib/sandbox/sandbox-container.js.map +1 -0
  176. package/dist/lib/sandbox/sandbox-file.d.ts +4 -0
  177. package/dist/lib/sandbox/sandbox-file.d.ts.map +1 -0
  178. package/dist/lib/sandbox/sandbox-file.js +169 -0
  179. package/dist/lib/sandbox/sandbox-file.js.map +1 -0
  180. package/dist/lib/sandbox/sandbox-shell.d.ts +5 -0
  181. package/dist/lib/sandbox/sandbox-shell.d.ts.map +1 -0
  182. package/dist/lib/sandbox/sandbox-shell.js +111 -0
  183. package/dist/lib/sandbox/sandbox-shell.js.map +1 -0
  184. package/dist/lib/sandbox/sandbox-web.d.ts.map +1 -1
  185. package/dist/lib/sandbox/sandbox-web.js +64 -24
  186. package/dist/lib/sandbox/sandbox-web.js.map +1 -1
  187. package/dist/lib/sandbox/types.d.ts +9 -0
  188. package/dist/lib/sandbox/types.d.ts.map +1 -1
  189. package/dist/lib/sandbox/types.js +1 -0
  190. package/dist/lib/sandbox/types.js.map +1 -1
  191. package/dist/lib/sandbox/vision-browser.d.ts +4 -0
  192. package/dist/lib/sandbox/vision-browser.d.ts.map +1 -0
  193. package/dist/lib/sandbox/vision-browser.js +298 -0
  194. package/dist/lib/sandbox/vision-browser.js.map +1 -0
  195. package/dist/lib/sea/app-window.d.ts +7 -0
  196. package/dist/lib/sea/app-window.d.ts.map +1 -0
  197. package/dist/lib/sea/app-window.js +95 -0
  198. package/dist/lib/sea/app-window.js.map +1 -0
  199. package/dist/lib/sea/bootstrap.d.ts +18 -0
  200. package/dist/lib/sea/bootstrap.d.ts.map +1 -0
  201. package/dist/lib/sea/bootstrap.js +103 -0
  202. package/dist/lib/sea/bootstrap.js.map +1 -0
  203. package/dist/lib/sea/sqlite-vec-shim.d.ts +3 -0
  204. package/dist/lib/sea/sqlite-vec-shim.d.ts.map +1 -0
  205. package/dist/lib/sea/sqlite-vec-shim.js +10 -0
  206. package/dist/lib/sea/sqlite-vec-shim.js.map +1 -0
  207. package/dist/lib/skills/skill-loader.d.ts +2 -0
  208. package/dist/lib/skills/skill-loader.d.ts.map +1 -1
  209. package/dist/lib/skills/skill-loader.js +12 -1
  210. package/dist/lib/skills/skill-loader.js.map +1 -1
  211. package/dist/lib/tasks/task-manager.d.ts +3 -1
  212. package/dist/lib/tasks/task-manager.d.ts.map +1 -1
  213. package/dist/lib/tasks/task-manager.js +11 -0
  214. package/dist/lib/tasks/task-manager.js.map +1 -1
  215. package/dist/lib/tasks/task-store.d.ts +1 -1
  216. package/dist/lib/tasks/task-store.d.ts.map +1 -1
  217. package/dist/lib/tasks/task-store.js.map +1 -1
  218. package/dist/lib/tasks/types.d.ts +18 -0
  219. package/dist/lib/tasks/types.d.ts.map +1 -1
  220. package/dist/lib/tools/built-in/integration-tools.d.ts +4 -0
  221. package/dist/lib/tools/built-in/integration-tools.d.ts.map +1 -0
  222. package/dist/lib/tools/built-in/integration-tools.js +47 -0
  223. package/dist/lib/tools/built-in/integration-tools.js.map +1 -0
  224. package/dist/lib/tools/built-in/knowledge-entity-lookup.tool.d.ts +1 -2
  225. package/dist/lib/tools/built-in/knowledge-entity-lookup.tool.d.ts.map +1 -1
  226. package/dist/lib/tools/built-in/knowledge-entity-lookup.tool.js +17 -17
  227. package/dist/lib/tools/built-in/knowledge-entity-lookup.tool.js.map +1 -1
  228. package/dist/lib/tools/built-in/knowledge-graph-schema.tool.d.ts.map +1 -1
  229. package/dist/lib/tools/built-in/knowledge-graph-schema.tool.js +2 -4
  230. package/dist/lib/tools/built-in/knowledge-graph-schema.tool.js.map +1 -1
  231. package/dist/lib/tools/built-in/knowledge-search.tool.js +4 -4
  232. package/dist/lib/tools/built-in/knowledge-search.tool.js.map +1 -1
  233. package/dist/lib/tools/built-in/knowledge-sql.tool.d.ts.map +1 -1
  234. package/dist/lib/tools/built-in/knowledge-sql.tool.js +74 -40
  235. package/dist/lib/tools/built-in/knowledge-sql.tool.js.map +1 -1
  236. package/dist/lib/tools/built-in/knowledge-tools-factory.js +2 -2
  237. package/dist/lib/tools/built-in/knowledge-tools-factory.js.map +1 -1
  238. package/dist/lib/tools/built-in/knowledge-traverse.tool.d.ts +1 -2
  239. package/dist/lib/tools/built-in/knowledge-traverse.tool.d.ts.map +1 -1
  240. package/dist/lib/tools/built-in/knowledge-traverse.tool.js +5 -11
  241. package/dist/lib/tools/built-in/knowledge-traverse.tool.js.map +1 -1
  242. package/dist/lib/tools/built-in/query-validators.d.ts.map +1 -1
  243. package/dist/lib/tools/built-in/query-validators.js +4 -0
  244. package/dist/lib/tools/built-in/query-validators.js.map +1 -1
  245. package/dist/lib/tools/workspace/workspace-tools.d.ts +1 -0
  246. package/dist/lib/tools/workspace/workspace-tools.d.ts.map +1 -1
  247. package/dist/lib/tools/workspace/workspace-tools.js +44 -4
  248. package/dist/lib/tools/workspace/workspace-tools.js.map +1 -1
  249. package/dist/lib/triggers/cron-trigger.d.ts +1 -1
  250. package/dist/lib/triggers/cron-trigger.d.ts.map +1 -1
  251. package/dist/lib/triggers/cron-trigger.js.map +1 -1
  252. package/dist/lib/triggers/trigger-manager.d.ts +1 -0
  253. package/dist/lib/triggers/trigger-manager.d.ts.map +1 -1
  254. package/dist/lib/triggers/trigger-manager.js +26 -0
  255. package/dist/lib/triggers/trigger-manager.js.map +1 -1
  256. package/dist/lib/triggers/webhook-trigger.d.ts +1 -1
  257. package/dist/lib/triggers/webhook-trigger.d.ts.map +1 -1
  258. package/dist/lib/triggers/webhook-trigger.js.map +1 -1
  259. package/dist/lib/types/llm-types.d.ts +22 -4
  260. package/dist/lib/types/llm-types.d.ts.map +1 -1
  261. package/dist/lib/types/llm-types.js +50 -0
  262. package/dist/lib/types/llm-types.js.map +1 -1
  263. package/dist/lib/types/tool-factory.d.ts +2 -2
  264. package/dist/lib/types/tool-factory.d.ts.map +1 -1
  265. package/dist/lib/types/tool-factory.js +9 -2
  266. package/dist/lib/types/tool-factory.js.map +1 -1
  267. package/dist/lib/utils/document-extract.d.ts +10 -0
  268. package/dist/lib/utils/document-extract.d.ts.map +1 -0
  269. package/dist/lib/utils/document-extract.js +149 -0
  270. package/dist/lib/utils/document-extract.js.map +1 -0
  271. package/dist/lib/utils/env-substitution.d.ts +6 -0
  272. package/dist/lib/utils/env-substitution.d.ts.map +1 -0
  273. package/dist/lib/utils/env-substitution.js +15 -0
  274. package/dist/lib/utils/env-substitution.js.map +1 -0
  275. package/dist/lib/workflows/react-workflow-executor.d.ts.map +1 -1
  276. package/dist/lib/workflows/react-workflow-executor.js +23 -17
  277. package/dist/lib/workflows/react-workflow-executor.js.map +1 -1
  278. package/dist/lib/workflows/types.d.ts +81 -55
  279. package/dist/lib/workflows/types.d.ts.map +1 -1
  280. package/dist/lib/workflows/types.js +10 -0
  281. package/dist/lib/workflows/types.js.map +1 -1
  282. package/dist/lib/workflows/workflow-loader.d.ts +3 -0
  283. package/dist/lib/workflows/workflow-loader.d.ts.map +1 -1
  284. package/dist/lib/workflows/workflow-loader.js +10 -1
  285. package/dist/lib/workflows/workflow-loader.js.map +1 -1
  286. package/dist/public/assets/logo.png +0 -0
  287. package/dist/public/chat.html +39 -0
  288. package/dist/public/index.html +6 -176
  289. package/dist/public/src/components/AgentComposer.js +807 -0
  290. package/dist/public/src/components/AgentsView.js +1812 -508
  291. package/dist/public/src/components/AppRoot.js +125 -38
  292. package/dist/public/src/components/GraphView.js +382 -300
  293. package/dist/public/src/components/IdeView.js +277 -86
  294. package/dist/public/src/components/KnowledgeView.js +94 -130
  295. package/dist/public/src/components/LlmView.js +15 -19
  296. package/dist/public/src/components/LocalLlmView.js +2440 -0
  297. package/dist/public/src/components/LogViewer.js +155 -0
  298. package/dist/public/src/components/McpView.js +41 -49
  299. package/dist/public/src/components/MonitorView.js +174 -83
  300. package/dist/public/src/components/NavBar.js +16 -26
  301. package/dist/public/src/components/StandaloneChat.js +875 -0
  302. package/dist/public/src/services/ApiService.js +203 -4
  303. package/dist/public/src/services/SessionStore.js +86 -0
  304. package/dist/public/src/services/StreamManager.js +183 -0
  305. package/dist/public/src/store.js +1 -3
  306. package/dist/public/src/utils/card.js +21 -0
  307. package/dist/public/src/utils/markdown.js +7 -0
  308. package/dist/public/styles.css +2777 -0
  309. package/dist/src/cli/commands/init.d.ts.map +1 -1
  310. package/dist/src/cli/commands/init.js +7 -1
  311. package/dist/src/cli/commands/init.js.map +1 -1
  312. package/dist/src/cli/commands/start.d.ts.map +1 -1
  313. package/dist/src/cli/commands/start.js +28 -5
  314. package/dist/src/cli/commands/start.js.map +1 -1
  315. package/dist/src/cli/index.js +19 -5
  316. package/dist/src/cli/index.js.map +1 -1
  317. package/dist/src/index.js +7 -1
  318. package/dist/src/index.js.map +1 -1
  319. package/dist/src/middleware/auth.d.ts.map +1 -1
  320. package/dist/src/middleware/auth.js +28 -6
  321. package/dist/src/middleware/auth.js.map +1 -1
  322. package/dist/src/middleware/rate-limit.d.ts +8 -0
  323. package/dist/src/middleware/rate-limit.d.ts.map +1 -0
  324. package/dist/src/middleware/rate-limit.js +21 -0
  325. package/dist/src/middleware/rate-limit.js.map +1 -0
  326. package/dist/src/routes/agents.route.d.ts.map +1 -1
  327. package/dist/src/routes/agents.route.js +138 -10
  328. package/dist/src/routes/agents.route.js.map +1 -1
  329. package/dist/src/routes/chat.route.d.ts +3 -0
  330. package/dist/src/routes/chat.route.d.ts.map +1 -0
  331. package/dist/src/routes/chat.route.js +156 -0
  332. package/dist/src/routes/chat.route.js.map +1 -0
  333. package/dist/src/routes/files.route.d.ts.map +1 -1
  334. package/dist/src/routes/files.route.js +37 -2
  335. package/dist/src/routes/files.route.js.map +1 -1
  336. package/dist/src/routes/llm.route.d.ts.map +1 -1
  337. package/dist/src/routes/llm.route.js +263 -8
  338. package/dist/src/routes/llm.route.js.map +1 -1
  339. package/dist/src/routes/local-llm.route.d.ts +3 -0
  340. package/dist/src/routes/local-llm.route.d.ts.map +1 -0
  341. package/dist/src/routes/local-llm.route.js +688 -0
  342. package/dist/src/routes/local-llm.route.js.map +1 -0
  343. package/dist/src/routes/logs.route.d.ts +3 -0
  344. package/dist/src/routes/logs.route.d.ts.map +1 -0
  345. package/dist/src/routes/logs.route.js +24 -0
  346. package/dist/src/routes/logs.route.js.map +1 -0
  347. package/dist/src/routes/tasks.route.d.ts.map +1 -1
  348. package/dist/src/routes/tasks.route.js +15 -1
  349. package/dist/src/routes/tasks.route.js.map +1 -1
  350. package/dist/src/routes/vnc.route.d.ts +12 -0
  351. package/dist/src/routes/vnc.route.d.ts.map +1 -0
  352. package/dist/src/routes/vnc.route.js +74 -0
  353. package/dist/src/routes/vnc.route.js.map +1 -0
  354. package/dist/src/routes/workflows.route.d.ts.map +1 -1
  355. package/dist/src/routes/workflows.route.js +24 -0
  356. package/dist/src/routes/workflows.route.js.map +1 -1
  357. package/dist/src/server.d.ts.map +1 -1
  358. package/dist/src/server.js +29 -3
  359. package/dist/src/server.js.map +1 -1
  360. package/dist/templates/Demo.md +152 -0
  361. package/dist/templates/README.md +12 -3
  362. package/dist/templates/agents/actor.agent.yaml +34 -0
  363. package/dist/templates/agents/architect.agent.yaml +20 -13
  364. package/dist/templates/agents/chatbot.agent.yaml +23 -27
  365. package/dist/templates/agents/corporate.agent.yaml +64 -0
  366. package/dist/templates/agents/functions.agent.yaml +29 -0
  367. package/dist/templates/agents/investment-analyst.agent.yaml +79 -0
  368. package/dist/templates/agents/music-librarian.agent.yaml +46 -0
  369. package/dist/templates/agents/network-security.agent.yaml +81 -0
  370. package/dist/templates/agents/transport-security.agent.yaml +69 -0
  371. package/dist/templates/agents/web-engineer.agent.yaml +98 -0
  372. package/dist/templates/agents/web-pilot.agent.yaml +57 -0
  373. package/dist/templates/knowledge/music-store/LICENSE.md +11 -0
  374. package/dist/templates/knowledge/music-store/musicstore.sqlite +0 -0
  375. package/dist/templates/knowledge/music-store/tables.png +0 -0
  376. package/dist/templates/knowledge/music-store.knowledge.yaml +138 -0
  377. package/dist/templates/knowledge/org-chart/personnel.csv +21 -21
  378. package/dist/templates/knowledge/org-chart.knowledge.yaml +4 -0
  379. package/dist/templates/knowledge/patient-records.knowledge.yaml +20 -0
  380. package/dist/templates/knowledge/pdf-patients/PDF_Deid_Deidentification_0.pdf +0 -0
  381. package/dist/templates/knowledge/pdf-patients/PDF_Deid_Deidentification_1.pdf +0 -0
  382. package/dist/templates/knowledge/pdf-patients/PDF_Deid_Deidentification_10.pdf +0 -0
  383. package/dist/templates/knowledge/pdf-patients/PDF_Deid_Deidentification_11.pdf +0 -0
  384. package/dist/templates/knowledge/pet-store.knowledge.yaml +3 -0
  385. package/dist/templates/knowledge/security-incidents/incidents.json +55935 -0
  386. package/dist/templates/knowledge/security-incidents.knowledge.yaml +46 -0
  387. package/dist/templates/knowledge/{example.knowledge.yaml → transcripts.knowledge.yaml} +9 -5
  388. package/dist/templates/knowledge/transport-ot/systems.csv +117 -0
  389. package/dist/templates/knowledge/transport-ot.knowledge.yaml +55 -0
  390. package/dist/templates/knowledge/web-docs.knowledge.yaml +1 -1
  391. package/dist/templates/llm.json +62 -22
  392. package/dist/templates/mcp.json +7 -4
  393. package/dist/templates/skills/orcha-builder/SKILL.md +148 -215
  394. package/dist/templates/skills/pii-guard/SKILL.md +22 -0
  395. package/dist/templates/skills/sandbox/SKILL.md +25 -48
  396. package/dist/templates/skills/web-pilot/SKILL.md +51 -0
  397. package/dist/templates/workflows/example.workflow.yaml +27 -35
  398. package/dist/templates/workflows/react-example.workflow.yaml +14 -19
  399. package/dist/templates/workflows/team-chat.workflow.yaml +47 -0
  400. package/package.json +17 -4
  401. package/dist/public/src/components/SkillsView.js +0 -137
  402. package/dist/public/src/components/WorkflowsView.js +0 -416
  403. package/dist/templates/agents/knowledge-broker.agent.yaml +0 -39
  404. package/dist/templates/agents/sandbox.agent.yaml +0 -56
@@ -0,0 +1,56 @@
1
+ import { LlamaCppEngine } from "./engines/llama-cpp-engine.js";
2
+ import { MlxServeEngine } from "./engines/mlx-serve-engine.js";
3
+ import { ModelManager } from "./model-manager.js";
4
+ export class EngineRegistry {
5
+ engines = new Map();
6
+ _baseDir = '';
7
+ constructor() {
8
+ this.register(new LlamaCppEngine());
9
+ this.register(new MlxServeEngine());
10
+ }
11
+ register(engine) {
12
+ this.engines.set(engine.engineName, engine);
13
+ }
14
+ getEngine(name) {
15
+ return this.engines.get(name);
16
+ }
17
+ getAvailableEngines() {
18
+ return [...this.engines.values()].filter(e => e.isAvailable());
19
+ }
20
+ getAllEngines() {
21
+ return [...this.engines.values()];
22
+ }
23
+ getAllStatus() {
24
+ const result = {};
25
+ for (const [name, engine] of this.engines) {
26
+ result[name] = engine.getStatus();
27
+ }
28
+ return result;
29
+ }
30
+ setBaseDir(dir) {
31
+ this._baseDir = dir;
32
+ for (const engine of this.engines.values()) {
33
+ engine.setBaseDir(dir);
34
+ }
35
+ }
36
+ killAllOrphans() {
37
+ for (const engine of this.engines.values()) {
38
+ engine.killOrphans();
39
+ }
40
+ }
41
+ async unloadAll() {
42
+ for (const engine of this.engines.values()) {
43
+ await engine.unloadChat();
44
+ await engine.unloadEmbedding();
45
+ }
46
+ }
47
+ async resolveModelPath(modelName) {
48
+ const manager = new ModelManager(this._baseDir);
49
+ const result = await manager.findModelFile(modelName);
50
+ if (!result)
51
+ throw new Error(`Local model "${modelName}" not found. Download it first.`);
52
+ return result;
53
+ }
54
+ }
55
+ export const engineRegistry = new EngineRegistry();
56
+ //# sourceMappingURL=engine-registry.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"engine-registry.js","sourceRoot":"","sources":["../../../lib/local-llm/engine-registry.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,cAAc,EAAE,MAAM,+BAA+B,CAAC;AAC/D,OAAO,EAAE,cAAc,EAAE,MAAM,+BAA+B,CAAC;AAC/D,OAAO,EAAE,YAAY,EAAE,MAAM,oBAAoB,CAAC;AAGlD,MAAM,OAAO,cAAc;IACjB,OAAO,GAAG,IAAI,GAAG,EAAuB,CAAC;IACzC,QAAQ,GAAG,EAAE,CAAC;IAEtB;QACE,IAAI,CAAC,QAAQ,CAAC,IAAI,cAAc,EAAE,CAAC,CAAC;QACpC,IAAI,CAAC,QAAQ,CAAC,IAAI,cAAc,EAAE,CAAC,CAAC;IACtC,CAAC;IAED,QAAQ,CAAC,MAAmB;QAC1B,IAAI,CAAC,OAAO,CAAC,GAAG,CAAC,MAAM,CAAC,UAAU,EAAE,MAAM,CAAC,CAAC;IAC9C,CAAC;IAED,SAAS,CAAC,IAAY;QACpB,OAAO,IAAI,CAAC,OAAO,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC;IAChC,CAAC;IAED,mBAAmB;QACjB,OAAO,CAAC,GAAG,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,WAAW,EAAE,CAAC,CAAC;IACjE,CAAC;IAED,aAAa;QACX,OAAO,CAAC,GAAG,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC;IACpC,CAAC;IAED,YAAY;QACV,MAAM,MAAM,GAAiC,EAAE,CAAC;QAChD,KAAK,MAAM,CAAC,IAAI,EAAE,MAAM,CAAC,IAAI,IAAI,CAAC,OAAO,EAAE,CAAC;YAC1C,MAAM,CAAC,IAAI,CAAC,GAAG,MAAM,CAAC,SAAS,EAAE,CAAC;QACpC,CAAC;QACD,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,UAAU,CAAC,GAAW;QACpB,IAAI,CAAC,QAAQ,GAAG,GAAG,CAAC;QACpB,KAAK,MAAM,MAAM,IAAI,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC;YAC3C,MAAM,CAAC,UAAU,CAAC,GAAG,CAAC,CAAC;QACzB,CAAC;IACH,CAAC;IAED,cAAc;QACZ,KAAK,MAAM,MAAM,IAAI,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC;YAC3C,MAAM,CAAC,WAAW,EAAE,CAAC;QACvB,CAAC;IACH,CAAC;IAED,KAAK,CAAC,SAAS;QACb,KAAK,MAAM,MAAM,IAAI,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC;YAC3C,MAAM,MAAM,CAAC,UAAU,EAAE,CAAC;YAC1B,MAAM,MAAM,CAAC,eAAe,EAAE,CAAC;QACjC,CAAC;IACH,CAAC;IAED,KAAK,CAAC,gBAAgB,CAAC,SAAiB;QACtC,MAAM,OAAO,GAAG,IAAI,YAAY,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAChD,MAAM,MAAM,GAAG,MAAM,OAAO,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;QACtD,IAAI,CAAC,MAAM;YAAE,MAAM,IAAI,KAAK,CAAC,gBAAgB,SAAS,iCAAiC,CAAC,CAAC;QACzF,OAAO,MAAM,CAAC;IAChB,CAAC;CACF;AAED,MAAM,CAAC,MAAM,cAAc,GAAG,IAAI,cAAc,EAAE,CAAC"}
@@ -0,0 +1,31 @@
1
+ import type { LocalEngine, EngineChatStatus, EngineServerStatus, EngineStatus, LoadOptions } from '../engine-interface.ts';
2
// Type declaration for the LocalEngine implementation registered under the
// name "llama-cpp". It exposes separate chat and embedding server lifecycles
// plus binary version/update queries.
+ export declare class LlamaCppEngine implements LocalEngine {
3
// Name under which this engine is registered and looked up.
+ readonly engineName = "llama-cpp";
4
// Private state: base directory, the chat and embedding server handles, and
// values recorded while loading a chat model (context size, memory estimate,
// vision support).
+ private _baseDir;
5
+ private chatServer;
6
+ private embeddingServer;
7
+ private _detectedContextSize;
8
+ private _memoryEstimate;
9
+ private _supportsVision;
10
// Stores the base directory used by later calls.
+ setBaseDir(dir: string): void;
11
// True when a binary version can be determined for the current base directory.
+ isAvailable(): boolean;
12
// --- Chat model lifecycle ---
// loadChat takes a model file path; ensureRunningChat takes a model name.
// NOTE(review): ensureRunningChat presumably resolves the name to a path
// before loading — confirm against the implementation.
+ loadChat(modelPath: string, opts?: LoadOptions): Promise<void>;
13
+ unloadChat(): Promise<void>;
14
+ swapChat(modelPath: string, opts?: LoadOptions): Promise<void>;
15
+ ensureRunningChat(modelName: string, opts?: LoadOptions): Promise<void>;
16
+ getChatStatus(): EngineChatStatus;
17
// NOTE(review): null presumably means no chat server is running — confirm.
+ getChatBaseUrl(): string | null;
18
// --- Embedding model lifecycle (same shape as chat, but without load options) ---
+ loadEmbedding(modelPath: string): Promise<void>;
19
+ unloadEmbedding(): Promise<void>;
20
+ ensureRunningEmbedding(modelName: string): Promise<void>;
21
+ getEmbeddingStatus(): EngineServerStatus;
22
+ getEmbeddingBaseUrl(): string | null;
23
// --- Engine-wide status and process cleanup ---
+ getStatus(): EngineStatus;
24
+ killOrphans(): void;
25
// --- Binary management ---
+ getBinaryVersion(): string | null;
26
// Reports whether the binary is a managed or a system one; null when neither applies.
+ getBinarySource(): 'managed' | 'system' | null;
27
// NOTE(review): the result is typed `any`; the shape of the update info is not visible here.
+ checkForUpdate(): Promise<any>;
28
+ updateBinary(): Promise<void>;
29
+ private resolveModelPath;
30
+ }
31
+ //# sourceMappingURL=llama-cpp-engine.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"llama-cpp-engine.d.ts","sourceRoot":"","sources":["../../../../lib/local-llm/engines/llama-cpp-engine.ts"],"names":[],"mappings":"AAOA,OAAO,KAAK,EAAE,WAAW,EAAE,gBAAgB,EAAE,kBAAkB,EAAE,YAAY,EAAE,WAAW,EAAE,MAAM,wBAAwB,CAAC;AAE3H,qBAAa,cAAe,YAAW,WAAW;IAChD,QAAQ,CAAC,UAAU,eAAe;IAElC,OAAO,CAAC,QAAQ,CAAM;IACtB,OAAO,CAAC,UAAU,CAAmC;IACrD,OAAO,CAAC,eAAe,CAAmC;IAC1D,OAAO,CAAC,oBAAoB,CAAuB;IACnD,OAAO,CAAC,eAAe,CAAiF;IACxG,OAAO,CAAC,eAAe,CAAS;IAEhC,UAAU,CAAC,GAAG,EAAE,MAAM,GAAG,IAAI;IAI7B,WAAW,IAAI,OAAO;IAMhB,QAAQ,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,WAAW,GAAG,OAAO,CAAC,IAAI,CAAC;IA8C9D,UAAU,IAAI,OAAO,CAAC,IAAI,CAAC;IAM3B,QAAQ,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,WAAW,GAAG,OAAO,CAAC,IAAI,CAAC;IAK9D,iBAAiB,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,WAAW,GAAG,OAAO,CAAC,IAAI,CAAC;IAO7E,aAAa,IAAI,gBAAgB;IAYjC,cAAc,IAAI,MAAM,GAAG,IAAI;IAMzB,aAAa,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAM/C,eAAe,IAAI,OAAO,CAAC,IAAI,CAAC;IAMhC,sBAAsB,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAO9D,kBAAkB,IAAI,kBAAkB;IAWxC,mBAAmB,IAAI,MAAM,GAAG,IAAI;IAMpC,SAAS,IAAI,YAAY;IASzB,WAAW,IAAI,IAAI;IAMnB,gBAAgB,IAAI,MAAM,GAAG,IAAI;IAIjC,eAAe,IAAI,SAAS,GAAG,QAAQ,GAAG,IAAI;IAMxC,cAAc,IAAI,OAAO,CAAC,GAAG,CAAC;IAI9B,YAAY,IAAI,OAAO,CAAC,IAAI,CAAC;YAMrB,gBAAgB;CAM/B"}
@@ -0,0 +1,164 @@
1
+ import * as path from 'path';
2
+ import { LlamaServerProcess } from "../llama-server-process.js";
3
+ import { killOrphanedServers } from "../llama-server-process.js";
4
+ import { ModelManager } from "../model-manager.js";
5
+ import { readGGUFModelInfo, calculateOptimalContextSize, kvCacheBytesPerToken } from "../gguf-reader.js";
6
+ import { detectGpu, getBinaryVersion, isSystemBinary, updateBinary, checkForUpdate } from "../binary-manager.js";
7
+ import { logger } from "../../logger.js";
8
+ export class LlamaCppEngine {
9
+ engineName = 'llama-cpp';
10
+ _baseDir = '';
11
+ chatServer = null;
12
+ embeddingServer = null;
13
+ _detectedContextSize = null;
14
+ _memoryEstimate = null;
15
+ _supportsVision = false;
16
+ setBaseDir(dir) {
17
+ this._baseDir = dir;
18
+ }
19
+ isAvailable() {
20
+ return getBinaryVersion(this._baseDir) !== null;
21
+ }
22
+ // ─── Chat ───────────────────────────────────────────────────────────────────
23
+ async loadChat(modelPath, opts) {
24
+ if (!this.chatServer)
25
+ this.chatServer = new LlamaServerProcess(this._baseDir);
26
+ if (this.chatServer.running && this.chatServer.modelPath === modelPath)
27
+ return;
28
+ let contextSize = opts?.contextSize;
29
+ const modelInfo = await readGGUFModelInfo(modelPath);
30
+ if (!contextSize && modelInfo) {
31
+ contextSize = calculateOptimalContextSize(modelInfo);
32
+ }
33
+ if (modelInfo && contextSize) {
34
+ const kvBytes = contextSize * kvCacheBytesPerToken(modelInfo);
35
+ this._memoryEstimate = {
36
+ modelBytes: modelInfo.fileSizeBytes,
37
+ kvCacheBytes: kvBytes,
38
+ totalBytes: modelInfo.fileSizeBytes + kvBytes,
39
+ };
40
+ }
41
+ // Auto-detect multimodal projector (mmproj) for vision support
42
+ const modelFileName = path.basename(modelPath);
43
+ const manager = new ModelManager(this._baseDir);
44
+ const mmproj = await manager.findMmprojForModel(modelFileName);
45
+ this._supportsVision = !!mmproj;
46
+ if (mmproj) {
47
+ logger.info(`[LlamaCppEngine] Vision enabled with mmproj: ${path.basename(mmproj)}`);
48
+ }
49
+ this._detectedContextSize = contextSize ?? null;
50
+ const gpu = detectGpu();
51
+ const isGpu = gpu.accel !== 'none';
52
+ const isMetal = gpu.accel === 'metal';
53
+ await this.chatServer.start({
54
+ modelPath,
55
+ contextSize,
56
+ mmproj: mmproj ?? undefined,
57
+ gpuLayers: isGpu ? -1 : 0,
58
+ flashAttn: isGpu,
59
+ ...(isGpu ? { batchSize: 4096, ubatchSize: 1024 } : {}),
60
+ ...(isMetal ? { cacheTypeK: 'q8_0', cacheTypeV: 'q8_0', mlock: true } : {}),
61
+ ...(opts?.reasoningBudget !== undefined ? { reasoningBudget: opts.reasoningBudget } : {}),
62
+ });
63
+ }
64
+ async unloadChat() {
65
+ if (this.chatServer) {
66
+ await this.chatServer.stop();
67
+ }
68
+ }
69
+ async swapChat(modelPath, opts) {
70
+ await this.unloadChat();
71
+ await this.loadChat(modelPath, opts);
72
+ }
73
+ async ensureRunningChat(modelName, opts) {
74
+ if (this.chatServer?.running)
75
+ return;
76
+ logger.info(`[LlamaCppEngine] Auto-starting chat model: ${modelName}`);
77
+ const { filePath } = await this.resolveModelPath(modelName);
78
+ await this.loadChat(filePath, opts);
79
+ }
80
+ getChatStatus() {
81
+ const running = this.chatServer?.running ?? false;
82
+ return {
83
+ running,
84
+ activeModel: running ? (this.chatServer?.modelPath ?? null) : null,
85
+ port: this.chatServer?.port ?? null,
86
+ contextSize: this._detectedContextSize,
87
+ memoryEstimate: this._memoryEstimate,
88
+ supportsVision: this._supportsVision,
89
+ };
90
+ }
91
+ getChatBaseUrl() {
92
+ return this.chatServer?.ready ? this.chatServer.getBaseUrl() : null;
93
+ }
94
+ // ─── Embedding ──────────────────────────────────────────────────────────────
95
+ async loadEmbedding(modelPath) {
96
+ if (!this.embeddingServer)
97
+ this.embeddingServer = new LlamaServerProcess(this._baseDir, true);
98
+ if (this.embeddingServer.running && this.embeddingServer.modelPath === modelPath)
99
+ return;
100
+ await this.embeddingServer.start({ modelPath, embedding: true });
101
+ }
102
+ async unloadEmbedding() {
103
+ if (this.embeddingServer) {
104
+ await this.embeddingServer.stop();
105
+ }
106
+ }
107
+ async ensureRunningEmbedding(modelName) {
108
+ if (this.embeddingServer?.running)
109
+ return;
110
+ logger.info(`[LlamaCppEngine] Auto-starting embedding model: ${modelName}`);
111
+ const { filePath } = await this.resolveModelPath(modelName);
112
+ await this.loadEmbedding(filePath);
113
+ }
114
+ getEmbeddingStatus() {
115
+ const running = this.embeddingServer?.running ?? false;
116
+ return {
117
+ running,
118
+ activeModel: running ? (this.embeddingServer?.modelPath ?? null) : null,
119
+ port: this.embeddingServer?.port ?? null,
120
+ contextSize: null,
121
+ memoryEstimate: null,
122
+ };
123
+ }
124
+ getEmbeddingBaseUrl() {
125
+ return this.embeddingServer?.ready ? this.embeddingServer.getBaseUrl() : null;
126
+ }
127
+ // ─── Combined ───────────────────────────────────────────────────────────────
128
+ getStatus() {
129
+ return {
130
+ engineName: this.engineName,
131
+ available: this.isAvailable(),
132
+ chat: this.getChatStatus(),
133
+ embedding: this.getEmbeddingStatus(),
134
+ };
135
+ }
136
+ killOrphans() {
137
+ killOrphanedServers(this._baseDir);
138
+ }
139
+ // ─── Binary management ─────────────────────────────────────────────────────
140
+ getBinaryVersion() {
141
+ return getBinaryVersion(this._baseDir);
142
+ }
143
+ getBinarySource() {
144
+ const version = getBinaryVersion(this._baseDir);
145
+ if (!version)
146
+ return null;
147
+ return isSystemBinary() ? 'system' : 'managed';
148
+ }
149
+ async checkForUpdate() {
150
+ return checkForUpdate(this._baseDir);
151
+ }
152
+ async updateBinary() {
153
+ return updateBinary(this._baseDir);
154
+ }
155
+ // ─── Private ────────────────────────────────────────────────────────────────
156
+ async resolveModelPath(modelName) {
157
+ const manager = new ModelManager(this._baseDir);
158
+ const result = await manager.findModelFile(modelName);
159
+ if (!result)
160
+ throw new Error(`Local model "${modelName}" not found. Download it first.`);
161
+ return result;
162
+ }
163
+ }
164
+ //# sourceMappingURL=llama-cpp-engine.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"llama-cpp-engine.js","sourceRoot":"","sources":["../../../../lib/local-llm/engines/llama-cpp-engine.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,IAAI,MAAM,MAAM,CAAC;AAC7B,OAAO,EAAE,kBAAkB,EAAE,MAAM,4BAA4B,CAAC;AAChE,OAAO,EAAE,mBAAmB,EAAE,MAAM,4BAA4B,CAAC;AACjE,OAAO,EAAE,YAAY,EAAE,MAAM,qBAAqB,CAAC;AACnD,OAAO,EAAE,iBAAiB,EAAE,2BAA2B,EAAE,oBAAoB,EAAE,MAAM,mBAAmB,CAAC;AACzG,OAAO,EAAE,SAAS,EAAE,gBAAgB,EAAE,cAAc,EAAE,YAAY,EAAE,cAAc,EAAE,MAAM,sBAAsB,CAAC;AACjH,OAAO,EAAE,MAAM,EAAE,MAAM,iBAAiB,CAAC;AAGzC,MAAM,OAAO,cAAc;IAChB,UAAU,GAAG,WAAW,CAAC;IAE1B,QAAQ,GAAG,EAAE,CAAC;IACd,UAAU,GAA8B,IAAI,CAAC;IAC7C,eAAe,GAA8B,IAAI,CAAC;IAClD,oBAAoB,GAAkB,IAAI,CAAC;IAC3C,eAAe,GAA4E,IAAI,CAAC;IAChG,eAAe,GAAG,KAAK,CAAC;IAEhC,UAAU,CAAC,GAAW;QACpB,IAAI,CAAC,QAAQ,GAAG,GAAG,CAAC;IACtB,CAAC;IAED,WAAW;QACT,OAAO,gBAAgB,CAAC,IAAI,CAAC,QAAQ,CAAC,KAAK,IAAI,CAAC;IAClD,CAAC;IAED,+EAA+E;IAE/E,KAAK,CAAC,QAAQ,CAAC,SAAiB,EAAE,IAAkB;QAClD,IAAI,CAAC,IAAI,CAAC,UAAU;YAAE,IAAI,CAAC,UAAU,GAAG,IAAI,kBAAkB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAC9E,IAAI,IAAI,CAAC,UAAU,CAAC,OAAO,IAAI,IAAI,CAAC,UAAU,CAAC,SAAS,KAAK,SAAS;YAAE,OAAO;QAE/E,IAAI,WAAW,GAAG,IAAI,EAAE,WAAW,CAAC;QAEpC,MAAM,SAAS,GAAG,MAAM,iBAAiB,CAAC,SAAS,CAAC,CAAC;QACrD,IAAI,CAAC,WAAW,IAAI,SAAS,EAAE,CAAC;YAC9B,WAAW,GAAG,2BAA2B,CAAC,SAAS,CAAC,CAAC;QACvD,CAAC;QAED,IAAI,SAAS,IAAI,WAAW,EAAE,CAAC;YAC7B,MAAM,OAAO,GAAG,WAAW,GAAG,oBAAoB,CAAC,SAAS,CAAC,CAAC;YAC9D,IAAI,CAAC,eAAe,GAAG;gBACrB,UAAU,EAAE,SAAS,CAAC,aAAa;gBACnC,YAAY,EAAE,OAAO;gBACrB,UAAU,EAAE,SAAS,CAAC,aAAa,GAAG,OAAO;aAC9C,CAAC;QACJ,CAAC;QAED,+DAA+D;QAC/D,MAAM,aAAa,GAAG,IAAI,CAAC,QAAQ,CAAC,SAAS,CAAC,CAAC;QAC/C,MAAM,OAAO,GAAG,IAAI,YAAY,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAChD,MAAM,MAAM,GAAG,MAAM,OAAO,CAAC,kBAAkB,CAAC,aAAa,CAAC,CAAC;QAC/D,IAAI,CAAC,eAAe,GAAG,CAAC,CAAC,MAAM,CAAC;QAEhC,IAAI,MAAM,EAAE,CAAC;YACX,MAAM,CAAC,IAAI,CAAC,gDAAgD,IAAI,CAAC,QAAQ,CAAC,MAAM,CAAC,EAAE,CAAC,CAAC;QACvF,CAAC;QAED,IAAI,CAAC,oBAAoB,GAAG,WAAW,IAAI,IAAI,CAAC;QAChD,MAAM,GAAG,GAAG,SAAS,EAAE,CAAC;QACxB,MAAM,KAAK,GAAG,GAAG,CAAC,
KAAK,KAAK,MAAM,CAAC;QACnC,MAAM,OAAO,GAAG,GAAG,CAAC,KAAK,KAAK,OAAO,CAAC;QACtC,MAAM,IAAI,CAAC,UAAU,CAAC,KAAK,CAAC;YAC1B,SAAS;YACT,WAAW;YACX,MAAM,EAAE,MAAM,IAAI,SAAS;YAC3B,SAAS,EAAE,KAAK,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YACzB,SAAS,EAAE,KAAK;YAChB,GAAG,CAAC,KAAK,CAAC,CAAC,CAAC,EAAE,SAAS,EAAE,IAAI,EAAE,UAAU,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;YACvD,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,UAAU,EAAE,MAAM,EAAE,UAAU,EAAE,MAAM,EAAE,KAAK,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;YAC3E,GAAG,CAAC,IAAI,EAAE,eAAe,KAAK,SAAS,CAAC,CAAC,CAAC,EAAE,eAAe,EAAE,IAAI,CAAC,eAAe,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;SAC1F,CAAC,CAAC;IACL,CAAC;IAED,KAAK,CAAC,UAAU;QACd,IAAI,IAAI,CAAC,UAAU,EAAE,CAAC;YACpB,MAAM,IAAI,CAAC,UAAU,CAAC,IAAI,EAAE,CAAC;QAC/B,CAAC;IACH,CAAC;IAED,KAAK,CAAC,QAAQ,CAAC,SAAiB,EAAE,IAAkB;QAClD,MAAM,IAAI,CAAC,UAAU,EAAE,CAAC;QACxB,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,EAAE,IAAI,CAAC,CAAC;IACvC,CAAC;IAED,KAAK,CAAC,iBAAiB,CAAC,SAAiB,EAAE,IAAkB;QAC3D,IAAI,IAAI,CAAC,UAAU,EAAE,OAAO;YAAE,OAAO;QACrC,MAAM,CAAC,IAAI,CAAC,8CAA8C,SAAS,EAAE,CAAC,CAAC;QACvE,MAAM,EAAE,QAAQ,EAAE,GAAG,MAAM,IAAI,CAAC,gBAAgB,CAAC,SAAS,CAAC,CAAC;QAC5D,MAAM,IAAI,CAAC,QAAQ,CAAC,QAAQ,EAAE,IAAI,CAAC,CAAC;IACtC,CAAC;IAED,aAAa;QACX,MAAM,OAAO,GAAG,IAAI,CAAC,UAAU,EAAE,OAAO,IAAI,KAAK,CAAC;QAClD,OAAO;YACL,OAAO;YACP,WAAW,EAAE,OAAO,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,UAAU,EAAE,SAAS,IAAI,IAAI,CAAC,CAAC,CAAC,CAAC,IAAI;YAClE,IAAI,EAAE,IAAI,CAAC,UAAU,EAAE,IAAI,IAAI,IAAI;YACnC,WAAW,EAAE,IAAI,CAAC,oBAAoB;YACtC,cAAc,EAAE,IAAI,CAAC,eAAe;YACpC,cAAc,EAAE,IAAI,CAAC,eAAe;SACrC,CAAC;IACJ,CAAC;IAED,cAAc;QACZ,OAAO,IAAI,CAAC,UAAU,EAAE,KAAK,CAAC,CAAC,CAAC,IAAI,CAAC,UAAU,CAAC,UAAU,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC;IACtE,CAAC;IAED,+EAA+E;IAE/E,KAAK,CAAC,aAAa,CAAC,SAAiB;QACnC,IAAI,CAAC,IAAI,CAAC,eAAe;YAAE,IAAI,CAAC,eAAe,GAAG,IAAI,kBAAkB,CAAC,IAAI,CAAC,QAAQ,EAAE,IAAI,CAAC,CAAC;QAC9F,IAAI,IAAI,CAAC,eAAe,CAAC,OAAO,IAAI,IAAI,CAAC,eAAe,CAAC,SAAS,KAAK,SAAS;YAAE,OAAO;QACzF,MAAM,IAAI,CAAC,eAAe,CAAC,KAAK,CAAC,EAAE,SAAS,EAAE,SAAS,EAAE,IAAI,EAAE,CAAC,CAAC;IACnE,CAAC;IAED,KA
AK,CAAC,eAAe;QACnB,IAAI,IAAI,CAAC,eAAe,EAAE,CAAC;YACzB,MAAM,IAAI,CAAC,eAAe,CAAC,IAAI,EAAE,CAAC;QACpC,CAAC;IACH,CAAC;IAED,KAAK,CAAC,sBAAsB,CAAC,SAAiB;QAC5C,IAAI,IAAI,CAAC,eAAe,EAAE,OAAO;YAAE,OAAO;QAC1C,MAAM,CAAC,IAAI,CAAC,mDAAmD,SAAS,EAAE,CAAC,CAAC;QAC5E,MAAM,EAAE,QAAQ,EAAE,GAAG,MAAM,IAAI,CAAC,gBAAgB,CAAC,SAAS,CAAC,CAAC;QAC5D,MAAM,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,CAAC;IACrC,CAAC;IAED,kBAAkB;QAChB,MAAM,OAAO,GAAG,IAAI,CAAC,eAAe,EAAE,OAAO,IAAI,KAAK,CAAC;QACvD,OAAO;YACL,OAAO;YACP,WAAW,EAAE,OAAO,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,eAAe,EAAE,SAAS,IAAI,IAAI,CAAC,CAAC,CAAC,CAAC,IAAI;YACvE,IAAI,EAAE,IAAI,CAAC,eAAe,EAAE,IAAI,IAAI,IAAI;YACxC,WAAW,EAAE,IAAI;YACjB,cAAc,EAAE,IAAI;SACrB,CAAC;IACJ,CAAC;IAED,mBAAmB;QACjB,OAAO,IAAI,CAAC,eAAe,EAAE,KAAK,CAAC,CAAC,CAAC,IAAI,CAAC,eAAe,CAAC,UAAU,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC;IAChF,CAAC;IAED,+EAA+E;IAE/E,SAAS;QACP,OAAO;YACL,UAAU,EAAE,IAAI,CAAC,UAAU;YAC3B,SAAS,EAAE,IAAI,CAAC,WAAW,EAAE;YAC7B,IAAI,EAAE,IAAI,CAAC,aAAa,EAAE;YAC1B,SAAS,EAAE,IAAI,CAAC,kBAAkB,EAAE;SACrC,CAAC;IACJ,CAAC;IAED,WAAW;QACT,mBAAmB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IACrC,CAAC;IAED,8EAA8E;IAE9E,gBAAgB;QACd,OAAO,gBAAgB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IACzC,CAAC;IAED,eAAe;QACb,MAAM,OAAO,GAAG,gBAAgB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAChD,IAAI,CAAC,OAAO;YAAE,OAAO,IAAI,CAAC;QAC1B,OAAO,cAAc,EAAE,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,CAAC,SAAS,CAAC;IACjD,CAAC;IAED,KAAK,CAAC,cAAc;QAClB,OAAO,cAAc,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IACvC,CAAC;IAED,KAAK,CAAC,YAAY;QAChB,OAAO,YAAY,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IACrC,CAAC;IAED,+EAA+E;IAEvE,KAAK,CAAC,gBAAgB,CAAC,SAAiB;QAC9C,MAAM,OAAO,GAAG,IAAI,YAAY,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAChD,MAAM,MAAM,GAAG,MAAM,OAAO,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;QACtD,IAAI,CAAC,MAAM;YAAE,MAAM,IAAI,KAAK,CAAC,gBAAgB,SAAS,iCAAiC,CAAC,CAAC;QACzF,OAAO,MAAM,CAAC;IAChB,CAAC;CACF"}
@@ -0,0 +1,31 @@
1
+ import type { LocalEngine, EngineChatStatus, EngineServerStatus, EngineStatus, LoadOptions } from '../engine-interface.ts';
2
+ export declare class MlxServeEngine implements LocalEngine { // Local engine that runs chat and embedding models through MlxServerProcess instances.
3
+ readonly engineName = "mlx-serve"; // Identifier reported in getStatus().
4
+ private _baseDir; // Directory handed to server processes, ModelManager and the MLX binary helpers.
5
+ private chatServer; // Chat server process; created lazily by loadChat, null until then.
6
+ private embeddingServer; // Embedding server process; created lazily by loadEmbedding, null until then.
7
+ private _detectedContextSize; // Requested context size, or n_ctx reported by the server's /props endpoint when none was requested.
8
+ private _memoryEstimate; // { modelBytes, kvCacheBytes, totalBytes } derived from /props after a load, or null.
9
+ private _supportsVision; // Initialised to false and reset to false by loadChat in the compiled implementation.
10
+ setBaseDir(dir: string): void; // Stores the base directory used by every other method.
11
+ isAvailable(): boolean; // True only when an MLX binary version resolves and the host is darwin/arm64.
12
+ loadChat(modelPath: string, opts?: LoadOptions): Promise<void>; // Starts the chat server for modelPath (no-op if already running it), then reads /props for context size and memory figures.
13
+ unloadChat(): Promise<void>; // Stops the chat server if one has been created.
14
+ swapChat(modelPath: string, opts?: LoadOptions): Promise<void>; // unloadChat() followed by loadChat(modelPath, opts).
15
+ ensureRunningChat(modelName: string, opts?: LoadOptions): Promise<void>; // Returns immediately if any chat server is running; otherwise resolves modelName to a file and loads it.
16
+ getChatStatus(): EngineChatStatus; // Snapshot: running, activeModel, port, contextSize, memoryEstimate, supportsVision.
17
+ getChatBaseUrl(): string | null; // Base URL once the chat server reports ready, else null.
18
+ loadEmbedding(modelPath: string): Promise<void>; // Starts the embedding server for modelPath (no-op if already running it).
19
+ unloadEmbedding(): Promise<void>; // Stops the embedding server if one has been created.
20
+ ensureRunningEmbedding(modelName: string): Promise<void>; // Returns immediately if any embedding server is running; otherwise resolves modelName and loads it.
21
+ getEmbeddingStatus(): EngineServerStatus; // Snapshot: running, activeModel, port; contextSize and memoryEstimate are always null.
22
+ getEmbeddingBaseUrl(): string | null; // Base URL once the embedding server reports ready, else null.
23
+ getStatus(): EngineStatus; // Combines engineName, isAvailable(), getChatStatus() and getEmbeddingStatus().
24
+ killOrphans(): void; // Delegates to killOrphanedMlxServers for the base directory.
25
+ getBinaryVersion(): string | null; // Delegates to getMlxBinaryVersion for the base directory.
26
+ getBinarySource(): 'managed' | 'system' | null; // null when no binary version resolves; otherwise decided by isMlxSystemBinary().
27
+ checkForUpdate(): Promise<any>; // Delegates to checkForMlxUpdate; the result shape is not visible from this declaration.
28
+ updateBinary(): Promise<void>; // Delegates to updateMlxBinary for the base directory.
29
+ private resolveModelPath; // Looks the model up via ModelManager.findModelFile and throws an Error when it is not found locally.
30
+ }
31
+ //# sourceMappingURL=mlx-serve-engine.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"mlx-serve-engine.d.ts","sourceRoot":"","sources":["../../../../lib/local-llm/engines/mlx-serve-engine.ts"],"names":[],"mappings":"AAKA,OAAO,KAAK,EAAE,WAAW,EAAE,gBAAgB,EAAE,kBAAkB,EAAE,YAAY,EAAE,WAAW,EAAE,MAAM,wBAAwB,CAAC;AAE3H,qBAAa,cAAe,YAAW,WAAW;IAChD,QAAQ,CAAC,UAAU,eAAe;IAElC,OAAO,CAAC,QAAQ,CAAM;IACtB,OAAO,CAAC,UAAU,CAAiC;IACnD,OAAO,CAAC,eAAe,CAAiC;IACxD,OAAO,CAAC,oBAAoB,CAAuB;IACnD,OAAO,CAAC,eAAe,CAAiF;IACxG,OAAO,CAAC,eAAe,CAAS;IAEhC,UAAU,CAAC,GAAG,EAAE,MAAM,GAAG,IAAI;IAI7B,WAAW,IAAI,OAAO;IAMhB,QAAQ,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,WAAW,GAAG,OAAO,CAAC,IAAI,CAAC;IAwC9D,UAAU,IAAI,OAAO,CAAC,IAAI,CAAC;IAM3B,QAAQ,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,WAAW,GAAG,OAAO,CAAC,IAAI,CAAC;IAK9D,iBAAiB,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,WAAW,GAAG,OAAO,CAAC,IAAI,CAAC;IAO7E,aAAa,IAAI,gBAAgB;IAYjC,cAAc,IAAI,MAAM,GAAG,IAAI;IAMzB,aAAa,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAQ/C,eAAe,IAAI,OAAO,CAAC,IAAI,CAAC;IAMhC,sBAAsB,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAO9D,kBAAkB,IAAI,kBAAkB;IAWxC,mBAAmB,IAAI,MAAM,GAAG,IAAI;IAMpC,SAAS,IAAI,YAAY;IASzB,WAAW,IAAI,IAAI;IAMnB,gBAAgB,IAAI,MAAM,GAAG,IAAI;IAIjC,eAAe,IAAI,SAAS,GAAG,QAAQ,GAAG,IAAI;IAMxC,cAAc,IAAI,OAAO,CAAC,GAAG,CAAC;IAI9B,YAAY,IAAI,OAAO,CAAC,IAAI,CAAC;YAMrB,gBAAgB;CAM/B"}
@@ -0,0 +1,161 @@
1
+ import { MlxServerProcess } from "../mlx-server-process.js";
2
+ import { killOrphanedMlxServers } from "../mlx-server-process.js";
3
+ import { ModelManager } from "../model-manager.js";
4
+ import { getMlxBinaryVersion, isMlxSystemBinary, updateMlxBinary, checkForMlxUpdate } from "../mlx-binary-manager.js";
5
+ import { logger } from "../../logger.js";
6
+ export class MlxServeEngine {
7
+ engineName = 'mlx-serve';
8
+ _baseDir = '';
9
+ chatServer = null;
10
+ embeddingServer = null;
11
+ _detectedContextSize = null;
12
+ _memoryEstimate = null;
13
+ _supportsVision = false;
14
+ setBaseDir(dir) {
15
+ this._baseDir = dir;
16
+ }
17
+ isAvailable() {
18
+ return getMlxBinaryVersion(this._baseDir) !== null && process.platform === 'darwin' && process.arch === 'arm64';
19
+ }
20
+ // ─── Chat ───────────────────────────────────────────────────────────────────
21
+ async loadChat(modelPath, opts) {
22
+ if (this.chatServer?.running && this.chatServer.modelPath === modelPath)
23
+ return;
24
+ if (!this.chatServer)
25
+ this.chatServer = new MlxServerProcess(this._baseDir);
26
+ this._memoryEstimate = null;
27
+ this._supportsVision = false;
28
+ this._detectedContextSize = opts?.contextSize ?? null;
29
+ await this.chatServer.start({ modelPath, contextSize: opts?.contextSize, reasoningBudget: opts?.reasoningBudget });
30
+ // Fetch /props from mlx-serve to get memory usage and context size
31
+ try {
32
+ const baseUrl = this.chatServer.getBaseUrl();
33
+ const res = await fetch(`${baseUrl}/props`);
34
+ if (res.ok) {
35
+ const props = await res.json();
36
+ const nCtx = props.default_generation_settings?.n_ctx;
37
+ if (nCtx && !this._detectedContextSize) {
38
+ this._detectedContextSize = nCtx;
39
+ }
40
+ const ctxSize = this._detectedContextSize ?? nCtx ?? 0;
41
+ const info = props.model_info;
42
+ // KV cache: layers × 2(K+V) × kv_heads × head_dim × 2(float16) × ctx
43
+ const kvCacheBytes = info
44
+ ? info.num_hidden_layers * 2 * info.num_key_value_heads * info.head_dim * 2 * ctxSize
45
+ : 0;
46
+ const modelBytes = props.memory?.active_bytes ?? 0;
47
+ if (modelBytes || kvCacheBytes) {
48
+ this._memoryEstimate = {
49
+ modelBytes,
50
+ kvCacheBytes,
51
+ totalBytes: modelBytes + kvCacheBytes,
52
+ };
53
+ }
54
+ }
55
+ }
56
+ catch (err) {
57
+ logger.warn('[MlxServeEngine] Failed to fetch /props:', err);
58
+ }
59
+ }
60
+ async unloadChat() {
61
+ if (this.chatServer) {
62
+ await this.chatServer.stop();
63
+ }
64
+ }
65
+ async swapChat(modelPath, opts) {
66
+ await this.unloadChat();
67
+ await this.loadChat(modelPath, opts);
68
+ }
69
+ async ensureRunningChat(modelName, opts) {
70
+ if (this.chatServer?.running)
71
+ return;
72
+ logger.info(`[MlxServeEngine] Auto-starting chat model: ${modelName}`);
73
+ const { filePath } = await this.resolveModelPath(modelName);
74
+ await this.loadChat(filePath, opts);
75
+ }
76
+ getChatStatus() {
77
+ const running = this.chatServer?.running ?? false;
78
+ return {
79
+ running,
80
+ activeModel: running ? (this.chatServer?.modelPath ?? null) : null,
81
+ port: this.chatServer?.port ?? null,
82
+ contextSize: this._detectedContextSize,
83
+ memoryEstimate: this._memoryEstimate,
84
+ supportsVision: this._supportsVision,
85
+ };
86
+ }
87
+ getChatBaseUrl() {
88
+ return this.chatServer?.ready ? this.chatServer.getBaseUrl() : null;
89
+ }
90
+ // ─── Embedding ──────────────────────────────────────────────────────────────
91
+ async loadEmbedding(modelPath) {
92
+ if (this.embeddingServer?.running && this.embeddingServer.modelPath === modelPath)
93
+ return;
94
+ if (!this.embeddingServer)
95
+ this.embeddingServer = new MlxServerProcess(this._baseDir, 'embedding');
96
+ await this.embeddingServer.start({ modelPath });
97
+ logger.info(`[MlxServeEngine] Embedding server ready on port ${this.embeddingServer.port}`);
98
+ }
99
+ async unloadEmbedding() {
100
+ if (this.embeddingServer) {
101
+ await this.embeddingServer.stop();
102
+ }
103
+ }
104
+ async ensureRunningEmbedding(modelName) {
105
+ if (this.embeddingServer?.running)
106
+ return;
107
+ logger.info(`[MlxServeEngine] Auto-starting embedding model: ${modelName}`);
108
+ const { filePath } = await this.resolveModelPath(modelName);
109
+ await this.loadEmbedding(filePath);
110
+ }
111
+ getEmbeddingStatus() {
112
+ const running = this.embeddingServer?.running ?? false;
113
+ return {
114
+ running,
115
+ activeModel: running ? (this.embeddingServer?.modelPath ?? null) : null,
116
+ port: this.embeddingServer?.port ?? null,
117
+ contextSize: null,
118
+ memoryEstimate: null,
119
+ };
120
+ }
121
+ getEmbeddingBaseUrl() {
122
+ return this.embeddingServer?.ready ? this.embeddingServer.getBaseUrl() : null;
123
+ }
124
+ // ─── Combined ───────────────────────────────────────────────────────────────
125
+ getStatus() {
126
+ return {
127
+ engineName: this.engineName,
128
+ available: this.isAvailable(),
129
+ chat: this.getChatStatus(),
130
+ embedding: this.getEmbeddingStatus(),
131
+ };
132
+ }
133
+ killOrphans() {
134
+ killOrphanedMlxServers(this._baseDir);
135
+ }
136
+ // ─── Binary management ─────────────────────────────────────────────────────
137
+ getBinaryVersion() {
138
+ return getMlxBinaryVersion(this._baseDir);
139
+ }
140
+ getBinarySource() {
141
+ const version = getMlxBinaryVersion(this._baseDir);
142
+ if (!version)
143
+ return null;
144
+ return isMlxSystemBinary() ? 'system' : 'managed';
145
+ }
146
+ async checkForUpdate() {
147
+ return checkForMlxUpdate(this._baseDir);
148
+ }
149
+ async updateBinary() {
150
+ return updateMlxBinary(this._baseDir);
151
+ }
152
+ // ─── Private ────────────────────────────────────────────────────────────────
153
+ async resolveModelPath(modelName) {
154
+ const manager = new ModelManager(this._baseDir);
155
+ const result = await manager.findModelFile(modelName);
156
+ if (!result)
157
+ throw new Error(`Local model "${modelName}" not found. Download it first.`);
158
+ return result;
159
+ }
160
+ }
161
+ //# sourceMappingURL=mlx-serve-engine.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"mlx-serve-engine.js","sourceRoot":"","sources":["../../../../lib/local-llm/engines/mlx-serve-engine.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,gBAAgB,EAAE,MAAM,0BAA0B,CAAC;AAC5D,OAAO,EAAE,sBAAsB,EAAE,MAAM,0BAA0B,CAAC;AAClE,OAAO,EAAE,YAAY,EAAE,MAAM,qBAAqB,CAAC;AACnD,OAAO,EAAE,mBAAmB,EAAE,iBAAiB,EAAE,eAAe,EAAE,iBAAiB,EAAE,MAAM,0BAA0B,CAAC;AACtH,OAAO,EAAE,MAAM,EAAE,MAAM,iBAAiB,CAAC;AAGzC,MAAM,OAAO,cAAc;IAChB,UAAU,GAAG,WAAW,CAAC;IAE1B,QAAQ,GAAG,EAAE,CAAC;IACd,UAAU,GAA4B,IAAI,CAAC;IAC3C,eAAe,GAA4B,IAAI,CAAC;IAChD,oBAAoB,GAAkB,IAAI,CAAC;IAC3C,eAAe,GAA4E,IAAI,CAAC;IAChG,eAAe,GAAG,KAAK,CAAC;IAEhC,UAAU,CAAC,GAAW;QACpB,IAAI,CAAC,QAAQ,GAAG,GAAG,CAAC;IACtB,CAAC;IAED,WAAW;QACT,OAAO,mBAAmB,CAAC,IAAI,CAAC,QAAQ,CAAC,KAAK,IAAI,IAAI,OAAO,CAAC,QAAQ,KAAK,QAAQ,IAAI,OAAO,CAAC,IAAI,KAAK,OAAO,CAAC;IAClH,CAAC;IAED,+EAA+E;IAE/E,KAAK,CAAC,QAAQ,CAAC,SAAiB,EAAE,IAAkB;QAClD,IAAI,IAAI,CAAC,UAAU,EAAE,OAAO,IAAI,IAAI,CAAC,UAAU,CAAC,SAAS,KAAK,SAAS;YAAE,OAAO;QAChF,IAAI,CAAC,IAAI,CAAC,UAAU;YAAE,IAAI,CAAC,UAAU,GAAG,IAAI,gBAAgB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAE5E,IAAI,CAAC,eAAe,GAAG,IAAI,CAAC;QAC5B,IAAI,CAAC,eAAe,GAAG,KAAK,CAAC;QAC7B,IAAI,CAAC,oBAAoB,GAAG,IAAI,EAAE,WAAW,IAAI,IAAI,CAAC;QAEtD,MAAM,IAAI,CAAC,UAAU,CAAC,KAAK,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,IAAI,EAAE,WAAW,EAAE,eAAe,EAAE,IAAI,EAAE,eAAe,EAAE,CAAC,CAAC;QAEnH,mEAAmE;QACnE,IAAI,CAAC;YACH,MAAM,OAAO,GAAG,IAAI,CAAC,UAAU,CAAC,UAAU,EAAE,CAAC;YAC7C,MAAM,GAAG,GAAG,MAAM,KAAK,CAAC,GAAG,OAAO,QAAQ,CAAC,CAAC;YAC5C,IAAI,GAAG,CAAC,EAAE,EAAE,CAAC;gBACX,MAAM,KAAK,GAAG,MAAM,GAAG,CAAC,IAAI,EAAS,CAAC;gBACtC,MAAM,IAAI,GAAG,KAAK,CAAC,2BAA2B,EAAE,KAAK,CAAC;gBACtD,IAAI,IAAI,IAAI,CAAC,IAAI,CAAC,oBAAoB,EAAE,CAAC;oBACvC,IAAI,CAAC,oBAAoB,GAAG,IAAI,CAAC;gBACnC,CAAC;gBACD,MAAM,OAAO,GAAG,IAAI,CAAC,oBAAoB,IAAI,IAAI,IAAI,CAAC,CAAC;gBACvD,MAAM,IAAI,GAAG,KAAK,CAAC,UAAU,CAAC;gBAC9B,qEAAqE;gBACrE,MAAM,YAAY,GAAG,IAAI;oBACvB,CAAC,CAAC,IAAI,CAAC,iBAAiB,GAAG,CAAC,GAAG,IAAI,CAAC,mBAAmB,GAAG,IAAI,CAAC,QAAQ,GAAG,CAAC,GAAG,OAAO;oBACrF,CAAC,CAAC,CAAC,CAAC;gBACN,MAAM,UAAU,
GAAG,KAAK,CAAC,MAAM,EAAE,YAAY,IAAI,CAAC,CAAC;gBACnD,IAAI,UAAU,IAAI,YAAY,EAAE,CAAC;oBAC/B,IAAI,CAAC,eAAe,GAAG;wBACrB,UAAU;wBACV,YAAY;wBACZ,UAAU,EAAE,UAAU,GAAG,YAAY;qBACtC,CAAC;gBACJ,CAAC;YACH,CAAC;QACH,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,MAAM,CAAC,IAAI,CAAC,0CAA0C,EAAE,GAAG,CAAC,CAAC;QAC/D,CAAC;IACH,CAAC;IAED,KAAK,CAAC,UAAU;QACd,IAAI,IAAI,CAAC,UAAU,EAAE,CAAC;YACpB,MAAM,IAAI,CAAC,UAAU,CAAC,IAAI,EAAE,CAAC;QAC/B,CAAC;IACH,CAAC;IAED,KAAK,CAAC,QAAQ,CAAC,SAAiB,EAAE,IAAkB;QAClD,MAAM,IAAI,CAAC,UAAU,EAAE,CAAC;QACxB,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,EAAE,IAAI,CAAC,CAAC;IACvC,CAAC;IAED,KAAK,CAAC,iBAAiB,CAAC,SAAiB,EAAE,IAAkB;QAC3D,IAAI,IAAI,CAAC,UAAU,EAAE,OAAO;YAAE,OAAO;QACrC,MAAM,CAAC,IAAI,CAAC,8CAA8C,SAAS,EAAE,CAAC,CAAC;QACvE,MAAM,EAAE,QAAQ,EAAE,GAAG,MAAM,IAAI,CAAC,gBAAgB,CAAC,SAAS,CAAC,CAAC;QAC5D,MAAM,IAAI,CAAC,QAAQ,CAAC,QAAQ,EAAE,IAAI,CAAC,CAAC;IACtC,CAAC;IAED,aAAa;QACX,MAAM,OAAO,GAAG,IAAI,CAAC,UAAU,EAAE,OAAO,IAAI,KAAK,CAAC;QAClD,OAAO;YACL,OAAO;YACP,WAAW,EAAE,OAAO,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,UAAU,EAAE,SAAS,IAAI,IAAI,CAAC,CAAC,CAAC,CAAC,IAAI;YAClE,IAAI,EAAE,IAAI,CAAC,UAAU,EAAE,IAAI,IAAI,IAAI;YACnC,WAAW,EAAE,IAAI,CAAC,oBAAoB;YACtC,cAAc,EAAE,IAAI,CAAC,eAAe;YACpC,cAAc,EAAE,IAAI,CAAC,eAAe;SACrC,CAAC;IACJ,CAAC;IAED,cAAc;QACZ,OAAO,IAAI,CAAC,UAAU,EAAE,KAAK,CAAC,CAAC,CAAC,IAAI,CAAC,UAAU,CAAC,UAAU,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC;IACtE,CAAC;IAED,+EAA+E;IAE/E,KAAK,CAAC,aAAa,CAAC,SAAiB;QACnC,IAAI,IAAI,CAAC,eAAe,EAAE,OAAO,IAAI,IAAI,CAAC,eAAe,CAAC,SAAS,KAAK,SAAS;YAAE,OAAO;QAC1F,IAAI,CAAC,IAAI,CAAC,eAAe;YAAE,IAAI,CAAC,eAAe,GAAG,IAAI,gBAAgB,CAAC,IAAI,CAAC,QAAQ,EAAE,WAAW,CAAC,CAAC;QAEnG,MAAM,IAAI,CAAC,eAAe,CAAC,KAAK,CAAC,EAAE,SAAS,EAAE,CAAC,CAAC;QAChD,MAAM,CAAC,IAAI,CAAC,mDAAmD,IAAI,CAAC,eAAe,CAAC,IAAI,EAAE,CAAC,CAAC;IAC9F,CAAC;IAED,KAAK,CAAC,eAAe;QACnB,IAAI,IAAI,CAAC,eAAe,EAAE,CAAC;YACzB,MAAM,IAAI,CAAC,eAAe,CAAC,IAAI,EAAE,CAAC;QACpC,CAAC;IACH,CAAC;IAED,KAAK,CAAC,sBAAsB,CAAC,SAAiB;QAC5C,IAAI,IAAI,CAAC,eAAe,EAAE,OAAO;YAAE,OAAO;QAC1C,MAAM,CAAC,IAAI,CAAC,mDAAmD,SAAS,EAAE,CAAC,CAAC;QAC5E,MAAM,EAAE,QAA
Q,EAAE,GAAG,MAAM,IAAI,CAAC,gBAAgB,CAAC,SAAS,CAAC,CAAC;QAC5D,MAAM,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,CAAC;IACrC,CAAC;IAED,kBAAkB;QAChB,MAAM,OAAO,GAAG,IAAI,CAAC,eAAe,EAAE,OAAO,IAAI,KAAK,CAAC;QACvD,OAAO;YACL,OAAO;YACP,WAAW,EAAE,OAAO,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,eAAe,EAAE,SAAS,IAAI,IAAI,CAAC,CAAC,CAAC,CAAC,IAAI;YACvE,IAAI,EAAE,IAAI,CAAC,eAAe,EAAE,IAAI,IAAI,IAAI;YACxC,WAAW,EAAE,IAAI;YACjB,cAAc,EAAE,IAAI;SACrB,CAAC;IACJ,CAAC;IAED,mBAAmB;QACjB,OAAO,IAAI,CAAC,eAAe,EAAE,KAAK,CAAC,CAAC,CAAC,IAAI,CAAC,eAAe,CAAC,UAAU,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC;IAChF,CAAC;IAED,+EAA+E;IAE/E,SAAS;QACP,OAAO;YACL,UAAU,EAAE,IAAI,CAAC,UAAU;YAC3B,SAAS,EAAE,IAAI,CAAC,WAAW,EAAE;YAC7B,IAAI,EAAE,IAAI,CAAC,aAAa,EAAE;YAC1B,SAAS,EAAE,IAAI,CAAC,kBAAkB,EAAE;SACrC,CAAC;IACJ,CAAC;IAED,WAAW;QACT,sBAAsB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IACxC,CAAC;IAED,8EAA8E;IAE9E,gBAAgB;QACd,OAAO,mBAAmB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IAC5C,CAAC;IAED,eAAe;QACb,MAAM,OAAO,GAAG,mBAAmB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QACnD,IAAI,CAAC,OAAO;YAAE,OAAO,IAAI,CAAC;QAC1B,OAAO,iBAAiB,EAAE,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,CAAC,SAAS,CAAC;IACpD,CAAC;IAED,KAAK,CAAC,cAAc;QAClB,OAAO,iBAAiB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IAC1C,CAAC;IAED,KAAK,CAAC,YAAY;QAChB,OAAO,eAAe,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IACxC,CAAC;IAED,+EAA+E;IAEvE,KAAK,CAAC,gBAAgB,CAAC,SAAiB;QAC9C,MAAM,OAAO,GAAG,IAAI,YAAY,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAChD,MAAM,MAAM,GAAG,MAAM,OAAO,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;QACtD,IAAI,CAAC,MAAM;YAAE,MAAM,IAAI,KAAK,CAAC,gBAAgB,SAAS,iCAAiC,CAAC,CAAC;QACzF,OAAO,MAAM,CAAC;IAChB,CAAC;CACF"}
@@ -0,0 +1,20 @@
1
+ export interface GGUFModelInfo { // Model architecture info produced by readGGUFModelInfo from a GGUF file's metadata header.
2
+ contextLength: number; // NOTE(review): presumably the context length recorded in the model metadata — confirm in gguf-reader.ts.
3
+ blockCount: number; // NOTE(review): presumably the layer count (n_layers in the KV-cache formula) — confirm in gguf-reader.ts.
4
+ embeddingLength: number; // NOTE(review): presumably the hidden/embedding dimension — confirm in gguf-reader.ts.
5
+ headCount: number; // NOTE(review): presumably the number of attention heads — confirm in gguf-reader.ts.
6
+ headCountKv: number; // NOTE(review): presumably the number of key/value heads (n_kv_heads in the KV-cache formula) — confirm.
7
+ fileSizeBytes: number; // Used by LlamaCppEngine.loadChat as the model-weights part of its memory estimate.
8
+ }
9
+ /**
10
+ * Reads model architecture info from a GGUF file's metadata header.
11
+ * Only reads the first 1MB — no model loading required.
12
+ */
13
+ export declare function readGGUFModelInfo(modelPath: string): Promise<GGUFModelInfo | null>;
14
+ /**
15
+ * Estimates KV cache bytes per token for a model.
16
+ * KV cache = 2 (K+V) * n_layers * n_kv_heads * head_dim * 2 bytes (f16)
17
+ */
18
+ export declare function kvCacheBytesPerToken(info: GGUFModelInfo): number;
19
+ export declare function calculateOptimalContextSize(info: GGUFModelInfo): number; // Returns the context size LlamaCppEngine.loadChat falls back to when the caller passes none; the selection logic is not visible in this declaration file.
20
+ //# sourceMappingURL=gguf-reader.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"gguf-reader.d.ts","sourceRoot":"","sources":["../../../lib/local-llm/gguf-reader.ts"],"names":[],"mappings":"AASA,MAAM,WAAW,aAAa;IAC5B,aAAa,EAAE,MAAM,CAAC;IACtB,UAAU,EAAE,MAAM,CAAC;IACnB,eAAe,EAAE,MAAM,CAAC;IACxB,SAAS,EAAE,MAAM,CAAC;IAClB,WAAW,EAAE,MAAM,CAAC;IACpB,aAAa,EAAE,MAAM,CAAC;CACvB;AAED;;;GAGG;AACH,wBAAsB,iBAAiB,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,aAAa,GAAG,IAAI,CAAC,CAkExF;AAED;;;GAGG;AACH,wBAAgB,oBAAoB,CAAC,IAAI,EAAE,aAAa,GAAG,MAAM,CAGhE;AA2BD,wBAAgB,2BAA2B,CAAC,IAAI,EAAE,aAAa,GAAG,MAAM,CAuBvE"}