agent-orcha 0.0.5 → 0.0.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +250 -1275
- package/dist/lib/agents/agent-executor.d.ts +4 -2
- package/dist/lib/agents/agent-executor.d.ts.map +1 -1
- package/dist/lib/agents/agent-executor.js +85 -53
- package/dist/lib/agents/agent-executor.js.map +1 -1
- package/dist/lib/agents/agent-loader.d.ts +3 -0
- package/dist/lib/agents/agent-loader.d.ts.map +1 -1
- package/dist/lib/agents/agent-loader.js +10 -1
- package/dist/lib/agents/agent-loader.js.map +1 -1
- package/dist/lib/agents/react-loop.d.ts.map +1 -1
- package/dist/lib/agents/react-loop.js +207 -142
- package/dist/lib/agents/react-loop.js.map +1 -1
- package/dist/lib/agents/types.d.ts +181 -18
- package/dist/lib/agents/types.d.ts.map +1 -1
- package/dist/lib/agents/types.js +18 -2
- package/dist/lib/agents/types.js.map +1 -1
- package/dist/lib/functions/function-loader.d.ts +2 -0
- package/dist/lib/functions/function-loader.d.ts.map +1 -1
- package/dist/lib/functions/function-loader.js +10 -0
- package/dist/lib/functions/function-loader.js.map +1 -1
- package/dist/lib/functions/simple-function-wrapper.js +3 -3
- package/dist/lib/functions/simple-function-wrapper.js.map +1 -1
- package/dist/lib/integrations/email.d.ts +38 -0
- package/dist/lib/integrations/email.d.ts.map +1 -0
- package/dist/lib/integrations/email.js +249 -0
- package/dist/lib/integrations/email.js.map +1 -0
- package/dist/lib/integrations/integration-manager.d.ts +5 -0
- package/dist/lib/integrations/integration-manager.d.ts.map +1 -1
- package/dist/lib/integrations/integration-manager.js +53 -3
- package/dist/lib/integrations/integration-manager.js.map +1 -1
- package/dist/lib/integrations/types.d.ts +187 -4
- package/dist/lib/integrations/types.d.ts.map +1 -1
- package/dist/lib/integrations/types.js +24 -1
- package/dist/lib/integrations/types.js.map +1 -1
- package/dist/lib/knowledge/knowledge-store.d.ts +7 -1
- package/dist/lib/knowledge/knowledge-store.d.ts.map +1 -1
- package/dist/lib/knowledge/knowledge-store.js +96 -8
- package/dist/lib/knowledge/knowledge-store.js.map +1 -1
- package/dist/lib/knowledge/loaders/file-loaders.d.ts +8 -3
- package/dist/lib/knowledge/loaders/file-loaders.d.ts.map +1 -1
- package/dist/lib/knowledge/loaders/file-loaders.js +96 -75
- package/dist/lib/knowledge/loaders/file-loaders.js.map +1 -1
- package/dist/lib/knowledge/loaders/web-loader.d.ts +12 -3
- package/dist/lib/knowledge/loaders/web-loader.d.ts.map +1 -1
- package/dist/lib/knowledge/loaders/web-loader.js +56 -22
- package/dist/lib/knowledge/loaders/web-loader.js.map +1 -1
- package/dist/lib/knowledge/sqlite-store.d.ts.map +1 -1
- package/dist/lib/knowledge/sqlite-store.js +19 -10
- package/dist/lib/knowledge/sqlite-store.js.map +1 -1
- package/dist/lib/knowledge/types.d.ts +69 -33
- package/dist/lib/knowledge/types.d.ts.map +1 -1
- package/dist/lib/knowledge/types.js +18 -3
- package/dist/lib/knowledge/types.js.map +1 -1
- package/dist/lib/llm/index.d.ts +1 -1
- package/dist/lib/llm/index.d.ts.map +1 -1
- package/dist/lib/llm/index.js +1 -1
- package/dist/lib/llm/index.js.map +1 -1
- package/dist/lib/llm/llm-call-logger.d.ts +3 -1
- package/dist/lib/llm/llm-call-logger.d.ts.map +1 -1
- package/dist/lib/llm/llm-call-logger.js +31 -26
- package/dist/lib/llm/llm-call-logger.js.map +1 -1
- package/dist/lib/llm/llm-config.d.ts +59 -8
- package/dist/lib/llm/llm-config.d.ts.map +1 -1
- package/dist/lib/llm/llm-config.js +163 -17
- package/dist/lib/llm/llm-config.js.map +1 -1
- package/dist/lib/llm/llm-factory.d.ts +1 -2
- package/dist/lib/llm/llm-factory.d.ts.map +1 -1
- package/dist/lib/llm/llm-factory.js +44 -8
- package/dist/lib/llm/llm-factory.js.map +1 -1
- package/dist/lib/llm/providers/anthropic-chat-model.d.ts +5 -1
- package/dist/lib/llm/providers/anthropic-chat-model.d.ts.map +1 -1
- package/dist/lib/llm/providers/anthropic-chat-model.js +118 -42
- package/dist/lib/llm/providers/anthropic-chat-model.js.map +1 -1
- package/dist/lib/llm/providers/gemini-chat-model.d.ts +3 -2
- package/dist/lib/llm/providers/gemini-chat-model.d.ts.map +1 -1
- package/dist/lib/llm/providers/gemini-chat-model.js +83 -24
- package/dist/lib/llm/providers/gemini-chat-model.js.map +1 -1
- package/dist/lib/llm/providers/openai-chat-model.d.ts +20 -1
- package/dist/lib/llm/providers/openai-chat-model.d.ts.map +1 -1
- package/dist/lib/llm/providers/openai-chat-model.js +265 -32
- package/dist/lib/llm/providers/openai-chat-model.js.map +1 -1
- package/dist/lib/llm/providers/openai-embeddings.d.ts.map +1 -1
- package/dist/lib/llm/providers/openai-embeddings.js +41 -10
- package/dist/lib/llm/providers/openai-embeddings.js.map +1 -1
- package/dist/lib/local-llm/binary-manager.d.ts +66 -0
- package/dist/lib/local-llm/binary-manager.d.ts.map +1 -0
- package/dist/lib/local-llm/binary-manager.js +441 -0
- package/dist/lib/local-llm/binary-manager.js.map +1 -0
- package/dist/lib/local-llm/engine-interface.d.ts +47 -0
- package/dist/lib/local-llm/engine-interface.d.ts.map +1 -0
- package/dist/lib/local-llm/engine-interface.js +2 -0
- package/dist/lib/local-llm/engine-interface.js.map +1 -0
- package/dist/lib/local-llm/engine-registry.d.ts +20 -0
- package/dist/lib/local-llm/engine-registry.d.ts.map +1 -0
- package/dist/lib/local-llm/engine-registry.js +56 -0
- package/dist/lib/local-llm/engine-registry.js.map +1 -0
- package/dist/lib/local-llm/engines/llama-cpp-engine.d.ts +31 -0
- package/dist/lib/local-llm/engines/llama-cpp-engine.d.ts.map +1 -0
- package/dist/lib/local-llm/engines/llama-cpp-engine.js +164 -0
- package/dist/lib/local-llm/engines/llama-cpp-engine.js.map +1 -0
- package/dist/lib/local-llm/engines/mlx-serve-engine.d.ts +31 -0
- package/dist/lib/local-llm/engines/mlx-serve-engine.d.ts.map +1 -0
- package/dist/lib/local-llm/engines/mlx-serve-engine.js +161 -0
- package/dist/lib/local-llm/engines/mlx-serve-engine.js.map +1 -0
- package/dist/lib/local-llm/gguf-reader.d.ts +20 -0
- package/dist/lib/local-llm/gguf-reader.d.ts.map +1 -0
- package/dist/lib/local-llm/gguf-reader.js +190 -0
- package/dist/lib/local-llm/gguf-reader.js.map +1 -0
- package/dist/lib/local-llm/index.d.ts +9 -0
- package/dist/lib/local-llm/index.d.ts.map +1 -0
- package/dist/lib/local-llm/index.js +6 -0
- package/dist/lib/local-llm/index.js.map +1 -0
- package/dist/lib/local-llm/llama-server-process.d.ts +42 -0
- package/dist/lib/local-llm/llama-server-process.d.ts.map +1 -0
- package/dist/lib/local-llm/llama-server-process.js +237 -0
- package/dist/lib/local-llm/llama-server-process.js.map +1 -0
- package/dist/lib/local-llm/mlx-binary-manager.d.ts +33 -0
- package/dist/lib/local-llm/mlx-binary-manager.d.ts.map +1 -0
- package/dist/lib/local-llm/mlx-binary-manager.js +211 -0
- package/dist/lib/local-llm/mlx-binary-manager.js.map +1 -0
- package/dist/lib/local-llm/mlx-server-process.d.ts +26 -0
- package/dist/lib/local-llm/mlx-server-process.d.ts.map +1 -0
- package/dist/lib/local-llm/mlx-server-process.js +210 -0
- package/dist/lib/local-llm/mlx-server-process.js.map +1 -0
- package/dist/lib/local-llm/model-manager.d.ts +33 -0
- package/dist/lib/local-llm/model-manager.d.ts.map +1 -0
- package/dist/lib/local-llm/model-manager.js +591 -0
- package/dist/lib/local-llm/model-manager.js.map +1 -0
- package/dist/lib/local-llm/types.d.ts +51 -0
- package/dist/lib/local-llm/types.d.ts.map +1 -0
- package/dist/lib/local-llm/types.js +2 -0
- package/dist/lib/local-llm/types.js.map +1 -0
- package/dist/lib/logger.d.ts +2 -0
- package/dist/lib/logger.d.ts.map +1 -1
- package/dist/lib/logger.js +68 -6
- package/dist/lib/logger.js.map +1 -1
- package/dist/lib/mcp/mcp-client.d.ts.map +1 -1
- package/dist/lib/mcp/mcp-client.js +5 -3
- package/dist/lib/mcp/mcp-client.js.map +1 -1
- package/dist/lib/mcp/types.d.ts +0 -9
- package/dist/lib/mcp/types.d.ts.map +1 -1
- package/dist/lib/mcp/types.js +1 -2
- package/dist/lib/mcp/types.js.map +1 -1
- package/dist/lib/memory/memory-manager.d.ts +1 -0
- package/dist/lib/memory/memory-manager.d.ts.map +1 -1
- package/dist/lib/memory/memory-manager.js +9 -0
- package/dist/lib/memory/memory-manager.js.map +1 -1
- package/dist/lib/orchestrator.d.ts +11 -8
- package/dist/lib/orchestrator.d.ts.map +1 -1
- package/dist/lib/orchestrator.js +246 -5
- package/dist/lib/orchestrator.js.map +1 -1
- package/dist/lib/sandbox/cdp-client.d.ts +15 -0
- package/dist/lib/sandbox/cdp-client.d.ts.map +1 -0
- package/dist/lib/sandbox/cdp-client.js +139 -0
- package/dist/lib/sandbox/cdp-client.js.map +1 -0
- package/dist/lib/sandbox/html-to-markdown.d.ts +9 -1
- package/dist/lib/sandbox/html-to-markdown.d.ts.map +1 -1
- package/dist/lib/sandbox/html-to-markdown.js +67 -10
- package/dist/lib/sandbox/html-to-markdown.js.map +1 -1
- package/dist/lib/sandbox/index.d.ts +6 -0
- package/dist/lib/sandbox/index.d.ts.map +1 -1
- package/dist/lib/sandbox/index.js +5 -0
- package/dist/lib/sandbox/index.js.map +1 -1
- package/dist/lib/sandbox/page-readiness.d.ts +37 -0
- package/dist/lib/sandbox/page-readiness.d.ts.map +1 -0
- package/dist/lib/sandbox/page-readiness.js +268 -0
- package/dist/lib/sandbox/page-readiness.js.map +1 -0
- package/dist/lib/sandbox/sandbox-browser.d.ts +4 -0
- package/dist/lib/sandbox/sandbox-browser.d.ts.map +1 -0
- package/dist/lib/sandbox/sandbox-browser.js +316 -0
- package/dist/lib/sandbox/sandbox-browser.js.map +1 -0
- package/dist/lib/sandbox/sandbox-container.d.ts +39 -0
- package/dist/lib/sandbox/sandbox-container.d.ts.map +1 -0
- package/dist/lib/sandbox/sandbox-container.js +176 -0
- package/dist/lib/sandbox/sandbox-container.js.map +1 -0
- package/dist/lib/sandbox/sandbox-file.d.ts +4 -0
- package/dist/lib/sandbox/sandbox-file.d.ts.map +1 -0
- package/dist/lib/sandbox/sandbox-file.js +169 -0
- package/dist/lib/sandbox/sandbox-file.js.map +1 -0
- package/dist/lib/sandbox/sandbox-shell.d.ts +5 -0
- package/dist/lib/sandbox/sandbox-shell.d.ts.map +1 -0
- package/dist/lib/sandbox/sandbox-shell.js +111 -0
- package/dist/lib/sandbox/sandbox-shell.js.map +1 -0
- package/dist/lib/sandbox/sandbox-web.d.ts.map +1 -1
- package/dist/lib/sandbox/sandbox-web.js +64 -24
- package/dist/lib/sandbox/sandbox-web.js.map +1 -1
- package/dist/lib/sandbox/types.d.ts +9 -0
- package/dist/lib/sandbox/types.d.ts.map +1 -1
- package/dist/lib/sandbox/types.js +1 -0
- package/dist/lib/sandbox/types.js.map +1 -1
- package/dist/lib/sandbox/vision-browser.d.ts +4 -0
- package/dist/lib/sandbox/vision-browser.d.ts.map +1 -0
- package/dist/lib/sandbox/vision-browser.js +298 -0
- package/dist/lib/sandbox/vision-browser.js.map +1 -0
- package/dist/lib/sea/app-window.d.ts +7 -0
- package/dist/lib/sea/app-window.d.ts.map +1 -0
- package/dist/lib/sea/app-window.js +95 -0
- package/dist/lib/sea/app-window.js.map +1 -0
- package/dist/lib/sea/bootstrap.d.ts +18 -0
- package/dist/lib/sea/bootstrap.d.ts.map +1 -0
- package/dist/lib/sea/bootstrap.js +103 -0
- package/dist/lib/sea/bootstrap.js.map +1 -0
- package/dist/lib/sea/sqlite-vec-shim.d.ts +3 -0
- package/dist/lib/sea/sqlite-vec-shim.d.ts.map +1 -0
- package/dist/lib/sea/sqlite-vec-shim.js +10 -0
- package/dist/lib/sea/sqlite-vec-shim.js.map +1 -0
- package/dist/lib/skills/skill-loader.d.ts +2 -0
- package/dist/lib/skills/skill-loader.d.ts.map +1 -1
- package/dist/lib/skills/skill-loader.js +12 -1
- package/dist/lib/skills/skill-loader.js.map +1 -1
- package/dist/lib/tasks/task-manager.d.ts +3 -1
- package/dist/lib/tasks/task-manager.d.ts.map +1 -1
- package/dist/lib/tasks/task-manager.js +11 -0
- package/dist/lib/tasks/task-manager.js.map +1 -1
- package/dist/lib/tasks/task-store.d.ts +1 -1
- package/dist/lib/tasks/task-store.d.ts.map +1 -1
- package/dist/lib/tasks/task-store.js.map +1 -1
- package/dist/lib/tasks/types.d.ts +18 -0
- package/dist/lib/tasks/types.d.ts.map +1 -1
- package/dist/lib/tools/built-in/integration-tools.d.ts +4 -0
- package/dist/lib/tools/built-in/integration-tools.d.ts.map +1 -0
- package/dist/lib/tools/built-in/integration-tools.js +47 -0
- package/dist/lib/tools/built-in/integration-tools.js.map +1 -0
- package/dist/lib/tools/built-in/knowledge-entity-lookup.tool.d.ts +1 -2
- package/dist/lib/tools/built-in/knowledge-entity-lookup.tool.d.ts.map +1 -1
- package/dist/lib/tools/built-in/knowledge-entity-lookup.tool.js +17 -17
- package/dist/lib/tools/built-in/knowledge-entity-lookup.tool.js.map +1 -1
- package/dist/lib/tools/built-in/knowledge-graph-schema.tool.d.ts.map +1 -1
- package/dist/lib/tools/built-in/knowledge-graph-schema.tool.js +2 -4
- package/dist/lib/tools/built-in/knowledge-graph-schema.tool.js.map +1 -1
- package/dist/lib/tools/built-in/knowledge-search.tool.js +4 -4
- package/dist/lib/tools/built-in/knowledge-search.tool.js.map +1 -1
- package/dist/lib/tools/built-in/knowledge-sql.tool.d.ts.map +1 -1
- package/dist/lib/tools/built-in/knowledge-sql.tool.js +74 -40
- package/dist/lib/tools/built-in/knowledge-sql.tool.js.map +1 -1
- package/dist/lib/tools/built-in/knowledge-tools-factory.js +2 -2
- package/dist/lib/tools/built-in/knowledge-tools-factory.js.map +1 -1
- package/dist/lib/tools/built-in/knowledge-traverse.tool.d.ts +1 -2
- package/dist/lib/tools/built-in/knowledge-traverse.tool.d.ts.map +1 -1
- package/dist/lib/tools/built-in/knowledge-traverse.tool.js +5 -11
- package/dist/lib/tools/built-in/knowledge-traverse.tool.js.map +1 -1
- package/dist/lib/tools/built-in/query-validators.d.ts.map +1 -1
- package/dist/lib/tools/built-in/query-validators.js +4 -0
- package/dist/lib/tools/built-in/query-validators.js.map +1 -1
- package/dist/lib/tools/workspace/workspace-tools.d.ts +1 -0
- package/dist/lib/tools/workspace/workspace-tools.d.ts.map +1 -1
- package/dist/lib/tools/workspace/workspace-tools.js +44 -4
- package/dist/lib/tools/workspace/workspace-tools.js.map +1 -1
- package/dist/lib/triggers/cron-trigger.d.ts +1 -1
- package/dist/lib/triggers/cron-trigger.d.ts.map +1 -1
- package/dist/lib/triggers/cron-trigger.js.map +1 -1
- package/dist/lib/triggers/trigger-manager.d.ts +1 -0
- package/dist/lib/triggers/trigger-manager.d.ts.map +1 -1
- package/dist/lib/triggers/trigger-manager.js +26 -0
- package/dist/lib/triggers/trigger-manager.js.map +1 -1
- package/dist/lib/triggers/webhook-trigger.d.ts +1 -1
- package/dist/lib/triggers/webhook-trigger.d.ts.map +1 -1
- package/dist/lib/triggers/webhook-trigger.js.map +1 -1
- package/dist/lib/types/llm-types.d.ts +22 -4
- package/dist/lib/types/llm-types.d.ts.map +1 -1
- package/dist/lib/types/llm-types.js +50 -0
- package/dist/lib/types/llm-types.js.map +1 -1
- package/dist/lib/types/tool-factory.d.ts +2 -2
- package/dist/lib/types/tool-factory.d.ts.map +1 -1
- package/dist/lib/types/tool-factory.js +9 -2
- package/dist/lib/types/tool-factory.js.map +1 -1
- package/dist/lib/utils/document-extract.d.ts +10 -0
- package/dist/lib/utils/document-extract.d.ts.map +1 -0
- package/dist/lib/utils/document-extract.js +149 -0
- package/dist/lib/utils/document-extract.js.map +1 -0
- package/dist/lib/utils/env-substitution.d.ts +6 -0
- package/dist/lib/utils/env-substitution.d.ts.map +1 -0
- package/dist/lib/utils/env-substitution.js +15 -0
- package/dist/lib/utils/env-substitution.js.map +1 -0
- package/dist/lib/workflows/react-workflow-executor.d.ts.map +1 -1
- package/dist/lib/workflows/react-workflow-executor.js +23 -17
- package/dist/lib/workflows/react-workflow-executor.js.map +1 -1
- package/dist/lib/workflows/types.d.ts +81 -55
- package/dist/lib/workflows/types.d.ts.map +1 -1
- package/dist/lib/workflows/types.js +10 -0
- package/dist/lib/workflows/types.js.map +1 -1
- package/dist/lib/workflows/workflow-loader.d.ts +3 -0
- package/dist/lib/workflows/workflow-loader.d.ts.map +1 -1
- package/dist/lib/workflows/workflow-loader.js +10 -1
- package/dist/lib/workflows/workflow-loader.js.map +1 -1
- package/dist/public/assets/logo.png +0 -0
- package/dist/public/chat.html +39 -0
- package/dist/public/index.html +6 -176
- package/dist/public/src/components/AgentComposer.js +807 -0
- package/dist/public/src/components/AgentsView.js +1812 -508
- package/dist/public/src/components/AppRoot.js +125 -38
- package/dist/public/src/components/GraphView.js +382 -300
- package/dist/public/src/components/IdeView.js +277 -86
- package/dist/public/src/components/KnowledgeView.js +94 -130
- package/dist/public/src/components/LlmView.js +15 -19
- package/dist/public/src/components/LocalLlmView.js +2440 -0
- package/dist/public/src/components/LogViewer.js +155 -0
- package/dist/public/src/components/McpView.js +41 -49
- package/dist/public/src/components/MonitorView.js +174 -83
- package/dist/public/src/components/NavBar.js +16 -26
- package/dist/public/src/components/StandaloneChat.js +875 -0
- package/dist/public/src/services/ApiService.js +203 -4
- package/dist/public/src/services/SessionStore.js +86 -0
- package/dist/public/src/services/StreamManager.js +183 -0
- package/dist/public/src/store.js +1 -3
- package/dist/public/src/utils/card.js +21 -0
- package/dist/public/src/utils/markdown.js +7 -0
- package/dist/public/styles.css +2777 -0
- package/dist/src/cli/commands/init.d.ts.map +1 -1
- package/dist/src/cli/commands/init.js +7 -1
- package/dist/src/cli/commands/init.js.map +1 -1
- package/dist/src/cli/commands/start.d.ts.map +1 -1
- package/dist/src/cli/commands/start.js +28 -5
- package/dist/src/cli/commands/start.js.map +1 -1
- package/dist/src/cli/index.js +19 -5
- package/dist/src/cli/index.js.map +1 -1
- package/dist/src/index.js +7 -1
- package/dist/src/index.js.map +1 -1
- package/dist/src/middleware/auth.d.ts.map +1 -1
- package/dist/src/middleware/auth.js +28 -6
- package/dist/src/middleware/auth.js.map +1 -1
- package/dist/src/middleware/rate-limit.d.ts +8 -0
- package/dist/src/middleware/rate-limit.d.ts.map +1 -0
- package/dist/src/middleware/rate-limit.js +21 -0
- package/dist/src/middleware/rate-limit.js.map +1 -0
- package/dist/src/routes/agents.route.d.ts.map +1 -1
- package/dist/src/routes/agents.route.js +138 -10
- package/dist/src/routes/agents.route.js.map +1 -1
- package/dist/src/routes/chat.route.d.ts +3 -0
- package/dist/src/routes/chat.route.d.ts.map +1 -0
- package/dist/src/routes/chat.route.js +156 -0
- package/dist/src/routes/chat.route.js.map +1 -0
- package/dist/src/routes/files.route.d.ts.map +1 -1
- package/dist/src/routes/files.route.js +37 -2
- package/dist/src/routes/files.route.js.map +1 -1
- package/dist/src/routes/llm.route.d.ts.map +1 -1
- package/dist/src/routes/llm.route.js +263 -8
- package/dist/src/routes/llm.route.js.map +1 -1
- package/dist/src/routes/local-llm.route.d.ts +3 -0
- package/dist/src/routes/local-llm.route.d.ts.map +1 -0
- package/dist/src/routes/local-llm.route.js +688 -0
- package/dist/src/routes/local-llm.route.js.map +1 -0
- package/dist/src/routes/logs.route.d.ts +3 -0
- package/dist/src/routes/logs.route.d.ts.map +1 -0
- package/dist/src/routes/logs.route.js +24 -0
- package/dist/src/routes/logs.route.js.map +1 -0
- package/dist/src/routes/tasks.route.d.ts.map +1 -1
- package/dist/src/routes/tasks.route.js +15 -1
- package/dist/src/routes/tasks.route.js.map +1 -1
- package/dist/src/routes/vnc.route.d.ts +12 -0
- package/dist/src/routes/vnc.route.d.ts.map +1 -0
- package/dist/src/routes/vnc.route.js +74 -0
- package/dist/src/routes/vnc.route.js.map +1 -0
- package/dist/src/routes/workflows.route.d.ts.map +1 -1
- package/dist/src/routes/workflows.route.js +24 -0
- package/dist/src/routes/workflows.route.js.map +1 -1
- package/dist/src/server.d.ts.map +1 -1
- package/dist/src/server.js +29 -3
- package/dist/src/server.js.map +1 -1
- package/dist/templates/Demo.md +152 -0
- package/dist/templates/README.md +12 -3
- package/dist/templates/agents/actor.agent.yaml +34 -0
- package/dist/templates/agents/architect.agent.yaml +20 -13
- package/dist/templates/agents/chatbot.agent.yaml +23 -27
- package/dist/templates/agents/corporate.agent.yaml +64 -0
- package/dist/templates/agents/functions.agent.yaml +29 -0
- package/dist/templates/agents/investment-analyst.agent.yaml +79 -0
- package/dist/templates/agents/music-librarian.agent.yaml +46 -0
- package/dist/templates/agents/network-security.agent.yaml +81 -0
- package/dist/templates/agents/transport-security.agent.yaml +69 -0
- package/dist/templates/agents/web-engineer.agent.yaml +98 -0
- package/dist/templates/agents/web-pilot.agent.yaml +57 -0
- package/dist/templates/knowledge/music-store/LICENSE.md +11 -0
- package/dist/templates/knowledge/music-store/musicstore.sqlite +0 -0
- package/dist/templates/knowledge/music-store/tables.png +0 -0
- package/dist/templates/knowledge/music-store.knowledge.yaml +138 -0
- package/dist/templates/knowledge/org-chart/personnel.csv +21 -21
- package/dist/templates/knowledge/org-chart.knowledge.yaml +4 -0
- package/dist/templates/knowledge/patient-records.knowledge.yaml +20 -0
- package/dist/templates/knowledge/pdf-patients/PDF_Deid_Deidentification_0.pdf +0 -0
- package/dist/templates/knowledge/pdf-patients/PDF_Deid_Deidentification_1.pdf +0 -0
- package/dist/templates/knowledge/pdf-patients/PDF_Deid_Deidentification_10.pdf +0 -0
- package/dist/templates/knowledge/pdf-patients/PDF_Deid_Deidentification_11.pdf +0 -0
- package/dist/templates/knowledge/pet-store.knowledge.yaml +3 -0
- package/dist/templates/knowledge/security-incidents/incidents.json +55935 -0
- package/dist/templates/knowledge/security-incidents.knowledge.yaml +46 -0
- package/dist/templates/knowledge/{example.knowledge.yaml → transcripts.knowledge.yaml} +9 -5
- package/dist/templates/knowledge/transport-ot/systems.csv +117 -0
- package/dist/templates/knowledge/transport-ot.knowledge.yaml +55 -0
- package/dist/templates/knowledge/web-docs.knowledge.yaml +1 -1
- package/dist/templates/llm.json +62 -22
- package/dist/templates/mcp.json +7 -4
- package/dist/templates/skills/orcha-builder/SKILL.md +148 -215
- package/dist/templates/skills/pii-guard/SKILL.md +22 -0
- package/dist/templates/skills/sandbox/SKILL.md +25 -48
- package/dist/templates/skills/web-pilot/SKILL.md +51 -0
- package/dist/templates/workflows/example.workflow.yaml +27 -35
- package/dist/templates/workflows/react-example.workflow.yaml +14 -19
- package/dist/templates/workflows/team-chat.workflow.yaml +47 -0
- package/package.json +17 -4
- package/dist/public/src/components/SkillsView.js +0 -137
- package/dist/public/src/components/WorkflowsView.js +0 -416
- package/dist/templates/agents/knowledge-broker.agent.yaml +0 -39
- package/dist/templates/agents/sandbox.agent.yaml +0 -56
|
@@ -0,0 +1,56 @@
|
|
|
1
|
+
import { LlamaCppEngine } from "./engines/llama-cpp-engine.js";
|
|
2
|
+
import { MlxServeEngine } from "./engines/mlx-serve-engine.js";
|
|
3
|
+
import { ModelManager } from "./model-manager.js";
|
|
4
|
+
/**
 * Registry of the local LLM engines, keyed by each engine's `engineName`.
 *
 * The constructor registers the two built-in engines (LlamaCppEngine and
 * MlxServeEngine). Further engines can be added, or an existing name
 * replaced, through `register`.
 */
export class EngineRegistry {
    /** Registered engines keyed by `engineName`; a Map iterates in insertion order. */
    engines = new Map();
    /** Base directory last passed to `setBaseDir`; empty string until then. */
    _baseDir = '';
    constructor() {
        this.register(new LlamaCppEngine());
        this.register(new MlxServeEngine());
    }
    /**
     * Adds an engine under its `engineName`. Registering a second engine with
     * the same name replaces the first.
     */
    register(engine) {
        this.engines.set(engine.engineName, engine);
    }
    /** Returns the engine registered under `name`, or `undefined` if there is none. */
    getEngine(name) {
        return this.engines.get(name);
    }
    /** Returns the registered engines whose `isAvailable()` is truthy. */
    getAvailableEngines() {
        return [...this.engines.values()].filter(e => e.isAvailable());
    }
    /** Returns every registered engine, available or not. */
    getAllEngines() {
        return [...this.engines.values()];
    }
    /** Returns an object mapping each engine name to that engine's `getStatus()` result. */
    getAllStatus() {
        const result = {};
        for (const [name, engine] of this.engines) {
            result[name] = engine.getStatus();
        }
        return result;
    }
    /**
     * Remembers `dir` (it is later used by `resolveModelPath`) and forwards it
     * to every registered engine.
     */
    setBaseDir(dir) {
        this._baseDir = dir;
        for (const engine of this.engines.values()) {
            engine.setBaseDir(dir);
        }
    }
    /** Calls `killOrphans()` on every registered engine. */
    killAllOrphans() {
        for (const engine of this.engines.values()) {
            engine.killOrphans();
        }
    }
    /**
     * Unloads the chat and embedding models of every registered engine, one
     * after another.
     *
     * Every unload is attempted even when an earlier one rejects, so a single
     * failing engine cannot leave the others loaded. If anything failed, the
     * first error encountered is rethrown once all attempts have finished.
     *
     * @throws The first error raised by any `unloadChat` / `unloadEmbedding` call.
     */
    async unloadAll() {
        let firstError;
        let failed = false;
        for (const engine of this.engines.values()) {
            // Arrow functions keep `engine` as the receiver of each call.
            const steps = [() => engine.unloadChat(), () => engine.unloadEmbedding()];
            for (const step of steps) {
                try {
                    await step();
                }
                catch (err) {
                    // Keep going; only the first failure is reported to the caller.
                    if (!failed) {
                        failed = true;
                        firstError = err;
                    }
                }
            }
        }
        if (failed)
            throw firstError;
    }
    /**
     * Looks up a downloaded model by name using a ModelManager rooted at the
     * current base directory.
     *
     * @returns Whatever `ModelManager.findModelFile` resolves to (shape not
     *   visible here — presumably includes the file path; confirm in model-manager).
     * @throws Error when `findModelFile` resolves to a falsy value.
     */
    async resolveModelPath(modelName) {
        const manager = new ModelManager(this._baseDir);
        const result = await manager.findModelFile(modelName);
        if (!result)
            throw new Error(`Local model "${modelName}" not found. Download it first.`);
        return result;
    }
}
|
|
55
|
+
// Module-level registry instance; constructing it registers the LlamaCppEngine and MlxServeEngine engines.
export const engineRegistry = new EngineRegistry();
|
|
56
|
+
//# sourceMappingURL=engine-registry.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"engine-registry.js","sourceRoot":"","sources":["../../../lib/local-llm/engine-registry.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,cAAc,EAAE,MAAM,+BAA+B,CAAC;AAC/D,OAAO,EAAE,cAAc,EAAE,MAAM,+BAA+B,CAAC;AAC/D,OAAO,EAAE,YAAY,EAAE,MAAM,oBAAoB,CAAC;AAGlD,MAAM,OAAO,cAAc;IACjB,OAAO,GAAG,IAAI,GAAG,EAAuB,CAAC;IACzC,QAAQ,GAAG,EAAE,CAAC;IAEtB;QACE,IAAI,CAAC,QAAQ,CAAC,IAAI,cAAc,EAAE,CAAC,CAAC;QACpC,IAAI,CAAC,QAAQ,CAAC,IAAI,cAAc,EAAE,CAAC,CAAC;IACtC,CAAC;IAED,QAAQ,CAAC,MAAmB;QAC1B,IAAI,CAAC,OAAO,CAAC,GAAG,CAAC,MAAM,CAAC,UAAU,EAAE,MAAM,CAAC,CAAC;IAC9C,CAAC;IAED,SAAS,CAAC,IAAY;QACpB,OAAO,IAAI,CAAC,OAAO,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC;IAChC,CAAC;IAED,mBAAmB;QACjB,OAAO,CAAC,GAAG,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,WAAW,EAAE,CAAC,CAAC;IACjE,CAAC;IAED,aAAa;QACX,OAAO,CAAC,GAAG,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC;IACpC,CAAC;IAED,YAAY;QACV,MAAM,MAAM,GAAiC,EAAE,CAAC;QAChD,KAAK,MAAM,CAAC,IAAI,EAAE,MAAM,CAAC,IAAI,IAAI,CAAC,OAAO,EAAE,CAAC;YAC1C,MAAM,CAAC,IAAI,CAAC,GAAG,MAAM,CAAC,SAAS,EAAE,CAAC;QACpC,CAAC;QACD,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,UAAU,CAAC,GAAW;QACpB,IAAI,CAAC,QAAQ,GAAG,GAAG,CAAC;QACpB,KAAK,MAAM,MAAM,IAAI,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC;YAC3C,MAAM,CAAC,UAAU,CAAC,GAAG,CAAC,CAAC;QACzB,CAAC;IACH,CAAC;IAED,cAAc;QACZ,KAAK,MAAM,MAAM,IAAI,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC;YAC3C,MAAM,CAAC,WAAW,EAAE,CAAC;QACvB,CAAC;IACH,CAAC;IAED,KAAK,CAAC,SAAS;QACb,KAAK,MAAM,MAAM,IAAI,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC;YAC3C,MAAM,MAAM,CAAC,UAAU,EAAE,CAAC;YAC1B,MAAM,MAAM,CAAC,eAAe,EAAE,CAAC;QACjC,CAAC;IACH,CAAC;IAED,KAAK,CAAC,gBAAgB,CAAC,SAAiB;QACtC,MAAM,OAAO,GAAG,IAAI,YAAY,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAChD,MAAM,MAAM,GAAG,MAAM,OAAO,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;QACtD,IAAI,CAAC,MAAM;YAAE,MAAM,IAAI,KAAK,CAAC,gBAAgB,SAAS,iCAAiC,CAAC,CAAC;QACzF,OAAO,MAAM,CAAC;IAChB,CAAC;CACF;AAED,MAAM,CAAC,MAAM,cAAc,GAAG,IAAI,cAAc,EAAE,CAAC"}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
import type { LocalEngine, EngineChatStatus, EngineServerStatus, EngineStatus, LoadOptions } from '../engine-interface.ts';
|
|
2
|
+
/**
 * Declaration of the LocalEngine implementation registered under the name "llama-cpp".
 * Its compiled implementation drives separate LlamaServerProcess instances for chat and embedding.
 */
export declare class LlamaCppEngine implements LocalEngine {
|
|
3
|
+
/** Engine identifier; EngineRegistry uses it as the registration key. */
readonly engineName = "llama-cpp";
|
|
4
|
+
/** Base directory last supplied through setBaseDir. */
private _baseDir;
|
|
5
|
+
/** Chat server process wrapper; created on the first loadChat call. */
private chatServer;
|
|
6
|
+
/** Embedding server process wrapper; created on the first loadEmbedding call. */
private embeddingServer;
|
|
7
|
+
/** Context size used for the most recent chat load, or null when none was determined. */
private _detectedContextSize;
|
|
8
|
+
/** Model + KV-cache byte estimate computed during loadChat when GGUF info is readable. */
private _memoryEstimate;
|
|
9
|
+
/** True when loadChat found a multimodal projector (mmproj) for the model. */
private _supportsVision;
|
|
10
|
+
/** Stores the base directory used for binary and model lookups. */
setBaseDir(dir: string): void;
|
|
11
|
+
/** True when a binary version can be resolved for the current base directory. */
isAvailable(): boolean;
|
|
12
|
+
/**
 * Starts the chat server for the given model file. Returns early when the same model is already running.
 * When opts.contextSize is not given, the context size is derived from the model's GGUF info if readable.
 */
loadChat(modelPath: string, opts?: LoadOptions): Promise<void>;
|
|
13
|
+
/** Stops the chat server if one has been created. */
unloadChat(): Promise<void>;
|
|
14
|
+
/** Unloads the current chat model, then loads the given one. */
swapChat(modelPath: string, opts?: LoadOptions): Promise<void>;
|
|
15
|
+
/**
 * Returns immediately when a chat server is already running (whatever model it holds);
 * otherwise resolves modelName to a file and loads it.
 */
ensureRunningChat(modelName: string, opts?: LoadOptions): Promise<void>;
|
|
16
|
+
/** Snapshot of the chat server: running flag, active model, port, context size, memory estimate, vision support. */
getChatStatus(): EngineChatStatus;
|
|
17
|
+
/** Base URL of the chat server when it reports ready, otherwise null. */
getChatBaseUrl(): string | null;
|
|
18
|
+
/** Loads an embedding model on the dedicated embedding server (remainder of implementation not visible here). */
loadEmbedding(modelPath: string): Promise<void>;
|
|
19
|
+
/** Presumably stops the embedding server, mirroring unloadChat; implementation not visible here, confirm. */
unloadEmbedding(): Promise<void>;
|
|
20
|
+
/** Presumably the embedding counterpart of ensureRunningChat; implementation not visible here, confirm. */
ensureRunningEmbedding(modelName: string): Promise<void>;
|
|
21
|
+
/** Presumably the embedding counterpart of getChatStatus; implementation not visible here, confirm. */
getEmbeddingStatus(): EngineServerStatus;
|
|
22
|
+
/** Presumably the embedding counterpart of getChatBaseUrl; implementation not visible here, confirm. */
getEmbeddingBaseUrl(): string | null;
|
|
23
|
+
/** Overall engine status; EngineRegistry.getAllStatus collects this per engine. */
getStatus(): EngineStatus;
|
|
24
|
+
/** Called by EngineRegistry.killAllOrphans; presumably kills leftover server processes, confirm. */
killOrphans(): void;
|
|
25
|
+
/** Binary version string, or null; presumably null when no binary is found, confirm. */
getBinaryVersion(): string | null;
|
|
26
|
+
/** Where the binary comes from ('managed' or 'system'), or null; exact rules not visible here, confirm. */
getBinarySource(): 'managed' | 'system' | null;
|
|
27
|
+
/** NOTE(review): result is typed `any`; presumably forwards binary-manager's checkForUpdate result, confirm. */
checkForUpdate(): Promise<any>;
|
|
28
|
+
/** Presumably updates the managed binary via binary-manager; implementation not visible here, confirm. */
updateBinary(): Promise<void>;
|
|
29
|
+
/** Resolves a model name to a result containing filePath (used by ensureRunningChat). */
private resolveModelPath;
|
|
30
|
+
}
|
|
31
|
+
//# sourceMappingURL=llama-cpp-engine.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"llama-cpp-engine.d.ts","sourceRoot":"","sources":["../../../../lib/local-llm/engines/llama-cpp-engine.ts"],"names":[],"mappings":"AAOA,OAAO,KAAK,EAAE,WAAW,EAAE,gBAAgB,EAAE,kBAAkB,EAAE,YAAY,EAAE,WAAW,EAAE,MAAM,wBAAwB,CAAC;AAE3H,qBAAa,cAAe,YAAW,WAAW;IAChD,QAAQ,CAAC,UAAU,eAAe;IAElC,OAAO,CAAC,QAAQ,CAAM;IACtB,OAAO,CAAC,UAAU,CAAmC;IACrD,OAAO,CAAC,eAAe,CAAmC;IAC1D,OAAO,CAAC,oBAAoB,CAAuB;IACnD,OAAO,CAAC,eAAe,CAAiF;IACxG,OAAO,CAAC,eAAe,CAAS;IAEhC,UAAU,CAAC,GAAG,EAAE,MAAM,GAAG,IAAI;IAI7B,WAAW,IAAI,OAAO;IAMhB,QAAQ,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,WAAW,GAAG,OAAO,CAAC,IAAI,CAAC;IA8C9D,UAAU,IAAI,OAAO,CAAC,IAAI,CAAC;IAM3B,QAAQ,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,WAAW,GAAG,OAAO,CAAC,IAAI,CAAC;IAK9D,iBAAiB,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,WAAW,GAAG,OAAO,CAAC,IAAI,CAAC;IAO7E,aAAa,IAAI,gBAAgB;IAYjC,cAAc,IAAI,MAAM,GAAG,IAAI;IAMzB,aAAa,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAM/C,eAAe,IAAI,OAAO,CAAC,IAAI,CAAC;IAMhC,sBAAsB,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAO9D,kBAAkB,IAAI,kBAAkB;IAWxC,mBAAmB,IAAI,MAAM,GAAG,IAAI;IAMpC,SAAS,IAAI,YAAY;IASzB,WAAW,IAAI,IAAI;IAMnB,gBAAgB,IAAI,MAAM,GAAG,IAAI;IAIjC,eAAe,IAAI,SAAS,GAAG,QAAQ,GAAG,IAAI;IAMxC,cAAc,IAAI,OAAO,CAAC,GAAG,CAAC;IAI9B,YAAY,IAAI,OAAO,CAAC,IAAI,CAAC;YAMrB,gBAAgB;CAM/B"}
|
|
@@ -0,0 +1,164 @@
|
|
|
1
|
+
import * as path from 'path';
|
|
2
|
+
import { LlamaServerProcess } from "../llama-server-process.js";
|
|
3
|
+
import { killOrphanedServers } from "../llama-server-process.js";
|
|
4
|
+
import { ModelManager } from "../model-manager.js";
|
|
5
|
+
import { readGGUFModelInfo, calculateOptimalContextSize, kvCacheBytesPerToken } from "../gguf-reader.js";
|
|
6
|
+
import { detectGpu, getBinaryVersion, isSystemBinary, updateBinary, checkForUpdate } from "../binary-manager.js";
|
|
7
|
+
import { logger } from "../../logger.js";
|
|
8
|
+
export class LlamaCppEngine {
|
|
9
|
+
engineName = 'llama-cpp';
|
|
10
|
+
_baseDir = '';
|
|
11
|
+
chatServer = null;
|
|
12
|
+
embeddingServer = null;
|
|
13
|
+
_detectedContextSize = null;
|
|
14
|
+
_memoryEstimate = null;
|
|
15
|
+
_supportsVision = false;
|
|
16
|
+
setBaseDir(dir) {
|
|
17
|
+
this._baseDir = dir;
|
|
18
|
+
}
|
|
19
|
+
isAvailable() {
|
|
20
|
+
return getBinaryVersion(this._baseDir) !== null;
|
|
21
|
+
}
|
|
22
|
+
// ─── Chat ───────────────────────────────────────────────────────────────────
|
|
23
|
+
async loadChat(modelPath, opts) {
|
|
24
|
+
if (!this.chatServer)
|
|
25
|
+
this.chatServer = new LlamaServerProcess(this._baseDir);
|
|
26
|
+
if (this.chatServer.running && this.chatServer.modelPath === modelPath)
|
|
27
|
+
return;
|
|
28
|
+
let contextSize = opts?.contextSize;
|
|
29
|
+
const modelInfo = await readGGUFModelInfo(modelPath);
|
|
30
|
+
if (!contextSize && modelInfo) {
|
|
31
|
+
contextSize = calculateOptimalContextSize(modelInfo);
|
|
32
|
+
}
|
|
33
|
+
if (modelInfo && contextSize) {
|
|
34
|
+
const kvBytes = contextSize * kvCacheBytesPerToken(modelInfo);
|
|
35
|
+
this._memoryEstimate = {
|
|
36
|
+
modelBytes: modelInfo.fileSizeBytes,
|
|
37
|
+
kvCacheBytes: kvBytes,
|
|
38
|
+
totalBytes: modelInfo.fileSizeBytes + kvBytes,
|
|
39
|
+
};
|
|
40
|
+
}
|
|
41
|
+
// Auto-detect multimodal projector (mmproj) for vision support
|
|
42
|
+
const modelFileName = path.basename(modelPath);
|
|
43
|
+
const manager = new ModelManager(this._baseDir);
|
|
44
|
+
const mmproj = await manager.findMmprojForModel(modelFileName);
|
|
45
|
+
this._supportsVision = !!mmproj;
|
|
46
|
+
if (mmproj) {
|
|
47
|
+
logger.info(`[LlamaCppEngine] Vision enabled with mmproj: ${path.basename(mmproj)}`);
|
|
48
|
+
}
|
|
49
|
+
this._detectedContextSize = contextSize ?? null;
|
|
50
|
+
const gpu = detectGpu();
|
|
51
|
+
const isGpu = gpu.accel !== 'none';
|
|
52
|
+
const isMetal = gpu.accel === 'metal';
|
|
53
|
+
await this.chatServer.start({
|
|
54
|
+
modelPath,
|
|
55
|
+
contextSize,
|
|
56
|
+
mmproj: mmproj ?? undefined,
|
|
57
|
+
gpuLayers: isGpu ? -1 : 0,
|
|
58
|
+
flashAttn: isGpu,
|
|
59
|
+
...(isGpu ? { batchSize: 4096, ubatchSize: 1024 } : {}),
|
|
60
|
+
...(isMetal ? { cacheTypeK: 'q8_0', cacheTypeV: 'q8_0', mlock: true } : {}),
|
|
61
|
+
...(opts?.reasoningBudget !== undefined ? { reasoningBudget: opts.reasoningBudget } : {}),
|
|
62
|
+
});
|
|
63
|
+
}
|
|
64
|
+
async unloadChat() {
|
|
65
|
+
if (this.chatServer) {
|
|
66
|
+
await this.chatServer.stop();
|
|
67
|
+
}
|
|
68
|
+
}
|
|
69
|
+
async swapChat(modelPath, opts) {
|
|
70
|
+
await this.unloadChat();
|
|
71
|
+
await this.loadChat(modelPath, opts);
|
|
72
|
+
}
|
|
73
|
+
async ensureRunningChat(modelName, opts) {
|
|
74
|
+
if (this.chatServer?.running)
|
|
75
|
+
return;
|
|
76
|
+
logger.info(`[LlamaCppEngine] Auto-starting chat model: ${modelName}`);
|
|
77
|
+
const { filePath } = await this.resolveModelPath(modelName);
|
|
78
|
+
await this.loadChat(filePath, opts);
|
|
79
|
+
}
|
|
80
|
+
getChatStatus() {
|
|
81
|
+
const running = this.chatServer?.running ?? false;
|
|
82
|
+
return {
|
|
83
|
+
running,
|
|
84
|
+
activeModel: running ? (this.chatServer?.modelPath ?? null) : null,
|
|
85
|
+
port: this.chatServer?.port ?? null,
|
|
86
|
+
contextSize: this._detectedContextSize,
|
|
87
|
+
memoryEstimate: this._memoryEstimate,
|
|
88
|
+
supportsVision: this._supportsVision,
|
|
89
|
+
};
|
|
90
|
+
}
|
|
91
|
+
getChatBaseUrl() {
|
|
92
|
+
return this.chatServer?.ready ? this.chatServer.getBaseUrl() : null;
|
|
93
|
+
}
|
|
94
|
+
// ─── Embedding ──────────────────────────────────────────────────────────────
|
|
95
|
+
async loadEmbedding(modelPath) {
|
|
96
|
+
if (!this.embeddingServer)
|
|
97
|
+
this.embeddingServer = new LlamaServerProcess(this._baseDir, true);
|
|
98
|
+
if (this.embeddingServer.running && this.embeddingServer.modelPath === modelPath)
|
|
99
|
+
return;
|
|
100
|
+
await this.embeddingServer.start({ modelPath, embedding: true });
|
|
101
|
+
}
|
|
102
|
+
async unloadEmbedding() {
|
|
103
|
+
if (this.embeddingServer) {
|
|
104
|
+
await this.embeddingServer.stop();
|
|
105
|
+
}
|
|
106
|
+
}
|
|
107
|
+
async ensureRunningEmbedding(modelName) {
|
|
108
|
+
if (this.embeddingServer?.running)
|
|
109
|
+
return;
|
|
110
|
+
logger.info(`[LlamaCppEngine] Auto-starting embedding model: ${modelName}`);
|
|
111
|
+
const { filePath } = await this.resolveModelPath(modelName);
|
|
112
|
+
await this.loadEmbedding(filePath);
|
|
113
|
+
}
|
|
114
|
+
getEmbeddingStatus() {
|
|
115
|
+
const running = this.embeddingServer?.running ?? false;
|
|
116
|
+
return {
|
|
117
|
+
running,
|
|
118
|
+
activeModel: running ? (this.embeddingServer?.modelPath ?? null) : null,
|
|
119
|
+
port: this.embeddingServer?.port ?? null,
|
|
120
|
+
contextSize: null,
|
|
121
|
+
memoryEstimate: null,
|
|
122
|
+
};
|
|
123
|
+
}
|
|
124
|
+
getEmbeddingBaseUrl() {
|
|
125
|
+
return this.embeddingServer?.ready ? this.embeddingServer.getBaseUrl() : null;
|
|
126
|
+
}
|
|
127
|
+
// ─── Combined ───────────────────────────────────────────────────────────────
|
|
128
|
+
getStatus() {
|
|
129
|
+
return {
|
|
130
|
+
engineName: this.engineName,
|
|
131
|
+
available: this.isAvailable(),
|
|
132
|
+
chat: this.getChatStatus(),
|
|
133
|
+
embedding: this.getEmbeddingStatus(),
|
|
134
|
+
};
|
|
135
|
+
}
|
|
136
|
+
killOrphans() {
|
|
137
|
+
killOrphanedServers(this._baseDir);
|
|
138
|
+
}
|
|
139
|
+
// ─── Binary management ─────────────────────────────────────────────────────
|
|
140
|
+
getBinaryVersion() {
|
|
141
|
+
return getBinaryVersion(this._baseDir);
|
|
142
|
+
}
|
|
143
|
+
getBinarySource() {
|
|
144
|
+
const version = getBinaryVersion(this._baseDir);
|
|
145
|
+
if (!version)
|
|
146
|
+
return null;
|
|
147
|
+
return isSystemBinary() ? 'system' : 'managed';
|
|
148
|
+
}
|
|
149
|
+
async checkForUpdate() {
|
|
150
|
+
return checkForUpdate(this._baseDir);
|
|
151
|
+
}
|
|
152
|
+
async updateBinary() {
|
|
153
|
+
return updateBinary(this._baseDir);
|
|
154
|
+
}
|
|
155
|
+
// ─── Private ────────────────────────────────────────────────────────────────
|
|
156
|
+
async resolveModelPath(modelName) {
|
|
157
|
+
const manager = new ModelManager(this._baseDir);
|
|
158
|
+
const result = await manager.findModelFile(modelName);
|
|
159
|
+
if (!result)
|
|
160
|
+
throw new Error(`Local model "${modelName}" not found. Download it first.`);
|
|
161
|
+
return result;
|
|
162
|
+
}
|
|
163
|
+
}
|
|
164
|
+
//# sourceMappingURL=llama-cpp-engine.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"llama-cpp-engine.js","sourceRoot":"","sources":["../../../../lib/local-llm/engines/llama-cpp-engine.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,IAAI,MAAM,MAAM,CAAC;AAC7B,OAAO,EAAE,kBAAkB,EAAE,MAAM,4BAA4B,CAAC;AAChE,OAAO,EAAE,mBAAmB,EAAE,MAAM,4BAA4B,CAAC;AACjE,OAAO,EAAE,YAAY,EAAE,MAAM,qBAAqB,CAAC;AACnD,OAAO,EAAE,iBAAiB,EAAE,2BAA2B,EAAE,oBAAoB,EAAE,MAAM,mBAAmB,CAAC;AACzG,OAAO,EAAE,SAAS,EAAE,gBAAgB,EAAE,cAAc,EAAE,YAAY,EAAE,cAAc,EAAE,MAAM,sBAAsB,CAAC;AACjH,OAAO,EAAE,MAAM,EAAE,MAAM,iBAAiB,CAAC;AAGzC,MAAM,OAAO,cAAc;IAChB,UAAU,GAAG,WAAW,CAAC;IAE1B,QAAQ,GAAG,EAAE,CAAC;IACd,UAAU,GAA8B,IAAI,CAAC;IAC7C,eAAe,GAA8B,IAAI,CAAC;IAClD,oBAAoB,GAAkB,IAAI,CAAC;IAC3C,eAAe,GAA4E,IAAI,CAAC;IAChG,eAAe,GAAG,KAAK,CAAC;IAEhC,UAAU,CAAC,GAAW;QACpB,IAAI,CAAC,QAAQ,GAAG,GAAG,CAAC;IACtB,CAAC;IAED,WAAW;QACT,OAAO,gBAAgB,CAAC,IAAI,CAAC,QAAQ,CAAC,KAAK,IAAI,CAAC;IAClD,CAAC;IAED,+EAA+E;IAE/E,KAAK,CAAC,QAAQ,CAAC,SAAiB,EAAE,IAAkB;QAClD,IAAI,CAAC,IAAI,CAAC,UAAU;YAAE,IAAI,CAAC,UAAU,GAAG,IAAI,kBAAkB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAC9E,IAAI,IAAI,CAAC,UAAU,CAAC,OAAO,IAAI,IAAI,CAAC,UAAU,CAAC,SAAS,KAAK,SAAS;YAAE,OAAO;QAE/E,IAAI,WAAW,GAAG,IAAI,EAAE,WAAW,CAAC;QAEpC,MAAM,SAAS,GAAG,MAAM,iBAAiB,CAAC,SAAS,CAAC,CAAC;QACrD,IAAI,CAAC,WAAW,IAAI,SAAS,EAAE,CAAC;YAC9B,WAAW,GAAG,2BAA2B,CAAC,SAAS,CAAC,CAAC;QACvD,CAAC;QAED,IAAI,SAAS,IAAI,WAAW,EAAE,CAAC;YAC7B,MAAM,OAAO,GAAG,WAAW,GAAG,oBAAoB,CAAC,SAAS,CAAC,CAAC;YAC9D,IAAI,CAAC,eAAe,GAAG;gBACrB,UAAU,EAAE,SAAS,CAAC,aAAa;gBACnC,YAAY,EAAE,OAAO;gBACrB,UAAU,EAAE,SAAS,CAAC,aAAa,GAAG,OAAO;aAC9C,CAAC;QACJ,CAAC;QAED,+DAA+D;QAC/D,MAAM,aAAa,GAAG,IAAI,CAAC,QAAQ,CAAC,SAAS,CAAC,CAAC;QAC/C,MAAM,OAAO,GAAG,IAAI,YAAY,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAChD,MAAM,MAAM,GAAG,MAAM,OAAO,CAAC,kBAAkB,CAAC,aAAa,CAAC,CAAC;QAC/D,IAAI,CAAC,eAAe,GAAG,CAAC,CAAC,MAAM,CAAC;QAEhC,IAAI,MAAM,EAAE,CAAC;YACX,MAAM,CAAC,IAAI,CAAC,gDAAgD,IAAI,CAAC,QAAQ,CAAC,MAAM,CAAC,EAAE,CAAC,CAAC;QACvF,CAAC;QAED,IAAI,CAAC,oBAAoB,GAAG,WAAW,IAAI,IAAI,CAAC;QAChD,MAAM,GAAG,GAAG,SAAS,EAAE,CAAC;QACxB,MAAM,KAAK,GAAG,GAAG,CAAC,KA
AK,KAAK,MAAM,CAAC;QACnC,MAAM,OAAO,GAAG,GAAG,CAAC,KAAK,KAAK,OAAO,CAAC;QACtC,MAAM,IAAI,CAAC,UAAU,CAAC,KAAK,CAAC;YAC1B,SAAS;YACT,WAAW;YACX,MAAM,EAAE,MAAM,IAAI,SAAS;YAC3B,SAAS,EAAE,KAAK,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YACzB,SAAS,EAAE,KAAK;YAChB,GAAG,CAAC,KAAK,CAAC,CAAC,CAAC,EAAE,SAAS,EAAE,IAAI,EAAE,UAAU,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;YACvD,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,UAAU,EAAE,MAAM,EAAE,UAAU,EAAE,MAAM,EAAE,KAAK,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;YAC3E,GAAG,CAAC,IAAI,EAAE,eAAe,KAAK,SAAS,CAAC,CAAC,CAAC,EAAE,eAAe,EAAE,IAAI,CAAC,eAAe,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;SAC1F,CAAC,CAAC;IACL,CAAC;IAED,KAAK,CAAC,UAAU;QACd,IAAI,IAAI,CAAC,UAAU,EAAE,CAAC;YACpB,MAAM,IAAI,CAAC,UAAU,CAAC,IAAI,EAAE,CAAC;QAC/B,CAAC;IACH,CAAC;IAED,KAAK,CAAC,QAAQ,CAAC,SAAiB,EAAE,IAAkB;QAClD,MAAM,IAAI,CAAC,UAAU,EAAE,CAAC;QACxB,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,EAAE,IAAI,CAAC,CAAC;IACvC,CAAC;IAED,KAAK,CAAC,iBAAiB,CAAC,SAAiB,EAAE,IAAkB;QAC3D,IAAI,IAAI,CAAC,UAAU,EAAE,OAAO;YAAE,OAAO;QACrC,MAAM,CAAC,IAAI,CAAC,8CAA8C,SAAS,EAAE,CAAC,CAAC;QACvE,MAAM,EAAE,QAAQ,EAAE,GAAG,MAAM,IAAI,CAAC,gBAAgB,CAAC,SAAS,CAAC,CAAC;QAC5D,MAAM,IAAI,CAAC,QAAQ,CAAC,QAAQ,EAAE,IAAI,CAAC,CAAC;IACtC,CAAC;IAED,aAAa;QACX,MAAM,OAAO,GAAG,IAAI,CAAC,UAAU,EAAE,OAAO,IAAI,KAAK,CAAC;QAClD,OAAO;YACL,OAAO;YACP,WAAW,EAAE,OAAO,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,UAAU,EAAE,SAAS,IAAI,IAAI,CAAC,CAAC,CAAC,CAAC,IAAI;YAClE,IAAI,EAAE,IAAI,CAAC,UAAU,EAAE,IAAI,IAAI,IAAI;YACnC,WAAW,EAAE,IAAI,CAAC,oBAAoB;YACtC,cAAc,EAAE,IAAI,CAAC,eAAe;YACpC,cAAc,EAAE,IAAI,CAAC,eAAe;SACrC,CAAC;IACJ,CAAC;IAED,cAAc;QACZ,OAAO,IAAI,CAAC,UAAU,EAAE,KAAK,CAAC,CAAC,CAAC,IAAI,CAAC,UAAU,CAAC,UAAU,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC;IACtE,CAAC;IAED,+EAA+E;IAE/E,KAAK,CAAC,aAAa,CAAC,SAAiB;QACnC,IAAI,CAAC,IAAI,CAAC,eAAe;YAAE,IAAI,CAAC,eAAe,GAAG,IAAI,kBAAkB,CAAC,IAAI,CAAC,QAAQ,EAAE,IAAI,CAAC,CAAC;QAC9F,IAAI,IAAI,CAAC,eAAe,CAAC,OAAO,IAAI,IAAI,CAAC,eAAe,CAAC,SAAS,KAAK,SAAS;YAAE,OAAO;QACzF,MAAM,IAAI,CAAC,eAAe,CAAC,KAAK,CAAC,EAAE,SAAS,EAAE,SAAS,EAAE,IAAI,EAAE,CAAC,CAAC;IACnE,CAAC;IAED,KAAK
,CAAC,eAAe;QACnB,IAAI,IAAI,CAAC,eAAe,EAAE,CAAC;YACzB,MAAM,IAAI,CAAC,eAAe,CAAC,IAAI,EAAE,CAAC;QACpC,CAAC;IACH,CAAC;IAED,KAAK,CAAC,sBAAsB,CAAC,SAAiB;QAC5C,IAAI,IAAI,CAAC,eAAe,EAAE,OAAO;YAAE,OAAO;QAC1C,MAAM,CAAC,IAAI,CAAC,mDAAmD,SAAS,EAAE,CAAC,CAAC;QAC5E,MAAM,EAAE,QAAQ,EAAE,GAAG,MAAM,IAAI,CAAC,gBAAgB,CAAC,SAAS,CAAC,CAAC;QAC5D,MAAM,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,CAAC;IACrC,CAAC;IAED,kBAAkB;QAChB,MAAM,OAAO,GAAG,IAAI,CAAC,eAAe,EAAE,OAAO,IAAI,KAAK,CAAC;QACvD,OAAO;YACL,OAAO;YACP,WAAW,EAAE,OAAO,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,eAAe,EAAE,SAAS,IAAI,IAAI,CAAC,CAAC,CAAC,CAAC,IAAI;YACvE,IAAI,EAAE,IAAI,CAAC,eAAe,EAAE,IAAI,IAAI,IAAI;YACxC,WAAW,EAAE,IAAI;YACjB,cAAc,EAAE,IAAI;SACrB,CAAC;IACJ,CAAC;IAED,mBAAmB;QACjB,OAAO,IAAI,CAAC,eAAe,EAAE,KAAK,CAAC,CAAC,CAAC,IAAI,CAAC,eAAe,CAAC,UAAU,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC;IAChF,CAAC;IAED,+EAA+E;IAE/E,SAAS;QACP,OAAO;YACL,UAAU,EAAE,IAAI,CAAC,UAAU;YAC3B,SAAS,EAAE,IAAI,CAAC,WAAW,EAAE;YAC7B,IAAI,EAAE,IAAI,CAAC,aAAa,EAAE;YAC1B,SAAS,EAAE,IAAI,CAAC,kBAAkB,EAAE;SACrC,CAAC;IACJ,CAAC;IAED,WAAW;QACT,mBAAmB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IACrC,CAAC;IAED,8EAA8E;IAE9E,gBAAgB;QACd,OAAO,gBAAgB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IACzC,CAAC;IAED,eAAe;QACb,MAAM,OAAO,GAAG,gBAAgB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAChD,IAAI,CAAC,OAAO;YAAE,OAAO,IAAI,CAAC;QAC1B,OAAO,cAAc,EAAE,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,CAAC,SAAS,CAAC;IACjD,CAAC;IAED,KAAK,CAAC,cAAc;QAClB,OAAO,cAAc,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IACvC,CAAC;IAED,KAAK,CAAC,YAAY;QAChB,OAAO,YAAY,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IACrC,CAAC;IAED,+EAA+E;IAEvE,KAAK,CAAC,gBAAgB,CAAC,SAAiB;QAC9C,MAAM,OAAO,GAAG,IAAI,YAAY,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAChD,MAAM,MAAM,GAAG,MAAM,OAAO,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;QACtD,IAAI,CAAC,MAAM;YAAE,MAAM,IAAI,KAAK,CAAC,gBAAgB,SAAS,iCAAiC,CAAC,CAAC;QACzF,OAAO,MAAM,CAAC;IAChB,CAAC;CACF"}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
import type { LocalEngine, EngineChatStatus, EngineServerStatus, EngineStatus, LoadOptions } from '../engine-interface.ts';
|
|
2
|
+
/**
 * Type declarations for the engine that manages mlx-serve server processes
 * (one for chat, one for embeddings) behind the `LocalEngine` interface.
 */
export declare class MlxServeEngine implements LocalEngine {
|
|
3
|
+
/** Engine identifier; included in the object returned by getStatus(). */
readonly engineName = "mlx-serve";
|
|
4
|
+
/** Base directory passed to the binary manager, model manager and server processes. */
private _baseDir;
|
|
5
|
+
/** Chat server process; created on the first loadChat() call. */
private chatServer;
|
|
6
|
+
/** Embedding server process; created on the first loadEmbedding() call. */
private embeddingServer;
|
|
7
|
+
/** Context size requested by the caller, or the n_ctx value read from the server's /props endpoint. */
private _detectedContextSize;
|
|
8
|
+
/** Memory estimate computed from /props after the last chat load, or null. */
private _memoryEstimate;
|
|
9
|
+
/** Vision flag; the implementation only ever sets it to false. */
private _supportsVision;
|
|
10
|
+
/** Sets the base directory used by every other method. */
setBaseDir(dir: string): void;
|
|
11
|
+
/** True only when a binary version resolves AND the process runs on darwin/arm64. */
isAvailable(): boolean;
|
|
12
|
+
/** Starts the chat server for modelPath; returns early when that model path is already running. */
loadChat(modelPath: string, opts?: LoadOptions): Promise<void>;
|
|
13
|
+
/** Stops the chat server if one has been created. */
unloadChat(): Promise<void>;
|
|
14
|
+
/** unloadChat() followed by loadChat(modelPath, opts). */
swapChat(modelPath: string, opts?: LoadOptions): Promise<void>;
|
|
15
|
+
/** Resolves modelName to a file and loads it unless a chat server is already running (any model). */
ensureRunningChat(modelName: string, opts?: LoadOptions): Promise<void>;
|
|
16
|
+
/** Snapshot of the chat server state plus the values cached by the last loadChat(). */
getChatStatus(): EngineChatStatus;
|
|
17
|
+
/** Chat server base URL once the server reports ready, otherwise null. */
getChatBaseUrl(): string | null;
|
|
18
|
+
/** Starts the embedding server for modelPath; returns early when that model path is already running. */
loadEmbedding(modelPath: string): Promise<void>;
|
|
19
|
+
/** Stops the embedding server if one has been created. */
unloadEmbedding(): Promise<void>;
|
|
20
|
+
/** Resolves modelName to a file and loads it unless an embedding server is already running (any model). */
ensureRunningEmbedding(modelName: string): Promise<void>;
|
|
21
|
+
/** Snapshot of the embedding server state; contextSize and memoryEstimate are always null. */
getEmbeddingStatus(): EngineServerStatus;
|
|
22
|
+
/** Embedding server base URL once the server reports ready, otherwise null. */
getEmbeddingBaseUrl(): string | null;
|
|
23
|
+
/** Engine name, availability and both server status snapshots. */
getStatus(): EngineStatus;
|
|
24
|
+
/** Delegates to killOrphanedMlxServers for the base directory. */
killOrphans(): void;
|
|
25
|
+
/** Binary version reported by the MLX binary manager, or null. */
getBinaryVersion(): string | null;
|
|
26
|
+
/** null when no binary version resolves, otherwise 'system' or 'managed'. */
getBinarySource(): 'managed' | 'system' | null;
|
|
27
|
+
/** Delegates to checkForMlxUpdate; the result shape is not typed here. */
checkForUpdate(): Promise<any>;
|
|
28
|
+
/** Delegates to updateMlxBinary for the base directory. */
updateBinary(): Promise<void>;
|
|
29
|
+
/** Looks the model up via ModelManager.findModelFile and throws when it is not found. */
private resolveModelPath;
|
|
30
|
+
}
|
|
31
|
+
//# sourceMappingURL=mlx-serve-engine.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"mlx-serve-engine.d.ts","sourceRoot":"","sources":["../../../../lib/local-llm/engines/mlx-serve-engine.ts"],"names":[],"mappings":"AAKA,OAAO,KAAK,EAAE,WAAW,EAAE,gBAAgB,EAAE,kBAAkB,EAAE,YAAY,EAAE,WAAW,EAAE,MAAM,wBAAwB,CAAC;AAE3H,qBAAa,cAAe,YAAW,WAAW;IAChD,QAAQ,CAAC,UAAU,eAAe;IAElC,OAAO,CAAC,QAAQ,CAAM;IACtB,OAAO,CAAC,UAAU,CAAiC;IACnD,OAAO,CAAC,eAAe,CAAiC;IACxD,OAAO,CAAC,oBAAoB,CAAuB;IACnD,OAAO,CAAC,eAAe,CAAiF;IACxG,OAAO,CAAC,eAAe,CAAS;IAEhC,UAAU,CAAC,GAAG,EAAE,MAAM,GAAG,IAAI;IAI7B,WAAW,IAAI,OAAO;IAMhB,QAAQ,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,WAAW,GAAG,OAAO,CAAC,IAAI,CAAC;IAwC9D,UAAU,IAAI,OAAO,CAAC,IAAI,CAAC;IAM3B,QAAQ,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,WAAW,GAAG,OAAO,CAAC,IAAI,CAAC;IAK9D,iBAAiB,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,WAAW,GAAG,OAAO,CAAC,IAAI,CAAC;IAO7E,aAAa,IAAI,gBAAgB;IAYjC,cAAc,IAAI,MAAM,GAAG,IAAI;IAMzB,aAAa,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAQ/C,eAAe,IAAI,OAAO,CAAC,IAAI,CAAC;IAMhC,sBAAsB,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;IAO9D,kBAAkB,IAAI,kBAAkB;IAWxC,mBAAmB,IAAI,MAAM,GAAG,IAAI;IAMpC,SAAS,IAAI,YAAY;IASzB,WAAW,IAAI,IAAI;IAMnB,gBAAgB,IAAI,MAAM,GAAG,IAAI;IAIjC,eAAe,IAAI,SAAS,GAAG,QAAQ,GAAG,IAAI;IAMxC,cAAc,IAAI,OAAO,CAAC,GAAG,CAAC;IAI9B,YAAY,IAAI,OAAO,CAAC,IAAI,CAAC;YAMrB,gBAAgB;CAM/B"}
|
|
@@ -0,0 +1,161 @@
|
|
|
1
|
+
import { MlxServerProcess } from "../mlx-server-process.js";
|
|
2
|
+
import { killOrphanedMlxServers } from "../mlx-server-process.js";
|
|
3
|
+
import { ModelManager } from "../model-manager.js";
|
|
4
|
+
import { getMlxBinaryVersion, isMlxSystemBinary, updateMlxBinary, checkForMlxUpdate } from "../mlx-binary-manager.js";
|
|
5
|
+
import { logger } from "../../logger.js";
|
|
6
|
+
export class MlxServeEngine {
|
|
7
|
+
engineName = 'mlx-serve';
|
|
8
|
+
_baseDir = '';
|
|
9
|
+
chatServer = null;
|
|
10
|
+
embeddingServer = null;
|
|
11
|
+
_detectedContextSize = null;
|
|
12
|
+
_memoryEstimate = null;
|
|
13
|
+
_supportsVision = false;
|
|
14
|
+
setBaseDir(dir) {
|
|
15
|
+
this._baseDir = dir;
|
|
16
|
+
}
|
|
17
|
+
isAvailable() {
|
|
18
|
+
return getMlxBinaryVersion(this._baseDir) !== null && process.platform === 'darwin' && process.arch === 'arm64';
|
|
19
|
+
}
|
|
20
|
+
// ─── Chat ───────────────────────────────────────────────────────────────────
|
|
21
|
+
async loadChat(modelPath, opts) {
|
|
22
|
+
if (this.chatServer?.running && this.chatServer.modelPath === modelPath)
|
|
23
|
+
return;
|
|
24
|
+
if (!this.chatServer)
|
|
25
|
+
this.chatServer = new MlxServerProcess(this._baseDir);
|
|
26
|
+
this._memoryEstimate = null;
|
|
27
|
+
this._supportsVision = false;
|
|
28
|
+
this._detectedContextSize = opts?.contextSize ?? null;
|
|
29
|
+
await this.chatServer.start({ modelPath, contextSize: opts?.contextSize, reasoningBudget: opts?.reasoningBudget });
|
|
30
|
+
// Fetch /props from mlx-serve to get memory usage and context size
|
|
31
|
+
try {
|
|
32
|
+
const baseUrl = this.chatServer.getBaseUrl();
|
|
33
|
+
const res = await fetch(`${baseUrl}/props`);
|
|
34
|
+
if (res.ok) {
|
|
35
|
+
const props = await res.json();
|
|
36
|
+
const nCtx = props.default_generation_settings?.n_ctx;
|
|
37
|
+
if (nCtx && !this._detectedContextSize) {
|
|
38
|
+
this._detectedContextSize = nCtx;
|
|
39
|
+
}
|
|
40
|
+
const ctxSize = this._detectedContextSize ?? nCtx ?? 0;
|
|
41
|
+
const info = props.model_info;
|
|
42
|
+
// KV cache: layers × 2(K+V) × kv_heads × head_dim × 2(float16) × ctx
|
|
43
|
+
const kvCacheBytes = info
|
|
44
|
+
? info.num_hidden_layers * 2 * info.num_key_value_heads * info.head_dim * 2 * ctxSize
|
|
45
|
+
: 0;
|
|
46
|
+
const modelBytes = props.memory?.active_bytes ?? 0;
|
|
47
|
+
if (modelBytes || kvCacheBytes) {
|
|
48
|
+
this._memoryEstimate = {
|
|
49
|
+
modelBytes,
|
|
50
|
+
kvCacheBytes,
|
|
51
|
+
totalBytes: modelBytes + kvCacheBytes,
|
|
52
|
+
};
|
|
53
|
+
}
|
|
54
|
+
}
|
|
55
|
+
}
|
|
56
|
+
catch (err) {
|
|
57
|
+
logger.warn('[MlxServeEngine] Failed to fetch /props:', err);
|
|
58
|
+
}
|
|
59
|
+
}
|
|
60
|
+
async unloadChat() {
|
|
61
|
+
if (this.chatServer) {
|
|
62
|
+
await this.chatServer.stop();
|
|
63
|
+
}
|
|
64
|
+
}
|
|
65
|
+
async swapChat(modelPath, opts) {
|
|
66
|
+
await this.unloadChat();
|
|
67
|
+
await this.loadChat(modelPath, opts);
|
|
68
|
+
}
|
|
69
|
+
async ensureRunningChat(modelName, opts) {
|
|
70
|
+
if (this.chatServer?.running)
|
|
71
|
+
return;
|
|
72
|
+
logger.info(`[MlxServeEngine] Auto-starting chat model: ${modelName}`);
|
|
73
|
+
const { filePath } = await this.resolveModelPath(modelName);
|
|
74
|
+
await this.loadChat(filePath, opts);
|
|
75
|
+
}
|
|
76
|
+
getChatStatus() {
|
|
77
|
+
const running = this.chatServer?.running ?? false;
|
|
78
|
+
return {
|
|
79
|
+
running,
|
|
80
|
+
activeModel: running ? (this.chatServer?.modelPath ?? null) : null,
|
|
81
|
+
port: this.chatServer?.port ?? null,
|
|
82
|
+
contextSize: this._detectedContextSize,
|
|
83
|
+
memoryEstimate: this._memoryEstimate,
|
|
84
|
+
supportsVision: this._supportsVision,
|
|
85
|
+
};
|
|
86
|
+
}
|
|
87
|
+
getChatBaseUrl() {
|
|
88
|
+
return this.chatServer?.ready ? this.chatServer.getBaseUrl() : null;
|
|
89
|
+
}
|
|
90
|
+
// ─── Embedding ──────────────────────────────────────────────────────────────
|
|
91
|
+
async loadEmbedding(modelPath) {
|
|
92
|
+
if (this.embeddingServer?.running && this.embeddingServer.modelPath === modelPath)
|
|
93
|
+
return;
|
|
94
|
+
if (!this.embeddingServer)
|
|
95
|
+
this.embeddingServer = new MlxServerProcess(this._baseDir, 'embedding');
|
|
96
|
+
await this.embeddingServer.start({ modelPath });
|
|
97
|
+
logger.info(`[MlxServeEngine] Embedding server ready on port ${this.embeddingServer.port}`);
|
|
98
|
+
}
|
|
99
|
+
async unloadEmbedding() {
|
|
100
|
+
if (this.embeddingServer) {
|
|
101
|
+
await this.embeddingServer.stop();
|
|
102
|
+
}
|
|
103
|
+
}
|
|
104
|
+
async ensureRunningEmbedding(modelName) {
|
|
105
|
+
if (this.embeddingServer?.running)
|
|
106
|
+
return;
|
|
107
|
+
logger.info(`[MlxServeEngine] Auto-starting embedding model: ${modelName}`);
|
|
108
|
+
const { filePath } = await this.resolveModelPath(modelName);
|
|
109
|
+
await this.loadEmbedding(filePath);
|
|
110
|
+
}
|
|
111
|
+
getEmbeddingStatus() {
|
|
112
|
+
const running = this.embeddingServer?.running ?? false;
|
|
113
|
+
return {
|
|
114
|
+
running,
|
|
115
|
+
activeModel: running ? (this.embeddingServer?.modelPath ?? null) : null,
|
|
116
|
+
port: this.embeddingServer?.port ?? null,
|
|
117
|
+
contextSize: null,
|
|
118
|
+
memoryEstimate: null,
|
|
119
|
+
};
|
|
120
|
+
}
|
|
121
|
+
getEmbeddingBaseUrl() {
|
|
122
|
+
return this.embeddingServer?.ready ? this.embeddingServer.getBaseUrl() : null;
|
|
123
|
+
}
|
|
124
|
+
// ─── Combined ───────────────────────────────────────────────────────────────
|
|
125
|
+
getStatus() {
|
|
126
|
+
return {
|
|
127
|
+
engineName: this.engineName,
|
|
128
|
+
available: this.isAvailable(),
|
|
129
|
+
chat: this.getChatStatus(),
|
|
130
|
+
embedding: this.getEmbeddingStatus(),
|
|
131
|
+
};
|
|
132
|
+
}
|
|
133
|
+
killOrphans() {
|
|
134
|
+
killOrphanedMlxServers(this._baseDir);
|
|
135
|
+
}
|
|
136
|
+
// ─── Binary management ─────────────────────────────────────────────────────
|
|
137
|
+
getBinaryVersion() {
|
|
138
|
+
return getMlxBinaryVersion(this._baseDir);
|
|
139
|
+
}
|
|
140
|
+
getBinarySource() {
|
|
141
|
+
const version = getMlxBinaryVersion(this._baseDir);
|
|
142
|
+
if (!version)
|
|
143
|
+
return null;
|
|
144
|
+
return isMlxSystemBinary() ? 'system' : 'managed';
|
|
145
|
+
}
|
|
146
|
+
async checkForUpdate() {
|
|
147
|
+
return checkForMlxUpdate(this._baseDir);
|
|
148
|
+
}
|
|
149
|
+
async updateBinary() {
|
|
150
|
+
return updateMlxBinary(this._baseDir);
|
|
151
|
+
}
|
|
152
|
+
// ─── Private ────────────────────────────────────────────────────────────────
|
|
153
|
+
async resolveModelPath(modelName) {
|
|
154
|
+
const manager = new ModelManager(this._baseDir);
|
|
155
|
+
const result = await manager.findModelFile(modelName);
|
|
156
|
+
if (!result)
|
|
157
|
+
throw new Error(`Local model "${modelName}" not found. Download it first.`);
|
|
158
|
+
return result;
|
|
159
|
+
}
|
|
160
|
+
}
|
|
161
|
+
//# sourceMappingURL=mlx-serve-engine.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"mlx-serve-engine.js","sourceRoot":"","sources":["../../../../lib/local-llm/engines/mlx-serve-engine.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,gBAAgB,EAAE,MAAM,0BAA0B,CAAC;AAC5D,OAAO,EAAE,sBAAsB,EAAE,MAAM,0BAA0B,CAAC;AAClE,OAAO,EAAE,YAAY,EAAE,MAAM,qBAAqB,CAAC;AACnD,OAAO,EAAE,mBAAmB,EAAE,iBAAiB,EAAE,eAAe,EAAE,iBAAiB,EAAE,MAAM,0BAA0B,CAAC;AACtH,OAAO,EAAE,MAAM,EAAE,MAAM,iBAAiB,CAAC;AAGzC,MAAM,OAAO,cAAc;IAChB,UAAU,GAAG,WAAW,CAAC;IAE1B,QAAQ,GAAG,EAAE,CAAC;IACd,UAAU,GAA4B,IAAI,CAAC;IAC3C,eAAe,GAA4B,IAAI,CAAC;IAChD,oBAAoB,GAAkB,IAAI,CAAC;IAC3C,eAAe,GAA4E,IAAI,CAAC;IAChG,eAAe,GAAG,KAAK,CAAC;IAEhC,UAAU,CAAC,GAAW;QACpB,IAAI,CAAC,QAAQ,GAAG,GAAG,CAAC;IACtB,CAAC;IAED,WAAW;QACT,OAAO,mBAAmB,CAAC,IAAI,CAAC,QAAQ,CAAC,KAAK,IAAI,IAAI,OAAO,CAAC,QAAQ,KAAK,QAAQ,IAAI,OAAO,CAAC,IAAI,KAAK,OAAO,CAAC;IAClH,CAAC;IAED,+EAA+E;IAE/E,KAAK,CAAC,QAAQ,CAAC,SAAiB,EAAE,IAAkB;QAClD,IAAI,IAAI,CAAC,UAAU,EAAE,OAAO,IAAI,IAAI,CAAC,UAAU,CAAC,SAAS,KAAK,SAAS;YAAE,OAAO;QAChF,IAAI,CAAC,IAAI,CAAC,UAAU;YAAE,IAAI,CAAC,UAAU,GAAG,IAAI,gBAAgB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAE5E,IAAI,CAAC,eAAe,GAAG,IAAI,CAAC;QAC5B,IAAI,CAAC,eAAe,GAAG,KAAK,CAAC;QAC7B,IAAI,CAAC,oBAAoB,GAAG,IAAI,EAAE,WAAW,IAAI,IAAI,CAAC;QAEtD,MAAM,IAAI,CAAC,UAAU,CAAC,KAAK,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,IAAI,EAAE,WAAW,EAAE,eAAe,EAAE,IAAI,EAAE,eAAe,EAAE,CAAC,CAAC;QAEnH,mEAAmE;QACnE,IAAI,CAAC;YACH,MAAM,OAAO,GAAG,IAAI,CAAC,UAAU,CAAC,UAAU,EAAE,CAAC;YAC7C,MAAM,GAAG,GAAG,MAAM,KAAK,CAAC,GAAG,OAAO,QAAQ,CAAC,CAAC;YAC5C,IAAI,GAAG,CAAC,EAAE,EAAE,CAAC;gBACX,MAAM,KAAK,GAAG,MAAM,GAAG,CAAC,IAAI,EAAS,CAAC;gBACtC,MAAM,IAAI,GAAG,KAAK,CAAC,2BAA2B,EAAE,KAAK,CAAC;gBACtD,IAAI,IAAI,IAAI,CAAC,IAAI,CAAC,oBAAoB,EAAE,CAAC;oBACvC,IAAI,CAAC,oBAAoB,GAAG,IAAI,CAAC;gBACnC,CAAC;gBACD,MAAM,OAAO,GAAG,IAAI,CAAC,oBAAoB,IAAI,IAAI,IAAI,CAAC,CAAC;gBACvD,MAAM,IAAI,GAAG,KAAK,CAAC,UAAU,CAAC;gBAC9B,qEAAqE;gBACrE,MAAM,YAAY,GAAG,IAAI;oBACvB,CAAC,CAAC,IAAI,CAAC,iBAAiB,GAAG,CAAC,GAAG,IAAI,CAAC,mBAAmB,GAAG,IAAI,CAAC,QAAQ,GAAG,CAAC,GAAG,OAAO;oBACrF,CAAC,CAAC,CAAC,CAAC;gBACN,MAAM,UAAU,GA
AG,KAAK,CAAC,MAAM,EAAE,YAAY,IAAI,CAAC,CAAC;gBACnD,IAAI,UAAU,IAAI,YAAY,EAAE,CAAC;oBAC/B,IAAI,CAAC,eAAe,GAAG;wBACrB,UAAU;wBACV,YAAY;wBACZ,UAAU,EAAE,UAAU,GAAG,YAAY;qBACtC,CAAC;gBACJ,CAAC;YACH,CAAC;QACH,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,MAAM,CAAC,IAAI,CAAC,0CAA0C,EAAE,GAAG,CAAC,CAAC;QAC/D,CAAC;IACH,CAAC;IAED,KAAK,CAAC,UAAU;QACd,IAAI,IAAI,CAAC,UAAU,EAAE,CAAC;YACpB,MAAM,IAAI,CAAC,UAAU,CAAC,IAAI,EAAE,CAAC;QAC/B,CAAC;IACH,CAAC;IAED,KAAK,CAAC,QAAQ,CAAC,SAAiB,EAAE,IAAkB;QAClD,MAAM,IAAI,CAAC,UAAU,EAAE,CAAC;QACxB,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,EAAE,IAAI,CAAC,CAAC;IACvC,CAAC;IAED,KAAK,CAAC,iBAAiB,CAAC,SAAiB,EAAE,IAAkB;QAC3D,IAAI,IAAI,CAAC,UAAU,EAAE,OAAO;YAAE,OAAO;QACrC,MAAM,CAAC,IAAI,CAAC,8CAA8C,SAAS,EAAE,CAAC,CAAC;QACvE,MAAM,EAAE,QAAQ,EAAE,GAAG,MAAM,IAAI,CAAC,gBAAgB,CAAC,SAAS,CAAC,CAAC;QAC5D,MAAM,IAAI,CAAC,QAAQ,CAAC,QAAQ,EAAE,IAAI,CAAC,CAAC;IACtC,CAAC;IAED,aAAa;QACX,MAAM,OAAO,GAAG,IAAI,CAAC,UAAU,EAAE,OAAO,IAAI,KAAK,CAAC;QAClD,OAAO;YACL,OAAO;YACP,WAAW,EAAE,OAAO,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,UAAU,EAAE,SAAS,IAAI,IAAI,CAAC,CAAC,CAAC,CAAC,IAAI;YAClE,IAAI,EAAE,IAAI,CAAC,UAAU,EAAE,IAAI,IAAI,IAAI;YACnC,WAAW,EAAE,IAAI,CAAC,oBAAoB;YACtC,cAAc,EAAE,IAAI,CAAC,eAAe;YACpC,cAAc,EAAE,IAAI,CAAC,eAAe;SACrC,CAAC;IACJ,CAAC;IAED,cAAc;QACZ,OAAO,IAAI,CAAC,UAAU,EAAE,KAAK,CAAC,CAAC,CAAC,IAAI,CAAC,UAAU,CAAC,UAAU,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC;IACtE,CAAC;IAED,+EAA+E;IAE/E,KAAK,CAAC,aAAa,CAAC,SAAiB;QACnC,IAAI,IAAI,CAAC,eAAe,EAAE,OAAO,IAAI,IAAI,CAAC,eAAe,CAAC,SAAS,KAAK,SAAS;YAAE,OAAO;QAC1F,IAAI,CAAC,IAAI,CAAC,eAAe;YAAE,IAAI,CAAC,eAAe,GAAG,IAAI,gBAAgB,CAAC,IAAI,CAAC,QAAQ,EAAE,WAAW,CAAC,CAAC;QAEnG,MAAM,IAAI,CAAC,eAAe,CAAC,KAAK,CAAC,EAAE,SAAS,EAAE,CAAC,CAAC;QAChD,MAAM,CAAC,IAAI,CAAC,mDAAmD,IAAI,CAAC,eAAe,CAAC,IAAI,EAAE,CAAC,CAAC;IAC9F,CAAC;IAED,KAAK,CAAC,eAAe;QACnB,IAAI,IAAI,CAAC,eAAe,EAAE,CAAC;YACzB,MAAM,IAAI,CAAC,eAAe,CAAC,IAAI,EAAE,CAAC;QACpC,CAAC;IACH,CAAC;IAED,KAAK,CAAC,sBAAsB,CAAC,SAAiB;QAC5C,IAAI,IAAI,CAAC,eAAe,EAAE,OAAO;YAAE,OAAO;QAC1C,MAAM,CAAC,IAAI,CAAC,mDAAmD,SAAS,EAAE,CAAC,CAAC;QAC5E,MAAM,EAAE,QAAQ,
EAAE,GAAG,MAAM,IAAI,CAAC,gBAAgB,CAAC,SAAS,CAAC,CAAC;QAC5D,MAAM,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,CAAC;IACrC,CAAC;IAED,kBAAkB;QAChB,MAAM,OAAO,GAAG,IAAI,CAAC,eAAe,EAAE,OAAO,IAAI,KAAK,CAAC;QACvD,OAAO;YACL,OAAO;YACP,WAAW,EAAE,OAAO,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,eAAe,EAAE,SAAS,IAAI,IAAI,CAAC,CAAC,CAAC,CAAC,IAAI;YACvE,IAAI,EAAE,IAAI,CAAC,eAAe,EAAE,IAAI,IAAI,IAAI;YACxC,WAAW,EAAE,IAAI;YACjB,cAAc,EAAE,IAAI;SACrB,CAAC;IACJ,CAAC;IAED,mBAAmB;QACjB,OAAO,IAAI,CAAC,eAAe,EAAE,KAAK,CAAC,CAAC,CAAC,IAAI,CAAC,eAAe,CAAC,UAAU,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC;IAChF,CAAC;IAED,+EAA+E;IAE/E,SAAS;QACP,OAAO;YACL,UAAU,EAAE,IAAI,CAAC,UAAU;YAC3B,SAAS,EAAE,IAAI,CAAC,WAAW,EAAE;YAC7B,IAAI,EAAE,IAAI,CAAC,aAAa,EAAE;YAC1B,SAAS,EAAE,IAAI,CAAC,kBAAkB,EAAE;SACrC,CAAC;IACJ,CAAC;IAED,WAAW;QACT,sBAAsB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IACxC,CAAC;IAED,8EAA8E;IAE9E,gBAAgB;QACd,OAAO,mBAAmB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IAC5C,CAAC;IAED,eAAe;QACb,MAAM,OAAO,GAAG,mBAAmB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QACnD,IAAI,CAAC,OAAO;YAAE,OAAO,IAAI,CAAC;QAC1B,OAAO,iBAAiB,EAAE,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,CAAC,SAAS,CAAC;IACpD,CAAC;IAED,KAAK,CAAC,cAAc;QAClB,OAAO,iBAAiB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IAC1C,CAAC;IAED,KAAK,CAAC,YAAY;QAChB,OAAO,eAAe,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;IACxC,CAAC;IAED,+EAA+E;IAEvE,KAAK,CAAC,gBAAgB,CAAC,SAAiB;QAC9C,MAAM,OAAO,GAAG,IAAI,YAAY,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QAChD,MAAM,MAAM,GAAG,MAAM,OAAO,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;QACtD,IAAI,CAAC,MAAM;YAAE,MAAM,IAAI,KAAK,CAAC,gBAAgB,SAAS,iCAAiC,CAAC,CAAC;QACzF,OAAO,MAAM,CAAC;IAChB,CAAC;CACF"}
|
|
@@ -0,0 +1,20 @@
|
|
|
1
|
+
/**
 * Model architecture info read from a GGUF file's metadata header
 * (the value produced by readGGUFModelInfo).
 */
export interface GGUFModelInfo {
|
|
2
|
+
// NOTE(review): presumably the model's trained context length — confirm against gguf-reader.ts.
contextLength: number;
|
|
3
|
+
// NOTE(review): presumably the layer count (n_layers in the KV-cache formula) — confirm.
blockCount: number;
|
|
4
|
+
// NOTE(review): presumably the embedding/hidden dimension — confirm.
embeddingLength: number;
|
|
5
|
+
// NOTE(review): presumably the number of attention heads — confirm.
headCount: number;
|
|
6
|
+
// NOTE(review): presumably the number of key/value heads (n_kv_heads in the KV-cache formula) — confirm.
headCountKv: number;
|
|
7
|
+
// Size of the model file in bytes; LlamaCppEngine.loadChat reports it as modelBytes.
fileSizeBytes: number;
|
|
8
|
+
}
|
|
9
|
+
/**
|
|
10
|
+
* Reads model architecture info from a GGUF file's metadata header.
|
|
11
|
+
* Only reads the first 1MB — no model loading required.
*
* @param modelPath Path of the GGUF model file to inspect.
* @returns The parsed model info, or `null` when none could be produced
*   (NOTE(review): the exact failure conditions are in gguf-reader.ts, not visible here).
|
|
12
|
+
*/
|
|
13
|
+
export declare function readGGUFModelInfo(modelPath: string): Promise<GGUFModelInfo | null>;
|
|
14
|
+
/**
|
|
15
|
+
* Estimates KV cache bytes per token for a model.
|
|
16
|
+
* KV cache = 2 (K+V) * n_layers * n_kv_heads * head_dim * 2 bytes (f16)
*
* @param info Model info as returned by readGGUFModelInfo.
* @returns Estimated bytes of KV cache needed per context token; callers
*   multiply it by the context size to get the total KV cache size.
|
|
17
|
+
*/
|
|
18
|
+
export declare function kvCacheBytesPerToken(info: GGUFModelInfo): number;
|
|
19
|
+
/**
 * Chooses a context size for the model described by `info`.
 * LlamaCppEngine.loadChat calls it when the caller supplies no context size.
 * NOTE(review): the selection policy is implemented in gguf-reader.ts and is not visible here.
 *
 * @param info Model info as returned by readGGUFModelInfo.
 * @returns The context size to start the server with.
 */
export declare function calculateOptimalContextSize(info: GGUFModelInfo): number;
|
|
20
|
+
//# sourceMappingURL=gguf-reader.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"gguf-reader.d.ts","sourceRoot":"","sources":["../../../lib/local-llm/gguf-reader.ts"],"names":[],"mappings":"AASA,MAAM,WAAW,aAAa;IAC5B,aAAa,EAAE,MAAM,CAAC;IACtB,UAAU,EAAE,MAAM,CAAC;IACnB,eAAe,EAAE,MAAM,CAAC;IACxB,SAAS,EAAE,MAAM,CAAC;IAClB,WAAW,EAAE,MAAM,CAAC;IACpB,aAAa,EAAE,MAAM,CAAC;CACvB;AAED;;;GAGG;AACH,wBAAsB,iBAAiB,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,aAAa,GAAG,IAAI,CAAC,CAkExF;AAED;;;GAGG;AACH,wBAAgB,oBAAoB,CAAC,IAAI,EAAE,aAAa,GAAG,MAAM,CAGhE;AA2BD,wBAAgB,2BAA2B,CAAC,IAAI,EAAE,aAAa,GAAG,MAAM,CAuBvE"}
|