agent-orcha 0.0.5 → 0.0.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +250 -1275
- package/dist/lib/agents/agent-executor.d.ts +4 -2
- package/dist/lib/agents/agent-executor.d.ts.map +1 -1
- package/dist/lib/agents/agent-executor.js +85 -53
- package/dist/lib/agents/agent-executor.js.map +1 -1
- package/dist/lib/agents/agent-loader.d.ts +3 -0
- package/dist/lib/agents/agent-loader.d.ts.map +1 -1
- package/dist/lib/agents/agent-loader.js +10 -1
- package/dist/lib/agents/agent-loader.js.map +1 -1
- package/dist/lib/agents/react-loop.d.ts.map +1 -1
- package/dist/lib/agents/react-loop.js +207 -142
- package/dist/lib/agents/react-loop.js.map +1 -1
- package/dist/lib/agents/types.d.ts +181 -18
- package/dist/lib/agents/types.d.ts.map +1 -1
- package/dist/lib/agents/types.js +18 -2
- package/dist/lib/agents/types.js.map +1 -1
- package/dist/lib/functions/function-loader.d.ts +2 -0
- package/dist/lib/functions/function-loader.d.ts.map +1 -1
- package/dist/lib/functions/function-loader.js +10 -0
- package/dist/lib/functions/function-loader.js.map +1 -1
- package/dist/lib/functions/simple-function-wrapper.js +3 -3
- package/dist/lib/functions/simple-function-wrapper.js.map +1 -1
- package/dist/lib/integrations/email.d.ts +38 -0
- package/dist/lib/integrations/email.d.ts.map +1 -0
- package/dist/lib/integrations/email.js +249 -0
- package/dist/lib/integrations/email.js.map +1 -0
- package/dist/lib/integrations/integration-manager.d.ts +5 -0
- package/dist/lib/integrations/integration-manager.d.ts.map +1 -1
- package/dist/lib/integrations/integration-manager.js +53 -3
- package/dist/lib/integrations/integration-manager.js.map +1 -1
- package/dist/lib/integrations/types.d.ts +187 -4
- package/dist/lib/integrations/types.d.ts.map +1 -1
- package/dist/lib/integrations/types.js +24 -1
- package/dist/lib/integrations/types.js.map +1 -1
- package/dist/lib/knowledge/knowledge-store.d.ts +7 -1
- package/dist/lib/knowledge/knowledge-store.d.ts.map +1 -1
- package/dist/lib/knowledge/knowledge-store.js +96 -8
- package/dist/lib/knowledge/knowledge-store.js.map +1 -1
- package/dist/lib/knowledge/loaders/file-loaders.d.ts +8 -3
- package/dist/lib/knowledge/loaders/file-loaders.d.ts.map +1 -1
- package/dist/lib/knowledge/loaders/file-loaders.js +96 -75
- package/dist/lib/knowledge/loaders/file-loaders.js.map +1 -1
- package/dist/lib/knowledge/loaders/web-loader.d.ts +12 -3
- package/dist/lib/knowledge/loaders/web-loader.d.ts.map +1 -1
- package/dist/lib/knowledge/loaders/web-loader.js +56 -22
- package/dist/lib/knowledge/loaders/web-loader.js.map +1 -1
- package/dist/lib/knowledge/sqlite-store.d.ts.map +1 -1
- package/dist/lib/knowledge/sqlite-store.js +19 -10
- package/dist/lib/knowledge/sqlite-store.js.map +1 -1
- package/dist/lib/knowledge/types.d.ts +69 -33
- package/dist/lib/knowledge/types.d.ts.map +1 -1
- package/dist/lib/knowledge/types.js +18 -3
- package/dist/lib/knowledge/types.js.map +1 -1
- package/dist/lib/llm/index.d.ts +1 -1
- package/dist/lib/llm/index.d.ts.map +1 -1
- package/dist/lib/llm/index.js +1 -1
- package/dist/lib/llm/index.js.map +1 -1
- package/dist/lib/llm/llm-call-logger.d.ts +3 -1
- package/dist/lib/llm/llm-call-logger.d.ts.map +1 -1
- package/dist/lib/llm/llm-call-logger.js +31 -26
- package/dist/lib/llm/llm-call-logger.js.map +1 -1
- package/dist/lib/llm/llm-config.d.ts +59 -8
- package/dist/lib/llm/llm-config.d.ts.map +1 -1
- package/dist/lib/llm/llm-config.js +163 -17
- package/dist/lib/llm/llm-config.js.map +1 -1
- package/dist/lib/llm/llm-factory.d.ts +1 -2
- package/dist/lib/llm/llm-factory.d.ts.map +1 -1
- package/dist/lib/llm/llm-factory.js +44 -8
- package/dist/lib/llm/llm-factory.js.map +1 -1
- package/dist/lib/llm/providers/anthropic-chat-model.d.ts +5 -1
- package/dist/lib/llm/providers/anthropic-chat-model.d.ts.map +1 -1
- package/dist/lib/llm/providers/anthropic-chat-model.js +118 -42
- package/dist/lib/llm/providers/anthropic-chat-model.js.map +1 -1
- package/dist/lib/llm/providers/gemini-chat-model.d.ts +3 -2
- package/dist/lib/llm/providers/gemini-chat-model.d.ts.map +1 -1
- package/dist/lib/llm/providers/gemini-chat-model.js +83 -24
- package/dist/lib/llm/providers/gemini-chat-model.js.map +1 -1
- package/dist/lib/llm/providers/openai-chat-model.d.ts +20 -1
- package/dist/lib/llm/providers/openai-chat-model.d.ts.map +1 -1
- package/dist/lib/llm/providers/openai-chat-model.js +265 -32
- package/dist/lib/llm/providers/openai-chat-model.js.map +1 -1
- package/dist/lib/llm/providers/openai-embeddings.d.ts.map +1 -1
- package/dist/lib/llm/providers/openai-embeddings.js +41 -10
- package/dist/lib/llm/providers/openai-embeddings.js.map +1 -1
- package/dist/lib/local-llm/binary-manager.d.ts +66 -0
- package/dist/lib/local-llm/binary-manager.d.ts.map +1 -0
- package/dist/lib/local-llm/binary-manager.js +441 -0
- package/dist/lib/local-llm/binary-manager.js.map +1 -0
- package/dist/lib/local-llm/engine-interface.d.ts +47 -0
- package/dist/lib/local-llm/engine-interface.d.ts.map +1 -0
- package/dist/lib/local-llm/engine-interface.js +2 -0
- package/dist/lib/local-llm/engine-interface.js.map +1 -0
- package/dist/lib/local-llm/engine-registry.d.ts +20 -0
- package/dist/lib/local-llm/engine-registry.d.ts.map +1 -0
- package/dist/lib/local-llm/engine-registry.js +56 -0
- package/dist/lib/local-llm/engine-registry.js.map +1 -0
- package/dist/lib/local-llm/engines/llama-cpp-engine.d.ts +31 -0
- package/dist/lib/local-llm/engines/llama-cpp-engine.d.ts.map +1 -0
- package/dist/lib/local-llm/engines/llama-cpp-engine.js +164 -0
- package/dist/lib/local-llm/engines/llama-cpp-engine.js.map +1 -0
- package/dist/lib/local-llm/engines/mlx-serve-engine.d.ts +31 -0
- package/dist/lib/local-llm/engines/mlx-serve-engine.d.ts.map +1 -0
- package/dist/lib/local-llm/engines/mlx-serve-engine.js +161 -0
- package/dist/lib/local-llm/engines/mlx-serve-engine.js.map +1 -0
- package/dist/lib/local-llm/gguf-reader.d.ts +20 -0
- package/dist/lib/local-llm/gguf-reader.d.ts.map +1 -0
- package/dist/lib/local-llm/gguf-reader.js +190 -0
- package/dist/lib/local-llm/gguf-reader.js.map +1 -0
- package/dist/lib/local-llm/index.d.ts +9 -0
- package/dist/lib/local-llm/index.d.ts.map +1 -0
- package/dist/lib/local-llm/index.js +6 -0
- package/dist/lib/local-llm/index.js.map +1 -0
- package/dist/lib/local-llm/llama-server-process.d.ts +42 -0
- package/dist/lib/local-llm/llama-server-process.d.ts.map +1 -0
- package/dist/lib/local-llm/llama-server-process.js +237 -0
- package/dist/lib/local-llm/llama-server-process.js.map +1 -0
- package/dist/lib/local-llm/mlx-binary-manager.d.ts +33 -0
- package/dist/lib/local-llm/mlx-binary-manager.d.ts.map +1 -0
- package/dist/lib/local-llm/mlx-binary-manager.js +211 -0
- package/dist/lib/local-llm/mlx-binary-manager.js.map +1 -0
- package/dist/lib/local-llm/mlx-server-process.d.ts +26 -0
- package/dist/lib/local-llm/mlx-server-process.d.ts.map +1 -0
- package/dist/lib/local-llm/mlx-server-process.js +210 -0
- package/dist/lib/local-llm/mlx-server-process.js.map +1 -0
- package/dist/lib/local-llm/model-manager.d.ts +33 -0
- package/dist/lib/local-llm/model-manager.d.ts.map +1 -0
- package/dist/lib/local-llm/model-manager.js +591 -0
- package/dist/lib/local-llm/model-manager.js.map +1 -0
- package/dist/lib/local-llm/types.d.ts +51 -0
- package/dist/lib/local-llm/types.d.ts.map +1 -0
- package/dist/lib/local-llm/types.js +2 -0
- package/dist/lib/local-llm/types.js.map +1 -0
- package/dist/lib/logger.d.ts +2 -0
- package/dist/lib/logger.d.ts.map +1 -1
- package/dist/lib/logger.js +68 -6
- package/dist/lib/logger.js.map +1 -1
- package/dist/lib/mcp/mcp-client.d.ts.map +1 -1
- package/dist/lib/mcp/mcp-client.js +5 -3
- package/dist/lib/mcp/mcp-client.js.map +1 -1
- package/dist/lib/mcp/types.d.ts +0 -9
- package/dist/lib/mcp/types.d.ts.map +1 -1
- package/dist/lib/mcp/types.js +1 -2
- package/dist/lib/mcp/types.js.map +1 -1
- package/dist/lib/memory/memory-manager.d.ts +1 -0
- package/dist/lib/memory/memory-manager.d.ts.map +1 -1
- package/dist/lib/memory/memory-manager.js +9 -0
- package/dist/lib/memory/memory-manager.js.map +1 -1
- package/dist/lib/orchestrator.d.ts +11 -8
- package/dist/lib/orchestrator.d.ts.map +1 -1
- package/dist/lib/orchestrator.js +246 -5
- package/dist/lib/orchestrator.js.map +1 -1
- package/dist/lib/sandbox/cdp-client.d.ts +15 -0
- package/dist/lib/sandbox/cdp-client.d.ts.map +1 -0
- package/dist/lib/sandbox/cdp-client.js +139 -0
- package/dist/lib/sandbox/cdp-client.js.map +1 -0
- package/dist/lib/sandbox/html-to-markdown.d.ts +9 -1
- package/dist/lib/sandbox/html-to-markdown.d.ts.map +1 -1
- package/dist/lib/sandbox/html-to-markdown.js +67 -10
- package/dist/lib/sandbox/html-to-markdown.js.map +1 -1
- package/dist/lib/sandbox/index.d.ts +6 -0
- package/dist/lib/sandbox/index.d.ts.map +1 -1
- package/dist/lib/sandbox/index.js +5 -0
- package/dist/lib/sandbox/index.js.map +1 -1
- package/dist/lib/sandbox/page-readiness.d.ts +37 -0
- package/dist/lib/sandbox/page-readiness.d.ts.map +1 -0
- package/dist/lib/sandbox/page-readiness.js +268 -0
- package/dist/lib/sandbox/page-readiness.js.map +1 -0
- package/dist/lib/sandbox/sandbox-browser.d.ts +4 -0
- package/dist/lib/sandbox/sandbox-browser.d.ts.map +1 -0
- package/dist/lib/sandbox/sandbox-browser.js +316 -0
- package/dist/lib/sandbox/sandbox-browser.js.map +1 -0
- package/dist/lib/sandbox/sandbox-container.d.ts +39 -0
- package/dist/lib/sandbox/sandbox-container.d.ts.map +1 -0
- package/dist/lib/sandbox/sandbox-container.js +176 -0
- package/dist/lib/sandbox/sandbox-container.js.map +1 -0
- package/dist/lib/sandbox/sandbox-file.d.ts +4 -0
- package/dist/lib/sandbox/sandbox-file.d.ts.map +1 -0
- package/dist/lib/sandbox/sandbox-file.js +169 -0
- package/dist/lib/sandbox/sandbox-file.js.map +1 -0
- package/dist/lib/sandbox/sandbox-shell.d.ts +5 -0
- package/dist/lib/sandbox/sandbox-shell.d.ts.map +1 -0
- package/dist/lib/sandbox/sandbox-shell.js +111 -0
- package/dist/lib/sandbox/sandbox-shell.js.map +1 -0
- package/dist/lib/sandbox/sandbox-web.d.ts.map +1 -1
- package/dist/lib/sandbox/sandbox-web.js +64 -24
- package/dist/lib/sandbox/sandbox-web.js.map +1 -1
- package/dist/lib/sandbox/types.d.ts +9 -0
- package/dist/lib/sandbox/types.d.ts.map +1 -1
- package/dist/lib/sandbox/types.js +1 -0
- package/dist/lib/sandbox/types.js.map +1 -1
- package/dist/lib/sandbox/vision-browser.d.ts +4 -0
- package/dist/lib/sandbox/vision-browser.d.ts.map +1 -0
- package/dist/lib/sandbox/vision-browser.js +298 -0
- package/dist/lib/sandbox/vision-browser.js.map +1 -0
- package/dist/lib/sea/app-window.d.ts +7 -0
- package/dist/lib/sea/app-window.d.ts.map +1 -0
- package/dist/lib/sea/app-window.js +95 -0
- package/dist/lib/sea/app-window.js.map +1 -0
- package/dist/lib/sea/bootstrap.d.ts +18 -0
- package/dist/lib/sea/bootstrap.d.ts.map +1 -0
- package/dist/lib/sea/bootstrap.js +103 -0
- package/dist/lib/sea/bootstrap.js.map +1 -0
- package/dist/lib/sea/sqlite-vec-shim.d.ts +3 -0
- package/dist/lib/sea/sqlite-vec-shim.d.ts.map +1 -0
- package/dist/lib/sea/sqlite-vec-shim.js +10 -0
- package/dist/lib/sea/sqlite-vec-shim.js.map +1 -0
- package/dist/lib/skills/skill-loader.d.ts +2 -0
- package/dist/lib/skills/skill-loader.d.ts.map +1 -1
- package/dist/lib/skills/skill-loader.js +12 -1
- package/dist/lib/skills/skill-loader.js.map +1 -1
- package/dist/lib/tasks/task-manager.d.ts +3 -1
- package/dist/lib/tasks/task-manager.d.ts.map +1 -1
- package/dist/lib/tasks/task-manager.js +11 -0
- package/dist/lib/tasks/task-manager.js.map +1 -1
- package/dist/lib/tasks/task-store.d.ts +1 -1
- package/dist/lib/tasks/task-store.d.ts.map +1 -1
- package/dist/lib/tasks/task-store.js.map +1 -1
- package/dist/lib/tasks/types.d.ts +18 -0
- package/dist/lib/tasks/types.d.ts.map +1 -1
- package/dist/lib/tools/built-in/integration-tools.d.ts +4 -0
- package/dist/lib/tools/built-in/integration-tools.d.ts.map +1 -0
- package/dist/lib/tools/built-in/integration-tools.js +47 -0
- package/dist/lib/tools/built-in/integration-tools.js.map +1 -0
- package/dist/lib/tools/built-in/knowledge-entity-lookup.tool.d.ts +1 -2
- package/dist/lib/tools/built-in/knowledge-entity-lookup.tool.d.ts.map +1 -1
- package/dist/lib/tools/built-in/knowledge-entity-lookup.tool.js +17 -17
- package/dist/lib/tools/built-in/knowledge-entity-lookup.tool.js.map +1 -1
- package/dist/lib/tools/built-in/knowledge-graph-schema.tool.d.ts.map +1 -1
- package/dist/lib/tools/built-in/knowledge-graph-schema.tool.js +2 -4
- package/dist/lib/tools/built-in/knowledge-graph-schema.tool.js.map +1 -1
- package/dist/lib/tools/built-in/knowledge-search.tool.js +4 -4
- package/dist/lib/tools/built-in/knowledge-search.tool.js.map +1 -1
- package/dist/lib/tools/built-in/knowledge-sql.tool.d.ts.map +1 -1
- package/dist/lib/tools/built-in/knowledge-sql.tool.js +74 -40
- package/dist/lib/tools/built-in/knowledge-sql.tool.js.map +1 -1
- package/dist/lib/tools/built-in/knowledge-tools-factory.js +2 -2
- package/dist/lib/tools/built-in/knowledge-tools-factory.js.map +1 -1
- package/dist/lib/tools/built-in/knowledge-traverse.tool.d.ts +1 -2
- package/dist/lib/tools/built-in/knowledge-traverse.tool.d.ts.map +1 -1
- package/dist/lib/tools/built-in/knowledge-traverse.tool.js +5 -11
- package/dist/lib/tools/built-in/knowledge-traverse.tool.js.map +1 -1
- package/dist/lib/tools/built-in/query-validators.d.ts.map +1 -1
- package/dist/lib/tools/built-in/query-validators.js +4 -0
- package/dist/lib/tools/built-in/query-validators.js.map +1 -1
- package/dist/lib/tools/workspace/workspace-tools.d.ts +1 -0
- package/dist/lib/tools/workspace/workspace-tools.d.ts.map +1 -1
- package/dist/lib/tools/workspace/workspace-tools.js +44 -4
- package/dist/lib/tools/workspace/workspace-tools.js.map +1 -1
- package/dist/lib/triggers/cron-trigger.d.ts +1 -1
- package/dist/lib/triggers/cron-trigger.d.ts.map +1 -1
- package/dist/lib/triggers/cron-trigger.js.map +1 -1
- package/dist/lib/triggers/trigger-manager.d.ts +1 -0
- package/dist/lib/triggers/trigger-manager.d.ts.map +1 -1
- package/dist/lib/triggers/trigger-manager.js +26 -0
- package/dist/lib/triggers/trigger-manager.js.map +1 -1
- package/dist/lib/triggers/webhook-trigger.d.ts +1 -1
- package/dist/lib/triggers/webhook-trigger.d.ts.map +1 -1
- package/dist/lib/triggers/webhook-trigger.js.map +1 -1
- package/dist/lib/types/llm-types.d.ts +22 -4
- package/dist/lib/types/llm-types.d.ts.map +1 -1
- package/dist/lib/types/llm-types.js +50 -0
- package/dist/lib/types/llm-types.js.map +1 -1
- package/dist/lib/types/tool-factory.d.ts +2 -2
- package/dist/lib/types/tool-factory.d.ts.map +1 -1
- package/dist/lib/types/tool-factory.js +9 -2
- package/dist/lib/types/tool-factory.js.map +1 -1
- package/dist/lib/utils/document-extract.d.ts +10 -0
- package/dist/lib/utils/document-extract.d.ts.map +1 -0
- package/dist/lib/utils/document-extract.js +149 -0
- package/dist/lib/utils/document-extract.js.map +1 -0
- package/dist/lib/utils/env-substitution.d.ts +6 -0
- package/dist/lib/utils/env-substitution.d.ts.map +1 -0
- package/dist/lib/utils/env-substitution.js +15 -0
- package/dist/lib/utils/env-substitution.js.map +1 -0
- package/dist/lib/workflows/react-workflow-executor.d.ts.map +1 -1
- package/dist/lib/workflows/react-workflow-executor.js +23 -17
- package/dist/lib/workflows/react-workflow-executor.js.map +1 -1
- package/dist/lib/workflows/types.d.ts +81 -55
- package/dist/lib/workflows/types.d.ts.map +1 -1
- package/dist/lib/workflows/types.js +10 -0
- package/dist/lib/workflows/types.js.map +1 -1
- package/dist/lib/workflows/workflow-loader.d.ts +3 -0
- package/dist/lib/workflows/workflow-loader.d.ts.map +1 -1
- package/dist/lib/workflows/workflow-loader.js +10 -1
- package/dist/lib/workflows/workflow-loader.js.map +1 -1
- package/dist/public/assets/logo.png +0 -0
- package/dist/public/chat.html +39 -0
- package/dist/public/index.html +6 -176
- package/dist/public/src/components/AgentComposer.js +807 -0
- package/dist/public/src/components/AgentsView.js +1812 -508
- package/dist/public/src/components/AppRoot.js +125 -38
- package/dist/public/src/components/GraphView.js +382 -300
- package/dist/public/src/components/IdeView.js +277 -86
- package/dist/public/src/components/KnowledgeView.js +94 -130
- package/dist/public/src/components/LlmView.js +15 -19
- package/dist/public/src/components/LocalLlmView.js +2440 -0
- package/dist/public/src/components/LogViewer.js +155 -0
- package/dist/public/src/components/McpView.js +41 -49
- package/dist/public/src/components/MonitorView.js +174 -83
- package/dist/public/src/components/NavBar.js +16 -26
- package/dist/public/src/components/StandaloneChat.js +875 -0
- package/dist/public/src/services/ApiService.js +203 -4
- package/dist/public/src/services/SessionStore.js +86 -0
- package/dist/public/src/services/StreamManager.js +183 -0
- package/dist/public/src/store.js +1 -3
- package/dist/public/src/utils/card.js +21 -0
- package/dist/public/src/utils/markdown.js +7 -0
- package/dist/public/styles.css +2777 -0
- package/dist/src/cli/commands/init.d.ts.map +1 -1
- package/dist/src/cli/commands/init.js +7 -1
- package/dist/src/cli/commands/init.js.map +1 -1
- package/dist/src/cli/commands/start.d.ts.map +1 -1
- package/dist/src/cli/commands/start.js +28 -5
- package/dist/src/cli/commands/start.js.map +1 -1
- package/dist/src/cli/index.js +19 -5
- package/dist/src/cli/index.js.map +1 -1
- package/dist/src/index.js +7 -1
- package/dist/src/index.js.map +1 -1
- package/dist/src/middleware/auth.d.ts.map +1 -1
- package/dist/src/middleware/auth.js +28 -6
- package/dist/src/middleware/auth.js.map +1 -1
- package/dist/src/middleware/rate-limit.d.ts +8 -0
- package/dist/src/middleware/rate-limit.d.ts.map +1 -0
- package/dist/src/middleware/rate-limit.js +21 -0
- package/dist/src/middleware/rate-limit.js.map +1 -0
- package/dist/src/routes/agents.route.d.ts.map +1 -1
- package/dist/src/routes/agents.route.js +138 -10
- package/dist/src/routes/agents.route.js.map +1 -1
- package/dist/src/routes/chat.route.d.ts +3 -0
- package/dist/src/routes/chat.route.d.ts.map +1 -0
- package/dist/src/routes/chat.route.js +156 -0
- package/dist/src/routes/chat.route.js.map +1 -0
- package/dist/src/routes/files.route.d.ts.map +1 -1
- package/dist/src/routes/files.route.js +37 -2
- package/dist/src/routes/files.route.js.map +1 -1
- package/dist/src/routes/llm.route.d.ts.map +1 -1
- package/dist/src/routes/llm.route.js +263 -8
- package/dist/src/routes/llm.route.js.map +1 -1
- package/dist/src/routes/local-llm.route.d.ts +3 -0
- package/dist/src/routes/local-llm.route.d.ts.map +1 -0
- package/dist/src/routes/local-llm.route.js +688 -0
- package/dist/src/routes/local-llm.route.js.map +1 -0
- package/dist/src/routes/logs.route.d.ts +3 -0
- package/dist/src/routes/logs.route.d.ts.map +1 -0
- package/dist/src/routes/logs.route.js +24 -0
- package/dist/src/routes/logs.route.js.map +1 -0
- package/dist/src/routes/tasks.route.d.ts.map +1 -1
- package/dist/src/routes/tasks.route.js +15 -1
- package/dist/src/routes/tasks.route.js.map +1 -1
- package/dist/src/routes/vnc.route.d.ts +12 -0
- package/dist/src/routes/vnc.route.d.ts.map +1 -0
- package/dist/src/routes/vnc.route.js +74 -0
- package/dist/src/routes/vnc.route.js.map +1 -0
- package/dist/src/routes/workflows.route.d.ts.map +1 -1
- package/dist/src/routes/workflows.route.js +24 -0
- package/dist/src/routes/workflows.route.js.map +1 -1
- package/dist/src/server.d.ts.map +1 -1
- package/dist/src/server.js +29 -3
- package/dist/src/server.js.map +1 -1
- package/dist/templates/Demo.md +152 -0
- package/dist/templates/README.md +12 -3
- package/dist/templates/agents/actor.agent.yaml +34 -0
- package/dist/templates/agents/architect.agent.yaml +20 -13
- package/dist/templates/agents/chatbot.agent.yaml +23 -27
- package/dist/templates/agents/corporate.agent.yaml +64 -0
- package/dist/templates/agents/functions.agent.yaml +29 -0
- package/dist/templates/agents/investment-analyst.agent.yaml +79 -0
- package/dist/templates/agents/music-librarian.agent.yaml +46 -0
- package/dist/templates/agents/network-security.agent.yaml +81 -0
- package/dist/templates/agents/transport-security.agent.yaml +69 -0
- package/dist/templates/agents/web-engineer.agent.yaml +98 -0
- package/dist/templates/agents/web-pilot.agent.yaml +57 -0
- package/dist/templates/knowledge/music-store/LICENSE.md +11 -0
- package/dist/templates/knowledge/music-store/musicstore.sqlite +0 -0
- package/dist/templates/knowledge/music-store/tables.png +0 -0
- package/dist/templates/knowledge/music-store.knowledge.yaml +138 -0
- package/dist/templates/knowledge/org-chart/personnel.csv +21 -21
- package/dist/templates/knowledge/org-chart.knowledge.yaml +4 -0
- package/dist/templates/knowledge/patient-records.knowledge.yaml +20 -0
- package/dist/templates/knowledge/pdf-patients/PDF_Deid_Deidentification_0.pdf +0 -0
- package/dist/templates/knowledge/pdf-patients/PDF_Deid_Deidentification_1.pdf +0 -0
- package/dist/templates/knowledge/pdf-patients/PDF_Deid_Deidentification_10.pdf +0 -0
- package/dist/templates/knowledge/pdf-patients/PDF_Deid_Deidentification_11.pdf +0 -0
- package/dist/templates/knowledge/pet-store.knowledge.yaml +3 -0
- package/dist/templates/knowledge/security-incidents/incidents.json +55935 -0
- package/dist/templates/knowledge/security-incidents.knowledge.yaml +46 -0
- package/dist/templates/knowledge/{example.knowledge.yaml → transcripts.knowledge.yaml} +9 -5
- package/dist/templates/knowledge/transport-ot/systems.csv +117 -0
- package/dist/templates/knowledge/transport-ot.knowledge.yaml +55 -0
- package/dist/templates/knowledge/web-docs.knowledge.yaml +1 -1
- package/dist/templates/llm.json +62 -22
- package/dist/templates/mcp.json +7 -4
- package/dist/templates/skills/orcha-builder/SKILL.md +148 -215
- package/dist/templates/skills/pii-guard/SKILL.md +22 -0
- package/dist/templates/skills/sandbox/SKILL.md +25 -48
- package/dist/templates/skills/web-pilot/SKILL.md +51 -0
- package/dist/templates/workflows/example.workflow.yaml +27 -35
- package/dist/templates/workflows/react-example.workflow.yaml +14 -19
- package/dist/templates/workflows/team-chat.workflow.yaml +47 -0
- package/package.json +17 -4
- package/dist/public/src/components/SkillsView.js +0 -137
- package/dist/public/src/components/WorkflowsView.js +0 -416
- package/dist/templates/agents/knowledge-broker.agent.yaml +0 -39
- package/dist/templates/agents/sandbox.agent.yaml +0 -56
|
@@ -0,0 +1,190 @@
|
|
|
1
|
+
import * as fs from 'fs/promises';
|
|
2
|
+
import { readFileSync } from 'fs';
|
|
3
|
+
import * as os from 'os';
|
|
4
|
+
import { logger } from "../logger.js";
|
|
5
|
+
/** Magic number at offset 0 of a GGUF file: the ASCII bytes "GGUF" read as a little-endian uint32. */
const GGUF_MAGIC = 0x46554747;
/** Number of leading file bytes read when parsing metadata (1 MiB); intended to be large enough to hold the metadata keys of interest. */
const METADATA_BUFFER_SIZE = 1 << 20;
/** Memory (4 GiB) held back for the OS and other applications when budgeting RAM for a model. */
const OS_RESERVED_BYTES = 4 * 2 ** 30;
|
|
8
|
+
/**
 * Reads model architecture info from a GGUF file's metadata header.
 * Only the first METADATA_BUFFER_SIZE bytes of the file are read — no model loading required.
 *
 * The header layout parsed here is: uint32 magic, uint32 version, 8 bytes that are
 * skipped, uint64 key/value count at offset 16, then the key/value pairs from offset 24.
 * Each pair is a uint64 key length, the UTF-8 key, a uint32 value type and the value.
 *
 * @param modelPath Path to the GGUF file.
 * @returns An object with `fileSizeBytes` plus whichever of `contextLength`,
 *   `blockCount`, `embeddingLength`, `headCount` and `headCountKv` were found
 *   (a found key whose value is not a readable scalar is stored as 0). Returns
 *   `null` when the file is too short, is not GGUF version 2 or 3, has no
 *   non-zero context length in the bytes read, or cannot be read at all.
 */
export async function readGGUFModelInfo(modelPath) {
    // Metadata key suffix -> property name on the returned object.
    const wantedKeys = [
        ['.context_length', 'contextLength'],
        ['.block_count', 'blockCount'],
        ['.embedding_length', 'embeddingLength'],
        ['.attention.head_count_kv', 'headCountKv'],
        ['.attention.head_count', 'headCount'],
    ];
    let handle = null;
    try {
        handle = await fs.open(modelPath, 'r');
        const stat = await handle.stat();
        const buf = Buffer.alloc(METADATA_BUFFER_SIZE);
        const { bytesRead } = await handle.read(buf, 0, buf.length, 0);
        // The fixed-size part of the header occupies 24 bytes.
        if (bytesRead < 24)
            return null;
        if (buf.readUInt32LE(0) !== GGUF_MAGIC)
            return null;
        const version = buf.readUInt32LE(4);
        if (version < 2 || version > 3)
            return null;
        const kvCount = Number(buf.readBigUInt64LE(16));
        const info = { fileSizeBytes: stat.size };
        // Fields still to be found; the scan stops early once this is empty.
        const needed = new Set(wantedKeys.map(([, field]) => field));
        let pos = 24;
        for (let i = 0; i < kvCount && pos < bytesRead - 12 && needed.size > 0; i++) {
            // Key: uint64 length followed by that many UTF-8 bytes.
            if (pos + 8 > bytesRead)
                break;
            const keyLen = Number(buf.readBigUInt64LE(pos));
            pos += 8;
            if (pos + keyLen > bytesRead)
                break;
            const key = buf.toString('utf-8', pos, pos + keyLen);
            pos += keyLen;
            // Value type tag.
            if (pos + 4 > bytesRead)
                break;
            const vtype = buf.readUInt32LE(pos);
            pos += 4;
            // Offset just past the value, or -1 if the value cannot be skipped.
            const next = skipValue(buf, pos, vtype, bytesRead);
            const wanted = wantedKeys.find(([suffix]) => key.endsWith(suffix));
            if (wanted) {
                const field = wanted[1];
                // Only decode a value that lies entirely inside the bytes actually read;
                // otherwise zero padding (or an out-of-range read) would be taken as data.
                const complete = next >= 0 && next <= bytesRead;
                info[field] = (complete ? readScalar(buf, pos, vtype) : null) ?? 0;
                needed.delete(field);
            }
            if (next < 0)
                break;
            pos = next;
        }
        // A missing (or zero) context length makes the metadata unusable for callers.
        if (!info.contextLength)
            return null;
        const result = info;
        // Accept both '/' and '\' separators so the log shows just the file name on Windows too.
        logger.info(`[GGUFReader] ${modelPath.split(/[\\/]/).pop()}: ctx=${result.contextLength} layers=${result.blockCount} embd=${result.embeddingLength} heads=${result.headCount} kv_heads=${result.headCountKv} size=${(result.fileSizeBytes / 1024 / 1024 / 1024).toFixed(1)}GB`);
        return result;
    }
    catch (err) {
        logger.warn(`[GGUFReader] Failed to read GGUF metadata: ${err}`);
        return null;
    }
    finally {
        await handle?.close();
    }
}
|
|
82
|
+
/**
 * Estimates KV cache bytes per token for a model.
 * KV cache = 2 (K+V) * n_layers * n_kv_heads * head_dim * 2 bytes (f16),
 * where head_dim = embeddingLength / headCount.
 *
 * @param info Model info carrying `blockCount`, `embeddingLength`, `headCount`
 *   and optionally `headCountKv`.
 * @returns Estimated bytes of KV cache per token. The result is not a finite
 *   number when the required fields are missing or `headCount` is 0.
 */
export function kvCacheBytesPerToken(info) {
    const headDim = info.embeddingLength / info.headCount;
    // The KV head count is optional metadata; when it is absent every attention
    // head has its own K/V, so fall back to headCount. An explicit 0 is kept as is.
    const kvHeads = info.headCountKv ?? info.headCount;
    return 2 * info.blockCount * kvHeads * headDim * 2;
}
|
|
90
|
+
/**
|
|
91
|
+
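* Calculates optimal context size based on available system RAM (this comment documents calculateOptimalContextSize, which is defined after getEffectiveMemory below).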
|
|
92
|
+
* Accounts for model weights, KV cache, and OS overhead.
|
|
93
|
+
*/
|
|
94
|
+
/**
 * Returns effective total memory in bytes, respecting container cgroup limits.
 * os.totalmem() returns host RAM even inside Docker, so on Linux the cgroup
 * limit files are checked first (v2, then v1).
 *
 * @returns The cgroup memory limit when one is set, readable and valid,
 *   never more than os.totalmem(); otherwise os.totalmem().
 */
function getEffectiveMemory() {
    const hostRam = os.totalmem();
    if (process.platform !== 'linux')
        return hostRam;
    try {
        // cgroup v2: the file holds either a byte count or the literal "max" (no limit).
        const raw = readFileSync('/sys/fs/cgroup/memory.max', 'utf-8').trim();
        if (raw !== 'max') {
            const limit = Number(raw);
            // Ignore empty or non-numeric content instead of returning 0 or NaN.
            if (Number.isFinite(limit) && limit > 0)
                return Math.min(limit, hostRam);
        }
    }
    catch { /* not cgroup v2 */ }
    try {
        // cgroup v1: only a limit below host RAM counts as a real limit.
        const raw = readFileSync('/sys/fs/cgroup/memory/memory.limit_in_bytes', 'utf-8').trim();
        const limit = Number(raw);
        if (limit > 0 && limit < hostRam)
            return limit;
    }
    catch { /* not cgroup v1 */ }
    return hostRam;
}
|
|
119
|
+
/**
 * Calculates a context size (in tokens) for a model based on available memory.
 *
 * The budget is: effective memory minus OS_RESERVED_BYTES minus the model file
 * size; at most half of what remains is assigned to the KV cache. The result is
 * the smallest of that RAM-derived limit, the model's native context length and
 * a 32K cap, rounded down to a multiple of 1024 and never below 2048.
 *
 * @param info Model info as returned by readGGUFModelInfo.
 * @returns The context size in tokens; always a finite number >= 2048.
 */
export function calculateOptimalContextSize(info) {
    const MIN_CONTEXT = 2048;
    // Hard cap: 32K tokens is practical for local models, avoids memory pressure on small machines
    const MAX_CONTEXT_CAP = 32768;
    const totalRam = getEffectiveMemory();
    const availableForModel = totalRam - OS_RESERVED_BYTES;
    const memAfterWeights = availableForModel - info.fileSizeBytes;
    if (memAfterWeights <= 0) {
        logger.warn(`[GGUFReader] Model file (${(info.fileSizeBytes / 1024 / 1024 / 1024).toFixed(1)}GB) exceeds available memory, using minimum context`);
        return MIN_CONTEXT;
    }
    const bytesPerToken = kvCacheBytesPerToken(info);
    // Use at most 50% of available-after-weights for KV cache — leave headroom for runtime allocations
    const maxCtxByRam = Math.floor((memAfterWeights * 0.5) / bytesPerToken);
    const nativeCtx = info.contextLength;
    const optimal = Math.min(maxCtxByRam, nativeCtx, MAX_CONTEXT_CAP);
    // Incomplete metadata or an unusable memory reading turns the arithmetic above
    // into NaN, which Math.min/Math.max would pass straight through to the caller.
    if (Number.isNaN(optimal)) {
        logger.warn(`[GGUFReader] Could not estimate context size from model metadata and memory info, using minimum context`);
        return MIN_CONTEXT;
    }
    // Floor to nearest 1024 for cleanliness, minimum 2048
    const result = Math.max(MIN_CONTEXT, Math.floor(optimal / 1024) * 1024);
    logger.info(`[GGUFReader] RAM: ${(totalRam / 1024 / 1024 / 1024).toFixed(0)}GB total, ${(memAfterWeights / 1024 / 1024 / 1024).toFixed(1)}GB available for KV | KV/token: ${bytesPerToken} bytes | max by RAM: ${maxCtxByRam} | native: ${nativeCtx} | cap: ${MAX_CONTEXT_CAP} | optimal: ${result}`);
    return result;
}
|
|
139
|
+
/**
 * Decoders for the scalar value types handled by readScalar, keyed by the
 * numeric type tag. Tags 8 and 9 (skipped as string and array by skipValue)
 * and any unknown tag have no entry.
 */
const SCALAR_READERS = new Map([
    [0, (b, at) => b.readUInt8(at)],
    [1, (b, at) => b.readInt8(at)],
    [2, (b, at) => b.readUInt16LE(at)],
    [3, (b, at) => b.readInt16LE(at)],
    [4, (b, at) => b.readUInt32LE(at)],
    [5, (b, at) => b.readInt32LE(at)],
    [6, (b, at) => b.readFloatLE(at)],
    [7, (b, at) => b.readUInt8(at)],
    [10, (b, at) => Number(b.readBigUInt64LE(at))],
    [11, (b, at) => Number(b.readBigInt64LE(at))],
    [12, (b, at) => b.readDoubleLE(at)],
]);
/**
 * Decodes one little-endian scalar metadata value.
 *
 * @param buf Buffer holding the metadata bytes.
 * @param pos Offset of the value within `buf`.
 * @param vtype Numeric value type tag.
 * @returns The value as a JS number (64-bit integers are converted with
 *   Number()), or `null` when `vtype` is not a scalar type handled here.
 *   The underlying Buffer read throws if `pos` is out of range.
 */
function readScalar(buf, pos, vtype) {
    const decode = SCALAR_READERS.get(vtype);
    if (decode === undefined) {
        return null;
    }
    return decode(buf, pos);
}
|
|
155
|
+
/**
 * Computes the offset just past a metadata value without decoding it.
 *
 * @param buf Buffer holding the metadata bytes.
 * @param pos Offset where the value starts.
 * @param vtype Numeric value type tag (8 = length-prefixed string, 9 = array).
 * @param limit Number of valid bytes in `buf`; length prefixes and array
 *   headers are only read when they fit below this offset.
 * @returns The offset after the value, or -1 when the type is unknown or a
 *   string/array header does not fit within `limit`. The returned offset is
 *   not clamped and may exceed `limit`.
 */
function skipValue(buf, pos, vtype, limit) {
    // Fixed-width scalars: advance by the width only, nothing is read.
    if (vtype === 0 || vtype === 1 || vtype === 7) {
        return pos + 1;
    }
    if (vtype === 2 || vtype === 3) {
        return pos + 2;
    }
    if (vtype === 4 || vtype === 5 || vtype === 6) {
        return pos + 4;
    }
    if (vtype === 10 || vtype === 11 || vtype === 12) {
        return pos + 8;
    }
    if (vtype === 8) {
        // String: uint64 byte length followed by the bytes.
        if (pos + 8 > limit) {
            return -1;
        }
        const byteLength = Number(buf.readBigUInt64LE(pos));
        return pos + 8 + byteLength;
    }
    if (vtype === 9) {
        // Array: uint32 element type, uint64 element count, then the elements.
        if (pos + 12 > limit) {
            return -1;
        }
        const elemType = buf.readUInt32LE(pos);
        const count = Number(buf.readBigUInt64LE(pos + 4));
        let cursor = pos + 12;
        // Stop walking once the cursor reaches the limit; the offset reached
        // so far is returned in that case rather than an error.
        for (let n = 0; n < count && cursor < limit; n += 1) {
            cursor = skipValue(buf, cursor, elemType, limit);
            if (cursor < 0) {
                return -1;
            }
        }
        return cursor;
    }
    return -1;
}
|
|
190
|
+
//# sourceMappingURL=gguf-reader.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"gguf-reader.js","sourceRoot":"","sources":["../../../lib/local-llm/gguf-reader.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,MAAM,aAAa,CAAC;AAClC,OAAO,EAAE,YAAY,EAAE,MAAM,IAAI,CAAC;AAClC,OAAO,KAAK,EAAE,MAAM,IAAI,CAAC;AACzB,OAAO,EAAE,MAAM,EAAE,MAAM,cAAc,CAAC;AAEtC,MAAM,UAAU,GAAG,UAAU,CAAC,CAAC,0BAA0B;AACzD,MAAM,oBAAoB,GAAG,IAAI,GAAG,IAAI,CAAC,CAAC,qCAAqC;AAC/E,MAAM,iBAAiB,GAAG,CAAC,GAAG,IAAI,GAAG,IAAI,GAAG,IAAI,CAAC,CAAC,4BAA4B;AAW9E;;;GAGG;AACH,MAAM,CAAC,KAAK,UAAU,iBAAiB,CAAC,SAAiB;IACvD,IAAI,MAAM,GAAyB,IAAI,CAAC;IACxC,IAAI,CAAC;QACH,MAAM,GAAG,MAAM,EAAE,CAAC,IAAI,CAAC,SAAS,EAAE,GAAG,CAAC,CAAC;QACvC,MAAM,IAAI,GAAG,MAAM,MAAM,CAAC,IAAI,EAAE,CAAC;QACjC,MAAM,GAAG,GAAG,MAAM,CAAC,KAAK,CAAC,oBAAoB,CAAC,CAAC;QAC/C,MAAM,EAAE,SAAS,EAAE,GAAG,MAAM,MAAM,CAAC,IAAI,CAAC,GAAG,EAAE,CAAC,EAAE,GAAG,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC;QAC/D,IAAI,SAAS,GAAG,EAAE;YAAE,OAAO,IAAI,CAAC;QAEhC,MAAM,KAAK,GAAG,GAAG,CAAC,YAAY,CAAC,CAAC,CAAC,CAAC;QAClC,IAAI,KAAK,KAAK,UAAU;YAAE,OAAO,IAAI,CAAC;QAEtC,MAAM,OAAO,GAAG,GAAG,CAAC,YAAY,CAAC,CAAC,CAAC,CAAC;QACpC,IAAI,OAAO,GAAG,CAAC,IAAI,OAAO,GAAG,CAAC;YAAE,OAAO,IAAI,CAAC;QAE5C,MAAM,OAAO,GAAG,MAAM,CAAC,GAAG,CAAC,eAAe,CAAC,EAAE,CAAC,CAAC,CAAC;QAChD,IAAI,GAAG,GAAG,EAAE,CAAC;QAEb,MAAM,IAAI,GAA2B,EAAE,aAAa,EAAE,IAAI,CAAC,IAAI,EAAE,CAAC;QAClE,MAAM,MAAM,GAAG,IAAI,GAAG,CAAC,CAAC,gBAAgB,EAAE,aAAa,EAAE,kBAAkB,EAAE,sBAAsB,EAAE,yBAAyB,CAAC,CAAC,CAAC;QAEjI,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,OAAO,IAAI,GAAG,GAAG,SAAS,GAAG,EAAE,IAAI,MAAM,CAAC,IAAI,GAAG,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC;YAC5E,IAAI,GAAG,GAAG,CAAC,GAAG,SAAS;gBAAE,MAAM;YAC/B,MAAM,MAAM,GAAG,MAAM,CAAC,GAAG,CAAC,eAAe,CAAC,GAAG,CAAC,CAAC,CAAC;YAChD,GAAG,IAAI,CAAC,CAAC;YAET,IAAI,GAAG,GAAG,MAAM,GAAG,SAAS;gBAAE,MAAM;YACpC,MAAM,GAAG,GAAG,GAAG,CAAC,QAAQ,CAAC,OAAO,EAAE,GAAG,EAAE,GAAG,GAAG,MAAM,CAAC,CAAC;YACrD,GAAG,IAAI,MAAM,CAAC;YAEd,IAAI,GAAG,GAAG,CAAC,GAAG,SAAS;gBAAE,MAAM;YAC/B,MAAM,KAAK,GAAG,GAAG,CAAC,YAAY,CAAC,GAAG,CAAC,CAAC;YACpC,GAAG,IAAI,CAAC,CAAC;YAET,IAAI,GAAG,CAAC,QAAQ,CAAC,iBAAiB,CAAC,EAAE,CA
AC;gBACpC,IAAI,CAAC,aAAa,GAAG,UAAU,CAAC,GAAG,EAAE,GAAG,EAAE,KAAK,CAAC,IAAI,CAAC,CAAC;gBACtD,MAAM,CAAC,MAAM,CAAC,gBAAgB,CAAC,CAAC;YAClC,CAAC;iBAAM,IAAI,GAAG,CAAC,QAAQ,CAAC,cAAc,CAAC,EAAE,CAAC;gBACxC,IAAI,CAAC,UAAU,GAAG,UAAU,CAAC,GAAG,EAAE,GAAG,EAAE,KAAK,CAAC,IAAI,CAAC,CAAC;gBACnD,MAAM,CAAC,MAAM,CAAC,aAAa,CAAC,CAAC;YAC/B,CAAC;iBAAM,IAAI,GAAG,CAAC,QAAQ,CAAC,mBAAmB,CAAC,EAAE,CAAC;gBAC7C,IAAI,CAAC,eAAe,GAAG,UAAU,CAAC,GAAG,EAAE,GAAG,EAAE,KAAK,CAAC,IAAI,CAAC,CAAC;gBACxD,MAAM,CAAC,MAAM,CAAC,kBAAkB,CAAC,CAAC;YACpC,CAAC;iBAAM,IAAI,GAAG,CAAC,QAAQ,CAAC,0BAA0B,CAAC,EAAE,CAAC;gBACpD,IAAI,CAAC,WAAW,GAAG,UAAU,CAAC,GAAG,EAAE,GAAG,EAAE,KAAK,CAAC,IAAI,CAAC,CAAC;gBACpD,MAAM,CAAC,MAAM,CAAC,yBAAyB,CAAC,CAAC;YAC3C,CAAC;iBAAM,IAAI,GAAG,CAAC,QAAQ,CAAC,uBAAuB,CAAC,EAAE,CAAC;gBACjD,IAAI,CAAC,SAAS,GAAG,UAAU,CAAC,GAAG,EAAE,GAAG,EAAE,KAAK,CAAC,IAAI,CAAC,CAAC;gBAClD,MAAM,CAAC,MAAM,CAAC,sBAAsB,CAAC,CAAC;YACxC,CAAC;YAED,GAAG,GAAG,SAAS,CAAC,GAAG,EAAE,GAAG,EAAE,KAAK,EAAE,SAAS,CAAC,CAAC;YAC5C,IAAI,GAAG,GAAG,CAAC;gBAAE,MAAM;QACrB,CAAC;QAED,IAAI,CAAC,IAAI,CAAC,aAAa;YAAE,OAAO,IAAI,CAAC;QAErC,MAAM,MAAM,GAAG,IAAqB,CAAC;QACrC,MAAM,CAAC,IAAI,CAAC,gBAAgB,SAAS,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,GAAG,EAAE,SAAS,MAAM,CAAC,aAAa,WAAW,MAAM,CAAC,UAAU,SAAS,MAAM,CAAC,eAAe,UAAU,MAAM,CAAC,SAAS,aAAa,MAAM,CAAC,WAAW,SAAS,CAAC,MAAM,CAAC,aAAa,GAAG,IAAI,GAAG,IAAI,GAAG,IAAI,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC;QAC5Q,OAAO,MAAM,CAAC;IAChB,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,MAAM,CAAC,IAAI,CAAC,8CAA8C,GAAG,EAAE,CAAC,CAAC;QACjE,OAAO,IAAI,CAAC;IACd,CAAC;YAAS,CAAC;QACT,MAAM,MAAM,EAAE,KAAK,EAAE,CAAC;IACxB,CAAC;AACH,CAAC;AAED;;;GAGG;AACH,MAAM,UAAU,oBAAoB,CAAC,IAAmB;IACtD,MAAM,OAAO,GAAG,IAAI,CAAC,eAAe,GAAG,IAAI,CAAC,SAAS,CAAC;IACtD,OAAO,CAAC,GAAG,IAAI,CAAC,UAAU,GAAG,IAAI,CAAC,WAAW,GAAG,OAAO,GAAG,CAAC,CAAC;AAC9D,CAAC;AAED;;;GAGG;AACH;;;GAGG;AACH,SAAS,kBAAkB;IACzB,MAAM,OAAO,GAAG,EAAE,CAAC,QAAQ,EAAE,CAAC;IAC9B,IAAI,OAAO,CAAC,QAAQ,KAAK,OAAO;QAAE,OAAO,OAAO,CAAC;IACjD,IAAI,CAAC;QACH,YAAY;QACZ,MAAM,GAAG,GAAG,YAAY,CAAC,2BAA2B,EAAE,OAAO,CAAC,C
AAC,IAAI,EAAE,CAAC;QACtE,IAAI,GAAG,KAAK,KAAK;YAAE,OAAO,IAAI,CAAC,GAAG,CAAC,MAAM,CAAC,GAAG,CAAC,EAAE,OAAO,CAAC,CAAC;IAC3D,CAAC;IAAC,MAAM,CAAC,CAAC,mBAAmB,CAAC,CAAC;IAC/B,IAAI,CAAC;QACH,YAAY;QACZ,MAAM,GAAG,GAAG,YAAY,CAAC,6CAA6C,EAAE,OAAO,CAAC,CAAC,IAAI,EAAE,CAAC;QACxF,MAAM,KAAK,GAAG,MAAM,CAAC,GAAG,CAAC,CAAC;QAC1B,IAAI,KAAK,GAAG,CAAC,IAAI,KAAK,GAAG,OAAO;YAAE,OAAO,KAAK,CAAC;IACjD,CAAC;IAAC,MAAM,CAAC,CAAC,mBAAmB,CAAC,CAAC;IAC/B,OAAO,OAAO,CAAC;AACjB,CAAC;AAED,MAAM,UAAU,2BAA2B,CAAC,IAAmB;IAC7D,MAAM,QAAQ,GAAG,kBAAkB,EAAE,CAAC;IACtC,MAAM,iBAAiB,GAAG,QAAQ,GAAG,iBAAiB,CAAC;IACvD,MAAM,eAAe,GAAG,iBAAiB,GAAG,IAAI,CAAC,aAAa,CAAC;IAE/D,IAAI,eAAe,IAAI,CAAC,EAAE,CAAC;QACzB,MAAM,CAAC,IAAI,CAAC,4BAA4B,CAAC,IAAI,CAAC,aAAa,GAAG,IAAI,GAAG,IAAI,GAAG,IAAI,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,qDAAqD,CAAC,CAAC;QACnJ,OAAO,IAAI,CAAC;IACd,CAAC;IAED,MAAM,aAAa,GAAG,oBAAoB,CAAC,IAAI,CAAC,CAAC;IACjD,mGAAmG;IACnG,MAAM,WAAW,GAAG,IAAI,CAAC,KAAK,CAAC,CAAC,eAAe,GAAG,GAAG,CAAC,GAAG,aAAa,CAAC,CAAC;IACxE,+FAA+F;IAC/F,MAAM,eAAe,GAAG,KAAK,CAAC;IAC9B,MAAM,SAAS,GAAG,IAAI,CAAC,aAAa,CAAC;IAErC,MAAM,OAAO,GAAG,IAAI,CAAC,GAAG,CAAC,WAAW,EAAE,SAAS,EAAE,eAAe,CAAC,CAAC;IAClE,sDAAsD;IACtD,MAAM,MAAM,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,IAAI,CAAC,KAAK,CAAC,OAAO,GAAG,IAAI,CAAC,GAAG,IAAI,CAAC,CAAC;IAEjE,MAAM,CAAC,IAAI,CAAC,qBAAqB,CAAC,QAAQ,GAAG,IAAI,GAAG,IAAI,GAAG,IAAI,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,aAAa,CAAC,eAAe,GAAG,IAAI,GAAG,IAAI,GAAG,IAAI,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,mCAAmC,aAAa,wBAAwB,WAAW,cAAc,SAAS,WAAW,eAAe,eAAe,MAAM,EAAE,CAAC,CAAC;IACtS,OAAO,MAAM,CAAC;AAChB,CAAC;AAED,SAAS,UAAU,CAAC,GAAW,EAAE,GAAW,EAAE,KAAa;IACzD,QAAQ,KAAK,EAAE,CAAC;QACd,KAAK,CAAC,CAAC,CAAC,OAAO,GAAG,CAAC,SAAS,CAAC,GAAG,CAAC,CAAC;QAClC,KAAK,CAAC,CAAC,CAAC,OAAO,GAAG,CAAC,QAAQ,CAAC,GAAG,CAAC,CAAC;QACjC,KAAK,CAAC,CAAC,CAAC,OAAO,GAAG,CAAC,YAAY,CAAC,GAAG,CAAC,CAAC;QACrC,KAAK,CAAC,CAAC,CAAC,OAAO,GAAG,CAAC,WAAW,CAAC,GAAG,CAAC,CAAC;QACpC,KAAK,CAAC,CAAC,CAAC,OAAO,GAAG,CAAC,YAAY,CAAC,GAAG,CAAC,CAAC;QACrC,KAAK,CAAC,CAAC,CAAC,OAAO,GAAG,CAAC,WAAW,CAAC,GAAG,CAAC,CAAC;QACpC
,KAAK,CAAC,CAAC,CAAC,OAAO,GAAG,CAAC,WAAW,CAAC,GAAG,CAAC,CAAC;QACpC,KAAK,CAAC,CAAC,CAAC,OAAO,GAAG,CAAC,SAAS,CAAC,GAAG,CAAC,CAAC;QAClC,KAAK,EAAE,CAAC,CAAC,OAAO,MAAM,CAAC,GAAG,CAAC,eAAe,CAAC,GAAG,CAAC,CAAC,CAAC;QACjD,KAAK,EAAE,CAAC,CAAC,OAAO,MAAM,CAAC,GAAG,CAAC,cAAc,CAAC,GAAG,CAAC,CAAC,CAAC;QAChD,KAAK,EAAE,CAAC,CAAC,OAAO,GAAG,CAAC,YAAY,CAAC,GAAG,CAAC,CAAC;QACtC,OAAO,CAAC,CAAC,OAAO,IAAI,CAAC;IACvB,CAAC;AACH,CAAC;AAED,SAAS,SAAS,CAAC,GAAW,EAAE,GAAW,EAAE,KAAa,EAAE,KAAa;IACvE,QAAQ,KAAK,EAAE,CAAC;QACd,KAAK,CAAC,CAAC;QAAC,KAAK,CAAC,CAAC;QAAC,KAAK,CAAC,CAAC,CAAC,OAAO,GAAG,GAAG,CAAC,CAAC;QACvC,KAAK,CAAC,CAAC;QAAC,KAAK,CAAC,CAAC,CAAC,OAAO,GAAG,GAAG,CAAC,CAAC;QAC/B,KAAK,CAAC,CAAC;QAAC,KAAK,CAAC,CAAC;QAAC,KAAK,CAAC,CAAC,CAAC,OAAO,GAAG,GAAG,CAAC,CAAC;QACvC,KAAK,EAAE,CAAC;QAAC,KAAK,EAAE,CAAC;QAAC,KAAK,EAAE,CAAC,CAAC,OAAO,GAAG,GAAG,CAAC,CAAC;QAC1C,KAAK,CAAC,CAAC,CAAC,CAAC;YACP,IAAI,GAAG,GAAG,CAAC,GAAG,KAAK;gBAAE,OAAO,CAAC,CAAC,CAAC;YAC/B,MAAM,GAAG,GAAG,MAAM,CAAC,GAAG,CAAC,eAAe,CAAC,GAAG,CAAC,CAAC,CAAC;YAC7C,OAAO,GAAG,GAAG,CAAC,GAAG,GAAG,CAAC;QACvB,CAAC;QACD,KAAK,CAAC,CAAC,CAAC,CAAC;YACP,IAAI,GAAG,GAAG,EAAE,GAAG,KAAK;gBAAE,OAAO,CAAC,CAAC,CAAC;YAChC,MAAM,QAAQ,GAAG,GAAG,CAAC,YAAY,CAAC,GAAG,CAAC,CAAC;YACvC,MAAM,KAAK,GAAG,MAAM,CAAC,GAAG,CAAC,eAAe,CAAC,GAAG,GAAG,CAAC,CAAC,CAAC,CAAC;YACnD,GAAG,IAAI,EAAE,CAAC;YACV,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,KAAK,IAAI,GAAG,GAAG,KAAK,EAAE,CAAC,EAAE,EAAE,CAAC;gBAC9C,GAAG,GAAG,SAAS,CAAC,GAAG,EAAE,GAAG,EAAE,QAAQ,EAAE,KAAK,CAAC,CAAC;gBAC3C,IAAI,GAAG,GAAG,CAAC;oBAAE,OAAO,CAAC,CAAC,CAAC;YACzB,CAAC;YACD,OAAO,GAAG,CAAC;QACb,CAAC;QACD,OAAO,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC;IACrB,CAAC;AACH,CAAC"}
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
export { ModelManager } from './model-manager.ts';
|
|
2
|
+
export { engineRegistry } from './engine-registry.ts';
|
|
3
|
+
export type { LocalEngine, EngineStatus, EngineChatStatus, EngineServerStatus, LoadOptions } from './engine-interface.ts';
|
|
4
|
+
export { getBinaryPath, detectGpu } from './binary-manager.ts';
|
|
5
|
+
export type { GpuInfo } from './binary-manager.ts';
|
|
6
|
+
export { LlamaServerProcess } from './llama-server-process.ts';
|
|
7
|
+
export { MlxServerProcess, killOrphanedMlxServers } from './mlx-server-process.ts';
|
|
8
|
+
export type { LocalModel, LocalLlmStatus, HuggingFaceModelResult, HuggingFaceGgufFile, DownloadProgress, ActiveDownload, InterruptedDownload, LocalLlmState, } from './types.ts';
|
|
9
|
+
//# sourceMappingURL=index.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../lib/local-llm/index.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,YAAY,EAAE,MAAM,oBAAoB,CAAC;AAClD,OAAO,EAAE,cAAc,EAAE,MAAM,sBAAsB,CAAC;AACtD,YAAY,EAAE,WAAW,EAAE,YAAY,EAAE,gBAAgB,EAAE,kBAAkB,EAAE,WAAW,EAAE,MAAM,uBAAuB,CAAC;AAC1H,OAAO,EAAE,aAAa,EAAE,SAAS,EAAE,MAAM,qBAAqB,CAAC;AAC/D,YAAY,EAAE,OAAO,EAAE,MAAM,qBAAqB,CAAC;AACnD,OAAO,EAAE,kBAAkB,EAAE,MAAM,2BAA2B,CAAC;AAC/D,OAAO,EAAE,gBAAgB,EAAE,sBAAsB,EAAE,MAAM,yBAAyB,CAAC;AACnF,YAAY,EACV,UAAU,EACV,cAAc,EACd,sBAAsB,EACtB,mBAAmB,EACnB,gBAAgB,EAChB,cAAc,EACd,mBAAmB,EACnB,aAAa,GACd,MAAM,YAAY,CAAC"}
|
|
@@ -0,0 +1,6 @@
|
|
|
1
|
+
export { ModelManager } from "./model-manager.js";
|
|
2
|
+
export { engineRegistry } from "./engine-registry.js";
|
|
3
|
+
export { getBinaryPath, detectGpu } from "./binary-manager.js";
|
|
4
|
+
export { LlamaServerProcess } from "./llama-server-process.js";
|
|
5
|
+
export { MlxServerProcess, killOrphanedMlxServers } from "./mlx-server-process.js";
|
|
6
|
+
//# sourceMappingURL=index.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../lib/local-llm/index.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,YAAY,EAAE,MAAM,oBAAoB,CAAC;AAClD,OAAO,EAAE,cAAc,EAAE,MAAM,sBAAsB,CAAC;AAEtD,OAAO,EAAE,aAAa,EAAE,SAAS,EAAE,MAAM,qBAAqB,CAAC;AAE/D,OAAO,EAAE,kBAAkB,EAAE,MAAM,2BAA2B,CAAC;AAC/D,OAAO,EAAE,gBAAgB,EAAE,sBAAsB,EAAE,MAAM,yBAAyB,CAAC"}
|
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
/** Launch options accepted by `LlamaServerProcess.start()`; each field is translated into a llama-server command-line flag. */
export interface ServerOptions {
|
|
2
|
+
/** Path to the model file; passed as `--model`. */
modelPath: string;
|
|
3
|
+
/** Optional projector file; passed as `--mmproj` when set. */
mmproj?: string;
|
|
4
|
+
/** Port to listen on (`--port`). When omitted, `start()` probes for a free port beginning at 9990 (9991 for embedding servers). */
port?: number;
|
|
5
|
+
/** Adds `--embedding`; also added when the process was constructed as an embedding server. */
embedding?: boolean;
|
|
6
|
+
/** Passed as `--n-gpu-layers`; defaults to -1 when omitted. */
gpuLayers?: number;
|
|
7
|
+
/** Passed as `--ctx-size` when set to a non-zero value. */
contextSize?: number;
|
|
8
|
+
/** `--flash-attn on` is passed unless this is explicitly `false`. */
flashAttn?: boolean;
|
|
9
|
+
/** Passed as `--threads` when set to a non-zero value. */
threads?: number;
|
|
10
|
+
/** Passed as `--batch-size` when set to a non-zero value. */
batchSize?: number;
|
|
11
|
+
/** Passed as `--ubatch-size` when set to a non-zero value. */
ubatchSize?: number;
|
|
12
|
+
/** Passed verbatim as `--cache-type-k` when set. */
cacheTypeK?: string;
|
|
13
|
+
/** Passed verbatim as `--cache-type-v` when set. */
cacheTypeV?: string;
|
|
14
|
+
/** Adds `--mlock` when true. */
mlock?: boolean;
|
|
15
|
+
/** When defined, adds `--reasoning-format deepseek` and a `--reasoning-budget` value that is currently clamped to -1 or 0 before being passed on. */
reasoningBudget?: number;
|
|
16
|
+
}
|
|
17
|
+
/**
|
|
18
|
+
* Kill any orphaned llama-server processes from a previous run.
|
|
19
|
+
* Call this once at startup before launching new servers.
*
* Orphans are discovered through the `*.json` PID files stored under
* `<baseDir>/.llama-server/pids`; every PID file found is deleted afterwards.
* Processes still alive are sent SIGTERM, then SIGKILL 3 seconds later if needed.
*
* @param baseDir Root directory that contains the `.llama-server` folder.
|
|
20
|
+
*/
|
|
21
|
+
export declare function killOrphanedServers(baseDir: string): void;
|
|
22
|
+
/** Starts, monitors and stops one llama-server child process bound to 127.0.0.1. */
export declare class LlamaServerProcess {
|
|
23
|
+
private proc;
|
|
24
|
+
private _port;
|
|
25
|
+
private _modelPath;
|
|
26
|
+
private _running;
|
|
27
|
+
private _ready;
|
|
28
|
+
private baseDir;
|
|
29
|
+
private isEmbedding;
|
|
30
|
+
private role;
|
|
31
|
+
/**
 * @param baseDir Directory used to locate the server binary and to store PID files.
 * @param isEmbedding When true the instance uses the 'embedding' role (default: false, role 'chat').
 */
constructor(baseDir: string, isEmbedding?: boolean);
|
|
32
|
+
/** Port selected by the most recent `start()` call; 0 before the first start. */
get port(): number;
|
|
33
|
+
/** Model path given to the most recent `start()` call; empty string before the first start. */
get modelPath(): string;
|
|
34
|
+
/** True from the moment the child process is spawned until it exits or is stopped. */
get running(): boolean;
|
|
35
|
+
/** True once the server's `/health` endpoint has reported status "ok". */
get ready(): boolean;
|
|
36
|
+
/** Stops any previous process, spawns llama-server with `options` and resolves once it reports healthy; rejects if it exits or does not become healthy in time. */
start(options: ServerOptions): Promise<void>;
|
|
37
|
+
/** Sends SIGTERM to the child, escalating to SIGKILL after 5 seconds; resolves immediately when nothing is running. */
stop(): Promise<void>;
|
|
38
|
+
/** Returns `http://127.0.0.1:<port>` for the current port. */
getBaseUrl(): string;
|
|
39
|
+
/** Fetches the server's `/props` JSON; resolves to null when the server is not ready or the request fails. */
getServerProps(): Promise<any>;
|
|
40
|
+
private waitForReady;
|
|
41
|
+
}
|
|
42
|
+
//# sourceMappingURL=llama-server-process.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"llama-server-process.d.ts","sourceRoot":"","sources":["../../../lib/local-llm/llama-server-process.ts"],"names":[],"mappings":"AAOA,MAAM,WAAW,aAAa;IAC5B,SAAS,EAAE,MAAM,CAAC;IAClB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,SAAS,CAAC,EAAE,OAAO,CAAC;IACpB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,SAAS,CAAC,EAAE,OAAO,CAAC;IACpB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,KAAK,CAAC,EAAE,OAAO,CAAC;IAChB,eAAe,CAAC,EAAE,MAAM,CAAC;CAC1B;AA6BD;;;GAGG;AACH,wBAAgB,mBAAmB,CAAC,OAAO,EAAE,MAAM,GAAG,IAAI,CAwBzD;AAaD,qBAAa,kBAAkB;IAC7B,OAAO,CAAC,IAAI,CAA6B;IACzC,OAAO,CAAC,KAAK,CAAK;IAClB,OAAO,CAAC,UAAU,CAAM;IACxB,OAAO,CAAC,QAAQ,CAAS;IACzB,OAAO,CAAC,MAAM,CAAS;IACvB,OAAO,CAAC,OAAO,CAAS;IACxB,OAAO,CAAC,WAAW,CAAU;IAC7B,OAAO,CAAC,IAAI,CAAS;gBAET,OAAO,EAAE,MAAM,EAAE,WAAW,UAAQ;IAMhD,IAAI,IAAI,WAAyB;IACjC,IAAI,SAAS,WAA8B;IAC3C,IAAI,OAAO,YAA4B;IACvC,IAAI,KAAK,YAA0B;IAE7B,KAAK,CAAC,OAAO,EAAE,aAAa,GAAG,OAAO,CAAC,IAAI,CAAC;IAkE5C,IAAI,IAAI,OAAO,CAAC,IAAI,CAAC;IA4B3B,UAAU,IAAI,MAAM;IAId,cAAc,IAAI,OAAO,CAAC,GAAG,CAAC;YAUtB,YAAY;CAgB3B"}
|
|
@@ -0,0 +1,237 @@
|
|
|
1
|
+
import { spawn } from 'child_process';
|
|
2
|
+
import { existsSync, mkdirSync, writeFileSync, readFileSync, readdirSync, unlinkSync } from 'fs';
|
|
3
|
+
import * as net from 'net';
|
|
4
|
+
import * as path from 'path';
|
|
5
|
+
import { logger } from "../logger.js";
|
|
6
|
+
import { getBinaryPath } from "./binary-manager.js";
|
|
7
|
+
// Delay between two consecutive /health probes while waiting for the server to start (milliseconds).
const HEALTH_POLL_MS = 500;
|
|
8
|
+
// Total time the server is given to report healthy before startup is abandoned (milliseconds).
const STARTUP_TIMEOUT_MS = 120_000;
|
|
9
|
+
// ─── PID file management ──────────────────────────────────────────────────────
|
|
10
|
+
/**
 * Locate the directory in which PID files for servers launched from `baseDir` are kept.
 *
 * @param baseDir Root directory of the installation.
 * @returns `<baseDir>/.llama-server/pids`, joined with the platform separator.
 */
function pidDir(baseDir) {
    const segments = [baseDir, '.llama-server', 'pids'];
    return path.join(...segments);
}
|
|
13
|
+
/**
 * Build the path of the PID file that tracks the server with the given role.
 *
 * @param baseDir Root directory of the installation.
 * @param role Server role; becomes the file's base name.
 * @returns Path of `<role>.json` inside the PID directory.
 */
function pidFilePath(baseDir, role) {
    const fileName = `${role}.json`;
    const directory = pidDir(baseDir);
    return path.join(directory, fileName);
}
|
|
16
|
+
/**
 * Record a running server on disk so that it can be found again later.
 *
 * Creates the PID directory (including parents) when it does not exist yet, then
 * writes `info` as JSON to the role's PID file, replacing any previous content.
 *
 * @param baseDir Root directory of the installation.
 * @param role Server role that names the PID file.
 * @param info JSON-serialisable description of the process.
 */
function writePidFile(baseDir, role, info) {
    const directory = pidDir(baseDir);
    const directoryMissing = existsSync(directory) === false;
    if (directoryMissing) {
        mkdirSync(directory, { recursive: true });
    }
    const destination = pidFilePath(baseDir, role);
    writeFileSync(destination, JSON.stringify(info));
}
|
|
22
|
+
/**
 * Delete the PID file for the given role.
 *
 * Best effort: any failure (typically the file being gone already) is ignored.
 *
 * @param baseDir Root directory of the installation.
 * @param role Server role that names the PID file.
 */
function removePidFile(baseDir, role) {
    try {
        const target = pidFilePath(baseDir, role);
        unlinkSync(target);
    }
    catch (_ignored) {
        // already gone
    }
}
|
|
28
|
+
/**
 * Report whether a single process with the given PID can currently be signalled.
 *
 * Uses signal 0, which performs the existence/permission check without
 * delivering a signal.
 *
 * @param pid Process id to probe.
 * @returns true when the probe succeeds; false when it throws (no such process,
 *          or not permitted to signal it) or when `pid` is not a positive integer.
 */
function isProcessAlive(pid) {
    // 0 and negative values address process groups rather than one process, and
    // non-integers are not valid PIDs at all; none of them names "a process".
    if (!Number.isInteger(pid) || pid <= 0)
        return false;
    try {
        process.kill(pid, 0);
        return true;
    }
    catch {
        return false;
    }
}
|
|
37
|
+
/**
 * Kill any orphaned llama-server processes from a previous run.
 * Call this once at startup before launching new servers.
 *
 * Every `*.json` file in the PID directory is read. When it names a live process,
 * that process is sent SIGTERM and, if still alive 3 seconds later, SIGKILL.
 * The PID file is deleted in all cases, including when it cannot be parsed.
 *
 * Note: the pending SIGKILL timer keeps the event loop alive for up to 3 seconds.
 *
 * @param baseDir Root directory that contains the `.llama-server` folder.
 */
export function killOrphanedServers(baseDir) {
    const dir = pidDir(baseDir);
    if (!existsSync(dir))
        return;
    let files;
    try {
        files = readdirSync(dir);
    }
    catch {
        return;
    }
    for (const file of files) {
        if (!file.endsWith('.json'))
            continue;
        const pidFile = path.join(dir, file);
        try {
            const info = JSON.parse(readFileSync(pidFile, 'utf-8'));
            const pid = info?.pid;
            // PID files are untrusted input: 0 or a negative pid would make
            // process.kill() signal a whole process group, and our own pid must
            // never be a target. Only a positive integer names one process.
            const pidIsUsable = Number.isInteger(pid) && pid > 0 && pid !== process.pid;
            if (pidIsUsable && isProcessAlive(pid)) {
                logger.warn(`[LlamaServer] Killing orphaned llama-server (PID ${pid}, port ${info.port})`);
                try {
                    process.kill(pid, 'SIGTERM');
                }
                catch { /* already dead */ }
                // Give it a moment, then force kill
                setTimeout(() => {
                    try {
                        if (isProcessAlive(pid))
                            process.kill(pid, 'SIGKILL');
                    }
                    catch { /* gone */ }
                }, 3000);
            }
            unlinkSync(pidFile);
        }
        catch { /* corrupt pid file, remove it */
            try {
                unlinkSync(pidFile);
            }
            catch { /* ignore */ }
        }
    }
}
|
|
82
|
+
async function findFreePort(start) {
|
|
83
|
+
return new Promise((resolve) => {
|
|
84
|
+
const server = net.createServer();
|
|
85
|
+
server.listen(start, '127.0.0.1', () => {
|
|
86
|
+
const port = server.address().port;
|
|
87
|
+
server.close(() => resolve(port));
|
|
88
|
+
});
|
|
89
|
+
server.on('error', () => findFreePort(start + 1).then(resolve));
|
|
90
|
+
});
|
|
91
|
+
}
|
|
92
|
+
/**
 * Starts, monitors and stops one llama-server child process bound to 127.0.0.1.
 *
 * An instance has a fixed role ('chat' or 'embedding'). The role names the PID
 * file written once the server is ready, which lets a later run find and kill a
 * server that outlived its parent.
 */
export class LlamaServerProcess {
    /** Handle of the current child process, or null when none is running. */
    proc = null;
    _port = 0;
    _modelPath = '';
    _running = false;
    _ready = false;
    baseDir;
    isEmbedding;
    role;
    /**
     * @param baseDir Directory used to locate the server binary and to store PID files.
     * @param isEmbedding When true the instance uses the 'embedding' role; otherwise 'chat'.
     */
    constructor(baseDir, isEmbedding = false) {
        this.baseDir = baseDir;
        this.isEmbedding = isEmbedding;
        this.role = isEmbedding ? 'embedding' : 'chat';
    }
    /** Port selected by the most recent start(); 0 before the first start. */
    get port() { return this._port; }
    /** Model path given to the most recent start(); empty before the first start. */
    get modelPath() { return this._modelPath; }
    /** True from spawn until the child exits or is stopped. */
    get running() { return this._running; }
    /** True once the health endpoint has reported status "ok". */
    get ready() { return this._ready; }
    /**
     * Translate launch options into the llama-server command line.
     * Internal helper of start(); it reads the port from `this._port`, so start()
     * must have chosen the port before calling it.
     *
     * @param options Launch options (see ServerOptions).
     * @returns Argument vector for the llama-server binary.
     */
    buildArgs(options) {
        const args = [
            '--model', options.modelPath,
            '--port', String(this._port),
            '--host', '127.0.0.1',
            '--n-gpu-layers', String(options.gpuLayers ?? -1),
            '--parallel', '1',
        ];
        if (options.mmproj)
            args.push('--mmproj', options.mmproj);
        if (options.contextSize)
            args.push('--ctx-size', String(options.contextSize));
        if (options.flashAttn !== false)
            args.push('--flash-attn', 'on');
        if (options.threads)
            args.push('--threads', String(options.threads));
        if (options.batchSize)
            args.push('--batch-size', String(options.batchSize));
        if (options.ubatchSize)
            args.push('--ubatch-size', String(options.ubatchSize));
        if (options.cacheTypeK)
            args.push('--cache-type-k', options.cacheTypeK);
        if (options.cacheTypeV)
            args.push('--cache-type-v', options.cacheTypeV);
        if (options.mlock)
            args.push('--mlock');
        if (options.reasoningBudget !== undefined) {
            args.push('--reasoning-format', 'deepseek');
            // TODO: llama-server b8280 and earlier only accept -1 or 0.
            // Arbitrary budgets (N>0) land after b8280 — remove clamp once binary is updated.
            // A negative request (-1 = unrestricted) must stay -1; only 0 disables reasoning.
            const unrestricted = options.reasoningBudget > 0 || options.reasoningBudget < 0;
            args.push('--reasoning-budget', String(unrestricted ? -1 : 0));
        }
        if (options.embedding || this.isEmbedding)
            args.push('--embedding');
        return args;
    }
    /**
     * Stop any previous process, spawn llama-server and wait until it is healthy.
     *
     * @param options Launch options (see ServerOptions).
     * @returns Resolves once the server reports healthy and its PID file is written.
     * @throws Error when the process cannot be spawned, exits during startup, or
     *         does not become healthy within the startup timeout. Captured stderr
     *         output is logged before the error is rethrown.
     */
    async start(options) {
        await this.stop();
        const binaryPath = await getBinaryPath(this.baseDir);
        this._port = options.port ?? await findFreePort(this.isEmbedding ? 9991 : 9990);
        this._modelPath = options.modelPath;
        const args = this.buildArgs(options);
        logger.info(`[LlamaServer] Starting: ${binaryPath} ${args.join(' ')}`);
        const binDir = path.dirname(binaryPath);
        // An empty LD_LIBRARY_PATH entry means "current directory", so the
        // separator is only added when there is an inherited value to append.
        const inheritedLibPath = process.env.LD_LIBRARY_PATH;
        const libraryPath = inheritedLibPath ? `${binDir}:${inheritedLibPath}` : binDir;
        const child = spawn(binaryPath, args, {
            stdio: ['ignore', 'ignore', 'pipe'],
            env: { ...process.env, LD_LIBRARY_PATH: libraryPath },
        });
        this.proc = child;
        this._running = true;
        // Keep only the tail of stderr, and only during startup, so it can be
        // surfaced when the process crashes. The pipe is still drained afterwards
        // so the child never blocks on a full pipe, but nothing is retained.
        const MAX_STDERR_BYTES = 64 * 1024;
        const stderrTail = [];
        let stderrBytes = 0;
        let capturing = true;
        child.stderr?.on('data', (chunk) => {
            if (!capturing)
                return;
            stderrTail.push(chunk);
            stderrBytes += chunk.length;
            while (stderrTail.length > 1 && stderrBytes - stderrTail[0].length >= MAX_STDERR_BYTES) {
                stderrBytes -= stderrTail.shift().length;
            }
        });
        const markGone = () => {
            // A late event from a child that was already replaced or stopped must
            // not clobber the state (or the PID file) of its successor.
            if (this.proc !== child)
                return;
            this._running = false;
            this._ready = false;
            this.proc = null;
            removePidFile(this.baseDir, this.role);
        };
        child.on('exit', markGone);
        // Without an 'error' listener a failed spawn (e.g. missing binary) would
        // be thrown as an uncaught exception and take the whole host down.
        child.on('error', (err) => {
            logger.error(`[LlamaServer] Process error: ${err?.message ?? err}`);
            // pid is undefined only when the process never started; in that case no
            // 'exit' event is guaranteed, so the state is cleaned up here.
            if (child.pid === undefined)
                markGone();
        });
        try {
            await this.waitForReady();
        }
        catch (err) {
            const stderr = Buffer.concat(stderrTail).toString().trim();
            if (stderr)
                logger.error(`[LlamaServer] stderr:\n${stderr}`);
            throw err;
        }
        finally {
            capturing = false;
            stderrTail.length = 0;
        }
        // The child may have died between the last health probe and this point.
        if (this.proc !== child)
            throw new Error('llama-server process exited during startup');
        this._ready = true;
        writePidFile(this.baseDir, this.role, { pid: child.pid, port: this._port, model: this._modelPath });
        logger.info(`[LlamaServer] Ready on port ${this._port}`);
    }
    /**
     * Stop the current child process, if any.
     *
     * Sends SIGTERM and waits for the process to exit; after 5 seconds it is sent
     * SIGKILL and the wait is abandoned. Resolves immediately when nothing is running.
     */
    async stop() {
        const child = this.proc;
        if (!child)
            return;
        logger.info('[LlamaServer] Stopping');
        await new Promise((resolve) => {
            if (child.exitCode !== null || child.signalCode !== null) {
                // Already exited; no 'exit' event will follow.
                resolve();
                return;
            }
            const forceKill = setTimeout(() => {
                child.kill('SIGKILL');
                resolve();
            }, 5000);
            child.once('exit', () => {
                clearTimeout(forceKill);
                resolve();
            });
            child.kill('SIGTERM');
        });
        // Only reset state that still belongs to the child stopped here.
        if (this.proc === child || this.proc === null) {
            this.proc = null;
            this._running = false;
            this._ready = false;
            // On the SIGKILL path the 'exit' handler no longer matches this child,
            // so the PID file is removed here (a no-op when it is already gone).
            removePidFile(this.baseDir, this.role);
        }
    }
    /** @returns Base URL of the server for the current port. */
    getBaseUrl() {
        return `http://127.0.0.1:${this._port}`;
    }
    /**
     * Fetch the server's `/props` document.
     *
     * @returns The parsed JSON body, or null when the server is not ready, the
     *          request fails, or the response status is not OK.
     */
    async getServerProps() {
        if (!this._ready)
            return null;
        try {
            const res = await fetch(`${this.getBaseUrl()}/props`);
            if (res.ok)
                return res.json();
        }
        catch { /* server may be down */ }
        return null;
    }
    /**
     * Poll `/health` until the server answers with status "ok".
     *
     * @throws Error when the process stops running while waiting, or when the
     *         startup timeout elapses (the process is stopped first in that case).
     */
    async waitForReady() {
        const start = Date.now();
        while (Date.now() - start < STARTUP_TIMEOUT_MS) {
            if (!this._running)
                throw new Error('llama-server process exited during startup');
            try {
                const res = await fetch(`http://127.0.0.1:${this._port}/health`);
                if (res.ok) {
                    const body = await res.json();
                    if (body.status === 'ok')
                        return;
                }
            }
            catch { /* not ready yet */ }
            await new Promise(r => setTimeout(r, HEALTH_POLL_MS));
        }
        await this.stop();
        throw new Error(`llama-server failed to become ready within ${STARTUP_TIMEOUT_MS / 1000}s`);
    }
}
|
|
237
|
+
//# sourceMappingURL=llama-server-process.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"llama-server-process.js","sourceRoot":"","sources":["../../../lib/local-llm/llama-server-process.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,KAAK,EAAqB,MAAM,eAAe,CAAC;AACzD,OAAO,EAAE,UAAU,EAAE,SAAS,EAAE,aAAa,EAAE,YAAY,EAAE,WAAW,EAAE,UAAU,EAAE,MAAM,IAAI,CAAC;AACjG,OAAO,KAAK,GAAG,MAAM,KAAK,CAAC;AAC3B,OAAO,KAAK,IAAI,MAAM,MAAM,CAAC;AAC7B,OAAO,EAAE,MAAM,EAAE,MAAM,cAAc,CAAC;AACtC,OAAO,EAAE,aAAa,EAAE,MAAM,qBAAqB,CAAC;AAmBpD,MAAM,cAAc,GAAG,GAAG,CAAC;AAC3B,MAAM,kBAAkB,GAAG,OAAO,CAAC;AAEnC,iFAAiF;AAEjF,SAAS,MAAM,CAAC,OAAe;IAC7B,OAAO,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,eAAe,EAAE,MAAM,CAAC,CAAC;AACrD,CAAC;AAED,SAAS,WAAW,CAAC,OAAe,EAAE,IAAY;IAChD,OAAO,IAAI,CAAC,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,EAAE,GAAG,IAAI,OAAO,CAAC,CAAC;AACpD,CAAC;AAED,SAAS,YAAY,CAAC,OAAe,EAAE,IAAY,EAAE,IAAkD;IACrG,MAAM,GAAG,GAAG,MAAM,CAAC,OAAO,CAAC,CAAC;IAC5B,IAAI,CAAC,UAAU,CAAC,GAAG,CAAC;QAAE,SAAS,CAAC,GAAG,EAAE,EAAE,SAAS,EAAE,IAAI,EAAE,CAAC,CAAC;IAC1D,aAAa,CAAC,WAAW,CAAC,OAAO,EAAE,IAAI,CAAC,EAAE,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,CAAC,CAAC;AAClE,CAAC;AAED,SAAS,aAAa,CAAC,OAAe,EAAE,IAAY;IAClD,IAAI,CAAC;QAAC,UAAU,CAAC,WAAW,CAAC,OAAO,EAAE,IAAI,CAAC,CAAC,CAAC;IAAC,CAAC;IAAC,MAAM,CAAC,CAAC,kBAAkB,CAAC,CAAC;AAC9E,CAAC;AAED,SAAS,cAAc,CAAC,GAAW;IACjC,IAAI,CAAC;QAAC,OAAO,CAAC,IAAI,CAAC,GAAG,EAAE,CAAC,CAAC,CAAC;QAAC,OAAO,IAAI,CAAC;IAAC,CAAC;IAAC,MAAM,CAAC;QAAC,OAAO,KAAK,CAAC;IAAC,CAAC;AACpE,CAAC;AAED;;;GAGG;AACH,MAAM,UAAU,mBAAmB,CAAC,OAAe;IACjD,MAAM,GAAG,GAAG,MAAM,CAAC,OAAO,CAAC,CAAC;IAC5B,IAAI,CAAC,UAAU,CAAC,GAAG,CAAC;QAAE,OAAO;IAE7B,IAAI,KAAe,CAAC;IACpB,IAAI,CAAC;QAAC,KAAK,GAAG,WAAW,CAAC,GAAG,CAAC,CAAC;IAAC,CAAC;IAAC,MAAM,CAAC;QAAC,OAAO;IAAC,CAAC;IAEnD,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;QACzB,IAAI,CAAC,IAAI,CAAC,QAAQ,CAAC,OAAO,CAAC;YAAE,SAAS;QACtC,IAAI,CAAC;YACH,MAAM,IAAI,GAAG,IAAI,CAAC,KAAK,CAAC,YAAY,CAAC,IAAI,CAAC,IAAI,CAAC,GAAG,EAAE,IAAI,CAAC,EAAE,OAAO,CAAC,CAAC,CAAC;YACrE,IAAI,IAAI,CAAC,GAAG,IAAI,cAAc,CAAC,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC;gBACzC,MAAM,CAAC,IAAI,CAAC,oDAAoD,IAAI,CAAC,GAAG,UAAU,IAAI,CAAC,IAAI,G
AAG,CAAC,CAAC;gBAChG,IAAI,CAAC;oBAAC,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,GAAG,EAAE,SAAS,CAAC,CAAC;gBAAC,CAAC;gBAAC,MAAM,CAAC,CAAC,kBAAkB,CAAC,CAAC;gBACvE,oCAAoC;gBACpC,UAAU,CAAC,GAAG,EAAE;oBACd,IAAI,CAAC;wBAAC,IAAI,cAAc,CAAC,IAAI,CAAC,GAAG,CAAC;4BAAE,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,GAAG,EAAE,SAAS,CAAC,CAAC;oBAAC,CAAC;oBAAC,MAAM,CAAC,CAAC,UAAU,CAAC,CAAC;gBAC/F,CAAC,EAAE,IAAI,CAAC,CAAC;YACX,CAAC;YACD,UAAU,CAAC,IAAI,CAAC,IAAI,CAAC,GAAG,EAAE,IAAI,CAAC,CAAC,CAAC;QACnC,CAAC;QAAC,MAAM,CAAC,CAAC,iCAAiC;YACzC,IAAI,CAAC;gBAAC,UAAU,CAAC,IAAI,CAAC,IAAI,CAAC,GAAG,EAAE,IAAI,CAAC,CAAC,CAAC;YAAC,CAAC;YAAC,MAAM,CAAC,CAAC,YAAY,CAAC,CAAC;QAClE,CAAC;IACH,CAAC;AACH,CAAC;AAED,KAAK,UAAU,YAAY,CAAC,KAAa;IACvC,OAAO,IAAI,OAAO,CAAC,CAAC,OAAO,EAAE,EAAE;QAC7B,MAAM,MAAM,GAAG,GAAG,CAAC,YAAY,EAAE,CAAC;QAClC,MAAM,CAAC,MAAM,CAAC,KAAK,EAAE,WAAW,EAAE,GAAG,EAAE;YACrC,MAAM,IAAI,GAAI,MAAM,CAAC,OAAO,EAAsB,CAAC,IAAI,CAAC;YACxD,MAAM,CAAC,KAAK,CAAC,GAAG,EAAE,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC,CAAC;QACpC,CAAC,CAAC,CAAC;QACH,MAAM,CAAC,EAAE,CAAC,OAAO,EAAE,GAAG,EAAE,CAAC,YAAY,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC,CAAC;IAClE,CAAC,CAAC,CAAC;AACL,CAAC;AAED,MAAM,OAAO,kBAAkB;IACrB,IAAI,GAAwB,IAAI,CAAC;IACjC,KAAK,GAAG,CAAC,CAAC;IACV,UAAU,GAAG,EAAE,CAAC;IAChB,QAAQ,GAAG,KAAK,CAAC;IACjB,MAAM,GAAG,KAAK,CAAC;IACf,OAAO,CAAS;IAChB,WAAW,CAAU;IACrB,IAAI,CAAS;IAErB,YAAY,OAAe,EAAE,WAAW,GAAG,KAAK;QAC9C,IAAI,CAAC,OAAO,GAAG,OAAO,CAAC;QACvB,IAAI,CAAC,WAAW,GAAG,WAAW,CAAC;QAC/B,IAAI,CAAC,IAAI,GAAG,WAAW,CAAC,CAAC,CAAC,WAAW,CAAC,CAAC,CAAC,MAAM,CAAC;IACjD,CAAC;IAED,IAAI,IAAI,KAAK,OAAO,IAAI,CAAC,KAAK,CAAC,CAAC,CAAC;IACjC,IAAI,SAAS,KAAK,OAAO,IAAI,CAAC,UAAU,CAAC,CAAC,CAAC;IAC3C,IAAI,OAAO,KAAK,OAAO,IAAI,CAAC,QAAQ,CAAC,CAAC,CAAC;IACvC,IAAI,KAAK,KAAK,OAAO,IAAI,CAAC,MAAM,CAAC,CAAC,CAAC;IAEnC,KAAK,CAAC,KAAK,CAAC,OAAsB;QAChC,MAAM,IAAI,CAAC,IAAI,EAAE,CAAC;QAElB,MAAM,UAAU,GAAG,MAAM,aAAa,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC;QACrD,IAAI,CAAC,KAAK,GAAG,OAAO,CAAC,IAAI,IAAI,MAAM,YAAY,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC;QAChF
,IAAI,CAAC,UAAU,GAAG,OAAO,CAAC,SAAS,CAAC;QAEpC,MAAM,IAAI,GAAG;YACX,SAAS,EAAE,OAAO,CAAC,SAAS;YAC5B,QAAQ,EAAE,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC;YAC5B,QAAQ,EAAE,WAAW;YACrB,gBAAgB,EAAE,MAAM,CAAC,OAAO,CAAC,SAAS,IAAI,CAAC,CAAC,CAAC;YACjD,YAAY,EAAE,GAAG;SAClB,CAAC;QAEF,IAAI,OAAO,CAAC,MAAM;YAAE,IAAI,CAAC,IAAI,CAAC,UAAU,EAAE,OAAO,CAAC,MAAM,CAAC,CAAC;QAC1D,IAAI,OAAO,CAAC,WAAW;YAAE,IAAI,CAAC,IAAI,CAAC,YAAY,EAAE,MAAM,CAAC,OAAO,CAAC,WAAW,CAAC,CAAC,CAAC;QAC9E,IAAI,OAAO,CAAC,SAAS,KAAK,KAAK;YAAE,IAAI,CAAC,IAAI,CAAC,cAAc,EAAE,IAAI,CAAC,CAAC;QACjE,IAAI,OAAO,CAAC,OAAO;YAAE,IAAI,CAAC,IAAI,CAAC,WAAW,EAAE,MAAM,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC,CAAC;QACrE,IAAI,OAAO,CAAC,SAAS;YAAE,IAAI,CAAC,IAAI,CAAC,cAAc,EAAE,MAAM,CAAC,OAAO,CAAC,SAAS,CAAC,CAAC,CAAC;QAC5E,IAAI,OAAO,CAAC,UAAU;YAAE,IAAI,CAAC,IAAI,CAAC,eAAe,EAAE,MAAM,CAAC,OAAO,CAAC,UAAU,CAAC,CAAC,CAAC;QAC/E,IAAI,OAAO,CAAC,UAAU;YAAE,IAAI,CAAC,IAAI,CAAC,gBAAgB,EAAE,OAAO,CAAC,UAAU,CAAC,CAAC;QACxE,IAAI,OAAO,CAAC,UAAU;YAAE,IAAI,CAAC,IAAI,CAAC,gBAAgB,EAAE,OAAO,CAAC,UAAU,CAAC,CAAC;QACxE,IAAI,OAAO,CAAC,KAAK;YAAE,IAAI,CAAC,IAAI,CAAC,SAAS,CAAC,CAAC;QACxC,IAAI,OAAO,CAAC,eAAe,KAAK,SAAS,EAAE,CAAC;YAC1C,IAAI,CAAC,IAAI,CAAC,oBAAoB,EAAE,UAAU,CAAC,CAAC;YAC5C,4DAA4D;YAC5D,kFAAkF;YAClF,MAAM,MAAM,GAAG,OAAO,CAAC,eAAe,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YACpD,IAAI,CAAC,IAAI,CAAC,oBAAoB,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC;QAClD,CAAC;QACD,IAAI,OAAO,CAAC,SAAS,IAAI,IAAI,CAAC,WAAW;YAAE,IAAI,CAAC,IAAI,CAAC,aAAa,CAAC,CAAC;QAEpE,MAAM,CAAC,IAAI,CAAC,2BAA2B,UAAU,IAAI,IAAI,CAAC,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QAEvE,MAAM,MAAM,GAAG,IAAI,CAAC,OAAO,CAAC,UAAU,CAAC,CAAC;QACxC,IAAI,CAAC,IAAI,GAAG,KAAK,CAAC,UAAU,EAAE,IAAI,EAAE;YAClC,KAAK,EAAE,CAAC,QAAQ,EAAE,QAAQ,EAAE,MAAM,CAAC;YACnC,GAAG,EAAE,EAAE,GAAG,OAAO,CAAC,GAAG,EAAE,eAAe,EAAE,GAAG,MAAM,IAAI,OAAO,CAAC,GAAG,CAAC,eAAe,IAAI,EAAE,EAAE,EAAE;SAC3F,CAAC,CAAC;QAEH,8DAA8D;QAC9D,MAAM,YAAY,GAAa,EAAE,CAAC;QAClC,IAAI,CAAC,IAAI,CAAC,MAAM,EAAE,EAAE,CAAC,MAAM,EAAE,CAAC,IAAY,EAAE,EAAE,GAAG,YAAY,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC,CA
AC,CAAC,CAAC,CAAC;QAE7E,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC,MAAM,EAAE,GAAG,EAAE;YACxB,IAAI,CAAC,QAAQ,GAAG,KAAK,CAAC;YACtB,IAAI,CAAC,MAAM,GAAG,KAAK,CAAC;YACpB,IAAI,CAAC,IAAI,GAAG,IAAI,CAAC;YACjB,aAAa,CAAC,IAAI,CAAC,OAAO,EAAE,IAAI,CAAC,IAAI,CAAC,CAAC;QACzC,CAAC,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,GAAG,IAAI,CAAC;QACrB,IAAI,CAAC;YACH,MAAM,IAAI,CAAC,YAAY,EAAE,CAAC;QAC5B,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,MAAM,MAAM,GAAG,MAAM,CAAC,MAAM,CAAC,YAAY,CAAC,CAAC,QAAQ,EAAE,CAAC,IAAI,EAAE,CAAC;YAC7D,IAAI,MAAM;gBAAE,MAAM,CAAC,KAAK,CAAC,0BAA0B,MAAM,EAAE,CAAC,CAAC;YAC7D,MAAM,GAAG,CAAC;QACZ,CAAC;QACD,IAAI,CAAC,MAAM,GAAG,IAAI,CAAC;QACnB,YAAY,CAAC,IAAI,CAAC,OAAO,EAAE,IAAI,CAAC,IAAI,EAAE,EAAE,GAAG,EAAE,IAAI,CAAC,IAAK,CAAC,GAAI,EAAE,IAAI,EAAE,IAAI,CAAC,KAAK,EAAE,KAAK,EAAE,IAAI,CAAC,UAAU,EAAE,CAAC,CAAC;QAE1G,MAAM,CAAC,IAAI,CAAC,+BAA+B,IAAI,CAAC,KAAK,EAAE,CAAC,CAAC;IAC3D,CAAC;IAED,KAAK,CAAC,IAAI;QACR,IAAI,CAAC,IAAI,CAAC,IAAI;YAAE,OAAO;QAEvB,MAAM,CAAC,IAAI,CAAC,wBAAwB,CAAC,CAAC;QACtC,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,SAAS,CAAC,CAAC;QAE1B,MAAM,IAAI,OAAO,CAAO,CAAC,OAAO,EAAE,EAAE;YAClC,MAAM,OAAO,GAAG,UAAU,CAAC,GAAG,EAAE;gBAC9B,IAAI,CAAC,IAAI,EAAE,IAAI,CAAC,SAAS,CAAC,CAAC;gBAC3B,OAAO,EAAE,CAAC;YACZ,CAAC,EAAE,IAAI,CAAC,CAAC;YAET,IAAI,IAAI,CAAC,IAAI,EAAE,CAAC;gBACd,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC,MAAM,EAAE,GAAG,EAAE;oBACxB,YAAY,CAAC,OAAO,CAAC,CAAC;oBACtB,OAAO,EAAE,CAAC;gBACZ,CAAC,CAAC,CAAC;YACL,CAAC;iBAAM,CAAC;gBACN,YAAY,CAAC,OAAO,CAAC,CAAC;gBACtB,OAAO,EAAE,CAAC;YACZ,CAAC;QACH,CAAC,CAAC,CAAC;QAEH,IAAI,CAAC,IAAI,GAAG,IAAI,CAAC;QACjB,IAAI,CAAC,QAAQ,GAAG,KAAK,CAAC;QACtB,IAAI,CAAC,MAAM,GAAG,KAAK,CAAC;IACtB,CAAC;IAED,UAAU;QACR,OAAO,oBAAoB,IAAI,CAAC,KAAK,EAAE,CAAC;IAC1C,CAAC;IAED,KAAK,CAAC,cAAc;QAClB,IAAI,CAAC,IAAI,CAAC,MAAM;YAAE,OAAO,IAAI,CAAC;QAC9B,IAAI,CAAC;YACH,MAAM,GAAG,GAAG,MAAM,KAAK,CAAC,GAAG,IAAI,CAAC,UAAU,EAAE,QAAQ,CAAC,CAAC;YACtD,IAAI,GAAG,CAAC,EAAE;gBAAE,OAAO,GAAG,CAAC,IAAI,EAAE,CAAC;QAChC,CAAC;QAAC,MAAM,CAAC,CAAC,wBAAwB,CAAC,CAAC;QACpC,OAAO,IAAI,CAAC;IACd,CAAC;IAGO,KAAK,CAAC,YAAY;QACxB,MAAM,KAAK,GAAG,IAAI,CAAC
,GAAG,EAAE,CAAC;QACzB,OAAO,IAAI,CAAC,GAAG,EAAE,GAAG,KAAK,GAAG,kBAAkB,EAAE,CAAC;YAC/C,IAAI,CAAC,IAAI,CAAC,QAAQ;gBAAE,MAAM,IAAI,KAAK,CAAC,4CAA4C,CAAC,CAAC;YAClF,IAAI,CAAC;gBACH,MAAM,GAAG,GAAG,MAAM,KAAK,CAAC,oBAAoB,IAAI,CAAC,KAAK,SAAS,CAAC,CAAC;gBACjE,IAAI,GAAG,CAAC,EAAE,EAAE,CAAC;oBACX,MAAM,IAAI,GAAQ,MAAM,GAAG,CAAC,IAAI,EAAE,CAAC;oBACnC,IAAI,IAAI,CAAC,MAAM,KAAK,IAAI;wBAAE,OAAO;gBACnC,CAAC;YACH,CAAC;YAAC,MAAM,CAAC,CAAC,mBAAmB,CAAC,CAAC;YAC/B,MAAM,IAAI,OAAO,CAAC,CAAC,CAAC,EAAE,CAAC,UAAU,CAAC,CAAC,EAAE,cAAc,CAAC,CAAC,CAAC;QACxD,CAAC;QACD,MAAM,IAAI,CAAC,IAAI,EAAE,CAAC;QAClB,MAAM,IAAI,KAAK,CAAC,8CAA8C,kBAAkB,GAAG,IAAI,GAAG,CAAC,CAAC;IAC9F,CAAC;CACF"}
|
|
@@ -0,0 +1,33 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Resolve the path to the mlx-serve binary.
|
|
3
|
+
*
|
|
4
|
+
* 1. Check if `mlx-serve` is on PATH (system install)
|
|
5
|
+
* 2. Check if already downloaded to `<baseDir>/.mlx-serve/macos-arm64/`
|
|
6
|
+
* 3. Download from GitHub releases (macOS ARM64 only)
*
* @param baseDir Directory under which the managed `.mlx-serve` folder lives.
* @returns Promise resolving to the binary path.
*          NOTE(review): presumably rejects when none of the three steps yields a binary — confirm against the implementation.
|
|
7
|
+
*/
|
|
8
|
+
export declare function getMlxBinaryPath(baseDir: string): Promise<string>;
|
|
9
|
+
/**
|
|
10
|
+
* Get the version string from the local mlx-serve binary without triggering a download.
*
* @param baseDir Directory under which the managed `.mlx-serve` folder lives.
* @returns The version string, or null.
*          NOTE(review): null presumably means no local binary or no readable version — confirm against the implementation.
|
|
11
|
+
*/
|
|
12
|
+
export declare function getMlxBinaryVersion(baseDir: string): string | null;
|
|
13
|
+
/**
|
|
14
|
+
* Check if mlx-serve is a system install (on PATH) vs managed by us.
*
* @returns true for a system install found on PATH, false otherwise.
|
|
15
|
+
*/
|
|
16
|
+
export declare function isMlxSystemBinary(): boolean;
|
|
17
|
+
/** Result of comparing the local mlx-serve binary with the latest published release (returned by `checkForMlxUpdate`). */
export interface MlxUpdateInfo {
|
|
18
|
+
/** NOTE(review): presumably true when the latest release is newer than the local version — confirm against the implementation. */
available: boolean;
|
|
19
|
+
/** Version of the local binary, or null (presumably when it could not be determined — confirm). */
currentVersion: string | null;
|
|
20
|
+
/** Version of the latest release, or null (presumably when the lookup failed — confirm). */
latestVersion: string | null;
|
|
21
|
+
/** Tag of the latest release, or null. */
latestTag: string | null;
|
|
22
|
+
/** Publication timestamp of the latest release as a string, or null. NOTE(review): exact format not visible here. */
publishedAt: string | null;
|
|
23
|
+
}
|
|
24
|
+
/**
|
|
25
|
+
* Compare local mlx-serve version with latest GitHub release.
|
|
26
|
+
* Uses semver comparison (e.g., 0.3.0 vs 0.3.1).
*
* @param baseDir Directory under which the managed `.mlx-serve` folder lives.
* @returns Promise resolving to the comparison result (see MlxUpdateInfo).
|
|
27
|
+
*/
|
|
28
|
+
export declare function checkForMlxUpdate(baseDir: string): Promise<MlxUpdateInfo>;
|
|
29
|
+
/**
|
|
30
|
+
* Delete the current managed binary and re-download the latest release from GitHub.
*
* @param baseDir Directory under which the managed `.mlx-serve` folder lives.
* @returns Promise that resolves when the update has finished.
*          NOTE(review): behaviour for a system-installed binary is not visible here — confirm.
|
|
31
|
+
*/
|
|
32
|
+
export declare function updateMlxBinary(baseDir: string): Promise<void>;
|
|
33
|
+
//# sourceMappingURL=mlx-binary-manager.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"mlx-binary-manager.d.ts","sourceRoot":"","sources":["../../../lib/local-llm/mlx-binary-manager.ts"],"names":[],"mappings":"AAeA;;;;;;GAMG;AACH,wBAAsB,gBAAgB,CAAC,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAqBvE;AAkFD;;GAEG;AACH,wBAAgB,mBAAmB,CAAC,OAAO,EAAE,MAAM,GAAG,MAAM,GAAG,IAAI,CAiClE;AAED;;GAEG;AACH,wBAAgB,iBAAiB,IAAI,OAAO,CAS3C;AAED,MAAM,WAAW,aAAa;IAC5B,SAAS,EAAE,OAAO,CAAC;IACnB,cAAc,EAAE,MAAM,GAAG,IAAI,CAAC;IAC9B,aAAa,EAAE,MAAM,GAAG,IAAI,CAAC;IAC7B,SAAS,EAAE,MAAM,GAAG,IAAI,CAAC;IACzB,WAAW,EAAE,MAAM,GAAG,IAAI,CAAC;CAC5B;AAED;;;GAGG;AACH,wBAAsB,iBAAiB,CAAC,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,aAAa,CAAC,CAmB/E;AAED;;GAEG;AACH,wBAAsB,eAAe,CAAC,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC,CAOpE"}
|