@tmhs/local-ai-mcp 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (60) hide show
  1. package/LICENSE +34 -0
  2. package/README.md +126 -0
  3. package/dist/catalog/models.d.ts +11 -0
  4. package/dist/catalog/models.js +114 -0
  5. package/dist/catalog/models.js.map +1 -0
  6. package/dist/config.d.ts +7 -0
  7. package/dist/config.js +22 -0
  8. package/dist/config.js.map +1 -0
  9. package/dist/hardware/index.d.ts +16 -0
  10. package/dist/hardware/index.js +30 -0
  11. package/dist/hardware/index.js.map +1 -0
  12. package/dist/hardware/linux.d.ts +2 -0
  13. package/dist/hardware/linux.js +48 -0
  14. package/dist/hardware/linux.js.map +1 -0
  15. package/dist/hardware/windows.d.ts +2 -0
  16. package/dist/hardware/windows.js +60 -0
  17. package/dist/hardware/windows.js.map +1 -0
  18. package/dist/http.d.ts +14 -0
  19. package/dist/http.js +61 -0
  20. package/dist/http.js.map +1 -0
  21. package/dist/index.d.ts +2 -0
  22. package/dist/index.js +24 -0
  23. package/dist/index.js.map +1 -0
  24. package/dist/providers/lmstudio.d.ts +44 -0
  25. package/dist/providers/lmstudio.js +181 -0
  26. package/dist/providers/lmstudio.js.map +1 -0
  27. package/dist/providers/manager.d.ts +9 -0
  28. package/dist/providers/manager.js +31 -0
  29. package/dist/providers/manager.js.map +1 -0
  30. package/dist/providers/ollama.d.ts +34 -0
  31. package/dist/providers/ollama.js +157 -0
  32. package/dist/providers/ollama.js.map +1 -0
  33. package/dist/providers/types.d.ts +102 -0
  34. package/dist/providers/types.js +2 -0
  35. package/dist/providers/types.js.map +1 -0
  36. package/dist/tools/catalog.d.ts +3 -0
  37. package/dist/tools/catalog.js +55 -0
  38. package/dist/tools/catalog.js.map +1 -0
  39. package/dist/tools/context.d.ts +8 -0
  40. package/dist/tools/context.js +2 -0
  41. package/dist/tools/context.js.map +1 -0
  42. package/dist/tools/delegation.d.ts +3 -0
  43. package/dist/tools/delegation.js +54 -0
  44. package/dist/tools/delegation.js.map +1 -0
  45. package/dist/tools/discovery.d.ts +3 -0
  46. package/dist/tools/discovery.js +61 -0
  47. package/dist/tools/discovery.js.map +1 -0
  48. package/dist/tools/helpers.d.ts +42 -0
  49. package/dist/tools/helpers.js +83 -0
  50. package/dist/tools/helpers.js.map +1 -0
  51. package/dist/tools/index.d.ts +3 -0
  52. package/dist/tools/index.js +13 -0
  53. package/dist/tools/index.js.map +1 -0
  54. package/dist/tools/lifecycle.d.ts +3 -0
  55. package/dist/tools/lifecycle.js +66 -0
  56. package/dist/tools/lifecycle.js.map +1 -0
  57. package/dist/tools/ops.d.ts +12 -0
  58. package/dist/tools/ops.js +113 -0
  59. package/dist/tools/ops.js.map +1 -0
  60. package/package.json +54 -0
package/LICENSE ADDED
@@ -0,0 +1,34 @@
1
+ Creative Commons Attribution-NonCommercial-NoDerivatives 4.0 International
2
+
3
+ Copyright (c) 2026 TM Hospitality Strategies
4
+
5
+ This work is licensed under the Creative Commons
6
+ Attribution-NonCommercial-NoDerivatives 4.0 International License.
7
+
8
+ You are free to:
9
+
10
+ Share - copy and redistribute the material in any medium or format.
11
+
12
+ The licensor cannot revoke these freedoms as long as you follow the
13
+ license terms.
14
+
15
+ Under the following terms:
16
+
17
+ Attribution - You must give appropriate credit, provide a link to the
18
+ license, and indicate if changes were made. You may do so in any
19
+ reasonable manner, but not in any way that suggests the licensor
20
+ endorses you or your use.
21
+
22
+ NonCommercial - You may not use the material for commercial purposes.
23
+
24
+ NoDerivatives - If you remix, transform, or build upon the material,
25
+ you may not distribute the modified material.
26
+
27
+ No additional restrictions - You may not apply legal terms or
28
+ technological measures that legally restrict others from doing
29
+ anything the license permits.
30
+
31
+ Full license text:
32
+ https://creativecommons.org/licenses/by-nc-nd/4.0/legalcode
33
+
34
+ SPDX-License-Identifier: CC-BY-NC-ND-4.0
package/README.md ADDED
@@ -0,0 +1,126 @@
1
+ # Local AI MCP
2
+
3
+ **Unified MCP server for managing local model runtimes (Ollama, LM Studio, and more): provider-agnostic discovery, lifecycle, hardware-fit, and delegated inference.**
4
+
5
+ ![License: CC-BY-NC-ND-4.0](https://img.shields.io/badge/license-CC--BY--NC--ND--4.0-green)
6
+ ![Version](https://img.shields.io/badge/version-0.1.0-blue)
7
+ ![Type](https://img.shields.io/badge/type-mcp--server-7c3aed)
8
+
9
+ ---
10
+
11
+ Local AI MCP is an [MCP](https://modelcontextprotocol.io) server that turns your local model runtimes into an agent-callable control plane. It is **operations-first**: its primary job is to discover, inspect, fit, and manage the models running on your own machine. It speaks to runtimes over their local HTTP APIs and exposes one consistent tool surface across them, so an agent does not need to know whether a model lives in Ollama or LM Studio.
12
+
13
+ The server communicates over **stdio only**. It is a *client* to your local runtimes and never opens a network listener of its own.
14
+
15
+ ## Why an ops-first local-model server
16
+
17
+ - **Discovery and lifecycle, not just chat.** List what is installed, what is loaded, pull and remove models, load and unload them, and check their fit against your hardware before you commit VRAM to them.
18
+ - **Hardware-aware.** `system_resources` and `fit_check` read your real RAM and GPU/VRAM so an agent can pick a model that will actually run, and `suggest_model` ranks candidates by task *and* by what fits.
19
+ - **Provider-agnostic.** Every tool takes an optional `provider` argument. Omit it and the tool operates across all detected runtimes, aggregating results per provider.
20
+
21
+ ## Inference is delegation, not chat
22
+
23
+ The `complete` and `embed` tools exist to **delegate (offload) inference to a local model** for cost control and privacy: keep tokens and data on your own hardware instead of sending them to a hosted API. They are deliberately framed as delegated/offloaded inference primitives, not as a conversational chat surface.
24
+
25
+ ## The provider-adapter model
26
+
27
+ Each runtime is implemented as an adapter behind a single `Provider` interface (`src/providers/types.ts`) with a uniform method set: `detect`, `health`, `listModels`, `listLoaded`, `modelInfo`, `pull`, `remove`, `load`, `unload`, `complete`, `embed`, and `capabilities`. Adding a runtime means adding one adapter; the tool layer is unchanged.
28
+
29
+ | Adapter | Default host | Transport | Notes |
30
+ |---------|--------------|-----------|-------|
31
+ | **Ollama** (`src/providers/ollama.ts`) | `http://localhost:11434` | Native REST + OpenAI-compatible | `load`/`unload` map to Ollama `keep_alive` semantics (`keep_alive` to load, `keep_alive: 0` to unload). `complete`/`embed` use the OpenAI-compatible `/v1` routes. |
32
+ | **LM Studio** (`src/providers/lmstudio.ts`) | `http://localhost:1234` | REST (`/api/v0`) + OpenAI-compatible | Uses the `lms` CLI for `load`/`unload`/`pull`/`remove` when present; falls back to REST for `listModels`/`listLoaded`/`complete`/`embed`. |
33
+
34
+ **Auto-detection:** on each call the server probes the configured local endpoints to determine which runtimes are live. Hardware probing is isolated in `src/hardware/` and branches by platform (Windows / Linux); it exposes total/free RAM and, where detectable, GPU name and VRAM.
35
+
36
+ ## Tool surface (16 tools)
37
+
38
+ ### Discovery
39
+ | Tool | Description |
40
+ |------|-------------|
41
+ | `list_providers` | Configured runtimes, their host, live/detected status, and capabilities. |
42
+ | `list_models` | Installed models across detected providers (or one provider). |
43
+ | `list_loaded` | Models currently resident in memory. |
44
+ | `model_info` | Detailed metadata for a model. |
45
+
46
+ ### Lifecycle
47
+ | Tool | Description |
48
+ |------|-------------|
49
+ | `pull_model` | Download a model. **Heavy: may transfer multiple GB.** |
50
+ | `remove_model` | Delete a model from disk. **Destructive: requires `confirm: true` and refuses without it.** |
51
+ | `load_model` | Load a model into memory (Ollama `keep_alive`; LM Studio `lms load`). |
52
+ | `unload_model` | Evict a model from memory. |
53
+
54
+ ### Ops
55
+ | Tool | Description |
56
+ |------|-------------|
57
+ | `health_check` | Liveness and version per provider. |
58
+ | `system_resources` | Total/free RAM, CPU count, and GPU/VRAM. |
59
+ | `fit_check` | Whether a model fits in free VRAM (GPU) or RAM (CPU), with the numbers. |
60
+ | `benchmark` | Measure latency and tokens/sec with one small completion. **Heavy: runs real inference.** |
61
+
62
+ ### Registry
63
+ | Tool | Description |
64
+ |------|-------------|
65
+ | `search_available` | Search a curated catalog of well-known models (Ollama library oriented). |
66
+ | `suggest_model` | Recommend a model for a task, ranked by what fits your detected hardware. |
67
+
68
+ ### Delegation (offloaded inference)
69
+ | Tool | Description |
70
+ |------|-------------|
71
+ | `complete` | Delegate a completion to a local model (cost/privacy offload, not chat). |
72
+ | `embed` | Delegate embedding generation to a local model. |
73
+
74
+ Every tool except `system_resources` accepts an optional `provider` (`ollama` \| `lmstudio`). Omit it to operate across all detected runtimes.
75
+
76
+ ## Install and run
77
+
78
+ ```bash
79
+ npx @tmhs/local-ai-mcp
80
+ ```
81
+
82
+ ### Claude Desktop / Cursor config
83
+
84
+ ```json
85
+ {
86
+ "mcpServers": {
87
+ "local-ai": {
88
+ "command": "npx",
89
+ "args": ["-y", "@tmhs/local-ai-mcp"],
90
+ "env": {
91
+ "OLLAMA_HOST": "http://localhost:11434",
92
+ "LMSTUDIO_HOST": "http://localhost:1234"
93
+ }
94
+ }
95
+ }
96
+ }
97
+ ```
98
+
99
+ ## Configuration
100
+
101
+ All configuration is via environment variables with sane defaults:
102
+
103
+ | Variable | Default | Description |
104
+ |----------|---------|-------------|
105
+ | `OLLAMA_HOST` | `http://localhost:11434` | Ollama base URL (scheme optional; added if missing). |
106
+ | `LMSTUDIO_HOST` | `http://localhost:1234` | LM Studio base URL. |
107
+ | `LOCAL_AI_REQUEST_TIMEOUT_MS` | `120000` | Timeout for normal requests (inference, pull progress, etc.). |
108
+ | `LOCAL_AI_DETECT_TIMEOUT_MS` | `1500` | Timeout for provider auto-detection probes. |
109
+
110
+ ## Development
111
+
112
+ ```bash
113
+ npm install
114
+ npm run build # tsc -> dist/
115
+ npm test # vitest; runs fully offline (mocked HTTP, stubbed hardware)
116
+ ```
117
+
118
+ The test suite requires **no running runtime and no downloaded model**: every HTTP call is mocked and hardware probing is stubbed.
119
+
120
+ ## License
121
+
122
+ CC-BY-NC-ND-4.0 -- see [LICENSE](LICENSE).
123
+
124
+ ---
125
+
126
+ **Built by TMHSDigital**
@@ -0,0 +1,11 @@
1
+ export interface CatalogModel {
2
+ name: string;
3
+ family: string;
4
+ parameterSize: string;
5
+ approxSizeBytes: number;
6
+ quantization: string;
7
+ tasks: string[];
8
+ }
9
+ export declare const CATALOG: CatalogModel[];
10
+ export declare function searchCatalog(query: string): CatalogModel[];
11
+ export declare function fitsIn(approxSizeBytes: number, freeBytes: number): boolean;
@@ -0,0 +1,114 @@
1
+ const GB = 1024 * 1024 * 1024;
2
+ export const CATALOG = [
3
+ {
4
+ name: "llama3.2:3b",
5
+ family: "llama",
6
+ parameterSize: "3B",
7
+ approxSizeBytes: Math.round(2.0 * GB),
8
+ quantization: "Q4_K_M",
9
+ tasks: ["chat", "general"],
10
+ },
11
+ {
12
+ name: "llama3.1:8b",
13
+ family: "llama",
14
+ parameterSize: "8B",
15
+ approxSizeBytes: Math.round(4.7 * GB),
16
+ quantization: "Q4_K_M",
17
+ tasks: ["chat", "general", "reasoning"],
18
+ },
19
+ {
20
+ name: "qwen2.5-coder:7b",
21
+ family: "qwen2",
22
+ parameterSize: "7B",
23
+ approxSizeBytes: Math.round(4.7 * GB),
24
+ quantization: "Q4_K_M",
25
+ tasks: ["code", "general"],
26
+ },
27
+ {
28
+ name: "qwen2.5:14b",
29
+ family: "qwen2",
30
+ parameterSize: "14B",
31
+ approxSizeBytes: Math.round(9.0 * GB),
32
+ quantization: "Q4_K_M",
33
+ tasks: ["chat", "general", "reasoning"],
34
+ },
35
+ {
36
+ name: "mistral:7b",
37
+ family: "mistral",
38
+ parameterSize: "7B",
39
+ approxSizeBytes: Math.round(4.1 * GB),
40
+ quantization: "Q4_0",
41
+ tasks: ["chat", "general"],
42
+ },
43
+ {
44
+ name: "gemma2:9b",
45
+ family: "gemma2",
46
+ parameterSize: "9B",
47
+ approxSizeBytes: Math.round(5.4 * GB),
48
+ quantization: "Q4_0",
49
+ tasks: ["chat", "general"],
50
+ },
51
+ {
52
+ name: "phi3.5:3.8b",
53
+ family: "phi3",
54
+ parameterSize: "3.8B",
55
+ approxSizeBytes: Math.round(2.2 * GB),
56
+ quantization: "Q4_0",
57
+ tasks: ["chat", "general", "reasoning"],
58
+ },
59
+ {
60
+ name: "nomic-embed-text",
61
+ family: "nomic-bert",
62
+ parameterSize: "137M",
63
+ approxSizeBytes: Math.round(0.27 * GB),
64
+ quantization: "F16",
65
+ tasks: ["embed"],
66
+ },
67
+ {
68
+ name: "mxbai-embed-large",
69
+ family: "bert",
70
+ parameterSize: "335M",
71
+ approxSizeBytes: Math.round(0.67 * GB),
72
+ quantization: "F16",
73
+ tasks: ["embed"],
74
+ },
75
+ {
76
+ name: "llava:7b",
77
+ family: "llama",
78
+ parameterSize: "7B",
79
+ approxSizeBytes: Math.round(4.7 * GB),
80
+ quantization: "Q4_0",
81
+ tasks: ["vision", "chat"],
82
+ },
83
+ {
84
+ name: "deepseek-r1:7b",
85
+ family: "qwen2",
86
+ parameterSize: "7B",
87
+ approxSizeBytes: Math.round(4.7 * GB),
88
+ quantization: "Q4_K_M",
89
+ tasks: ["reasoning", "chat"],
90
+ },
91
+ {
92
+ name: "codellama:13b",
93
+ family: "llama",
94
+ parameterSize: "13B",
95
+ approxSizeBytes: Math.round(7.4 * GB),
96
+ quantization: "Q4_0",
97
+ tasks: ["code", "general"],
98
+ },
99
+ ];
100
+ export function searchCatalog(query) {
101
+ const q = query.trim().toLowerCase();
102
+ if (!q)
103
+ return [...CATALOG];
104
+ return CATALOG.filter((m) => {
105
+ return (m.name.toLowerCase().includes(q) ||
106
+ m.family.toLowerCase().includes(q) ||
107
+ m.parameterSize.toLowerCase().includes(q) ||
108
+ m.tasks.some((t) => t.toLowerCase().includes(q)));
109
+ });
110
+ }
111
+ export function fitsIn(approxSizeBytes, freeBytes) {
112
+ return approxSizeBytes * 1.2 <= freeBytes;
113
+ }
114
+ //# sourceMappingURL=models.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"models.js","sourceRoot":"","sources":["../../src/catalog/models.ts"],"names":[],"mappings":"AASA,MAAM,EAAE,GAAG,IAAI,GAAG,IAAI,GAAG,IAAI,CAAC;AAE9B,MAAM,CAAC,MAAM,OAAO,GAAmB;IACrC;QACE,IAAI,EAAE,aAAa;QACnB,MAAM,EAAE,OAAO;QACf,aAAa,EAAE,IAAI;QACnB,eAAe,EAAE,IAAI,CAAC,KAAK,CAAC,GAAG,GAAG,EAAE,CAAC;QACrC,YAAY,EAAE,QAAQ;QACtB,KAAK,EAAE,CAAC,MAAM,EAAE,SAAS,CAAC;KAC3B;IACD;QACE,IAAI,EAAE,aAAa;QACnB,MAAM,EAAE,OAAO;QACf,aAAa,EAAE,IAAI;QACnB,eAAe,EAAE,IAAI,CAAC,KAAK,CAAC,GAAG,GAAG,EAAE,CAAC;QACrC,YAAY,EAAE,QAAQ;QACtB,KAAK,EAAE,CAAC,MAAM,EAAE,SAAS,EAAE,WAAW,CAAC;KACxC;IACD;QACE,IAAI,EAAE,kBAAkB;QACxB,MAAM,EAAE,OAAO;QACf,aAAa,EAAE,IAAI;QACnB,eAAe,EAAE,IAAI,CAAC,KAAK,CAAC,GAAG,GAAG,EAAE,CAAC;QACrC,YAAY,EAAE,QAAQ;QACtB,KAAK,EAAE,CAAC,MAAM,EAAE,SAAS,CAAC;KAC3B;IACD;QACE,IAAI,EAAE,aAAa;QACnB,MAAM,EAAE,OAAO;QACf,aAAa,EAAE,KAAK;QACpB,eAAe,EAAE,IAAI,CAAC,KAAK,CAAC,GAAG,GAAG,EAAE,CAAC;QACrC,YAAY,EAAE,QAAQ;QACtB,KAAK,EAAE,CAAC,MAAM,EAAE,SAAS,EAAE,WAAW,CAAC;KACxC;IACD;QACE,IAAI,EAAE,YAAY;QAClB,MAAM,EAAE,SAAS;QACjB,aAAa,EAAE,IAAI;QACnB,eAAe,EAAE,IAAI,CAAC,KAAK,CAAC,GAAG,GAAG,EAAE,CAAC;QACrC,YAAY,EAAE,MAAM;QACpB,KAAK,EAAE,CAAC,MAAM,EAAE,SAAS,CAAC;KAC3B;IACD;QACE,IAAI,EAAE,WAAW;QACjB,MAAM,EAAE,QAAQ;QAChB,aAAa,EAAE,IAAI;QACnB,eAAe,EAAE,IAAI,CAAC,KAAK,CAAC,GAAG,GAAG,EAAE,CAAC;QACrC,YAAY,EAAE,MAAM;QACpB,KAAK,EAAE,CAAC,MAAM,EAAE,SAAS,CAAC;KAC3B;IACD;QACE,IAAI,EAAE,aAAa;QACnB,MAAM,EAAE,MAAM;QACd,aAAa,EAAE,MAAM;QACrB,eAAe,EAAE,IAAI,CAAC,KAAK,CAAC,GAAG,GAAG,EAAE,CAAC;QACrC,YAAY,EAAE,MAAM;QACpB,KAAK,EAAE,CAAC,MAAM,EAAE,SAAS,EAAE,WAAW,CAAC;KACxC;IACD;QACE,IAAI,EAAE,kBAAkB;QACxB,MAAM,EAAE,YAAY;QACpB,aAAa,EAAE,MAAM;QACrB,eAAe,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,GAAG,EAAE,CAAC;QACtC,YAAY,EAAE,KAAK;QACnB,KAAK,EAAE,CAAC,OAAO,CAAC;KACjB;IACD;QACE,IAAI,EAAE,mBAAmB;QACzB,MAAM,EAAE,MAAM;QACd,aAAa,EAAE,MAAM;QACrB,eAAe,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,GAAG,EAAE,CAAC;QACtC,YAAY,EAAE,KAAK;QACnB,KAAK,EAAE,CAAC,OAAO,CAAC;KACjB;IACD;QACE,IAAI,EAAE,UAAU;QAChB,MAAM,EAAE,OAAO;QACf,aAAa,EAAE,IAAI;QACnB,eAAe,EAAE,IAAI,CAAC,KAAK,CAAC,GAAG,GAAG,EAAE,CAAC;QACrC,YAAY,EAAE,MAAM;QACpB,KAAK,EAAE,CAAC,QAAQ,EAAE,MAAM,CAAC;KAC1B;IACD;QACE,IAAI,EAAE,gBAAgB;QACtB,MAAM,EAAE,OAAO;QACf,aAAa,EAAE,IAAI;QACnB,eAAe,EAAE,IAAI,CAAC,KAAK,CAAC,GAAG,GAAG,EAAE,CAAC;QACrC,YAAY,EAAE,QAAQ;QACtB,KAAK,EAAE,CAAC,WAAW,EAAE,MAAM,CAAC;KAC7B;IACD;QACE,IAAI,EAAE,eAAe;QACrB,MAAM,EAAE,OAAO;QACf,aAAa,EAAE,KAAK;QACpB,eAAe,EAAE,IAAI,CAAC,KAAK,CAAC,GAAG,GAAG,EAAE,CAAC;QACrC,YAAY,EAAE,MAAM;QACpB,KAAK,EAAE,CAAC,MAAM,EAAE,SAAS,CAAC;KAC3B;CACF,CAAC;AAEF,MAAM,UAAU,aAAa,CAAC,KAAa;IACzC,MAAM,CAAC,GAAG,KAAK,CAAC,IAAI,EAAE,CAAC,WAAW,EAAE,CAAC;IACrC,IAAI,CAAC,CAAC;QAAE,OAAO,CAAC,GAAG,OAAO,CAAC,CAAC;IAC5B,OAAO,OAAO,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE;QAC1B,OAAO,CACL,CAAC,CAAC,IAAI,CAAC,WAAW,EAAE,CAAC,QAAQ,CAAC,CAAC,CAAC;YAChC,CAAC,CAAC,MAAM,CAAC,WAAW,EAAE,CAAC,QAAQ,CAAC,CAAC,CAAC;YAClC,CAAC,CAAC,aAAa,CAAC,WAAW,EAAE,CAAC,QAAQ,CAAC,CAAC,CAAC;YACzC,CAAC,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,WAAW,EAAE,CAAC,QAAQ,CAAC,CAAC,CAAC,CAAC,CACjD,CAAC;IACJ,CAAC,CAAC,CAAC;AACL,CAAC;AAED,MAAM,UAAU,MAAM,CAAC,eAAuB,EAAE,SAAiB;IAC/D,OAAO,eAAe,GAAG,GAAG,IAAI,SAAS,CAAC;AAC5C,CAAC"}
@@ -0,0 +1,7 @@
1
+ export interface Config {
2
+ ollamaHost: string;
3
+ lmstudioHost: string;
4
+ requestTimeoutMs: number;
5
+ detectTimeoutMs: number;
6
+ }
7
+ export declare function loadConfig(env?: NodeJS.ProcessEnv): Config;
package/dist/config.js ADDED
@@ -0,0 +1,22 @@
1
+ function normalizeHost(value) {
2
+ let host = value.trim();
3
+ if (!/^https?:\/\//i.test(host)) {
4
+ host = `http://${host}`;
5
+ }
6
+ return host.replace(/\/+$/, "");
7
+ }
8
+ function parseIntEnv(value, fallback) {
9
+ if (value === undefined || value.trim() === "")
10
+ return fallback;
11
+ const n = Number.parseInt(value, 10);
12
+ return Number.isFinite(n) && n > 0 ? n : fallback;
13
+ }
14
+ export function loadConfig(env = process.env) {
15
+ return {
16
+ ollamaHost: normalizeHost(env.OLLAMA_HOST ?? "http://localhost:11434"),
17
+ lmstudioHost: normalizeHost(env.LMSTUDIO_HOST ?? "http://localhost:1234"),
18
+ requestTimeoutMs: parseIntEnv(env.LOCAL_AI_REQUEST_TIMEOUT_MS, 120000),
19
+ detectTimeoutMs: parseIntEnv(env.LOCAL_AI_DETECT_TIMEOUT_MS, 1500),
20
+ };
21
+ }
22
+ //# sourceMappingURL=config.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"config.js","sourceRoot":"","sources":["../src/config.ts"],"names":[],"mappings":"AAOA,SAAS,aAAa,CAAC,KAAa;IAClC,IAAI,IAAI,GAAG,KAAK,CAAC,IAAI,EAAE,CAAC;IACxB,IAAI,CAAC,eAAe,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAChC,IAAI,GAAG,UAAU,IAAI,EAAE,CAAC;IAC1B,CAAC;IACD,OAAO,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC,CAAC;AAClC,CAAC;AAED,SAAS,WAAW,CAAC,KAAyB,EAAE,QAAgB;IAC9D,IAAI,KAAK,KAAK,SAAS,IAAI,KAAK,CAAC,IAAI,EAAE,KAAK,EAAE;QAAE,OAAO,QAAQ,CAAC;IAChE,MAAM,CAAC,GAAG,MAAM,CAAC,QAAQ,CAAC,KAAK,EAAE,EAAE,CAAC,CAAC;IACrC,OAAO,MAAM,CAAC,QAAQ,CAAC,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC;AACpD,CAAC;AAED,MAAM,UAAU,UAAU,CAAC,MAAyB,OAAO,CAAC,GAAG;IAC7D,OAAO;QACL,UAAU,EAAE,aAAa,CAAC,GAAG,CAAC,WAAW,IAAI,wBAAwB,CAAC;QACtE,YAAY,EAAE,aAAa,CAAC,GAAG,CAAC,aAAa,IAAI,uBAAuB,CAAC;QACzE,gBAAgB,EAAE,WAAW,CAAC,GAAG,CAAC,2BAA2B,EAAE,MAAM,CAAC;QACtE,eAAe,EAAE,WAAW,CAAC,GAAG,CAAC,0BAA0B,EAAE,IAAI,CAAC;KACnE,CAAC;AACJ,CAAC"}
@@ -0,0 +1,16 @@
1
+ export interface GpuInfo {
2
+ name: string;
3
+ vramTotalBytes?: number;
4
+ vramFreeBytes?: number;
5
+ }
6
+ export interface SystemResources {
7
+ platform: string;
8
+ ramTotalBytes: number;
9
+ ramFreeBytes: number;
10
+ cpuCount: number;
11
+ gpus: GpuInfo[];
12
+ }
13
+ export interface HardwareProbe {
14
+ getSystemResources(): Promise<SystemResources>;
15
+ }
16
+ export declare function createHardwareProbe(): HardwareProbe;
@@ -0,0 +1,30 @@
1
+ import os from "node:os";
2
+ export function createHardwareProbe() {
3
+ return {
4
+ async getSystemResources() {
5
+ const platform = os.platform();
6
+ let gpus = [];
7
+ try {
8
+ if (platform === "win32") {
9
+ const mod = await import("./windows.js");
10
+ gpus = mod.probeGpus();
11
+ }
12
+ else if (platform === "linux") {
13
+ const mod = await import("./linux.js");
14
+ gpus = mod.probeGpus();
15
+ }
16
+ }
17
+ catch {
18
+ gpus = [];
19
+ }
20
+ return {
21
+ platform,
22
+ ramTotalBytes: os.totalmem(),
23
+ ramFreeBytes: os.freemem(),
24
+ cpuCount: os.cpus().length,
25
+ gpus,
26
+ };
27
+ },
28
+ };
29
+ }
30
+ //# sourceMappingURL=index.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"index.js","sourceRoot":"","sources":["../../src/hardware/index.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,MAAM,SAAS,CAAC;AAoBzB,MAAM,UAAU,mBAAmB;IACjC,OAAO;QACL,KAAK,CAAC,kBAAkB;YACtB,MAAM,QAAQ,GAAG,EAAE,CAAC,QAAQ,EAAE,CAAC;YAC/B,IAAI,IAAI,GAAc,EAAE,CAAC;YACzB,IAAI,CAAC;gBACH,IAAI,QAAQ,KAAK,OAAO,EAAE,CAAC;oBACzB,MAAM,GAAG,GAAG,MAAM,MAAM,CAAC,cAAc,CAAC,CAAC;oBACzC,IAAI,GAAG,GAAG,CAAC,SAAS,EAAE,CAAC;gBACzB,CAAC;qBAAM,IAAI,QAAQ,KAAK,OAAO,EAAE,CAAC;oBAChC,MAAM,GAAG,GAAG,MAAM,MAAM,CAAC,YAAY,CAAC,CAAC;oBACvC,IAAI,GAAG,GAAG,CAAC,SAAS,EAAE,CAAC;gBACzB,CAAC;YACH,CAAC;YAAC,MAAM,CAAC;gBACP,IAAI,GAAG,EAAE,CAAC;YACZ,CAAC;YACD,OAAO;gBACL,QAAQ;gBACR,aAAa,EAAE,EAAE,CAAC,QAAQ,EAAE;gBAC5B,YAAY,EAAE,EAAE,CAAC,OAAO,EAAE;gBAC1B,QAAQ,EAAE,EAAE,CAAC,IAAI,EAAE,CAAC,MAAM;gBAC1B,IAAI;aACL,CAAC;QACJ,CAAC;KACF,CAAC;AACJ,CAAC"}
@@ -0,0 +1,2 @@
1
+ import type { GpuInfo } from "./index.js";
2
+ export declare function probeGpus(): GpuInfo[];
@@ -0,0 +1,48 @@
1
+ import { spawnSync } from "node:child_process";
2
+ const MB = 1024 * 1024;
3
+ function parseNvidiaSmi(stdout) {
4
+ const gpus = [];
5
+ for (const line of stdout.split(/\r?\n/)) {
6
+ const trimmed = line.trim();
7
+ if (!trimmed)
8
+ continue;
9
+ const parts = trimmed.split(",").map((p) => p.trim());
10
+ if (parts.length < 3)
11
+ continue;
12
+ const [name, totalMb, freeMb] = parts;
13
+ gpus.push({
14
+ name,
15
+ vramTotalBytes: Number.isFinite(Number(totalMb)) ? Number(totalMb) * MB : undefined,
16
+ vramFreeBytes: Number.isFinite(Number(freeMb)) ? Number(freeMb) * MB : undefined,
17
+ });
18
+ }
19
+ return gpus;
20
+ }
21
+ export function probeGpus() {
22
+ try {
23
+ const smi = spawnSync("nvidia-smi", ["--query-gpu=name,memory.total,memory.free", "--format=csv,noheader,nounits"], { encoding: "utf8" });
24
+ if (smi.status === 0 && smi.stdout && smi.stdout.trim()) {
25
+ const gpus = parseNvidiaSmi(smi.stdout);
26
+ if (gpus.length > 0)
27
+ return gpus;
28
+ }
29
+ }
30
+ catch {
31
+ // fall through to lspci fallback
32
+ }
33
+ try {
34
+ const lspci = spawnSync("lspci", { encoding: "utf8" });
35
+ if (lspci.status === 0 && lspci.stdout) {
36
+ return lspci.stdout
37
+ .split(/\r?\n/)
38
+ .filter((line) => /VGA compatible controller|3D controller/i.test(line))
39
+ .map((line) => ({ name: line.replace(/^\S+\s+/, "").trim() }))
40
+ .filter((g) => g.name);
41
+ }
42
+ }
43
+ catch {
44
+ // fall through
45
+ }
46
+ return [];
47
+ }
48
+ //# sourceMappingURL=linux.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"linux.js","sourceRoot":"","sources":["../../src/hardware/linux.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,SAAS,EAAE,MAAM,oBAAoB,CAAC;AAG/C,MAAM,EAAE,GAAG,IAAI,GAAG,IAAI,CAAC;AAEvB,SAAS,cAAc,CAAC,MAAc;IACpC,MAAM,IAAI,GAAc,EAAE,CAAC;IAC3B,KAAK,MAAM,IAAI,IAAI,MAAM,CAAC,KAAK,CAAC,OAAO,CAAC,EAAE,CAAC;QACzC,MAAM,OAAO,GAAG,IAAI,CAAC,IAAI,EAAE,CAAC;QAC5B,IAAI,CAAC,OAAO;YAAE,SAAS;QACvB,MAAM,KAAK,GAAG,OAAO,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC,CAAC;QACtD,IAAI,KAAK,CAAC,MAAM,GAAG,CAAC;YAAE,SAAS;QAC/B,MAAM,CAAC,IAAI,EAAE,OAAO,EAAE,MAAM,CAAC,GAAG,KAAK,CAAC;QACtC,IAAI,CAAC,IAAI,CAAC;YACR,IAAI;YACJ,cAAc,EAAE,MAAM,CAAC,QAAQ,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,OAAO,CAAC,GAAG,EAAE,CAAC,CAAC,CAAC,SAAS;YACnF,aAAa,EAAE,MAAM,CAAC,QAAQ,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,MAAM,CAAC,GAAG,EAAE,CAAC,CAAC,CAAC,SAAS;SACjF,CAAC,CAAC;IACL,CAAC;IACD,OAAO,IAAI,CAAC;AACd,CAAC;AAED,MAAM,UAAU,SAAS;IACvB,IAAI,CAAC;QACH,MAAM,GAAG,GAAG,SAAS,CACnB,YAAY,EACZ,CAAC,2CAA2C,EAAE,+BAA+B,CAAC,EAC9E,EAAE,QAAQ,EAAE,MAAM,EAAE,CACrB,CAAC;QACF,IAAI,GAAG,CAAC,MAAM,KAAK,CAAC,IAAI,GAAG,CAAC,MAAM,IAAI,GAAG,CAAC,MAAM,CAAC,IAAI,EAAE,EAAE,CAAC;YACxD,MAAM,IAAI,GAAG,cAAc,CAAC,GAAG,CAAC,MAAM,CAAC,CAAC;YACxC,IAAI,IAAI,CAAC,MAAM,GAAG,CAAC;gBAAE,OAAO,IAAI,CAAC;QACnC,CAAC;IACH,CAAC;IAAC,MAAM,CAAC;QACP,iCAAiC;IACnC,CAAC;IAED,IAAI,CAAC;QACH,MAAM,KAAK,GAAG,SAAS,CAAC,OAAO,EAAE,EAAE,QAAQ,EAAE,MAAM,EAAE,CAAC,CAAC;QACvD,IAAI,KAAK,CAAC,MAAM,KAAK,CAAC,IAAI,KAAK,CAAC,MAAM,EAAE,CAAC;YACvC,OAAO,KAAK,CAAC,MAAM;iBAChB,KAAK,CAAC,OAAO,CAAC;iBACd,MAAM,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,0CAA0C,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;iBACvE,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,CAAC,EAAE,IAAI,EAAE,IAAI,CAAC,OAAO,CAAC,SAAS,EAAE,EAAE,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,CAAC;iBAC7D,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC;QAC3B,CAAC;IACH,CAAC;IAAC,MAAM,CAAC;QACP,eAAe;IACjB,CAAC;IAED,OAAO,EAAE,CAAC;AACZ,CAAC"}
@@ -0,0 +1,2 @@
1
+ import type { GpuInfo } from "./index.js";
2
+ export declare function probeGpus(): GpuInfo[];
@@ -0,0 +1,60 @@
1
+ import { spawnSync } from "node:child_process";
2
+ const MB = 1024 * 1024;
3
+ function parseNvidiaSmi(stdout) {
4
+ const gpus = [];
5
+ for (const line of stdout.split(/\r?\n/)) {
6
+ const trimmed = line.trim();
7
+ if (!trimmed)
8
+ continue;
9
+ const parts = trimmed.split(",").map((p) => p.trim());
10
+ if (parts.length < 3)
11
+ continue;
12
+ const [name, totalMb, freeMb] = parts;
13
+ gpus.push({
14
+ name,
15
+ vramTotalBytes: Number.isFinite(Number(totalMb)) ? Number(totalMb) * MB : undefined,
16
+ vramFreeBytes: Number.isFinite(Number(freeMb)) ? Number(freeMb) * MB : undefined,
17
+ });
18
+ }
19
+ return gpus;
20
+ }
21
+ export function probeGpus() {
22
+ try {
23
+ const smi = spawnSync("nvidia-smi", ["--query-gpu=name,memory.total,memory.free", "--format=csv,noheader,nounits"], { encoding: "utf8" });
24
+ if (smi.status === 0 && smi.stdout && smi.stdout.trim()) {
25
+ const gpus = parseNvidiaSmi(smi.stdout);
26
+ if (gpus.length > 0)
27
+ return gpus;
28
+ }
29
+ }
30
+ catch {
31
+ // fall through to PowerShell fallback
32
+ }
33
+ try {
34
+ const ps = spawnSync("powershell", [
35
+ "-NoProfile",
36
+ "-Command",
37
+ "Get-CimInstance Win32_VideoController | Select-Object Name,AdapterRAM | ConvertTo-Json -Compress",
38
+ ], { encoding: "utf8" });
39
+ if (ps.status === 0 && ps.stdout && ps.stdout.trim()) {
40
+ const parsed = JSON.parse(ps.stdout);
41
+ const list = Array.isArray(parsed) ? parsed : [parsed];
42
+ return list
43
+ .map((item) => {
44
+ const obj = item;
45
+ return {
46
+ name: obj.Name ?? "Unknown GPU",
47
+ vramTotalBytes: typeof obj.AdapterRAM === "number" && obj.AdapterRAM > 0
48
+ ? obj.AdapterRAM
49
+ : undefined,
50
+ };
51
+ })
52
+ .filter((g) => g.name);
53
+ }
54
+ }
55
+ catch {
56
+ // fall through
57
+ }
58
+ return [];
59
+ }
60
+ //# sourceMappingURL=windows.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"windows.js","sourceRoot":"","sources":["../../src/hardware/windows.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,SAAS,EAAE,MAAM,oBAAoB,CAAC;AAG/C,MAAM,EAAE,GAAG,IAAI,GAAG,IAAI,CAAC;AAEvB,SAAS,cAAc,CAAC,MAAc;IACpC,MAAM,IAAI,GAAc,EAAE,CAAC;IAC3B,KAAK,MAAM,IAAI,IAAI,MAAM,CAAC,KAAK,CAAC,OAAO,CAAC,EAAE,CAAC;QACzC,MAAM,OAAO,GAAG,IAAI,CAAC,IAAI,EAAE,CAAC;QAC5B,IAAI,CAAC,OAAO;YAAE,SAAS;QACvB,MAAM,KAAK,GAAG,OAAO,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC,CAAC;QACtD,IAAI,KAAK,CAAC,MAAM,GAAG,CAAC;YAAE,SAAS;QAC/B,MAAM,CAAC,IAAI,EAAE,OAAO,EAAE,MAAM,CAAC,GAAG,KAAK,CAAC;QACtC,IAAI,CAAC,IAAI,CAAC;YACR,IAAI;YACJ,cAAc,EAAE,MAAM,CAAC,QAAQ,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,OAAO,CAAC,GAAG,EAAE,CAAC,CAAC,CAAC,SAAS;YACnF,aAAa,EAAE,MAAM,CAAC,QAAQ,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,MAAM,CAAC,GAAG,EAAE,CAAC,CAAC,CAAC,SAAS;SACjF,CAAC,CAAC;IACL,CAAC;IACD,OAAO,IAAI,CAAC;AACd,CAAC;AAED,MAAM,UAAU,SAAS;IACvB,IAAI,CAAC;QACH,MAAM,GAAG,GAAG,SAAS,CACnB,YAAY,EACZ,CAAC,2CAA2C,EAAE,+BAA+B,CAAC,EAC9E,EAAE,QAAQ,EAAE,MAAM,EAAE,CACrB,CAAC;QACF,IAAI,GAAG,CAAC,MAAM,KAAK,CAAC,IAAI,GAAG,CAAC,MAAM,IAAI,GAAG,CAAC,MAAM,CAAC,IAAI,EAAE,EAAE,CAAC;YACxD,MAAM,IAAI,GAAG,cAAc,CAAC,GAAG,CAAC,MAAM,CAAC,CAAC;YACxC,IAAI,IAAI,CAAC,MAAM,GAAG,CAAC;gBAAE,OAAO,IAAI,CAAC;QACnC,CAAC;IACH,CAAC;IAAC,MAAM,CAAC;QACP,sCAAsC;IACxC,CAAC;IAED,IAAI,CAAC;QACH,MAAM,EAAE,GAAG,SAAS,CAClB,YAAY,EACZ;YACE,YAAY;YACZ,UAAU;YACV,kGAAkG;SACnG,EACD,EAAE,QAAQ,EAAE,MAAM,EAAE,CACrB,CAAC;QACF,IAAI,EAAE,CAAC,MAAM,KAAK,CAAC,IAAI,EAAE,CAAC,MAAM,IAAI,EAAE,CAAC,MAAM,CAAC,IAAI,EAAE,EAAE,CAAC;YACrD,MAAM,MAAM,GAAY,IAAI,CAAC,KAAK,CAAC,EAAE,CAAC,MAAM,CAAC,CAAC;YAC9C,MAAM,IAAI,GAAG,KAAK,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC;YACvD,OAAO,IAAI;iBACR,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE;gBACZ,MAAM,GAAG,GAAG,IAA8C,CAAC;gBAC3D,OAAO;oBACL,IAAI,EAAE,GAAG,CAAC,IAAI,IAAI,aAAa;oBAC/B,cAAc,EACZ,OAAO,GAAG,CAAC,UAAU,KAAK,QAAQ,IAAI,GAAG,CAAC,UAAU,GAAG,CAAC;wBACtD,CAAC,CAAC,GAAG,CAAC,UAAU;wBAChB,CAAC,CAAC,SAAS;iBAChB,CAAC;YACJ,CAAC,CAAC;iBACD,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC;QAC3B,CAAC;IACH,CAAC;IAAC,MAAM,CAAC;QACP,eAAe;IACjB,CAAC;IAED,OAAO,EAAE,CAAC;AACZ,CAAC"}
package/dist/http.d.ts ADDED
@@ -0,0 +1,14 @@
1
+ export declare class HttpError extends Error {
2
+ status: number;
3
+ body: string;
4
+ constructor(status: number, body: string, message?: string);
5
+ }
6
+ export interface HttpOptions {
7
+ method?: string;
8
+ headers?: Record<string, string>;
9
+ body?: string;
10
+ timeoutMs?: number;
11
+ }
12
+ export declare function httpText(url: string, opts?: HttpOptions): Promise<string>;
13
+ export declare function httpJson<T>(url: string, opts?: HttpOptions): Promise<T>;
14
+ export declare function probe(url: string, timeoutMs: number): Promise<boolean>;
package/dist/http.js ADDED
@@ -0,0 +1,61 @@
1
+ export class HttpError extends Error {
2
+ status;
3
+ body;
4
+ constructor(status, body, message) {
5
+ super(message ?? `HTTP ${status}`);
6
+ this.name = "HttpError";
7
+ this.status = status;
8
+ this.body = body;
9
+ }
10
+ }
11
+ const DEFAULT_TIMEOUT_MS = 120000;
12
+ export async function httpText(url, opts = {}) {
13
+ const { method = "GET", headers = {}, body, timeoutMs = DEFAULT_TIMEOUT_MS } = opts;
14
+ const controller = new AbortController();
15
+ const timer = setTimeout(() => controller.abort(), timeoutMs);
16
+ try {
17
+ const res = await fetch(url, {
18
+ method,
19
+ headers,
20
+ body,
21
+ signal: controller.signal,
22
+ });
23
+ const text = await res.text();
24
+ if (!res.ok) {
25
+ throw new HttpError(res.status, text, `HTTP ${res.status} for ${method} ${url}`);
26
+ }
27
+ return text;
28
+ }
29
+ finally {
30
+ clearTimeout(timer);
31
+ }
32
+ }
33
+ export async function httpJson(url, opts = {}) {
34
+ const headers = {
35
+ Accept: "application/json",
36
+ ...(opts.headers ?? {}),
37
+ };
38
+ if (opts.body !== undefined && headers["Content-Type"] === undefined) {
39
+ headers["Content-Type"] = "application/json";
40
+ }
41
+ const text = await httpText(url, { ...opts, headers });
42
+ if (text.trim() === "") {
43
+ return {};
44
+ }
45
+ return JSON.parse(text);
46
+ }
47
+ export async function probe(url, timeoutMs) {
48
+ const controller = new AbortController();
49
+ const timer = setTimeout(() => controller.abort(), timeoutMs);
50
+ try {
51
+ const res = await fetch(url, { method: "GET", signal: controller.signal });
52
+ return res.ok;
53
+ }
54
+ catch {
55
+ return false;
56
+ }
57
+ finally {
58
+ clearTimeout(timer);
59
+ }
60
+ }
61
+ //# sourceMappingURL=http.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"http.js","sourceRoot":"","sources":["../src/http.ts"],"names":[],"mappings":"AAAA,MAAM,OAAO,SAAU,SAAQ,KAAK;IAClC,MAAM,CAAS;IACf,IAAI,CAAS;IACb,YAAY,MAAc,EAAE,IAAY,EAAE,OAAgB;QACxD,KAAK,CAAC,OAAO,IAAI,QAAQ,MAAM,EAAE,CAAC,CAAC;QACnC,IAAI,CAAC,IAAI,GAAG,WAAW,CAAC;QACxB,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC;QACrB,IAAI,CAAC,IAAI,GAAG,IAAI,CAAC;IACnB,CAAC;CACF;AASD,MAAM,kBAAkB,GAAG,MAAM,CAAC;AAElC,MAAM,CAAC,KAAK,UAAU,QAAQ,CAAC,GAAW,EAAE,OAAoB,EAAE;IAChE,MAAM,EAAE,MAAM,GAAG,KAAK,EAAE,OAAO,GAAG,EAAE,EAAE,IAAI,EAAE,SAAS,GAAG,kBAAkB,EAAE,GAAG,IAAI,CAAC;IACpF,MAAM,UAAU,GAAG,IAAI,eAAe,EAAE,CAAC;IACzC,MAAM,KAAK,GAAG,UAAU,CAAC,GAAG,EAAE,CAAC,UAAU,CAAC,KAAK,EAAE,EAAE,SAAS,CAAC,CAAC;IAC9D,IAAI,CAAC;QACH,MAAM,GAAG,GAAG,MAAM,KAAK,CAAC,GAAG,EAAE;YAC3B,MAAM;YACN,OAAO;YACP,IAAI;YACJ,MAAM,EAAE,UAAU,CAAC,MAAM;SAC1B,CAAC,CAAC;QACH,MAAM,IAAI,GAAG,MAAM,GAAG,CAAC,IAAI,EAAE,CAAC;QAC9B,IAAI,CAAC,GAAG,CAAC,EAAE,EAAE,CAAC;YACZ,MAAM,IAAI,SAAS,CAAC,GAAG,CAAC,MAAM,EAAE,IAAI,EAAE,QAAQ,GAAG,CAAC,MAAM,QAAQ,MAAM,IAAI,GAAG,EAAE,CAAC,CAAC;QACnF,CAAC;QACD,OAAO,IAAI,CAAC;IACd,CAAC;YAAS,CAAC;QACT,YAAY,CAAC,KAAK,CAAC,CAAC;IACtB,CAAC;AACH,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,QAAQ,CAAI,GAAW,EAAE,OAAoB,EAAE;IACnE,MAAM,OAAO,GAA2B;QACtC,MAAM,EAAE,kBAAkB;QAC1B,GAAG,CAAC,IAAI,CAAC,OAAO,IAAI,EAAE,CAAC;KACxB,CAAC;IACF,IAAI,IAAI,CAAC,IAAI,KAAK,SAAS,IAAI,OAAO,CAAC,cAAc,CAAC,KAAK,SAAS,EAAE,CAAC;QACrE,OAAO,CAAC,cAAc,CAAC,GAAG,kBAAkB,CAAC;IAC/C,CAAC;IACD,MAAM,IAAI,GAAG,MAAM,QAAQ,CAAC,GAAG,EAAE,EAAE,GAAG,IAAI,EAAE,OAAO,EAAE,CAAC,CAAC;IACvD,IAAI,IAAI,CAAC,IAAI,EAAE,KAAK,EAAE,EAAE,CAAC;QACvB,OAAO,EAAO,CAAC;IACjB,CAAC;IACD,OAAO,IAAI,CAAC,KAAK,CAAC,IAAI,CAAM,CAAC;AAC/B,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,KAAK,CAAC,GAAW,EAAE,SAAiB;IACxD,MAAM,UAAU,GAAG,IAAI,eAAe,EAAE,CAAC;IACzC,MAAM,KAAK,GAAG,UAAU,CAAC,GAAG,EAAE,CAAC,UAAU,CAAC,KAAK,EAAE,EAAE,SAAS,CAAC,CAAC;IAC9D,IAAI,CAAC;QACH,MAAM,GAAG,GAAG,MAAM,KAAK,CAAC,GAAG,EAAE,EAAE,MAAM,EAAE,KAAK,EAAE,MAAM,EAAE,UAAU,CAAC,MAAM,EAAE,CAAC,CAAC;QAC3E,OAAO,GAAG,CAAC,EAAE,CAAC;IAChB,CAAC;IAAC,MAAM,CAAC;QACP,OAAO,KAAK,CAAC;IACf,CAAC;YAAS,CAAC;QACT,YAAY,CAAC,KAAK,CAAC,CAAC;IACtB,CAAC;AACH,CAAC"}
@@ -0,0 +1,2 @@
1
+ #!/usr/bin/env node
2
+ export {};
package/dist/index.js ADDED
@@ -0,0 +1,24 @@
1
+ #!/usr/bin/env node
2
+ import { McpServer } from "@modelcontextprotocol/sdk/server/mcp.js";
3
+ import { StdioServerTransport } from "@modelcontextprotocol/sdk/server/stdio.js";
4
+ import { loadConfig } from "./config.js";
5
+ import { createHardwareProbe } from "./hardware/index.js";
6
+ import { ProviderManager } from "./providers/manager.js";
7
+ import { registerAll } from "./tools/index.js";
8
+ async function main() {
9
+ const config = loadConfig(process.env);
10
+ const manager = new ProviderManager(config);
11
+ const hardware = createHardwareProbe();
12
+ const ctx = { manager, hardware, config };
13
+ const server = new McpServer({ name: "local-ai-mcp", version: "0.1.0" });
14
+ registerAll(server, ctx);
15
+ const transport = new StdioServerTransport();
16
+ await server.connect(transport);
17
+ // stdout is the MCP channel; all logs must go to stderr only.
18
+ process.stderr.write(`local-ai-mcp ready (ollama=${config.ollamaHost}, lmstudio=${config.lmstudioHost})\n`);
19
+ }
20
+ main().catch((err) => {
21
+ process.stderr.write(`local-ai-mcp fatal: ${err instanceof Error ? err.stack : String(err)}\n`);
22
+ process.exit(1);
23
+ });
24
+ //# sourceMappingURL=index.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"index.js","sourceRoot":"","sources":["../src/index.ts"],"names":[],"mappings":";AACA,OAAO,EAAE,SAAS,EAAE,MAAM,yCAAyC,CAAC;AACpE,OAAO,EAAE,oBAAoB,EAAE,MAAM,2CAA2C,CAAC;AACjF,OAAO,EAAE,UAAU,EAAE,MAAM,aAAa,CAAC;AACzC,OAAO,EAAE,mBAAmB,EAAE,MAAM,qBAAqB,CAAC;AAC1D,OAAO,EAAE,eAAe,EAAE,MAAM,wBAAwB,CAAC;AAEzD,OAAO,EAAE,WAAW,EAAE,MAAM,kBAAkB,CAAC;AAE/C,KAAK,UAAU,IAAI;IACjB,MAAM,MAAM,GAAG,UAAU,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC;IACvC,MAAM,OAAO,GAAG,IAAI,eAAe,CAAC,MAAM,CAAC,CAAC;IAC5C,MAAM,QAAQ,GAAG,mBAAmB,EAAE,CAAC;IACvC,MAAM,GAAG,GAAgB,EAAE,OAAO,EAAE,QAAQ,EAAE,MAAM,EAAE,CAAC;IAEvD,MAAM,MAAM,GAAG,IAAI,SAAS,CAAC,EAAE,IAAI,EAAE,cAAc,EAAE,OAAO,EAAE,OAAO,EAAE,CAAC,CAAC;IACzE,WAAW,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;IAEzB,MAAM,SAAS,GAAG,IAAI,oBAAoB,EAAE,CAAC;IAC7C,MAAM,MAAM,CAAC,OAAO,CAAC,SAAS,CAAC,CAAC;IAEhC,8DAA8D;IAC9D,OAAO,CAAC,MAAM,CAAC,KAAK,CAClB,8BAA8B,MAAM,CAAC,UAAU,cAAc,MAAM,CAAC,YAAY,KAAK,CACtF,CAAC;AACJ,CAAC;AAED,IAAI,EAAE,CAAC,KAAK,CAAC,CAAC,GAAG,EAAE,EAAE;IACnB,OAAO,CAAC,MAAM,CAAC,KAAK,CAAC,uBAAuB,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,KAAK,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC;IAChG,OAAO,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC;AAClB,CAAC,CAAC,CAAC"}