npm - llm-checker - Versions diffs - 3.5.0 → 3.5.2 - Mend

llm-checker 3.5.0 → 3.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15) hide show

package/README.md +35 -43
package/bin/enhanced_cli.js +426 -0
package/bin/mcp-server.mjs +60 -0
package/package.json +6 -2
package/src/commands/roadmap-tools.js +368 -0
package/src/data/CLAUDE.md +17 -0
package/src/hardware/CLAUDE.md +18 -0
package/src/hardware/backends/CLAUDE.md +17 -0
package/src/hardware/backends/cpu-detector.js +66 -6
package/src/hardware/unified-detector.js +173 -1
package/src/models/CLAUDE.md +23 -0
package/src/ollama/CLAUDE.md +30 -0
package/src/ollama/client.js +81 -0
package/src/plugins/CLAUDE.md +17 -0
package/src/utils/CLAUDE.md +17 -0

package/src/hardware/unified-detector.js CHANGED Viewed

@@ -9,6 +9,7 @@ const CUDADetector = require('./backends/cuda-detector');
 const ROCmDetector = require('./backends/rocm-detector');
 const IntelDetector = require('./backends/intel-detector');
 const CPUDetector = require('./backends/cpu-detector');
+const si = require('systeminformation');
 class UnifiedDetector {
     constructor() {
@@ -37,6 +38,7 @@ class UnifiedDetector {
             backends: {},
             primary: null,
             cpu: null,
+            systemGpu: null,
             summary: {
                 bestBackend: 'cpu',
                 totalVRAM: 0,
@@ -122,6 +124,30 @@ class UnifiedDetector {
             }
         }
+        // Fallback GPU inventory via systeminformation (Windows/Linux) when no
+        // accelerator backend is currently available (CUDA/ROCm/Metal/Intel).
+        const hasAcceleratedBackend = Boolean(
+            result.backends.cuda?.available ||
+            result.backends.rocm?.available ||
+            result.backends.metal?.available ||
+            result.backends.intel?.available
+        );
+        if (!hasAcceleratedBackend && (process.platform === 'win32' || process.platform === 'linux')) {
+            try {
+                const genericGpuInfo = await this.detectSystemGpuFallback();
+                if (genericGpuInfo?.available) {
+                    result.systemGpu = genericGpuInfo;
+                    result.backends.generic = {
+                        available: true,
+                        info: genericGpuInfo
+                    };
+                }
+            } catch (e) {
+                result.backends.generic = { available: false, error: e.message };
+            }
+        }
         // Select the best available backend
         result.primary = this.selectPrimaryBackend(result.backends);
@@ -251,11 +277,22 @@ class UnifiedDetector {
         }
         else if (result.cpu) {
             summary.speedCoefficient = result.cpu.speedCoefficient;
+            if (result.systemGpu?.available && Array.isArray(result.systemGpu.gpus) && result.systemGpu.gpus.length > 0) {
+                const inventory = this.summarizeGPUInventory(result.systemGpu.gpus);
+                summary.totalVRAM = result.systemGpu.totalVRAM || 0;
+                summary.gpuCount = result.systemGpu.gpus.length;
+                summary.isMultiGPU = Boolean(result.systemGpu.isMultiGPU);
+                summary.gpuModel = inventory.primaryModel || null;
+                summary.gpuInventory = inventory.displayName || summary.gpuModel;
+                summary.gpuModels = inventory.models;
+                summary.hasHeterogeneousGPU = inventory.isHeterogeneous;
+            }
         }
         // Effective memory for LLM loading
         // For GPU: use VRAM; for CPU/Metal: use system RAM
-        if (summary.totalVRAM > 0 && primary?.type !== 'metal') {
+        if (summary.totalVRAM > 0 && ['cuda', 'rocm', 'intel'].includes(primary?.type)) {
             summary.effectiveMemory = summary.totalVRAM;
         } else {
             // Use 70% of system RAM for models (leave room for OS)
@@ -286,6 +323,137 @@ class UnifiedDetector {
         };
     }
+    /**
+     * Build a generic GPU inventory from `systeminformation`'s graphics data.
+     *
+     * Controllers without a usable name, and generic display adapters
+     * ("microsoft basic", "standard vga"), are dropped. Each remaining
+     * controller is classified as integrated or dedicated by its name; a
+     * dedicated card whose reported memory normalizes to 0 gets a model-based
+     * estimate instead.
+     *
+     * @returns {Promise<{available: boolean, source: string, gpus: Array,
+     *   totalVRAM: number, isMultiGPU: boolean, hasDedicated: boolean}>}
+     *   `totalVRAM` sums dedicated GPUs only; `isMultiGPU` is true when more
+     *   than one dedicated GPU was found.
+     */
+    async detectSystemGpuFallback() {
+        // Shape returned whenever nothing usable is found.
+        const nothingFound = () => ({
+            available: false,
+            source: 'systeminformation',
+            gpus: [],
+            totalVRAM: 0,
+            isMultiGPU: false,
+            hasDedicated: false
+        });
+        const graphics = await si.graphics();
+        const rawControllers = graphics?.controllers;
+        if (!Array.isArray(rawControllers) || rawControllers.length === 0) {
+            return nothingFound();
+        }
+        const gpus = [];
+        for (const entry of rawControllers) {
+            // Collapse runs of whitespace so name matching is stable.
+            const name = String(entry?.model || entry?.name || '').replace(/\s+/g, ' ').trim();
+            const lowered = name.toLowerCase();
+            if (!name || lowered === 'unknown') continue;
+            if (lowered.includes('microsoft basic') || lowered.includes('standard vga')) continue;
+            const integrated = this.isIntegratedGPUModel(name);
+            const reported = this.normalizeFallbackVRAM(entry?.vram || entry?.memoryTotal || entry?.memory || 0);
+            // Only dedicated cards fall back to a model-based estimate.
+            const total = (!integrated && reported === 0)
+                ? this.estimateFallbackVRAM(name)
+                : reported;
+            gpus.push({
+                name,
+                vendor: entry?.vendor || '',
+                type: integrated ? 'integrated' : 'dedicated',
+                memory: { total }
+            });
+        }
+        if (gpus.length === 0) {
+            return nothingFound();
+        }
+        let dedicatedCount = 0;
+        let totalVRAM = 0;
+        for (const gpu of gpus) {
+            if (gpu.type !== 'dedicated') continue;
+            dedicatedCount += 1;
+            totalVRAM += gpu.memory?.total || 0;
+        }
+        return {
+            available: true,
+            source: 'systeminformation',
+            gpus,
+            totalVRAM,
+            isMultiGPU: dedicatedCount > 1,
+            hasDedicated: dedicatedCount > 0
+        };
+    }
+    /**
+     * Convert a raw VRAM reading of unknown unit into whole gigabytes.
+     *
+     * The unit is guessed from the magnitude: values above 1024 * 1024 are
+     * treated as bytes, values from 1024 up to that as megabytes, and values
+     * in [1, 80] as gigabytes. Everything else (non-numeric, non-positive,
+     * or between 80 and 1024) yields 0.
+     *
+     * @param {*} value - Raw reading; coerced with `Number()`.
+     * @returns {number} Rounded size in GB, or 0 when it cannot be interpreted.
+     */
+    normalizeFallbackVRAM(value) {
+        const raw = Number(value);
+        const isUsable = Number.isFinite(raw) && raw > 0;
+        if (!isUsable) {
+            return 0;
+        }
+        const MEBI = 1024 * 1024;
+        if (raw > MEBI) {
+            // Magnitude suggests bytes.
+            return Math.round(raw / (MEBI * 1024));
+        }
+        if (raw >= 1024) {
+            // Magnitude suggests megabytes.
+            return Math.round(raw / 1024);
+        }
+        // Small values are taken as already being gigabytes.
+        const looksLikeGigabytes = raw >= 1 && raw <= 80;
+        return looksLikeGigabytes ? Math.round(raw) : 0;
+    }
+    /**
+     * Guess from its name whether a GPU is an integrated one.
+     *
+     * Dedicated-card markers are checked first and win over integrated
+     * markers, so e.g. a name containing both "intel" and "arc a" is reported
+     * as dedicated.
+     *
+     * @param {string} model - GPU model/name string (case-insensitive).
+     * @returns {boolean} True when the name matches an integrated-GPU marker
+     *   and no dedicated-GPU marker; false otherwise, including for empty input.
+     */
+    isIntegratedGPUModel(model) {
+        const lower = String(model || '').toLowerCase();
+        if (!lower) return false;
+        const dedicatedMarkers = [
+            'radeon rx', 'rtx', 'gtx', 'geforce', 'tesla', 'quadro',
+            'instinct', 'arc a', 'radeon pro'
+        ];
+        if (dedicatedMarkers.some((marker) => lower.includes(marker))) {
+            return false;
+        }
+        // Names may carry trademark markers (e.g. "Intel(R) Arc(TM) A770
+        // Graphics"), which the plain 'arc a' substring misses; without this
+        // check such cards would match 'intel' below. Also covers the
+        // B-series discrete cards (e.g. "Arc B580").
+        if (/\barc(?:\(tm\))?\s+[ab]\d{3}/.test(lower)) {
+            return false;
+        }
+        const integratedMarkers = [
+            'intel',
+            'iris',
+            'uhd',
+            'hd graphics',
+            'radeon graphics',
+            'radeon(tm) graphics',
+            'vega',
+            'apple'
+        ];
+        return integratedMarkers.some((marker) => lower.includes(marker));
+    }
+    /**
+     * Estimate VRAM (in GB) for a dedicated GPU from its model name.
+     *
+     * Entries are matched in order by substring, so more specific variants
+     * (e.g. "rtx 3060 ti") must appear before the generic family entry
+     * (e.g. "rtx 3060") they would otherwise be swallowed by.
+     *
+     * @param {string} model - GPU model/name string (case-insensitive).
+     * @returns {number} Estimated VRAM in GB, or 0 for unknown or empty models.
+     */
+    estimateFallbackVRAM(model) {
+        const lower = String(model || '').toLowerCase();
+        if (!lower) return 0;
+        // Ordered [substrings, GB] table; first match wins.
+        const estimates = [
+            [['rx 7900 xtx'], 24],
+            [['rx 7900 xt'], 20],
+            [['rx 7900 gre'], 16],
+            [['rx 7900'], 24],
+            [['rx 7800'], 16],
+            [['rx 7700'], 12],
+            [['rx 7600 xt'], 16],
+            [['rx 7600'], 8],
+            [['rx 6900', 'rx 6800'], 16],
+            [['rx 6700'], 12],
+            [['rtx 5090'], 32],
+            [['rtx 4090', 'rtx 3090'], 24],
+            [['rtx 5080', 'rtx 4080'], 16],
+            // Ti / Ti SUPER variants differ from their base models.
+            [['rtx 5070 ti', 'rtx 4070 ti super'], 16],
+            [['rtx 3060 ti'], 8],
+            [['rtx 5070', 'rtx 4070', 'rtx 3060'], 12],
+            [['rtx 4060', 'rtx 3070'], 8]
+        ];
+        for (const [needles, gigabytes] of estimates) {
+            if (needles.some((needle) => lower.includes(needle))) {
+                return gigabytes;
+            }
+        }
+        return 0;
+    }
     /**
      * Generate hardware fingerprint for benchmarks
      */
@@ -448,6 +616,10 @@ class UnifiedDetector {
             return `${gpuDesc} (${summary.totalVRAM}GB) + ${summary.cpuModel}`;
         }
         else {
+            if (summary.gpuModel && summary.gpuCount > 0) {
+                const gpuDesc = summary.gpuInventory || summary.gpuModel;
+                return `${gpuDesc} (${summary.totalVRAM}GB VRAM detected, CPU backend) + ${summary.cpuModel}`;
+            }
             return `${summary.cpuModel} (${Math.round(summary.systemRAM)}GB RAM, CPU-only)`;
         }
     }

package/src/models/CLAUDE.md ADDED Viewed

@@ -0,0 +1,23 @@
+<claude-mem-context>
+# Recent Activity
+<!-- This section is auto-generated by claude-mem. Edit content outside the tags. -->
+### Feb 12, 2026
+| ID | Time | T | Title | Read |
+|----|------|---|-------|------|
+| #3442 | 9:59 PM | 🔵 | Static Model Database Structure - Hardcoded LLM Specifications | ~572 |
+### Feb 13, 2026
+| ID | Time | T | Title | Read |
+|----|------|---|-------|------|
+| #3699 | 12:05 AM | ✅ | Git Push Consolidated Architecture Changes to GitHub | ~367 |
+### Feb 14, 2026
+| ID | Time | T | Title | Read |
+|----|------|---|-------|------|
+| #4339 | 6:49 PM | 🟣 | MCP server implementation and documentation added to llm-checker repository | ~457 |
+</claude-mem-context>

package/src/ollama/CLAUDE.md ADDED Viewed

@@ -0,0 +1,30 @@
+<claude-mem-context>
+# Recent Activity
+<!-- This section is auto-generated by claude-mem. Edit content outside the tags. -->
+### Feb 12, 2026
+| ID | Time | T | Title | Read |
+|----|------|---|-------|------|
+| #3500 | 10:26 PM | 🔴 | pullModel() Stream Handling Improved - Success Validation Added | ~458 |
+| #3499 | " | 🔴 | Race Condition Fixed in Ollama Availability Cache | ~440 |
+| #3498 | 10:25 PM | 🔵 | testModelPerformance() Timeout Already Fixed | ~418 |
+| #3497 | " | 🔴 | Timeout Fixed in deleteModel() Using AbortController | ~391 |
+| #3496 | " | 🔴 | Timeout Fixed in testConnection() Using AbortController | ~395 |
+| #3495 | " | 🔴 | Fixed unbounded memory growth in native scraper HTTP request handler | ~361 |
+| #3493 | " | 🔴 | Fixed race condition in checkOllamaAvailability() with promise deduplication | ~398 |
+| #3491 | 10:24 PM | 🔴 | Added missing clearTimeout() in testModelPerformance() | ~319 |
+| #3489 | " | 🔴 | Fixed node-fetch timeout handling in testModelPerformance() | ~332 |
+| #3488 | " | 🔴 | Fixed node-fetch timeout handling in testConnection() tags check | ~303 |
+| #3486 | " | 🔴 | Fixed node-fetch timeout handling in getRunningModels() | ~308 |
+| #3484 | 10:23 PM | 🔵 | Ollama Client Timeout Implementation - Mixed Patterns with AbortController | ~554 |
+| #3443 | 9:59 PM | 🔵 | Ollama Native Scraper - Web Scraping with Dual Cache Strategy | ~594 |
+| #3437 | 9:58 PM | 🔵 | Ollama Client Implementation - HTTP API Wrapper with Connection Management | ~605 |
+### Feb 14, 2026
+| ID | Time | T | Title | Read |
+|----|------|---|-------|------|
+| #4339 | 6:49 PM | 🟣 | MCP server implementation and documentation added to llm-checker repository | ~457 |
+</claude-mem-context>

package/src/ollama/client.js CHANGED Viewed

@@ -458,6 +458,87 @@ class OllamaClient {
             };
         }
     }
+    /**
+     * Fetch model details from the Ollama `/api/show` endpoint.
+     *
+     * @param {string} modelName - Name of the model to look up.
+     * @returns {Promise<Object>} Parsed JSON body of the response.
+     * @throws {Error} When Ollama is not available, or (wrapped as
+     *   "Failed to show model info: ...") when the request fails, is aborted
+     *   after 15 s, returns a non-OK status, or the body cannot be parsed.
+     */
+    async showModel(modelName) {
+        const availability = await this.checkOllamaAvailability();
+        if (!availability.available) {
+            throw new Error(`Ollama not available: ${availability.error}`);
+        }
+        const controller = new AbortController();
+        const timeoutId = setTimeout(() => controller.abort(), 15000);
+        try {
+            const response = await fetch(`${this.baseURL}/api/show`, {
+                method: 'POST',
+                signal: controller.signal,
+                headers: { 'Content-Type': 'application/json' },
+                body: JSON.stringify({ model: modelName })
+            });
+            if (!response.ok) {
+                const errorText = await response.text();
+                throw new Error(`HTTP ${response.status}: ${response.statusText} - ${errorText}`);
+            }
+            // Await here so body/JSON failures are wrapped by the catch below
+            // and the timeout keeps covering the body read.
+            return await response.json();
+        } catch (error) {
+            throw new Error(`Failed to show model info: ${error.message}`, { cause: error });
+        } finally {
+            // Always release the timer, including when fetch itself rejects.
+            clearTimeout(timeoutId);
+        }
+    }
+    /**
+     * Send a non-streaming chat request to the Ollama `/api/chat` endpoint.
+     *
+     * @param {string} modelName - Model to run the chat against.
+     * @param {Array<Object>} messages - Chat messages; a non-array is sent as `[]`.
+     * @param {Object} [options]
+     * @param {Array} [options.tools] - Tool definitions; sent only when non-empty.
+     * @param {*} [options.format] - Sent as `format` when truthy.
+     * @param {string|number} [options.keepAlive] - Sent as `keep_alive`;
+     *   `0` is forwarded, only null/undefined/'' are omitted.
+     * @param {number} [options.timeoutMs=45000] - Abort the request after this many ms.
+     * @param {Object} [options.generationOptions] - Sent as `options` when non-empty.
+     * @returns {Promise<Object>} Parsed JSON body of the response.
+     * @throws {Error} When Ollama is not available, or (wrapped as
+     *   "Failed to run chat request: ...") when the request fails, times out,
+     *   returns a non-OK status, or the body cannot be parsed.
+     */
+    async chat(modelName, messages, options = {}) {
+        const availability = await this.checkOllamaAvailability();
+        if (!availability.available) {
+            throw new Error(`Ollama not available: ${availability.error}`);
+        }
+        const {
+            tools,
+            format,
+            keepAlive,
+            timeoutMs = 45000,
+            generationOptions = {}
+        } = options;
+        const payload = {
+            model: modelName,
+            messages: Array.isArray(messages) ? messages : [],
+            stream: false
+        };
+        if (Array.isArray(tools) && tools.length > 0) payload.tools = tools;
+        if (format) payload.format = format;
+        // A plain truthiness check would drop keepAlive: 0, which is a
+        // meaningful value, so only skip missing/empty values.
+        if (keepAlive != null && keepAlive !== '') payload.keep_alive = keepAlive;
+        if (generationOptions && Object.keys(generationOptions).length > 0) {
+            payload.options = generationOptions;
+        }
+        const controller = new AbortController();
+        const timeoutId = setTimeout(() => controller.abort(), timeoutMs);
+        try {
+            const response = await fetch(`${this.baseURL}/api/chat`, {
+                method: 'POST',
+                signal: controller.signal,
+                headers: { 'Content-Type': 'application/json' },
+                body: JSON.stringify(payload)
+            });
+            if (!response.ok) {
+                const errorText = await response.text();
+                throw new Error(`HTTP ${response.status}: ${response.statusText} - ${errorText}`);
+            }
+            // Await here so body/JSON failures are wrapped by the catch below
+            // and the timeout keeps covering the body read.
+            return await response.json();
+        } catch (error) {
+            throw new Error(`Failed to run chat request: ${error.message}`, { cause: error });
+        } finally {
+            // Always release the timer, including when fetch itself rejects.
+            clearTimeout(timeoutId);
+        }
+    }
 }
 module.exports = OllamaClient;

package/src/plugins/CLAUDE.md ADDED Viewed

@@ -0,0 +1,17 @@
+<claude-mem-context>
+# Recent Activity
+<!-- This section is auto-generated by claude-mem. Edit content outside the tags. -->
+### Feb 12, 2026
+| ID | Time | T | Title | Read |
+|----|------|---|-------|------|
+| #3462 | 10:02 PM | 🔵 | Plugin System Architecture - Hook-Based Extensibility Framework | ~648 |
+### Feb 14, 2026
+| ID | Time | T | Title | Read |
+|----|------|---|-------|------|
+| #4339 | 6:49 PM | 🟣 | MCP server implementation and documentation added to llm-checker repository | ~457 |
+</claude-mem-context>

package/src/utils/CLAUDE.md ADDED Viewed

@@ -0,0 +1,17 @@
+<claude-mem-context>
+# Recent Activity
+<!-- This section is auto-generated by claude-mem. Edit content outside the tags. -->
+### Feb 12, 2026
+| ID | Time | T | Title | Read |
+|----|------|---|-------|------|
+| #3438 | 9:58 PM | 🔵 | Configuration Management System - Comprehensive Settings with Environment Overrides | ~580 |
+### Feb 14, 2026
+| ID | Time | T | Title | Read |
+|----|------|---|-------|------|
+| #4339 | 6:49 PM | 🟣 | MCP server implementation and documentation added to llm-checker repository | ~457 |
+</claude-mem-context>