npm - llm-checker - Versions diffs - 3.5.11 → 3.5.13 - Mend

llm-checker 3.5.11 → 3.5.13

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (20) hide show

package/README.md +83 -17
package/bin/cli.js +40 -0
package/bin/enhanced_cli.js +384 -35
package/package.json +2 -1
package/src/ai/model-selector.js +47 -16
package/src/ai/multi-objective-selector.js +55 -9
package/src/data/model-database.js +92 -1
package/src/data/seed/README.md +8 -0
package/src/data/seed/models.db +0 -0
package/src/hardware/backends/rocm-detector.js +469 -68
package/src/hardware/unified-detector.js +69 -18
package/src/index.js +59 -8
package/src/models/ai-check-selector.js +27 -2
package/src/models/deterministic-selector.js +84 -7
package/src/ollama/client.js +121 -0
package/src/ollama/enhanced-scraper.js +40 -26
package/src/ollama/native-scraper.js +52 -27
package/src/ui/cli-theme.js +139 -24
package/src/ui/interactive-panel.js +1 -18
package/src/utils/verbose-progress.js +144 -187

package/bin/enhanced_cli.js CHANGED Viewed

@@ -4,6 +4,7 @@ const chalk = require('chalk');
 const ora = require('ora');
 const { table } = require('table');
 const os = require('os');
+const readline = require('readline');
 const { spawn } = require('child_process');
 // LLMChecker is loaded lazily to avoid slow systeminformation init
 let _LLMChecker = null;
@@ -49,6 +50,7 @@ const {
     buildComplianceReport,
     serializeComplianceReport
 } = require('../src/policy/audit-reporter');
+const { estimateTokenSpeedFromHardware } = require('../src/utils/token-speed-estimator');
 const { renderCommandHeader, renderPersistentBanner } = require('../src/ui/cli-theme');
 const { launchInteractivePanel } = require('../src/ui/interactive-panel');
 const policyManager = new PolicyManager();
@@ -881,6 +883,11 @@ function formatGpuInventoryList(models = []) {
 // Helper function to get hardware tier for display
 function getHardwareTierForDisplay(hardware) {
+    const canonicalTier = hardware?.summary?.hardwareTier;
+    if (typeof canonicalTier === 'string' && canonicalTier.trim()) {
+        return canonicalTier.replace(/_/g, ' ').toUpperCase();
+    }
     const ram = hardware.memory.total;
     const cores = hardware.cpu.cores;
     const gpuModel = hardware.gpu?.model || '';
@@ -923,6 +930,21 @@ function getHardwareTierForDisplay(hardware) {
     return tier;
 }
/**
 * Build the backend label shown in hardware summaries.
 *
 * Resolution order: a non-blank `summary.bestBackendLabel`, then
 * `summary.backendName`, then the upper-cased `summary.bestBackend`
 * (falling back to "CPU"). When a runtime backend is set and differs from
 * the best backend, it is appended as an "assist".
 *
 * @param {object} [hardware] - Detection result; only `hardware.summary` is read.
 * @returns {string} Display label for the backend.
 */
function getBackendLabelForDisplay(hardware) {
    const {
        bestBackendLabel,
        backendName,
        bestBackend,
        runtimeBackend,
        runtimeBackendName
    } = hardware?.summary || {};

    const hasExplicitLabel = typeof bestBackendLabel === 'string' && bestBackendLabel.trim();
    if (hasExplicitLabel) {
        return bestBackendLabel;
    }

    const primary = backendName || String(bestBackend || 'cpu').toUpperCase();
    const hasDistinctRuntime = runtimeBackend && runtimeBackend !== bestBackend;
    if (!hasDistinctRuntime) {
        return primary;
    }

    const assist = runtimeBackendName || runtimeBackend;
    return `${primary} + ${assist} assist`;
}
 function formatSpeed(speed) {
     const speedMap = {
         'very_fast': 'very_fast',
@@ -963,18 +985,25 @@ function displaySystemInfo(hardware, analysis) {
     const gpuColor = hardware.gpu.dedicated ? chalk.green : chalk.hex('#FFA500');
     const integratedList = formatGpuInventoryList(hardware.gpu.integratedGpuModels || hardware.summary?.integratedGpuModels);
     const dedicatedList = formatGpuInventoryList(hardware.gpu.dedicatedGpuModels || hardware.summary?.dedicatedGpuModels);
+    const integratedSharedMemory = hardware.gpu.sharedMemory || hardware.summary?.integratedSharedMemory || 0;
+    const vramDisplay = !hardware.gpu.dedicated && integratedSharedMemory > 0
+        ? `${integratedSharedMemory}GB shared`
+        : (hardware.gpu.vram === 0 && hardware.gpu.model && hardware.gpu.model.toLowerCase().includes('apple')
+            ? 'Unified Memory'
+            : `${hardware.gpu.vram || 'N/A'}GB`);
     const lines = [
         `${chalk.cyan('CPU:')} ${cpuColor(hardware.cpu.brand)} ${chalk.gray(`(${hardware.cpu.cores} cores, ${hardware.cpu.speed}GHz)`)}`,
         `${chalk.cyan('Architecture:')} ${hardware.cpu.architecture}`,
         `${chalk.cyan('RAM:')} ${ramColor(hardware.memory.total + 'GB')}`,
         `${chalk.cyan('GPU:')} ${gpuColor(hardware.gpu.model || 'Not detected')}`,
-        `${chalk.cyan('VRAM:')} ${hardware.gpu.vram === 0 && hardware.gpu.model && hardware.gpu.model.toLowerCase().includes('apple') ? 'Unified Memory' : `${hardware.gpu.vram || 'N/A'}GB`}${hardware.gpu.dedicated ? chalk.green(' (Dedicated)') : chalk.hex('#FFA500')(' (Integrated)')}`,
+        `${chalk.cyan('Backend:')} ${chalk.white(getBackendLabelForDisplay(hardware))}`,
+        `${chalk.cyan('VRAM:')} ${vramDisplay}${hardware.gpu.dedicated ? chalk.green(' (Dedicated)') : chalk.hex('#FFA500')(' (Integrated)')}`,
         `${chalk.cyan('Dedicated GPUs:')} ${chalk.green(dedicatedList)}`,
         `${chalk.cyan('Integrated GPUs:')} ${chalk.hex('#FFA500')(integratedList)}`,
     ];
-    const tier = analysis.summary.hardwareTier?.replace('_', ' ').toUpperCase() || 'UNKNOWN';
+    const tier = analysis.summary.hardwareTier?.replace(/_/g, ' ').toUpperCase() || getHardwareTierForDisplay(hardware);
     const tierColor = tier.includes('HIGH') ? chalk.green : tier.includes('MEDIUM') ? chalk.yellow : chalk.red;
     lines.push(`${chalk.bold('Hardware Tier:')} ${tierColor.bold(tier)}`);
@@ -1405,6 +1434,266 @@ function displayCalibratedRoutingDecision(commandName, calibratedPolicy, routeDe
     console.log(chalk.blue('╰'));
 }
/**
 * Extract a parameter count, expressed in billions, from free-form text such
 * as a model tag ("llama3:8b") or a parameter-size label ("7.2B").
 *
 * The number must be followed by a k/m/b unit letter that is not the start of
 * a longer alphanumeric token. This keeps quantization suffixes ("4bit") and
 * file sizes ("512MB") from being misread as parameter counts.
 *
 * @param {*} value - Text to scan; coerced with String(). Falsy values yield null.
 * @returns {number|null} Size in billions of parameters, or null when no
 *   positive size is found.
 */
function parseAiRunModelSizeB(value) {
    // Divisors that convert each unit to billions of parameters.
    const divisorsToBillions = { b: 1, m: 1000, k: 1_000_000 };
    // (?![a-z0-9]) rejects "4bit", "512MB", "8bits" while still accepting
    // "7b", "7b+", "7b-instruct" and "7b_q4".
    const match = String(value || '').match(/(\d+(?:\.\d+)?)\s*([kmb])(?![a-z0-9])/i);
    if (!match) return null;

    const amount = Number(match[1]);
    if (!Number.isFinite(amount) || amount <= 0) return null;

    return amount / divisorsToBillions[match[2].toLowerCase()];
}
/**
 * Canonicalize a model name for comparison: trimmed, lower-cased, and with a
 * single trailing ":latest" tag removed.
 *
 * @param {*} value - Model name; falsy values become the empty string.
 * @returns {string} Normalized name.
 */
function normalizeAiRunModelName(value) {
    const defaultTag = ':latest';
    const lowered = String(value || '').trim().toLowerCase();
    if (!lowered.endsWith(defaultTag)) {
        return lowered;
    }
    return lowered.slice(0, lowered.length - defaultTag.length);
}
/**
 * Locate the locally installed model entry that corresponds to `modelName`.
 *
 * An exact match on the normalized name always wins. Only when no entry
 * matches exactly does the lookup fall back to the first entry whose name
 * contains, or is contained in, the requested name. Without that ordering a
 * request for "llama3" could resolve to "llama3.1:70b" just because it is
 * listed first.
 *
 * @param {Array<object>} [localModels=[]] - Entries with a `name` or `model` field.
 * @param {string} [modelName=''] - Requested model name.
 * @returns {object|null} The matching entry, or null when nothing matches.
 */
function findAiRunLocalModel(localModels = [], modelName = '') {
    const target = normalizeAiRunModelName(modelName);
    if (!target || !Array.isArray(localModels)) return null;

    let fuzzyMatch = null;
    for (const model of localModels) {
        // Optional chaining tolerates null/undefined entries in the list.
        const name = normalizeAiRunModelName(model?.name || model?.model);
        if (!name) continue;
        if (name === target) return model;
        if (!fuzzyMatch && (name.includes(target) || target.includes(name))) {
            fuzzyMatch = model;
        }
    }
    return fuzzyMatch;
}
/**
 * Determine a model's size in billions of parameters.
 *
 * Sources are tried in order and the first truthy result is used:
 *   1. the local entry's `details.parameter_size` (or `size`) text,
 *   2. the model name itself,
 *   3. `aiSelector.estimateModelSize(modelName)` when that method exists,
 *   4. a fixed default of 7.
 *
 * @param {string} modelName - Name of the selected model.
 * @param {object} [aiSelector] - Optional selector exposing `estimateModelSize`.
 * @param {object|null} [localModel=null] - Matching local model entry, if any.
 * @returns {number} Size in billions of parameters.
 */
function resolveAiRunModelSizeB(modelName, aiSelector, localModel = null) {
    const defaultSizeB = 7;
    const localHint = localModel?.details?.parameter_size || localModel?.size;

    for (const text of [localHint, modelName]) {
        const parsed = parseAiRunModelSizeB(text);
        if (parsed) {
            return parsed;
        }
    }

    if (typeof aiSelector?.estimateModelSize === 'function') {
        const estimated = Number(aiSelector.estimateModelSize(modelName));
        if (Number.isFinite(estimated) && estimated > 0) {
            return estimated;
        }
    }

    return defaultSizeB;
}
/**
 * Format a numeric value for display with a fixed number of decimals,
 * dropping the fractional part when it is entirely zeros ("8.0" -> "8",
 * "3.00" -> "3"). Partially-zero fractions such as "3.10" are kept.
 *
 * Missing values (null, undefined, empty string) and anything that does not
 * convert to a finite number yield "N/A". Number(null) and Number('') are 0,
 * so these are checked explicitly rather than printed as "0".
 *
 * @param {*} value - Value to format.
 * @param {number} [decimals=1] - Digits after the decimal point, passed to toFixed().
 * @returns {string} Formatted number, or "N/A".
 */
function formatAiRunNumber(value, decimals = 1) {
    if (value === null || value === undefined || value === '') return 'N/A';
    const number = Number(value);
    if (!Number.isFinite(number)) return 'N/A';
    // `0+` (not a single `0`) so the all-zero fraction is stripped for any `decimals`.
    return number.toFixed(decimals).replace(/\.0+$/, '');
}
/**
 * Estimate the memory working set, in GB, needed to run a model.
 *
 * The parameter-based estimate is `modelSizeB * 0.75 + 2`. When the local
 * entry reports a positive `fileSizeGB`, the result is the larger of
 * 1.15x the file size and 0.85x the parameter-based estimate.
 *
 * @param {number} modelSizeB - Model size in billions of parameters.
 * @param {object|null} [localModel=null] - Local model entry; only `fileSizeGB` is read.
 * @returns {number} Estimated working set in GB.
 */
function estimateAiRunWorkingSetGB(modelSizeB, localModel = null) {
    const fromParameters = (Number(modelSizeB) * 0.75) + 2;
    const onDiskGB = Number(localModel?.fileSizeGB) || 0;

    if (onDiskGB <= 0) {
        return fromParameters;
    }

    const fromFile = onDiskGB * 1.15;
    return Math.max(fromFile, fromParameters * 0.85);
}
/**
 * Produce a one-line "CPU, RAM, GPU" summary of the detected hardware.
 *
 * Each part falls back to a placeholder when its data is missing:
 * "CPU", "RAM unknown", and "GPU not detected".
 *
 * @param {object} [systemInfo={}] - Object with optional `cpu`, `memory`, `gpu` fields.
 * @returns {string} Comma-separated hardware summary.
 */
function formatAiRunHardwareSummary(systemInfo = {}) {
    const { cpu, memory, gpu } = systemInfo;

    const cpuName = cpu?.brand || cpu?.model || 'CPU';
    const cpuPart = cpu?.cores ? `${cpuName} (${cpu.cores} cores)` : cpuName;
    const memoryPart = memory?.total ? `${memory.total}GB RAM` : 'RAM unknown';
    const gpuPart = gpu?.model || 'GPU not detected';

    return [cpuPart, memoryPart, gpuPart].join(', ');
}
/**
 * Turn a selection-method identifier into a title-cased label:
 * runs of "_" / "-" become single spaces and the first character of every
 * word is upper-cased. Falsy input is shown as "Selector".
 *
 * @param {string} [method=''] - Method identifier, e.g. "ai_selector".
 * @returns {string} Human-readable label, e.g. "Ai Selector".
 */
function formatAiRunMethod(method = '') {
    const toUpper = (letter) => letter.toUpperCase();
    const identifier = String(method || 'selector');
    const spaced = identifier.replace(/[_-]+/g, ' ');
    return spaced.replace(/\b\w/g, toUpper);
}
/**
 * Prepare a selection rationale for single-line display.
 *
 * Whitespace runs are collapsed to one space and the ends are trimmed. Empty
 * text is replaced by a generic sentence; text longer than 120 characters is
 * cut to its first 117 characters followed by "...".
 *
 * @param {string} [reason=''] - Raw reasoning text.
 * @returns {string} Display-ready reason.
 */
function formatAiRunReason(reason = '') {
    const maxLength = 120;
    const collapsed = String(reason || '').replace(/\s+/g, ' ').trim();

    if (collapsed.length === 0) {
        return 'Selected from local model compatibility scoring.';
    }
    if (collapsed.length <= maxLength) {
        return collapsed;
    }
    return `${collapsed.slice(0, 117)}...`;
}
/**
 * Summarize a benchmark result as a short display string.
 *
 * - No benchmark object: returns null.
 * - Unsuccessful benchmark: "not available (<error>)".
 * - Successful benchmark: the positive metrics joined with ", ". That is the
 *   eval and end-to-end rates, or the generic `tokensPerSecond` when neither
 *   is positive, followed by the generated-token count when it is positive.
 *
 * All segments are collected in one list before joining, so a result that
 * carries only a token count renders as "12 tokens" rather than
 * ", 12 tokens". With no positive metric at all the result is the empty string.
 *
 * @param {object|null} [benchmark=null] - Benchmark result object.
 * @returns {string|null} Display text, or null when no benchmark was run.
 */
function formatAiRunMeasuredSpeed(benchmark = null) {
    if (!benchmark) return null;
    if (!benchmark.success) {
        return `not available (${benchmark.error || 'benchmark failed'})`;
    }

    const parts = [];
    if (Number(benchmark.evalTokensPerSecond) > 0) {
        parts.push(`${formatAiRunNumber(benchmark.evalTokensPerSecond)} eval t/s`);
    }
    if (Number(benchmark.endToEndTokensPerSecond) > 0) {
        parts.push(`${formatAiRunNumber(benchmark.endToEndTokensPerSecond)} end-to-end t/s`);
    }
    // The generic rate is used only when neither specific rate is available.
    if (parts.length === 0 && Number(benchmark.tokensPerSecond) > 0) {
        parts.push(`${formatAiRunNumber(benchmark.tokensPerSecond)} t/s`);
    }
    if (Number(benchmark.tokensGenerated) > 0) {
        parts.push(`${benchmark.tokensGenerated} tokens`);
    }

    return parts.join(', ');
}
/**
 * Print the "AI Run reference" summary for the selected model to the console.
 *
 * The summary lists the task, the chosen local model, the best database match
 * (when one is reported), the selection rationale and confidence, how many
 * models were evaluated, the hardware, an estimated and (optionally) measured
 * generation speed, a memory reference, and an install hint when the ideal
 * model is reported as not installed.
 *
 * @param {object} params
 * @param {object} params.result - Selector result (`bestModel`, `confidence`, `method`, ...).
 * @param {object} params.systemInfo - Hardware info passed to the speed estimator.
 * @param {string} [params.taskHint] - Task label; shown as "general" when falsy.
 * @param {Array} params.candidateModels - Candidate names; its length is the local-count fallback.
 * @param {Array<object>} params.localModels - Local model entries.
 * @param {object} [params.aiSelector] - Selector used as a size-estimate fallback.
 * @param {object|null} [params.benchmark] - Optional benchmark result.
 * @returns {void}
 */
function displayAiRunReference({ result, systemInfo, taskHint, candidateModels, localModels, aiSelector, benchmark }) {
    const chosenModel = result.bestModel;
    const installedEntry = findAiRunLocalModel(localModels, chosenModel);
    const sizeB = resolveAiRunModelSizeB(chosenModel, aiSelector, installedEntry);
    const estimate = estimateTokenSpeedFromHardware(systemInfo, {
        modelSizeB: sizeB,
        modelName: chosenModel
    });
    const workingSet = estimateAiRunWorkingSetGB(sizeB, installedEntry);
    const localTotal = result.localModelsCount || candidateModels.length;
    const databaseTotal = result.totalModelsEvaluated;

    const confidenceValue = Number(result.confidence);
    let confidenceLabel = 'N/A';
    if (Number.isFinite(confidenceValue)) {
        confidenceLabel = `${Math.round(confidenceValue * 100)}%`;
    }

    const ideal = result.recommendedFromDatabase;
    // The ideal model counts as missing only when explicitly reported as not installed.
    const idealMissing = ideal && ideal !== chosenModel && result.isRecommendedInstalled === false;
    const measured = formatAiRunMeasuredSpeed(benchmark);

    // Every row is "<gray label> <value>".
    const printRow = (label, text) => {
        console.log(`${chalk.gray(label)} ${text}`);
    };

    console.log('\n' + chalk.bold('AI Run reference'));
    console.log(chalk.gray('----------------'));
    printRow('Task:', chalk.white(taskHint || 'general'));
    printRow('Selected local model:', chalk.green.bold(chosenModel));

    if (ideal) {
        const availability = idealMissing ? chalk.yellow('not installed') : chalk.green('available');
        printRow('Best database match:', `${chalk.cyan(ideal)} ${chalk.gray('(')}${availability}${chalk.gray(')')}`);
    }

    printRow('Why this model:', formatAiRunReason(result.reasoning || result.reason));
    printRow('Confidence:', `${chalk.white(confidenceLabel)} ${chalk.gray(`via ${formatAiRunMethod(result.method)}`)}`);

    const databaseSuffix = databaseTotal ? chalk.gray(`, ${databaseTotal} database`) : '';
    printRow('Models evaluated:', `${chalk.white(`${localTotal} local`)}${databaseSuffix}`);

    printRow('Hardware:', formatAiRunHardwareSummary(systemInfo));
    printRow(
        'Estimated speed:',
        `${chalk.yellow(`~${estimate.tokensPerSecond} tokens/sec`)} ${chalk.gray(`${estimate.backend}, generation only`)}`
    );

    if (measured) {
        const paint = benchmark?.success ? chalk.green : chalk.yellow;
        printRow('Measured speed:', paint(measured));
    }

    printRow(
        'Memory reference:',
        chalk.white(`~${formatAiRunNumber(sizeB)}B params, ~${formatAiRunNumber(workingSet)}GB working set`)
    );

    if (idealMissing) {
        printRow('Install ideal model:', chalk.cyan(`ollama pull ${ideal}`));
    }
}
/**
 * Build the bracketed speed tag appended after a chat reply.
 *
 * A positive `evalTokensPerSecond` is preferred; otherwise `tokensPerSecond`
 * is used. When the chosen rate is not a positive finite number the tag reads
 * "[speed unavailable]".
 *
 * @param {object} [result={}] - Chat result carrying the rate fields.
 * @returns {string} e.g. "[42.5 tokens/sec]".
 */
function formatAiRunTurnSpeed(result = {}) {
    const evalRate = Number(result.evalTokensPerSecond);
    const rate = evalRate > 0 ? evalRate : Number(result.tokensPerSecond);
    const isUsable = Number.isFinite(rate) && rate > 0;

    return isUsable
        ? `[${formatAiRunNumber(rate)} tokens/sec]`
        : '[speed unavailable]';
}
/**
 * Send one chat turn to the model, echo the reply to stdout, and append a
 * gray speed tag followed by a blank line.
 *
 * Chunks passed to the streaming callback are written as they arrive. If the
 * callback never fires, the final text is written once instead. That final
 * text is taken from `result.response` or, failing that,
 * `result.message.content`, so a reply delivered only in the chat-message
 * shape is still shown.
 *
 * NOTE(review): assumes `client.streamChat(model, messages, options, onChunk)`
 * calls `onChunk` with text fragments and resolves to an object that may carry
 * `response` and/or `message.content`. Confirm against the Ollama client.
 *
 * @param {object} client - Client exposing `streamChat`.
 * @param {string} modelName - Model to chat with.
 * @param {Array<{role: string, content: string}>} messages - Conversation so far.
 * @returns {Promise<object>} The object resolved by `client.streamChat`.
 */
async function runAiRunChatTurn(client, modelName, messages) {
    let printed = false;
    const result = await client.streamChat(
        modelName,
        messages,
        {
            keepAlive: '5m',
            timeoutMs: 180000
        },
        (chunk) => {
            printed = true;
            process.stdout.write(chunk);
        }
    );

    const responseText = result.response || result.message?.content || '';
    // Nothing was streamed: print the complete reply from whichever field holds it.
    if (!printed && responseText) {
        process.stdout.write(responseText);
    }

    // Separate the speed tag from the reply unless the reply already ends in whitespace.
    const needsSpace = responseText.length > 0 && !/\s$/.test(responseText);
    process.stdout.write(`${needsSpace ? ' ' : ''}${chalk.gray(formatAiRunTurnSpeed(result))}\n\n`);
    return result;
}
/**
 * Ask one question on a readline interface and resolve with the answer, or
 * with null if the interface emits "close" before an answer arrives.
 *
 * Whichever of the two events happens first settles the promise; the other is
 * ignored. The "close" listener is removed once an answer is received.
 *
 * @param {object} rl - Interface exposing `question`, `once` and `off`.
 * @param {string} promptText - Prompt passed to `rl.question`.
 * @returns {Promise<string|null>} The answer, or null on close.
 */
function askAiRunQuestion(rl, promptText) {
    return new Promise((resolve) => {
        let done = false;

        function onClose() {
            if (done) return;
            done = true;
            resolve(null);
        }

        function onAnswer(answer) {
            if (done) return;
            done = true;
            rl.off('close', onClose);
            resolve(answer);
        }

        rl.once('close', onClose);
        rl.question(promptText, onAnswer);
    });
}
/**
 * Run an interactive chat loop on stdin/stdout against `modelName`.
 *
 * Each non-empty line is sent as a user message along with the accumulated
 * history, and the reply is appended to that history. The loop ends on
 * "/bye", "/exit", "/quit" or "q" (case-insensitive), when the readline
 * interface closes, or on SIGINT (which closes the interface). "/?" and
 * "/help" print the command list.
 *
 * If a chat request fails, the error is reported and the unanswered user
 * message is removed from the history. Otherwise later turns would re-send it
 * and the history would contain consecutive user messages with no reply.
 *
 * @param {object} client - Client passed through to `runAiRunChatTurn`.
 * @param {string} modelName - Model to chat with.
 * @returns {Promise<void>} Resolves when the chat session ends.
 */
async function runAiRunInteractiveChat(client, modelName) {
    const rl = readline.createInterface({
        input: process.stdin,
        output: process.stdout
    });
    const messages = [];
    let closed = false;

    rl.on('SIGINT', () => {
        process.stdout.write('\n');
        rl.close();
    });
    rl.on('close', () => {
        closed = true;
    });

    try {
        while (!closed) {
            const input = await askAiRunQuestion(rl, chalk.cyan('>>> '));
            if (input === null) break;

            const trimmed = String(input || '').trim();
            if (!trimmed) {
                continue;
            }

            const command = trimmed.toLowerCase();
            if (['/bye', '/exit', '/quit', 'q'].includes(command)) {
                break;
            }
            if (['/?', '/help'].includes(command)) {
                console.log('Commands: /bye, /exit, /quit');
                continue;
            }

            messages.push({ role: 'user', content: input });
            try {
                const response = await runAiRunChatTurn(client, modelName, messages);
                const assistantContent = response.response || response.message?.content || '';
                messages.push({ role: 'assistant', content: assistantContent });
            } catch (error) {
                // The last entry is the user message pushed above (the assistant
                // push is the final statement of the try block), so drop it.
                messages.pop();
                console.error(chalk.red(`Chat request failed: ${error.message}`));
            }
        }
    } finally {
        // Always release stdin, including when the loop exits via an exception.
        rl.close();
    }
}
 function displayModelsStats(originalCount, filteredCount, options) {
     console.log('\n' + chalk.bgGreen.white.bold('  DATABASE STATS '));
     console.log(chalk.green('╭' + '─'.repeat(60)));
@@ -1758,6 +2047,7 @@ function displaySimplifiedSystemInfo(hardware) {
     console.log(`Memory: ${chalk.white(memInfo)}`);
     console.log(`GPU: ${chalk.white(gpuInfo)}`);
     console.log(`Architecture: ${chalk.white(hardware.cpu.architecture)}`);
+    console.log(`Backend: ${chalk.white(getBackendLabelForDisplay(hardware))}`);
     const tier = getHardwareTierForDisplay(hardware);
     const tierColor = tier.includes('HIGH') ? chalk.green : tier.includes('MEDIUM') ? chalk.yellow : chalk.red;
@@ -3182,7 +3472,7 @@ program
         const spinner = ora('Checking Ollama integration...').start();
         try {
-            const checker = new (getLLMChecker())();
+            const checker = new (getLLMChecker())({ verbose: false });
             const analysis = await checker.analyze();
             if (!analysis.ollamaInfo.available) {
@@ -3884,14 +4174,15 @@ program
     .option('--json', 'Output in JSON format')
     .action(async (options) => {
         if (!options.json) showAsciiArt('list-models');
-        const spinner = ora('📋 Loading models database...').start();
+        const spinner = options.json ? null : ora('📋 Loading models database...').start();
         try {
             const checker = new (getLLMChecker())();
-            const data = await checker.ollamaScraper.scrapeAllModels(false);
+            const data = await checker.loadOllamaModelData();
             if (!data || !data.models) {
-                spinner.fail('No models found in database');
+                if (spinner) spinner.fail('No models found in database');
+                else console.error('No models found in database');
                 return;
             }
@@ -3982,9 +4273,9 @@ program
                         return (b.pulls || 0) - (a.pulls || 0);
                     });
-                    spinner.text = `Sorted by hardware compatibility (${getHardwareTierForDisplay(hardware)})`;
+                    if (spinner) spinner.text = `Sorted by hardware compatibility (${getHardwareTierForDisplay(hardware)})`;
                 } catch (error) {
-                    console.warn('Could not sort by hardware compatibility:', error.message);
+                    if (!options.json) console.warn('Could not sort by hardware compatibility:', error.message);
                     // Fall back to sorting by popularity
                     models.sort((a, b) => (b.pulls || 0) - (a.pulls || 0));
                 }
@@ -3997,7 +4288,7 @@ program
             const limit = parseInt(options.limit) || 50;
             const displayModels = models.slice(0, limit);
-            spinner.succeed(`✅ Found ${models.length} models (showing ${displayModels.length})`);
+            if (spinner) spinner.succeed(`✅ Found ${models.length} models (showing ${displayModels.length})`);
             if (options.json) {
                 console.log(JSON.stringify(displayModels, null, 2));
@@ -4020,7 +4311,7 @@ program
             }
         } catch (error) {
-            spinner.fail('Failed to load models');
+            if (spinner) spinner.fail('Failed to load models');
             console.error(chalk.red('Error:'), error.message);
             if (process.env.DEBUG) {
                 console.error(error.stack);
@@ -4121,6 +4412,8 @@ program
         '--calibrated [file]',
         'Enable calibrated routing policy (optional file path; defaults to ~/.llm-checker/calibration-policy.{yaml,yml,json})'
     )
+    .option('--benchmark', 'Run a short local speed test before launching')
+    .option('--reference-only', 'Show model choice and speed reference without launching Ollama')
     .action(async (options) => {
         showAsciiArt('ai-run');
         // Check if Ollama is installed first
@@ -4134,6 +4427,14 @@ program
             const aiSelector = new AIModelSelector();
             const checker = new (getLLMChecker())();
             const systemInfo = await checker.getSystemInfo();
+            let ollamaClient = null;
+            const getOllamaClient = () => {
+                if (!ollamaClient) {
+                    const OllamaClient = require('../src/ollama/client');
+                    ollamaClient = new OllamaClient();
+                }
+                return ollamaClient;
+            };
             const routingPreference = resolveRoutingPolicyPreference({
                 policyOption: options.policy,
                 calibratedOption: options.calibrated
@@ -4142,18 +4443,18 @@ program
             // Get available models or use provided ones
             let candidateModels = options.models;
+            let localModels = [];
             if (!candidateModels) {
-                spinner.text = '📋 Getting available Ollama models...';
-                const OllamaClient = require('../src/ollama/client');
-                const client = new OllamaClient();
+                spinner.text = 'Getting available Ollama models...';
+                const client = getOllamaClient();
                 try {
-                    const models = await client.getLocalModels();
-                    candidateModels = models.map(m => m.name || m.model);
+                    localModels = await client.getLocalModels();
+                    candidateModels = localModels.map(m => m.name || m.model);
                     if (candidateModels.length === 0) {
-                        spinner.fail('❌ No Ollama models found');
+                        spinner.fail('No Ollama models found');
                         console.log('\nInstall some models first:');
                         console.log('  ollama pull llama2:7b');
                         console.log('  ollama pull mistral:7b');
@@ -4161,7 +4462,7 @@ program
                         return;
                     }
                 } catch (error) {
-                    spinner.fail('❌ Failed to get Ollama models');
+                    spinner.fail('Failed to get Ollama models');
                     console.error(chalk.red('Error:'), error.message);
                     return;
                 }
@@ -4202,28 +4503,62 @@ program
                         )}) are not installed locally. Falling back to AI selector.`
                     );
                 }
-                result = await aiSelector.selectBestModel(candidateModels, systemSpecs, taskHint);
+                result = await aiSelector.selectBestModel(candidateModels, systemSpecs, taskHint, { silent: true });
             }
             spinner.succeed(`Selected ${chalk.green.bold(result.bestModel)} (${result.method}, ${Math.round(result.confidence * 100)}% confidence)`);
+            let benchmark = null;
+            if (options.benchmark) {
+                const benchmarkSpinner = ora(`Measuring local throughput for ${result.bestModel}...`).start();
+                try {
+                    benchmark = await getOllamaClient().testModelPerformance(
+                        result.bestModel,
+                        'Write one concise sentence about local LLM performance.'
+                    );
+                    if (benchmark.success) {
+                        benchmarkSpinner.succeed(`Measured ${formatAiRunNumber(benchmark.tokensPerSecond)} tokens/sec`);
+                    } else {
+                        benchmarkSpinner.stop();
+                        console.log(chalk.yellow(`Benchmark unavailable: ${benchmark.error || 'unknown error'}`));
+                    }
+                } catch (error) {
+                    benchmark = { success: false, error: error.message };
+                    benchmarkSpinner.stop();
+                    console.log(chalk.yellow(`Benchmark unavailable: ${error.message}`));
+                }
+            }
             displayCalibratedRoutingDecision('ai-run', calibratedPolicy, routeDecision, routingPreference.warnings);
+            displayAiRunReference({
+                result,
+                systemInfo,
+                taskHint,
+                candidateModels,
+                localModels,
+                aiSelector,
+                benchmark
+            });
+            if (options.referenceOnly) {
+                console.log(chalk.gray('\nReference-only mode: not launching Ollama.'));
+                return;
+            }
-            // Execute the selected model
-            console.log(chalk.magenta.bold(`\nLaunching ${result.bestModel}...`));
-            console.log(chalk.gray(`Tip: Type ${chalk.cyan('/bye')} to exit the chat when finished\n`));
-            const args = ['run', result.bestModel];
             if (options.prompt) {
-                args.push(options.prompt);
+                console.log(chalk.cyan(`\n>>> ${options.prompt}`));
+                await runAiRunChatTurn(
+                    getOllamaClient(),
+                    result.bestModel,
+                    [{ role: 'user', content: options.prompt }]
+                );
+                return;
             }
-            const ollamaProcess = spawn('ollama', args, {
-                stdio: 'inherit'
-            });
-            ollamaProcess.on('error', (error) => {
-                console.error(chalk.red('Failed to launch Ollama:'), error.message);
-            });
+            console.log(chalk.magenta.bold(`\nStarting chat with ${result.bestModel}...`));
+            console.log(chalk.gray(`Tip: Type ${chalk.cyan('/bye')} to exit the chat when finished\n`));
+            await runAiRunInteractiveChat(getOllamaClient(), result.bestModel);
         } catch (error) {
             console.error(chalk.red('❌ AI-powered execution failed:'), error.message);
@@ -5058,7 +5393,7 @@ program
             console.log(`  ${detector.getHardwareDescription()}`);
             console.log(`  Tier: ${chalk.cyan(detector.getHardwareTier().replace('_', ' ').toUpperCase())}`);
             console.log(`  Max model size: ${chalk.green(detector.getMaxModelSize() + 'GB')}`);
-            console.log(`  Best backend: ${chalk.cyan(hardware.summary.bestBackend)}`);
+            console.log(`  Best backend: ${chalk.cyan(getBackendLabelForDisplay(hardware))}`);
             if (hardware.summary.runtimeBackend && hardware.summary.runtimeBackend !== hardware.summary.bestBackend) {
                 console.log(`  Runtime assist: ${chalk.green(hardware.summary.runtimeBackendName || hardware.summary.runtimeBackend)}`);
             }
@@ -5106,9 +5441,23 @@ program
                 if (backend === 'rocm' && info.info) {
                     console.log(`  ROCm: ${info.info.rocmVersion}`);
-                    console.log(`  Total VRAM: ${info.info.totalVRAM}GB`);
+                    const integratedOnly = (info.info.gpus || []).length > 0 &&
+                        (info.info.gpus || []).every((gpu) => gpu.type === 'integrated');
+                    if (integratedOnly) {
+                        console.log(`  Total dedicated aperture: ${info.info.totalVRAM || 0}GB`);
+                        console.log(`  Total shared memory: ${info.info.totalSharedMemory || 0}GB`);
+                    } else {
+                        console.log(`  Total VRAM: ${info.info.totalVRAM}GB`);
+                    }
                     for (const gpu of info.info.gpus) {
-                        console.log(`  ${gpu.name}: ${gpu.memory.total}GB`);
+                        if (gpu.type === 'integrated') {
+                            const dedicated = gpu.memory?.dedicated || 0;
+                            const shared = gpu.memory?.shared || gpu.memory?.total || 0;
+                            const dedicatedLabel = dedicated > 0 ? `, ${dedicated}GB aperture` : '';
+                            console.log(`  ${gpu.name}: ${shared}GB shared${dedicatedLabel} (Integrated)`);
+                        } else {
+                            console.log(`  ${gpu.name}: ${gpu.memory.total}GB`);
+                        }
                     }
                 }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "llm-checker",
-  "version": "3.5.11",
+  "version": "3.5.13",
   "description": "Intelligent CLI tool with AI-powered model selection that analyzes your hardware and recommends optimal LLM models for your system",
   "bin": {
     "llm-checker": "bin/cli.js",
@@ -36,6 +36,7 @@
     "list-models": "node bin/enhanced_cli.js list-models",
     "ai-check": "node bin/enhanced_cli.js ai-check",
     "ai-run": "node bin/enhanced_cli.js ai-run",
+    "sync:seed": "node bin/enhanced_cli.js sync --force --quiet && node scripts/update-seed-db.js",
     "benchmark": "cd ml-model && python python/benchmark_collector.py",
     "train-ai": "cd ml-model && python python/train_model.py",
     "postinstall": "echo 'LLM Checker installed. Run: llm-checker hw-detect'"