npm - llm-checker - Versions diffs - 3.2.0 → 3.2.2 - Mend

llm-checker 3.2.0 → 3.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (30) hide show

package/README.md +106 -7
package/analyzer/compatibility.js +20 -0
package/bin/cli.js +14 -0
package/bin/enhanced_cli.js +580 -36
package/package.json +11 -3
package/src/ai/multi-objective-selector.js +28 -4
package/src/hardware/backends/cuda-detector.js +32 -11
package/src/hardware/detector.js +107 -5
package/src/hardware/specs.js +8 -1
package/src/index.js +161 -31
package/src/models/deterministic-selector.js +406 -22
package/src/models/expanded_database.js +8 -2
package/src/models/intelligent-selector.js +89 -4
package/src/models/scoring-engine.js +4 -0
package/src/models/speculative-decoding-estimator.js +245 -0
package/src/policy/audit-reporter.js +420 -0
package/src/policy/cli-policy.js +403 -0
package/src/policy/policy-engine.js +497 -0
package/src/policy/policy-manager.js +324 -0
package/src/provenance/model-provenance.js +176 -0
package/src/runtime/runtime-support.js +174 -0
package/bin/CLAUDE.md +0 -27
package/src/CLAUDE.md +0 -18
package/src/data/CLAUDE.md +0 -17
package/src/hardware/CLAUDE.md +0 -18
package/src/hardware/backends/CLAUDE.md +0 -17
package/src/models/CLAUDE.md +0 -23
package/src/ollama/CLAUDE.md +0 -30
package/src/plugins/CLAUDE.md +0 -17
package/src/utils/CLAUDE.md +0 -17

package/README.md CHANGED Viewed

@@ -17,6 +17,7 @@
   <a href="https://www.npmjs.com/package/llm-checker"><img src="https://img.shields.io/npm/v/llm-checker?style=flat-square&color=0066FF" alt="npm version"></a>
   <a href="https://www.npmjs.com/package/llm-checker"><img src="https://img.shields.io/npm/dm/llm-checker?style=flat-square&color=0066FF" alt="npm downloads"></a>
   <a href="https://opensource.org/licenses/MIT"><img src="https://img.shields.io/badge/License-MIT-0066FF?style=flat-square" alt="License"></a>
+  <a href="https://discord.gg/mnmYrA7T"><img src="https://img.shields.io/discord/1457032977849520374?style=flat-square&color=0066FF&label=Discord" alt="Discord"></a>
   <a href="https://nodejs.org/"><img src="https://img.shields.io/badge/node-%3E%3D16-0066FF?style=flat-square" alt="Node.js"></a>
 </p>
@@ -26,7 +27,8 @@
   <a href="#claude-code-mcp">Claude MCP</a> &bull;
   <a href="#commands">Commands</a> &bull;
   <a href="#scoring-system">Scoring</a> &bull;
-  <a href="#supported-hardware">Hardware</a>
+  <a href="#supported-hardware">Hardware</a> &bull;
+  <a href="https://discord.gg/mnmYrA7T"><img src="https://cdn.simpleicons.org/discord/0066FF" alt="Discord" width="14" height="14"> Discord</a>
 </p>
 ---
@@ -43,7 +45,7 @@ Choosing the right LLM for your hardware is complex. With thousands of model var
 | | Feature | Description |
 |:---:|---|---|
-| **35+** | Curated Models | Hand-picked catalog covering all major families and sizes (1B-32B) |
+| **200+** | Dynamic Model Pool | Uses full scraped Ollama catalog/variants when available (with curated fallback) |
 | **4D** | Scoring Engine | Quality, Speed, Fit, Context &mdash; weighted by use case |
 | **Multi-GPU** | Hardware Detection | Apple Silicon, NVIDIA CUDA, AMD ROCm, Intel Arc, CPU |
 | **Calibrated** | Memory Estimation | Bytes-per-parameter formula validated against real Ollama sizes |
@@ -52,6 +54,20 @@ Choosing the right LLM for your hardware is complex. With thousands of model var
 ---
+## Comparison with Other Tooling (e.g. `llmfit`)
+LLM Checker and `llmfit` solve related but different problems:
+| Tool | Primary Focus | Typical Output |
+|------|---------------|----------------|
+| **LLM Checker** | Hardware-aware **model selection** for local inference | Ranked recommendations, compatibility scores, pull/run commands |
+| **llmfit** | LLM workflow support and model-fit evaluation from another angle | Different optimization workflow and selection heuristics |
+If your goal is: *"What should I run on this exact machine right now?"*, use **LLM Checker** first.
+If your goal is broader experimentation across custom pipelines, using both tools can be complementary.
+---
 ## Installation
 ```bash
@@ -73,6 +89,32 @@ npm install sql.js
 ---
+## Distribution
+LLM Checker is published on all primary channels:
+- npm (latest): [`llm-checker@3.2.1`](https://www.npmjs.com/package/llm-checker)
+- GitHub Release: [`v3.2.1` (2026-02-17)](https://github.com/Pavelevich/llm-checker/releases/tag/v3.2.1)
+- GitHub Packages: [`@pavelevich/llm-checker`](https://github.com/users/Pavelevich/packages/npm/package/llm-checker)
+### v3.2.1 Highlights
+- Added vLLM/MLX runtime support and speculative decoding estimation.
+- Improved GPU detection, added DGX Spark/GB10 support, strengthened Node runtime guards, and updated tooling comparison notes.
+### Optional: Install from GitHub Packages
+```bash
+# 1) Configure registry + token (PAT with read:packages)
+echo "@pavelevich:registry=https://npm.pkg.github.com" >> ~/.npmrc
+echo "//npm.pkg.github.com/:_authToken=${GITHUB_TOKEN}" >> ~/.npmrc
+# 2) Install
+npm install -g @pavelevich/llm-checker@3.2.1
+```
+---
 ## Quick Start
 ```bash
@@ -184,6 +226,58 @@ Claude will automatically call the right tools and give you actionable results.
 | `search <query>` | Search models with filters and intelligent scoring |
 | `smart-recommend` | Advanced recommendations using the full scoring engine |
+### Enterprise Policy Commands
+| Command | Description |
+|---------|-------------|
+| `policy init` | Generate a `policy.yaml` template for enterprise governance |
+| `policy validate` | Validate a policy file and return non-zero on schema errors |
+| `audit export` | Evaluate policy outcomes and export compliance reports (`json`, `csv`, `sarif`) |
+### Policy Enforcement in `check` and `recommend`
+Both `check` and `recommend` support `--policy <file>`.
+- In `audit` mode, policy violations are reported but the command exits with `0`.
+- In `enforce` mode, blocking violations return a non-zero exit code (default `1`).
+- You can override the non-zero code with `enforcement.exit_code` in `policy.yaml`.
+Examples:
+```bash
+llm-checker check --policy ./policy.yaml
+llm-checker check --policy ./policy.yaml --use-case coding --runtime vllm
+llm-checker recommend --policy ./policy.yaml --category coding
+```
+### Policy Audit Export
+Use `audit export` when you need machine-readable compliance evidence for CI/CD gates, governance reviews, or security tooling.
+```bash
+# Single report format
+llm-checker audit export --policy ./policy.yaml --command check --format json --out ./reports/check-policy.json
+# Export all configured formats (json, csv, sarif)
+llm-checker audit export --policy ./policy.yaml --command check --format all --out-dir ./reports
+```
+- `--command check|recommend` chooses the candidate source.
+- `--format all` honors `reporting.formats` in your policy (falls back to `json,csv,sarif`).
+- In `enforce` mode with blocking violations, reports are still written before the non-zero exit.
+### Provenance Fields in Reports
+Each finding includes normalized model provenance fields:
+- `source`
+- `registry`
+- `version`
+- `license`
+- `digest`
+If a field is unavailable from model metadata, reports use `"unknown"` instead of omitting the field. This keeps downstream parsers deterministic.
 ### AI Commands
 | Command | Description |
@@ -263,7 +357,9 @@ llm-checker search qwen --quant Q4_K_M --max-size 8
 ## Model Catalog
-The built-in catalog includes 35+ models from the most popular Ollama families:
+LLM Checker prioritizes the full scraped Ollama model cache (all families/sizes/variants) and falls back to a built-in curated catalog when the cache is unavailable.
+The curated fallback catalog includes 35+ models from the most popular Ollama families:
 | Family | Models | Best For |
 |--------|--------|----------|
@@ -277,7 +373,7 @@ The built-in catalog includes 35+ models from the most popular Ollama families:
 | **LLaVA** | 7B, 13B | Vision |
 | **Embeddings** | nomic-embed-text, mxbai-embed-large, bge-m3, all-minilm | RAG, search |
-Models are automatically combined with any locally installed Ollama models for scoring.
+All available models are automatically combined with locally installed Ollama models for scoring.
 ---
@@ -404,7 +500,7 @@ The selector automatically picks the best quantization that fits your available
 **Selector Pipeline:**
 1. **Hardware profiling** &mdash; CPU, GPU, RAM, acceleration backend
-2. **Model pool** &mdash; Merge catalog + installed Ollama models (deduped)
+2. **Model pool** &mdash; Merge full Ollama scraped pool (or curated fallback) + installed models (deduped)
 3. **Category filter** &mdash; Keep models relevant to the use case
 4. **Quantization selection** &mdash; Best quant that fits in memory budget
 5. **4D scoring** &mdash; Q, S, F, C with category-specific weights
@@ -463,7 +559,7 @@ src/
     deterministic-selector.js  # Primary selection algorithm
     scoring-config.js          # Centralized scoring weights
     scoring-engine.js          # Advanced scoring (smart-recommend)
-    catalog.json               # Curated model catalog (35+ models)
+    catalog.json               # Curated fallback catalog (35+ models)
   ai/
     multi-objective-selector.js  # Multi-objective optimization
     ai-check-selector.js        # LLM-based evaluation
@@ -487,6 +583,9 @@ MIT License &mdash; see [LICENSE](LICENSE) for details.
 <p align="center">
   <a href="https://github.com/Pavelevich/llm-checker">GitHub</a> &bull;
+  <a href="https://github.com/Pavelevich/llm-checker/releases">Releases</a> &bull;
   <a href="https://www.npmjs.com/package/llm-checker">npm</a> &bull;
-  <a href="https://github.com/Pavelevich/llm-checker/issues">Issues</a>
+  <a href="https://github.com/users/Pavelevich/packages/npm/package/llm-checker">GitHub Packages</a> &bull;
+  <a href="https://github.com/Pavelevich/llm-checker/issues">Issues</a> &bull;
+  <a href="https://discord.gg/mnmYrA7T">Discord</a>
 </p>

package/analyzer/compatibility.js CHANGED Viewed

@@ -1,4 +1,10 @@
 const { getLogger } = require('../src/utils/logger');
+const {
+    normalizeRuntime,
+    getRuntimeDisplayName,
+    runtimeSupportedOnHardware,
+    runtimeSupportsSpeculativeDecoding
+} = require('../src/runtime/runtime-support');
 class CompatibilityAnalyzer {
     constructor() {
@@ -451,6 +457,7 @@ class CompatibilityAnalyzer {
     generateRecommendations(hardware, results, options = {}) {
         const recommendations = [];
+        const runtime = normalizeRuntime(options.runtime || 'ollama');
         const tier = this.getHardwareTier(hardware);
         if (hardware.memory.total < 16) {
@@ -511,6 +518,19 @@ class CompatibilityAnalyzer {
             }
         }
+        if (runtime !== 'ollama') {
+            const runtimeLabel = getRuntimeDisplayName(runtime);
+            if (runtimeSupportedOnHardware(runtime, hardware)) {
+                recommendations.push(`Runtime selected: ${runtimeLabel}`);
+            } else {
+                recommendations.push(`${runtimeLabel} is not recommended on this hardware (fallback to Ollama).`);
+            }
+            if (runtimeSupportsSpeculativeDecoding(runtime)) {
+                recommendations.push(`Enable speculative decoding in ${runtimeLabel} for higher throughput.`);
+            }
+        }
         return recommendations;
     }

package/bin/cli.js ADDED Viewed

@@ -0,0 +1,14 @@
+#!/usr/bin/env node
+'use strict';
+const majorNodeVersion = Number.parseInt(process.versions.node.split('.')[0], 10); // first dot-separated component of the running Node.js version, parsed as base-10
+if (!Number.isFinite(majorNodeVersion) || majorNodeVersion < 16) { // guard: version could not be parsed, or is older than 16
+    console.error(
+        `[llm-checker] Unsupported Node.js version: ${process.versions.node}. ` +
+        'Please use Node.js 16 or newer.'
+    );
+    process.exit(1); // stop with a non-zero status before the CLI module is loaded
+}
+require('./enhanced_cli'); // reached only when the version guard above did not exit