npm - @dotsetlabs/bellwether - Versions diffs - 1.0.1 → 1.0.3 - Mend

@dotsetlabs/bellwether 1.0.1 → 1.0.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

package/CHANGELOG.md +50 -0
package/README.md +3 -2
package/dist/cache/response-cache.d.ts +4 -2
package/dist/cache/response-cache.js +68 -30
package/dist/cli/commands/baseline.js +23 -4
package/dist/cli/commands/check.js +212 -36
package/dist/cli/commands/registry.js +143 -5
package/dist/cli/index.js +6 -4
package/dist/cli/output.d.ts +1 -0
package/dist/cli/output.js +32 -8
package/dist/config/template.d.ts +2 -0
package/dist/config/template.js +8 -2
package/dist/interview/interviewer.js +70 -50
package/dist/interview/orchestrator.js +49 -22
package/dist/llm/anthropic.js +49 -16
package/dist/llm/client.d.ts +2 -0
package/dist/llm/client.js +61 -0
package/dist/llm/ollama.js +9 -4
package/dist/llm/openai.js +34 -23
package/dist/transport/base-transport.d.ts +1 -1
package/dist/transport/http-transport.d.ts +2 -2
package/dist/transport/http-transport.js +26 -6
package/dist/transport/mcp-client.d.ts +18 -6
package/dist/transport/mcp-client.js +49 -19
package/dist/transport/sse-transport.d.ts +1 -1
package/dist/transport/sse-transport.js +4 -2
package/dist/transport/stdio-transport.d.ts +1 -1
package/dist/transport/stdio-transport.js +1 -1
package/dist/utils/timeout.d.ts +10 -2
package/dist/utils/timeout.js +9 -5
package/dist/version.js +1 -1
package/dist/workflow/executor.js +18 -13
package/dist/workflow/loader.js +4 -1
package/dist/workflow/state-tracker.js +22 -18
package/man/bellwether.1 +204 -0
package/man/bellwether.1.md +148 -0
package/package.json +8 -9

package/CHANGELOG.md CHANGED Viewed

@@ -7,6 +7,56 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 ## [Unreleased]
+## [1.0.3] - 2026-02-02
+### Added
+- Added `version` input to GitHub Action for explicit npm version selection
+  - Action now derives version from ref (e.g., `v1.0.3`) or accepts explicit `inputs.version`
+  - Provides clear error message when version cannot be determined
+- Added `signal` option to LLM completion requests for request cancellation via AbortSignal
+- Added AbortController integration to timeout utilities for proper request cancellation
+- Added JSON extraction from mixed LLM responses (handles prose around JSON blocks)
+### Changed
+- Improved timeout handling with AbortController propagation across LLM and transport layers
+- Improved error handling and resource cleanup in interview, orchestrator, and transport modules
+- Refactored response cache, workflow executor, and state tracker for better reliability
+- Updated CI/CD and GitHub/GitLab integration documentation
+### Fixed
+- Fixed GitHub Action stderr handling in check command output capture
+- Fixed various code formatting and linting issues across LLM clients and transport modules
+## [1.0.2] - 2026-01-30
+### Added
+- Added SARIF and JUnit output format support for `bellwether check` without baseline comparison
+  - Use `--format sarif` for GitHub Code Scanning integration
+  - Use `--format junit` for CI/CD test reporting
+- Added registry validation indicators showing environment variable requirements
+  - Servers requiring setup now display ⚙ indicator
+  - Environment variables show ✓/✗ status based on whether they're set
+  - Automatic detection of common service patterns (postgres→DATABASE_URL, etc.)
+  - Setup hints displayed for unconfigured servers
+### Changed
+- Security and thorough presets now enable security testing by default (`check.security.enabled: true`)
+### Fixed
+- Fixed baseline path resolution in `baseline compare` to be consistent with `baseline show`
+  - Now checks both output directory and current working directory before failing
+- Fixed `bellwether auth status` requiring a config file
+  - Auth commands now work without bellwether.yaml present
+- Fixed ANSI escape codes appearing in non-TTY output (e.g., when piping to files)
+  - StreamingDisplay now checks for TTY before applying ANSI styling
+  - Automatically respects `NO_COLOR` and `FORCE_COLOR=0` environment variables
 ## [1.0.1] - 2026-01-29
 ### Added

package/README.md CHANGED Viewed

@@ -124,8 +124,9 @@ Requires LLM (Ollama for free local, or OpenAI/Anthropic). Generates `AGENTS.md`
 ## GitHub Action
 ```yaml
-- uses: dotsetlabs/bellwether@v1
+- uses: dotsetlabs/bellwether@v1.0.2
   with:
+    version: '1.0.2'
     server-command: 'npx @mcp/your-server'
     baseline-path: './bellwether-baseline.json'
     fail-on-severity: 'warning'
@@ -167,7 +168,7 @@ bellwether init --preset local npx @mcp/server # Local Ollama (free)
 ```bash
 git clone https://github.com/dotsetlabs/bellwether
-cd bellwether/cli
+cd bellwether
 npm install
 npm run build
 npm test

package/dist/cache/response-cache.d.ts CHANGED Viewed

@@ -10,6 +10,8 @@ export interface CacheEntry<T> {
     value: T;
     /** When the entry was created */
     createdAt: Date;
+    /** When the entry was last accessed */
+    lastAccessedAt: Date;
     /** When the entry expires */
     expiresAt: Date;
     /** Cache key (hash) */
@@ -99,9 +101,9 @@ export declare class ResponseCache {
      */
     private evictIfNeeded;
     /**
-     * Evict the oldest entry (LRU based on creation time).
+     * Evict the least recently used entry (LRU based on last access time).
      */
-    private evictOldest;
+    private evictLeastRecentlyUsed;
     /**
      * Estimate the size of a value in bytes.
      */

package/dist/cache/response-cache.js CHANGED Viewed

@@ -30,21 +30,9 @@ export class ResponseCache {
      * Generate a cache key from input data.
      */
     generateKey(...parts) {
-        const serialized = parts.map((p) => {
-            if (typeof p === 'string')
-                return p;
-            if (typeof p === 'undefined')
-                return 'undefined';
-            if (p === null)
-                return 'null';
-            try {
-                return JSON.stringify(p, Object.keys(p).sort());
-            }
-            catch {
-                return String(p);
-            }
-        }).join('|');
-        return createHash('sha256').update(serialized).digest('hex').slice(0, 16);
+        const serialized = parts.map((p) => stableStringify(p)).join('|');
+        // Use 128-bit hash (32 hex chars) to reduce collision risk.
+        return createHash('sha256').update(serialized).digest('hex').slice(0, 32);
     }
     /**
      * Get an entry from cache.
@@ -66,6 +54,7 @@ export class ResponseCache {
             return undefined;
         }
         entry.hitCount++;
+        entry.lastAccessedAt = new Date();
         this.stats.hits++;
         logger.debug({ key, hitCount: entry.hitCount }, 'Cache hit');
         return entry.value;
@@ -86,6 +75,7 @@ export class ResponseCache {
         const entry = {
             value,
             createdAt: now,
+            lastAccessedAt: now,
             expiresAt: new Date(now.getTime() + ttl),
             key,
             description: options?.description,
@@ -168,31 +158,30 @@ export class ResponseCache {
     evictIfNeeded(newEntrySize) {
         // Check entry count
         while (this.cache.size >= this.config.maxEntries) {
-            this.evictOldest();
+            this.evictLeastRecentlyUsed();
         }
         // Check size
-        while (this.totalSizeBytes + newEntrySize > this.config.maxSizeBytes &&
-            this.cache.size > 0) {
-            this.evictOldest();
+        while (this.totalSizeBytes + newEntrySize > this.config.maxSizeBytes && this.cache.size > 0) {
+            this.evictLeastRecentlyUsed();
         }
     }
     /**
-     * Evict the oldest entry (LRU based on creation time).
+     * Evict the least recently used entry (LRU based on last access time).
      */
-    evictOldest() {
-        let oldestKey;
-        let oldestTime = Infinity;
+    evictLeastRecentlyUsed() {
+        let lruKey;
+        let oldestAccessTime = Infinity;
         for (const [key, entry] of this.cache) {
-            const time = entry.createdAt.getTime();
-            if (time < oldestTime) {
-                oldestTime = time;
-                oldestKey = key;
+            const time = entry.lastAccessedAt.getTime();
+            if (time < oldestAccessTime) {
+                oldestAccessTime = time;
+                lruKey = key;
             }
         }
-        if (oldestKey) {
-            this.delete(oldestKey);
+        if (lruKey) {
+            this.delete(lruKey);
             this.stats.evictions++;
-            logger.debug({ key: oldestKey }, 'Evicted cache entry');
+            logger.debug({ key: lruKey }, 'Evicted cache entry');
         }
     }
     /**
@@ -207,6 +196,55 @@ export class ResponseCache {
         }
     }
 }
+/**
+ * Stable, deterministic JSON stringify with deep key sorting.
+ *
+ * Object keys are sorted at every depth so that structurally equal values
+ * produce the same string regardless of property insertion order.
+ * BigInt, symbol and function values are converted to strings, Dates to
+ * their ISO representation, and a reference back to an object that is
+ * currently being serialized is replaced by the marker '[Circular]'.
+ *
+ * @param value - Any value to serialize.
+ * @returns The JSON text, or the literal string 'undefined' when the value
+ *          has no JSON representation (e.g. `undefined` itself).
+ */
+function stableStringify(value) {
+    // Holds only the containers on the path from the root to the value being
+    // visited. Entries are removed again on the way back up, so an object that
+    // is merely referenced twice (a shared, non-circular reference) is
+    // serialized in full both times instead of being reported as circular.
+    const ancestors = new WeakSet();
+    const normalize = (input) => {
+        if (input === null || input === undefined)
+            return input;
+        const type = typeof input;
+        if (type === 'string' || type === 'number' || type === 'boolean') {
+            return input;
+        }
+        if (type === 'bigint') {
+            return input.toString();
+        }
+        if (type === 'symbol' || type === 'function') {
+            return String(input);
+        }
+        if (input instanceof Date) {
+            // toISOString() throws a RangeError for an invalid Date.
+            return Number.isNaN(input.getTime()) ? String(input) : input.toISOString();
+        }
+        // Everything left is an array or another object. Both are tracked so
+        // that a self-referencing array cannot recurse without bound.
+        if (ancestors.has(input)) {
+            return '[Circular]';
+        }
+        ancestors.add(input);
+        try {
+            if (Array.isArray(input)) {
+                return input.map((item) => normalize(item));
+            }
+            const normalized = {};
+            for (const key of Object.keys(input).sort()) {
+                normalized[key] = normalize(input[key]);
+            }
+            return normalized;
+        }
+        finally {
+            ancestors.delete(input);
+        }
+    };
+    const json = JSON.stringify(normalize(value));
+    return json === undefined ? 'undefined' : json;
+}
 /**
  * Specialized cache for tool responses.
  */

package/dist/cli/commands/baseline.js CHANGED Viewed

@@ -146,12 +146,31 @@ baselineCommand
         output.error('No baseline path provided. Set baseline.path or baseline.comparePath in config, or pass a path argument.');
         process.exit(EXIT_CODES.ERROR);
     }
-    const baselineBaseDir = baselinePath ? process.cwd() : outputDir;
-    const fullBaselinePath = resolvedBaselinePath.startsWith('/')
-        ? resolvedBaselinePath
-        : join(baselineBaseDir, resolvedBaselinePath);
+    // Resolve baseline path consistently with 'show' command:
+    // 1. If absolute path, use as-is
+    // 2. First try relative to outputDir (e.g., .bellwether/)
+    // 3. Fall back to relative to cwd
+    let fullBaselinePath;
+    if (resolvedBaselinePath.startsWith('/')) {
+        fullBaselinePath = resolvedBaselinePath;
+    }
+    else {
+        const outputDirPath = join(outputDir, resolvedBaselinePath);
+        const cwdPath = join(process.cwd(), resolvedBaselinePath);
+        if (existsSync(outputDirPath)) {
+            fullBaselinePath = outputDirPath;
+        }
+        else if (existsSync(cwdPath)) {
+            fullBaselinePath = cwdPath;
+        }
+        else {
+            // Default to outputDir path for error message consistency
+            fullBaselinePath = outputDirPath;
+        }
+    }
     if (!existsSync(fullBaselinePath)) {
         output.error(`Baseline not found: ${fullBaselinePath}`);
+        output.error('\nRun `bellwether baseline save` to create a baseline.');
         process.exit(EXIT_CODES.ERROR);
     }
     let previousBaseline;

package/dist/cli/commands/check.js CHANGED Viewed

@@ -13,7 +13,7 @@ import { MCPClient } from '../../transport/mcp-client.js';
 import { discover } from '../../discovery/discovery.js';
 import { Interviewer } from '../../interview/interviewer.js';
 import { generateContractMd, generateJsonReport } from '../../docs/generator.js';
-import { loadConfig, ConfigNotFoundError, parseCommandString } from '../../config/loader.js';
+import { loadConfig, ConfigNotFoundError, parseCommandString, } from '../../config/loader.js';
 import { validateConfigForCheck, getConfigWarnings } from '../../config/validator.js';
 import { createBaseline, loadBaseline, saveBaseline, getToolFingerprints, toToolCapability, compareBaselines, acceptDrift, formatDiffText, formatDiffJson, formatDiffCompact, formatDiffGitHubActions, formatDiffMarkdown, formatDiffJUnit, formatDiffSarif, applySeverityConfig, shouldFailOnDiff, analyzeForIncremental, formatIncrementalSummary, runSecurityTests, parseSecurityCategories, getAllSecurityCategories, } from '../../baseline/index.js';
 import { convertAssertions } from '../../baseline/converter.js';
@@ -21,7 +21,7 @@ import { getMetricsCollector, resetMetricsCollector } from '../../metrics/collec
 import { getGlobalCache, resetGlobalCache } from '../../cache/response-cache.js';
 import { InterviewProgressBar, formatCheckBanner } from '../utils/progress.js';
 import { buildCheckSummary, colorizeConfidence, formatConfidenceLevel, formatToolResultLine, } from '../output/terminal-reporter.js';
-import { loadScenariosFromFile, tryLoadDefaultScenarios, DEFAULT_SCENARIOS_FILE } from '../../scenarios/index.js';
+import { loadScenariosFromFile, tryLoadDefaultScenarios, DEFAULT_SCENARIOS_FILE, } from '../../scenarios/index.js';
 import { loadWorkflowsFromFile, tryLoadDefaultWorkflows, DEFAULT_WORKFLOWS_FILE, WorkflowExecutor, generateWorkflowsFromTools, generateWorkflowYamlContent, } from '../../workflow/index.js';
 import * as output from '../output.js';
 import { extractServerContextFromArgs } from '../utils/server-context.js';
@@ -73,14 +73,6 @@ export const checkCommand = new Command('check')
         output.error(error instanceof Error ? error.message : String(error));
         process.exit(EXIT_CODES.ERROR);
     }
-    const warnings = getConfigWarnings(config);
-    if (warnings.length > 0) {
-        output.warn('Configuration warnings:');
-        for (const warning of warnings) {
-            output.warn(`  - ${warning}`);
-        }
-        output.newline();
-    }
     // Extract settings from config
     const timeout = config.server.timeout;
     const outputDir = config.output.dir;
@@ -105,7 +97,8 @@ export const checkCommand = new Command('check')
         minimumSeverity: options.minSeverity ?? config.baseline.severity.minimumSeverity,
         failOnSeverity: options.failOnSeverity ?? config.baseline.severity.failOnSeverity,
         suppressWarnings: config.baseline.severity.suppressWarnings,
-        aspectOverrides: config.baseline.severity.aspectOverrides,
+        aspectOverrides: config.baseline.severity
+            .aspectOverrides,
     };
     // Resolve check options from config (no CLI overrides for these)
     const incrementalEnabled = config.check.incremental;
@@ -114,9 +107,26 @@ export const checkCommand = new Command('check')
     const parallelWorkers = config.check.parallelWorkers;
     const performanceThreshold = config.check.performanceThreshold / PERCENTAGE_CONVERSION.DIVISOR;
     const diffFormat = options.format ?? config.check.diffFormat;
+    const machineReadableFormats = new Set(['json', 'junit', 'sarif']);
+    const machineReadable = machineReadableFormats.has(String(diffFormat).toLowerCase());
+    if (machineReadable) {
+        // Suppress standard CLI output to keep stdout clean for machine-readable formats.
+        output.configureOutput({ quiet: true });
+    }
+    const warnings = getConfigWarnings(config);
+    if (warnings.length > 0) {
+        output.warn('Configuration warnings:');
+        for (const warning of warnings) {
+            output.warn(`  - ${warning}`);
+        }
+        if (!machineReadable) {
+            output.newline();
+        }
+    }
     // Resolve security options from config
     const securityEnabled = config.check.security.enabled;
-    let securityCategories = config.check.security.categories;
+    let securityCategories = config.check.security
+        .categories;
     // Validate security categories
     try {
         securityCategories = parseSecurityCategories(securityCategories.join(','));
@@ -141,13 +151,15 @@ export const checkCommand = new Command('check')
         ? `${serverCommand} ${args.join(' ')}`.trim()
         : (remoteUrl ?? 'unknown');
     // Display startup banner
-    const banner = formatCheckBanner({
-        serverCommand: serverIdentifier,
-    });
-    output.info(banner);
-    output.newline();
-    output.info('Check: Schema validation and drift detection (free, deterministic)');
-    output.newline();
+    if (!machineReadable) {
+        const banner = formatCheckBanner({
+            serverCommand: serverIdentifier,
+        });
+        output.info(banner);
+        output.newline();
+        output.info('Check: Schema validation and drift detection (free, deterministic)');
+        output.newline();
+    }
     // Initialize metrics collector
     resetMetricsCollector();
     const metricsCollector = getMetricsCollector();
@@ -182,9 +194,12 @@ export const checkCommand = new Command('check')
         }
         // Discovery phase
         output.info('Discovering capabilities...');
-        const discovery = await discover(mcpClient, transport === 'stdio' ? serverCommand : remoteUrl ?? serverCommand, transport === 'stdio' ? args : []);
+        const discovery = await discover(mcpClient, transport === 'stdio' ? serverCommand : (remoteUrl ?? serverCommand), transport === 'stdio' ? args : []);
         const resourceCount = discovery.resources?.length ?? 0;
-        const discoveryParts = [`${discovery.tools.length} tools`, `${discovery.prompts.length} prompts`];
+        const discoveryParts = [
+            `${discovery.tools.length} tools`,
+            `${discovery.prompts.length} prompts`,
+        ];
         if (resourceCount > 0) {
             discoveryParts.push(`${resourceCount} resources`);
         }
@@ -228,7 +243,9 @@ export const checkCommand = new Command('check')
             }
             else {
                 incrementalBaseline = loadBaseline(baselinePath);
-                const result = analyzeForIncremental(discovery.tools, incrementalBaseline, { maxCacheAgeHours: incrementalCacheHours });
+                const result = analyzeForIncremental(discovery.tools, incrementalBaseline, {
+                    maxCacheAgeHours: incrementalCacheHours,
+                });
                 incrementalResult = result;
                 const summary = formatIncrementalSummary(result.changeSummary);
                 output.info(`Incremental analysis: ${summary}`);
@@ -240,7 +257,7 @@ export const checkCommand = new Command('check')
                 else {
                     output.info(`Testing ${result.toolsToTest.length} tools (${result.toolsToSkip.length} cached)\n`);
                     // Filter discovery to only include tools that need testing
-                    discovery.tools = discovery.tools.filter(t => result.toolsToTest.includes(t.name));
+                    discovery.tools = discovery.tools.filter((t) => result.toolsToTest.includes(t.name));
                 }
             }
         }
@@ -323,7 +340,7 @@ export const checkCommand = new Command('check')
             interviewer.setServerContext(serverContext);
         }
         // Set up progress display
-        const progressBar = new InterviewProgressBar({ enabled: !verbose });
+        const progressBar = new InterviewProgressBar({ enabled: !verbose && !machineReadable });
         const reportedTools = new Set();
         const progressCallback = (progress) => {
             if (verbose) {
@@ -462,7 +479,7 @@ export const checkCommand = new Command('check')
                         try {
                             const response = await mcpClient.callTool(tool.name, args);
                             const content = response.content
-                                .map((c) => c.type === 'text' ? c.text : '')
+                                .map((c) => (c.type === 'text' ? c.text : ''))
                                 .join('\n');
                             return {
                                 isError: response.isError ?? false,
@@ -580,7 +597,7 @@ export const checkCommand = new Command('check')
                     const workflowResult = await workflowExecutor.execute(workflow);
                     workflowResults.push(workflowResult);
                     const statusIcon = workflowResult.success ? '\u2713' : '\u2717';
-                    const stepsInfo = `${workflowResult.steps.filter(s => s.success).length}/${workflow.steps.length} steps`;
+                    const stepsInfo = `${workflowResult.steps.filter((s) => s.success).length}/${workflow.steps.length} steps`;
                     if (workflowResult.success) {
                         output.success(`  ${statusIcon} ${workflow.name} (${stepsInfo}) - ${workflowResult.durationMs}ms`);
                     }
@@ -599,7 +616,7 @@ export const checkCommand = new Command('check')
                 }
             }
             // Workflow summary
-            const passed = workflowResults.filter(r => r.success).length;
+            const passed = workflowResults.filter((r) => r.success).length;
             const failed = workflowResults.length - passed;
             output.newline();
             if (failed === 0) {
@@ -631,9 +648,7 @@ export const checkCommand = new Command('check')
         }
         if (writeJson) {
             // Add workflow results to the result object for the JSON report
-            const resultWithWorkflows = workflowResults.length > 0
-                ? { ...result, workflowResults }
-                : result;
+            const resultWithWorkflows = workflowResults.length > 0 ? { ...result, workflowResults } : result;
             let jsonReport;
             try {
                 jsonReport = generateJsonReport(resultWithWorkflows, {
@@ -671,10 +686,7 @@ export const checkCommand = new Command('check')
         if (incrementalResult && incrementalResult.cachedFingerprints.length > 0) {
             // Merge new fingerprints with cached ones
             const cachedTools = incrementalResult.cachedFingerprints.map(toToolCapability);
-            const mergedTools = [
-                ...currentBaseline.capabilities.tools,
-                ...cachedTools,
-            ].sort((a, b) => a.name.localeCompare(b.name));
+            const mergedTools = [...currentBaseline.capabilities.tools, ...cachedTools].sort((a, b) => a.name.localeCompare(b.name));
             currentBaseline = {
                 ...currentBaseline,
                 capabilities: {
@@ -768,6 +780,18 @@ export const checkCommand = new Command('check')
             saveBaseline(currentBaseline, saveBaselinePath);
             output.info(`\nBaseline saved: ${saveBaselinePath}`);
         }
+        // Output formatted results for sarif/junit when no baseline comparison
+        // This allows CI systems to consume check results even without drift detection
+        if (!baselinePath) {
+            const formattedCheckResults = formatCheckResults(currentBaseline, diffFormat);
+            if (formattedCheckResults) {
+                if (!machineReadable) {
+                    output.info('\n--- Check Results ---');
+                }
+                // Output directly to stdout for machine-readable formats
+                console.log(formattedCheckResults);
+            }
+        }
         // Handle baseline comparison
         if (baselinePath) {
             if (!existsSync(baselinePath)) {
@@ -780,10 +804,17 @@ export const checkCommand = new Command('check')
             });
             // Apply severity configuration (filtering, overrides)
             const diff = applySeverityConfig(rawDiff, severityConfig);
-            output.info('\n--- Drift Report ---');
+            if (!machineReadable) {
+                output.info('\n--- Drift Report ---');
+            }
             // Select formatter based on --format option
             const formattedDiff = formatDiff(diff, diffFormat, baselinePath);
-            output.info(formattedDiff);
+            if (machineReadable) {
+                console.log(formattedDiff);
+            }
+            else {
+                output.info(formattedDiff);
+            }
             // Report performance regressions if detected
             if (diff.performanceReport?.hasRegressions) {
                 output.warn('\n--- Performance Regressions ---');
@@ -919,4 +950,149 @@ function formatDiff(diff, format, baselinePath) {
             return formatDiffText(diff);
     }
 }
+/**
+ * Format check results as JUnit XML (for CI systems that expect test results).
+ * This is used when --format junit is specified but no baseline comparison occurs.
+ *
+ * Emits one <testcase> per tool fingerprint, plus one failing
+ * "<tool>-security" <testcase> for every tool that has at least one
+ * critical or high risk security finding.
+ *
+ * @param baseline - Baseline handed to getToolFingerprints() to obtain the tools.
+ * @returns The JUnit XML document as a single newline-joined string.
+ */
+function formatCheckResultsJUnit(baseline) {
+    // Tool names, finding titles and CWE ids are interpolated into attribute
+    // values and element text, so they must be escaped to keep the document
+    // well-formed.
+    const escapeXml = (value) => String(value)
+        .replace(/&/g, '&amp;')
+        .replace(/</g, '&lt;')
+        .replace(/>/g, '&gt;')
+        .replace(/"/g, '&quot;')
+        .replace(/'/g, '&apos;');
+    const isCriticalOrHigh = (finding) => finding.riskLevel === 'critical' || finding.riskLevel === 'high';
+    const tools = getToolFingerprints(baseline);
+    const lines = [];
+    const securityFailures = tools.filter((t) => t.securityFingerprint?.findings?.some(isCriticalOrHigh)).length;
+    // Each tool with critical/high findings gets an additional "-security"
+    // test case below, so those cases are part of the suite's test count.
+    const totalTests = tools.length + securityFailures;
+    lines.push('<?xml version="1.0" encoding="UTF-8"?>');
+    lines.push('<testsuites>');
+    lines.push(`  <testsuite name="bellwether-check" tests="${totalTests}" failures="${securityFailures}" errors="0">`);
+    for (const tool of tools) {
+        const successRate = tool.baselineSuccessRate ?? 1;
+        lines.push(`    <testcase name="${escapeXml(tool.name)}" classname="mcp-tools" time="0">`);
+        lines.push(`      <system-out>Success rate: ${(successRate * 100).toFixed(0)}%</system-out>`);
+        // A success rate below 90% is surfaced as a warning, not as a failure.
+        if (successRate < 0.9) {
+            lines.push(`      <system-err>Tool has success rate below 90%</system-err>`);
+        }
+        lines.push('    </testcase>');
+    }
+    // Add security findings as test cases if present
+    const securityTools = tools.filter((t) => t.securityFingerprint?.findings?.length);
+    if (securityTools.length > 0) {
+        lines.push(`    <!-- Security findings -->`);
+        for (const tool of securityTools) {
+            const severe = (tool.securityFingerprint?.findings ?? []).filter(isCriticalOrHigh);
+            if (severe.length === 0) {
+                continue;
+            }
+            lines.push(`    <testcase name="${escapeXml(tool.name)}-security" classname="security">`);
+            lines.push(`      <failure message="${severe.length} critical/high security findings">`);
+            for (const finding of severe) {
+                // Omit the CWE suffix entirely when the finding carries no CWE id.
+                const cweSuffix = finding.cweId ? ` (${escapeXml(finding.cweId)})` : '';
+                lines.push(`        ${finding.riskLevel.toUpperCase()}: ${escapeXml(finding.title)}${cweSuffix}`);
+            }
+            lines.push(`      </failure>`);
+            lines.push('    </testcase>');
+        }
+    }
+    lines.push('  </testsuite>');
+    lines.push('</testsuites>');
+    return lines.join('\n');
+}
+/**
+ * Format check results as SARIF (for GitHub Code Scanning and other tools).
+ * This is used when --format sarif is specified but no baseline comparison occurs.
+ *
+ * Produces one result per security finding (rule id = the finding's CWE id,
+ * or 'BWH-SEC' when it has none) and one 'BWH-REL' warning per tool whose
+ * baseline success rate is below 90%.
+ *
+ * @param baseline - Baseline handed to getToolFingerprints(); its
+ *                   metadata.serverCommand or server.name is used as the
+ *                   artifact URI of every result.
+ * @returns The SARIF 2.1.0 log as pretty-printed JSON text.
+ */
+function formatCheckResultsSarif(baseline) {
+    const tools = getToolFingerprints(baseline);
+    // `server` is read optionally so the 'mcp-server' fallback is reachable
+    // when the baseline carries no server block.
+    const serverUri = baseline.metadata?.serverCommand || baseline.server?.name || 'mcp-server';
+    // Every result points at the server as a whole; build a fresh location
+    // object per result so results never share mutable structures.
+    const serverLocation = () => ({
+        physicalLocation: {
+            artifactLocation: { uri: serverUri },
+            region: { startLine: 1 },
+        },
+    });
+    const levelForRisk = (riskLevel) => {
+        if (riskLevel === 'critical' || riskLevel === 'high') {
+            return 'error';
+        }
+        return riskLevel === 'medium' ? 'warning' : 'note';
+    };
+    const results = [];
+    // CWE ids used as rule ids, in first-seen order, so that each one can be
+    // declared in driver.rules alongside the built-in rules.
+    const cweRuleIds = new Set();
+    // Add results for tools with security findings
+    for (const tool of tools) {
+        for (const finding of tool.securityFingerprint?.findings ?? []) {
+            const ruleId = finding.cweId || 'BWH-SEC';
+            if (ruleId !== 'BWH-SEC' && ruleId !== 'BWH-REL') {
+                cweRuleIds.add(ruleId);
+            }
+            results.push({
+                ruleId,
+                level: levelForRisk(finding.riskLevel),
+                message: { text: `[${tool.name}] ${finding.title}: ${finding.description}` },
+                locations: [serverLocation()],
+            });
+        }
+    }
+    // Add results for tools with low success rate
+    for (const tool of tools) {
+        const successRate = tool.baselineSuccessRate ?? 1;
+        if (successRate < 0.9) {
+            results.push({
+                ruleId: 'BWH-REL',
+                level: 'warning',
+                message: {
+                    text: `Tool "${tool.name}" has ${(successRate * 100).toFixed(0)}% success rate`,
+                },
+                locations: [serverLocation()],
+            });
+        }
+    }
+    const rules = [
+        {
+            id: 'BWH-SEC',
+            name: 'SecurityFinding',
+            shortDescription: { text: 'Security vulnerability detected' },
+            defaultConfiguration: { level: 'warning' },
+        },
+        {
+            id: 'BWH-REL',
+            name: 'LowReliability',
+            shortDescription: { text: 'Tool reliability below threshold' },
+            defaultConfiguration: { level: 'warning' },
+        },
+    ];
+    for (const id of cweRuleIds) {
+        rules.push({
+            id,
+            shortDescription: { text: `Security vulnerability detected (${id})` },
+            defaultConfiguration: { level: 'warning' },
+        });
+    }
+    const sarif = {
+        $schema: 'https://raw.githubusercontent.com/oasis-tcs/sarif-spec/master/Schemata/sarif-schema-2.1.0.json',
+        version: '2.1.0',
+        runs: [
+            {
+                tool: {
+                    driver: {
+                        name: 'bellwether',
+                        // NOTE(review): hard-coded and does not follow the package
+                        // version - confirm whether it should come from the
+                        // package's version module instead.
+                        version: '1.0.0',
+                        informationUri: 'https://github.com/dotsetlabs/bellwether',
+                        rules,
+                    },
+                },
+                results,
+            },
+        ],
+    };
+    return JSON.stringify(sarif, null, 2);
+}
+/**
+ * Format check results using the specified output format.
+ * Used when no baseline comparison occurs.
+ *
+ * @param baseline - Baseline forwarded unchanged to the selected formatter.
+ * @param format - Output format name, matched case-insensitively.
+ * @returns JUnit XML for 'junit' / 'junit-xml' / 'xml', SARIF JSON for
+ *          'sarif', and null for every other format.
+ */
+function formatCheckResults(baseline, format) {
+    // Coerce before lower-casing so that a missing or non-string format falls
+    // through to the default branch instead of throwing a TypeError.
+    switch (String(format).toLowerCase()) {
+        case 'junit':
+        case 'junit-xml':
+        case 'xml':
+            return formatCheckResultsJUnit(baseline);
+        case 'sarif':
+            return formatCheckResultsSarif(baseline);
+        default:
+            return null; // No special formatting needed for other formats
+    }
+}
 //# sourceMappingURL=check.js.map