npm - agent-gauntlet - Versions diffs - 0.10.0 → 0.11.0 - Mend

agent-gauntlet 0.10.0 → 0.11.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (71)

package/README.md +25 -23
package/dist/index.js +9226 -0
package/dist/index.js.map +65 -0
package/dist/scripts/status.js +280 -0
package/dist/scripts/status.js.map +10 -0
package/package.json +22 -8
package/src/built-in-reviews/code-quality.md +0 -25
package/src/built-in-reviews/index.ts +0 -28
package/src/bun-plugins.d.ts +0 -4
package/src/cli-adapters/claude.ts +0 -327
package/src/cli-adapters/codex.ts +0 -290
package/src/cli-adapters/cursor.ts +0 -128
package/src/cli-adapters/gemini.ts +0 -510
package/src/cli-adapters/github-copilot.ts +0 -141
package/src/cli-adapters/index.ts +0 -250
package/src/cli-adapters/thinking-budget.ts +0 -23
package/src/commands/check.ts +0 -311
package/src/commands/ci/index.ts +0 -15
package/src/commands/ci/init.ts +0 -96
package/src/commands/ci/list-jobs.ts +0 -90
package/src/commands/clean.ts +0 -54
package/src/commands/detect.ts +0 -173
package/src/commands/health.ts +0 -169
package/src/commands/help.ts +0 -34
package/src/commands/index.ts +0 -13
package/src/commands/init.ts +0 -1878
package/src/commands/list.ts +0 -33
package/src/commands/review.ts +0 -311
package/src/commands/run.ts +0 -29
package/src/commands/shared.ts +0 -267
package/src/commands/stop-hook.ts +0 -567
package/src/commands/validate.ts +0 -20
package/src/commands/wait-ci.ts +0 -518
package/src/config/ci-loader.ts +0 -33
package/src/config/ci-schema.ts +0 -28
package/src/config/global.ts +0 -87
package/src/config/loader.ts +0 -301
package/src/config/schema.ts +0 -165
package/src/config/stop-hook-config.ts +0 -130
package/src/config/types.ts +0 -65
package/src/config/validator.ts +0 -592
package/src/core/change-detector.ts +0 -137
package/src/core/diff-stats.ts +0 -442
package/src/core/entry-point.ts +0 -190
package/src/core/job.ts +0 -96
package/src/core/run-executor.ts +0 -621
package/src/core/runner.ts +0 -290
package/src/gates/check.ts +0 -118
package/src/gates/resolve-check-command.ts +0 -21
package/src/gates/result.ts +0 -54
package/src/gates/review.ts +0 -1333
package/src/hooks/adapters/claude-stop-hook.ts +0 -99
package/src/hooks/adapters/cursor-stop-hook.ts +0 -122
package/src/hooks/adapters/types.ts +0 -94
package/src/hooks/stop-hook-handler.ts +0 -748
package/src/index.ts +0 -47
package/src/output/app-logger.ts +0 -214
package/src/output/console-log.ts +0 -168
package/src/output/console.ts +0 -359
package/src/output/logger.ts +0 -126
package/src/output/sinks/console-sink.ts +0 -59
package/src/output/sinks/file-sink.ts +0 -110
package/src/scripts/status.ts +0 -433
package/src/templates/workflow.yml +0 -79
package/src/types/gauntlet-status.ts +0 -79
package/src/utils/debug-log.ts +0 -392
package/src/utils/diff-parser.ts +0 -103
package/src/utils/execution-state.ts +0 -472
package/src/utils/log-parser.ts +0 -696
package/src/utils/sanitizer.ts +0 -3
package/src/utils/session-ref.ts +0 -91

package/src/scripts/status.ts DELETED

@@ -1,433 +0,0 @@
-#!/usr/bin/env bun
-/**
- * Gauntlet Status Script
- *
- * Parses the configured log_dir (default: gauntlet_logs/) to produce a structured
- * summary of the most recent gauntlet session from the .debug.log, plus a file
- * inventory of all log/JSON files for further inspection.
- *
- * This script handles structured data only (debug log events). Detailed failure
- * analysis (reading individual check logs, review JSONs) is left to the caller
- * (the /gauntlet-status skill) since log formats vary by check type.
- */
-import fs from "node:fs";
-import path from "node:path";
-// --- Types ---
-interface RunStart {
-	timestamp: string;
-	mode: string;
-	baseRef?: string;
-	filesChanged: number;
-	linesAdded: number;
-	linesRemoved: number;
-	gates: number;
-}
-interface GateResult {
-	timestamp: string;
-	gateId: string;
-	cli?: string;
-	status: string;
-	duration: string;
-	violations?: number;
-}
-interface RunEnd {
-	timestamp: string;
-	status: string;
-	fixed: number;
-	skipped: number;
-	failed: number;
-	iterations: number;
-	duration: string;
-}
-interface StopHookEntry {
-	timestamp: string;
-	decision: string;
-	reason: string;
-}
-interface SessionRun {
-	start: RunStart;
-	gates: GateResult[];
-	end?: RunEnd;
-	stopHook?: StopHookEntry;
-}
-// --- Parsing helpers ---
-function parseKeyValue(text: string): Record<string, string> {
-	const result: Record<string, string> = {};
-	for (const match of text.matchAll(/(\w+)=(\S+)/g)) {
-		const key = match[1];
-		const value = match[2];
-		if (key && value) result[key] = value;
-	}
-	return result;
-}
-function parseTimestamp(line: string): string {
-	const m = line.match(/^\[([^\]]+)\]/);
-	return m?.[1] ?? "";
-}
-function parseEventType(line: string): string {
-	const m = line.match(/^\[[^\]]+\]\s+(\S+)/);
-	return m?.[1] ?? "";
-}
-function parseEventBody(line: string): string {
-	const m = line.match(/^\[[^\]]+\]\s+\S+\s*(.*)/);
-	return m?.[1] ?? "";
-}
-// --- Debug log parsing ---
-function parseDebugLog(content: string, sessionStartTime?: Date): SessionRun[] {
-	const lines = content.split("\n").filter((l) => l.trim());
-	const sessions: SessionRun[] = [];
-	let current: SessionRun | null = null;
-	for (const line of lines) {
-		const event = parseEventType(line);
-		const body = parseEventBody(line);
-		const ts = parseTimestamp(line);
-		switch (event) {
-			case "RUN_START": {
-				// Skip runs that predate the current session's log files
-				if (sessionStartTime && new Date(ts) < sessionStartTime) {
-					current = null;
-					break;
-				}
-				const kv = parseKeyValue(body);
-				current = {
-					start: {
-						timestamp: ts,
-						mode: kv.mode ?? "unknown",
-						baseRef: kv.base_ref,
-						filesChanged: Number(kv.files_changed ?? kv.changes ?? 0),
-						linesAdded: Number(kv.lines_added ?? 0),
-						linesRemoved: Number(kv.lines_removed ?? 0),
-						gates: Number(kv.gates ?? 0),
-					},
-					gates: [],
-				};
-				sessions.push(current);
-				break;
-			}
-			case "GATE_RESULT": {
-				if (!current) break;
-				const gateIdMatch = body.match(/^(\S+)/);
-				const kv = parseKeyValue(body);
-				current.gates.push({
-					timestamp: ts,
-					gateId: gateIdMatch?.[1] ?? "unknown",
-					cli: kv.cli,
-					status: kv.status ?? "unknown",
-					duration: kv.duration ?? "?",
-					violations:
-						kv.violations !== undefined ? Number(kv.violations) : undefined,
-				});
-				break;
-			}
-			case "RUN_END": {
-				if (!current) break;
-				const kv = parseKeyValue(body);
-				current.end = {
-					timestamp: ts,
-					status: kv.status ?? "unknown",
-					fixed: Number(kv.fixed ?? 0),
-					skipped: Number(kv.skipped ?? 0),
-					failed: Number(kv.failed ?? 0),
-					iterations: Number(kv.iterations ?? 0),
-					duration: kv.duration ?? "?",
-				};
-				break;
-			}
-			case "STOP_HOOK": {
-				if (!current) break;
-				const kv = parseKeyValue(body);
-				current.stopHook = {
-					timestamp: ts,
-					decision: kv.decision ?? "unknown",
-					reason: kv.reason ?? "unknown",
-				};
-				break;
-			}
-		}
-	}
-	return sessions;
-}
-/**
- * Find the earliest mtime of non-hidden log files in the directory.
- * This marks the start of the current session.
- */
-function getSessionStartTime(logDir: string): Date | undefined {
-	const entries = fs
-		.readdirSync(logDir)
-		.filter((f) => !f.startsWith(".") && f !== "previous");
-	let earliest: number | undefined;
-	for (const entry of entries) {
-		const mtime = fs.statSync(path.join(logDir, entry)).mtimeMs;
-		if (earliest === undefined || mtime < earliest) {
-			earliest = mtime;
-		}
-	}
-	return earliest !== undefined ? new Date(earliest) : undefined;
-}
-// --- File inventory ---
-function formatFileInventory(logDir: string): string[] {
-	const lines: string[] = [];
-	const entries = fs
-		.readdirSync(logDir)
-		.filter((f) => !f.startsWith(".") && f !== "previous");
-	if (entries.length === 0) return lines;
-	const checks: string[] = [];
-	const reviews: string[] = [];
-	const other: string[] = [];
-	for (const entry of entries.sort()) {
-		const fullPath = path.join(logDir, entry);
-		const stat = fs.statSync(fullPath);
-		const sizeKB = (stat.size / 1024).toFixed(1);
-		const line = `- ${fullPath} (${sizeKB} KB)`;
-		if (entry.startsWith("review_")) {
-			reviews.push(line);
-		} else if (entry.startsWith("check_")) {
-			checks.push(line);
-		} else {
-			other.push(line);
-		}
-	}
-	lines.push("### Log Files");
-	lines.push("");
-	if (checks.length > 0) {
-		lines.push("**Check logs:**");
-		lines.push(...checks);
-	}
-	if (reviews.length > 0) {
-		lines.push("**Review logs/JSON:**");
-		lines.push(...reviews);
-	}
-	if (other.length > 0) {
-		lines.push("**Other:**");
-		lines.push(...other);
-	}
-	lines.push("");
-	return lines;
-}
-// --- Summary output ---
-function formatStatusLine(end: RunEnd): string {
-	return end.status === "pass"
-		? "PASSED"
-		: end.status === "fail"
-			? "FAILED"
-			: end.status.toUpperCase();
-}
-function formatAllRuns(sessions: SessionRun[]): string[] {
-	const lines: string[] = [];
-	lines.push("### All Runs in Session");
-	lines.push("");
-	for (let i = 0; i < sessions.length; i++) {
-		const s = sessions[i];
-		if (!s) continue;
-		const status = s.end ? s.end.status : "in-progress";
-		const duration = s.end ? s.end.duration : "?";
-		lines.push(
-			`${i + 1}. [${s.start.timestamp}] mode=${s.start.mode} status=${status} duration=${duration}`,
-		);
-	}
-	lines.push("");
-	return lines;
-}
-function formatSession(sessions: SessionRun[], logDir: string): string {
-	if (sessions.length === 0) {
-		return "No gauntlet runs found in logs.";
-	}
-	const lastComplete = [...sessions].reverse().find((s) => s.end);
-	const session = lastComplete ?? sessions[sessions.length - 1];
-	if (!session) return "No gauntlet runs found in logs.";
-	const lines: string[] = [];
-	// Header
-	lines.push("## Gauntlet Session Summary");
-	lines.push("");
-	// Overall status
-	if (session.end) {
-		lines.push(`**Status:** ${formatStatusLine(session.end)}`);
-		lines.push(`**Iterations:** ${session.end.iterations}`);
-		lines.push(`**Duration:** ${session.end.duration}`);
-		lines.push(
-			`**Fixed:** ${session.end.fixed} | **Skipped:** ${session.end.skipped} | **Failed:** ${session.end.failed}`,
-		);
-	} else {
-		lines.push("**Status:** In Progress (no RUN_END found)");
-	}
-	lines.push("");
-	// Diff stats
-	lines.push("### Diff Stats");
-	lines.push(`- Mode: ${session.start.mode}`);
-	if (session.start.baseRef) {
-		lines.push(`- Base ref: ${session.start.baseRef}`);
-	}
-	lines.push(`- Files changed: ${session.start.filesChanged}`);
-	lines.push(
-		`- Lines: +${session.start.linesAdded} / -${session.start.linesRemoved}`,
-	);
-	lines.push(`- Gates: ${session.start.gates}`);
-	lines.push("");
-	// Gate results
-	lines.push("### Gate Results");
-	lines.push("");
-	lines.push("| Gate | CLI | Status | Duration | Violations |");
-	lines.push("|------|-----|--------|----------|------------|");
-	for (const gate of session.gates) {
-		const violations =
-			gate.violations !== undefined ? String(gate.violations) : "-";
-		const statusIcon = gate.status === "pass" ? "pass" : "FAIL";
-		lines.push(
-			`| ${gate.gateId} | ${gate.cli ?? "-"} | ${statusIcon} | ${gate.duration} | ${violations} |`,
-		);
-	}
-	lines.push("");
-	// Stop hook
-	if (session.stopHook) {
-		lines.push("### Stop Hook");
-		lines.push(`- Decision: ${session.stopHook.decision}`);
-		lines.push(`- Reason: ${session.stopHook.reason}`);
-		lines.push("");
-	}
-	// File inventory
-	lines.push(...formatFileInventory(logDir));
-	// All sessions summary (if multiple runs)
-	if (sessions.length > 1) {
-		lines.push(...formatAllRuns(sessions));
-	}
-	return lines.join("\n");
-}
-// --- Main ---
-/**
- * Read the configured log_dir from .gauntlet/config.yml.
- * Falls back to "gauntlet_logs" if not found.
- */
-function getLogDir(cwd: string): string {
-	const configPath = path.join(cwd, ".gauntlet", "config.yml");
-	try {
-		const content = fs.readFileSync(configPath, "utf-8");
-		const match = content.match(/^log_dir:\s*(.+)$/m);
-		if (match?.[1]) return match[1].trim();
-	} catch {
-		// Config not found — use default
-	}
-	return "gauntlet_logs";
-}
-/**
- * Resolve the log directory and debug log path.
- * Returns null if no logs are found (after printing a message).
- */
-function resolveLogPaths(
-	activeDir: string,
-): { logDir: string; debugLogPath: string } | null {
-	const previousDir = path.join(activeDir, "previous");
-	const debugLogPath = path.join(activeDir, ".debug.log");
-	// Check active directory first for non-debug log files
-	const activeHasLogs =
-		fs.existsSync(activeDir) &&
-		fs
-			.readdirSync(activeDir)
-			.some((f) => !f.startsWith(".") && f !== "previous");
-	if (activeHasLogs) {
-		return { logDir: activeDir, debugLogPath };
-	}
-	if (!fs.existsSync(previousDir)) {
-		console.log("No gauntlet_logs directory found.");
-		return null;
-	}
-	// Fall back to previous directory — cleanLogs archives files directly here
-	const logDir = resolvePreviousLogDir(previousDir);
-	if (!logDir) return null;
-	// Debug log stays in the main gauntlet_logs dir, not in previous/
-	return { logDir, debugLogPath };
-}
-function resolvePreviousLogDir(previousDir: string): string | null {
-	const prevEntries = fs.readdirSync(previousDir);
-	const hasDirectFiles = prevEntries.some(
-		(f) => f.endsWith(".log") || f.endsWith(".json"),
-	);
-	if (hasDirectFiles) return previousDir;
-	// Legacy: check for timestamped subdirectories
-	const prevDirs = prevEntries
-		.map((d) => path.join(previousDir, d))
-		.filter((d) => fs.statSync(d).isDirectory())
-		.sort()
-		.reverse();
-	if (prevDirs.length === 0) {
-		console.log("No gauntlet logs found.");
-		return null;
-	}
-	return prevDirs[0] as string;
-}
-function main(): void {
-	const cwd = process.cwd();
-	const logDirName = getLogDir(cwd);
-	const activeDir = path.join(cwd, logDirName);
-	const paths = resolveLogPaths(activeDir);
-	if (!paths) {
-		process.exit(0);
-	}
-	// Parse debug log, filtering to current session based on log file timestamps
-	let sessions: SessionRun[] = [];
-	if (fs.existsSync(paths.debugLogPath)) {
-		const debugContent = fs.readFileSync(paths.debugLogPath, "utf-8");
-		const sessionStart = getSessionStartTime(paths.logDir);
-		sessions = parseDebugLog(debugContent, sessionStart);
-	}
-	// Format and output
-	const output = formatSession(sessions, paths.logDir);
-	console.log(output);
-}
-main();

package/src/templates/workflow.yml DELETED

@@ -1,79 +0,0 @@
-name: Gauntlet CI
-on:
-  push:
-    branches: [main]
-  pull_request:
-    branches: [main]
-jobs:
-  discover:
-    name: Discover Jobs
-    runs-on: ubuntu-latest
-    outputs:
-      matrix: ${{ steps.discover.outputs.matrix }}
-      runtimes: ${{ steps.discover.outputs.runtimes }}
-    steps:
-      - uses: actions/checkout@v4
-      - name: Install agent-gauntlet
-        run: |
-          curl -fsSL https://bun.sh/install | bash
-          echo "$HOME/.bun/bin" >> $GITHUB_PATH
-          export PATH="$HOME/.bun/bin:$PATH"
-          bun add -g pacaplan/agent-gauntlet
-      - name: Discover gauntlet jobs
-        id: discover
-        run: |
-          output=$(agent-gauntlet ci list-jobs)
-          echo "matrix=$(echo "$output" | jq -c '.matrix')" >> $GITHUB_OUTPUT
-          echo "runtimes=$(echo "$output" | jq -c '.runtimes')" >> $GITHUB_OUTPUT
-  checks:
-    name: ${{ matrix.job.name }} (${{ matrix.job.entry_point }})
-    runs-on: ubuntu-latest
-    needs: discover
-    if: ${{ needs.discover.outputs.matrix != '[]' }}
-    strategy:
-      fail-fast: false
-      matrix:
-        job: ${{ fromJson(needs.discover.outputs.matrix) }}
-    # Services will be injected here by agent-gauntlet
-    steps:
-      - uses: actions/checkout@v4
-      - name: Set up Ruby
-        if: contains(matrix.job.runtimes, 'ruby')
-        uses: ruby/setup-ruby@v1
-        with:
-          ruby-version: ${{ fromJson(needs.discover.outputs.runtimes).ruby.version }}
-          bundler-cache: ${{ fromJson(needs.discover.outputs.runtimes).ruby.bundler_cache }}
-          working-directory: ${{ matrix.job.working_directory }}
-      - name: Set up Node
-        if: contains(matrix.job.runtimes, 'node')
-        uses: actions/setup-node@v4
-        with:
-          node-version: ${{ fromJson(needs.discover.outputs.runtimes).node.version }}
-      - name: Set up Bun
-        if: contains(matrix.job.runtimes, 'bun')
-        uses: oven-sh/setup-bun@v1
-        with:
-          bun-version: ${{ fromJson(needs.discover.outputs.runtimes).bun.version }}
-      - name: Run global setup
-        if: ${{ matrix.job.global_setup != '' }}
-        run: ${{ matrix.job.global_setup }}
-      - name: Run check setup
-        if: ${{ matrix.job.setup != '' }}
-        working-directory: ${{ matrix.job.working_directory }}
-        run: ${{ matrix.job.setup }}
-      - name: Run check
-        working-directory: ${{ matrix.job.working_directory }}
-        run: ${{ matrix.job.command }}

package/src/types/gauntlet-status.ts DELETED

@@ -1,79 +0,0 @@
-/**
- * All possible outcomes from gauntlet operations.
- * Used by both the run executor and stop-hook - NO MAPPING REQUIRED.
- */
-export type GauntletStatus =
-	// Run outcomes (from executor)
-	| "passed" // All gates passed
-	| "passed_with_warnings" // Some issues were skipped
-	| "no_applicable_gates" // No gates matched current changes
-	| "no_changes" // No changes detected
-	| "failed" // Gates failed, retries remaining
-	| "retry_limit_exceeded" // Max retries reached
-	| "lock_conflict" // Another run in progress
-	| "error" // Unexpected error (includes config errors)
-	| "pr_push_required" // Gates passed but PR needs to be created/updated
-	// CI workflow statuses (after PR is pushed)
-	| "ci_pending" // CI checks still running
-	| "ci_failed" // CI checks failed or review changes requested
-	| "ci_passed" // CI checks passed, no blocking reviews
-	| "ci_timeout" // CI wait attempts exhausted
-	// Stop-hook pre-checks (before running executor)
-	| "no_config" // No .gauntlet/config.yml found
-	| "stop_hook_active" // Infinite loop prevention
-	| "interval_not_elapsed" // Run interval hasn't passed
-	| "invalid_input" // Failed to parse hook JSON input
-	| "stop_hook_disabled"; // Stop hook disabled via configuration
-export interface RunResult {
-	status: GauntletStatus;
-	/** Human-friendly message explaining the outcome */
-	message: string;
-	/** Number of gates that ran */
-	gatesRun?: number;
-	/** Number of gates that failed */
-	gatesFailed?: number;
-	/** Path to latest console log file */
-	consoleLogPath?: string;
-	/** Error message if status is "error" */
-	errorMessage?: string;
-	/** Interval minutes (when status is "interval_not_elapsed") */
-	intervalMinutes?: number;
-	/** Individual gate results (available when gates were executed) */
-	gateResults?: Array<{
-		jobId: string;
-		status: "pass" | "fail" | "error";
-		logPath?: string;
-		logPaths?: string[];
-		subResults?: Array<{
-			nameSuffix: string;
-			status: "pass" | "fail" | "error";
-			logPath?: string;
-		}>;
-	}>;
-}
-/**
- * Determine if a status should block the stop hook.
- */
-export function isBlockingStatus(status: GauntletStatus): boolean {
-	return (
-		status === "failed" ||
-		status === "pr_push_required" ||
-		status === "ci_pending" ||
-		status === "ci_failed"
-	);
-}
-/**
- * Determine if a status indicates successful completion (exit code 0).
- */
-export function isSuccessStatus(status: GauntletStatus): boolean {
-	return (
-		status === "passed" ||
-		status === "passed_with_warnings" ||
-		status === "no_applicable_gates" ||
-		status === "no_changes" ||
-		status === "ci_passed"
-	);
-}