npm - agent-gauntlet - Versions diffs - 0.10.0 → 0.11.0 - Mend

agent-gauntlet 0.10.0 → 0.11.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (71) hide show

package/README.md +25 -23
package/dist/index.js +9226 -0
package/dist/index.js.map +65 -0
package/dist/scripts/status.js +280 -0
package/dist/scripts/status.js.map +10 -0
package/package.json +22 -8
package/src/built-in-reviews/code-quality.md +0 -25
package/src/built-in-reviews/index.ts +0 -28
package/src/bun-plugins.d.ts +0 -4
package/src/cli-adapters/claude.ts +0 -327
package/src/cli-adapters/codex.ts +0 -290
package/src/cli-adapters/cursor.ts +0 -128
package/src/cli-adapters/gemini.ts +0 -510
package/src/cli-adapters/github-copilot.ts +0 -141
package/src/cli-adapters/index.ts +0 -250
package/src/cli-adapters/thinking-budget.ts +0 -23
package/src/commands/check.ts +0 -311
package/src/commands/ci/index.ts +0 -15
package/src/commands/ci/init.ts +0 -96
package/src/commands/ci/list-jobs.ts +0 -90
package/src/commands/clean.ts +0 -54
package/src/commands/detect.ts +0 -173
package/src/commands/health.ts +0 -169
package/src/commands/help.ts +0 -34
package/src/commands/index.ts +0 -13
package/src/commands/init.ts +0 -1878
package/src/commands/list.ts +0 -33
package/src/commands/review.ts +0 -311
package/src/commands/run.ts +0 -29
package/src/commands/shared.ts +0 -267
package/src/commands/stop-hook.ts +0 -567
package/src/commands/validate.ts +0 -20
package/src/commands/wait-ci.ts +0 -518
package/src/config/ci-loader.ts +0 -33
package/src/config/ci-schema.ts +0 -28
package/src/config/global.ts +0 -87
package/src/config/loader.ts +0 -301
package/src/config/schema.ts +0 -165
package/src/config/stop-hook-config.ts +0 -130
package/src/config/types.ts +0 -65
package/src/config/validator.ts +0 -592
package/src/core/change-detector.ts +0 -137
package/src/core/diff-stats.ts +0 -442
package/src/core/entry-point.ts +0 -190
package/src/core/job.ts +0 -96
package/src/core/run-executor.ts +0 -621
package/src/core/runner.ts +0 -290
package/src/gates/check.ts +0 -118
package/src/gates/resolve-check-command.ts +0 -21
package/src/gates/result.ts +0 -54
package/src/gates/review.ts +0 -1333
package/src/hooks/adapters/claude-stop-hook.ts +0 -99
package/src/hooks/adapters/cursor-stop-hook.ts +0 -122
package/src/hooks/adapters/types.ts +0 -94
package/src/hooks/stop-hook-handler.ts +0 -748
package/src/index.ts +0 -47
package/src/output/app-logger.ts +0 -214
package/src/output/console-log.ts +0 -168
package/src/output/console.ts +0 -359
package/src/output/logger.ts +0 -126
package/src/output/sinks/console-sink.ts +0 -59
package/src/output/sinks/file-sink.ts +0 -110
package/src/scripts/status.ts +0 -433
package/src/templates/workflow.yml +0 -79
package/src/types/gauntlet-status.ts +0 -79
package/src/utils/debug-log.ts +0 -392
package/src/utils/diff-parser.ts +0 -103
package/src/utils/execution-state.ts +0 -472
package/src/utils/log-parser.ts +0 -696
package/src/utils/sanitizer.ts +0 -3
package/src/utils/session-ref.ts +0 -91

package/src/cli-adapters/github-copilot.ts DELETED Viewed

@@ -1,141 +0,0 @@
-import { exec } from "node:child_process";
-import fs from "node:fs/promises";
-import os from "node:os";
-import path from "node:path";
-import { promisify } from "node:util";
-import { type CLIAdapter, runStreamingCommand } from "./index.js";
-// Promise-returning form of child_process.exec, used for one-shot shell commands.
-const execAsync = promisify(exec);
-// 10 MiB cap on buffered command output; passed as exec's `maxBuffer` in execute().
-const MAX_BUFFER_BYTES = 10 * 1024 * 1024;
-/**
- * CLI adapter for the GitHub Copilot CLI (`copilot` binary).
- *
- * The adapter exposes no command or skill directories (every directory getter returns
- * null) and runs a review by feeding the prompt plus diff to `copilot` on stdin with a
- * fixed allow-list of read-only shell tools.
- */
-export class GitHubCopilotAdapter implements CLIAdapter {
-	name = "github-copilot";
-
-	/** Resolves to true when `which copilot` succeeds, false when it fails for any reason. */
-	async isAvailable(): Promise<boolean> {
-		try {
-			await execAsync("which copilot");
-			return true;
-		} catch {
-			return false;
-		}
-	}
-
-	/**
-	 * Reports "missing" when the binary cannot be found and "healthy" otherwise.
-	 * No further probing is done, so "unhealthy" is never returned by this adapter.
-	 */
-	async checkHealth(): Promise<{
-		available: boolean;
-		status: "healthy" | "missing" | "unhealthy";
-		message?: string;
-	}> {
-		const available = await this.isAvailable();
-		if (!available) {
-			return {
-				available: false,
-				status: "missing",
-				message: "Command not found",
-			};
-		}
-		return { available: true, status: "healthy", message: "Ready" };
-	}
-
-	getProjectCommandDir(): string | null {
-		// GitHub Copilot CLI does not support custom commands (feature request #618)
-		return null;
-	}
-
-	getUserCommandDir(): string | null {
-		// GitHub Copilot CLI does not support custom commands (feature request #618)
-		return null;
-	}
-
-	getProjectSkillDir(): string | null {
-		return null;
-	}
-
-	getUserSkillDir(): string | null {
-		return null;
-	}
-
-	getCommandExtension(): string {
-		return ".md";
-	}
-
-	canUseSymlink(): boolean {
-		// Not applicable - no command directory support
-		return false;
-	}
-
-	transformCommand(markdownContent: string): string {
-		// Not applicable - no command directory support
-		return markdownContent;
-	}
-
-	/**
-	 * Runs `copilot` with the prompt and diff supplied on stdin and returns its stdout.
-	 *
-	 * @param opts.prompt - Review instructions placed before the diff.
-	 * @param opts.diff - Diff text appended after a `--- DIFF ---` separator.
-	 * @param opts.model - Accepted for interface compatibility; not used by this adapter.
-	 * @param opts.timeoutMs - Forwarded as the timeout of the underlying command.
-	 * @param opts.onOutput - When given, output is streamed through `runStreamingCommand`;
-	 *   otherwise the command is run buffered via `exec`.
-	 * @returns Everything the CLI wrote to stdout.
-	 * @throws Whatever the underlying command runner rejects with (non-zero exit, timeout,
-	 *   spawn failure), or the I/O error if the input file cannot be written.
-	 */
-	async execute(opts: {
-		prompt: string;
-		diff: string;
-		model?: string;
-		timeoutMs?: number;
-		onOutput?: (chunk: string) => void;
-	}): Promise<string> {
-		const fullContent = `${opts.prompt}\n\n--- DIFF ---\n${opts.diff}`;
-		// A private mkdtemp directory gives every call its own input file. A name built
-		// from pid + Date.now() is shared by two calls made in the same process within
-		// the same millisecond, and one call's cleanup would then delete the other's input.
-		const tmpDir = await fs.mkdtemp(
-			path.join(os.tmpdir(), "gauntlet-copilot-"),
-		);
-		const tmpFile = path.join(tmpDir, "input.txt");
-		// Cleanup errors are intentionally ignored - the tmp dir will be cleaned up by OS
-		const cleanup = () =>
-			fs.rm(tmpDir, { recursive: true, force: true }).catch(() => {});
-		try {
-			await fs.writeFile(tmpFile, fullContent);
-		} catch (err) {
-			// Do not leave the freshly created directory behind when the write fails.
-			await cleanup();
-			throw err;
-		}
-		// Copilot reads from stdin when no -p flag is provided
-		// Tool whitelist: cat/grep/ls/find/head/tail are required for the AI to read
-		// and analyze code files during review. While these tools can access files,
-		// they are read-only and necessary for code review functionality.
-		// The copilot CLI is scoped to the repo directory by default.
-		// git is excluded to prevent access to commit history (review should only see diff).
-		const args = [
-			"--allow-tool",
-			"shell(cat)",
-			"--allow-tool",
-			"shell(grep)",
-			"--allow-tool",
-			"shell(ls)",
-			"--allow-tool",
-			"shell(find)",
-			"--allow-tool",
-			"shell(head)",
-			"--allow-tool",
-			"shell(tail)",
-		];
-		// If onOutput callback is provided, use spawn for real-time streaming
-		if (opts.onOutput) {
-			return runStreamingCommand({
-				command: "copilot",
-				args,
-				tmpFile,
-				timeoutMs: opts.timeoutMs,
-				onOutput: opts.onOutput,
-				cleanup,
-			});
-		}
-		// Otherwise use exec for buffered output
-		// Shell command construction: We use exec() with shell piping instead of execFile()
-		// because copilot requires stdin input. The tmpFile path is system-controlled
-		// (os.tmpdir() + mkdtemp suffix), not user-supplied, eliminating injection risk.
-		// Double quotes handle paths with spaces.
-		try {
-			// Build the flags from `args` so both execution paths share one allow-list.
-			// Flag values contain parentheses and must be quoted for the shell.
-			const shellArgs = args
-				.map((arg) => (arg.startsWith("--") ? arg : `"${arg}"`))
-				.join(" ");
-			const cmd = `cat "${tmpFile}" | copilot ${shellArgs}`;
-			const { stdout } = await execAsync(cmd, {
-				timeout: opts.timeoutMs,
-				maxBuffer: MAX_BUFFER_BYTES,
-			});
-			return stdout;
-		} finally {
-			await cleanup();
-		}
-	}
-}

package/src/cli-adapters/index.ts DELETED Viewed

@@ -1,250 +0,0 @@
-import { type ChildProcess, spawn } from "node:child_process";
-import type { FileHandle } from "node:fs/promises";
-import fs from "node:fs/promises";
-/** Result of a CLI adapter health probe (the resolved value of `CLIAdapter.checkHealth`). */
-export interface CLIAdapterHealth {
-	/** Whether the CLI was found. */
-	available: boolean;
-	/** Coarse health classification of the CLI. */
-	status: "healthy" | "missing" | "unhealthy";
-	/** Optional human-readable detail accompanying the status. */
-	message?: string;
-}
-/**
- * Collects stderr from a child process and returns a getter for the accumulated output.
- * Also forwards each decoded chunk to the optional onOutput callback.
- *
- * Bytes are decoded with a streaming UTF-8 decoder, so a multi-byte character that is
- * split across two `data` events is delivered intact instead of as replacement characters.
- *
- * @param child - Process whose `stderr` stream (if any) is observed.
- * @param onOutput - Optional callback invoked with each non-empty piece of decoded text.
- * @returns A function returning all stderr text received so far.
- */
-export function collectStderr(
-	child: ChildProcess,
-	onOutput?: (text: string) => void,
-): () => string {
-	const chunks: string[] = [];
-	const decoder = new TextDecoder("utf-8");
-	const record = (text: string): void => {
-		// The decoder yields "" while it is still waiting for the rest of a character.
-		if (text === "") return;
-		chunks.push(text);
-		onOutput?.(text);
-	};
-	child.stderr?.on("data", (data: Buffer | string) => {
-		// A stream with an encoding set already emits strings; pass those through as-is.
-		record(
-			typeof data === "string" ? data : decoder.decode(data, { stream: true }),
-		);
-	});
-	// Flush whatever the decoder is still holding once the stream is finished.
-	child.stderr?.on("end", () => record(decoder.decode()));
-	return () => chunks.join("");
-}
-/**
- * Creates the Error reported for a process that exited with a failing code.
- * The message starts with the exit code and is followed by whatever stdout and stderr
- * text is available (stdout first), so that usage-limit notices are kept no matter
- * which of the two streams the CLI printed them to.
- */
-export function processExitError(
-	code: number | null,
-	getStderr: () => string,
-	getStdout?: () => string,
-): Error {
-	const stderrText = getStderr();
-	let stdoutText = "";
-	if (getStdout != null) {
-		stdoutText = getStdout() ?? "";
-	}
-	let message = `Process exited with code ${code}`;
-	const sections = [stdoutText, stderrText].filter(
-		(section) => section.length > 0,
-	);
-	if (sections.length > 0) {
-		message += `\n${sections.join("\n")}`;
-	}
-	return new Error(message);
-}
-/**
- * Spawns `opts.command` with `opts.args`, pipes the contents of `opts.tmpFile` to the
- * child's stdin, and resolves with everything the child wrote to stdout.
- *
- * stdout and stderr text is forwarded to `opts.onOutput` as it arrives. Settlement on
- * process close is delegated to `finalizeProcessClose`; spawn failures and timeouts reject.
- *
- * @param opts.command - Executable to spawn.
- * @param opts.args - Arguments passed to the executable.
- * @param opts.tmpFile - Path of the file streamed to the child's stdin.
- * @param opts.timeoutMs - When truthy, the child is sent SIGTERM and the promise rejects
- *   with "Command timed out" after this many milliseconds.
- * @param opts.onOutput - Optional callback receiving each piece of stdout/stderr text.
- * @param opts.cleanup - Invoked when the run is over, whether it succeeded or failed.
- *   A failing cleanup is ignored so it can neither mask the real outcome nor leave the
- *   returned promise pending.
- * @param opts.env - Environment handed to `spawn` unchanged.
- * @returns The concatenated stdout of the child process.
- */
-export async function runStreamingCommand(opts: {
-	command: string;
-	args: string[];
-	tmpFile: string;
-	timeoutMs?: number;
-	onOutput?: (chunk: string) => void;
-	cleanup: () => Promise<void>;
-	env?: NodeJS.ProcessEnv;
-}): Promise<string> {
-	const safeCleanup = (): Promise<void> => opts.cleanup().catch(() => {});
-
-	let handle: FileHandle;
-	try {
-		handle = await fs.open(opts.tmpFile, "r");
-	} catch (err) {
-		await safeCleanup();
-		throw err;
-	}
-
-	return new Promise<string>((resolve, reject) => {
-		const chunks: string[] = [];
-		try {
-			const child = spawn(opts.command, opts.args, {
-				stdio: ["pipe", "pipe", "pipe"],
-				env: opts.env,
-			});
-			const input = handle.createReadStream();
-			// A child that exits before draining stdin raises EPIPE on this stream; without
-			// a listener that would surface as an uncaught 'error' event.
-			child.stdin.on("error", () => {});
-			// pipe() does not end the destination when the source fails, so close stdin
-			// explicitly to keep the child from waiting for input that will never come.
-			input.on("error", () => {
-				child.stdin.end();
-			});
-			input.pipe(child.stdin);
-
-			let timeoutId: ReturnType<typeof setTimeout> | undefined;
-			if (opts.timeoutMs) {
-				timeoutId = setTimeout(() => {
-					child.kill("SIGTERM");
-					reject(new Error("Command timed out"));
-				}, opts.timeoutMs);
-			}
-
-			// Streaming decoder keeps multi-byte characters intact across chunk boundaries.
-			const decoder = new TextDecoder("utf-8");
-			const recordStdout = (text: string): void => {
-				if (text === "") return;
-				chunks.push(text);
-				opts.onOutput?.(text);
-			};
-			child.stdout.on("data", (data: Buffer) => {
-				recordStdout(decoder.decode(data, { stream: true }));
-			});
-			const getStderr = collectStderr(child, opts.onOutput);
-
-			child.on("close", (code) => {
-				// Emit any bytes the decoder was still holding before the result is assembled.
-				recordStdout(decoder.decode());
-				void finalizeProcessClose({
-					code,
-					timeoutId,
-					handle,
-					cleanup: safeCleanup,
-					chunks,
-					getStderr,
-					resolve,
-					reject,
-				});
-			});
-			child.on("error", (err) => {
-				if (timeoutId) clearTimeout(timeoutId);
-				handle.close().catch(() => {});
-				void safeCleanup().then(() => reject(err));
-			});
-		} catch (err) {
-			// spawn() can throw synchronously (e.g. invalid arguments); release the input
-			// file handle before reporting the failure.
-			handle.close().catch(() => {});
-			void safeCleanup().then(() => reject(err));
-		}
-	});
-}
-/**
- * Finishes a streamed command after the child process has closed: cancels the timeout,
- * closes the input file handle, runs the caller's cleanup, then settles the outer promise.
- *
- * An exit code of 0 or null resolves with the joined stdout chunks; any other code
- * rejects with the error built by `processExitError`. Failures while closing the handle
- * or running cleanup are ignored so that exactly one of `resolve`/`reject` is always called.
- *
- * @param opts.code - Exit code reported by the process's close event.
- * @param opts.timeoutId - Pending timeout to cancel, if one was scheduled.
- * @param opts.handle - File handle of the stdin source to close.
- * @param opts.cleanup - Caller-supplied cleanup, run on a best-effort basis.
- * @param opts.chunks - stdout text collected so far.
- * @param opts.getStderr - Getter for the collected stderr text.
- * @param opts.resolve - Settles the outer promise successfully.
- * @param opts.reject - Settles the outer promise with an error.
- */
-export async function finalizeProcessClose(opts: {
-	code: number | null;
-	timeoutId?: ReturnType<typeof setTimeout>;
-	handle: FileHandle;
-	cleanup: () => Promise<void>;
-	chunks: string[];
-	getStderr: () => string;
-	resolve: (value: string) => void;
-	reject: (error: Error) => void;
-}): Promise<void> {
-	if (opts.timeoutId) clearTimeout(opts.timeoutId);
-	await opts.handle.close().catch(() => {});
-	try {
-		await opts.cleanup();
-	} catch {
-		// Cleanup is best-effort. Letting it throw here would skip resolve/reject below
-		// and leave the caller's promise pending forever.
-	}
-	if (opts.code === 0 || opts.code === null) {
-		opts.resolve(opts.chunks.join(""));
-	} else {
-		opts.reject(
-			processExitError(opts.code, opts.getStderr, () => opts.chunks.join("")),
-		);
-	}
-}
-/**
- * Tells whether CLI output contains one of the known usage/quota exhaustion phrases.
- * Matching is case-insensitive and purely substring based.
- */
-export function isUsageLimit(output: string): boolean {
-	const markers = [
-		"usage limit",
-		"quota exceeded",
-		"quota will reset",
-		"credit balance is too low",
-		"out of extra usage",
-		"out of usage",
-	];
-	const haystack = output.toLowerCase();
-	for (const marker of markers) {
-		if (haystack.includes(marker)) {
-			return true;
-		}
-	}
-	return false;
-}
-/**
- * Contract implemented by every CLI adapter held in the adapter registry.
- * It covers availability probing, running a prompt against a diff, and describing
- * where and how the CLI stores custom commands and skills.
- */
-export interface CLIAdapter {
-	/** Identifier of the adapter. */
-	name: string;
-	/** Resolves to whether the underlying CLI can be used. */
-	isAvailable(): Promise<boolean>;
-	/** Resolves to a health report for the underlying CLI. */
-	checkHealth(): Promise<CLIAdapterHealth>;
-	/**
-	 * Runs the CLI with the given prompt and diff and resolves with its textual output.
-	 */
-	execute(opts: {
-		/** Instructions handed to the CLI. */
-		prompt: string;
-		/** Diff text handed to the CLI together with the prompt. */
-		diff: string;
-		/** Optional model selection; adapters may ignore it. */
-		model?: string;
-		/** Optional time limit for the run, in milliseconds. */
-		timeoutMs?: number;
-		/** Optional callback for real-time output streaming */
-		onOutput?: (chunk: string) => void;
-		/** Whether to allow tool use for this adapter. Defaults to true. */
-		allowToolUse?: boolean;
-		/** Thinking budget level (off/low/medium/high). */
-		thinkingBudget?: string;
-	}): Promise<string>;
-	/**
-	 * Returns the project-scoped command directory path (relative to project root).
-	 * Returns null if the CLI only supports user-level commands.
-	 */
-	getProjectCommandDir(): string | null;
-	/**
-	 * Returns the user-level command directory path (absolute path).
-	 * Returns null if the CLI doesn't support user-level commands.
-	 */
-	getUserCommandDir(): string | null;
-	/**
-	 * Returns the project-scoped skill directory path (relative to project root).
-	 * Returns null if the CLI doesn't support the skills model.
-	 */
-	getProjectSkillDir(): string | null;
-	/**
-	 * Returns the user-level skill directory path (absolute path).
-	 * Returns null if the CLI doesn't support the skills model.
-	 */
-	getUserSkillDir(): string | null;
-	/**
-	 * Returns the command file extension used by this CLI.
-	 */
-	getCommandExtension(): string;
-	/**
-	 * Returns true if this adapter can use symlinks (same format as source Markdown).
-	 */
-	canUseSymlink(): boolean;
-	/**
-	 * Transforms gauntlet command content to this CLI's format.
-	 * The source content is always Markdown with YAML frontmatter.
-	 */
-	transformCommand(markdownContent: string): string;
-}
-import { ClaudeAdapter } from "./claude.js";
-import { CodexAdapter } from "./codex.js";
-import { CursorAdapter } from "./cursor.js";
-import { GeminiAdapter } from "./gemini.js";
-import { GitHubCopilotAdapter } from "./github-copilot.js";
-export {
-	GeminiAdapter,
-	CodexAdapter,
-	ClaudeAdapter,
-	GitHubCopilotAdapter,
-	CursorAdapter,
-};
-// Adapter registry: keys should use lowercase with hyphens for multi-word names
-// One shared instance per adapter is created when this module is loaded.
-// NOTE: this is a plain object, so indexing it with an arbitrary string can also reach
-// inherited Object.prototype members (e.g. "constructor"); check own keys when the name
-// comes from outside.
-const adapters: Record<string, CLIAdapter> = {
-	gemini: new GeminiAdapter(),
-	codex: new CodexAdapter(),
-	claude: new ClaudeAdapter(),
-	"github-copilot": new GitHubCopilotAdapter(),
-	cursor: new CursorAdapter(),
-};
-/**
- * Looks up a registered adapter by its registry key.
- *
- * Only the registry's own keys are considered: names that merely match a member
- * inherited from Object.prototype (such as "constructor" or "toString") yield
- * undefined rather than a value that is not an adapter.
- *
- * @param name - Registry key, e.g. "claude" or "github-copilot".
- * @returns The adapter registered under `name`, or undefined when there is none.
- */
-export function getAdapter(name: string): CLIAdapter | undefined {
-	return Object.prototype.hasOwnProperty.call(adapters, name)
-		? adapters[name]
-		: undefined;
-}
-/**
- * Returns every registered adapter, in registry insertion order.
- */
-export function getAllAdapters(): CLIAdapter[] {
-	return Object.entries(adapters).map(([, adapter]) => adapter);
-}
-/**
- * Lists the registered adapters whose project command directory is not null,
- * i.e. those that support project-scoped commands.
- */
-export function getProjectCommandAdapters(): CLIAdapter[] {
-	const supported: CLIAdapter[] = [];
-	for (const adapter of Object.values(adapters)) {
-		if (adapter.getProjectCommandDir() !== null) {
-			supported.push(adapter);
-		}
-	}
-	return supported;
-}
-/**
- * Lists the registered adapters whose user command directory is not null,
- * i.e. those that support user-level commands.
- */
-export function getUserCommandAdapters(): CLIAdapter[] {
-	const supported: CLIAdapter[] = [];
-	for (const adapter of Object.values(adapters)) {
-		if (adapter.getUserCommandDir() !== null) {
-			supported.push(adapter);
-		}
-	}
-	return supported;
-}
-/**
- * Lists the names accepted as CLI tools, which are exactly the adapter registry keys.
- */
-export function getValidCLITools(): string[] {
-	return Object.entries(adapters).map(([toolName]) => toolName);
-}

package/src/cli-adapters/thinking-budget.ts DELETED Viewed

@@ -1,23 +0,0 @@
-/**
- * Maps unified thinking budget levels to Claude MAX_THINKING_TOKENS values.
- * Keys are the level names (off/low/medium/high); "off" maps to 0 tokens.
- */
-export const CLAUDE_THINKING_TOKENS: Record<string, number> = {
-	off: 0,
-	low: 8000,
-	medium: 16000,
-	high: 31999,
-};
-/**
- * Maps unified thinking budget levels to Codex model_reasoning_effort values.
- * Note that "off" maps to the "minimal" effort setting rather than to a disabled state.
- */
-export const CODEX_REASONING_EFFORT: Record<string, string> = {
-	off: "minimal",
-	low: "low",
-	medium: "medium",
-	high: "high",
-};
-/**
- * Maps unified thinking budget levels to Gemini thinkingBudget values.
- * Keys are the level names (off/low/medium/high); "off" maps to a budget of 0.
- */
-export const GEMINI_THINKING_BUDGET: Record<string, number> = {
-	off: 0,
-	low: 4096,
-	medium: 8192,
-	high: 24576,
-};