npm - @pi-agents/orchid - Versions diffs - 0.1.0-beta.0 - Mend

@pi-agents/orchid 0.1.0-beta.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (163) hide show

package/CHANGELOG.md +41 -0
package/LICENSE +21 -0
package/README.md +246 -0
package/agents/AGENTS-MANIFEST.md +42 -0
package/agents/brain.md +42 -0
package/agents/context-builder.md +46 -0
package/agents/delegate.md +12 -0
package/agents/dev-1.md +42 -0
package/agents/oracle.md +73 -0
package/agents/planner.md +55 -0
package/agents/researcher.md +52 -0
package/agents/reviewer.md +79 -0
package/agents/scout.md +50 -0
package/agents/tester.md +45 -0
package/agents/worker.md +55 -0
package/extensions/ralph.ts +1 -0
package/extensions/reviewer-extension.ts +125 -0
package/extensions/task-orchestrator.ts +28 -0
package/package.json +63 -0
package/prompts/gather-context-and-clarify.md +13 -0
package/prompts/parallel-cleanup.md +59 -0
package/prompts/parallel-context-build.md +53 -0
package/prompts/parallel-handoff-plan.md +59 -0
package/prompts/parallel-research.md +50 -0
package/prompts/parallel-review.md +54 -0
package/prompts/review-loop.md +41 -0
package/skills/orchid/SKILL.md +214 -0
package/skills/orchid/orchid-cleanup/SKILL.md +122 -0
package/skills/orchid/orchid-converge/SKILL.md +124 -0
package/skills/orchid/orchid-decompose/SKILL.md +201 -0
package/skills/orchid/orchid-doctor/SKILL.md +162 -0
package/skills/orchid/orchid-investigate/SKILL.md +102 -0
package/skills/orchid/orchid-launch/SKILL.md +147 -0
package/skills/ralph/SKILL.md +73 -0
package/skills/subagents/pi-subagents/SKILL.md +813 -0
package/src/index.ts +7 -0
package/src/orchestrator/abort.ts +534 -0
package/src/orchestrator/agent-bridge-extension.ts +1020 -0
package/src/orchestrator/agent-host.ts +954 -0
package/src/orchestrator/cleanup.ts +776 -0
package/src/orchestrator/config-loader.ts +1412 -0
package/src/orchestrator/config-schema.ts +690 -0
package/src/orchestrator/config.ts +81 -0
package/src/orchestrator/context-window.ts +66 -0
package/src/orchestrator/diagnostic-reports.ts +475 -0
package/src/orchestrator/diagnostics.ts +394 -0
package/src/orchestrator/discovery.ts +1833 -0
package/src/orchestrator/engine-worker.ts +415 -0
package/src/orchestrator/engine.ts +5940 -0
package/src/orchestrator/execution.ts +3104 -0
package/src/orchestrator/extension.ts +5934 -0
package/src/orchestrator/formatting.ts +785 -0
package/src/orchestrator/git.ts +88 -0
package/src/orchestrator/index.ts +28 -0
package/src/orchestrator/lane-runner.ts +1787 -0
package/src/orchestrator/mailbox.ts +780 -0
package/src/orchestrator/merge.ts +3414 -0
package/src/orchestrator/messages.ts +1062 -0
package/src/orchestrator/migrations.ts +278 -0
package/src/orchestrator/naming.ts +117 -0
package/src/orchestrator/path-resolver.ts +275 -0
package/src/orchestrator/persistence.ts +2625 -0
package/src/orchestrator/process-registry.ts +452 -0
package/src/orchestrator/quality-gate.ts +1085 -0
package/src/orchestrator/resume.ts +3488 -0
package/src/orchestrator/sessions.ts +57 -0
package/src/orchestrator/settings-loader.ts +136 -0
package/src/orchestrator/settings-tui.ts +2208 -0
package/src/orchestrator/sidecar-telemetry.ts +267 -0
package/src/orchestrator/supervisor.ts +4548 -0
package/src/orchestrator/task-executor-core.ts +675 -0
package/src/orchestrator/tmux-compat.ts +37 -0
package/src/orchestrator/tool-allowlist-constants.ts +37 -0
package/src/orchestrator/types.ts +4465 -0
package/src/orchestrator/verification.ts +547 -0
package/src/orchestrator/waves.ts +1564 -0
package/src/orchestrator/workspace.ts +707 -0
package/src/orchestrator/worktree.ts +2725 -0
package/src/ralph/index.ts +825 -0
package/src/subagents/agents/agent-management.ts +648 -0
package/src/subagents/agents/agent-scope.ts +6 -0
package/src/subagents/agents/agent-selection.ts +23 -0
package/src/subagents/agents/agent-serializer.ts +86 -0
package/src/subagents/agents/agents.ts +832 -0
package/src/subagents/agents/chain-serializer.ts +137 -0
package/src/subagents/agents/frontmatter.ts +29 -0
package/src/subagents/agents/identity.ts +30 -0
package/src/subagents/agents/skills.ts +632 -0
package/src/subagents/extension/config.ts +16 -0
package/src/subagents/extension/control-notices.ts +92 -0
package/src/subagents/extension/doctor.ts +199 -0
package/src/subagents/extension/fanout-child.ts +170 -0
package/src/subagents/extension/index.ts +573 -0
package/src/subagents/extension/schemas.ts +168 -0
package/src/subagents/intercom/intercom-bridge.ts +379 -0
package/src/subagents/intercom/result-intercom.ts +377 -0
package/src/subagents/runs/background/async-execution.ts +712 -0
package/src/subagents/runs/background/async-job-tracker.ts +310 -0
package/src/subagents/runs/background/async-resume.ts +345 -0
package/src/subagents/runs/background/async-status.ts +325 -0
package/src/subagents/runs/background/completion-dedupe.ts +63 -0
package/src/subagents/runs/background/notify.ts +108 -0
package/src/subagents/runs/background/parallel-groups.ts +45 -0
package/src/subagents/runs/background/result-watcher.ts +307 -0
package/src/subagents/runs/background/run-id-resolver.ts +83 -0
package/src/subagents/runs/background/run-status.ts +269 -0
package/src/subagents/runs/background/stale-run-reconciler.ts +336 -0
package/src/subagents/runs/background/subagent-runner.ts +1808 -0
package/src/subagents/runs/background/top-level-async.ts +13 -0
package/src/subagents/runs/foreground/chain-clarify.ts +1333 -0
package/src/subagents/runs/foreground/chain-execution.ts +938 -0
package/src/subagents/runs/foreground/execution.ts +918 -0
package/src/subagents/runs/foreground/subagent-executor.ts +2527 -0
package/src/subagents/runs/shared/completion-guard.ts +147 -0
package/src/subagents/runs/shared/long-running-guard.ts +175 -0
package/src/subagents/runs/shared/mcp-direct-tool-allowlist.ts +365 -0
package/src/subagents/runs/shared/model-fallback.ts +103 -0
package/src/subagents/runs/shared/nested-events.ts +819 -0
package/src/subagents/runs/shared/nested-path.ts +52 -0
package/src/subagents/runs/shared/nested-render.ts +115 -0
package/src/subagents/runs/shared/parallel-utils.ts +109 -0
package/src/subagents/runs/shared/pi-args.ts +220 -0
package/src/subagents/runs/shared/pi-spawn.ts +115 -0
package/src/subagents/runs/shared/run-history.ts +60 -0
package/src/subagents/runs/shared/single-output.ts +164 -0
package/src/subagents/runs/shared/subagent-control.ts +226 -0
package/src/subagents/runs/shared/subagent-prompt-runtime.ts +170 -0
package/src/subagents/runs/shared/worktree.ts +577 -0
package/src/subagents/shared/artifacts.ts +98 -0
package/src/subagents/shared/atomic-json.ts +16 -0
package/src/subagents/shared/file-coalescer.ts +40 -0
package/src/subagents/shared/fork-context.ts +76 -0
package/src/subagents/shared/formatters.ts +133 -0
package/src/subagents/shared/jsonl-writer.ts +81 -0
package/src/subagents/shared/model-info.ts +78 -0
package/src/subagents/shared/post-exit-stdio-guard.ts +85 -0
package/src/subagents/shared/session-identity.ts +10 -0
package/src/subagents/shared/session-tokens.ts +44 -0
package/src/subagents/shared/settings.ts +397 -0
package/src/subagents/shared/status-format.ts +49 -0
package/src/subagents/shared/types.ts +822 -0
package/src/subagents/shared/utils.ts +450 -0
package/src/subagents/slash/prompt-template-bridge.ts +397 -0
package/src/subagents/slash/slash-bridge.ts +174 -0
package/src/subagents/slash/slash-commands.ts +528 -0
package/src/subagents/slash/slash-live-state.ts +292 -0
package/src/subagents/tui/render-helpers.ts +80 -0
package/src/subagents/tui/render.ts +1358 -0
package/templates/agents/local/supervisor.md +33 -0
package/templates/agents/local/task-merger.md +27 -0
package/templates/agents/local/task-reviewer.md +30 -0
package/templates/agents/local/task-worker.md +34 -0
package/templates/agents/supervisor-routing.md +92 -0
package/templates/agents/supervisor.md +229 -0
package/templates/agents/task-merger.md +214 -0
package/templates/agents/task-reviewer.md +260 -0
package/templates/agents/task-worker-segment.md +44 -0
package/templates/agents/task-worker.md +557 -0
package/templates/tasks/CONTEXT.md +30 -0
package/templates/tasks/EXAMPLE-001-hello-world/PROMPT.md +98 -0
package/templates/tasks/EXAMPLE-001-hello-world/STATUS.md +73 -0
package/templates/tasks/EXAMPLE-002-parallel-smoke/PROMPT.md +97 -0
package/templates/tasks/EXAMPLE-002-parallel-smoke/STATUS.md +73 -0

package/src/orchestrator/verification.ts ADDED Viewed

@@ -0,0 +1,547 @@
+/**
+ * Verification baseline fingerprinting system.
+ *
+ * Captures test output before and after merge, parses it into normalized
+ * fingerprints, and diffs to identify genuinely new failures vs pre-existing ones.
+ *
+ * Design notes:
+ *
+ * **Runner result schema:** Each command produces a CommandResult with:
+ *   - commandId: string key from testing.commands config
+ *   - exitCode: number (process exit code, -1 for spawn errors)
+ *   - stdout: string (captured raw stdout)
+ *   - stderr: string (captured raw stderr)
+ *   - durationMs: number
+ *   - error: string | null (spawn/timeout error message)
+ *
+ * **Fingerprint equality key:** Composite of all five fields joined by \0:
+ *   `${commandId}\0${file}\0${case}\0${kind}\0${messageNorm}`
+ *   Duplicates within a single run are collapsed before diffing.
+ *
+ * **messageNorm normalization rules:**
+ *   1. Strip ANSI escape sequences
+ *   2. Normalize path separators (backslash → forward slash)
+ *   3. Remove duration strings (e.g., "(42ms)", "(1.2s)")
+ *   4. Remove ISO-8601 timestamps
+ *   5. Collapse whitespace (runs of space/tab/newline → single space, then trim)
+ *   6. Truncate to 512 chars (bound fingerprint size)
+ *
+ * **Fallback for non-JSON output:**
+ *   If legacy Vitest JSON parsing fails (truncated, missing, non-JSON), produce
+ *   a single fingerprint with kind: "command_error" and the first 512 chars
+ *   of stderr (or stdout) as messageNorm.
+ *
+ * **Compatibility note:**
+ *   OrchID's default tests use Node.js native `node:test`. The Vitest parser
+ *   in this module is retained only for backward compatibility when projects
+ *   provide custom `testing.commands` that still emit Vitest JSON.
+ *
+ * @module orch/verification
+ */
+import { spawnSync } from "child_process";
+// ── Types ────────────────────────────────────────────────────────────
/**
 * One entry of the `testing.commands` configuration: an identifier paired
 * with the shell command that is run for it.
 */
export interface VerificationCommand {
	/** Stable config key (e.g., "test", "build"); doubles as the commandId. */
	id: string;
	/** Shell command line to execute. */
	command: string;
}
/**
 * Outcome of executing one verification command.
 */
export interface CommandResult {
	/** The `testing.commands` key this result belongs to (e.g., "test", "build"). */
	commandId: string;
	/** Exit code of the process; -1 when the command could not be spawned or timed out. */
	exitCode: number;
	/** Everything the command wrote to stdout. */
	stdout: string;
	/** Everything the command wrote to stderr. */
	stderr: string;
	/** Elapsed wall-clock time, in milliseconds. */
	durationMs: number;
	/** Spawn/timeout error description, or null when the command ran to completion. */
	error: string | null;
}
/**
 * Normalized identity of a single failing test outcome.
 *
 * Two fingerprints are considered equal only when all five fields match;
 * together they form the composite key.
 */
export interface TestFingerprint {
	/** `testing.commands` key of the command that produced this outcome. */
	commandId: string;
	/** Source file path, with forward slashes as separators. */
	file: string;
	/** Full test case name (describe > it chain). */
	case: string;
	/** Failure classification. */
	kind:
		| "assertion_error"
		| "runtime_error"
		| "timeout"
		| "command_error"
		| "unknown";
	/** Failure message after normalization (rules are listed in the module doc). */
	messageNorm: string;
}
/**
 * Snapshot of one verification run, taken either before the merge (the
 * baseline) or after it.
 */
export interface VerificationBaseline {
	/** Capture time as an ISO 8601 string. */
	capturedAt: string;
	/** Raw results, one entry per configured command. */
	commandResults: CommandResult[];
	/** Fingerprints gathered from every command result, with duplicates removed. */
	fingerprints: TestFingerprint[];
}
/**
 * Three-way classification produced by comparing a baseline fingerprint set
 * with a post-merge fingerprint set.
 */
export interface FingerprintDiff {
	/** Present after the merge but absent from the baseline. */
	newFailures: TestFingerprint[];
	/** Present in both the baseline and the post-merge run (pre-existing). */
	preExisting: TestFingerprint[];
	/** Present in the baseline but gone after the merge (fixed). */
	fixed: TestFingerprint[];
}
+// ── Normalization Helpers ────────────────────────────────────────────
/** Max length for normalized message strings */
const MESSAGE_NORM_MAX_LENGTH = 512;
// Built via `new RegExp` so Biome's noControlCharactersInRegex (which only
// inspects regex literals) does not flag the \u001b/\u009b escapes that are
// fundamental to ANSI sequence detection. Runtime behavior is identical to
// the equivalent literal regex; this is a static-analysis adjustment only.
const ANSI_REGEX = new RegExp(
	"[\\u001b\\u009b]\\[[()#;?]*(?:[0-9]{1,4}(?:;[0-9]{0,4})*)?[0-9A-ORZcf-nqry=><~]",
	"g",
);
/**
 * Match duration strings like (42ms), (1.2s), (3m 12s), 42 ms, 1200ms.
 *
 * The `\b` anchors are essential: the number must start at a word boundary
 * and the unit must end at one. Without them the pattern also matches the
 * beginning of ordinary words that follow a number ("5 matches" → "5 m",
 * "3 strings" → "3 s") and deletes text that is part of the real message.
 */
const DURATION_REGEX =
	/\(?\b\d+(?:\.\d+)?\s*(?:ms|s|m)\b(?:\s*\d+(?:\.\d+)?\s*(?:ms|s)\b)?\)?/g;
/**
 * Match ISO-8601 timestamps like 2026-03-20T12:34:56.789Z, including an
 * optional numeric UTC offset (+02:00, -0500) in place of the `Z` suffix.
 */
const TIMESTAMP_REGEX =
	/\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}(?:\.\d+)?(?:Z|[+-]\d{2}:?\d{2})?/g;
/**
 * Normalize a failure message for stable fingerprinting.
 *
 * 1. Strip ANSI escape sequences
 * 2. Normalize path separators (\ → /)
 * 3. Remove duration strings (e.g., "(42ms)", "(1.2s)")
 * 4. Remove ISO-8601 timestamps
 * 5. Collapse whitespace
 * 6. Truncate to MESSAGE_NORM_MAX_LENGTH
 *
 * Only volatile fragments (colors, timings, timestamps) are removed; numbers
 * that are followed by ordinary words are left intact so that two different
 * failures do not collapse into the same normalized text.
 *
 * @param raw - Raw failure message as emitted by the test runner
 * @returns The normalized message, at most MESSAGE_NORM_MAX_LENGTH characters long
 */
export function normalizeMessage(raw: string): string {
	let msg = raw;
	// 1. Strip ANSI
	msg = msg.replace(ANSI_REGEX, "");
	// 2. Normalize path separators
	msg = msg.replace(/\\/g, "/");
	// 3. Remove duration strings
	msg = msg.replace(DURATION_REGEX, "");
	// 4. Remove ISO-8601 timestamps
	msg = msg.replace(TIMESTAMP_REGEX, "");
	// 5. Collapse whitespace (also closes the gaps left by steps 3 and 4)
	msg = msg.replace(/\s+/g, " ").trim();
	// 6. Truncate
	if (msg.length > MESSAGE_NORM_MAX_LENGTH) {
		msg = msg.slice(0, MESSAGE_NORM_MAX_LENGTH);
	}
	return msg;
}
/**
 * Produce the fingerprint form of a file path by replacing every backslash
 * with a forward slash. Nothing else about the path is changed.
 *
 * @param raw - File path as reported by the test runner
 * @returns The same path using only forward-slash separators
 */
export function normalizeFilePath(raw: string): string {
	const segments = raw.split("\\");
	return segments.join("/");
}
/**
 * Build the string used to compare fingerprints in set operations.
 *
 * The five fields are concatenated in a fixed order (commandId, file, case,
 * kind, messageNorm) with a null byte between them, a separator that is
 * unlikely to occur in test output.
 *
 * @param fp - Fingerprint to derive the key from
 * @returns The composite key string
 */
export function fingerprintKey(fp: TestFingerprint): string {
	const separator = "\0";
	const parts = [fp.commandId, fp.file, fp.case, fp.kind, fp.messageNorm];
	return parts.map((part) => `${part}`).join(separator);
}
+// ── Command Runner ───────────────────────────────────────────────────
/** Default timeout for verification commands: 5 minutes */
const DEFAULT_COMMAND_TIMEOUT_MS = 5 * 60 * 1000;
/**
 * Upper bound on captured stdout/stderr per command: 64 MiB.
 *
 * `spawnSync` defaults `maxBuffer` to 1 MiB and terminates the child with
 * ENOBUFS once a stream exceeds it. Test runners with JSON reporters can
 * exceed 1 MiB, which would turn a normal test run into a command error in
 * both the baseline and the post-merge run and hide real differences.
 */
const MAX_COMMAND_OUTPUT_BYTES = 64 * 1024 * 1024;
/**
 * Run configured verification commands and return per-command results.
 *
 * Commands are iterated in deterministic insertion order of the
 * `testing.commands` config map. Each command runs synchronously through the
 * platform shell (`cmd /c` on Windows, `/bin/sh -c` elsewhere) in the
 * specified working directory (typically the merge worktree).
 *
 * This function does not throw for command failures: spawn errors, timeouts,
 * oversized output and unexpected exceptions are all reported through the
 * `error` field of the corresponding result with `exitCode` set to -1.
 *
 * @param commands  - Map of commandId → shell command string (from testing.commands config)
 * @param cwd       - Working directory to run commands in
 * @param timeoutMs - Per-command timeout in milliseconds (default: 5 min)
 * @returns Array of CommandResult in config iteration order
 */
export function runVerificationCommands(
	commands: Record<string, string>,
	cwd: string,
	timeoutMs: number = DEFAULT_COMMAND_TIMEOUT_MS,
): CommandResult[] {
	// The shell choice does not depend on the command, so resolve it once.
	const isWindows = process.platform === "win32";
	const shell = isWindows ? "cmd" : "/bin/sh";
	const shellFlag = isWindows ? "/c" : "-c";
	const results: CommandResult[] = [];
	for (const [commandId, command] of Object.entries(commands)) {
		const start = Date.now();
		try {
			const proc = spawnSync(shell, [shellFlag, command], {
				cwd,
				encoding: "utf-8",
				timeout: timeoutMs,
				maxBuffer: MAX_COMMAND_OUTPUT_BYTES,
				// All three streams are pipes: the child gets its own stdin
				// rather than the parent's, and stdout/stderr are captured.
				stdio: ["pipe", "pipe", "pipe"],
				env: { ...process.env },
			});
			const durationMs = Date.now() - start;
			if (proc.error) {
				// Spawn error, timeout, or output overflow
				const code = (proc.error as NodeJS.ErrnoException).code;
				let error: string;
				if (code === "ETIMEDOUT") {
					error = `Command timed out after ${timeoutMs}ms`;
				} else if (code === "ENOBUFS") {
					error = `Command output exceeded ${MAX_COMMAND_OUTPUT_BYTES} bytes`;
				} else {
					error = `Spawn error: ${proc.error.message}`;
				}
				results.push({
					commandId,
					exitCode: -1,
					// Partial output may still be available; keep whatever was captured.
					stdout: proc.stdout || "",
					stderr: proc.stderr || "",
					durationMs,
					error,
				});
			} else {
				results.push({
					commandId,
					// status is null when the child was terminated by a signal
					exitCode: proc.status ?? -1,
					stdout: proc.stdout || "",
					stderr: proc.stderr || "",
					durationMs,
					error: null,
				});
			}
		} catch (err: unknown) {
			// spawnSync itself threw (e.g., invalid options); report it as a result
			// so the remaining commands still run.
			const durationMs = Date.now() - start;
			const message = err instanceof Error ? err.message : String(err);
			results.push({
				commandId,
				exitCode: -1,
				stdout: "",
				stderr: "",
				durationMs,
				error: `Unexpected error: ${message}`,
			});
		}
	}
	return results;
}
+// ── Test Output Parsers ──────────────────────────────────────────────
/** A single test case entry inside a Vitest JSON file result. */
interface VitestAssertionResult {
	fullName?: string;
	status?: string;
	failureMessages?: string[];
}
/** A single test file entry inside a Vitest JSON report. */
interface VitestFileResult {
	name?: string;
	status?: string;
	message?: string;
	assertionResults?: VitestAssertionResult[];
}
/**
 * Shape of the Vitest JSON reporter output, limited to the fields this
 * module reads. Every field is optional because the report comes from an
 * external process.
 */
interface VitestJsonResult {
	testResults?: VitestFileResult[];
}
/**
 * Classify a failure message into a kind using keyword heuristics.
 *
 * Checks run in priority order: timeout, then assertion, then runtime error;
 * anything else is "unknown". Matching is case-insensitive.
 *
 * The "expect" and matcher-name markers ("toBe", "toEqual", "toHave…") must
 * start at a word boundary. A plain substring test would treat "Unexpected
 * token" as an assertion failure (it contains "expect") and would match
 * "tobe" inside "October".
 *
 * @param message - Raw failure message
 * @returns The failure kind inferred from the message text
 */
function classifyFailureKind(message: string): TestFingerprint["kind"] {
	const lower = message.toLowerCase();
	if (lower.includes("timeout") || lower.includes("timed out")) {
		return "timeout";
	}
	if (lower.includes("assert") || /\b(?:expect|tobe|toequal|tohave)/.test(lower)) {
		return "assertion_error";
	}
	if (
		lower.includes("referenceerror") ||
		lower.includes("typeerror") ||
		lower.includes("syntaxerror") ||
		lower.includes("cannot find module") ||
		lower.includes("is not defined") ||
		lower.includes("is not a function")
	) {
		return "runtime_error";
	}
	return "unknown";
}
/** True for any non-null object (including arrays); used to guard parsed JSON. */
function isRecord(value: unknown): value is Record<string, unknown> {
	return typeof value === "object" && value !== null;
}
/** Return the value when it is a non-empty string, otherwise undefined. */
function nonEmptyString(value: unknown): string | undefined {
	return typeof value === "string" && value.length > 0 ? value : undefined;
}
/** Join a `failureMessages` value into one string; tolerates a bare string or a missing value. */
function joinFailureMessages(value: unknown): string {
	if (Array.isArray(value)) return value.join("\n");
	return typeof value === "string" ? value : "";
}
/**
 * Extract the JSON report object from stdout, or null when stdout holds no
 * parseable JSON object. Tries the whole string first, then the span from
 * the first `{` to the last `}` (runners may print extra lines around it).
 */
function parseVitestReport(stdout: string): VitestJsonResult | null {
	let parsed: unknown;
	try {
		// First attempt: parse the whole stdout as JSON
		parsed = JSON.parse(stdout);
	} catch {
		// Second attempt: find the first { and last } to extract JSON block
		const firstBrace = stdout.indexOf("{");
		const lastBrace = stdout.lastIndexOf("}");
		if (firstBrace === -1 || lastBrace === -1 || lastBrace <= firstBrace) {
			return null;
		}
		try {
			parsed = JSON.parse(stdout.slice(firstBrace, lastBrace + 1));
		} catch {
			return null;
		}
	}
	// The runtime check above is what justifies viewing the value as a report.
	return isRecord(parsed) ? (parsed as VitestJsonResult) : null;
}
/**
 * Parse legacy Vitest JSON reporter output into test fingerprints.
 *
 * Expects stdout to contain a JSON object matching Vitest's JSON reporter format.
 * Only failed tests produce fingerprints (passed tests are irrelevant for baseline diffing).
 *
 * If JSON parsing fails or the top-level structure is unexpected (no
 * `testResults` array), returns null to signal that the caller should use
 * fallback fingerprinting.
 *
 * The report comes from an external process, so its entries are validated at
 * runtime: entries that are not objects are skipped, and fields of the wrong
 * type fall back to the same defaults used for missing fields. Malformed
 * reports therefore never make this function throw.
 *
 * @param commandId - The command that produced this output
 * @param stdout    - Raw stdout from the Vitest command (legacy compatibility path)
 * @returns Array of fingerprints for failed tests, or null if parsing fails
 */
export function parseVitestOutput(commandId: string, stdout: string): TestFingerprint[] | null {
	const report = parseVitestReport(stdout);
	if (report === null || !Array.isArray(report.testResults)) {
		return null;
	}
	const fingerprints: TestFingerprint[] = [];
	for (const testFile of report.testResults as unknown[]) {
		if (!isRecord(testFile)) continue;
		const file = normalizeFilePath(nonEmptyString(testFile.name) ?? "unknown");
		const assertions: unknown[] = Array.isArray(testFile.assertionResults)
			? testFile.assertionResults
			: [];
		let sawFailedAssertion = false;
		for (const assertion of assertions) {
			// Only fingerprint failures
			if (!isRecord(assertion) || assertion.status !== "failed") continue;
			sawFailedAssertion = true;
			const rawMessage = joinFailureMessages(assertion.failureMessages) || "no failure message";
			fingerprints.push({
				commandId,
				file,
				case: nonEmptyString(assertion.fullName) ?? "unknown",
				kind: classifyFailureKind(rawMessage),
				messageNorm: normalizeMessage(rawMessage),
			});
		}
		// Suite-level failures: testResults[].status === "failed" with no assertion-level details.
		// This covers setup/import/runtime-at-file-load errors where Vitest marks the file as
		// failed but produces no assertionResults (or only non-failed ones).
		if (testFile.status === "failed" && !sawFailedAssertion) {
			const suiteMessage = nonEmptyString(testFile.message) ?? "Suite failed with no message";
			fingerprints.push({
				commandId,
				file,
				case: "<suite>",
				kind: "runtime_error",
				messageNorm: normalizeMessage(suiteMessage),
			});
		}
	}
	return fingerprints;
}
/**
 * Turn one command result into normalized fingerprints.
 *
 * Decision order:
 * 1. A spawn/timeout error yields a single command_error fingerprint built
 *    from the error text.
 * 2. Exit code 0 yields no fingerprints.
 * 3. The legacy Vitest JSON adapter is tried; its fingerprints are returned
 *    when it produces at least one.
 * 4. Otherwise a single command_error fingerprint is built from stderr, or
 *    stdout when stderr is blank, or a fixed placeholder when both are blank.
 *
 * Parsers for other runners (jest, pytest, ...) can be slotted in as further
 * attempts ahead of the final fallback.
 *
 * @param commandResult - Result from runVerificationCommands
 * @returns Array of fingerprints (always non-empty for failed commands)
 */
export function parseTestOutput(commandResult: CommandResult): TestFingerprint[] {
	// Shared builder for the two command_error cases below.
	const asCommandError = (message: string): TestFingerprint[] => [
		{
			commandId: commandResult.commandId,
			file: "",
			case: "",
			kind: "command_error",
			messageNorm: normalizeMessage(message),
		},
	];

	// Spawn/timeout error: nothing to parse, report the error itself.
	if (commandResult.error) {
		return asCommandError(commandResult.error);
	}

	// A clean exit means there are no failures to fingerprint.
	if (commandResult.exitCode === 0) {
		return [];
	}

	// Legacy Vitest JSON adapter.
	const parsed = parseVitestOutput(commandResult.commandId, commandResult.stdout);
	if (parsed !== null && parsed.length > 0) {
		return parsed;
	}

	// Either the output was not Vitest JSON, or it parsed but held no failure
	// details despite the non-zero exit. Fall back to the raw output text.
	const fallbackText =
		commandResult.stderr.trim() || commandResult.stdout.trim() || "Command failed with no output";
	return asCommandError(fallbackText);
}
+// ── Fingerprint Diffing ──────────────────────────────────────────────
/**
 * Remove fingerprints whose composite key has already been seen.
 * The earliest fingerprint for each key is kept, and the relative order of
 * the kept fingerprints matches the input.
 *
 * @param fingerprints - Fingerprints, possibly containing duplicates
 * @returns A new array with one fingerprint per distinct key
 */
export function deduplicateFingerprints(fingerprints: TestFingerprint[]): TestFingerprint[] {
	// A Map iterates in insertion order, so first occurrences come out in input order.
	const firstByKey = new Map<string, TestFingerprint>();
	for (const candidate of fingerprints) {
		const key = fingerprintKey(candidate);
		if (firstByKey.has(key)) continue;
		firstByKey.set(key, candidate);
	}
	return Array.from(firstByKey.values());
}
/**
 * Compare two fingerprint sets and sort the failures into three groups:
 * new, pre-existing, and fixed.
 *
 * Each input is deduplicated first; membership is then decided by the
 * composite fingerprint key.
 *
 * @param baseline  - Fingerprints from pre-merge verification run
 * @param postMerge - Fingerprints from post-merge verification run
 * @returns FingerprintDiff with new failures, pre-existing, and fixed sets
 */
export function diffFingerprints(
	baseline: TestFingerprint[],
	postMerge: TestFingerprint[],
): FingerprintDiff {
	const before = deduplicateFingerprints(baseline);
	const after = deduplicateFingerprints(postMerge);
	const beforeKeys = new Set(before.map(fingerprintKey));
	const afterKeys = new Set(after.map(fingerprintKey));

	const wasInBaseline = (fp: TestFingerprint): boolean => beforeKeys.has(fingerprintKey(fp));
	const isInPostMerge = (fp: TestFingerprint): boolean => afterKeys.has(fingerprintKey(fp));

	return {
		// After the merge only
		newFailures: after.filter((fp) => !wasInBaseline(fp)),
		// On both sides
		preExisting: after.filter(wasInBaseline),
		// In the baseline only
		fixed: before.filter((fp) => !isInPostMerge(fp)),
	};
}
+// ── Baseline Capture ─────────────────────────────────────────────────
/**
 * Execute the verification commands and package the outcome as a snapshot.
 *
 * The snapshot holds the capture time, the raw per-command results, and the
 * deduplicated fingerprints parsed from those results.
 *
 * @param commands  - Map of commandId → shell command string
 * @param cwd       - Working directory (merge worktree)
 * @param timeoutMs - Per-command timeout
 * @returns VerificationBaseline with command results and extracted fingerprints
 */
export function captureBaseline(
	commands: Record<string, string>,
	cwd: string,
	timeoutMs?: number,
): VerificationBaseline {
	const commandResults = runVerificationCommands(commands, cwd, timeoutMs);
	// Gather the fingerprints of every command, in command order.
	const collected = commandResults.flatMap((result) => parseTestOutput(result));
	return {
		capturedAt: new Date().toISOString(),
		commandResults,
		fingerprints: deduplicateFingerprints(collected),
	};
}