npm - @agentplate/cli - Versions diffs - 1.0.0 → 1.2.0 - Mend

@agentplate/cli 1.0.0 → 1.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

package/CHANGELOG.md +50 -0
package/agents/coordinator.md +43 -13
package/agents/lead.md +8 -1
package/package.json +5 -5
package/src/agents/capacity.test.ts +55 -0
package/src/agents/capacity.ts +50 -0
package/src/agents/drive.test.ts +155 -0
package/src/agents/drive.ts +200 -0
package/src/agents/system-prompt.ts +2 -1
package/src/commands/sling.test.ts +84 -0
package/src/commands/sling.ts +73 -117
package/src/commands/spec.test.ts +142 -0
package/src/commands/spec.ts +192 -0
package/src/commands/turn.test.ts +101 -0
package/src/commands/turn.ts +113 -0
package/src/config.test.ts +18 -0
package/src/config.ts +6 -1
package/src/errors.ts +11 -0
package/src/index.ts +4 -0
package/src/insights/quality-gates.test.ts +43 -0
package/src/insights/quality-gates.ts +30 -31
package/src/merge/auto.test.ts +157 -0
package/src/merge/auto.ts +118 -0
package/src/paths.ts +2 -1
package/src/runtimes/resolve.test.ts +49 -0
package/src/runtimes/resolve.ts +11 -7
package/src/sessions/store.test.ts +13 -0
package/src/sessions/store.ts +20 -0
package/src/types.ts +16 -1
package/src/version.ts +1 -1
package/src/wizard/setup.test.ts +45 -0
package/src/wizard/setup.ts +119 -6
package/ui/dist/assets/index-DAq3_wei.css +1 -0
package/ui/dist/assets/index-DjRGeS6V.js +4227 -0
package/ui/dist/index.html +2 -2
package/ui/dist/assets/index-C7rXIMER.css +0 -1
package/ui/dist/assets/index-W4kbr4by.js +0 -4526

package/src/commands/turn.test.ts ADDED Viewed

@@ -0,0 +1,101 @@
+/**
+ * `agentplate turn` command tests. Real initialized temp project + a real (mock)
+ * runtime turn. Drives the exported command's action via parseAsync.
+ */
+import { afterEach, beforeEach, describe, expect, test } from "bun:test";
+import { mkdirSync, mkdtempSync, rmSync, writeFileSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import {
+	AGENTPLATE_DIR,
+	CONFIG_FILE,
+	DEFAULT_CONFIG,
+	serializeConfig,
+	setProjectRootOverride,
+} from "../config.ts";
+import { NotFoundError, ValidationError } from "../errors.ts";
+import { sessionsDbPath } from "../paths.ts";
+import { createSessionStore } from "../sessions/store.ts";
+import type { AgentSession, SessionState } from "../types.ts";
+import { createTurnCommand } from "./turn.ts";
+let root: string; // temp project root, recreated in beforeEach and removed in afterEach
+let worktree: string; // temp directory used as the seeded session's worktreePath
+/**
+ * Insert one agent session into the temp project's session store.
+ *
+ * The row defaults to an idle `builder-1` session pointing at the temp worktree;
+ * any field given in `over` replaces the default, so a test only spells out what
+ * it cares about. The store is closed before returning, even if the upsert throws.
+ */
+function seedSession(over: Partial<AgentSession>): void {
+	const sessions = createSessionStore(sessionsDbPath(root));
+	// One timestamp shared by startedAt and lastActivity.
+	const timestamp = new Date().toISOString();
+	try {
+		sessions.upsertSession({
+			id: `session-${crypto.randomUUID()}`,
+			agentName: "builder-1",
+			capability: "builder",
+			taskId: "task-1",
+			runId: "run-1",
+			worktreePath: worktree,
+			branchName: "agentplate/builder-1",
+			state: "idle",
+			parentAgent: "lead-1",
+			depth: 1,
+			pid: null,
+			runtimeSessionId: "sess-prior",
+			startedAt: timestamp,
+			lastActivity: timestamp,
+			// Caller overrides win over every default above.
+			...over,
+		});
+	} finally {
+		sessions.close();
+	}
+}
+/** Read the persisted state for `agent`; `undefined` when no session is stored for it. */
+function sessionState(agent: string): SessionState | undefined {
+	const sessions = createSessionStore(sessionsDbPath(root));
+	try {
+		const found = sessions.getSessionByAgent(agent);
+		return found?.state;
+	} finally {
+		sessions.close();
+	}
+}
+/** Build a fresh `turn` command and run its action with `agent` as the only argument. */
+async function runTurnCmd(agent: string): Promise<void> {
+	const command = createTurnCommand();
+	// `from: "user"` tells commander the array holds user arguments only.
+	await command.parseAsync([agent], { from: "user" });
+}
+// Each test gets its own initialized project (config written with the mock
+// runtime as default) plus a separate temp worktree directory.
+beforeEach(() => {
+	root = mkdtempSync(join(tmpdir(), "agentplate-turn-cmd-"));
+	worktree = mkdtempSync(join(tmpdir(), "agentplate-turn-wt-"));
+	const stateDir = join(root, AGENTPLATE_DIR);
+	mkdirSync(stateDir, { recursive: true });
+	const config = structuredClone(DEFAULT_CONFIG);
+	config.runtime.default = "mock";
+	writeFileSync(join(stateDir, CONFIG_FILE), serializeConfig(config), "utf8");
+	setProjectRootOverride(root);
+	// NOTE(review): presumably the command the mock runtime executes per turn — confirm.
+	process.env.AGENTPLATE_MOCK_CMD = "true";
+});
+// Undo everything beforeEach set up: the root override, both temp directories,
+// and the mock-command environment variable.
+afterEach(() => {
+	setProjectRootOverride(null);
+	rmSync(root, { recursive: true, force: true });
+	rmSync(worktree, { recursive: true, force: true });
+	// Remove the key rather than assigning `undefined`: under Node semantics an
+	// assignment to process.env is coerced to a string, which would leave the
+	// variable set to "undefined" for later tests and child processes.
+	Reflect.deleteProperty(process.env, "AGENTPLATE_MOCK_CMD");
+});
+describe("agentplate turn — refusals", () => {
+	test("throws NotFoundError for an unknown agent", async () => {
+		// Nothing is seeded, so no session exists for "ghost".
+		const attempt = runTurnCmd("ghost");
+		await expect(attempt).rejects.toBeInstanceOf(NotFoundError);
+	});
+	test("refuses a terminal (completed) agent", async () => {
+		seedSession({ state: "completed" });
+		const attempt = runTurnCmd("builder-1");
+		await expect(attempt).rejects.toBeInstanceOf(ValidationError);
+	});
+});
+describe("agentplate turn — runs the next turn", () => {
+	test("an idle agent takes another turn and transitions", async () => {
+		seedSession({ state: "idle" });
+		// Must resolve without throwing.
+		await runTurnCmd("builder-1");
+		// The mock no-op sends no terminal mail, so the agent is expected to stay idle.
+		const after = sessionState("builder-1");
+		expect(after).toBe("idle");
+	});
+});

package/src/commands/turn.ts ADDED Viewed

@@ -0,0 +1,113 @@
+/**
+ * `agentplate turn <agent>` — run the NEXT headless turn for an existing agent.
+ *
+ * Where `sling` opens a fresh runtime session (turn 1), `turn` **resumes** it: it
+ * passes the session's captured `runtimeSessionId` to the runtime's `--resume`, so
+ * follow-up turns keep the warm context and skip the cold-start cost. The agent's
+ * unread mail is injected as the turn's prompt; the shared {@link driveTurn} core
+ * handles the state transition, skills loop, and auto-merge identically to turn 1.
+ *
+ * This is the multi-turn primitive: a coordinator/lead (or a future watcher) calls
+ * it when new mail arrives for an `idle` agent. Spawn-per-turn is preserved — each
+ * call is one fresh, resumed runtime subprocess.
+ */
+import { existsSync } from "node:fs";
+import { Command } from "commander";
+import { driveTurn } from "../agents/drive.ts";
+import { buildDefaultManifest, getDefinition, loadManifest } from "../agents/manifest.ts";
+import { findProjectRoot, isInitialized, loadConfig } from "../config.ts";
+import { NotFoundError, ValidationError } from "../errors.ts";
+import { createEventStore } from "../events/store.ts";
+import { jsonOutput } from "../json.ts";
+import { brand, muted, printInfo, printSuccess } from "../logging/color.ts";
+import { createMailClient } from "../mail/client.ts";
+import { eventsDbPath, manifestFilePath, sessionsDbPath } from "../paths.ts";
+import { getRuntime } from "../runtimes/registry.ts";
+import { resolveModel } from "../runtimes/resolve.ts";
+import { createSessionStore } from "../sessions/store.ts";
+import type { SessionState } from "../types.ts";
+/** Options commander parses for `agentplate turn`. */
+interface TurnOptions {
+	/** Set when `--json` is passed to this command. */
+	json?: boolean;
+}
+/**
+ * States a turn can be driven from: paused/awaiting mail (not terminal, not
+ * mid-turn). A session in any other state is refused with a ValidationError.
+ */
+const DRIVABLE_STATES: ReadonlySet<SessionState> = new Set<SessionState>(["idle", "booting"]);
+/**
+ * Build the `agentplate turn <agent>` command.
+ *
+ * The action looks up the agent's session, refuses it unless its state is in
+ * `DRIVABLE_STATES`, and then runs exactly one turn through `driveTurn`. The
+ * turn's prompt is the agent's injected unread mail, or a generic "continue"
+ * nudge when there is none. With `--json` the result is emitted as a JSON
+ * object; otherwise a short human-readable summary is printed.
+ *
+ * @returns the configured commander `Command`.
+ * @throws ValidationError (from the action) when the project is not initialized
+ *   or the agent is not in a drivable state.
+ * @throws NotFoundError (from the action) when no session exists for the agent.
+ */
+export function createTurnCommand(): Command {
+	return new Command("turn")
+		.description("Run the next (resumed) turn for an existing agent")
+		.argument("<agent>", "agent name")
+		.option("--json", "output JSON")
+		.action(async (agent: string, _opts: TurnOptions, command: Command) => {
+			// Read through optsWithGlobals so a `--json` set on a parent command counts too.
+			const useJson = command.optsWithGlobals().json === true;
+			const root = findProjectRoot();
+			if (!isInitialized(root)) {
+				throw new ValidationError("Not initialized. Run `agentplate setup` first.");
+			}
+			const config = loadConfig(root);
+			// Handles are opened inside the try so that a failure while opening a
+			// later one still closes the ones already open.
+			let store: ReturnType<typeof createSessionStore> | undefined;
+			let mail: ReturnType<typeof createMailClient> | undefined;
+			let events: ReturnType<typeof createEventStore> | undefined;
+			try {
+				store = createSessionStore(sessionsDbPath(root));
+				mail = createMailClient(root);
+				events = createEventStore(eventsDbPath(root));
+				const session = store.getSessionByAgent(agent);
+				if (!session) throw new NotFoundError(`No agent named "${agent}".`);
+				if (!DRIVABLE_STATES.has(session.state)) {
+					// List every drivable state so the message matches the actual check.
+					const drivable = Array.from(DRIVABLE_STATES).join(" or ");
+					throw new ValidationError(
+						`Agent "${agent}" is ${session.state}; only an agent that is ${drivable} can take another turn.`,
+					);
+				}
+				// Use the project's manifest when one exists, else the built-in default.
+				const manifestPath = manifestFilePath(root);
+				const manifest = existsSync(manifestPath)
+					? loadManifest(manifestPath)
+					: buildDefaultManifest();
+				const def = getDefinition(manifest, session.capability);
+				// NOTE(review): both arguments are config.runtime.default — confirm
+				// against getRuntime's signature that this is intended.
+				const runtime = getRuntime(config.runtime.default, config.runtime.default);
+				const model = resolveModel(config, root, def.model, session.capability);
+				// The next turn's user text is the agent's unread mail (e.g. a child's
+				// reply or operator direction); fall back to a continue nudge.
+				const injected = mail.checkInject(agent);
+				const prompt =
+					injected.trim().length > 0
+						? injected
+						: "Continue your task. If it is complete, send your terminal mail.";
+				const { finalState, exitCode } = await driveTurn({
+					root,
+					config,
+					runtime,
+					store,
+					events,
+					mail,
+					session,
+					model,
+					prompt,
+					// Warm start: resume the runtime session captured on a prior turn.
+					resumeSessionId: session.runtimeSessionId ?? undefined,
+				});
+				if (useJson) {
+					jsonOutput({
+						agent,
+						capability: session.capability,
+						taskId: session.taskId,
+						state: finalState,
+						resumed: Boolean(session.runtimeSessionId),
+						exitCode,
+					});
+					return;
+				}
+				printSuccess(`${brand(agent)} [${session.capability}] → ${finalState}`);
+				printInfo(`  resumed: ${session.runtimeSessionId ? "yes (warm)" : "no (cold)"}`);
+				printInfo(`  worktree:${muted(` ${session.worktreePath}`)}`);
+			} finally {
+				// Close in reverse order of opening; skip any that never opened.
+				events?.close();
+				mail?.close();
+				store?.close();
+			}
+		});
+}

package/src/config.test.ts CHANGED Viewed

@@ -45,6 +45,13 @@ describe("loadConfig", () => {
 		expect(cfg.merge.aiResolveEnabled).toBe(true);
 	});
+	test("an old config without merge.autoMerge inherits the 'off' default (deep merge)", () => {
+		writeConfig(root, "config.yaml", "merge:\n  aiResolveEnabled: true\n");
+		const cfg = loadConfig(root);
+		expect(cfg.merge.autoMerge).toBe("off");
+		expect(cfg.merge.aiResolveEnabled).toBe(true);
+	});
 	test("config.local.yaml overrides config.yaml", () => {
 		writeConfig(root, "config.yaml", "runtime:\n  default: claude\n");
 		writeConfig(root, "config.local.yaml", "runtime:\n  default: gemini\n");
@@ -74,6 +81,17 @@ describe("validateConfig", () => {
 	test("accepts the defaults", () => {
 		expect(() => validateConfig(structuredClone(DEFAULT_CONFIG))).not.toThrow();
 	});
+	test("auto-merge defaults to off", () => {
+		expect(DEFAULT_CONFIG.merge.autoMerge).toBe("off");
+	});
+	test("rejects an unknown merge.autoMerge mode", () => {
+		const cfg = structuredClone(DEFAULT_CONFIG);
+		// @ts-expect-error intentionally invalid value
+		cfg.merge.autoMerge = "always";
+		expect(() => validateConfig(cfg)).toThrow();
+	});
 });
 describe("isInitialized / serializeConfig", () => {

package/src/config.ts CHANGED Viewed

@@ -13,7 +13,7 @@ import { existsSync, readFileSync } from "node:fs";
 import { join, resolve } from "node:path";
 import yaml from "js-yaml";
 import { ConfigError } from "./errors.ts";
-import type { AgentplateConfig } from "./types.ts";
+import type { AgentplateConfig, AutoMergeMode } from "./types.ts";
 /** Directory (relative to project root) holding all Agentplate state. */
 export const AGENTPLATE_DIR = ".agentplate";
@@ -46,6 +46,7 @@ export const DEFAULT_CONFIG: AgentplateConfig = {
 	},
 	merge: {
 		aiResolveEnabled: true,
+		autoMerge: "off",
 	},
 	skills: {
 		enabled: true,
@@ -175,6 +176,10 @@ export function validateConfig(config: AgentplateConfig): void {
 			"config.agents.idleTimeoutMinutes must be >= 0 (0 disables idle reaping)",
 		);
 	}
+	const autoMergeModes: AutoMergeMode[] = ["off", "on-gates-pass", "on-complete"];
+	if (!autoMergeModes.includes(config.merge.autoMerge)) {
+		throw new ConfigError(`config.merge.autoMerge must be one of: ${autoMergeModes.join(", ")}`);
+	}
 }
 /**

package/src/errors.ts CHANGED Viewed

@@ -63,6 +63,17 @@ export class NotFoundError extends AgentplateError {
 	}
 }
+/**
+ * A spawn was refused because it would exceed a configured orchestration limit
+ * (maxConcurrent / maxAgentsPerLead / maxDepth). Distinct exit code so callers
+ * (a lead/coordinator) can recognize "at capacity — back off and retry later".
+ *
+ * Passes the code `"CAPACITY_EXCEEDED"` and the number `5` to the base
+ * constructor (NOTE(review): `5` is presumably the process exit code — the base
+ * class is not visible in this hunk; confirm).
+ *
+ * @param message human-readable description of which limit was hit.
+ */
+export class CapacityError extends AgentplateError {
+	constructor(message: string) {
+		super(message, "CAPACITY_EXCEEDED", 5);
+	}
+}
 /** Type guard: is the given value an AgentplateError? */
 export function isAgentplateError(value: unknown): value is AgentplateError {
 	return value instanceof AgentplateError;

package/src/index.ts CHANGED Viewed

@@ -30,9 +30,11 @@ import { createSetupCommand } from "./commands/setup.ts";
 import { createShipCommand } from "./commands/ship.ts";
 import { createSkillCommand } from "./commands/skill.ts";
 import { createSlingCommand } from "./commands/sling.ts";
+import { createSpecCommand } from "./commands/spec.ts";
 import { createStatusCommand } from "./commands/status.ts";
 import { createStopCommand } from "./commands/stop.ts";
 import { createTuiCommand } from "./commands/tui.ts";
+import { createTurnCommand } from "./commands/turn.ts";
 import { createWorktreeCommand } from "./commands/worktree.ts";
 import { setProjectRootOverride } from "./config.ts";
 import { isAgentplateError } from "./errors.ts";
@@ -95,6 +97,8 @@ function buildProgram(): Command {
 	// Orchestration
 	program.addCommand(createCoordinatorCommand());
 	program.addCommand(createSlingCommand());
+	program.addCommand(createTurnCommand());
+	program.addCommand(createSpecCommand());
 	program.addCommand(createStatusCommand());
 	program.addCommand(createMailCommand());
 	program.addCommand(createMergeCommand());

package/src/insights/quality-gates.test.ts ADDED Viewed

@@ -0,0 +1,43 @@
+/**
+ * Tests for runQualityGates. Real subprocesses (no mocks) — gates are shell
+ * commands, so we use `true`/`false`/`sleep` to exercise pass/fail/partial and to
+ * prove the gates run concurrently (wall-clock < sum of durations).
+ */
+import { describe, expect, test } from "bun:test";
+import type { QualityGate } from "../types.ts";
+import { runQualityGates } from "./quality-gates.ts";
+/** Build a QualityGate from a display name and the shell command it runs. */
+function gate(name: string, command: string): QualityGate {
+	return { name, command };
+}
+describe("runQualityGates", () => {
+	test("returns null when there are no gates", async () => {
+		const outcome = await runQualityGates([], process.cwd());
+		expect(outcome).toBeNull();
+	});
+	test("all passing → success", async () => {
+		const passing = [gate("a", "true"), gate("b", "true")];
+		const outcome = await runQualityGates(passing, process.cwd());
+		expect(outcome?.status).toBe("success");
+		expect(outcome?.results.every((r) => r.passed)).toBe(true);
+	});
+	test("all failing → failure", async () => {
+		const failing = [gate("a", "false"), gate("b", "false")];
+		const outcome = await runQualityGates(failing, process.cwd());
+		expect(outcome?.status).toBe("failure");
+	});
+	test("mixed → partial", async () => {
+		const mixed = [gate("ok", "true"), gate("bad", "false")];
+		const outcome = await runQualityGates(mixed, process.cwd());
+		expect(outcome?.status).toBe("partial");
+		// Results must come back in input order even though gates run concurrently.
+		const names = outcome?.results.map((r) => r.name);
+		expect(names).toEqual(["ok", "bad"]);
+	});
+	test("gates run concurrently (wall-clock well under the sum)", async () => {
+		const sleepers = ["s1", "s2", "s3"].map((name) => gate(name, "sleep 0.3"));
+		const outcome = await runQualityGates(sleepers, process.cwd());
+		expect(outcome?.status).toBe("success");
+		// Three 0.3s sleeps back-to-back would take ~900ms; a concurrent run
+		// should finish well under that. A missing outcome fails via +Infinity.
+		const elapsed = outcome?.totalDurationMs ?? Number.POSITIVE_INFINITY;
+		expect(elapsed).toBeLessThan(700);
+	});
+});

package/src/insights/quality-gates.ts CHANGED Viewed

@@ -34,37 +34,36 @@ export async function runQualityGates(
 ): Promise<QualityGateOutcome | null> {
 	if (gates.length === 0) return null;
-	const results: GateResult[] = [];
-	let total = 0;
-	for (const gate of gates) {
-		const started = performance.now();
-		let exitCode = 1;
-		try {
-			// Run the gate through the platform shell: `cmd /c` on Windows (no bash
-			// there), `bash -lc` elsewhere. `.cmd` shims (biome/tsc) resolve under both.
-			const shellArgv =
-				process.platform === "win32"
-					? ["cmd", "/d", "/s", "/c", gate.command]
-					: ["bash", "-lc", gate.command];
-			const proc = Bun.spawn(shellArgv, {
-				cwd,
-				stdout: "pipe",
-				stderr: "pipe",
-			});
-			exitCode = await proc.exited;
-		} catch {
-			exitCode = 1;
-		}
-		const durationMs = Math.round(performance.now() - started);
-		total += durationMs;
-		results.push({
-			name: gate.name,
-			command: gate.command,
-			passed: exitCode === 0,
-			exitCode,
-			durationMs,
-		});
-	}
+	// Gates are independent checks, so run them concurrently and measure the
+	// outcome by wall-clock — `totalDurationMs` is the elapsed time of the whole
+	// batch (the slowest gate), not the sum of all gates.
+	const overallStart = performance.now();
+	const results: GateResult[] = await Promise.all(
+		gates.map(async (gate): Promise<GateResult> => {
+			const started = performance.now();
+			let exitCode = 1;
+			try {
+				// Run the gate through the platform shell: `cmd /c` on Windows (no bash
+				// there), `bash -lc` elsewhere. `.cmd` shims (biome/tsc) resolve under both.
+				const shellArgv =
+					process.platform === "win32"
+						? ["cmd", "/d", "/s", "/c", gate.command]
+						: ["bash", "-lc", gate.command];
+				const proc = Bun.spawn(shellArgv, { cwd, stdout: "pipe", stderr: "pipe" });
+				exitCode = await proc.exited;
+			} catch {
+				exitCode = 1;
+			}
+			return {
+				name: gate.name,
+				command: gate.command,
+				passed: exitCode === 0,
+				exitCode,
+				durationMs: Math.round(performance.now() - started),
+			};
+		}),
+	);
+	const total = Math.round(performance.now() - overallStart);
 	const passed = results.filter((r) => r.passed).length;
 	const status: OutcomeStatus =

package/src/merge/auto.test.ts ADDED Viewed

@@ -0,0 +1,157 @@
+/**
+ * Tests for auto-merge (maybeAutoMerge).
+ *
+ * Real git repos in temp dirs (per "never mock what you can use for real"), the
+ * real merge queue + lock, and a recording mail stub so we can assert the outcome
+ * notifications without a mail DB. Covers the mode gate, the capability skip, the
+ * gates-pass fail-closed rule, a clean landing, and a reported conflict.
+ */
+import { afterEach, beforeEach, describe, expect, test } from "bun:test";
+import { existsSync, mkdirSync, mkdtempSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import type { Capability, NewMail } from "../types.ts";
+import { type AutoMergeParams, maybeAutoMerge } from "./auto.ts";
+let repo: string; // temp git repository, created in beforeEach and removed in afterEach
+/**
+ * Run `git <args>` inside the temp repo.
+ *
+ * stdout and stderr are read concurrently with waiting for the process to exit.
+ *
+ * @returns the command's stdout.
+ * @throws Error carrying the exit code and stderr when git exits non-zero.
+ */
+async function git(...args: string[]): Promise<string> {
+	const child = Bun.spawn(["git", ...args], { cwd: repo, stdout: "pipe", stderr: "pipe" });
+	const [out, err, code] = await Promise.all([
+		new Response(child.stdout).text(),
+		new Response(child.stderr).text(),
+		child.exited,
+	]);
+	if (code === 0) return out;
+	throw new Error(`git ${args.join(" ")} failed (${code}): ${err}`);
+}
+/**
+ * Recording mail stub satisfying the `{ send }` surface maybeAutoMerge needs.
+ * Every sent mail is reduced to its `type`, `subject` and `to` and appended to
+ * `sent`, which tests inspect afterwards.
+ */
+function recordingMail() {
+	const sent: Array<{ type: string; subject: string; to: string }> = [];
+	const send = ({ type, subject, to }: NewMail): void => {
+		sent.push({ type, subject, to });
+	};
+	return { sent, send };
+}
+/**
+ * Build AutoMergeParams for a test: a `builder-x` worker on branch
+ * `agentplate/builder-x` targeting `main` in the temp repo, mode `on-complete`,
+ * AI resolve enabled, no gate status. `over` must supply `mail` and may replace
+ * any default.
+ */
+function params(
+	over: Partial<AutoMergeParams> & { mail: ReturnType<typeof recordingMail> },
+): AutoMergeParams {
+	const defaults: Omit<AutoMergeParams, "mail"> = {
+		root: repo,
+		branchName: "agentplate/builder-x",
+		targetBranch: "main",
+		capability: "builder" as Capability,
+		agentName: "builder-x",
+		taskId: "task-x",
+		parent: "lead-1",
+		mode: "on-complete",
+		aiResolveEnabled: true,
+		gateStatus: null,
+	};
+	// Per-test overrides (including the required mail stub) win over the defaults.
+	return { ...defaults, ...over };
+}
+// Fresh repo per test: a `.agentplate` directory, a configured identity, and a
+// single commit on `main` containing base.txt.
+beforeEach(async () => {
+	repo = mkdtempSync(join(tmpdir(), "agentplate-automerge-"));
+	mkdirSync(join(repo, ".agentplate"), { recursive: true });
+	const setup: string[][] = [
+		["init", "-q"],
+		["config", "user.email", "test@agentplate.dev"],
+		["config", "user.name", "Agentplate Test"],
+		["checkout", "-q", "-b", "main"],
+	];
+	// Order matters, so run the git commands one after another.
+	for (const argv of setup) {
+		await git(...argv);
+	}
+	await Bun.write(join(repo, "base.txt"), "base\n");
+	await git("add", "-A");
+	await git("commit", "-q", "-m", "initial");
+});
+// Remove the temp repo; `force` keeps cleanup quiet if it is already gone.
+afterEach(() => {
+	rmSync(repo, { recursive: true, force: true });
+});
+/**
+ * Create `branch` from the current HEAD, commit a new file named `file` on it,
+ * then check `main` out again so the caller starts from the target branch.
+ */
+async function workerBranchWithCommit(branch: string, file: string): Promise<void> {
+	const target = join(repo, file);
+	await git("checkout", "-q", "-b", branch);
+	await Bun.write(target, "from worker\n");
+	await git("add", "-A");
+	await git("commit", "-q", "-m", `add ${file}`);
+	await git("checkout", "-q", "main");
+}
+describe("maybeAutoMerge — gating", () => {
+	test("mode 'off' never merges", async () => {
+		const mail = recordingMail();
+		await workerBranchWithCommit("agentplate/builder-x", "feature.txt");
+		const outcome = await maybeAutoMerge(params({ mail, mode: "off" }));
+		expect(outcome).toEqual({ merged: false, reason: "disabled" });
+		// The worker's file must not have reached main, and no mail goes out.
+		const landed = existsSync(join(repo, "feature.txt"));
+		expect(landed).toBe(false);
+		expect(mail.sent).toHaveLength(0);
+	});
+	test("read-only capabilities are skipped", async () => {
+		const mail = recordingMail();
+		const readOnly = ["scout", "merger"] as Capability[];
+		for (const capability of readOnly) {
+			const outcome = await maybeAutoMerge(params({ mail, capability }));
+			expect(outcome).toEqual({ merged: false, reason: "capability-skipped" });
+		}
+		expect(mail.sent).toHaveLength(0);
+	});
+	test("on-gates-pass holds (fail-closed) when gates did not pass", async () => {
+		const mail = recordingMail();
+		await workerBranchWithCommit("agentplate/builder-x", "feature.txt");
+		// Anything other than a gate "success" — including no result at all — must hold.
+		for (const gateStatus of [null, "failure", "partial"] as const) {
+			const outcome = await maybeAutoMerge(params({ mail, mode: "on-gates-pass", gateStatus }));
+			expect(outcome).toEqual({ merged: false, reason: "gates-not-passed" });
+		}
+		const landed = existsSync(join(repo, "feature.txt"));
+		expect(landed).toBe(false);
+		// Any mail sent while holding must be a plain status notice.
+		expect(mail.sent.every((m) => m.type === "status")).toBe(true);
+	});
+});
+describe("maybeAutoMerge — landing", () => {
+	test("on-complete lands the branch and reports 'merged'", async () => {
+		const mail = recordingMail();
+		await workerBranchWithCommit("agentplate/builder-x", "feature.txt");
+		const outcome = await maybeAutoMerge(params({ mail, mode: "on-complete" }));
+		expect(outcome).toEqual({ merged: true, status: "merged", tier: "clean-merge" });
+		// The worker's file is now present on main.
+		const landed = existsSync(join(repo, "feature.txt"));
+		expect(landed).toBe(true);
+		// Exactly one notification, addressed to the parent lead.
+		expect(mail.sent).toHaveLength(1);
+		expect(mail.sent[0]).toMatchObject({ type: "merged", to: "lead-1" });
+	});
+	test("on-gates-pass merges on a clean gate success", async () => {
+		const mail = recordingMail();
+		await workerBranchWithCommit("agentplate/builder-x", "feature.txt");
+		const request = params({ mail, mode: "on-gates-pass", gateStatus: "success" });
+		const outcome = await maybeAutoMerge(request);
+		expect(outcome).toMatchObject({ merged: true, status: "merged" });
+		const landed = existsSync(join(repo, "feature.txt"));
+		expect(landed).toBe(true);
+	});
+	test("an unresolved conflict reports 'merge_failed' (never throws)", async () => {
+		const mail = recordingMail();
+		const contested = join(repo, "base.txt");
+		// Worker side: edit base.txt on the worker branch.
+		await git("checkout", "-q", "-b", "agentplate/builder-x");
+		await Bun.write(contested, "worker change\n");
+		await git("add", "-A");
+		await git("commit", "-q", "-m", "worker edits base");
+		// Main side: a different edit to the same file, so the merge conflicts.
+		await git("checkout", "-q", "main");
+		await Bun.write(contested, "main change\n");
+		await git("add", "-A");
+		await git("commit", "-q", "-m", "main edits base");
+		// With aiResolveEnabled=false the conflict is left unresolved and the merge fails.
+		const request = params({ mail, mode: "on-complete", aiResolveEnabled: false });
+		const outcome = await maybeAutoMerge(request);
+		expect(outcome.merged).toBe(false);
+		expect(outcome).toMatchObject({ reason: "merge-failed" });
+		expect(mail.sent[0]).toMatchObject({ type: "merge_failed" });
+	});
+});