npm - @os-eco/overstory-cli - Versions diffs - 0.8.5 → 0.8.7 - Mend

@os-eco/overstory-cli 0.8.5 → 0.8.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (53)

package/README.md +13 -9
package/agents/coordinator.md +52 -4
package/package.json +1 -1
package/src/agents/hooks-deployer.test.ts +185 -12
package/src/agents/hooks-deployer.ts +57 -1
package/src/commands/clean.test.ts +136 -0
package/src/commands/clean.ts +198 -4
package/src/commands/coordinator.test.ts +494 -6
package/src/commands/coordinator.ts +200 -4
package/src/commands/dashboard.ts +84 -18
package/src/commands/ecosystem.test.ts +101 -0
package/src/commands/init.test.ts +211 -0
package/src/commands/init.ts +93 -15
package/src/commands/log.test.ts +10 -11
package/src/commands/log.ts +31 -32
package/src/commands/prime.ts +30 -5
package/src/commands/sling.test.ts +33 -0
package/src/commands/sling.ts +416 -358
package/src/commands/spec.ts +8 -2
package/src/commands/stop.test.ts +127 -6
package/src/commands/stop.ts +95 -43
package/src/commands/supervisor.ts +2 -0
package/src/commands/watch.ts +29 -9
package/src/config.test.ts +72 -0
package/src/config.ts +26 -1
package/src/index.ts +4 -1
package/src/merge/resolver.test.ts +383 -25
package/src/merge/resolver.ts +291 -98
package/src/runtimes/claude.test.ts +32 -7
package/src/runtimes/claude.ts +19 -4
package/src/runtimes/codex.test.ts +13 -0
package/src/runtimes/codex.ts +18 -2
package/src/runtimes/copilot.ts +3 -0
package/src/runtimes/cursor.test.ts +497 -0
package/src/runtimes/cursor.ts +205 -0
package/src/runtimes/gemini.ts +3 -0
package/src/runtimes/opencode.ts +3 -0
package/src/runtimes/pi.test.ts +119 -2
package/src/runtimes/pi.ts +64 -12
package/src/runtimes/registry.test.ts +21 -1
package/src/runtimes/registry.ts +3 -0
package/src/runtimes/sapling.ts +3 -0
package/src/runtimes/types.ts +5 -0
package/src/schema-consistency.test.ts +1 -0
package/src/sessions/store.test.ts +178 -0
package/src/sessions/store.ts +44 -8
package/src/types.ts +25 -1
package/src/watchdog/daemon.test.ts +257 -0
package/src/watchdog/daemon.ts +66 -23
package/src/worktree/manager.test.ts +65 -1
package/src/worktree/manager.ts +36 -0
package/src/worktree/tmux.test.ts +150 -0
package/src/worktree/tmux.ts +126 -23

package/src/commands/sling.ts CHANGED

@@ -38,12 +38,15 @@ import { createRunStore } from "../sessions/store.ts";
 import type { TrackerIssue } from "../tracker/factory.ts";
 import { createTrackerClient, resolveBackend, trackerCliName } from "../tracker/factory.ts";
 import type { AgentSession, OverlayConfig } from "../types.ts";
-import { createWorktree } from "../worktree/manager.ts";
+import { createWorktree, rollbackWorktree } from "../worktree/manager.ts";
 import { spawnHeadlessAgent } from "../worktree/process.ts";
 import {
 	capturePaneContent,
+	checkSessionState,
 	createSession,
 	ensureTmuxAvailable,
+	isSessionAlive,
+	killSession,
 	sendKeys,
 	waitForTuiReady,
 } from "../worktree/tmux.ts";
@@ -274,6 +277,27 @@ export function shouldShowScoutWarning(
 	return !parentHasScouts(sessions, parentAgent);
 }
+/**
+ * Resolve which canonical repo directories should be writable to an
+ * interactive agent runtime in addition to its worktree sandbox.
+ *
+ * All interactive agents need `.overstory` so they can access shared mail,
+ * metrics, and session state. Only `lead` agents need canonical `.git`
+ * because they can spawn child worktrees from inside the runtime.
+ *
+ * @param projectRoot - Absolute path to the canonical repository root
+ * @param capability - Capability being launched
+ * @returns A freshly built array: always `<projectRoot>/.overstory` first,
+ *   followed by `<projectRoot>/.git` only when `capability` is exactly `"lead"`
+ */
+export function getSharedWritableDirs(projectRoot: string, capability: string): string[] {
+	const sharedWritableDirs = [join(projectRoot, ".overstory")];
+	// Strict string comparison: any capability other than "lead" gets `.overstory` only.
+	if (capability === "lead") {
+		sharedWritableDirs.push(join(projectRoot, ".git"));
+	}
+	return sharedWritableDirs;
+}
 /**
  * Check if any active agent is already working on the given task ID.
  * Returns the agent name if locked, or null if the task is free.
@@ -569,47 +593,63 @@ export async function slingCommand(taskId: string, opts: SlingOptions): Promise<
 	// 4. Resolve or create run_id for this spawn
 	const overstoryDir = join(config.project.root, ".overstory");
 	const currentRunPath = join(overstoryDir, "current-run.txt");
-	let runId: string;
-	const currentRunFile = Bun.file(currentRunPath);
-	if (await currentRunFile.exists()) {
-		runId = (await currentRunFile.text()).trim();
-	} else {
-		runId = `run-${new Date().toISOString().replace(/[:.]/g, "-")}`;
-		const runStore = createRunStore(join(overstoryDir, "sessions.db"));
-		try {
-			runStore.createRun({
-				id: runId,
-				startedAt: new Date().toISOString(),
-				coordinatorSessionId: null,
-				status: "active",
-			});
-		} finally {
-			runStore.close();
-		}
-		await Bun.write(currentRunPath, runId);
-	}
-	// 4b. Check per-run session limit
-	if (config.agents.maxSessionsPerRun > 0) {
-		const runCheckStore = createRunStore(join(overstoryDir, "sessions.db"));
-		try {
-			const run = runCheckStore.getRun(runId);
-			if (run && checkRunSessionLimit(config.agents.maxSessionsPerRun, run.agentCount)) {
-				throw new AgentError(
-					`Run session limit reached: ${run.agentCount}/${config.agents.maxSessionsPerRun} agents spawned in run "${runId}". ` +
-						`Increase agents.maxSessionsPerRun in config.yaml or start a new run.`,
-					{ agentName: name },
-				);
-			}
-		} finally {
-			runCheckStore.close();
-		}
-	}
 	// 5. Check name uniqueness and concurrency limit against active sessions
+	// (Session store opened here so we can also use it for parent run ID inheritance in step 4.)
 	const { store } = openSessionStore(overstoryDir);
 	try {
+		// 4a. Resolve run ID: inherit from parent → current-run.txt fallback → create new.
+		// Parent inheritance ensures child agents belong to the same run as their coordinator.
+		const runId = await (async (): Promise<string> => {
+			if (parentAgent) {
+				const parentSession = store.getByName(parentAgent);
+				if (parentSession?.runId) {
+					return parentSession.runId;
+				}
+			}
+			// Fallback: read current-run.txt (backward compat with single-coordinator setups).
+			const currentRunFile = Bun.file(currentRunPath);
+			if (await currentRunFile.exists()) {
+				const text = (await currentRunFile.text()).trim();
+				if (text) return text;
+			}
+			// Create a new run if none exists.
+			const newRunId = `run-${new Date().toISOString().replace(/[:.]/g, "-")}`;
+			const runStore = createRunStore(join(overstoryDir, "sessions.db"));
+			try {
+				runStore.createRun({
+					id: newRunId,
+					startedAt: new Date().toISOString(),
+					coordinatorSessionId: null,
+					coordinatorName: null,
+					status: "active",
+				});
+			} finally {
+				runStore.close();
+			}
+			await Bun.write(currentRunPath, newRunId);
+			return newRunId;
+		})();
+		// 4b. Check per-run session limit
+		if (config.agents.maxSessionsPerRun > 0) {
+			const runCheckStore = createRunStore(join(overstoryDir, "sessions.db"));
+			try {
+				const run = runCheckStore.getRun(runId);
+				if (run && checkRunSessionLimit(config.agents.maxSessionsPerRun, run.agentCount)) {
+					throw new AgentError(
+						`Run session limit reached: ${run.agentCount}/${config.agents.maxSessionsPerRun} agents spawned in run "${runId}". ` +
+							`Increase agents.maxSessionsPerRun in config.yaml or start a new run.`,
+						{ agentName: name },
+					);
+				}
+			} finally {
+				runCheckStore.close();
+			}
+		}
 		const activeSessions = store.getActive();
 		if (activeSessions.length >= config.agents.maxConcurrent) {
 			throw new AgentError(
@@ -724,367 +764,385 @@ export async function slingCommand(taskId: string, opts: SlingOptions): Promise<
 			taskId: taskId,
 		});
-		// 8. Generate + write overlay CLAUDE.md
-		const agentDefPath = join(config.project.root, config.agents.baseDir, agentDef.file);
-		const baseDefinition = await Bun.file(agentDefPath).text();
+		try {
+			// 8. Generate + write overlay CLAUDE.md
+			const agentDefPath = join(config.project.root, config.agents.baseDir, agentDef.file);
+			const baseDefinition = await Bun.file(agentDefPath).text();
-		// 8a. Fetch file-scoped mulch expertise if mulch is enabled and files are provided
-		let mulchExpertise: string | undefined;
-		if (config.mulch.enabled && fileScope.length > 0) {
-			try {
-				const mulch = createMulchClient(config.project.root);
-				mulchExpertise = await mulch.prime(undefined, undefined, {
-					files: fileScope,
-					sortByScore: true,
-				});
-			} catch {
-				// Non-fatal: mulch expertise is supplementary context
-				mulchExpertise = undefined;
+			// 8a. Fetch file-scoped mulch expertise if mulch is enabled and files are provided
+			let mulchExpertise: string | undefined;
+			if (config.mulch.enabled && fileScope.length > 0) {
+				try {
+					const mulch = createMulchClient(config.project.root);
+					mulchExpertise = await mulch.prime(undefined, undefined, {
+						files: fileScope,
+						sortByScore: true,
+					});
+				} catch {
+					// Non-fatal: mulch expertise is supplementary context
+					mulchExpertise = undefined;
+				}
 			}
-		}
-		// Resolve runtime before overlayConfig so we can pass runtime.instructionPath
-		const runtime = getRuntime(opts.runtime, config, capability);
+			// Resolve runtime before overlayConfig so we can pass runtime.instructionPath
+			const runtime = getRuntime(opts.runtime, config, capability);
-		const overlayConfig: OverlayConfig = {
-			agentName: name,
-			taskId: taskId,
-			specPath: absoluteSpecPath,
-			branchName,
-			worktreePath,
-			fileScope,
-			mulchDomains: config.mulch.enabled
-				? inferDomainsFromFiles(fileScope, config.mulch.domains)
-				: [],
-			parentAgent: parentAgent,
-			depth,
-			canSpawn: agentDef.canSpawn,
-			capability,
-			baseDefinition,
-			mulchExpertise,
-			skipScout: skipScout && capability === "lead",
-			skipReview: opts.skipReview === true && capability === "lead",
-			maxAgentsOverride:
-				opts.dispatchMaxAgents !== undefined
-					? Number.parseInt(opts.dispatchMaxAgents, 10)
-					: undefined,
-			qualityGates: config.project.qualityGates,
-			trackerCli: trackerCliName(resolvedBackend),
-			trackerName: resolvedBackend,
-			instructionPath: runtime.instructionPath,
-		};
+			const overlayConfig: OverlayConfig = {
+				agentName: name,
+				taskId: taskId,
+				specPath: absoluteSpecPath,
+				branchName,
+				worktreePath,
+				fileScope,
+				mulchDomains: config.mulch.enabled
+					? inferDomainsFromFiles(fileScope, config.mulch.domains)
+					: [],
+				parentAgent: parentAgent,
+				depth,
+				canSpawn: agentDef.canSpawn,
+				capability,
+				baseDefinition,
+				mulchExpertise,
+				skipScout: skipScout && capability === "lead",
+				skipReview: opts.skipReview === true && capability === "lead",
+				maxAgentsOverride:
+					opts.dispatchMaxAgents !== undefined
+						? Number.parseInt(opts.dispatchMaxAgents, 10)
+						: undefined,
+				qualityGates: config.project.qualityGates,
+				trackerCli: trackerCliName(resolvedBackend),
+				trackerName: resolvedBackend,
+				instructionPath: runtime.instructionPath,
+			};
-		try {
 			await writeOverlay(worktreePath, overlayConfig, config.project.root, runtime.instructionPath);
-		} catch (err) {
-			// Clean up the orphaned worktree created in step 7 (overstory-p4st)
-			try {
-				const cleanupProc = Bun.spawn(["git", "worktree", "remove", "--force", worktreePath], {
-					cwd: config.project.root,
-					stdout: "pipe",
-					stderr: "pipe",
-				});
-				await cleanupProc.exited;
-			} catch {
-				// Best-effort cleanup; the original error is more important
-			}
-			throw err;
-		}
-		// 9. Resolve runtime + model (needed for deployConfig, spawn, and beacon)
-		const resolvedModel = resolveModel(config, manifest, capability, agentDef.model);
+			// 9. Resolve runtime + model (needed for deployConfig, spawn, and beacon)
+			const resolvedModel = resolveModel(config, manifest, capability, agentDef.model);
-		// 9a. Deploy hooks config (capability-specific guards)
-		await runtime.deployConfig(worktreePath, undefined, {
-			agentName: name,
-			capability,
-			worktreePath,
-			qualityGates: config.project.qualityGates,
-		});
-		// 9b. Send auto-dispatch mail so it exists when SessionStart hook fires.
-		// This eliminates the race where coordinator sends dispatch AFTER agent boots.
-		const dispatch = buildAutoDispatch({
-			agentName: name,
-			taskId,
-			capability,
-			specPath: absoluteSpecPath,
-			parentAgent,
-			instructionPath: runtime.instructionPath,
-		});
-		const mailStore = createMailStore(join(overstoryDir, "mail.db"));
-		try {
-			const mailClient = createMailClient(mailStore);
-			mailClient.send({
-				from: dispatch.from,
-				to: dispatch.to,
-				subject: dispatch.subject,
-				body: dispatch.body,
-				type: "dispatch",
-				priority: "normal",
+			// 9a. Deploy hooks config (capability-specific guards)
+			await runtime.deployConfig(worktreePath, undefined, {
+				agentName: name,
+				capability,
+				worktreePath,
+				qualityGates: config.project.qualityGates,
 			});
-		} finally {
-			mailStore.close();
-		}
-		// 10. Claim tracker issue
-		if (config.taskTracker.enabled && !skipTaskCheck) {
-			try {
-				await tracker.claim(taskId);
-			} catch {
-				// Non-fatal: issue may already be claimed
-			}
-		}
-		// 11. Create agent identity (if new)
-		const identityBaseDir = join(config.project.root, ".overstory", "agents");
-		const existingIdentity = await loadIdentity(identityBaseDir, name);
-		if (!existingIdentity) {
-			await createIdentity(identityBaseDir, {
-				name,
+			// 9b. Send auto-dispatch mail so it exists when SessionStart hook fires.
+			// This eliminates the race where coordinator sends dispatch AFTER agent boots.
+			const dispatch = buildAutoDispatch({
+				agentName: name,
+				taskId,
 				capability,
-				created: new Date().toISOString(),
-				sessionsCompleted: 0,
-				expertiseDomains: config.mulch.enabled ? config.mulch.domains : [],
-				recentTasks: [],
+				specPath: absoluteSpecPath,
+				parentAgent,
+				instructionPath: runtime.instructionPath,
 			});
-		}
+			const mailStore = createMailStore(join(overstoryDir, "mail.db"));
+			try {
+				const mailClient = createMailClient(mailStore);
+				mailClient.send({
+					from: dispatch.from,
+					to: dispatch.to,
+					subject: dispatch.subject,
+					body: dispatch.body,
+					type: "dispatch",
+					priority: "normal",
+				});
+			} finally {
+				mailStore.close();
+			}
-		// 11b. Save applied mulch record IDs for session-end outcome tracking.
-		// Written to .overstory/agents/{name}/applied-records.json so log.ts
-		// can append outcomes when the session completes.
-		if (mulchExpertise) {
-			const appliedRecords = extractMulchRecordIds(mulchExpertise);
-			if (appliedRecords.length > 0) {
-				const appliedRecordsPath = join(identityBaseDir, name, "applied-records.json");
-				const appliedData = { taskId, agentName: name, capability, records: appliedRecords };
+			// 10. Claim tracker issue
+			if (config.taskTracker.enabled && !skipTaskCheck) {
 				try {
-					await Bun.write(appliedRecordsPath, `${JSON.stringify(appliedData, null, "\t")}\n`);
+					await tracker.claim(taskId);
 				} catch {
-					// Non-fatal: outcome tracking is supplementary context
+					// Non-fatal: issue may already be claimed
 				}
 			}
-		}
-		// 11c. Spawn: headless runtimes bypass tmux entirely; tmux path is unchanged.
-		if (runtime.headless === true && runtime.buildDirectSpawn) {
-			const directEnv = {
-				...runtime.buildEnv(resolvedModel),
-				OVERSTORY_AGENT_NAME: name,
-				OVERSTORY_WORKTREE_PATH: worktreePath,
-			};
-			const argv = runtime.buildDirectSpawn({
-				cwd: worktreePath,
-				env: directEnv,
-				...(resolvedModel.isExplicitOverride ? { model: resolvedModel.model } : {}),
-				instructionPath: runtime.instructionPath,
-			});
+			// 11. Create agent identity (if new)
+			const identityBaseDir = join(config.project.root, ".overstory", "agents");
+			const existingIdentity = await loadIdentity(identityBaseDir, name);
+			if (!existingIdentity) {
+				await createIdentity(identityBaseDir, {
+					name,
+					capability,
+					created: new Date().toISOString(),
+					sessionsCompleted: 0,
+					expertiseDomains: config.mulch.enabled ? config.mulch.domains : [],
+					recentTasks: [],
+				});
+			}
-			// Create a timestamped log dir for this headless agent session.
-			// Always redirect stdout to a file. This prevents SIGPIPE death:
-			// ov sling exits after spawning, closing the pipe's read end.
-			// If stdout is a pipe, the agent dies on the next write (SIGPIPE).
-			// File writes have no such limit, and the agent survives the CLI exit.
-			//
-			// Note: RPC connection wiring is intentionally omitted here. The RPC pipe
-			// is only useful when the spawner stays alive to consume it. ov sling is
-			// a short-lived CLI — any connection created here dies with the process.
-			const logTimestamp = new Date().toISOString().replace(/[:.]/g, "-");
-			const agentLogDir = join(overstoryDir, "logs", name, logTimestamp);
-			mkdirSync(agentLogDir, { recursive: true });
-			const headlessProc = await spawnHeadlessAgent(argv, {
-				cwd: worktreePath,
-				env: { ...(process.env as Record<string, string>), ...directEnv },
-				stdoutFile: join(agentLogDir, "stdout.log"),
-				stderrFile: join(agentLogDir, "stderr.log"),
-			});
+			// 11b. Save applied mulch record IDs for session-end outcome tracking.
+			// Written to .overstory/agents/{name}/applied-records.json so log.ts
+			// can append outcomes when the session completes.
+			if (mulchExpertise) {
+				const appliedRecords = extractMulchRecordIds(mulchExpertise);
+				if (appliedRecords.length > 0) {
+					const appliedRecordsPath = join(identityBaseDir, name, "applied-records.json");
+					const appliedData = { taskId, agentName: name, capability, records: appliedRecords };
+					try {
+						await Bun.write(appliedRecordsPath, `${JSON.stringify(appliedData, null, "\t")}\n`);
+					} catch {
+						// Non-fatal: outcome tracking is supplementary context
+					}
+				}
+			}
-			// 13. Record session with empty tmuxSession (no tmux pane for headless agents).
-			const session: AgentSession = {
-				id: `session-${Date.now()}-${name}`,
-				agentName: name,
-				capability,
-				worktreePath,
-				branchName,
-				taskId: taskId,
-				tmuxSession: "",
-				state: "booting",
-				pid: headlessProc.pid,
-				parentAgent: parentAgent,
-				depth,
-				runId,
-				startedAt: new Date().toISOString(),
-				lastActivity: new Date().toISOString(),
-				escalationLevel: 0,
-				stalledSince: null,
-				transcriptPath: null,
-			};
-			store.upsert(session);
+			// 11c. Spawn: headless runtimes bypass tmux entirely; tmux path is unchanged.
+			if (runtime.headless === true && runtime.buildDirectSpawn) {
+				const directEnv = {
+					...runtime.buildEnv(resolvedModel),
+					OVERSTORY_AGENT_NAME: name,
+					OVERSTORY_WORKTREE_PATH: worktreePath,
+					OVERSTORY_TASK_ID: taskId,
+				};
+				const argv = runtime.buildDirectSpawn({
+					cwd: worktreePath,
+					env: directEnv,
+					...(resolvedModel.isExplicitOverride ? { model: resolvedModel.model } : {}),
+					instructionPath: runtime.instructionPath,
+				});
-			const runStore = createRunStore(join(overstoryDir, "sessions.db"));
-			try {
-				runStore.incrementAgentCount(runId);
-			} finally {
-				runStore.close();
-			}
+				// Create a timestamped log dir for this headless agent session.
+				// Always redirect stdout to a file. This prevents SIGPIPE death:
+				// ov sling exits after spawning, closing the pipe's read end.
+				// If stdout is a pipe, the agent dies on the next write (SIGPIPE).
+				// File writes have no such limit, and the agent survives the CLI exit.
+				//
+				// Note: RPC connection wiring is intentionally omitted here. The RPC pipe
+				// is only useful when the spawner stays alive to consume it. ov sling is
+				// a short-lived CLI — any connection created here dies with the process.
+				const logTimestamp = new Date().toISOString().replace(/[:.]/g, "-");
+				const agentLogDir = join(overstoryDir, "logs", name, logTimestamp);
+				mkdirSync(agentLogDir, { recursive: true });
+				const headlessProc = await spawnHeadlessAgent(argv, {
+					cwd: worktreePath,
+					env: { ...(process.env as Record<string, string>), ...directEnv },
+					stdoutFile: join(agentLogDir, "stdout.log"),
+					stderrFile: join(agentLogDir, "stderr.log"),
+				});
-			// 14. Output result (headless)
-			if (opts.json ?? false) {
-				jsonOutput("sling", {
+				// 13. Record session with empty tmuxSession (no tmux pane for headless agents).
+				const session: AgentSession = {
+					id: `session-${Date.now()}-${name}`,
 					agentName: name,
 					capability,
-					taskId,
-					branch: branchName,
-					worktree: worktreePath,
+					worktreePath,
+					branchName,
+					taskId: taskId,
 					tmuxSession: "",
+					state: "booting",
 					pid: headlessProc.pid,
-				});
+					parentAgent: parentAgent,
+					depth,
+					runId,
+					startedAt: new Date().toISOString(),
+					lastActivity: new Date().toISOString(),
+					escalationLevel: 0,
+					stalledSince: null,
+					transcriptPath: null,
+				};
+				store.upsert(session);
+				const runStore = createRunStore(join(overstoryDir, "sessions.db"));
+				try {
+					runStore.incrementAgentCount(runId);
+				} finally {
+					runStore.close();
+				}
+				// 14. Output result (headless)
+				if (opts.json ?? false) {
+					jsonOutput("sling", {
+						agentName: name,
+						capability,
+						taskId,
+						branch: branchName,
+						worktree: worktreePath,
+						tmuxSession: "",
+						pid: headlessProc.pid,
+					});
+				} else {
+					printSuccess("Agent launched (headless)", name);
+					process.stdout.write(`   Task:     ${taskId}\n`);
+					process.stdout.write(`   Branch:   ${branchName}\n`);
+					process.stdout.write(`   Worktree: ${worktreePath}\n`);
+					process.stdout.write(`   PID:      ${headlessProc.pid}\n`);
+				}
 			} else {
-				printSuccess("Agent launched (headless)", name);
-				process.stdout.write(`   Task:     ${taskId}\n`);
-				process.stdout.write(`   Branch:   ${branchName}\n`);
-				process.stdout.write(`   Worktree: ${worktreePath}\n`);
-				process.stdout.write(`   PID:      ${headlessProc.pid}\n`);
-			}
-		} else {
-			// 11c. Preflight: verify tmux is available before attempting session creation
-			await ensureTmuxAvailable();
-			// 12. Create tmux session running claude in interactive mode
-			const tmuxSessionName = `overstory-${config.project.name}-${name}`;
-			const spawnCmd = runtime.buildSpawnCommand({
-				model: resolvedModel.model,
-				permissionMode: "bypass",
-				cwd: worktreePath,
-				env: {
+				// 11c. Preflight: verify tmux is available before attempting session creation
+				await ensureTmuxAvailable();
+				// 12. Create tmux session running claude in interactive mode
+				const tmuxSessionName = `overstory-${config.project.name}-${name}`;
+				const spawnCmd = runtime.buildSpawnCommand({
+					model: resolvedModel.model,
+					permissionMode: "bypass",
+					cwd: worktreePath,
+					sharedWritableDirs: getSharedWritableDirs(config.project.root, capability),
+					env: {
+						...runtime.buildEnv(resolvedModel),
+						OVERSTORY_AGENT_NAME: name,
+						OVERSTORY_WORKTREE_PATH: worktreePath,
+						OVERSTORY_TASK_ID: taskId,
+					},
+				});
+				const pid = await createSession(tmuxSessionName, worktreePath, spawnCmd, {
 					...runtime.buildEnv(resolvedModel),
 					OVERSTORY_AGENT_NAME: name,
 					OVERSTORY_WORKTREE_PATH: worktreePath,
-				},
-			});
-			const pid = await createSession(tmuxSessionName, worktreePath, spawnCmd, {
-				...runtime.buildEnv(resolvedModel),
-				OVERSTORY_AGENT_NAME: name,
-				OVERSTORY_WORKTREE_PATH: worktreePath,
-			});
-			// 13. Record session BEFORE sending the beacon so that hook-triggered
-			// updateLastActivity() can find the entry and transition booting->working.
-			// Without this, a race exists: hooks fire before the session is persisted,
-			// leaving the agent stuck in "booting" (overstory-036f).
-			const session: AgentSession = {
-				id: `session-${Date.now()}-${name}`,
-				agentName: name,
-				capability,
-				worktreePath,
-				branchName,
-				taskId: taskId,
-				tmuxSession: tmuxSessionName,
-				state: "booting",
-				pid,
-				parentAgent: parentAgent,
-				depth,
-				runId,
-				startedAt: new Date().toISOString(),
-				lastActivity: new Date().toISOString(),
-				escalationLevel: 0,
-				stalledSince: null,
-				transcriptPath: null,
-			};
+					OVERSTORY_TASK_ID: taskId,
+				});
-			store.upsert(session);
+				// 13. Record session BEFORE sending the beacon so that hook-triggered
+				// updateLastActivity() can find the entry and transition booting->working.
+				// Without this, a race exists: hooks fire before the session is persisted,
+				// leaving the agent stuck in "booting" (overstory-036f).
+				const session: AgentSession = {
+					id: `session-${Date.now()}-${name}`,
+					agentName: name,
+					capability,
+					worktreePath,
+					branchName,
+					taskId: taskId,
+					tmuxSession: tmuxSessionName,
+					state: "booting",
+					pid,
+					parentAgent: parentAgent,
+					depth,
+					runId,
+					startedAt: new Date().toISOString(),
+					lastActivity: new Date().toISOString(),
+					escalationLevel: 0,
+					stalledSince: null,
+					transcriptPath: null,
+				};
+				store.upsert(session);
+				// Increment agent count for the run
+				const runStore = createRunStore(join(overstoryDir, "sessions.db"));
+				try {
+					runStore.incrementAgentCount(runId);
+				} finally {
+					runStore.close();
+				}
-			// Increment agent count for the run
-			const runStore = createRunStore(join(overstoryDir, "sessions.db"));
-			try {
-				runStore.incrementAgentCount(runId);
-			} finally {
-				runStore.close();
-			}
+				// 13b. Give slow shells time to finish initializing before polling for TUI readiness.
+				const shellDelay = config.runtime?.shellInitDelayMs ?? 0;
+				if (shellDelay > 0) {
+					await Bun.sleep(shellDelay);
+				}
-			// 13b. Give slow shells time to finish initializing before polling for TUI readiness.
-			const shellDelay = config.runtime?.shellInitDelayMs ?? 0;
-			if (shellDelay > 0) {
-				await Bun.sleep(shellDelay);
-			}
+				// Wait for Claude Code TUI to render before sending input.
+				// Polling capture-pane is more reliable than a fixed sleep because
+				// TUI init time varies by machine load and model state.
+				const tuiReady = await waitForTuiReady(tmuxSessionName, (content) =>
+					runtime.detectReady(content),
+				);
+				if (!tuiReady) {
+					const alive = await isSessionAlive(tmuxSessionName);
+					store.updateState(name, "completed");
+					if (alive) {
+						await killSession(tmuxSessionName);
+						throw new AgentError(
+							`Agent tmux session "${tmuxSessionName}" did not become ready during startup. The runtime may still be waiting on an interactive dialog or initializing too slowly.`,
+							{ agentName: name },
+						);
+					}
-			// Wait for Claude Code TUI to render before sending input.
-			// Polling capture-pane is more reliable than a fixed sleep because
-			// TUI init time varies by machine load and model state.
-			await waitForTuiReady(tmuxSessionName, (content) => runtime.detectReady(content));
-			// Buffer for the input handler to attach after initial render
-			await Bun.sleep(1_000);
+					const sessionState = await checkSessionState(tmuxSessionName);
+					const detail =
+						sessionState === "no_server"
+							? "The tmux server is no longer running. It may have crashed or been killed externally."
+							: "The agent process may have crashed or exited immediately before the TUI became ready.";
+					throw new AgentError(
+						`Agent tmux session "${tmuxSessionName}" died during startup. ${detail}`,
+						{ agentName: name },
+					);
+				}
+				// Buffer for the input handler to attach after initial render
+				await Bun.sleep(1_000);
-			const beacon = buildBeacon({
-				agentName: name,
-				capability,
-				taskId,
-				parentAgent,
-				depth,
-				instructionPath: runtime.instructionPath,
-			});
-			await sendKeys(tmuxSessionName, beacon);
-			// 13c. Follow-up Enters with increasing delays to ensure submission.
-			// Claude Code's TUI may consume early Enters during late initialization
-			// (overstory-yhv6). An Enter on an empty input line is harmless.
-			for (const delay of [1_000, 2_000, 3_000, 5_000]) {
-				await Bun.sleep(delay);
-				await sendKeys(tmuxSessionName, "");
-			}
+				const beacon = buildBeacon({
+					agentName: name,
+					capability,
+					taskId,
+					parentAgent,
+					depth,
+					instructionPath: runtime.instructionPath,
+				});
+				await sendKeys(tmuxSessionName, beacon);
+				// 13c. Follow-up Enters with increasing delays to ensure submission.
+				// Claude Code's TUI may consume early Enters during late initialization
+				// (overstory-yhv6). An Enter on an empty input line is harmless.
+				for (const delay of [1_000, 2_000, 3_000, 5_000]) {
+					await Bun.sleep(delay);
+					await sendKeys(tmuxSessionName, "");
+				}
-			// 13d. Verify beacon was received — if pane still shows the welcome
-			// screen (detectReady returns "ready"), resend the beacon. Claude Code's TUI
-			// sometimes consumes the Enter keystroke during late initialization, swallowing
-			// the beacon text entirely (overstory-3271).
-			//
-			// Skipped for runtimes that return false from requiresBeaconVerification().
-			// Pi's TUI idle and processing states are indistinguishable via detectReady
-			// (both show "pi v..." header and the token-usage status bar), so the loop
-			// would incorrectly conclude the beacon was not received and spam duplicate
-			// startup messages.
-			const needsVerification =
-				!runtime.requiresBeaconVerification || runtime.requiresBeaconVerification();
-			if (needsVerification) {
-				const verifyAttempts = 5;
-				for (let v = 0; v < verifyAttempts; v++) {
-					await Bun.sleep(2_000);
-					const paneContent = await capturePaneContent(tmuxSessionName);
-					if (paneContent) {
-						const readyState = runtime.detectReady(paneContent);
-						if (readyState.phase !== "ready") {
-							break; // Agent is processing — beacon was received
+				// 13d. Verify beacon was received — if pane still shows the welcome
+				// screen (detectReady returns "ready"), resend the beacon. Claude Code's TUI
+				// sometimes consumes the Enter keystroke during late initialization, swallowing
+				// the beacon text entirely (overstory-3271).
+				//
+				// Skipped for runtimes that return false from requiresBeaconVerification().
+				// Pi's TUI idle and processing states are indistinguishable via detectReady
+				// (both show "pi v..." header and the token-usage status bar), so the loop
+				// would incorrectly conclude the beacon was not received and spam duplicate
+				// startup messages.
+				const needsVerification =
+					!runtime.requiresBeaconVerification || runtime.requiresBeaconVerification();
+				if (needsVerification) {
+					const verifyAttempts = 5;
+					for (let v = 0; v < verifyAttempts; v++) {
+						await Bun.sleep(2_000);
+						const paneContent = await capturePaneContent(tmuxSessionName);
+						if (paneContent) {
+							const readyState = runtime.detectReady(paneContent);
+							if (readyState.phase !== "ready") {
+								break; // Agent is processing — beacon was received
+							}
 						}
+						// Still at welcome/idle screen — resend beacon
+						await sendKeys(tmuxSessionName, beacon);
+						await Bun.sleep(1_000);
+						await sendKeys(tmuxSessionName, ""); // Follow-up Enter
 					}
-					// Still at welcome/idle screen — resend beacon
-					await sendKeys(tmuxSessionName, beacon);
-					await Bun.sleep(1_000);
-					await sendKeys(tmuxSessionName, ""); // Follow-up Enter
 				}
-			}
-			// 14. Output result
-			const output = {
-				agentName: name,
-				capability,
-				taskId,
-				branch: branchName,
-				worktree: worktreePath,
-				tmuxSession: tmuxSessionName,
-				pid,
-			};
-			if (opts.json ?? false) {
-				jsonOutput("sling", output);
-			} else {
-				printSuccess("Agent launched", name);
-				process.stdout.write(`   Task:     ${taskId}\n`);
-				process.stdout.write(`   Branch:   ${branchName}\n`);
-				process.stdout.write(`   Worktree: ${worktreePath}\n`);
-				process.stdout.write(`   Tmux:     ${tmuxSessionName}\n`);
-				process.stdout.write(`   PID:      ${pid}\n`);
+				// 14. Output result
+				const output = {
+					agentName: name,
+					capability,
+					taskId,
+					branch: branchName,
+					worktree: worktreePath,
+					tmuxSession: tmuxSessionName,
+					pid,
+				};
+				if (opts.json ?? false) {
+					jsonOutput("sling", output);
+				} else {
+					printSuccess("Agent launched", name);
+					process.stdout.write(`   Task:     ${taskId}\n`);
+					process.stdout.write(`   Branch:   ${branchName}\n`);
+					process.stdout.write(`   Worktree: ${worktreePath}\n`);
+					process.stdout.write(`   Tmux:     ${tmuxSessionName}\n`);
+					process.stdout.write(`   PID:      ${pid}\n`);
+				}
 			}
+		} catch (err) {
+			await rollbackWorktree(config.project.root, worktreePath, branchName);
+			throw err;
 		}
 	} finally {
 		store.close();