npm - @os-eco/overstory-cli - Versions diffs - 0.8.0 → 0.8.2 - Mend

@os-eco/overstory-cli 0.8.0 → 0.8.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (30) hide show

package/README.md +3 -1
package/package.json +1 -1
package/src/commands/dashboard.test.ts +86 -0
package/src/commands/dashboard.ts +8 -4
package/src/commands/feed.test.ts +8 -0
package/src/commands/inspect.test.ts +156 -1
package/src/commands/inspect.ts +19 -4
package/src/commands/replay.test.ts +8 -0
package/src/commands/sling.ts +218 -121
package/src/commands/status.test.ts +77 -0
package/src/commands/status.ts +6 -3
package/src/commands/stop.test.ts +134 -0
package/src/commands/stop.ts +41 -11
package/src/commands/trace.test.ts +8 -0
package/src/index.ts +1 -1
package/src/logging/theme.ts +4 -0
package/src/runtimes/connections.test.ts +74 -0
package/src/runtimes/connections.ts +34 -0
package/src/runtimes/registry.test.ts +1 -1
package/src/runtimes/registry.ts +2 -0
package/src/runtimes/sapling.test.ts +1237 -0
package/src/runtimes/sapling.ts +698 -0
package/src/runtimes/types.ts +45 -0
package/src/types.ts +5 -1
package/src/watchdog/daemon.ts +34 -0
package/src/watchdog/health.test.ts +102 -0
package/src/watchdog/health.ts +140 -69
package/src/worktree/process.test.ts +101 -0
package/src/worktree/process.ts +111 -0
package/src/worktree/tmux.ts +5 -0

package/src/runtimes/sapling.ts ADDED Viewed

@@ -0,0 +1,698 @@
+// Sapling runtime adapter for overstory's AgentRuntime interface.
+// Implements the AgentRuntime contract for the `sp` CLI (Sapling headless coding agent).
+//
+// Key characteristics:
+// - Headless: Sapling runs as a Bun subprocess (no tmux TUI)
+// - Instruction file: SAPLING.md (auto-read from worktree root)
+// - Communication: NDJSON event stream on stdout (--json)
+// - Guards: .sapling/guards.json (written by deployConfig from guard-rules.ts constants)
+// - Events: NDJSON stream on stdout (parsed for token usage and agent events)
+import { mkdir } from "node:fs/promises";
+import { dirname, join } from "node:path";
+import {
+	DANGEROUS_BASH_PATTERNS,
+	INTERACTIVE_TOOLS,
+	NATIVE_TEAM_TOOLS,
+	SAFE_BASH_PREFIXES,
+	WRITE_TOOLS,
+} from "../agents/guard-rules.ts";
+import { DEFAULT_QUALITY_GATES } from "../config.ts";
+import type { ResolvedModel } from "../types.ts";
+import type {
+	AgentEvent,
+	AgentRuntime,
+	ConnectionState,
+	DirectSpawnOpts,
+	HooksDef,
+	OverlayContent,
+	ReadyState,
+	RpcProcessHandle,
+	RuntimeConnection,
+	SpawnOpts,
+	TranscriptSummary,
+} from "./types.ts";
+/**
+ * Fallback map for bare model aliases when no ANTHROPIC_DEFAULT_*_MODEL env var is set.
+ * Used by buildDirectSpawn() to resolve short names to concrete model IDs.
+ *
+ * Keys are matched against `opts.model` exactly as given (no case folding).
+ * A model string that is not a key here is passed to `sp` unchanged.
+ */
+const SAPLING_ALIAS_FALLBACKS: Record<string, string> = {
+	haiku: "claude-haiku-4-5-20251001",
+	sonnet: "claude-sonnet-4-6-20251015",
+	opus: "claude-opus-4-6-20251015",
+};
+/**
+ * Bash patterns that modify files and require path boundary validation
+ * for implementation agents (builder/merger). Mirrors the constant in pi-guards.ts.
+ *
+ * Each entry is a regex fragment stored as a string (hence the doubled
+ * backslashes). The list is emitted verbatim as `bashGuards.fileModifyingPatterns`
+ * in .sapling/guards.json; matching is performed by the consumer of that file,
+ * not in this module.
+ */
+const FILE_MODIFYING_BASH_PATTERNS = [
+	// In-place stream edits.
+	"sed\\s+-i",
+	"sed\\s+--in-place",
+	// Output commands combined with a redirection.
+	"echo\\s+.*>",
+	"printf\\s+.*>",
+	"cat\\s+.*>",
+	"tee\\s",
+	// Filesystem mutation commands (word-boundary anchored).
+	"\\bmv\\s",
+	"\\bcp\\s",
+	"\\brm\\s",
+	"\\bmkdir\\s",
+	"\\btouch\\s",
+	"\\bchmod\\s",
+	"\\bchown\\s",
+	// Append redirection from any command.
+	">>",
+	"\\binstall\\s",
+	"\\brsync\\s",
+];
+/**
+ * Capabilities that must not modify project files (read-only mode).
+ *
+ * buildGuardsConfig() sets `readOnly: true` and populates `writeToolsBlocked`
+ * with WRITE_TOOLS for any capability in this set.
+ */
+const NON_IMPLEMENTATION_CAPABILITIES = new Set([
+	"scout",
+	"reviewer",
+	"lead",
+	"coordinator",
+	"supervisor",
+	"monitor",
+]);
+/**
+ * Coordination capabilities that get git add/commit whitelisted for metadata sync.
+ *
+ * Every member is also in NON_IMPLEMENTATION_CAPABILITIES; for these,
+ * buildGuardsConfig() appends "git add" and "git commit" to the safe Bash prefixes.
+ */
+const COORDINATION_CAPABILITIES = new Set(["coordinator", "supervisor", "monitor"]);
+/**
+ * Assemble the guard configuration that is serialized to .sapling/guards.json.
+ *
+ * The returned object packages overstory's guard-rules.ts constants together
+ * with the agent-specific HooksDef fields so the `sp` CLI can enforce them:
+ * - `pathBoundary`: the worktree directory that file writes must stay within.
+ * - `blockedTools`: NATIVE_TEAM_TOOLS + INTERACTIVE_TOOLS, for every agent.
+ * - `writeToolsBlocked`: WRITE_TOOLS for read-only capabilities, otherwise empty.
+ * - `bashGuards`: safe prefixes, the DANGEROUS_BASH_PATTERNS blocklist, and the
+ *   FILE_MODIFYING_BASH_PATTERNS list used for path-boundary checks.
+ * - `qualityGates`: commands the agent must pass before reporting completion
+ *   (falls back to DEFAULT_QUALITY_GATES when hooks carries none).
+ * - `eventConfig`: argv arrays that invoke `ov log` for activity tracking.
+ *
+ * Property insertion order is kept stable because the object is written out
+ * with JSON.stringify and the file is meant to be diff-friendly.
+ *
+ * @param hooks - Agent identity, capability, worktree path, and optional quality gates.
+ * @returns JSON-serializable guards configuration object.
+ */
+function buildGuardsConfig(hooks: HooksDef): Record<string, unknown> {
+	const effectiveGates = hooks.qualityGates ?? DEFAULT_QUALITY_GATES;
+	const readOnly = NON_IMPLEMENTATION_CAPABILITIES.has(hooks.capability);
+	// Coordination agents additionally need git add/commit for metadata sync.
+	const coordinationExtras = COORDINATION_CAPABILITIES.has(hooks.capability)
+		? ["git add", "git commit"]
+		: [];
+	// Quality gate commands are whitelisted so agents can always run them.
+	const gateCommands = effectiveGates.map((gate) => gate.command);
+	const safePrefixes: string[] = [...SAFE_BASH_PREFIXES, ...coordinationExtras, ...gateCommands];
+	// argv for an `ov log <event>` invocation attributed to this agent.
+	const logArgv = (event: string): string[] => ["ov", "log", event, "--agent", hooks.agentName];
+	return {
+		// Schema version for forward-compatibility.
+		version: 1,
+		// Agent identity (also embedded in the event tracking commands below).
+		agentName: hooks.agentName,
+		capability: hooks.capability,
+		// Directory that all file writes must stay within (the agent's worktree).
+		pathBoundary: hooks.worktreePath,
+		// True for non-implementation capabilities (scout, reviewer, lead, ...).
+		readOnly,
+		// Blocked for ALL agents: delegate via `ov sling`, escalate via `ov mail`.
+		blockedTools: [...NATIVE_TEAM_TOOLS, ...INTERACTIVE_TOOLS],
+		// Blocked only for read-only agents; empty for builder/merger.
+		writeToolsBlocked: readOnly ? [...WRITE_TOOLS] : [],
+		// Write/edit tools subject to path boundary enforcement (all agents).
+		writeToolNames: [...WRITE_TOOLS],
+		bashGuards: {
+			// Commands starting with one of these bypass the dangerous-pattern checks.
+			safePrefixes,
+			// Regex fragments blocked for non-implementation agents.
+			dangerousPatterns: DANGEROUS_BASH_PATTERNS,
+			// Regex fragments that trigger a path boundary check for implementation agents.
+			fileModifyingPatterns: FILE_MODIFYING_BASH_PATTERNS,
+		},
+		// Commands that must pass before the agent reports task completion.
+		qualityGates: effectiveGates.map(({ name, command, description }) => ({
+			name,
+			command,
+			description,
+		})),
+		// Lifecycle hooks as argv arrays (spawned directly, no shell interpolation).
+		eventConfig: {
+			// Before each tool executes.
+			onToolStart: logArgv("tool-start"),
+			// After each tool completes.
+			onToolEnd: logArgv("tool-end"),
+			// When the agent's work loop completes or the process exits.
+			onSessionEnd: logArgv("session-end"),
+		},
+	};
+}
+/**
+ * Pending JSON-RPC getState request waiting for a response.
+ *
+ * One entry exists per in-flight request id; it is removed when the request
+ * is answered, times out, fails to write, or the connection closes.
+ */
+interface PendingRequest {
+	/** Settles the getState() promise with the `result` of the matching response. */
+	resolve: (state: ConnectionState) => void;
+	/** Fails the getState() promise (timeout, write failure, or connection closed). */
+	reject: (err: Error) => void;
+	/** Per-request timeout handle; cleared as soon as the request settles another way. */
+	timer: ReturnType<typeof setTimeout>;
+}
+/**
+ * RPC connection to a running Sapling agent process.
+ *
+ * Communicates over stdin/stdout using a simple NDJSON protocol:
+ * - Fire-and-forget control messages (steer, followUp, abort) written as plain NDJSON.
+ * - getState() sends an `{ id, method }` request and waits for the matching response.
+ *
+ * A background reader (drainStdout) consumes stdout and routes responses
+ * (lines with a `jsonrpc` field and a numeric `id`) to the pending getState()
+ * waiter with that id. A response carrying an `error` member rejects the waiter;
+ * otherwise the waiter resolves with `result`. All other NDJSON lines are discarded.
+ *
+ * Once stdout ends or errors, or close() is called, the connection is marked
+ * closed: in-flight requests reject with "connection closed" and later
+ * getState() calls reject immediately instead of waiting for the timeout.
+ *
+ * Not exported — constructed only by SaplingRuntime.connect().
+ */
+class SaplingConnection implements RuntimeConnection {
+	private nextId = 0;
+	private readonly pending = new Map<number, PendingRequest>();
+	private closed = false;
+	private readonly proc: RpcProcessHandle;
+	private readonly timeoutMs: number;
+	/**
+	 * @param proc - Stdin/stdout handles of the agent subprocess.
+	 * @param timeoutMs - How long getState() waits for a response before rejecting.
+	 */
+	constructor(proc: RpcProcessHandle, timeoutMs = 5000) {
+		this.proc = proc;
+		this.timeoutMs = timeoutMs;
+		this.drainStdout();
+	}
+	/** Reject every in-flight request with `reason` and forget them. */
+	private rejectAllPending(reason: string): void {
+		for (const [, waiter] of this.pending) {
+			clearTimeout(waiter.timer);
+			waiter.reject(new Error(reason));
+		}
+		this.pending.clear();
+	}
+	/** Render the `error` member of a response as a human-readable string. */
+	private static describeRpcError(error: unknown): string {
+		if (typeof error === "object" && error !== null) {
+			const message = (error as Record<string, unknown>).message;
+			if (typeof message === "string" && message) return message;
+		}
+		return typeof error === "string" ? error : JSON.stringify(error);
+	}
+	/**
+	 * Handle one stdout line: route it to a pending waiter if it is a response,
+	 * otherwise drop it. Never throws, so a single bad line cannot stop the reader.
+	 */
+	private routeLine(line: string): void {
+		const trimmed = line.trim();
+		if (!trimmed) return;
+		let parsed: unknown;
+		try {
+			parsed = JSON.parse(trimmed);
+		} catch {
+			// Skip malformed lines — partial writes or non-JSON debug output
+			return;
+		}
+		// Valid JSON that is not an object (e.g. `null`, `42`) cannot be a response.
+		// Without this guard a literal `null` line would throw on property access.
+		if (typeof parsed !== "object" || parsed === null) return;
+		const msg = parsed as Record<string, unknown>;
+		// Responses must have a jsonrpc field and a numeric id; everything else is an event.
+		if (msg.jsonrpc === undefined || typeof msg.id !== "number") return;
+		const waiter = this.pending.get(msg.id);
+		// Unknown id: the request already timed out or was never ours.
+		if (!waiter) return;
+		clearTimeout(waiter.timer);
+		this.pending.delete(msg.id);
+		if (msg.error !== undefined && msg.error !== null) {
+			// Error responses carry no usable result — surface them as a rejection.
+			waiter.reject(
+				new Error(`getState failed: ${SaplingConnection.describeRpcError(msg.error)}`),
+			);
+			return;
+		}
+		waiter.resolve(msg.result as ConnectionState);
+	}
+	/**
+	 * Background reader: consumes stdout, routes responses to pending waiters.
+	 * Follows the same buffer/split pattern as parseEvents().
+	 * On stream end or error, marks the connection closed and rejects all pending requests.
+	 */
+	private drainStdout(): void {
+		const reader = this.proc.stdout.getReader();
+		const decoder = new TextDecoder();
+		let buffer = "";
+		const read = async (): Promise<void> => {
+			try {
+				while (true) {
+					const { done, value } = await reader.read();
+					if (done) break;
+					buffer += decoder.decode(value, { stream: true });
+					const lines = buffer.split("\n");
+					// Last element is either empty or an incomplete line — keep it buffered.
+					buffer = lines.pop() ?? "";
+					for (const line of lines) {
+						this.routeLine(line);
+					}
+				}
+				// Flush remaining buffer on clean stream end
+				if (buffer.trim()) {
+					this.routeLine(buffer);
+				}
+			} catch {
+				// Stream error — fall through to reject all pending
+			} finally {
+				reader.releaseLock();
+				// No response can ever arrive after this point, so fail fast from now on.
+				this.closed = true;
+				this.rejectAllPending("connection closed");
+			}
+		};
+		// Fire-and-forget background reader
+		read().catch(() => {
+			// Errors are handled in the finally block above
+		});
+	}
+	/** Write a JSON message + newline to stdin. */
+	private writeMsg(msg: Record<string, unknown>): void {
+		const line = `${JSON.stringify(msg)}\n`;
+		const result = this.proc.stdin.write(line);
+		if (result instanceof Promise) {
+			result.catch(() => {
+				// Fire-and-forget write errors are non-fatal for control messages
+			});
+		}
+	}
+	/** Send a steering prompt to the running agent (fire-and-forget). */
+	async sendPrompt(text: string): Promise<void> {
+		this.writeMsg({ method: "steer", params: { content: text } });
+	}
+	/** Send a follow-up message to the running agent (fire-and-forget). */
+	async followUp(text: string): Promise<void> {
+		this.writeMsg({ method: "followUp", params: { content: text } });
+	}
+	/** Ask the running agent to abort (fire-and-forget). */
+	async abort(): Promise<void> {
+		this.writeMsg({ method: "abort" });
+	}
+	/**
+	 * Request the agent's current state.
+	 *
+	 * @returns The `result` of the matching response.
+	 * Rejects with "connection closed" if the connection is (or becomes) closed,
+	 * "getState timed out" if no response arrives within the timeout,
+	 * "write failed" if the request could not be written, or
+	 * "getState failed: ..." if the agent answered with an error response.
+	 */
+	getState(): Promise<ConnectionState> {
+		if (this.closed) {
+			return Promise.reject(new Error("connection closed"));
+		}
+		const id = this.nextId++;
+		return new Promise<ConnectionState>((resolve, reject) => {
+			const timer = setTimeout(() => {
+				this.pending.delete(id);
+				reject(new Error("getState timed out"));
+			}, this.timeoutMs);
+			this.pending.set(id, { resolve, reject, timer });
+			// On write failure, clean up the pending entry so neither the timer
+			// nor the map entry outlives the request.
+			const failWrite = (): void => {
+				clearTimeout(timer);
+				this.pending.delete(id);
+				reject(new Error("write failed"));
+			};
+			try {
+				const line = `${JSON.stringify({ id, method: "getState" })}\n`;
+				const result = this.proc.stdin.write(line);
+				if (result instanceof Promise) {
+					result.catch(failWrite);
+				}
+			} catch {
+				// write() may also throw synchronously (e.g. stdin already closed).
+				failWrite();
+			}
+		});
+	}
+	/** Mark the connection closed and reject every in-flight getState() request. */
+	close(): void {
+		this.closed = true;
+		this.rejectAllPending("connection closed");
+	}
+}
+/**
+ * Sapling runtime adapter.
+ *
+ * Implements AgentRuntime for the `sp` CLI (Sapling headless coding agent).
+ * Sapling workers run as headless Bun subprocesses — they communicate via
+ * NDJSON on stdin/stdout rather than a TUI in a tmux pane. This means the
+ * tmux lifecycle methods (buildSpawnCommand, detectReady, requiresBeaconVerification)
+ * are not used on the normal path: the orchestrator checks
+ * `runtime.headless === true` and takes the direct-spawn code path instead.
+ *
+ * Instructions are delivered via `SAPLING.md` in the worktree root.
+ * Guard configuration is written to `.sapling/guards.json` by deployConfig().
+ *
+ * Hardware impact: Sapling workers use 60–120 MB RAM vs 250–400 MB for TUI agents,
+ * enabling 4–6× more concurrent workers on a typical developer machine.
+ */
+export class SaplingRuntime implements AgentRuntime {
+	/** Unique identifier for this runtime. */
+	readonly id = "sapling";
+	/** Relative path to the instruction file within a worktree. */
+	readonly instructionPath = "SAPLING.md";
+	/**
+	 * Whether this runtime is headless (no tmux, direct subprocess).
+	 * Headless runtimes bypass all tmux session management and use Bun.spawn directly.
+	 */
+	readonly headless = true;
+	/** Wrap a value in single quotes for POSIX shells, escaping embedded single quotes. */
+	private static shellQuote(value: string): string {
+		return `'${value.replace(/'/g, "'\\''")}'`;
+	}
+	/**
+	 * Parse one NDJSON line into an AgentEvent.
+	 *
+	 * @returns The parsed event, or undefined for blank lines, malformed JSON,
+	 * and JSON values that are not objects (e.g. `null`, numbers, strings).
+	 */
+	private static parseEventLine(line: string): AgentEvent | undefined {
+		const trimmed = line.trim();
+		if (!trimmed) return undefined;
+		let parsed: unknown;
+		try {
+			parsed = JSON.parse(trimmed);
+		} catch {
+			// Skip malformed lines — partial writes or debug output.
+			return undefined;
+		}
+		if (typeof parsed !== "object" || parsed === null) return undefined;
+		return parsed as AgentEvent;
+	}
+	/**
+	 * Build the shell command string to spawn a Sapling agent in a tmux pane.
+	 *
+	 * This method exists for the TUI fallback path (e.g., `ov sling --runtime sapling`
+	 * on a host that has tmux). Under normal operation, Sapling is headless and
+	 * buildDirectSpawn() is used instead.
+	 *
+	 * Maps SpawnOpts to `sp run` flags:
+	 * - `model` → `--model <model>` (single-quoted only if it contains characters
+	 *   outside `[A-Za-z0-9_.:/@-]`, so ordinary model names appear verbatim)
+	 * - `appendSystemPromptFile` → prepended via `$(cat ...)` shell expansion
+	 * - `appendSystemPrompt` → appended inline
+	 * - `permissionMode` is accepted but NOT mapped — Sapling enforces security
+	 *   via .sapling/guards.json rather than permission flags.
+	 *
+	 * @param opts - Spawn options (model, appendSystemPrompt; permissionMode ignored)
+	 * @returns Shell command string suitable for tmux new-session -c
+	 */
+	buildSpawnCommand(opts: SpawnOpts): string {
+		// The result is interpreted by a shell, so a model string with spaces or
+		// metacharacters must not be interpolated raw.
+		const model = /^[\w.:\/@-]+$/.test(opts.model)
+			? opts.model
+			: SaplingRuntime.shellQuote(opts.model);
+		let cmd = `sp run --model ${model} --json`;
+		if (opts.appendSystemPromptFile) {
+			// Read role definition from file at shell expansion time — avoids tmux
+			// IPC message size limits. Append the "read SAPLING.md" instruction.
+			const quotedFile = SaplingRuntime.shellQuote(opts.appendSystemPromptFile);
+			cmd += ` "$(cat ${quotedFile})"' Read SAPLING.md for your task assignment and begin immediately.'`;
+		} else if (opts.appendSystemPrompt) {
+			// Inline role definition + instruction to read SAPLING.md.
+			const prompt = `${opts.appendSystemPrompt}\n\nRead SAPLING.md for your task assignment and begin immediately.`;
+			cmd += ` ${SaplingRuntime.shellQuote(prompt)}`;
+		} else {
+			cmd += ` 'Read SAPLING.md for your task assignment and begin immediately.'`;
+		}
+		return cmd;
+	}
+	/**
+	 * Build the argv array for a headless one-shot Sapling invocation.
+	 *
+	 * Returns an argv array suitable for `Bun.spawn()`. The `sp print` subcommand
+	 * processes a prompt and exits, printing the result to stdout.
+	 *
+	 * Used by merge/resolver.ts (AI-assisted conflict resolution) and
+	 * watchdog/triage.ts (AI-assisted failure classification).
+	 *
+	 * @param prompt - The prompt to pass as the argument
+	 * @param model - Optional model override
+	 * @returns Argv array for Bun.spawn
+	 */
+	buildPrintCommand(prompt: string, model?: string): string[] {
+		const cmd = ["sp", "print"];
+		if (model !== undefined) {
+			cmd.push("--model", model);
+		}
+		cmd.push(prompt);
+		return cmd;
+	}
+	/**
+	 * Build the argv array for Bun.spawn() to launch a Sapling agent subprocess.
+	 *
+	 * Returns an argv array that starts the Sapling agent with NDJSON event output. The agent
+	 * reads its instructions from the file at `opts.instructionPath`, processes
+	 * the task, emits NDJSON events on stdout, and exits on completion.
+	 *
+	 * Model resolution order:
+	 * 1. `opts.env["ANTHROPIC_DEFAULT_<MODEL>_MODEL"]` (model upper-cased), if set.
+	 * 2. SAPLING_ALIAS_FALLBACKS for bare aliases (haiku/sonnet/opus).
+	 * 3. `opts.model` unchanged.
+	 *
+	 * @param opts - Direct spawn options (cwd, env, model, instructionPath)
+	 * @returns Argv array for Bun.spawn — do not shell-interpolate
+	 */
+	buildDirectSpawn(opts: DirectSpawnOpts): string[] {
+		// Resolve the actual model name: if this is an alias (e.g. "sonnet") routed
+		// through a gateway, the real model ID is in the env vars. Sapling passes
+		// --model directly to the SDK, so it needs the actual model ID, not the alias.
+		let model = opts.model;
+		let resolved = false;
+		if (opts.env) {
+			const aliasKey = `ANTHROPIC_DEFAULT_${model.toUpperCase()}_MODEL`;
+			const envResolved = opts.env[aliasKey];
+			if (envResolved) {
+				model = envResolved;
+				resolved = true;
+			}
+		}
+		// Fallback: bare aliases (haiku/sonnet/opus) with no gateway env var → concrete model ID.
+		if (!resolved) {
+			const fallback = SAPLING_ALIAS_FALLBACKS[model];
+			if (fallback !== undefined) {
+				model = fallback;
+			}
+		}
+		return [
+			"sp",
+			"run",
+			"--model",
+			model,
+			"--json",
+			"--cwd",
+			opts.cwd,
+			"--system-prompt-file",
+			opts.instructionPath,
+			"Read SAPLING.md for your task assignment and begin immediately.",
+		];
+	}
+	/**
+	 * Deploy per-agent instructions and guard configuration to a worktree.
+	 *
+	 * Writes the overlay content to `SAPLING.md` in the worktree root.
+	 * Also writes `.sapling/guards.json` with the full guard configuration
+	 * derived from `hooks` — translating overstory guard-rules.ts constants
+	 * into JSON-serializable form for the `sp` CLI to enforce.
+	 *
+	 * @param worktreePath - Absolute path to the agent's git worktree
+	 * @param overlay - Overlay content to write as SAPLING.md, or undefined for hooks-only deployment
+	 * @param hooks - Agent identity, capability, and quality gates for guard config
+	 */
+	async deployConfig(
+		worktreePath: string,
+		overlay: OverlayContent | undefined,
+		hooks: HooksDef,
+	): Promise<void> {
+		// Write SAPLING.md instruction file (only when overlay is provided).
+		if (overlay) {
+			const saplingPath = join(worktreePath, this.instructionPath);
+			await mkdir(dirname(saplingPath), { recursive: true });
+			await Bun.write(saplingPath, overlay.content);
+		}
+		// Always write .sapling/guards.json — even when overlay is undefined
+		// (hooks-only deployment for coordinator/supervisor/monitor).
+		const guardsPath = join(worktreePath, ".sapling", "guards.json");
+		await mkdir(dirname(guardsPath), { recursive: true });
+		await Bun.write(guardsPath, `${JSON.stringify(buildGuardsConfig(hooks), null, 2)}\n`);
+	}
+	/**
+	 * Sapling is headless — always ready.
+	 *
+	 * Sapling runs as a direct subprocess that emits a `{"type":"ready"}` event
+	 * on stdout when initialization completes. Tmux-based readiness detection
+	 * is never used for Sapling workers.
+	 *
+	 * @param _paneContent - Captured tmux pane content (unused)
+	 * @returns Always `{ phase: "ready" }`
+	 */
+	detectReady(_paneContent: string): ReadyState {
+		return { phase: "ready" };
+	}
+	/**
+	 * Sapling does not require beacon verification/resend.
+	 *
+	 * The beacon verification loop exists because Claude Code's TUI sometimes
+	 * swallows the initial Enter during late initialization. Sapling is headless —
+	 * it communicates via stdin/stdout with no TUI startup delay.
+	 */
+	requiresBeaconVerification(): boolean {
+		return false;
+	}
+	/**
+	 * Parse a Sapling NDJSON transcript file into normalized token usage.
+	 *
+	 * Sapling emits NDJSON events on stdout during execution. The transcript
+	 * file records these events. Token usage is summed over every event that
+	 * carries a `usage` object with numeric `input_tokens` and/or `output_tokens`.
+	 * Model identity is taken from the first event with a non-empty `model` string.
+	 *
+	 * Lines that are not valid JSON, or that are JSON but not an object
+	 * (e.g. `null`), are skipped individually rather than failing the whole parse.
+	 *
+	 * Returns null if the file does not exist or cannot be read.
+	 *
+	 * @param path - Absolute path to the Sapling NDJSON transcript file
+	 * @returns Aggregated token usage, or null if unavailable
+	 */
+	async parseTranscript(path: string): Promise<TranscriptSummary | null> {
+		const file = Bun.file(path);
+		if (!(await file.exists())) {
+			return null;
+		}
+		try {
+			const text = await file.text();
+			const lines = text.split("\n").filter((l) => l.trim().length > 0);
+			let inputTokens = 0;
+			let outputTokens = 0;
+			let model = "";
+			for (const line of lines) {
+				let parsed: unknown;
+				try {
+					parsed = JSON.parse(line);
+				} catch {
+					// Skip malformed lines — partial writes during capture.
+					continue;
+				}
+				// A bare `null` (or other non-object value) is valid JSON but not an event;
+				// property access on it would throw and discard the entire transcript.
+				if (typeof parsed !== "object" || parsed === null) {
+					continue;
+				}
+				const event = parsed as Record<string, unknown>;
+				// Extract token usage from any event carrying a usage object.
+				if (typeof event.usage === "object" && event.usage !== null) {
+					const usage = event.usage as Record<string, unknown>;
+					if (typeof usage.input_tokens === "number") {
+						inputTokens += usage.input_tokens;
+					}
+					if (typeof usage.output_tokens === "number") {
+						outputTokens += usage.output_tokens;
+					}
+				}
+				// Capture model from the first event that carries it.
+				if (typeof event.model === "string" && event.model && !model) {
+					model = event.model;
+				}
+			}
+			return { inputTokens, outputTokens, model };
+		} catch {
+			return null;
+		}
+	}
+	/**
+	 * Parse NDJSON stdout from a Sapling agent subprocess into typed AgentEvent objects.
+	 *
+	 * Reads the ReadableStream from Bun.spawn() stdout, buffers partial lines,
+	 * and yields a typed AgentEvent for each complete JSON line. Malformed lines
+	 * (partial writes, non-JSON output) and non-object JSON values are silently skipped.
+	 *
+	 * The NDJSON format mirrors Pi's `--mode json` output so `ov feed`, `ov trace`,
+	 * and `ov costs` work without runtime-specific parsing.
+	 *
+	 * @param stream - ReadableStream<Uint8Array> from Bun.spawn stdout
+	 * @yields Parsed AgentEvent objects in emission order
+	 */
+	async *parseEvents(stream: ReadableStream<Uint8Array>): AsyncIterable<AgentEvent> {
+		const reader = stream.getReader();
+		const decoder = new TextDecoder();
+		let buffer = "";
+		try {
+			while (true) {
+				const result = await reader.read();
+				if (result.done) break;
+				buffer += decoder.decode(result.value, { stream: true });
+				// Split on newlines, keeping the remainder in the buffer.
+				const lines = buffer.split("\n");
+				// The last element is either empty or an incomplete line.
+				buffer = lines.pop() ?? "";
+				for (const line of lines) {
+					// Parsing happens outside any try/catch around `yield`, so only
+					// JSON errors are swallowed — never errors raised by the consumer.
+					const event = SaplingRuntime.parseEventLine(line);
+					if (event !== undefined) {
+						yield event;
+					}
+				}
+			}
+			// Flush any remaining buffer content after stream ends.
+			const trailing = SaplingRuntime.parseEventLine(buffer);
+			if (trailing !== undefined) {
+				yield trailing;
+			}
+		} finally {
+			reader.releaseLock();
+		}
+	}
+	/**
+	 * Establish a direct RPC connection to a running Sapling agent process.
+	 *
+	 * Returns a SaplingConnection that multiplexes getState() JSON-RPC 2.0
+	 * requests over stdin/stdout alongside the normal NDJSON event stream.
+	 *
+	 * @param process - Stdin/stdout handles from the spawned agent subprocess
+	 * @returns RuntimeConnection for RPC-based health checks and control
+	 */
+	connect(process: RpcProcessHandle): RuntimeConnection {
+		return new SaplingConnection(process);
+	}
+	/**
+	 * Build runtime-specific environment variables for spawning sapling.
+	 *
+	 * Translates overstory's gateway provider env vars into what sapling expects.
+	 * Worktrees don't have .env files (gitignored), so overstory must pass
+	 * provider credentials — same as it does for every other runtime.
+	 *
+	 * Key translations:
+	 * - ANTHROPIC_AUTH_TOKEN → ANTHROPIC_API_KEY (sapling SDK reads API_KEY)
+	 * - ANTHROPIC_BASE_URL passed through as-is
+	 * - SAPLING_BACKEND=sdk forced when gateway provider is configured
+	 * - ANTHROPIC_DEFAULT_*_MODEL entries passed through as-is
+	 * - CLAUDECODE, CLAUDE_CODE_SSE_PORT, CLAUDE_CODE_ENTRYPOINT set to ""
+	 *
+	 * @param model - Resolved model with optional provider env vars
+	 * @returns Environment variable map for sapling subprocess
+	 */
+	buildEnv(model: ResolvedModel): Record<string, string> {
+		const env: Record<string, string> = {
+			// Clear Claude Code session markers so sapling doesn't auto-detect
+			// SDK backend when spawned from a Claude Code session (CLAUDECODE=1).
+			CLAUDECODE: "",
+			CLAUDE_CODE_SSE_PORT: "",
+			CLAUDE_CODE_ENTRYPOINT: "",
+		};
+		const providerEnv = model.env ?? {};
+		// Gateway providers use ANTHROPIC_AUTH_TOKEN; sapling's SDK reads ANTHROPIC_API_KEY.
+		if (providerEnv.ANTHROPIC_AUTH_TOKEN) {
+			env.ANTHROPIC_API_KEY = providerEnv.ANTHROPIC_AUTH_TOKEN;
+		}
+		if (providerEnv.ANTHROPIC_BASE_URL) {
+			env.ANTHROPIC_BASE_URL = providerEnv.ANTHROPIC_BASE_URL;
+		}
+		// Force SDK backend when a gateway provider is configured.
+		if (providerEnv.ANTHROPIC_AUTH_TOKEN || providerEnv.ANTHROPIC_BASE_URL) {
+			env.SAPLING_BACKEND = "sdk";
+		}
+		// Forward model alias env vars so buildDirectSpawn can resolve gateway-routed models.
+		// resolveProviderEnv sets ANTHROPIC_DEFAULT_<ALIAS>_MODEL (e.g. ANTHROPIC_DEFAULT_SONNET_MODEL)
+		// to point to the real model ID behind the gateway. Without forwarding these,
+		// buildDirectSpawn cannot find the real model ID and falls back to the bare alias.
+		for (const [key, value] of Object.entries(providerEnv)) {
+			if (key.startsWith("ANTHROPIC_DEFAULT_") && key.endsWith("_MODEL")) {
+				env[key] = value;
+			}
+		}
+		return env;
+	}
+}