npm - @oh-my-pi/pi-coding-agent - Versions diffs - 15.11.4 → 15.11.7 - Mend

@oh-my-pi/pi-coding-agent 15.11.4 → 15.11.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (98)

package/CHANGELOG.md +82 -1
package/dist/cli.js +520 -451
package/dist/types/cli/bench-cli.d.ts +78 -0
package/dist/types/cli/usage-cli.d.ts +10 -1
package/dist/types/commands/bench.d.ts +29 -0
package/dist/types/commands/usage.d.ts +9 -0
package/dist/types/config/model-resolver.d.ts +3 -2
package/dist/types/config/settings-schema.d.ts +125 -3
package/dist/types/edit/renderer.d.ts +1 -0
package/dist/types/modes/components/oauth-selector.d.ts +10 -1
package/dist/types/modes/components/reset-usage-selector.d.ts +12 -0
package/dist/types/modes/components/session-selector.d.ts +1 -1
package/dist/types/modes/components/settings-selector.d.ts +8 -1
package/dist/types/modes/components/snapcompact-shape-preview.d.ts +31 -0
package/dist/types/modes/components/tool-execution.d.ts +18 -0
package/dist/types/modes/controllers/selector-controller.d.ts +1 -0
package/dist/types/modes/interactive-mode.d.ts +10 -0
package/dist/types/modes/session-observer-registry.d.ts +2 -0
package/dist/types/modes/setup-wizard/scenes/sign-in.d.ts +3 -0
package/dist/types/modes/setup-wizard/scenes/types.d.ts +10 -1
package/dist/types/modes/setup-wizard/scenes/web-search.d.ts +3 -0
package/dist/types/modes/types.d.ts +2 -0
package/dist/types/modes/utils/context-usage.d.ts +6 -1
package/dist/types/session/agent-session.d.ts +14 -1
package/dist/types/session/auth-storage.d.ts +1 -1
package/dist/types/session/codex-auto-reset.d.ts +107 -0
package/dist/types/session/snapcompact-inline.d.ts +107 -4
package/dist/types/slash-commands/helpers/reset-usage.d.ts +27 -0
package/dist/types/task/render.d.ts +1 -0
package/dist/types/tools/bash.d.ts +2 -0
package/dist/types/tools/eval-render.d.ts +1 -0
package/dist/types/tools/renderers.d.ts +13 -0
package/dist/types/tools/ssh.d.ts +1 -0
package/dist/types/tools/todo.d.ts +0 -11
package/package.json +11 -11
package/src/cli/bench-cli.ts +437 -0
package/src/cli/usage-cli.ts +187 -16
package/src/cli-commands.ts +1 -0
package/src/commands/bench.ts +42 -0
package/src/commands/usage.ts +8 -0
package/src/config/model-registry.ts +52 -5
package/src/config/model-resolver.ts +36 -5
package/src/config/settings-schema.ts +148 -3
package/src/config/settings.ts +9 -0
package/src/edit/renderer.ts +5 -0
package/src/hindsight/client.ts +26 -1
package/src/hindsight/state.ts +6 -2
package/src/internal-urls/docs-index.generated.ts +2 -2
package/src/mcp/transports/stdio.ts +81 -7
package/src/modes/components/oauth-selector.ts +67 -7
package/src/modes/components/reset-usage-selector.ts +161 -0
package/src/modes/components/session-selector.ts +8 -2
package/src/modes/components/settings-selector.ts +89 -47
package/src/modes/components/snapcompact-shape-preview-doc.md +11 -0
package/src/modes/components/snapcompact-shape-preview.ts +192 -0
package/src/modes/components/tool-execution.ts +26 -0
package/src/modes/components/transcript-container.ts +23 -1
package/src/modes/controllers/command-controller.ts +24 -1
package/src/modes/controllers/input-controller.ts +8 -6
package/src/modes/controllers/selector-controller.ts +72 -2
package/src/modes/interactive-mode.ts +83 -0
package/src/modes/session-observer-registry.ts +61 -3
package/src/modes/setup-wizard/index.ts +1 -0
package/src/modes/setup-wizard/scenes/glyph.ts +24 -6
package/src/modes/setup-wizard/scenes/providers.ts +36 -2
package/src/modes/setup-wizard/scenes/sign-in.ts +10 -1
package/src/modes/setup-wizard/scenes/theme.ts +28 -1
package/src/modes/setup-wizard/scenes/types.ts +10 -1
package/src/modes/setup-wizard/scenes/web-search.ts +22 -6
package/src/modes/setup-wizard/wizard-overlay.ts +38 -1
package/src/modes/theme/theme.ts +2 -2
package/src/modes/types.ts +2 -0
package/src/modes/utils/context-usage.ts +75 -1
package/src/prompts/bench.md +7 -0
package/src/prompts/system/snapcompact-context-frames-note.md +1 -0
package/src/prompts/system/snapcompact-context-stub.md +1 -0
package/src/prompts/system/snapcompact-toolresult-note.md +1 -1
package/src/prompts/tools/browser.md +33 -43
package/src/prompts/tools/eval.md +27 -50
package/src/prompts/tools/irc.md +29 -31
package/src/prompts/tools/read.md +31 -37
package/src/prompts/tools/todo.md +1 -2
package/src/sdk.ts +4 -2
package/src/session/agent-session.ts +136 -6
package/src/session/auth-storage.ts +3 -0
package/src/session/codex-auto-reset.ts +190 -0
package/src/session/snapcompact-inline.ts +404 -75
package/src/slash-commands/builtin-registry.ts +145 -8
package/src/slash-commands/helpers/context-report.ts +28 -1
package/src/slash-commands/helpers/reset-usage.ts +66 -0
package/src/slash-commands/helpers/usage-report.ts +12 -0
package/src/task/index.ts +30 -7
package/src/task/render.ts +34 -19
package/src/tools/bash.ts +3 -0
package/src/tools/eval-render.ts +4 -0
package/src/tools/renderers.ts +13 -0
package/src/tools/ssh.ts +3 -0
package/src/tools/todo.ts +8 -128

package/src/slash-commands/builtin-registry.ts CHANGED Viewed

@@ -2,6 +2,7 @@ import * as fs from "node:fs/promises";
 import * as os from "node:os";
 import * as path from "node:path";
 import { getOAuthProviders } from "@oh-my-pi/pi-ai/oauth";
+import { setNextRequestDebugPath } from "@oh-my-pi/pi-ai/utils/request-debug";
 import { Snowflake, setProjectDir } from "@oh-my-pi/pi-utils";
 import { $ } from "bun";
 import type { SettingPath, SettingValue } from "../config/settings";
@@ -21,7 +22,7 @@ import {
 } from "../extensibility/plugins/marketplace";
 import { resolveMemoryBackend } from "../memory-backend";
 import type { InteractiveModeContext } from "../modes/types";
-import type { FreshSessionResult } from "../session/agent-session";
+import type { AgentSession, FreshSessionResult } from "../session/agent-session";
 import { formatShakeSummary, type ShakeMode } from "../session/shake-types";
 import { getChangelogPath, parseChangelog } from "../utils/changelog";
 import { buildContextReportText } from "./helpers/context-report";
@@ -29,6 +30,7 @@ import { formatDuration } from "./helpers/format";
 import { createMarketplaceManager } from "./helpers/marketplace-manager";
 import { handleMcpAcp } from "./helpers/mcp";
 import { commandConsumed, errorMessage, parseSlashCommand, parseSubcommand, usage } from "./helpers/parse";
+import { describeRedeemOutcome, type ResetUsageAccount, toResetUsageAccounts } from "./helpers/reset-usage";
 import { handleSshAcp } from "./helpers/ssh";
 import { launchStatsDashboard, parseStatsDashboardArgs } from "./helpers/stats-dashboard";
 import { handleTodoAcp } from "./helpers/todo";
@@ -65,6 +67,95 @@ const shutdownHandlerTui = (_command: ParsedSlashCommand, runtime: TuiSlashComma
 	return commandConsumed();
 };
+/**
+ * Handle `/usage reset [target]`: list the saved Codex rate-limit resets per
+ * account, or spend one for a chosen account.
+ *
+ * With an empty `arg`, one line per account is printed (available count, or
+ * the account's error) followed by a usage hint. Otherwise `arg` is matched
+ * case-insensitively against the keyword "active" or an account's label,
+ * email, or account id, and one reset is redeemed for the first match.
+ *
+ * @param arg - Text following `reset`; trimmed before use.
+ * @param session - Session used to list and redeem reset credits.
+ * @param output - Sink that receives every user-facing message.
+ * @returns Resolves after the final message has been sent.
+ */
+async function handleUsageResetCommand(
+	arg: string,
+	session: AgentSession,
+	output: SlashCommandRuntime["output"],
+): Promise<void> {
+	let accounts: ResetUsageAccount[];
+	// A failure while listing is reported to the user instead of being thrown.
+	try {
+		accounts = toResetUsageAccounts(await session.listResetCredits());
+	} catch (error) {
+		await output(`Could not load saved resets: ${errorMessage(error)}`);
+		return;
+	}
+	if (accounts.length === 0) {
+		await output("No Codex accounts found. Use /login to add one.");
+		return;
+	}
+	const targetArg = arg.trim();
+	// No target given: print the per-account summary and stop.
+	if (!targetArg) {
+		const lines = ["Saved Codex rate-limit resets:"];
+		for (const account of accounts) {
+			const detail = account.error ? `unavailable (${account.error})` : `${account.availableCount} available`;
+			lines.push(`- ${account.label}: ${detail}${account.active ? " (active)" : ""}`);
+		}
+		lines.push("", "Spend one with `/usage reset <account email>` or `/usage reset active`.");
+		await output(lines.join("\n"));
+		return;
+	}
+	// Matching is case-insensitive; "active" selects the first account flagged active.
+	const wanted = targetArg.toLowerCase();
+	const target =
+		wanted === "active"
+			? accounts.find(account => account.active)
+			: accounts.find(
+					account =>
+						account.label.toLowerCase() === wanted ||
+						account.target.email?.toLowerCase() === wanted ||
+						account.target.accountId?.toLowerCase() === wanted,
+				);
+	if (!target) {
+		await output(`No Codex account matches "${targetArg}".`);
+		return;
+	}
+	// Skip the redeem call entirely when the listing shows nothing to spend.
+	if (target.availableCount <= 0) {
+		await output(`${target.label}: no saved resets to spend.`);
+		return;
+	}
+	// NOTE(review): unlike the listing call above, this await is not wrapped in
+	// try/catch, so a rejection propagates to the caller — confirm callers handle it.
+	const outcome = await session.redeemResetCredit(target.target);
+	await output(describeRedeemOutcome(outcome, target.label));
+}
+/** Usage line shown when `/debug` gets no subcommand, no path, or an unknown subcommand. */
+const DEBUG_DUMP_NEXT_REQUEST_USAGE = "Usage: /debug dump-next-request <path>";
+/**
+ * Turn a user-supplied dump target into an absolute path.
+ *
+ * A bare `~`, or a leading `~/` or `~\`, is replaced with `os.homedir()`. The
+ * result is then passed through `path.resolve(cwd, ...)`, so a relative target
+ * is anchored at `cwd` and an absolute one is kept. Other tilde forms such as
+ * `~user/...` are not expanded and are treated as ordinary relative paths.
+ *
+ * @param target - Path text as typed by the user.
+ * @param cwd - Directory that relative targets are resolved against.
+ * @returns The absolute dump path.
+ */
+function resolveDebugRequestDumpPath(target: string, cwd: string): string {
+	const expanded =
+		target === "~"
+			? os.homedir()
+			: target.startsWith("~/") || target.startsWith("~\\")
+				? path.join(os.homedir(), target.slice(2))
+				: target;
+	return path.resolve(cwd, expanded);
+}
+/**
+ * Dispatch the argument text of `/debug` to a subcommand.
+ *
+ * `dump-next-request`, `dump-request` and `next-request` are treated as the
+ * same verb: the remaining text is resolved to an absolute path, handed to
+ * `setNextRequestDebugPath`, and a confirmation is printed. An empty verb or a
+ * missing path prints the usage line; any other verb prints an "unknown
+ * subcommand" message. Every branch returns `commandConsumed()`.
+ *
+ * @param args - Text following `/debug`, split by `parseSubcommand`.
+ * @param cwd - Directory that a relative dump path is resolved against.
+ * @param output - Sink for user-facing messages.
+ * @returns The `commandConsumed()` result.
+ */
+async function handleDebugSubcommand(
+	args: string,
+	cwd: string,
+	output: (text: string) => Promise<void> | void,
+): Promise<SlashCommandResult> {
+	const { verb, rest } = parseSubcommand(args);
+	switch (verb) {
+		case "":
+			await output(DEBUG_DUMP_NEXT_REQUEST_USAGE);
+			return commandConsumed();
+		case "dump-next-request":
+		case "dump-request":
+		case "next-request": {
+			if (!rest) {
+				await output(DEBUG_DUMP_NEXT_REQUEST_USAGE);
+				return commandConsumed();
+			}
+			const requestPath = resolveDebugRequestDumpPath(rest, cwd);
+			// NOTE(review): presumably arms a dump of only the next provider request,
+			// as the message below states — the behavior lives in @oh-my-pi/pi-ai; confirm there.
+			setNextRequestDebugPath(requestPath);
+			await output(`Next AI provider request will be dumped to ${requestPath}`);
+			return commandConsumed();
+		}
+		default:
+			await output(`Unknown /debug subcommand "${verb}". ${DEBUG_DUMP_NEXT_REQUEST_USAGE}`);
+			return commandConsumed();
+	}
+}
 /** Parse the `/shake` subcommand into a {@link ShakeMode}; empty defaults to elide. */
 function parseShakeMode(args: string): ShakeMode | { error: string } {
 	const verb = args.trim().toLowerCase();
@@ -551,12 +642,41 @@ const BUILTIN_SLASH_COMMAND_REGISTRY: ReadonlyArray<SlashCommandSpec> = [
 		name: "usage",
 		description: "Show provider usage and limits",
 		acpDescription: "Show token usage",
-		handle: async (_command, runtime) => {
-			await runtime.output(await buildUsageReportText(runtime));
-			return commandConsumed();
+		acpInputHint: "[show|reset [account|active]]",
+		subcommands: [
+			{ name: "show", description: "Show provider usage and limits" },
+			{ name: "reset", description: "Spend a saved Codex rate-limit reset", usage: "[account|active]" },
+		],
+		allowArgs: true,
+		handle: async (command, runtime) => {
+			const { verb, rest } = parseSubcommand(command.args);
+			if (!verb || (verb === "show" && !rest)) {
+				await runtime.output(await buildUsageReportText(runtime));
+				return commandConsumed();
+			}
+			if (verb === "reset") {
+				await handleUsageResetCommand(rest, runtime.session, runtime.output);
+				return commandConsumed();
+			}
+			return usage("Usage: /usage [show|reset [account|active]]", runtime);
 		},
-		handleTui: async (_command, runtime) => {
-			await runtime.ctx.handleUsageCommand();
+		handleTui: async (command, runtime) => {
+			const { verb, rest } = parseSubcommand(command.args);
+			if (!verb || (verb === "show" && !rest)) {
+				await runtime.ctx.handleUsageCommand();
+				runtime.ctx.editor.setText("");
+				return;
+			}
+			if (verb === "reset") {
+				if (rest) {
+					await handleUsageResetCommand(rest, runtime.ctx.session, text => runtime.ctx.showStatus(text));
+				} else {
+					await runtime.ctx.showResetUsageSelector();
+				}
+				runtime.ctx.editor.setText("");
+				return;
+			}
+			runtime.ctx.showStatus("Usage: /usage [show|reset [account|active]]");
 			runtime.ctx.editor.setText("");
 		},
 	},
@@ -974,8 +1094,25 @@ const BUILTIN_SLASH_COMMAND_REGISTRY: ReadonlyArray<SlashCommandSpec> = [
 	{
 		name: "debug",
 		description: "Open debug tools selector",
-		handleTui: (_command, runtime) => {
-			runtime.ctx.showDebugSelector();
+		allowArgs: true,
+		subcommands: [
+			{
+				name: "dump-next-request",
+				description: "Dump the next AI provider HTTP request as JSON",
+				usage: "<path>",
+			},
+		],
+		handle: async (command, runtime) =>
+			handleDebugSubcommand(command.args, runtime.cwd, text => runtime.output(text)),
+		handleTui: async (command, runtime) => {
+			const args = command.args.trim();
+			if (args.length === 0) {
+				runtime.ctx.showDebugSelector();
+			} else {
+				await handleDebugSubcommand(args, runtime.ctx.sessionManager.getCwd(), text =>
+					runtime.ctx.showStatus(text),
+				);
+			}
 			runtime.ctx.editor.setText("");
 		},
 	},

package/src/slash-commands/helpers/context-report.ts CHANGED Viewed

@@ -9,7 +9,7 @@ import { renderAsciiBar } from "./format";
  */
 export function buildContextReportText(runtime: SlashCommandRuntime): string {
 	try {
-		const breakdown = computeContextBreakdown(runtime.session);
+		const breakdown = computeContextBreakdown(runtime.session, { snapcompactSavings: true });
 		if (breakdown.contextWindow <= 0) {
 			return "Context usage is unavailable: no model is selected for this session.";
 		}
@@ -30,6 +30,33 @@ export function buildContextReportText(runtime: SlashCommandRuntime): string {
 			const fraction = breakdown.freeTokens / breakdown.contextWindow;
 			lines.push(`  ${"Free".padEnd(16)} ${renderAsciiBar(fraction)}  ${breakdown.freeTokens} tokens`);
 		}
+		const snap = breakdown.snapcompact;
+		if (snap) {
+			if (!snap.visionCapable) {
+				lines.push("Snapcompact: inactive (model has no image input)");
+			} else {
+				lines.push("Snapcompact (estimated wire savings):");
+				if (snap.systemPrompt) {
+					const sp = snap.systemPrompt;
+					lines.push(
+						sp.applied
+							? `  System prompt: ${sp.textTokens} text tokens → ${sp.frames} frame${sp.frames === 1 ? "" : "s"} ≈ ${sp.imageTokens} tokens (saves ~${sp.savedTokens})`
+							: "  System prompt: stays text (no net savings)",
+					);
+				}
+				if (snap.toolResults) {
+					const tr = snap.toolResults;
+					lines.push(
+						tr.swapped > 0
+							? `  Tool results: ${tr.swapped} of ${tr.total} imaged, ${tr.textTokens} text tokens → ${tr.frames} frames ≈ ${tr.imageTokens} tokens (saves ~${tr.savedTokens})`
+							: `  Tool results: none imaged (${tr.total} in history)`,
+					);
+				}
+				if (snap.savedTokens > 0) {
+					lines.push(`  Estimated next request: ~${breakdown.usedTokens - snap.savedTokens} tokens on the wire`);
+				}
+			}
+		}
 		return lines.join("\n");
 	} catch {
 		const fallback = runtime.session.getContextUsage();

package/src/slash-commands/helpers/reset-usage.ts ADDED Viewed

@@ -0,0 +1,66 @@
+/**
+ * Shared helpers for the `/usage reset` command (TUI selector + ACP): turn the
+ * live per-account reset-credit status into selector rows, and map a redeem
+ * outcome code to a human message.
+ */
+import type { ResetCreditAccountStatus, ResetCreditRedeemOutcome, ResetCreditTarget } from "../../session/auth-storage";
+/** Provider id string for Codex; exported for other modules and not referenced in the code shown here. */
+export const CODEX_PROVIDER_ID = "openai-codex";
+/**
+ * One Codex account row for the reset-usage selector.
+ *
+ * Rows are produced by `toResetUsageAccounts` from `ResetCreditAccountStatus`
+ * values.
+ */
+export interface ResetUsageAccount {
+	/** Display label: the account email, else its account id, else the literal "account". */
+	label: string;
+	/** Saved resets redeemable for this account right now. */
+	availableCount: number;
+	/** Identifies the account when redeeming (credential id, account id, email). */
+	target: ResetCreditTarget;
+	/** Whether this is the session's active Codex account. */
+	active: boolean;
+	/** Set when this account could not be reached (token/list failure). */
+	error?: string;
+}
+/**
+ * Map live per-account reset status to selector rows.
+ *
+ * Rows are sorted with active accounts first, then by `availableCount`
+ * descending, then by `label` using `localeCompare`. Sorting runs on the array
+ * produced by `map`, so the `statuses` argument is not reordered.
+ *
+ * @param statuses - Per-account reset-credit status entries.
+ * @returns A new array of selector rows in display order.
+ */
+export function toResetUsageAccounts(statuses: ResetCreditAccountStatus[]): ResetUsageAccount[] {
+	return statuses
+		.map(status => ({
+			// Label falls back from email to account id to the literal "account".
+			label: status.email ?? status.accountId ?? "account",
+			availableCount: status.availableCount,
+			target: {
+				credentialId: status.credentialId,
+				accountId: status.accountId,
+				email: status.email,
+			} satisfies ResetCreditTarget,
+			active: status.active,
+			error: status.error,
+		}))
+		.sort((a, b) => {
+			if (a.active !== b.active) return a.active ? -1 : 1;
+			if (a.availableCount !== b.availableCount) return b.availableCount - a.availableCount;
+			return a.label.localeCompare(b.label);
+		});
+}
+/**
+ * Human-facing summary of a redeem outcome for status lines and ACP output.
+ *
+ * Switches on `outcome.code`. A code without a dedicated case falls through to
+ * a generic message that embeds the raw code.
+ *
+ * @param outcome - Redeem result; only its `code` is read here.
+ * @param label - Account label interpolated into the message.
+ * @returns The message text for the given outcome.
+ */
+export function describeRedeemOutcome(outcome: ResetCreditRedeemOutcome, label: string): string {
+	switch (outcome.code) {
+		case "reset":
+			return `Reset applied for ${label} — your rate-limit window has been refreshed.`;
+		case "already_redeemed":
+			return `${label}: that reset was already redeemed.`;
+		case "no_credit":
+			return `${label}: no saved resets available to spend.`;
+		case "nothing_to_reset":
+			return `${label}: nothing to reset right now — your limits aren't constrained, so no credit was spent.`;
+		case "no_account":
+			// Here the label is quoted as the term that failed to match, not used as a prefix.
+			return `Could not find a stored Codex account matching "${label}".`;
+		case "account_unavailable":
+			return `${label}: could not authenticate this account — try /login.`;
+		default:
+			return `${label}: reset did not apply (${outcome.code}).`;
+	}
+}

package/src/slash-commands/helpers/usage-report.ts CHANGED Viewed

@@ -54,6 +54,18 @@ function renderUsageReports(
 		const activeAccount = resolveActiveAccount?.(provider);
 		for (const report of providerReports) {
 			const inUse = reportMatchesActiveAccount(report, activeAccount);
+			const savedResets = report.resetCredits?.availableCount ?? 0;
+			if (savedResets > 0) {
+				const resetLabel =
+					typeof report.metadata?.email === "string"
+						? report.metadata.email
+						: typeof report.metadata?.accountId === "string"
+							? report.metadata.accountId
+							: "account";
+				lines.push(
+					`- ${resetLabel}: ${savedResets} saved rate-limit reset${savedResets === 1 ? "" : "s"} available — /usage reset to spend`,
+				);
+			}
 			if (report.limits.length === 0) {
 				const email = typeof report.metadata?.email === "string" ? report.metadata.email : "account";
 				lines.push(`- ${email}: no limits reported`);

package/src/task/index.ts CHANGED Viewed

@@ -698,7 +698,14 @@ export class TaskTool implements AgentTool<TaskToolSchemaInstance, TaskToolDetai
 					buildDetails("running", ownJobId) as unknown as Record<string, unknown>,
 				);
 				try {
-					const result = await this.#executeSync(toolCallId, spawnParams, runSignal, undefined, agentId);
+					const result = await this.#executeSync(
+						toolCallId,
+						spawnParams,
+						runSignal,
+						undefined,
+						agentId,
+						progress.index,
+					);
 					const finalText = result.content.find(part => part.type === "text")?.text ?? "(no output)";
 					const singleResult = result.details?.results[0];
 					// A missing result means the sync path failed at the tool level
@@ -781,7 +788,14 @@ export class TaskTool implements AgentTool<TaskToolSchemaInstance, TaskToolDetai
 		if (spawnItems.length === 1) {
 			await semaphore.acquire();
 			try {
-				return await this.#executeSync(toolCallId, spawnParamsFor(params, spawnItems[0]), signal, onUpdate);
+				return await this.#executeSync(
+					toolCallId,
+					spawnParamsFor(params, spawnItems[0]),
+					signal,
+					onUpdate,
+					undefined,
+					0,
+				);
 			} finally {
 				semaphore.release();
 			}
@@ -818,7 +832,14 @@ export class TaskTool implements AgentTool<TaskToolSchemaInstance, TaskToolDetai
 								}
 							}
 						: undefined;
-					return await this.#executeSync(toolCallId, spawnParamsFor(params, item), workerSignal, itemOnUpdate);
+					return await this.#executeSync(
+						toolCallId,
+						spawnParamsFor(params, item),
+						workerSignal,
+						itemOnUpdate,
+						undefined,
+						index,
+					);
 				} finally {
 					semaphore.release();
 				}
@@ -875,8 +896,9 @@ export class TaskTool implements AgentTool<TaskToolSchemaInstance, TaskToolDetai
 		signal?: AbortSignal,
 		onUpdate?: AgentToolUpdateCallback<TaskToolDetails>,
 		preAllocatedId?: string,
+		spawnIndex = 0,
 	): Promise<AgentToolResult<TaskToolDetails>> {
-		return this.#runSpawn(toolCallId, params, signal, onUpdate, preAllocatedId);
+		return this.#runSpawn(toolCallId, params, signal, onUpdate, preAllocatedId, spawnIndex);
 	}
 	/** Spawn a fresh subagent and run it to completion. */
@@ -886,6 +908,7 @@ export class TaskTool implements AgentTool<TaskToolSchemaInstance, TaskToolDetai
 		signal?: AbortSignal,
 		onUpdate?: AgentToolUpdateCallback<TaskToolDetails>,
 		preAllocatedId?: string,
+		spawnIndex = 0,
 	): Promise<AgentToolResult<TaskToolDetails>> {
 		const startTime = Date.now();
 		const { agents, projectAgentsDir } = await discoverAgents(this.session.cwd);
@@ -1070,7 +1093,7 @@ export class TaskTool implements AgentTool<TaskToolSchemaInstance, TaskToolDetai
 			// Progress tracking for the single agent
 			let latestProgress: AgentProgress = {
-				index: 0,
+				index: spawnIndex,
 				id: agentId,
 				agent: agentName,
 				agentSource: agent.source,
@@ -1120,7 +1143,7 @@ export class TaskTool implements AgentTool<TaskToolSchemaInstance, TaskToolDetai
 				context: sharedContext,
 				planReference,
 				description: params.description,
-				index: 0,
+				index: spawnIndex,
 				parentToolCallId: toolCallId,
 				id: agentId,
 				taskDepth,
@@ -1226,7 +1249,7 @@ export class TaskTool implements AgentTool<TaskToolSchemaInstance, TaskToolDetai
 				} catch (err) {
 					const message = err instanceof Error ? err.message : String(err);
 					return {
-						index: 0,
+						index: spawnIndex,
 						id: agentId,
 						agent: agent.name,
 						agentSource: agent.source,

package/src/task/render.ts CHANGED Viewed

@@ -165,7 +165,7 @@ function formatJsonScalar(value: unknown, _theme: Theme): string {
 	return "";
 }
-function formatTaskId(id: string): string {
+export function formatTaskId(id: string): string {
 	// Ids are name-based (e.g. "Anna", "Anna-2"); a "." separates nesting levels
 	// (e.g. "Anna.Bob"). Render the hierarchy with a ">" breadcrumb.
 	const segments = id.split(".");
@@ -627,7 +627,13 @@ function createMarkdownSectionRenderer(text: string, theme: Theme): AssignmentSe
  */
 export function renderCall(args: TaskParams, options: TaskRenderOptions, theme: Theme): Component {
 	const showIsolated = "isolated" in args && args.isolated === true;
-	const header = renderStatusLine({ icon: "pending", title: "Task", description: args.agent }, theme);
+	// Dispatch glyph from the first frame: spawning is non-blocking, so a
+	// pending/hourglass icon would misread the call as something the turn
+	// waits on.
+	const header = renderStatusLine(
+		{ iconOverride: theme.styledSymbol("tool.task", "accent"), title: "Task", description: args.agent },
+		theme,
+	);
 	const assignmentSection = createAssignmentSectionRenderer(args, theme);
 	const contextSection = createContextSectionRenderer(args, theme);
 	return framedBlock(theme, width => {
@@ -692,21 +698,23 @@ function renderAgentProgress(
 	const indent = prefix ? `${prefix} ` : "";
 	let statusLine: string;
 	if (progress.status === "running" || progress.status === "pending") {
-		// Live (or queued) agents use the task icon: detached async spawns can
-		// stay "pending" while real work is running, so a pending/hourglass glyph
-		// reads wrong in the transcript. Keep the row static; the Task tool header
-		// already carries any live animation.
-		const taskIcon = theme.styledSymbol("tool.task", frozen ? "dim" : "accent");
+		// Live (or queued) agents use the same dot finished rows keep: detached
+		// async spawns can stay "pending" while real work is running, so a
+		// pending/hourglass or spinner glyph reads wrong in the transcript. Keep
+		// the row static; the Task tool header already carries the dispatch icon.
+		const dot = theme.styledSymbol("status.done", frozen ? "dim" : "accent");
 		const nameColor = frozen ? "dim" : "accent";
 		const name = theme.fg(nameColor, description ? theme.bold(displayId) : displayId);
-		statusLine = `${indent}${taskIcon} ${name}`;
+		statusLine = `${indent}${dot} ${name}`;
 		if (description) {
 			statusLine += `${theme.fg(nameColor, ":")} ${theme.fg(nameColor, description)}`;
 		}
+	} else if (progress.status === "completed") {
+		// Finished rows keep the dot but settle from accent to the plain
+		// foreground: completion reads as a color change, not a new glyph.
+		statusLine = `${indent}${theme.styledSymbol("status.done", "text")} ${theme.fg("text", titlePart)}`;
 	} else {
-		const glyph =
-			progress.status === "completed" ? theme.styledSymbol("status.done", "accent") : theme.fg(iconColor, icon);
-		statusLine = `${indent}${glyph} ${theme.fg("accent", titlePart)}`;
+		statusLine = `${indent}${theme.fg(iconColor, icon)} ${theme.fg("accent", titlePart)}`;
 	}
 	// Show retry-blocked badge so the parent immediately sees that a child
@@ -982,7 +990,7 @@ function renderAgentResult(
 		: needsWarning
 			? theme.status.warning
 			: success
-				? theme.styledSymbol("status.done", "accent")
+				? theme.styledSymbol("status.done", "text")
 				: theme.status.error;
 	const iconColor = needsWarning ? "warning" : success ? "success" : mergeFailed ? "warning" : "error";
 	const statusText = aborted
@@ -999,11 +1007,10 @@ function renderAgentResult(
 	const description = result.description?.trim();
 	const displayId = formatTaskId(result.id);
 	const titlePart = description ? `${theme.bold(displayId)}: ${description}` : displayId;
-	let statusLine = `${prefix ? `${prefix} ` : ""}${theme.fg(iconColor, icon)} ${theme.fg("accent", titlePart)} ${formatBadge(
-		statusText,
-		iconColor,
-		theme,
-	)}`;
+	let statusLine = `${prefix ? `${prefix} ` : ""}${theme.fg(iconColor, icon)} ${theme.fg(
+		success && !needsWarning ? "text" : "accent",
+		titlePart,
+	)} ${formatBadge(statusText, iconColor, theme)}`;
 	const showBadge = settings.get("task.showResolvedModelBadge");
 	statusLine = appendAgentStats(
 		statusLine,
@@ -1217,8 +1224,16 @@ export function renderResult(
 	const metaLabel = countLabel ? (agentLabel ? `${countLabel}: ${agentLabel}` : countLabel) : agentLabel;
 	const header = renderStatusLine(
 		{
-			icon: icon === "success" ? undefined : icon,
-			iconOverride: icon === "success" ? theme.styledSymbol("status.done", "accent") : undefined,
+			icon: icon === "success" || icon === "running" ? undefined : icon,
+			// While agents are in flight the header shows the dispatch glyph, not a
+			// spinner: async spawns return immediately, so "running" means
+			// "delegated to peers", not "this call is blocking the turn".
+			iconOverride:
+				icon === "running"
+					? theme.styledSymbol("tool.task", "accent")
+					: icon === "success"
+						? theme.styledSymbol("status.done", "accent")
+						: undefined,
 			title: "Task",
 			meta: metaLabel ? [metaLabel] : undefined,
 		},

package/src/tools/bash.ts CHANGED Viewed

@@ -1385,6 +1385,9 @@ export function createShellRenderer<TArgs>(config: ShellRendererConfig<TArgs>) {
 		},
 		mergeCallAndResult: true,
 		inline: true,
+		// Pending preview caps the command to a viewport-sized tail window that
+		// shifts while args stream; keep it out of native scrollback mid-run.
+		provisionalPendingPreview: true,
 	};
 }

package/src/tools/eval-render.ts CHANGED Viewed

@@ -754,4 +754,8 @@ export const evalToolRenderer = {
 	mergeCallAndResult: true,
 	inline: true,
+	// Pending preview shows tail-window code cells; the result render
+	// interleaves each cell's output under its code, re-laying-out every row
+	// below the first cell. Keep the preview out of native scrollback mid-run.
+	provisionalPendingPreview: true,
 };

package/src/tools/renderers.ts CHANGED Viewed

@@ -43,6 +43,19 @@ export type ToolRenderer = {
 	mergeCallAndResult?: boolean;
 	/** Render without background box, inline in the response flow */
 	inline?: boolean;
+	/**
+	 * Collapsed pending preview is provisional — a tail-window or otherwise
+	 * re-anchored view the result render replaces wholesale (an edit's
+	 * streamed-diff tail, bash/ssh command caps, eval cells whose outputs
+	 * interleave under each cell). Its rows must never commit to native
+	 * scrollback mid-run; see
+	 * `ToolExecutionComponent.isTranscriptBlockCommitStable`. Absent = the
+	 * pending preview streams top-anchored append-shaped rows the result
+	 * render preserves (task context/assignment, write content), which stay
+	 * commit-eligible so a call taller than the viewport scrolls into history
+	 * instead of reading as cut off.
+	 */
+	provisionalPendingPreview?: boolean;
 };
 export const toolRenderers: Record<string, ToolRenderer> = {

package/src/tools/ssh.ts CHANGED Viewed

@@ -346,4 +346,7 @@ export const sshToolRenderer = {
 		});
 	},
 	mergeCallAndResult: true,
+	// Pending preview caps the command to a viewport-sized tail window that
+	// shifts while args stream; keep it out of native scrollback mid-run.
+	provisionalPendingPreview: true,
 };