npm - @oh-my-pi/pi-coding-agent - Versions diffs - 15.11.3 → 15.11.4 - Mend

@oh-my-pi/pi-coding-agent 15.11.3 → 15.11.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (103) hide show

package/CHANGELOG.md +54 -0
package/dist/cli.js +353 -294
package/dist/types/config/api-key-resolver.d.ts +9 -3
package/dist/types/config/keybindings.d.ts +1 -1
package/dist/types/config/model-discovery.d.ts +6 -4
package/dist/types/config/model-registry.d.ts +7 -4
package/dist/types/config/settings-schema.d.ts +458 -155
package/dist/types/export/html/template.generated.d.ts +1 -1
package/dist/types/mnemopi/config.d.ts +3 -1
package/dist/types/modes/components/settings-defs.d.ts +9 -2
package/dist/types/modes/components/settings-selector.d.ts +9 -4
package/dist/types/modes/components/tool-execution.d.ts +12 -1
package/dist/types/modes/components/transcript-container.d.ts +12 -0
package/dist/types/modes/controllers/input-controller.d.ts +9 -1
package/dist/types/modes/theme/theme.d.ts +23 -3
package/dist/types/session/agent-session.d.ts +14 -7
package/dist/types/session/auth-storage.d.ts +1 -1
package/dist/types/session/snapcompact-inline.d.ts +28 -0
package/dist/types/slash-commands/helpers/active-oauth-account.d.ts +14 -0
package/dist/types/system-prompt.d.ts +3 -1
package/dist/types/task/render.d.ts +16 -6
package/dist/types/tools/gh.d.ts +3 -0
package/dist/types/tools/render-utils.d.ts +8 -16
package/dist/types/utils/session-color.d.ts +15 -3
package/dist/types/web/kagi.d.ts +1 -2
package/dist/types/web/search/providers/codex.d.ts +1 -1
package/dist/types/web/search/providers/gemini.d.ts +9 -6
package/package.json +11 -11
package/src/auto-thinking/classifier.ts +1 -5
package/src/commit/model-selection.ts +3 -6
package/src/config/api-key-resolver.ts +10 -3
package/src/config/keybindings.ts +1 -1
package/src/config/model-discovery.ts +60 -46
package/src/config/model-registry.ts +21 -8
package/src/config/model-resolver.ts +57 -3
package/src/config/settings-schema.ts +601 -153
package/src/eval/completion-bridge.ts +1 -5
package/src/export/html/template.generated.ts +1 -1
package/src/export/html/template.js +13 -6
package/src/internal-urls/docs-index.generated.ts +5 -5
package/src/internal-urls/issue-pr-protocol.ts +10 -4
package/src/memories/index.ts +2 -10
package/src/mnemopi/backend.ts +30 -8
package/src/mnemopi/config.ts +6 -1
package/src/mnemopi/state.ts +6 -0
package/src/modes/components/extensions/inspector-panel.ts +6 -2
package/src/modes/components/plan-review-overlay.ts +15 -17
package/src/modes/components/plugin-settings.ts +22 -5
package/src/modes/components/settings-defs.ts +19 -4
package/src/modes/components/settings-selector.ts +493 -93
package/src/modes/components/status-line/component.ts +3 -1
package/src/modes/components/status-line/segments.ts +3 -1
package/src/modes/components/tool-execution.ts +69 -12
package/src/modes/components/transcript-container.ts +26 -0
package/src/modes/components/tree-selector.ts +16 -6
package/src/modes/controllers/command-controller.ts +37 -7
package/src/modes/controllers/event-controller.ts +1 -0
package/src/modes/controllers/input-controller.ts +68 -6
package/src/modes/controllers/selector-controller.ts +81 -61
package/src/modes/interactive-mode.ts +4 -2
package/src/modes/rpc/rpc-mode.ts +2 -1
package/src/modes/shared.ts +2 -0
package/src/modes/theme/theme.ts +100 -7
package/src/modes/utils/context-usage.ts +3 -1
package/src/modes/utils/hotkeys-markdown.ts +1 -1
package/src/modes/utils/ui-helpers.ts +9 -5
package/src/prompts/system/personalities/default.md +26 -0
package/src/prompts/system/personalities/friendly.md +17 -0
package/src/prompts/system/personalities/pragmatic.md +15 -0
package/src/prompts/system/snapcompact-system-frames-note.md +1 -0
package/src/prompts/system/snapcompact-system-stub.md +1 -0
package/src/prompts/system/snapcompact-toolresult-note.md +1 -0
package/src/prompts/system/system-prompt.md +5 -22
package/src/prompts/tools/task.md +3 -3
package/src/sdk.ts +22 -1
package/src/session/agent-session.ts +91 -24
package/src/session/auth-storage.ts +1 -0
package/src/session/session-dump-format.ts +8 -1
package/src/session/session-manager.ts +5 -5
package/src/session/snapcompact-inline.ts +187 -0
package/src/slash-commands/helpers/active-oauth-account.ts +44 -0
package/src/slash-commands/helpers/usage-report.ts +24 -3
package/src/system-prompt.ts +15 -1
package/src/task/render.ts +29 -19
package/src/tool-discovery/tool-index.ts +2 -0
package/src/tools/bash.ts +10 -3
package/src/tools/eval-render.ts +13 -8
package/src/tools/gh.ts +39 -1
package/src/tools/image-gen.ts +114 -78
package/src/tools/inspect-image.ts +1 -5
package/src/tools/job.ts +25 -5
package/src/tools/read.ts +1 -57
package/src/tools/render-utils.ts +29 -31
package/src/tools/ssh.ts +3 -3
package/src/tools/tts.ts +40 -20
package/src/utils/clipboard.ts +56 -4
package/src/utils/commit-message-generator.ts +1 -5
package/src/utils/session-color.ts +83 -9
package/src/utils/title-generator.ts +1 -1
package/src/web/kagi.ts +26 -27
package/src/web/search/providers/codex.ts +42 -40
package/src/web/search/providers/gemini.ts +42 -22
package/src/web/search/providers/perplexity.ts +22 -10

package/src/session/agent-session.ts CHANGED Viewed

@@ -107,7 +107,7 @@ import {
 	relativePathWithinRoot,
 	Snowflake,
 } from "@oh-my-pi/pi-utils";
-import { snapcompactCompact } from "@oh-my-pi/snapcompact";
+import * as snapcompact from "@oh-my-pi/snapcompact";
 import { type AsyncJob, type AsyncJobDeliveryState, AsyncJobManager } from "../async";
 import { classifyDifficulty } from "../auto-thinking/classifier";
 import { reset as resetCapabilities } from "../capability";
@@ -855,8 +855,13 @@ function extractPermissionLocations(
  *  `tag` is set only by `enqueueCustomMessageDisplay` (used for skill-prompt
  *  custom messages queued during streaming) and is matched by the custom-role
  *  `message_start` dequeue branch; user-message pushes leave it undefined and
- *  rely on the existing text-equality match. */
-type QueuedDisplayEntry = { text: string; tag?: string };
+ *  rely on the existing text-equality match. `images` carries the original
+ *  (pre-normalization) image blocks so queue restoration (Esc / Alt+Up) can
+ *  hand them back to the editor instead of dropping them. */
+type QueuedDisplayEntry = { text: string; tag?: string; images?: ImageContent[] };
+/** Entry returned by {@link AgentSession.clearQueue} / {@link AgentSession.popLastQueuedMessage}. */
+export type RestoredQueuedMessage = { text: string; images?: ImageContent[] };
 export class AgentSession {
 	readonly agent: Agent;
@@ -5028,7 +5033,7 @@ export class AgentSession {
 	async #queueSteer(text: string, images?: ImageContent[]): Promise<void> {
 		const normalizedImages = await normalizeModelContextImages(images);
 		const displayText = text || (images && images.length > 0 ? "[Image]" : "");
-		this.#steeringMessages.push({ text: displayText });
+		this.#steeringMessages.push({ text: displayText, images });
 		const content: (TextContent | ImageContent)[] = [{ type: "text", text }];
 		if (normalizedImages && normalizedImages.length > 0) {
 			content.push(...normalizedImages);
@@ -5040,6 +5045,16 @@ export class AgentSession {
 			attribution: "user",
 			timestamp: Date.now(),
 		});
+		// A steer can land on an idle session: the caller checked isStreaming
+		// before the (potentially slow) image normalization above, so the turn
+		// may have ended in between. Without a drain the message would strand in
+		// the queue until the next manual prompt — schedule an immediate continue,
+		// mirroring #queueFollowUp's idle-path delivery.
+		if (this.#canAutoContinueForFollowUp()) {
+			this.#scheduleAgentContinue({
+				shouldContinue: () => this.#canAutoContinueForFollowUp() && this.agent.hasQueuedMessages(),
+			});
+		}
 	}
 	/**
@@ -5048,7 +5063,7 @@ export class AgentSession {
 	async #queueFollowUp(text: string, images?: ImageContent[]): Promise<void> {
 		const normalizedImages = await normalizeModelContextImages(images);
 		const displayText = text || (images && images.length > 0 ? "[Image]" : "");
-		this.#followUpMessages.push({ text: displayText });
+		this.#followUpMessages.push({ text: displayText, images });
 		const content: (TextContent | ImageContent)[] = [{ type: "text", text }];
 		if (normalizedImages && normalizedImages.length > 0) {
 			content.push(...normalizedImages);
@@ -5297,12 +5312,14 @@ export class AgentSession {
 	}
 	/**
-	 * Clear queued messages and return them.
-	 * Useful for restoring to editor when user aborts.
+	 * Clear queued messages and return them (text plus any attached images).
+	 * Useful for restoring to editor when user aborts. The internal entry
+	 * arrays are handed out as-is — a `tag` (if any) is inert once the record
+	 * leaves the queue.
 	 */
-	clearQueue(): { steering: string[]; followUp: string[] } {
-		const steering = this.#steeringMessages.map(e => e.text);
-		const followUp = this.#followUpMessages.map(e => e.text);
+	clearQueue(): { steering: RestoredQueuedMessage[]; followUp: RestoredQueuedMessage[] } {
+		const steering = this.#steeringMessages;
+		const followUp = this.#followUpMessages;
 		this.#steeringMessages = [];
 		this.#followUpMessages = [];
 		this.agent.clearAllQueues();
@@ -5328,21 +5345,21 @@ export class AgentSession {
 	/**
 	 * Pop the last queued message (steering first, then follow-up).
 	 * Used by dequeue keybinding to restore messages to editor one at a time.
-	 * Returns the popped entry's `.text`; the tag (if any) dies with the
-	 * record — no orphan state can outlive the queue entry.
+	 * Returns the popped entry's text and images; the tag (if any) dies with
+	 * the record — no orphan state can outlive the queue entry.
 	 */
-	popLastQueuedMessage(): string | undefined {
+	popLastQueuedMessage(): RestoredQueuedMessage | undefined {
 		// Pop from steering first (LIFO)
 		if (this.#steeringMessages.length > 0) {
 			const entry = this.#steeringMessages.pop();
 			this.agent.popLastSteer();
-			return entry?.text;
+			return entry;
 		}
 		// Then from follow-up
 		if (this.#followUpMessages.length > 0) {
 			const entry = this.#followUpMessages.pop();
 			this.agent.popLastFollowUp();
-			return entry?.text;
+			return entry;
 		}
 		return undefined;
 	}
@@ -6368,7 +6385,10 @@ export class AgentSession {
 				details = compactionPrep.details;
 				preserveData = compactionPrep.preserveData;
 			} else if (snapcompactReady) {
-				const snapcompactResult = await snapcompactCompact(preparation, { convertToLlm, model: this.model });
+				const snapcompactResult = await snapcompact.compact(preparation, {
+					convertToLlm,
+					model: this.model,
+				});
 				summary = snapcompactResult.summary;
 				shortSummary = snapcompactResult.shortSummary;
 				firstKeptEntryId = snapcompactResult.firstKeptEntryId;
@@ -6582,7 +6602,7 @@ export class AgentSession {
 			const rawHandoffText = await generateHandoff(
 				this.agent.state.messages,
 				model,
-				apiKey,
+				this.#modelRegistry.resolver(model, this.sessionId),
 				{
 					systemPrompt: this.#obfuscateForProvider(this.#baseSystemPrompt),
 					tools: obfuscateProviderTools(this.#obfuscator, this.agent.state.tools),
@@ -7252,6 +7272,22 @@ export class AgentSession {
 		this.#closeProviderSessionsForModelSwitch(currentModel, currentModel);
 	}
+	/**
+	 * Reset provider state for the active model when it uses one of the OpenAI
+	 * Responses APIs (`openai-responses` / `openai-codex-responses`). Does
+	 * nothing when there is no active model or it uses any other API.
+	 *
+	 * On a match it calls `#closeProviderSessionsForModelSwitch` with the
+	 * current model as both arguments, invalidates the agent's append-only
+	 * context when one exists, and writes a debug log entry.
+	 *
+	 * @param reason Short label recorded in the debug log entry.
+	 */
+	#resetCurrentResponsesProviderSession(reason: string): void {
+		const model = this.model;
+		if (!model) return;
+		const { api } = model;
+		const usesResponsesApi = api === "openai-responses" || api === "openai-codex-responses";
+		if (!usesResponsesApi) return;
+		// Same model on both sides — presumably tears down its provider sessions
+		// without an actual model switch (confirm against the helper).
+		this.#closeProviderSessionsForModelSwitch(model, model);
+		this.agent.appendOnlyContext?.invalidateForModelChange();
+		const logFields = { provider: model.provider, model: model.id, api, reason };
+		logger.debug("Reset Responses provider session after stale replay error", logFields);
+	}
 	/**
 	 * Re-evaluate append-only context mode, creating or destroying the
 	 * manager as needed. Called on model switch AND setting change.
@@ -7577,7 +7613,7 @@ export class AgentSession {
 				return await compact(
 					this.#obfuscatePreparationForProvider(preparation),
 					candidate,
-					apiKey,
+					this.#modelRegistry.resolver(candidate, this.sessionId),
 					this.#obfuscateTextForProvider(customInstructions),
 					signal,
 					{
@@ -7882,7 +7918,10 @@ export class AgentSession {
 			} else if (action === "snapcompact") {
 				// Local, deterministic: render discarded history onto PNG frames.
 				// No model candidates, no API key, no retry loop.
-				const snapcompactResult = await snapcompactCompact(preparation, { convertToLlm, model: this.model });
+				const snapcompactResult = await snapcompact.compact(preparation, {
+					convertToLlm,
+					model: this.model,
+				});
 				summary = snapcompactResult.summary;
 				shortSummary = snapcompactResult.shortSummary;
 				firstKeptEntryId = snapcompactResult.firstKeptEntryId;
@@ -7906,7 +7945,7 @@ export class AgentSession {
 							compactResult = await compact(
 								this.#obfuscatePreparationForProvider(preparation),
 								candidate,
-								apiKey,
+								this.#modelRegistry.resolver(candidate, this.sessionId),
 								undefined,
 								autoCompactionSignal,
 								{
@@ -8293,11 +8332,32 @@ export class AgentSession {
 		if (isContextOverflow(message, contextWindow)) return false;
 		if (this.#isClassifierRefusal(message)) return true;
+		if (this.#isStaleOpenAIResponsesReplayError(message)) return true;
 		const err = message.errorMessage;
 		return this.#isTransientErrorMessage(err) || isUsageLimitError(err);
 	}
+	/**
+	 * Decide whether an assistant error message matches the stale-replay
+	 * patterns of the OpenAI Responses APIs.
+	 *
+	 * Only considered when either the message's API or the current model's API
+	 * is `openai-responses` / `openai-codex-responses`. The error text then
+	 * matches if it reads like `Item with id '…' not found`, or if it mentions
+	 * a "previous response" together with one of: not found, invalid, expired,
+	 * stale.
+	 *
+	 * @returns `true` when the error text matches; `false` otherwise, including
+	 *   when the message carries no error text.
+	 */
+	#isStaleOpenAIResponsesReplayError(message: AssistantMessage): boolean {
+		const isResponsesApi = (api: string | undefined): boolean =>
+			api === "openai-responses" || api === "openai-codex-responses";
+		const sessionApi = this.model?.api;
+		if (!isResponsesApi(message.api) && !isResponsesApi(sessionApi)) return false;
+		const text = message.errorMessage;
+		if (!text) return false;
+		if (/\bItem with id ['"][^'"]+['"] not found\.?/i.test(text)) return true;
+		const mentionsPreviousResponse = /previous[ _]?response/i.test(text);
+		return mentionsPreviousResponse && /not[ _]?found|invalid|expired|stale/i.test(text);
+	}
 	#isClassifierRefusal(message: AssistantMessage): boolean {
 		if (message.stopReason !== "error") return false;
 		const stopType = message.stopDetails?.type;
@@ -8631,15 +8691,22 @@ export class AgentSession {
 		}
 		const errorMessage = message.errorMessage || "Unknown error";
+		const staleOpenAIResponsesReplayError = this.#isStaleOpenAIResponsesReplayError(message);
 		const parsedRetryAfterMs = this.#parseRetryAfterMsFromError(errorMessage);
-		let delayMs = calculateRetryBackoffDelayMs(retrySettings.baseDelayMs, this.#retryAttempt);
+		let delayMs = staleOpenAIResponsesReplayError
+			? 0
+			: calculateRetryBackoffDelayMs(retrySettings.baseDelayMs, this.#retryAttempt);
 		let switchedCredential = false;
 		let switchedModel = false;
 		// Set when a usage-limit error pinned the wait to credential
 		// availability — suppresses the generic retry-after bump below.
 		let usageLimitWaitMs: number | undefined;
-		if (this.model && isUsageLimitError(errorMessage)) {
+		if (staleOpenAIResponsesReplayError) {
+			this.#resetCurrentResponsesProviderSession("stale replay error");
+		}
+		if (this.model && !staleOpenAIResponsesReplayError && isUsageLimitError(errorMessage)) {
 			const retryAfterMs = parsedRetryAfterMs ?? calculateRateLimitBackoffMs(parseRateLimitReason(errorMessage));
 			const outcome = await this.#modelRegistry.authStorage.markUsageLimitReached(
 				this.model.provider,
@@ -8676,7 +8743,7 @@ export class AgentSession {
 		}
 		const currentSelector = this.model ? formatRetryFallbackSelector(this.model, this.thinkingLevel) : undefined;
-		if (!switchedCredential && currentSelector) {
+		if (!staleOpenAIResponsesReplayError && !switchedCredential && currentSelector) {
 			if (retrySettings.modelFallback) {
 				if (!classifierRefusal) {
 					this.#noteRetryFallbackCooldown(currentSelector, parsedRetryAfterMs, errorMessage);
@@ -9813,7 +9880,7 @@ export class AgentSession {
 			const branchSummarySettings = this.settings.getGroup("branchSummary");
 			const result = await generateBranchSummary(entriesToSummarize, {
 				model,
-				apiKey,
+				apiKey: this.#modelRegistry.resolver(model, this.sessionId),
 				signal: this.#branchSummaryAbortController.signal,
 				customInstructions: this.#obfuscateTextForProvider(options.customInstructions),
 				reserveTokens: branchSummarySettings.reserveTokens,

package/src/session/auth-storage.ts CHANGED Viewed

@@ -12,6 +12,7 @@ export type {
 	AuthStorageOptions,
 	CredentialOrigin,
 	CredentialOriginKind,
+	OAuthAccountIdentity,
 	OAuthCredential,
 	SerializedAuthStorage,
 	SnapshotResponse,

package/src/session/session-dump-format.ts CHANGED Viewed

@@ -4,6 +4,7 @@
 import type { AgentMessage, ThinkingLevel } from "@oh-my-pi/pi-agent-core";
 import { INTENT_FIELD } from "@oh-my-pi/pi-agent-core";
 import type { AssistantMessage, Model } from "@oh-my-pi/pi-ai";
+import { isZodSchema, zodToWireSchema } from "@oh-my-pi/pi-ai/utils/schema";
 import {
 	type BashExecutionMessage,
 	type BranchSummaryMessage,
@@ -47,6 +48,12 @@ function stripTypeBoxFields(obj: unknown): unknown {
 	return obj;
 }
+/**
+ * Produce the schema value written to the dump for a tool's parameters.
+ * Zod schemas are converted with `zodToWireSchema`; every other value is
+ * passed through `stripTypeBoxFields`.
+ */
+function toolParametersToJsonSchema(parameters: unknown): unknown {
+	return isZodSchema(parameters) ? zodToWireSchema(parameters) : stripTypeBoxFields(parameters);
+}
 /** Serialize an object as XML parameter elements, one per key. */
 function formatArgsAsXml(args: Record<string, unknown>, indent = "\t"): string {
 	const parts: string[] = [];
@@ -89,7 +96,7 @@ export function formatSessionDumpText(options: FormatSessionDumpTextOptions): st
 		for (const tool of tools) {
 			lines.push(`<tool name="${tool.name}">`);
 			lines.push(tool.description);
-			const parametersClean = stripTypeBoxFields(tool.parameters);
+			const parametersClean = toolParametersToJsonSchema(tool.parameters);
 			lines.push(`\nParameters:\n${formatArgsAsXml(parametersClean as Record<string, unknown>)}`);
 			lines.push("<" + "/tool>\n");
 		}

package/src/session/session-manager.ts CHANGED Viewed

@@ -27,7 +27,7 @@ import {
 	Snowflake,
 	toError,
 } from "@oh-my-pi/pi-utils";
-import { getPreservedSnapcompactArchive, snapcompactImages } from "@oh-my-pi/snapcompact";
+import * as snapcompact from "@oh-my-pi/snapcompact";
 import { ArtifactManager } from "./artifacts";
 import {
 	type BlobPutOptions,
@@ -712,7 +712,7 @@ export function buildSessionContext(
 		// the component can report them.
 		for (const entry of path) {
 			if (entry.type === "compaction") {
-				const snapcompactArchive = getPreservedSnapcompactArchive(entry.preserveData);
+				const snapcompactArchive = snapcompact.getPreservedArchive(entry.preserveData);
 				messages.push(
 					createCompactionSummaryMessage(
 						entry.summary,
@@ -720,7 +720,7 @@ export function buildSessionContext(
 						entry.timestamp,
 						entry.shortSummary,
 						undefined,
-						snapcompactArchive ? snapcompactImages(snapcompactArchive) : undefined,
+						snapcompactArchive ? snapcompact.images(snapcompactArchive) : undefined,
 					),
 				);
 			} else {
@@ -744,7 +744,7 @@ export function buildSessionContext(
 		// Emit summary first; re-attach any archived snapcompact frames so the
 		// model can keep reading the archived history after every context rebuild.
-		const snapcompactArchive = getPreservedSnapcompactArchive(compaction.preserveData);
+		const snapcompactArchive = snapcompact.getPreservedArchive(compaction.preserveData);
 		messages.push(
 			createCompactionSummaryMessage(
 				compaction.summary,
@@ -752,7 +752,7 @@ export function buildSessionContext(
 				compaction.timestamp,
 				compaction.shortSummary,
 				providerPayload,
-				snapcompactArchive ? snapcompactImages(snapcompactArchive) : undefined,
+				snapcompactArchive ? snapcompact.images(snapcompactArchive) : undefined,
 			),
 		);

package/src/session/snapcompact-inline.ts ADDED Viewed

@@ -0,0 +1,187 @@
+/**
+ * Snapcompact inline imaging: per-request transform that swaps the system
+ * prompt and/or large historical tool results for dense PNG frames on
+ * vision-capable models.
+ *
+ * Runs inside the agent loop's `transformProviderContext` hook — after the
+ * persisted history is converted to the outgoing `Context`, before the
+ * provider stream call. It only ever builds NEW message objects/arrays; the
+ * input context shares `content` array references with the persisted
+ * `SessionMessageEntry` messages, so mutation would leak rendered images
+ * into session.jsonl.
+ */
+import type { Context, ImageContent, Model, TextContent, ToolResultMessage, UserMessage } from "@oh-my-pi/pi-ai";
+import { countTokens } from "@oh-my-pi/pi-natives";
+import * as snapcompact from "@oh-my-pi/snapcompact";
+import systemFramesNote from "../prompts/system/snapcompact-system-frames-note.md" with { type: "text" };
+import systemStub from "../prompts/system/snapcompact-system-stub.md" with { type: "text" };
+import toolResultNote from "../prompts/system/snapcompact-toolresult-note.md" with { type: "text" };
+export interface SnapcompactInlineOptions {
+	renderSystemPrompt: boolean;
+	renderToolResults: boolean;
+}
+/**
+ * Image-count budget per provider. Snapcompact frames are 1568px (<2000px) so
+ * dimension/size limits never bind; only COUNT does. Strictest mainstream is
+ * Groq (~5), so unknown providers get the safe floor.
+ */
+const INLINE_IMAGE_BUDGET_BY_PROVIDER: Record<string, number> = {
+	anthropic: 90,
+	"amazon-bedrock": 90,
+	openai: 200,
+	google: 200,
+	"google-vertex": 200,
+	"google-gemini-cli": 200,
+};
+/** Budget used when the provider has no entry in the table above. */
+const DEFAULT_INLINE_IMAGE_BUDGET = 5;
+/** Upper bound on the number of frames the system prompt may be rendered into. */
+const MAX_SYSTEM_PROMPT_FRAMES = 6;
+/** Tool results under this many tokens are never rasterized — the swap can't
+ *  save enough to justify trading crisp text for an image. */
+const MIN_TOOL_RESULT_TOKENS = 3000;
+/** Render only if imageTokens <= textTokens * SAVINGS_MARGIN. */
+const SAVINGS_MARGIN = 0.9;
+/**
+ * Tally the image blocks carried by the context's messages. Messages whose
+ * content is a plain string contribute nothing.
+ */
+function countContextImages(context: Context): number {
+	let images = 0;
+	for (const { content } of context.messages) {
+		if (typeof content !== "string") {
+			for (const { type } of content) {
+				if (type === "image") images += 1;
+			}
+		}
+	}
+	return images;
+}
+/** Type guard: narrows a content block to its text variant via the `type` tag. */
+function isTextContent(block: TextContent | ImageContent): block is TextContent {
+	const { type } = block;
+	return type === "text";
+}
+/**
+ * Savings gate: the estimated token cost of the frames must not exceed
+ * `SAVINGS_MARGIN` times the token count of the text they would replace.
+ */
+function passesSavingsGate(frames: number, shape: snapcompact.Shape, textTokens: number): boolean {
+	const imageTokens = frames * shape.frameTokenEstimate;
+	const ceiling = textTokens * SAVINGS_MARGIN;
+	return imageTokens <= ceiling;
+}
+/** One cached render: the frames plus the hash used to tell whether they are still current. */
+interface FrameCacheEntry {
+	/** Value produced by `Bun.hash`; compared on lookup to decide whether `frames` can be reused. */
+	hash: number | bigint;
+	/** The rendered image blocks. */
+	frames: ImageContent[];
+}
+/**
+ * Per-request transformer that swaps eligible tool results and/or the system
+ * prompt for rendered image frames.
+ *
+ * Stateless with respect to the model (passed per call, so mid-session model
+ * switches re-resolve shape and budget); stateful only for the render caches,
+ * which live as long as the session's Agent. Cache entries are validated
+ * against both the source text and the model API the shape was resolved
+ * from, so frames rendered for one API's shape are never replayed after a
+ * switch to a different API.
+ */
+export class SnapcompactInlineTransformer {
+	/** Rendered tool-result frames keyed by toolCallId. */
+	#toolCache = new Map<string, FrameCacheEntry>();
+	/** Frames from the most recent system-prompt render. */
+	#systemCache?: FrameCacheEntry;
+	constructor(private readonly options: SnapcompactInlineOptions) {}
+	/**
+	 * Build the outgoing context with large historical tool results and/or the
+	 * system prompt replaced by image frames, subject to the provider's image
+	 * budget and the savings gate.
+	 *
+	 * Never mutates `context` or its messages: replaced messages are new
+	 * objects placed in a copied array.
+	 *
+	 * @param context Outgoing provider context.
+	 * @param model Model the request is going to; decides vision support,
+	 *   frame shape and image budget.
+	 * @returns The original `context` reference when the model has no image
+	 *   input, the budget is already exhausted, or nothing was rendered;
+	 *   otherwise a new context object.
+	 */
+	transform(context: Context, model: Model): Context {
+		// Vision gate: providers silently DROP images on text-only models —
+		// rendering would lose the content entirely.
+		if (!model.input.includes("image")) return context;
+		const shape = snapcompact.resolveShape(model.api);
+		// Images already present in the context count against the budget.
+		let budget =
+			(INLINE_IMAGE_BUDGET_BY_PROVIDER[model.provider] ?? DEFAULT_INLINE_IMAGE_BUDGET) - countContextImages(context);
+		if (budget <= 0) return context;
+		const messages = [...context.messages];
+		let changed = false;
+		if (this.options.renderToolResults) {
+			const toolResultIndices: number[] = [];
+			const liveToolCallIds = new Set<string>();
+			for (let i = 0; i < messages.length; i++) {
+				const message = messages[i];
+				if (message.role !== "toolResult") continue;
+				toolResultIndices.push(i);
+				liveToolCallIds.add(message.toolCallId);
+			}
+			// Oldest-first for cache-stable bytes; skip the LAST tool result so
+			// the freshest output stays crisp text.
+			for (let k = 0; k < toolResultIndices.length - 1 && budget > 0; k++) {
+				const index = toolResultIndices[k];
+				const message = messages[index] as ToolResultMessage;
+				// Don't re-image results that already carry images (screenshots etc.).
+				if (message.content.some(block => block.type === "image")) continue;
+				const text = message.content
+					.filter(isTextContent)
+					.map(block => block.text)
+					.join("\n");
+				const textTokens = countTokens(text);
+				if (textTokens < MIN_TOOL_RESULT_TOKENS) continue;
+				const needed = snapcompact.frames(text, { shape });
+				if (needed === 0 || needed > budget) continue;
+				if (!passesSavingsGate(needed, shape, textTokens)) continue;
+				const frames = this.#framesFor(this.#toolCache, message.toolCallId, text, shape, model.api);
+				messages[index] = { ...message, content: [{ type: "text", text: toolResultNote }, ...frames] };
+				budget -= frames.length;
+				changed = true;
+			}
+			// Drop cache entries for tool calls no longer in the context
+			// (compacted away) so the cache stays bounded by live history.
+			for (const key of this.#toolCache.keys()) {
+				if (!liveToolCallIds.has(key)) this.#toolCache.delete(key);
+			}
+		}
+		let systemPrompt = context.systemPrompt;
+		if (this.options.renderSystemPrompt && context.systemPrompt?.length && budget > 0) {
+			const joined = context.systemPrompt.join("\n\n");
+			const needed = snapcompact.frames(joined, { shape });
+			const userIndex = messages.findIndex(message => message.role === "user");
+			if (
+				needed > 0 &&
+				needed <= Math.min(budget, MAX_SYSTEM_PROMPT_FRAMES) &&
+				passesSavingsGate(needed, shape, countTokens(joined)) &&
+				// No user message to carry the frames → leave the prompt as text.
+				userIndex >= 0
+			) {
+				const hash = this.#cacheHash(model.api, joined);
+				let cached = this.#systemCache;
+				if (!cached || cached.hash !== hash) {
+					cached = {
+						hash,
+						frames: snapcompact.renderMany(joined, { shape, maxFrames: MAX_SYSTEM_PROMPT_FRAMES }),
+					};
+					this.#systemCache = cached;
+				}
+				const frames = cached.frames;
+				const original = messages[userIndex] as UserMessage;
+				const originalContent: (TextContent | ImageContent)[] =
+					typeof original.content === "string" ? [{ type: "text", text: original.content }] : original.content;
+				// Frames ride on the first user message, ahead of its own content.
+				messages[userIndex] = {
+					...original,
+					content: [{ type: "text", text: systemFramesNote }, ...frames, ...originalContent],
+				};
+				systemPrompt = [systemStub];
+				budget -= frames.length;
+				changed = true;
+			}
+		}
+		if (!changed) return context;
+		return { ...context, systemPrompt, messages };
+	}
+	/**
+	 * Hash identifying one render input. The shape is resolved from the model
+	 * API, so the API string is folded in alongside the text: identical text
+	 * rendered for a different API must not hit the cache.
+	 */
+	#cacheHash(shapeKey: string, text: string): number | bigint {
+		return Bun.hash(`${shapeKey}\0${text}`);
+	}
+	/**
+	 * Return the cached frames for `key` when they were rendered from the same
+	 * text under the same `shapeKey`; otherwise render, store and return fresh
+	 * frames (overwriting any stale entry under that key).
+	 */
+	#framesFor(
+		cache: Map<string, FrameCacheEntry>,
+		key: string,
+		text: string,
+		shape: snapcompact.Shape,
+		shapeKey: string,
+	): ImageContent[] {
+		const hash = this.#cacheHash(shapeKey, text);
+		const cached = cache.get(key);
+		if (cached && cached.hash === hash) return cached.frames;
+		const frames = snapcompact.renderMany(text, { shape });
+		cache.set(key, { hash, frames });
+		return frames;
+	}
+}

package/src/slash-commands/helpers/active-oauth-account.ts ADDED Viewed

@@ -0,0 +1,44 @@
+import type { UsageLimit, UsageReport } from "@oh-my-pi/pi-ai";
+import type { OAuthAccountIdentity } from "../../session/auth-storage";
+/**
+ * Canonicalize an identity field for comparison: trimmed and lower-cased.
+ * Non-strings and blank strings yield `undefined`.
+ */
+function normalizeIdentityValue(value: unknown): string | undefined {
+	if (typeof value !== "string") return undefined;
+	const trimmed = value.trim();
+	return trimmed ? trimmed.toLowerCase() : undefined;
+}
+/**
+ * Whether one usage-limit column belongs to the given OAuth identity.
+ *
+ * Shared matching rules for the `/usage` renderers; all comparisons are made
+ * on trimmed, lower-cased values:
+ * - `accountId` against report metadata `accountId`/`account_id`, or `limit.scope.accountId`
+ * - `email`     against report metadata `email`
+ * - `projectId` against report metadata `projectId`, or `limit.scope.projectId`
+ *   (Google-style providers key usage on the GCP project, not an account id)
+ *
+ * @returns `false` when `identity` is absent or none of the rules match.
+ */
+export function limitMatchesActiveAccount(
+	report: UsageReport,
+	limit: UsageLimit,
+	identity: OAuthAccountIdentity | undefined,
+): boolean {
+	if (!identity) return false;
+	const metadata = report.metadata ?? {};
+	const accountId = normalizeIdentityValue(identity.accountId);
+	if (accountId !== undefined) {
+		const fromMetadata = normalizeIdentityValue(metadata.accountId) ?? normalizeIdentityValue(metadata.account_id);
+		if (fromMetadata === accountId) return true;
+		if (normalizeIdentityValue(limit.scope.accountId) === accountId) return true;
+	}
+	const email = normalizeIdentityValue(identity.email);
+	if (email !== undefined && normalizeIdentityValue(metadata.email) === email) return true;
+	const projectId = normalizeIdentityValue(identity.projectId);
+	if (projectId === undefined) return false;
+	if (normalizeIdentityValue(metadata.projectId) === projectId) return true;
+	return normalizeIdentityValue(limit.scope.projectId) === projectId;
+}
+/**
+ * Whether at least one limit column of `report` belongs to the given OAuth
+ * identity. Always `false` without an identity or when the report has no limits.
+ */
+export function reportMatchesActiveAccount(report: UsageReport, identity: OAuthAccountIdentity | undefined): boolean {
+	if (identity) {
+		for (const limit of report.limits) {
+			if (limitMatchesActiveAccount(report, limit, identity)) return true;
+		}
+	}
+	return false;
+}

package/src/slash-commands/helpers/usage-report.ts CHANGED Viewed

@@ -1,5 +1,7 @@
 import type { UsageLimit, UsageReport } from "@oh-my-pi/pi-ai";
+import type { OAuthAccountIdentity } from "../../session/auth-storage";
 import type { SlashCommandRuntime } from "../types";
+import { reportMatchesActiveAccount } from "./active-oauth-account";
 import { formatDuration, renderAsciiBar } from "./format";
 function formatProviderName(provider: string): string {
@@ -31,7 +33,11 @@ function formatUsageReportAccount(report: UsageReport, limit: UsageLimit, index:
 	return `account ${index + 1}`;
 }
-function renderUsageReports(reports: UsageReport[], nowMs: number): string {
+function renderUsageReports(
+	reports: UsageReport[],
+	nowMs: number,
+	resolveActiveAccount?: (provider: string) => OAuthAccountIdentity | undefined,
+): string {
 	const latestFetchedAt = Math.max(...reports.map(report => report.fetchedAt ?? 0));
 	const lines = [`Usage${latestFetchedAt ? ` (${formatDuration(nowMs - latestFetchedAt)} ago)` : ""}`];
 	const grouped = new Map<string, UsageReport[]>();
@@ -45,7 +51,9 @@ function renderUsageReports(reports: UsageReport[], nowMs: number): string {
 		left.localeCompare(right),
 	)) {
 		lines.push("", formatProviderName(provider));
+		const activeAccount = resolveActiveAccount?.(provider);
 		for (const report of providerReports) {
+			const inUse = reportMatchesActiveAccount(report, activeAccount);
 			if (report.limits.length === 0) {
 				const email = typeof report.metadata?.email === "string" ? report.metadata.email : "account";
 				lines.push(`- ${email}: no limits reported`);
@@ -56,7 +64,9 @@ function renderUsageReports(reports: UsageReport[], nowMs: number): string {
 				const window = limit.window?.label ?? limit.scope.windowId;
 				const tier = limit.scope.tier ? ` (${limit.scope.tier})` : "";
 				lines.push(`- ${limit.label}${tier}${window ? ` — ${window}` : ""}`);
-				lines.push(`  ${formatUsageReportAccount(report, limit, index)}: ${formatUsageAmount(limit)}`);
+				lines.push(
+					`  ${formatUsageReportAccount(report, limit, index)}: ${formatUsageAmount(limit)}${inUse ? "  ← in use by this session" : ""}`,
+				);
 				lines.push(`  ${renderAsciiBar(limit.amount.usedFraction)}`);
 				if (limit.window?.resetsAt && limit.window.resetsAt > nowMs) {
 					lines.push(`  resets in ${formatDuration(limit.window.resetsAt - nowMs)}`);
@@ -79,7 +89,18 @@ export async function buildUsageReportText(runtime: SlashCommandRuntime): Promis
 	};
 	if (provider.fetchUsageReports) {
 		const reports = await provider.fetchUsageReports();
-		if (reports && reports.length > 0) return renderUsageReports(reports, Date.now());
+		if (reports && reports.length > 0) {
+			const currentProvider = runtime.session.model?.provider;
+			const activeAccount = currentProvider
+				? runtime.session.modelRegistry.authStorage.getOAuthAccountIdentity(
+						currentProvider,
+						runtime.session.sessionId,
+					)
+				: undefined;
+			return renderUsageReports(reports, Date.now(), providerId =>
+				providerId === currentProvider ? activeAccount : undefined,
+			);
+		}
 	}
 	const stats = runtime.session.sessionManager.getUsageStatistics();