npm - @oh-my-pi/pi-coding-agent - Versions diffs - 15.2.4 → 15.3.1 - Mend

@oh-my-pi/pi-coding-agent 15.2.4 → 15.3.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (55)

package/CHANGELOG.md +20 -0
package/dist/types/config/model-registry.d.ts +26 -0
package/dist/types/config/settings-schema.d.ts +34 -1
package/dist/types/config/settings.d.ts +6 -0
package/dist/types/discovery/helpers.d.ts +1 -0
package/dist/types/goals/runtime.d.ts +4 -0
package/dist/types/modes/components/status-line/types.d.ts +10 -0
package/dist/types/modes/components/status-line.d.ts +16 -0
package/dist/types/modes/interactive-mode.d.ts +3 -1
package/dist/types/modes/types.d.ts +3 -1
package/dist/types/modes/utils/context-usage.d.ts +17 -0
package/dist/types/modes/utils/ui-helpers.d.ts +5 -1
package/dist/types/session/agent-session.d.ts +9 -0
package/dist/types/session/session-manager.d.ts +10 -0
package/dist/types/task/executor.d.ts +3 -1
package/dist/types/task/types.d.ts +35 -0
package/dist/types/tools/bash-command-fixup.d.ts +0 -5
package/dist/types/utils/clipboard.d.ts +3 -1
package/dist/types/utils/image-resize.d.ts +4 -1
package/package.json +7 -7
package/src/config/model-registry.ts +46 -21
package/src/config/settings-schema.ts +29 -1
package/src/config/settings.ts +19 -0
package/src/discovery/helpers.ts +5 -1
package/src/extensibility/plugins/legacy-pi-compat.ts +27 -5
package/src/goals/runtime.ts +35 -13
package/src/hashline/parser.ts +6 -1
package/src/internal-urls/docs-index.generated.ts +2 -1
package/src/main.ts +1 -1
package/src/modes/components/model-selector.ts +53 -22
package/src/modes/components/status-line/segments.ts +53 -0
package/src/modes/components/status-line/types.ts +4 -0
package/src/modes/components/status-line.ts +243 -15
package/src/modes/controllers/command-controller.ts +9 -0
package/src/modes/controllers/event-controller.ts +8 -0
package/src/modes/interactive-mode.ts +23 -8
package/src/modes/theme/theme.ts +1 -1
package/src/modes/types.ts +1 -1
package/src/modes/utils/context-usage.ts +42 -8
package/src/modes/utils/ui-helpers.ts +11 -1
package/src/prompts/agents/frontmatter.md +1 -0
package/src/sdk.ts +24 -0
package/src/session/agent-session.ts +70 -0
package/src/session/session-manager.ts +119 -1
package/src/slash-commands/builtin-registry.ts +15 -0
package/src/task/executor.ts +50 -1
package/src/task/index.ts +11 -0
package/src/task/render.ts +26 -2
package/src/task/types.ts +35 -0
package/src/tools/bash-command-fixup.ts +0 -10
package/src/tools/bash.ts +1 -9
package/src/utils/clipboard.ts +79 -3
package/src/utils/image-resize.ts +78 -30
package/dist/types/modes/components/status-line-segment-editor.d.ts +0 -24
package/src/modes/components/status-line-segment-editor.ts +0 -359

package/CHANGELOG.md CHANGED Viewed

@@ -2,6 +2,18 @@
 ## [Unreleased]
+## [15.3.0] - 2026-05-25
+### Added
+- Added `OMP_NO_WEBP` environment variable to disable WebP encoding in image resize, fixing HTTP 400 errors when attaching browser snapshots to vision models running on local llama.cpp (which uses the STB library, which lacks WebP support)
+- Fixed loop mode submitting the next prompt while a background async-job delivery turn (idle flush) was still pending, which could cause the job result to be silently dropped and make the session appear to keep firing while work was ongoing ([#1294](https://github.com/can1357/oh-my-pi/issues/1294))
+- Fixed clipboard image paste (Ctrl+V) silently failing on WSL2 by routing image reads through a `powershell.exe` bridge when WSL interop is detected, since `arboard` returns `ContentNotAvailable` under WSLg ([#1280](https://github.com/can1357/oh-my-pi/issues/1280))
+- Fixed extension `ctx.ui.notify()` messages emitted during `session_start` being cleared before the first interactive render ([#1316](https://github.com/can1357/oh-my-pi/issues/1316)).
+- Fixed append-only context mode not being recomputed after model switches — the mode was frozen at session construction time using the initial model's provider, so `provider.appendOnlyContext=auto` left append-only enabled after switching away from DeepSeek (or disabled after switching to DeepSeek) for the rest of the session
+### Fixed
+- Fixed clipboard image paste (Ctrl+V) silently failing on WSL2 by routing image reads through a `powershell.exe` bridge when WSL interop is detected, since `arboard` returns `ContentNotAvailable` under WSLg ([#1280](https://github.com/can1357/oh-my-pi/issues/1280))
 ## [15.2.4] - 2026-05-22
 ### Breaking Changes
@@ -114,6 +126,10 @@
 - Fixed streaming edit previews for `apply_patch` and `hashline` jittering as the model typed `+added` lines. Two root causes addressed: (1) the trailing partial line of the streaming text input is now trimmed at each tick so a half-typed `+added` line no longer flickers; (2) the preview is rendered in the model's input order during streaming instead of re-deriving a unified diff via `Diff.structuredPatch`, whose coalescing previously reshuffled existing `+added` lines downward each time a new `-removed` line arrived. Existing additions now stay put and the preview only grows at the bottom while streaming. A residual trailing `-removed`/hunk-header block whose matching `+added` companion has not yet arrived is also suppressed until the additions land.
 - Fixed Perplexity web search appearing "logged out" roughly an hour after `omp auth login perplexity`. The search provider's `findOAuthToken` was honoring the bogus `expires = login_time + 1h` written by older logins (Perplexity JWTs typically omit `exp` because sessions are server-side) and silently dropping the credential. The loader now decodes the JWT's `exp` claim directly and only skips when the JWT itself is expired; tokens without an `exp` claim are treated as non-expiring.
+### Fixed
+- Fixed `legacy-pi-compat` failing to load plugin extensions (e.g. `pi-schedule-prompt@0.3.0`) that import `@mariozechner/pi-ai` when running from a compiled binary. `getResolvedSpecifier` called `Bun.resolveSync` against `import.meta.dir` inside `/$bunfs/root`, where the virtual FS exposes no resolvable `node_modules` tree at runtime; the throw silently dropped the plugin. The fix lets `rewriteLegacyPiImports` fall back gracefully on resolution failure so that `rewriteBareImportsForLegacyExtension` — which already runs immediately after — can resolve the original specifier against the plugin's own installed peer deps instead. The same fallback is applied to `resolveLegacyPiSpecifier` (the Bun plugin shim's `onResolve` handler) for tool/hook files loaded directly via Bun's import system. ([#1215](https://github.com/can1357/oh-my-pi/issues/1215))
 ## [15.1.7] - 2026-05-19
 ### Fixed
@@ -122,6 +138,9 @@
 - Fixed hashline edit payloads that use a readability space after `~` by warning on separator-padding-shaped payload blocks and tightening the model prompt. ([#1166](https://github.com/can1357/oh-my-pi/issues/1166))
 - Fixed ACP bash permission requests to include execute tool metadata and command content so clients can render command approval prompts consistently. ([#1189](https://github.com/can1357/oh-my-pi/issues/1189))
 - Fixed the status-line fast-mode indicator (`⚡`) rendering for scoped service tiers (`openai-only`, `claude-only`) even when the active model's provider didn't realize them — e.g. `serviceTier: "openai-only"` would still show the indicator next to a Claude model the wire request couldn't apply fast mode to. The indicator now consults a new `AgentSession.isFastModeActive()` predicate that runs the configured tier through `resolveServiceTier(tier, model.provider)` and only lights up when the result is `"priority"` for the current model. `isFastModeEnabled()` keeps its scope-aware semantics so `/fast on|off|toggle` and `/fast status` continue to reflect the user's configured intent.
+### Fixed
+- Fixed status-line context% computation freezing the UI for ~1.1 s every 2 s on long sessions (2,000+ messages). The earlier alignment fix (which uses `computeContextBreakdown` to match the `/context` slash command) was running on every agent event via `updateEditorTopBorder()` (event-controller.ts:163), and `computeContextBreakdown` walks every message through the native `countTokens` tokenizer (~0.5 ms each) — for the user's 2,312-message session this was ~1,120 ms synchronous blocking per cache miss, producing the user-visible "jittery rendering" and "status bar disappearing during streaming". `StatusLineComponent.getCachedContextBreakdown()` now uses an incremental per-message token cache: messages are walked ONCE during warm-up, and subsequent refreshes only compute tokens for the NEW messages appended since last call (typically 0–1 per refresh during streaming). The LAST message is always recomputed because its content may still be growing mid-stream; all prior messages are immutable once a newer message exists. Compaction (messages array shrinks) resets the cache. Non-message tokens (system prompt + tools + skills) are cached separately and invalidated via a cheap identity fingerprint. Result: 2,300-message warm refresh drops from ~1,120 ms to ~0.04 ms — 28,000× faster. Functional parity with the prior `computeContextBreakdown` path is preserved.
 ### Added
@@ -156,6 +175,7 @@
 - Fixed `deferAgentInitiatedTurns` handling during ACP async-job draining so background completion follow-up turns are delivered even when agent-initiated turns are deferred
 - Fixed ACP ordinary file-editing calls (`edit`, `write`, `ast_edit`) incorrectly requesting `session/request_permission` before every call, while keeping permission prompts for edit operations that delete or move files; permission requests now report the gated tool call as `pending` so clients can render the approval UI instead of returning `Permission request cancelled` without a visible prompt. ([#1134](https://github.com/can1357/oh-my-pi/pull/1134) by [@jiwangyihao](https://github.com/jiwangyihao))
 - Fixed the session tree selector to preserve a readable message column when deeply nested branch gutters would otherwise consume the viewport. ([#1144](https://github.com/can1357/oh-my-pi/issues/1144))
+- Fixed the TUI model selector to keep provider tab labels separate from provider ids, so the human-readable Ollama Cloud tab refreshes and filters `ollama-cloud` models correctly. ([#1153](https://github.com/can1357/oh-my-pi/issues/1153))
 ## [15.1.3] - 2026-05-17
 ### Breaking Changes

package/dist/types/config/model-registry.d.ts CHANGED Viewed

@@ -213,6 +213,32 @@ export declare const ModelsConfigFile: ConfigFile<{
         exclude?: string[] | undefined;
     } | undefined;
 }>;
+/** Provider override config (baseUrl, headers, apiKey, compat, transport) without custom models */
+interface ProviderOverride {
+    baseUrl?: string;
+    headers?: Record<string, string>;
+    apiKey?: string;
+    authHeader?: boolean;
+    compat?: Model<Api>["compat"];
+    transport?: Model<Api>["transport"];
+}
+/**
+ * Merge a freshly discovered model with the matching bundled/configured entry
+ * (or a runtime provider override when no bundled entry exists).
+ *
+ * `baseUrl` resolution priority:
+ *   1. User-set `providerOverride.baseUrl` (explicit override in models.json)
+ *   2. Discovered baseUrl (xiaomi `tp-` token-plan keys resolve to
+ *      `token-plan-sgp.xiaomimimo.com` at discovery time)
+ *   3. Existing bundled baseUrl (the host baked into `models.json`)
+ *
+ * Without (1), the user's override would lose to discovery; without (2)
+ * preferred over (3), the bundled `api.xiaomimimo.com` would shadow the
+ * tp- token-plan host and produce 401s on the first stream call.
+ * See `xiaomi-tp-discovery-merge.test.ts` and the `refresh()` baseUrl-override
+ * regression in `model-registry.test.ts`.
+ */
+export declare function mergeDiscoveredModel<TApi extends Api>(model: Model<TApi>, existing: Model<Api> | undefined, providerOverride?: Pick<ProviderOverride, "baseUrl" | "headers" | "transport">): Model<TApi>;
 export type ProviderDiscoveryStatus = "idle" | "ok" | "empty" | "cached" | "unavailable" | "unauthenticated";
 export interface ProviderDiscoveryState {
     provider: string;

package/dist/types/config/settings-schema.d.ts CHANGED Viewed

@@ -23,7 +23,7 @@ export declare const TAB_METADATA: Record<SettingTab, {
     icon: `tab.${string}`;
 }>;
 /** Status line segment identifiers */
-export type StatusLineSegmentId = "pi" | "model" | "mode" | "path" | "git" | "pr" | "subagents" | "token_in" | "token_out" | "token_total" | "token_rate" | "cost" | "context_pct" | "context_total" | "time_spent" | "time" | "session" | "hostname" | "cache_read" | "cache_write" | "session_name";
+export type StatusLineSegmentId = "pi" | "model" | "mode" | "path" | "git" | "pr" | "subagents" | "token_in" | "token_out" | "token_total" | "token_rate" | "cost" | "context_pct" | "context_total" | "time_spent" | "time" | "session" | "hostname" | "cache_read" | "cache_write" | "session_name" | "usage";
 /** Submenu choice metadata. */
 export type SubmenuOption<V extends string = string> = {
     value: V;
@@ -991,6 +991,15 @@ export declare const SETTINGS_SCHEMA: {
         readonly type: "number";
         readonly default: 2000;
     };
+    readonly "retry.maxDelayMs": {
+        readonly type: "number";
+        readonly default: number;
+        readonly ui: {
+            readonly tab: "model";
+            readonly label: "Max Retry Delay";
+            readonly description: "Maximum wait between retries, in ms. When the provider asks us to wait longer than this and no credential or model fallback succeeds, the request fails fast instead of sleeping (e.g. 3-hour Anthropic rate-limit windows).";
+        };
+    };
     readonly "retry.fallbackChains": {
         readonly type: "record";
         readonly default: Record<string, string[]>;
@@ -3075,6 +3084,29 @@ export declare const SETTINGS_SCHEMA: {
             readonly description: "Use Parallel extract API for URL fetching when credentials are available";
         };
     };
+    readonly "provider.appendOnlyContext": {
+        readonly type: "enum";
+        readonly values: readonly ["auto", "on", "off"];
+        readonly default: "auto";
+        readonly ui: {
+            readonly tab: "providers";
+            readonly label: "Append-Only Context";
+            readonly description: "Cache system prompt + tool specs and keep an append-only message log so provider prefix caches (DeepSeek, Anthropic) hit at maximum rate. Auto enables for DeepSeek.";
+            readonly options: readonly [{
+                readonly value: "auto";
+                readonly label: "Auto";
+                readonly description: "Enable for DeepSeek (recommended)";
+            }, {
+                readonly value: "on";
+                readonly label: "On";
+                readonly description: "Always enable append-only context";
+            }, {
+                readonly value: "off";
+                readonly label: "Off";
+                readonly description: "Disable append-only context";
+            }];
+        };
+    };
     readonly "exa.enabled": {
         readonly type: "boolean";
         readonly default: true;
@@ -3283,6 +3315,7 @@ export interface RetrySettings {
     enabled: boolean;
     maxRetries: number;
     baseDelayMs: number;
+    maxDelayMs: number;
 }
 export interface MemoriesSettings {
     enabled: boolean;

package/dist/types/config/settings.d.ts CHANGED Viewed

@@ -113,6 +113,12 @@ export declare class Settings {
      */
     setDisabledProviders(ids: string[]): void;
 }
+/**
+ * Subscribe to append-only mode setting changes.
+ * Returns an unsubscribe function. Multiple sessions (main + subagents)
+ * can register independently without overwriting each other.
+ */
+export declare function onAppendOnlyModeChanged(cb: (value: string) => void): () => void;
 export declare function isSettingsInitialized(): boolean;
 /**
  * Reset the global singleton for testing.

package/dist/types/discovery/helpers.d.ts CHANGED Viewed

@@ -101,6 +101,7 @@ export interface ParsedAgentFields {
     model?: string[];
     output?: unknown;
     thinkingLevel?: ThinkingLevel;
+    autoloadSkills?: string[];
     blocking?: boolean;
 }
 /**

package/dist/types/goals/runtime.d.ts CHANGED Viewed

@@ -54,6 +54,10 @@ export declare class GoalRuntime {
         objective: string;
         tokenBudget?: number;
     }): Promise<GoalModeState>;
+    replaceGoal(input: {
+        objective: string;
+        tokenBudget?: number;
+    }): Promise<GoalModeState>;
     resumeGoal(): Promise<GoalModeState>;
     pauseGoal(): Promise<GoalModeState | undefined>;
     dropGoal(): Promise<Goal | undefined>;

package/dist/types/modes/components/status-line/types.d.ts CHANGED Viewed

@@ -44,6 +44,16 @@ export interface SegmentContext {
             url: string;
         } | null;
     };
+    usage: {
+        fiveHour?: {
+            percent: number;
+            resetMinutes?: number;
+        };
+        sevenDay?: {
+            percent: number;
+            resetHours?: number;
+        };
+    } | null;
 }
 export interface RenderedSegment {
     content: string;

package/dist/types/modes/components/status-line.d.ts CHANGED Viewed

@@ -53,6 +53,22 @@ export declare class StatusLineComponent implements Component {
     watchBranch(onBranchChange: () => void): void;
     dispose(): void;
     invalidate(): void;
+    /**
+     * Background-refresh the Anthropic OAuth quota report. Guarded by a 5-min
+     * TTL on both success (cache lifetime) and error (backoff). Exposed
+     * (non-private) so unit tests can verify the backoff invariant.
+     */
+    refreshUsageInBackground(): void;
+    /**
+     * Compute the (cached) used-tokens / context-window totals for the
+     * status-line context% segment. Exposed (non-private) so unit tests can
+     * verify the incremental-cache invariants; not part of any external
+     * API.
+     */
+    getCachedContextBreakdown(): {
+        usedTokens: number;
+        contextWindow: number;
+    };
     getTopBorder(width: number): {
         content: string;
         width: number;

package/dist/types/modes/interactive-mode.d.ts CHANGED Viewed

@@ -171,7 +171,9 @@ export declare class InteractiveMode implements InteractiveModeContext {
         updateFooter?: boolean;
         populateHistory?: boolean;
     }): void;
-    renderInitialMessages(prebuiltContext?: SessionContext): void;
+    renderInitialMessages(prebuiltContext?: SessionContext, options?: {
+        preserveExistingChat?: boolean;
+    }): void;
     getUserMessageText(message: Message): string;
     findLastAssistantMessage(): AssistantMessage | undefined;
     extractAssistantText(message: AssistantMessage): string;

package/dist/types/modes/types.d.ts CHANGED Viewed

@@ -168,7 +168,9 @@ export interface InteractiveModeContext {
         updateFooter?: boolean;
         populateHistory?: boolean;
     }): void;
-    renderInitialMessages(prebuiltContext?: SessionContext): void;
+    renderInitialMessages(prebuiltContext?: SessionContext, options?: {
+        preserveExistingChat?: boolean;
+    }): void;
     getUserMessageText(message: Message): string;
     findLastAssistantMessage(): AssistantMessage | undefined;
     extractAssistantText(message: AssistantMessage): string;

package/dist/types/modes/utils/context-usage.d.ts CHANGED Viewed

@@ -1,5 +1,7 @@
 import type { Model } from "@oh-my-pi/pi-ai";
+import type { Skill } from "../../extensibility/skills";
 import type { AgentSession } from "../../session/agent-session";
+import type { Tool } from "../../tools";
 import type { theme as Theme } from "../theme/theme";
 type CategoryId = "systemPrompt" | "systemContext" | "systemTools" | "skills" | "messages";
 interface CategoryInfo {
@@ -17,6 +19,21 @@ export interface ContextBreakdown {
     autoCompactBufferTokens: number;
     freeTokens: number;
 }
+export declare function estimateSkillsTokens(skills: readonly Skill[]): number;
+export declare function estimateToolSchemaTokens(tools: ReadonlyArray<Pick<Tool, "name" | "description" | "parameters">>): number;
+/**
+ * Compute just the NON-MESSAGE token total: system prompt (with its skills
+ * section subtracted, since skills are tokenized separately) + system context
+ * (the rest of the system-prompt array) + tools + skills.
+ *
+ * Exposed so callers like `StatusLineComponent` can cache the non-message
+ * total separately from the message total. Non-message inputs (skills,
+ * tools, system prompt) change rarely; the message list grows on every
+ * streaming turn. Splitting the two lets the caller refresh each on its own
+ * cadence — non-message recomputed only when the inputs identity changes,
+ * messages walked incrementally as new entries append.
+ */
+export declare function computeNonMessageTokens(session: AgentSession): number;
 /**
  * Compute a breakdown of estimated context usage by category for the active
  * session and model.

package/dist/types/modes/utils/ui-helpers.d.ts CHANGED Viewed

@@ -3,6 +3,9 @@ import type { AssistantMessage, Message } from "@oh-my-pi/pi-ai";
 import { type Component } from "@oh-my-pi/pi-tui";
 import type { InteractiveModeContext } from "../../modes/types";
 import type { SessionContext } from "../../session/session-manager";
+interface RenderInitialMessagesOptions {
+    preserveExistingChat?: boolean;
+}
 export declare class UiHelpers {
     #private;
     private ctx;
@@ -31,7 +34,7 @@ export declare class UiHelpers {
         updateFooter?: boolean;
         populateHistory?: boolean;
     }): void;
-    renderInitialMessages(prebuiltContext?: SessionContext): void;
+    renderInitialMessages(prebuiltContext?: SessionContext, options?: RenderInitialMessagesOptions): void;
     clearEditor(): void;
     showError(errorMessage: string): void;
     showWarning(warningMessage: string): void;
@@ -47,3 +50,4 @@ export declare class UiHelpers {
     findLastAssistantMessage(): AssistantMessage | undefined;
     extractAssistantText(message: AssistantMessage): string;
 }
+export {};

package/dist/types/session/agent-session.d.ts CHANGED Viewed

@@ -417,6 +417,15 @@ export declare class AgentSession {
     refreshRpcHostTools(rpcTools: AgentTool[]): Promise<void>;
     /** Whether auto-compaction is currently running */
     get isCompacting(): boolean;
+    /**
+     * Whether idle-flush tasks, auto-continuations, or other short-lived
+     * post-prompt work are pending.  True in the brief window after
+     * `session.prompt()` returns but before a scheduled background delivery
+     * (e.g. an async-job result) has finished its own streaming turn.
+     * Loop-mode and similar auto-submit paths should treat this as a block
+     * to avoid racing against the delivery turn.
+     */
+    get hasPostPromptWork(): boolean;
     /** All messages including custom types like BashExecutionMessage */
     get messages(): AgentMessage[];
     buildDisplaySessionContext(): SessionContext;

package/dist/types/session/session-manager.d.ts CHANGED Viewed

@@ -214,6 +214,16 @@ declare class RecentSessionInfo {
     /** Human-readable relative time (e.g., "2 hours ago") */
     get timeAgo(): string;
 }
+/**
+ * Promote orphaned `<basename>.jsonl.<snowflake>.bak` backups created by
+ * `#replaceSessionFileAfterEperm` back to their primary path when the primary
+ * is missing. This runs once per session-dir scan, before the main `*.jsonl`
+ * glob, so a crash between the two renames in the EPERM-rewrite path does not
+ * leave the user's last good state stranded outside the loader's view.
+ *
+ * Exported for testing.
+ */
+export declare function recoverOrphanedBackups(sessionDir: string, storage: SessionStorage): Promise<void>;
 /** Exported for testing */
 export declare function findMostRecentSession(sessionDir: string, storage?: SessionStorage): Promise<string | null>;
 /** Get recent sessions for display in welcome screen */

package/dist/types/task/executor.d.ts CHANGED Viewed

@@ -7,7 +7,7 @@ import type { AgentTelemetryConfig, ThinkingLevel } from "@oh-my-pi/pi-agent-cor
 import { ModelRegistry } from "../config/model-registry";
 import type { PromptTemplate } from "../config/prompt-templates";
 import { Settings } from "../config/settings";
-import type { Skill } from "../extensibility/skills";
+import { type Skill } from "../extensibility/skills";
 import type { HindsightSessionState } from "../hindsight/state";
 import type { LocalProtocolOptions } from "../internal-urls";
 import type { MCPManager } from "../mcp/manager";
@@ -73,6 +73,8 @@ export interface ExecutorOptions {
      * transition explicitly.
      */
     parentTelemetry?: AgentTelemetryConfig;
+    /** Skills to autoload via sendCustomMessage before the first prompt */
+    autoloadSkills?: Skill[];
 }
 export interface YieldItem {
     data?: unknown;

package/dist/types/task/types.d.ts CHANGED Viewed

@@ -148,6 +148,7 @@ export interface AgentDefinition {
     thinkingLevel?: ThinkingLevel;
     output?: unknown;
     blocking?: boolean;
+    autoloadSkills?: string[];
     source: AgentSource;
     filePath?: string;
 }
@@ -189,6 +190,30 @@ export interface AgentProgress {
     modelOverride?: string | string[];
     /** Data extracted by registered subprocess tool handlers (keyed by tool name) */
     extractedToolData?: Record<string, unknown[]>;
+    /**
+     * Auto-retry state when the subagent is sleeping between provider retries
+     * (e.g. 429 rate-limit with retry-after). Cleared when the retry resolves
+     * or fails. Surfacing this to the parent prevents the task tool from
+     * looking indefinitely "in progress" when a child is actually blocked on
+     * provider quota.
+     */
+    retryState?: {
+        attempt: number;
+        maxAttempts: number;
+        delayMs: number;
+        errorMessage: string;
+        startedAtMs: number;
+    };
+    /**
+     * Terminal retry failure surfaced once the subagent gave up retrying
+     * (e.g. retry-after exceeded the cap, or all attempts exhausted). Carries
+     * the final error so the parent UI can render "blocked: rate-limited"
+     * instead of waiting for a status that never arrives.
+     */
+    retryFailure?: {
+        attempt: number;
+        errorMessage: string;
+    };
 }
 /** Result from a single agent execution */
 export interface SingleResult {
@@ -227,6 +252,16 @@ export interface SingleResult {
     nestedPatches?: NestedRepoPatch[];
     /** Data extracted by registered subprocess tool handlers (keyed by tool name) */
     extractedToolData?: Record<string, unknown[]>;
+    /**
+     * Terminal retry failure, when the subagent exited because the auto-retry
+     * loop gave up (retry-after exceeded the cap, or all attempts exhausted).
+     * Lets the parent task tool surface a "blocked: rate-limited" outcome
+     * instead of a generic failure.
+     */
+    retryFailure?: {
+        attempt: number;
+        errorMessage: string;
+    };
     /** Output metadata for agent:// URL integration */
     outputMeta?: {
         lineCount: number;

package/dist/types/tools/bash-command-fixup.d.ts CHANGED Viewed

@@ -9,8 +9,3 @@ export interface BashFixupResult {
  * or no-op transform, returns the input verbatim with `stripped: []`.
  */
 export declare function applyBashFixups(command: string): BashFixupResult;
-/**
- * Human-readable notice for the fixups that fired. Mirrors the shape of
- * `formatTimeoutClampNotice` so it can ride alongside the other bash notices.
- */
-export declare function formatBashFixupNotice(stripped: readonly string[]): string | undefined;

package/dist/types/utils/clipboard.d.ts CHANGED Viewed

@@ -13,7 +13,9 @@ export declare function copyToClipboard(text: string): Promise<void>;
  * Read an image from the system clipboard.
  *
  * Returns null on Termux (no image clipboard support) or when no display
- * server is available (headless/SSH without forwarding).
+ * server is available (headless/SSH without forwarding). Under WSL the
+ * Windows clipboard is reached through `powershell.exe`, since WSLg's
+ * Wayland clipboard does not carry image payloads through to `arboard`.
  *
  * @returns PNG payload or null when no image is available.
  */

package/dist/types/utils/image-resize.d.ts CHANGED Viewed

@@ -4,6 +4,7 @@ export interface ImageResizeOptions {
     maxHeight?: number;
     maxBytes?: number;
     jpegQuality?: number;
+    excludeWebP?: boolean;
 }
 export interface ResizedImage {
     buffer: Uint8Array;
@@ -20,11 +21,13 @@ export interface ResizedImage {
  *
  * Strategy:
  *  1. Probe metadata. If already within all limits, return original.
- *  2. Resize to fit max dimensions and encode at high quality across PNG/JPEG/WebP — return smallest.
+ *  2. Resize to fit max dimensions and encode at high quality across PNG/JPEG (+ WebP) — return smallest.
  *  3. If still too large, walk a lossy JPEG/WebP quality ladder.
  *  4. If still too large, walk a dimension-scale ladder × quality ladder.
  *  5. If still too large, return the smallest variant produced.
  *
+ * Set OMP_NO_WEBP to exclude WebP from encoding (llama.cpp STB doesn't decode it).
+ *
  * Backed by `Bun.Image`: a chainable native pipeline that runs decode/transform/encode
  * off the JS thread when the terminal (`.bytes()`) is awaited.
  */

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
 	"type": "module",
 	"name": "@oh-my-pi/pi-coding-agent",
-	"version": "15.2.4",
+	"version": "15.3.1",
 	"description": "Coding agent CLI with read, bash, edit, write tools and session management",
 	"homepage": "https://omp.sh",
 	"author": "Can Boluk",
@@ -47,12 +47,12 @@
 		"@agentclientprotocol/sdk": "0.21.0",
 		"@babel/parser": "^7.29.3",
 		"@mozilla/readability": "^0.6.0",
-		"@oh-my-pi/omp-stats": "15.2.4",
-		"@oh-my-pi/pi-agent-core": "15.2.4",
-		"@oh-my-pi/pi-ai": "15.2.4",
-		"@oh-my-pi/pi-natives": "15.2.4",
-		"@oh-my-pi/pi-tui": "15.2.4",
-		"@oh-my-pi/pi-utils": "15.2.4",
+		"@oh-my-pi/omp-stats": "15.3.1",
+		"@oh-my-pi/pi-agent-core": "15.3.1",
+		"@oh-my-pi/pi-ai": "15.3.1",
+		"@oh-my-pi/pi-natives": "15.3.1",
+		"@oh-my-pi/pi-tui": "15.3.1",
+		"@oh-my-pi/pi-utils": "15.3.1",
 		"@puppeteer/browsers": "^2.13.0",
 		"@types/turndown": "5.0.6",
 		"@xterm/headless": "^6.0.0",

package/src/config/model-registry.ts CHANGED Viewed

@@ -252,6 +252,45 @@ interface ProviderOverride {
 	transport?: Model<Api>["transport"];
 }
+/**
+ * Merge a freshly discovered model with the matching bundled/configured entry
+ * (or a runtime provider override when no bundled entry exists).
+ *
+ * `baseUrl` resolution priority:
+ *   1. User-set `providerOverride.baseUrl` (explicit override in models.json)
+ *   2. Discovered baseUrl (xiaomi `tp-` token-plan keys resolve to
+ *      `token-plan-sgp.xiaomimimo.com` at discovery time)
+ *   3. Existing bundled baseUrl (the host baked into `models.json`)
+ *
+ * Without (1), the user's override would lose to discovery; without (2)
+ * preferred over (3), the bundled `api.xiaomimimo.com` would shadow the
+ * tp- token-plan host and produce 401s on the first stream call.
+ * See `xiaomi-tp-discovery-merge.test.ts` and the `refresh()` baseUrl-override
+ * regression in `model-registry.test.ts`.
+ */
+export function mergeDiscoveredModel<TApi extends Api>(
+	model: Model<TApi>,
+	existing: Model<Api> | undefined,
+	providerOverride?: Pick<ProviderOverride, "baseUrl" | "headers" | "transport">,
+): Model<TApi> {
+	if (existing) {
+		return {
+			...model,
+			baseUrl: providerOverride?.baseUrl ?? model.baseUrl ?? existing.baseUrl,
+			headers: existing.headers ? { ...existing.headers, ...model.headers } : model.headers,
+		};
+	}
+	if (providerOverride) {
+		return {
+			...model,
+			baseUrl: providerOverride.baseUrl ?? model.baseUrl,
+			headers: providerOverride.headers ? { ...model.headers, ...providerOverride.headers } : model.headers,
+			...(providerOverride.transport !== undefined ? { transport: providerOverride.transport } : {}),
+		};
+	}
+	return model;
+}
 interface DiscoveryProviderConfig {
 	provider: string;
 	api: Api;
@@ -1182,27 +1221,13 @@ export class ModelRegistry {
 			return;
 		}
 		const discoveredModels = this.#applyHardcodedModelPolicies(
-			discovered.map(model => {
-				const existing = this.find(model.provider, model.id);
-				if (existing) {
-					return {
-						...model,
-						baseUrl: existing.baseUrl,
-						headers: existing.headers ? { ...existing.headers, ...model.headers } : model.headers,
-					};
-				}
-				const providerOverride = this.#providerOverrides.get(model.provider);
-				return providerOverride
-					? {
-							...model,
-							baseUrl: providerOverride.baseUrl ?? model.baseUrl,
-							headers: providerOverride.headers
-								? { ...model.headers, ...providerOverride.headers }
-								: model.headers,
-							...(providerOverride.transport !== undefined ? { transport: providerOverride.transport } : {}),
-						}
-					: model;
-			}),
+			discovered.map(model =>
+				mergeDiscoveredModel(
+					model,
+					this.find(model.provider, model.id),
+					this.#providerOverrides.get(model.provider),
+				),
+			),
 		);
 		const resolved = this.#mergeResolvedModels(this.#models, discoveredModels);
 		const withConfigModels = this.#mergeCustomModels(resolved, this.#customModelOverlays);

package/src/config/settings-schema.ts CHANGED Viewed

@@ -81,7 +81,8 @@ export type StatusLineSegmentId =
 	| "hostname"
 	| "cache_read"
 	| "cache_write"
-	| "session_name";
+	| "session_name"
+	| "usage";
 /** Submenu choice metadata. */
 export type SubmenuOption<V extends string = string> = {
@@ -836,6 +837,16 @@ export const SETTINGS_SCHEMA = {
 	},
 	"retry.baseDelayMs": { type: "number", default: 2000 },
+	"retry.maxDelayMs": {
+		type: "number",
+		default: 5 * 60 * 1000,
+		ui: {
+			tab: "model",
+			label: "Max Retry Delay",
+			description:
+				"Maximum wait between retries, in ms. When the provider asks us to wait longer than this and no credential or model fallback succeeds, the request fails fast instead of sleeping (e.g. 3-hour Anthropic rate-limit windows).",
+		},
+	},
 	"retry.fallbackChains": { type: "record", default: {} as Record<string, string[]> },
 	"retry.fallbackRevertPolicy": {
 		type: "enum",
@@ -2612,6 +2623,22 @@ export const SETTINGS_SCHEMA = {
 			description: "Use Parallel extract API for URL fetching when credentials are available",
 		},
 	},
+	"provider.appendOnlyContext": {
+		type: "enum",
+		values: ["auto", "on", "off"] as const,
+		default: "auto",
+		ui: {
+			tab: "providers",
+			label: "Append-Only Context",
+			description:
+				"Cache system prompt + tool specs and keep an append-only message log so provider prefix caches (DeepSeek, Anthropic) hit at maximum rate. Auto enables for DeepSeek.",
+			options: [
+				{ value: "auto", label: "Auto", description: "Enable for DeepSeek (recommended)" },
+				{ value: "on", label: "On", description: "Always enable append-only context" },
+				{ value: "off", label: "Off", description: "Disable append-only context" },
+			],
+		},
+	},
 	// Exa
 	"exa.enabled": {
@@ -2843,6 +2870,7 @@ export interface RetrySettings {
 	enabled: boolean;
 	maxRetries: number;
 	baseDelayMs: number;
+	maxDelayMs: number;
 }
 export interface MemoriesSettings {