@oh-my-pi/pi-coding-agent 13.9.2 → 13.9.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (53)
  1. package/CHANGELOG.md +64 -0
  2. package/examples/sdk/02-custom-model.ts +2 -1
  3. package/package.json +7 -7
  4. package/src/cli/args.ts +10 -6
  5. package/src/cli/list-models.ts +2 -2
  6. package/src/commands/launch.ts +3 -3
  7. package/src/config/model-registry.ts +136 -38
  8. package/src/config/model-resolver.ts +47 -21
  9. package/src/config/settings-schema.ts +56 -2
  10. package/src/discovery/helpers.ts +3 -3
  11. package/src/extensibility/custom-tools/types.ts +2 -0
  12. package/src/extensibility/extensions/loader.ts +3 -2
  13. package/src/extensibility/extensions/types.ts +10 -7
  14. package/src/extensibility/hooks/types.ts +2 -0
  15. package/src/main.ts +5 -22
  16. package/src/memories/index.ts +7 -3
  17. package/src/modes/components/footer.ts +10 -8
  18. package/src/modes/components/model-selector.ts +33 -38
  19. package/src/modes/components/settings-defs.ts +32 -3
  20. package/src/modes/components/settings-selector.ts +16 -5
  21. package/src/modes/components/status-line/context-thresholds.ts +68 -0
  22. package/src/modes/components/status-line/segments.ts +11 -12
  23. package/src/modes/components/status-line.ts +2 -6
  24. package/src/modes/components/thinking-selector.ts +7 -7
  25. package/src/modes/components/tree-selector.ts +3 -2
  26. package/src/modes/controllers/command-controller.ts +11 -26
  27. package/src/modes/controllers/event-controller.ts +16 -3
  28. package/src/modes/controllers/input-controller.ts +4 -2
  29. package/src/modes/controllers/selector-controller.ts +5 -4
  30. package/src/modes/interactive-mode.ts +2 -2
  31. package/src/modes/rpc/rpc-client.ts +5 -10
  32. package/src/modes/rpc/rpc-types.ts +5 -5
  33. package/src/modes/theme/theme.ts +8 -3
  34. package/src/priority.json +1 -0
  35. package/src/prompts/system/auto-handoff-threshold-focus.md +1 -0
  36. package/src/prompts/system/system-prompt.md +18 -2
  37. package/src/prompts/tools/hashline.md +139 -83
  38. package/src/sdk.ts +24 -16
  39. package/src/session/agent-session.ts +261 -118
  40. package/src/session/agent-storage.ts +14 -14
  41. package/src/session/compaction/compaction.ts +500 -13
  42. package/src/session/messages.ts +12 -1
  43. package/src/session/session-manager.ts +77 -19
  44. package/src/slash-commands/builtin-registry.ts +48 -0
  45. package/src/task/agents.ts +3 -2
  46. package/src/task/executor.ts +2 -2
  47. package/src/task/types.ts +2 -1
  48. package/src/thinking.ts +87 -0
  49. package/src/tools/browser.ts +15 -6
  50. package/src/tools/fetch.ts +118 -100
  51. package/src/tools/index.ts +2 -1
  52. package/src/web/kagi.ts +62 -7
  53. package/src/web/search/providers/exa.ts +74 -3
package/CHANGELOG.md CHANGED
@@ -2,6 +2,70 @@
2
2
 
3
3
  ## [Unreleased]
4
4
 
5
+ ## [13.9.4] - 2026-03-07
6
+ ### Added
7
+
8
+ - Automatic detection of Ollama model capabilities including reasoning/thinking support and vision input via the `/api/show` endpoint
9
+ - Improved Kagi API error handling with extraction of detailed error messages from JSON and plain text responses
10
+
11
+ ### Changed
12
+
13
+ - Updated Kagi provider description to clarify requirement for Kagi Search API beta access
14
+
15
+ ## [13.9.3] - 2026-03-07
16
+
17
+ ### Breaking Changes
18
+
19
+ - Changed `ThinkingLevel` type to be imported from `@oh-my-pi/pi-agent-core` instead of `@oh-my-pi/pi-ai`
20
+ - Changed thinking level representation from string literals to `Effort` enum values (e.g., `Effort.High` instead of `"high"`)
21
+ - Changed `getThinkingLevel()` return type to `ThinkingLevel | undefined` to support models without thinking capability
22
+ - Changed model `reasoning` property to `thinking` property with `ThinkingConfig` for explicit effort level configuration
23
+ - Changed `thinkingLevel` in session context to be optional (`ThinkingLevel | undefined`) instead of always present
24
+
25
+ ### Added
26
+
27
+ - Added `thinking.ts` module with `getThinkingLevelMetadata()` and `resolveThinkingLevelForModel()` utilities for thinking level handling
28
+ - Added `ThinkingConfig` support to model definitions for specifying supported thinking effort levels per model
29
+ - Added `enrichModelThinking()` function to apply thinking configuration to models during registry initialization
30
+ - Added `clampThinkingLevelForModel()` function to constrain thinking levels to model-supported ranges
31
+ - Added `getSupportedEfforts()` function to retrieve available thinking efforts for a model
32
+ - Added `Effort` enum import from `@oh-my-pi/pi-ai` for type-safe thinking level representation
33
+ - Added `/fast` slash command to toggle OpenAI service tier priority mode for faster response processing
34
+ - Added `serviceTier` setting to control OpenAI processing priority (none, auto, default, flex, scale, priority)
35
+ - Added `compaction.remoteEnabled` setting to control use of remote compaction endpoints
36
+ - Added remote compaction support for OpenAI and OpenAI Codex models with encrypted reasoning preservation
37
+ - Added fast mode indicator (⚡) to model segment in status line when priority service tier is active
38
+ - Added context usage threshold levels (normal, warning, purple, error) with token-aware thresholds for better context awareness
39
+ - Added `isFastModeEnabled()`, `setFastMode()`, and `toggleFastMode()` methods to AgentSession for fast mode control
40
+
41
+ ### Changed
42
+
43
+ - Changed credential deletion to disable credentials with persisted cause instead of permanent deletion
44
+ - Changed credential deletion methods to accept a `disabledCause` parameter that tracks the reason for disabling
45
+ - Changed thinking level parsing to use `parseEffort()` from local thinking module instead of `parseThinkingLevel()` from pi-ai
46
+ - Changed model list display to show supported thinking efforts (e.g., "low,medium,high") instead of yes/no reasoning indicator
47
+ - Changed footer and status line to check `model.thinking` instead of `model.reasoning` for thinking level display
48
+ - Changed thinking selector to work with `Effort` type instead of `ThinkingLevel` for available levels
49
+ - Changed model resolver to return `undefined` for thinking level instead of `"off"` when no thinking is specified
50
+ - Changed compaction reasoning parameters to use `Effort` enum values instead of string literals
51
+ - Changed RPC types to use `Effort` for cycling thinking levels and `ThinkingLevel | undefined` for session state
52
+ - Changed theme thinking border color function to accept both `ThinkingLevel` and `Effort` types
53
+ - Changed context usage coloring in footer and status line to use token-aware thresholds instead of fixed percentages
54
+ - Changed compaction to preserve OpenAI remote compaction state and encrypted reasoning across sessions
55
+ - Changed compaction to skip emitting kept messages when using OpenAI remote compaction with preserved history
56
+ - Changed session context to include `serviceTier` field for tracking active service tier across session branches
57
+ - Changed `compact()` function to accept `remoteInstructions` option for custom remote compaction prompts
58
+ - Changed model registry to apply hardcoded policies (gpt-5.4 context window) consistently across all model loading paths
59
+
60
+ ### Fixed
61
+
62
+ - Fixed OpenAI remote compaction to correctly append incremental responses instead of replacing entire history
63
+ - Fixed thinking level display logic in main.ts to correctly check for undefined instead of "off"
64
+ - Fixed model registry to preserve explicit thinking configuration on runtime-registered models
65
+ - Fixed usage limit reset time calculation to use absolute `resetsAt` timestamps instead of deprecated `resetInMs` field
66
+ - Fixed compaction summary messages so they are no longer automatically added to the chat during compaction (now handled by the session manager)
67
+ - Fixed Kagi web search errors to surface the provider's beta-access message and clarified that Kagi search requires Search API beta access
68
+
5
69
  ## [13.9.2] - 2026-03-05
6
70
 
7
71
  ### Added
@@ -3,6 +3,7 @@
3
3
  *
4
4
  * Shows how to select a specific model and thinking level.
5
5
  */
6
+ import { ThinkingLevel } from "@oh-my-pi/pi-agent-core";
6
7
  import { getModel } from "@oh-my-pi/pi-ai";
7
8
  import { createAgentSession, discoverAuthStorage, discoverModels } from "@oh-my-pi/pi-coding-agent";
8
9
 
@@ -32,7 +33,7 @@ console.log(
32
33
  if (available.length > 0) {
33
34
  const { session } = await createAgentSession({
34
35
  model: available[0],
35
- thinkingLevel: "medium", // off, low, medium, high
36
+ thinkingLevel: ThinkingLevel.Medium, // off, low, medium, high
36
37
  authStorage,
37
38
  modelRegistry,
38
39
  });
package/package.json CHANGED
@@ -1,7 +1,7 @@
1
1
  {
2
2
  "type": "module",
3
3
  "name": "@oh-my-pi/pi-coding-agent",
4
- "version": "13.9.2",
4
+ "version": "13.9.4",
5
5
  "description": "Coding agent CLI with read, bash, edit, write tools and session management",
6
6
  "homepage": "https://github.com/can1357/oh-my-pi",
7
7
  "author": "Can Boluk",
@@ -41,12 +41,12 @@
41
41
  },
42
42
  "dependencies": {
43
43
  "@mozilla/readability": "^0.6",
44
- "@oh-my-pi/omp-stats": "13.9.2",
45
- "@oh-my-pi/pi-agent-core": "13.9.2",
46
- "@oh-my-pi/pi-ai": "13.9.2",
47
- "@oh-my-pi/pi-natives": "13.9.2",
48
- "@oh-my-pi/pi-tui": "13.9.2",
49
- "@oh-my-pi/pi-utils": "13.9.2",
44
+ "@oh-my-pi/omp-stats": "13.9.4",
45
+ "@oh-my-pi/pi-agent-core": "13.9.4",
46
+ "@oh-my-pi/pi-ai": "13.9.4",
47
+ "@oh-my-pi/pi-natives": "13.9.4",
48
+ "@oh-my-pi/pi-tui": "13.9.4",
49
+ "@oh-my-pi/pi-utils": "13.9.4",
50
50
  "@sinclair/typebox": "^0.34",
51
51
  "@xterm/headless": "^6.0",
52
52
  "ajv": "^8.18",
package/src/cli/args.ts CHANGED
@@ -1,9 +1,10 @@
1
1
  /**
2
2
  * CLI argument parsing and help display
3
3
  */
4
- import { getAvailableThinkingLevels, parseThinkingLevel, type ThinkingLevel } from "@oh-my-pi/pi-ai";
4
+ import { type Effort, THINKING_EFFORTS } from "@oh-my-pi/pi-ai";
5
5
  import { APP_NAME, CONFIG_DIR_NAME, logger } from "@oh-my-pi/pi-utils";
6
6
  import chalk from "chalk";
7
+ import { parseEffort } from "../thinking";
7
8
  import { BUILTIN_TOOLS } from "../tools";
8
9
 
9
10
  export type Mode = "text" | "json" | "rpc";
@@ -19,7 +20,7 @@ export interface Args {
19
20
  apiKey?: string;
20
21
  systemPrompt?: string;
21
22
  appendSystemPrompt?: string;
22
- thinking?: ThinkingLevel;
23
+ thinking?: Effort;
23
24
  continue?: boolean;
24
25
  resume?: string | true;
25
26
  help?: boolean;
@@ -107,7 +108,10 @@ export function parseArgs(args: string[], extensionFlags?: Map<string, { type: "
107
108
  } else if (arg === "--no-pty") {
108
109
  result.noPty = true;
109
110
  } else if (arg === "--tools" && i + 1 < args.length) {
110
- const toolNames = args[++i].split(",").map(s => s.trim());
111
+ const toolNames = args[++i]
112
+ .split(",")
113
+ .map(s => s.trim().toLowerCase())
114
+ .filter(Boolean);
111
115
  const validTools: string[] = [];
112
116
  for (const name of toolNames) {
113
117
  if (name in BUILTIN_TOOLS) {
@@ -122,13 +126,13 @@ export function parseArgs(args: string[], extensionFlags?: Map<string, { type: "
122
126
  result.tools = validTools;
123
127
  } else if (arg === "--thinking" && i + 1 < args.length) {
124
128
  const rawThinking = args[++i];
125
- const thinking = parseThinkingLevel(rawThinking);
129
+ const thinking = parseEffort(rawThinking);
126
130
  if (thinking !== undefined) {
127
131
  result.thinking = thinking;
128
132
  } else {
129
133
  logger.warn("Invalid thinking level passed to --thinking", {
130
134
  level: rawThinking,
131
- validThinkingLevels: getAvailableThinkingLevels(),
135
+ validThinkingLevels: THINKING_EFFORTS,
132
136
  });
133
137
  }
134
138
  } else if (arg === "--print" || arg === "-p") {
@@ -207,7 +211,7 @@ export function getExtraHelpText(): string {
207
211
  MISTRAL_API_KEY - Mistral models
208
212
  ZAI_API_KEY - z.ai models (ZhipuAI/GLM)
209
213
  MINIMAX_API_KEY - MiniMax models
210
- OPENCODE_API_KEY - OpenCode models
214
+ OPENCODE_API_KEY - OpenCode Zen/OpenCode Go models
211
215
  CURSOR_ACCESS_TOKEN - Cursor AI models
212
216
  AI_GATEWAY_API_KEY - Vercel AI Gateway
213
217
 
@@ -1,7 +1,7 @@
1
1
  /**
2
2
  * List available models with optional fuzzy search
3
3
  */
4
- import type { Api, Model } from "@oh-my-pi/pi-ai";
4
+ import { type Api, getSupportedEfforts, type Model } from "@oh-my-pi/pi-ai";
5
5
  import { formatNumber } from "@oh-my-pi/pi-utils";
6
6
  import type { ModelRegistry } from "../config/model-registry";
7
7
  import { fuzzyFilter } from "../utils/fuzzy";
@@ -41,7 +41,7 @@ export async function listModels(modelRegistry: ModelRegistry, searchPattern?: s
41
41
  model: m.id,
42
42
  context: formatNumber(m.contextWindow),
43
43
  maxOut: formatNumber(m.maxTokens),
44
- thinking: m.reasoning ? "yes" : "no",
44
+ thinking: m.thinking ? getSupportedEfforts(m).join(",") : m.reasoning ? "yes" : "-",
45
45
  images: m.input.includes("image") ? "yes" : "no",
46
46
  }));
47
47
 
@@ -2,7 +2,7 @@
2
2
  * Root command for the coding agent CLI.
3
3
  */
4
4
 
5
- import { getAvailableThinkingLevels } from "@oh-my-pi/pi-ai";
5
+ import { THINKING_EFFORTS } from "@oh-my-pi/pi-ai";
6
6
  import { APP_NAME } from "@oh-my-pi/pi-utils";
7
7
  import { Args, Command, Flags } from "@oh-my-pi/pi-utils/cli";
8
8
  import { parseArgs } from "../cli/args";
@@ -86,8 +86,8 @@ export default class Index extends Command {
86
86
  description: "Comma-separated list of tools to enable (default: all)",
87
87
  }),
88
88
  thinking: Flags.string({
89
- description: `Set thinking level: ${getAvailableThinkingLevels().join(", ")}`,
90
- options: getAvailableThinkingLevels(),
89
+ description: `Set thinking level: ${THINKING_EFFORTS.join(", ")}`,
90
+ options: [...THINKING_EFFORTS],
91
91
  }),
92
92
  hook: Flags.string({
93
93
  description: "Load a hook/extension file (can be used multiple times)",
@@ -4,6 +4,7 @@ import {
4
4
  type Context,
5
5
  createModelManager,
6
6
  DEFAULT_LOCAL_TOKEN,
7
+ enrichModelThinking,
7
8
  getBundledModels,
8
9
  getBundledProviders,
9
10
  googleAntigravityModelManagerOptions,
@@ -18,10 +19,11 @@ import {
18
19
  registerCustomApi,
19
20
  registerOAuthProvider,
20
21
  type SimpleStreamOptions,
22
+ type ThinkingConfig,
21
23
  unregisterCustomApis,
22
24
  unregisterOAuthProviders,
23
25
  } from "@oh-my-pi/pi-ai";
24
- import { logger } from "@oh-my-pi/pi-utils";
26
+ import { isRecord, logger } from "@oh-my-pi/pi-utils";
25
27
  import { type Static, Type } from "@sinclair/typebox";
26
28
  import { type ConfigError, ConfigFile } from "../config";
27
29
  import type { ThemeColor } from "../modes/theme/theme";
@@ -72,6 +74,28 @@ const OpenAICompatSchema = Type.Object({
72
74
  vercelGatewayRouting: Type.Optional(VercelGatewayRoutingSchema),
73
75
  });
74
76
 
77
+ const EffortSchema = Type.Union([
78
+ Type.Literal("minimal"),
79
+ Type.Literal("low"),
80
+ Type.Literal("medium"),
81
+ Type.Literal("high"),
82
+ Type.Literal("xhigh"),
83
+ ]);
84
+
85
+ const ThinkingControlModeSchema = Type.Union([
86
+ Type.Literal("effort"),
87
+ Type.Literal("budget"),
88
+ Type.Literal("google-level"),
89
+ Type.Literal("anthropic-adaptive"),
90
+ Type.Literal("anthropic-budget-effort"),
91
+ ]);
92
+
93
+ const ModelThinkingSchema = Type.Object({
94
+ minLevel: EffortSchema,
95
+ maxLevel: EffortSchema,
96
+ mode: ThinkingControlModeSchema,
97
+ });
98
+
75
99
  // Schema for custom model definition
76
100
  // Most fields are optional with sensible defaults for local models (Ollama, LM Studio, etc.)
77
101
  const ModelDefinitionSchema = Type.Object({
@@ -88,7 +112,9 @@ const ModelDefinitionSchema = Type.Object({
88
112
  Type.Literal("google-vertex"),
89
113
  ]),
90
114
  ),
115
+ baseUrl: Type.Optional(Type.String({ minLength: 1 })),
91
116
  reasoning: Type.Optional(Type.Boolean()),
117
+ thinking: Type.Optional(ModelThinkingSchema),
92
118
  input: Type.Optional(Type.Array(Type.Union([Type.Literal("text"), Type.Literal("image")]))),
93
119
  cost: Type.Optional(
94
120
  Type.Object({
@@ -110,6 +136,7 @@ const ModelDefinitionSchema = Type.Object({
110
136
  const ModelOverrideSchema = Type.Object({
111
137
  name: Type.Optional(Type.String({ minLength: 1 })),
112
138
  reasoning: Type.Optional(Type.Boolean()),
139
+ thinking: Type.Optional(ModelThinkingSchema),
113
140
  input: Type.Optional(Type.Array(Type.Union([Type.Literal("text"), Type.Literal("image")]))),
114
141
  cost: Type.Optional(
115
142
  Type.Object({
@@ -375,6 +402,7 @@ function applyModelOverride(model: Model<Api>, override: ModelOverride): Model<A
375
402
  const result = { ...model };
376
403
  if (override.name !== undefined) result.name = override.name;
377
404
  if (override.reasoning !== undefined) result.reasoning = override.reasoning;
405
+ if (override.thinking !== undefined) result.thinking = override.thinking as ThinkingConfig;
378
406
  if (override.input !== undefined) result.input = override.input as ("text" | "image")[];
379
407
  if (override.contextWindow !== undefined) result.contextWindow = override.contextWindow;
380
408
  if (override.maxTokens !== undefined) result.maxTokens = override.maxTokens;
@@ -392,14 +420,16 @@ function applyModelOverride(model: Model<Api>, override: ModelOverride): Model<A
392
420
  result.headers = { ...model.headers, ...override.headers };
393
421
  }
394
422
  result.compat = mergeCompat(model.compat, override.compat);
395
- return result;
423
+ return enrichModelThinking(result);
396
424
  }
397
425
 
398
426
  interface CustomModelDefinitionLike {
399
427
  id: string;
400
428
  name?: string;
401
429
  api?: Api;
430
+ baseUrl?: string;
402
431
  reasoning?: boolean;
432
+ thinking?: ThinkingConfig;
403
433
  input?: ("text" | "image")[];
404
434
  cost?: { input: number; output: number; cacheRead: number; cacheWrite: number };
405
435
  contextWindow?: number;
@@ -445,13 +475,14 @@ function buildCustomModel(
445
475
  const withDefaults = options.useDefaults;
446
476
  const cost = modelDef.cost ?? (withDefaults ? { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 } : undefined);
447
477
  const input = modelDef.input ?? (withDefaults ? ["text"] : undefined);
448
- return {
478
+ return enrichModelThinking({
449
479
  id: modelDef.id,
450
480
  name: modelDef.name ?? (withDefaults ? modelDef.id : undefined),
451
481
  api,
452
482
  provider: providerName,
453
- baseUrl: providerBaseUrl,
483
+ baseUrl: modelDef.baseUrl ?? providerBaseUrl,
454
484
  reasoning: modelDef.reasoning ?? (withDefaults ? false : undefined),
485
+ thinking: modelDef.thinking as ThinkingConfig | undefined,
455
486
  input: input as ("text" | "image")[],
456
487
  cost,
457
488
  contextWindow: modelDef.contextWindow ?? (withDefaults ? 128000 : undefined),
@@ -460,7 +491,7 @@ function buildCustomModel(
460
491
  compat: modelDef.compat,
461
492
  contextPromotionTarget: modelDef.contextPromotionTarget,
462
493
  premiumMultiplier: modelDef.premiumMultiplier,
463
- } as Model<Api>;
494
+ } as Model<Api>);
464
495
  }
465
496
 
466
497
  /**
@@ -537,7 +568,7 @@ export class ModelRegistry {
537
568
  const builtInModels = this.#loadBuiltInModels(overrides, modelOverrides);
538
569
  const combined = this.#mergeCustomModels(builtInModels, customModels);
539
570
 
540
- this.#models = combined;
571
+ this.#models = this.#applyHardcodedModelPolicies(combined);
541
572
  }
542
573
 
543
574
  /** Load built-in models, applying provider and per-model overrides */
@@ -716,7 +747,7 @@ export class ModelRegistry {
716
747
  : model;
717
748
  }),
718
749
  );
719
- this.#models = this.#applyModelOverrides(merged, this.#modelOverrides);
750
+ this.#models = this.#applyHardcodedModelPolicies(this.#applyModelOverrides(merged, this.#modelOverrides));
720
751
  }
721
752
 
722
753
  async #discoverProviderModels(providerConfig: DiscoveryProviderConfig): Promise<Model<Api>[]> {
@@ -831,12 +862,57 @@ export class ModelRegistry {
831
862
  }
832
863
  }
833
864
 
865
+ async #discoverOllamaModelMetadata(
866
+ endpoint: string,
867
+ modelId: string,
868
+ headers: Record<string, string> | undefined,
869
+ ): Promise<{ reasoning: boolean; input: ("text" | "image")[] } | null> {
870
+ const showUrl = `${endpoint}/api/show`;
871
+ try {
872
+ const response = await fetch(showUrl, {
873
+ method: "POST",
874
+ headers: { ...(headers ?? {}), "Content-Type": "application/json" },
875
+ body: JSON.stringify({ model: modelId }),
876
+ signal: AbortSignal.timeout(1500),
877
+ });
878
+ if (!response.ok) {
879
+ return null;
880
+ }
881
+ const payload = (await response.json()) as unknown;
882
+ if (!isRecord(payload)) {
883
+ return null;
884
+ }
885
+ const capabilities = payload.capabilities;
886
+ if (Array.isArray(capabilities)) {
887
+ const normalized = new Set(
888
+ capabilities.flatMap(capability => (typeof capability === "string" ? [capability.toLowerCase()] : [])),
889
+ );
890
+ const supportsVision = normalized.has("vision") || normalized.has("image");
891
+ return {
892
+ reasoning: normalized.has("thinking"),
893
+ input: supportsVision ? ["text", "image"] : ["text"],
894
+ };
895
+ }
896
+ if (!isRecord(capabilities)) {
897
+ return null;
898
+ }
899
+ const supportsVision = capabilities.vision === true || capabilities.image === true;
900
+ return {
901
+ reasoning: capabilities.thinking === true,
902
+ input: supportsVision ? ["text", "image"] : ["text"],
903
+ };
904
+ } catch {
905
+ return null;
906
+ }
907
+ }
908
+
834
909
  async #discoverOllamaModels(providerConfig: DiscoveryProviderConfig): Promise<Model<Api>[]> {
835
910
  const endpoint = this.#normalizeOllamaBaseUrl(providerConfig.baseUrl);
836
911
  const tagsUrl = `${endpoint}/api/tags`;
912
+ const headers = { ...(providerConfig.headers ?? {}) };
837
913
  try {
838
914
  const response = await fetch(tagsUrl, {
839
- headers: { ...(providerConfig.headers ?? {}) },
915
+ headers,
840
916
  signal: AbortSignal.timeout(3000),
841
917
  });
842
918
  if (!response.ok) {
@@ -848,25 +924,34 @@ export class ModelRegistry {
848
924
  return [];
849
925
  }
850
926
  const payload = (await response.json()) as { models?: Array<{ name?: string; model?: string }> };
851
- const models = payload.models ?? [];
852
- const discovered: Model<Api>[] = [];
853
- for (const item of models) {
927
+ const entries = (payload.models ?? []).flatMap(item => {
854
928
  const id = item.model || item.name;
855
- if (!id) continue;
856
- discovered.push({
857
- id,
858
- name: item.name || id,
929
+ return id ? [{ id, name: item.name || id }] : [];
930
+ });
931
+ const metadataById = new Map(
932
+ await Promise.all(
933
+ entries.map(
934
+ async entry =>
935
+ [entry.id, await this.#discoverOllamaModelMetadata(endpoint, entry.id, headers)] as const,
936
+ ),
937
+ ),
938
+ );
939
+ const discovered = entries.map(entry => {
940
+ const metadata = metadataById.get(entry.id);
941
+ return enrichModelThinking({
942
+ id: entry.id,
943
+ name: entry.name,
859
944
  api: providerConfig.api,
860
945
  provider: providerConfig.provider,
861
946
  baseUrl: `${endpoint}/v1`,
862
- reasoning: false,
863
- input: ["text"],
947
+ reasoning: metadata?.reasoning ?? false,
948
+ input: metadata?.input ?? ["text"],
864
949
  cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
865
950
  contextWindow: 128000,
866
951
  maxTokens: 8192,
867
952
  headers: providerConfig.headers,
868
953
  });
869
- }
954
+ });
870
955
  return this.#applyProviderModelOverrides(providerConfig.provider, discovered);
871
956
  } catch (error) {
872
957
  logger.warn("model discovery failed for provider", {
@@ -907,24 +992,26 @@ export class ModelRegistry {
907
992
  for (const item of models) {
908
993
  const id = item.id;
909
994
  if (!id) continue;
910
- discovered.push({
911
- id,
912
- name: id,
913
- api: providerConfig.api,
914
- provider: providerConfig.provider,
915
- baseUrl,
916
- reasoning: false,
917
- input: ["text"],
918
- cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
919
- contextWindow: 128000,
920
- maxTokens: 8192,
921
- headers,
922
- compat: {
923
- supportsStore: false,
924
- supportsDeveloperRole: false,
925
- supportsReasoningEffort: false,
926
- },
927
- });
995
+ discovered.push(
996
+ enrichModelThinking({
997
+ id,
998
+ name: id,
999
+ api: providerConfig.api,
1000
+ provider: providerConfig.provider,
1001
+ baseUrl,
1002
+ reasoning: false,
1003
+ input: ["text"],
1004
+ cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
1005
+ contextWindow: 128000,
1006
+ maxTokens: 8192,
1007
+ headers,
1008
+ compat: {
1009
+ supportsStore: false,
1010
+ supportsDeveloperRole: false,
1011
+ supportsReasoningEffort: false,
1012
+ },
1013
+ }),
1014
+ );
928
1015
  }
929
1016
  return this.#applyProviderModelOverrides(providerConfig.provider, discovered);
930
1017
  } catch (error) {
@@ -980,6 +1067,15 @@ export class ModelRegistry {
980
1067
  });
981
1068
  }
982
1069
 
1070
+ #applyHardcodedModelPolicies(models: Model<Api>[]): Model<Api>[] {
1071
+ return models.map(model => {
1072
+ if (model.id === "gpt-5.4") {
1073
+ return { ...model, contextWindow: 1_000_000 };
1074
+ }
1075
+ return model;
1076
+ });
1077
+ }
1078
+
983
1079
  #parseModels(config: ModelsConfig): Model<Api>[] {
984
1080
  const models: Model<Api>[] = [];
985
1081
 
@@ -997,7 +1093,7 @@ export class ModelRegistry {
997
1093
  providerConfig.headers,
998
1094
  providerConfig.apiKey,
999
1095
  providerConfig.authHeader,
1000
- modelDef,
1096
+ modelDef as CustomModelDefinitionLike,
1001
1097
  { useDefaults: true },
1002
1098
  );
1003
1099
  if (!model) continue;
@@ -1150,7 +1246,7 @@ export class ModelRegistry {
1150
1246
  config.headers,
1151
1247
  config.apiKey,
1152
1248
  config.authHeader,
1153
- modelDef,
1249
+ modelDef as CustomModelDefinitionLike,
1154
1250
  { useDefaults: false },
1155
1251
  );
1156
1252
  if (!model) {
@@ -1205,7 +1301,9 @@ export interface ProviderConfigInput {
1205
1301
  id: string;
1206
1302
  name: string;
1207
1303
  api?: Api;
1304
+ baseUrl?: string;
1208
1305
  reasoning: boolean;
1306
+ thinking?: ThinkingConfig;
1209
1307
  input: ("text" | "image")[];
1210
1308
  cost: { input: number; output: number; cacheRead: number; cacheWrite: number };
1211
1309
  contextWindow: number;