npm - aigetwey - Versions diffs - 1.0.1 - Mend

aigetwey 1.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (216) hide show

package/CHANGELOG.md +84 -0
package/LICENSE +21 -0
package/README.md +302 -0
package/assets/logo.svg +8 -0
package/assets/screenshot.png +0 -0
package/assets/wordmark.svg +9 -0
package/config.example.yaml +56 -0
package/dashboard/.env.example +12 -0
package/dashboard/next-env.d.ts +6 -0
package/dashboard/next.config.ts +12 -0
package/dashboard/package-lock.json +1771 -0
package/dashboard/package.json +29 -0
package/dashboard/postcss.config.mjs +5 -0
package/dashboard/src/app/(console)/combos/page.tsx +10 -0
package/dashboard/src/app/(console)/config/page.tsx +5 -0
package/dashboard/src/app/(console)/console/page.tsx +92 -0
package/dashboard/src/app/(console)/endpoint/page.tsx +5 -0
package/dashboard/src/app/(console)/layout.tsx +17 -0
package/dashboard/src/app/(console)/page.tsx +8 -0
package/dashboard/src/app/(console)/providers/[id]/page.tsx +6 -0
package/dashboard/src/app/(console)/providers/page.tsx +5 -0
package/dashboard/src/app/(console)/quota/page.tsx +5 -0
package/dashboard/src/app/(console)/tools/[id]/page.tsx +6 -0
package/dashboard/src/app/(console)/tools/page.tsx +5 -0
package/dashboard/src/app/(console)/usage/page.tsx +24 -0
package/dashboard/src/app/api/cli-detect/[tool]/route.ts +253 -0
package/dashboard/src/app/api/gw/[...path]/route.ts +89 -0
package/dashboard/src/app/api/login/route.ts +30 -0
package/dashboard/src/app/api/logout/route.ts +9 -0
package/dashboard/src/app/api/password/route.ts +34 -0
package/dashboard/src/app/globals.css +340 -0
package/dashboard/src/app/icon.svg +8 -0
package/dashboard/src/app/layout.tsx +28 -0
package/dashboard/src/app/login/page.tsx +60 -0
package/dashboard/src/components/AreaChart.tsx +115 -0
package/dashboard/src/components/Badge.tsx +32 -0
package/dashboard/src/components/Button.tsx +60 -0
package/dashboard/src/components/CapacityBadges.tsx +40 -0
package/dashboard/src/components/Checkbox.tsx +40 -0
package/dashboard/src/components/CliToolConfig.tsx +63 -0
package/dashboard/src/components/ConfigEditor.tsx +199 -0
package/dashboard/src/components/ConfirmModal.tsx +36 -0
package/dashboard/src/components/CooldownTimer.tsx +42 -0
package/dashboard/src/components/EndpointView.tsx +439 -0
package/dashboard/src/components/Icon.tsx +25 -0
package/dashboard/src/components/KeyReveal.tsx +78 -0
package/dashboard/src/components/Lamp.tsx +8 -0
package/dashboard/src/components/LogTable.tsx +223 -0
package/dashboard/src/components/LogoutButton.tsx +20 -0
package/dashboard/src/components/ModelPicker.tsx +121 -0
package/dashboard/src/components/ModelSelectModal.tsx +126 -0
package/dashboard/src/components/PasswordEditor.tsx +86 -0
package/dashboard/src/components/PricingEditor.tsx +171 -0
package/dashboard/src/components/ProviderDetail.tsx +566 -0
package/dashboard/src/components/ProviderManager.tsx +311 -0
package/dashboard/src/components/QuotaView.tsx +78 -0
package/dashboard/src/components/Rail.tsx +82 -0
package/dashboard/src/components/RichCard.tsx +46 -0
package/dashboard/src/components/RoutingView.tsx +329 -0
package/dashboard/src/components/ThemeProvider.tsx +36 -0
package/dashboard/src/components/ToastProvider.tsx +58 -0
package/dashboard/src/components/ToolDetail.tsx +475 -0
package/dashboard/src/components/TopBar.tsx +128 -0
package/dashboard/src/components/UsageView.tsx +151 -0
package/dashboard/src/components/ui.tsx +54 -0
package/dashboard/src/lib/capabilities.ts +318 -0
package/dashboard/src/lib/cliTools.ts +120 -0
package/dashboard/src/lib/client.ts +190 -0
package/dashboard/src/lib/gateway.ts +269 -0
package/dashboard/src/lib/session.ts +71 -0
package/dashboard/src/middleware.ts +37 -0
package/dashboard/tsconfig.json +21 -0
package/dist/adapters/anthropic.js +289 -0
package/dist/adapters/anthropic.js.map +1 -0
package/dist/adapters/gemini.js +268 -0
package/dist/adapters/gemini.js.map +1 -0
package/dist/adapters/index.js +8 -0
package/dist/adapters/index.js.map +1 -0
package/dist/adapters/openai.js +13 -0
package/dist/adapters/openai.js.map +1 -0
package/dist/cli/tray/autostart.js +152 -0
package/dist/cli/tray/autostart.js.map +1 -0
package/dist/cli/tray/icon.js +4 -0
package/dist/cli/tray/icon.js.map +1 -0
package/dist/cli/tray/tray.js +141 -0
package/dist/cli/tray/tray.js.map +1 -0
package/dist/cli/tray/trayRuntime.js +91 -0
package/dist/cli/tray/trayRuntime.js.map +1 -0
package/dist/cli.js +361 -0
package/dist/cli.js.map +1 -0
package/dist/config.js +728 -0
package/dist/config.js.map +1 -0
package/dist/core/authStore.js +78 -0
package/dist/core/authStore.js.map +1 -0
package/dist/core/canonical.js +9 -0
package/dist/core/canonical.js.map +1 -0
package/dist/core/console-buffer.js +25 -0
package/dist/core/console-buffer.js.map +1 -0
package/dist/core/fallback.js +62 -0
package/dist/core/fallback.js.map +1 -0
package/dist/core/handler.js +174 -0
package/dist/core/handler.js.map +1 -0
package/dist/core/keypool.js +105 -0
package/dist/core/keypool.js.map +1 -0
package/dist/core/quota.js +165 -0
package/dist/core/quota.js.map +1 -0
package/dist/core/state.js +52 -0
package/dist/core/state.js.map +1 -0
package/dist/db.js +193 -0
package/dist/db.js.map +1 -0
package/dist/headroom/compress.js +44 -0
package/dist/headroom/compress.js.map +1 -0
package/dist/headroom/detect.js +108 -0
package/dist/headroom/detect.js.map +1 -0
package/dist/headroom/process.js +158 -0
package/dist/headroom/process.js.map +1 -0
package/dist/inject/caveman.js +30 -0
package/dist/inject/caveman.js.map +1 -0
package/dist/inject/index.js +24 -0
package/dist/inject/index.js.map +1 -0
package/dist/inject/ponytail.js +19 -0
package/dist/inject/ponytail.js.map +1 -0
package/dist/middleware/auth.js +66 -0
package/dist/middleware/auth.js.map +1 -0
package/dist/providers/capabilities.js +246 -0
package/dist/providers/capabilities.js.map +1 -0
package/dist/providers/free.js +43 -0
package/dist/providers/free.js.map +1 -0
package/dist/providers/pricing.js +224 -0
package/dist/providers/pricing.js.map +1 -0
package/dist/providers/vertex.js +97 -0
package/dist/providers/vertex.js.map +1 -0
package/dist/routes/admin.js +622 -0
package/dist/routes/admin.js.map +1 -0
package/dist/routes/health.js +4 -0
package/dist/routes/health.js.map +1 -0
package/dist/routes/index.js +12 -0
package/dist/routes/index.js.map +1 -0
package/dist/routes/v1.js +75 -0
package/dist/routes/v1.js.map +1 -0
package/dist/rtk/detect.js +50 -0
package/dist/rtk/detect.js.map +1 -0
package/dist/rtk/filters.js +85 -0
package/dist/rtk/filters.js.map +1 -0
package/dist/rtk/index.js +39 -0
package/dist/rtk/index.js.map +1 -0
package/dist/server.js +100 -0
package/dist/server.js.map +1 -0
package/dist/stream/anthropic-stream.js +239 -0
package/dist/stream/anthropic-stream.js.map +1 -0
package/dist/stream/chunk.js +7 -0
package/dist/stream/chunk.js.map +1 -0
package/dist/stream/gemini-stream.js +135 -0
package/dist/stream/gemini-stream.js.map +1 -0
package/dist/stream/index.js +12 -0
package/dist/stream/index.js.map +1 -0
package/dist/stream/openai-stream.js +34 -0
package/dist/stream/openai-stream.js.map +1 -0
package/dist/stream/sse.js +64 -0
package/dist/stream/sse.js.map +1 -0
package/dist/translator/thinking.js +70 -0
package/dist/translator/thinking.js.map +1 -0
package/dist/translator/thinkingUnified.js +322 -0
package/dist/translator/thinkingUnified.js.map +1 -0
package/dist/upstream/client.js +120 -0
package/dist/upstream/client.js.map +1 -0
package/package.json +76 -0
package/run.sh +27 -0
package/src/adapters/anthropic.ts +377 -0
package/src/adapters/gemini.ts +341 -0
package/src/adapters/index.ts +17 -0
package/src/adapters/openai.ts +22 -0
package/src/cli/tray/autostart.ts +133 -0
package/src/cli/tray/icon.ts +4 -0
package/src/cli/tray/tray.ts +156 -0
package/src/cli/tray/trayRuntime.ts +90 -0
package/src/cli.ts +379 -0
package/src/config.ts +777 -0
package/src/core/authStore.ts +86 -0
package/src/core/canonical.ts +93 -0
package/src/core/console-buffer.ts +39 -0
package/src/core/fallback.ts +116 -0
package/src/core/handler.ts +236 -0
package/src/core/keypool.ts +152 -0
package/src/core/quota.ts +214 -0
package/src/core/state.ts +65 -0
package/src/db.ts +280 -0
package/src/headroom/compress.ts +78 -0
package/src/headroom/detect.ts +119 -0
package/src/headroom/process.ts +166 -0
package/src/inject/caveman.ts +35 -0
package/src/inject/index.ts +46 -0
package/src/inject/ponytail.ts +31 -0
package/src/middleware/auth.ts +76 -0
package/src/providers/capabilities.ts +297 -0
package/src/providers/free.ts +53 -0
package/src/providers/pricing.ts +261 -0
package/src/providers/vertex.ts +117 -0
package/src/routes/admin.ts +716 -0
package/src/routes/health.ts +5 -0
package/src/routes/index.ts +24 -0
package/src/routes/v1.ts +87 -0
package/src/rtk/detect.ts +55 -0
package/src/rtk/filters.ts +94 -0
package/src/rtk/index.ts +58 -0
package/src/server.ts +108 -0
package/src/stream/anthropic-stream.ts +310 -0
package/src/stream/chunk.ts +46 -0
package/src/stream/gemini-stream.ts +158 -0
package/src/stream/index.ts +23 -0
package/src/stream/openai-stream.ts +41 -0
package/src/stream/sse.ts +72 -0
package/src/translator/thinking.ts +64 -0
package/src/translator/thinkingUnified.ts +319 -0
package/src/upstream/client.ts +155 -0
package/tsconfig.json +20 -0

package/src/providers/capabilities.ts ADDED Viewed

@@ -0,0 +1,297 @@
+// Model capabilities — what each model can read/do beyond plain text.
+//
+// Fallback order (first match wins), result merged over DEFAULT_CAPABILITIES:
+//   1. PROVIDER_CAPABILITIES[provider][model]  — provider-specific override
+//   2. MODEL_CAPABILITIES[model]               — canonical exact id (handles exceptions)
+//   3. PATTERN_CAPABILITIES                     — glob match, ordered specific -> generic
+//   4. DEFAULT_CAPABILITIES                     — safe floor (always returned)
+//
+// ── HOW TO ADD / UPDATE A MODEL ──────────────────────────────────────
+// Authoritative data source: https://models.dev/api.json (145 providers, 4000+
+// models, MIT). Each model exposes the exact fields we map below:
+//   modalities.input  ["text","image","pdf","audio","video"] -> vision / pdf / audioInput / videoInput
+//   modalities.output ["text","image","audio"]               -> imageOutput / audioOutput
+//   reasoning   -> reasoning      tool_call    -> tools
+//   limit.context -> contextWindow   limit.output -> maxOutput
+// Look up the model id, then:
+//   • If a PATTERN below already covers it correctly -> nothing to do.
+//   • If it is an exception (pattern would mis-match) -> add an exact entry to
+//     MODEL_CAPABILITIES (only the fields that differ from DEFAULT).
+//   • If a whole new family -> add an ordered PATTERN (specific before generic).
+// NOTE: models.dev has NO "search" flag (web search is a runtime tool, not a
+// model spec); set `search` from vendor docs (Claude 4.x+, GPT-5.x/4o, Gemini
+// 2.0+, Grok, Perplexity). Verify with: curl -s https://models.dev/api.json
+/**
+ * Complete capability record for one model: input/output modalities, feature
+ * flags, thinking (reasoning) wire-format settings and token limits.
+ * DEFAULT_CAPABILITIES is the safe floor — every resolved result is merged
+ * over it so consumers never need null-checks.
+ */
+export interface Caps {
+  vision: boolean;              // read images
+  pdf: boolean;                 // read PDF / documents
+  audioInput: boolean;          // read audio
+  videoInput: boolean;          // read video
+  imageOutput: boolean;         // generate images
+  audioOutput: boolean;         // generate audio
+  search: boolean;              // built-in web search tool / grounding
+  tools: boolean;               // function / tool calling
+  reasoning: boolean;           // thinking / reasoning
+  thinkingFormat: string | null;   // thinking wire format; null → derive from transport.format
+  thinkingCanDisable: boolean;     // false → thinking cannot be turned off
+  thinkingRange: { min: number; max: number } | null;  // clamp for budget formats; null = no clamp
+  contextWindow: number;        // limit, in tokens
+  maxOutput: number;            // limit, in tokens
+}
+/**
+ * Test a model id against a glob pattern in which `*` is the only wildcard.
+ * The match is anchored to the whole id and ignores case. Intended to mirror
+ * aigetwey's pricing.matchPattern so capabilities resolve identically.
+ */
+export function matchPattern(pattern: string, model: string): boolean {
+  // Escape regex metacharacters in every literal chunk; each `*` becomes `.*`.
+  const literalChunks = pattern
+    .split("*")
+    .map((chunk) => chunk.replace(/[.*+?^${}()|[\]\\]/g, "\\$&"));
+  const source = `^${literalChunks.join(".*")}$`;
+  return new RegExp(source, "i").test(model);
+}
+/**
+ * Safe floor — every resolved result is merged over this so consumers
+ * never need null-checks. Most modern LLMs meet these limits.
+ */
+export const DEFAULT_CAPABILITIES: Caps = {
+  // input modalities
+  vision: false,        // read images
+  pdf: false,           // read PDF / documents
+  audioInput: false,    // read audio
+  videoInput: false,    // read video
+  // output modalities
+  imageOutput: false,   // generate images
+  audioOutput: false,   // generate audio
+  // features
+  search: false,        // built-in web search tool / grounding
+  tools: true,          // function / tool calling
+  reasoning: false,     // thinking / reasoning
+  // thinking wire format (only meaningful when reasoning:true). null → derive from transport.format.
+  // enum: openai|claude-adaptive|claude-budget|gemini-level|gemini-budget|zai|qwen|deepseek|kimi|minimax|hunyuan|step
+  thinkingFormat: null,
+  thinkingCanDisable: true,  // false → model cannot turn thinking off (clamp to min instead of disable)
+  thinkingRange: null,       // { min, max } for budget formats; null = no clamp
+  // limits (tokens)
+  contextWindow: 200000,
+  maxOutput: 64000,
+};
+// User-added model metadata can carry dashboard service kinds instead of the
+// runtime capability names used here. Map those typed model kinds into input /
+// output capabilities so custom vision models are not treated as text-only.
+const SERVICE_KIND_CAPABILITIES: Record<string, Partial<Caps>> = {
+  imageToText: { vision: true },
+  image: { imageOutput: true },
+  stt: { audioInput: true },
+  tts: { audioOutput: true },
+  embedding: { tools: false },
+};
+/**
+ * Translate a dashboard service kind into the capability overrides it implies.
+ *
+ * Only keys declared directly on the table count: a kind such as
+ * "constructor" or "toString" must not resolve to a member inherited from
+ * Object.prototype, which a plain property read would return.
+ *
+ * @param kind - service kind taken from model metadata (e.g. "imageToText")
+ * @returns the capability delta for that kind, or null when the kind is unknown
+ */
+export function capabilitiesFromServiceKind(kind: string): Partial<Caps> | null {
+  if (!Object.prototype.hasOwnProperty.call(SERVICE_KIND_CAPABILITIES, kind)) return null;
+  return SERVICE_KIND_CAPABILITIES[kind] ?? null;
+}
+/**
+ * Canonical exact-id overrides — used for exceptions that patterns would
+ * otherwise mis-match. Only declare deltas vs DEFAULT. Keys are compared
+ * exactly (no glob, no case folding) against the model id and against the id
+ * with its vendor prefix stripped.
+ *
+ * NOTE(review): opus-4.6 and sonnet-4.6 are listed in both dot and dash
+ * spellings, but opus-4.7 only in the dot spelling — confirm whether a
+ * "claude-opus-4-7" entry is missing.
+ */
+export const MODEL_CAPABILITIES: Record<string, Partial<Caps>> = {
+  // Claude 4.6/4.7 have 1M context + adaptive thinking (override generic claude pattern)
+  "claude-opus-4.6":   { vision: true, reasoning: true, search: true, thinkingFormat: "claude-adaptive", contextWindow: 1000000, maxOutput: 128000 },
+  "claude-opus-4.7":   { vision: true, reasoning: true, search: true, thinkingFormat: "claude-adaptive", contextWindow: 1000000, maxOutput: 128000 },
+  "claude-opus-4-6":   { vision: true, reasoning: true, search: true, thinkingFormat: "claude-adaptive", contextWindow: 1000000, maxOutput: 128000 },
+  "claude-sonnet-4.6": { vision: true, reasoning: true, search: true, thinkingFormat: "claude-adaptive", contextWindow: 1000000, maxOutput: 64000 },
+  "claude-sonnet-4-6": { vision: true, reasoning: true, search: true, thinkingFormat: "claude-adaptive", contextWindow: 1000000, maxOutput: 64000 },
+  // OpenAI image generation model (image output, no tool calling)
+  "gpt-image-1":       { imageOutput: true, tools: false },
+  // GLM vision variant (text GLM has no vision)
+  "glm-4.6v":          { vision: true, reasoning: true, thinkingFormat: "zai", contextWindow: 128000 },
+  // Qwen registry aliases: "vision-model" (with vision) and "coder-model" (text-only)
+  "vision-model":      { vision: true, reasoning: true, thinkingFormat: "qwen", contextWindow: 1000000 },
+  "coder-model":       { reasoning: true, thinkingFormat: "qwen", contextWindow: 1000000 },
+};
+/**
+ * Provider-specific capability overrides. Keyed by provider alias/id, then by
+ * exact model id; each entry lists only the fields that differ from the
+ * defaults. These take precedence over every other capability source.
+ */
+export const PROVIDER_CAPABILITIES: Record<string, Record<string, Partial<Caps>>> = {
+  // CodeBuddy.cn — authoritative per-model metadata from the gateway's model
+  // config (contextWindow=maxInputTokens, maxOutput=maxOutputTokens, vision=
+  // supportsImages). Every model reasons via OpenAI-style reasoning_effort
+  // (see registry thinkingFormat). `onlyReasoning` models can't turn thinking
+  // off → thinkingCanDisable:false (clamped to minimal instead of disabled).
+  "codebuddy-cn": {
+    "glm-5.2":            { reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 1000000, maxOutput: 48000 },
+    "glm-5.1":            { reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 200000, maxOutput: 48000 },
+    "glm-5.0":            { reasoning: true, thinkingFormat: "openai", contextWindow: 200000, maxOutput: 48000 },
+    "glm-5.0-turbo":      { reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 200000, maxOutput: 48000 },
+    "glm-5v-turbo":       { vision: true, reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 200000, maxOutput: 38000 },
+    "glm-4.7":            { reasoning: true, thinkingFormat: "openai", contextWindow: 200000, maxOutput: 48000 },
+    "minimax-m3":         { vision: true, reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 512000, maxOutput: 48000 },
+    "minimax-m2.7":       { vision: true, reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 200000, maxOutput: 48000 },
+    "kimi-k2.7":          { vision: true, reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 256000, maxOutput: 32000 },
+    "kimi-k2.6":          { vision: true, reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 256000, maxOutput: 32000 },
+    "kimi-k2.5":          { vision: true, reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 164000, maxOutput: 32000 },
+    "hy3-preview":        { vision: true, reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 192000, maxOutput: 64000 },
+    "deepseek-v4-pro":    { vision: true, reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 1000000, maxOutput: 50000 },
+    "deepseek-v4-flash":  { vision: true, reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 1000000, maxOutput: 50000 },
+    "deepseek-v3-2-volc": { reasoning: true, thinkingFormat: "openai", thinkingCanDisable: false, contextWindow: 96000, maxOutput: 32000 },
+  },
+};
+/**
+ * Pattern fallback — glob (* = wildcard), matched case-insensitively and
+ * anchored (^...$) so a pattern must match the full model id. ORDER MATTERS:
+ * vision/specific variants first, text-only/generic families last, to avoid
+ * a broad family pattern swallowing an exception (e.g. glm-4.6v vs glm-5).
+ * The first matching entry wins; later entries are never consulted.
+ *
+ * NOTE(review): "*claude-3*" is listed after "*claude*haiku*", "*claude*opus*"
+ * and "*claude*sonnet*", so ids such as "claude-3-opus" or
+ * "claude-3-5-sonnet-20241022" hit those earlier entries and never reach it —
+ * confirm the intended order.
+ * NOTE(review): the Claude 4.6+ patterns spell the version with a dot
+ * ("opus-4.6"); the dot is matched literally, so dash-spelled ids like
+ * "claude-opus-4-7" fall through to the generic "*claude*opus*" entry —
+ * confirm this is intended.
+ * NOTE(review): "*gemini-3*pro*" uses maxOutput 65535 while the other Gemini
+ * entries use 65536 — confirm which value is correct.
+ */
+export const PATTERN_CAPABILITIES: Array<{ pattern: string; caps: Partial<Caps> }> = [
+  // ── Claude (4.6+ = adaptive thinking; older/haiku = budget) ──────
+  { pattern: "*claude*opus-4.6*",   caps: { vision: true, reasoning: true, search: true, thinkingFormat: "claude-adaptive" } },
+  { pattern: "*claude*opus-4.7*",   caps: { vision: true, reasoning: true, search: true, thinkingFormat: "claude-adaptive" } },
+  { pattern: "*claude*opus-4.8*",   caps: { vision: true, reasoning: true, search: true, thinkingFormat: "claude-adaptive" } },
+  { pattern: "*claude*sonnet-4.6*", caps: { vision: true, reasoning: true, search: true, thinkingFormat: "claude-adaptive" } },
+  { pattern: "*claude*sonnet-4.7*", caps: { vision: true, reasoning: true, search: true, thinkingFormat: "claude-adaptive" } },
+  { pattern: "*claude*haiku*",  caps: { vision: true, reasoning: true, search: true, thinkingFormat: "claude-budget" } },
+  { pattern: "*claude*opus*",   caps: { vision: true, reasoning: true, search: true, thinkingFormat: "claude-budget" } },
+  { pattern: "*claude*sonnet*", caps: { vision: true, reasoning: true, search: true, thinkingFormat: "claude-budget" } },
+  { pattern: "*claude*fable*",  caps: { vision: true, reasoning: true, search: true, thinkingFormat: "claude-budget", contextWindow: 1000000, maxOutput: 128000 } },
+  { pattern: "*claude*mythos*", caps: { vision: true, reasoning: true, search: true, thinkingFormat: "claude-budget", contextWindow: 1000000, maxOutput: 128000 } },
+  { pattern: "*claude-3*",      caps: { vision: true } },
+  { pattern: "*claude*",        caps: { vision: true, reasoning: true, search: true, thinkingFormat: "claude-budget" } },
+  // ── Gemini (all 2.0+ multimodal + google_search grounding, 1M ctx) ─
+  { pattern: "*gemini*image*",  caps: { vision: true, imageOutput: true, contextWindow: 1048576 } },
+  { pattern: "*gemini-3*pro*",  caps: { vision: true, audioInput: true, videoInput: true, reasoning: true, search: true, thinkingFormat: "gemini-level", thinkingCanDisable: false, contextWindow: 1048576, maxOutput: 65535 } },
+  { pattern: "*gemini-3*",      caps: { vision: true, audioInput: true, videoInput: true, reasoning: true, search: true, thinkingFormat: "gemini-level", thinkingCanDisable: false, contextWindow: 1048576, maxOutput: 65536 } },
+  { pattern: "*gemini-2.5*",    caps: { vision: true, audioInput: true, videoInput: true, reasoning: true, search: true, thinkingFormat: "gemini-budget", thinkingRange: { min: 0, max: 24576 }, contextWindow: 1048576, maxOutput: 65536 } },
+  { pattern: "*gemini-2*",      caps: { vision: true, audioInput: true, videoInput: true, search: true, contextWindow: 1048576, maxOutput: 65536 } },
+  { pattern: "*gemini*",        caps: { vision: true, search: true, contextWindow: 1048576 } },
+  { pattern: "*gemma*",         caps: { vision: true, contextWindow: 128000 } },
+  { pattern: "*nanobanana*",    caps: { vision: true, imageOutput: true } },
+  // ── OpenAI GPT-5.x (vision + thinking + web search) ──────────────
+  { pattern: "*gpt-5*image*",   caps: { imageOutput: true } },
+  { pattern: "*gpt-5*codex*",   caps: { reasoning: true, search: true, thinkingFormat: "openai", contextWindow: 400000, maxOutput: 128000 } },
+  { pattern: "*gpt-5*",         caps: { vision: true, reasoning: true, search: true, thinkingFormat: "openai", contextWindow: 400000, maxOutput: 128000 } },
+  { pattern: "*gpt-4o*",        caps: { vision: true, search: true, contextWindow: 128000, maxOutput: 16384 } },
+  { pattern: "*gpt-4.1*",       caps: { vision: true, contextWindow: 1000000, maxOutput: 32768 } },
+  { pattern: "*gpt-4-turbo*",   caps: { vision: true, contextWindow: 128000 } },
+  { pattern: "*gpt-4*",         caps: { contextWindow: 128000 } },
+  { pattern: "*gpt-3.5*",       caps: { contextWindow: 16385, maxOutput: 4096 } },
+  { pattern: "*gpt-oss*",       caps: { reasoning: true, thinkingFormat: "openai", contextWindow: 128000 } },
+  // ── OpenAI o-series (reasoning, vision) ──────────────────────────
+  { pattern: "*o1-mini*",       caps: { reasoning: true, thinkingFormat: "openai", contextWindow: 128000 } },
+  { pattern: "*o1*",            caps: { vision: true, reasoning: true, thinkingFormat: "openai", contextWindow: 200000, maxOutput: 100000 } },
+  { pattern: "*o3*",            caps: { vision: true, reasoning: true, thinkingFormat: "openai", contextWindow: 200000, maxOutput: 100000 } },
+  { pattern: "*o4*",            caps: { vision: true, reasoning: true, thinkingFormat: "openai", contextWindow: 200000, maxOutput: 100000 } },
+  // ── Grok (vision + Live Search) ──────────────────────────────────
+  { pattern: "*grok*image*",    caps: { imageOutput: true } },
+  { pattern: "*grok-code*",     caps: { reasoning: true, thinkingFormat: "openai", contextWindow: 256000 } },
+  { pattern: "*grok-4*",        caps: { vision: true, reasoning: true, search: true, thinkingFormat: "openai", contextWindow: 256000 } },
+  { pattern: "*grok-3*",        caps: { vision: true, reasoning: true, search: true, thinkingFormat: "openai", contextWindow: 131072 } },
+  { pattern: "*grok*",          caps: { vision: true, reasoning: true, search: true, thinkingFormat: "openai", contextWindow: 256000 } },
+  // ── Qwen (enable_thinking + thinking_budget; QwQ = thinking-only) ─
+  { pattern: "*qwen*vl*",       caps: { vision: true, reasoning: true, thinkingFormat: "qwen", contextWindow: 262144 } },
+  { pattern: "*qwen*max*",      caps: { vision: true, reasoning: true, thinkingFormat: "qwen", contextWindow: 1000000, maxOutput: 65536 } },
+  { pattern: "*qwen*plus*",     caps: { vision: true, reasoning: true, thinkingFormat: "qwen", contextWindow: 1000000, maxOutput: 65536 } },
+  { pattern: "*qwen*235b*",     caps: { reasoning: true, thinkingFormat: "qwen", contextWindow: 262144 } },
+  { pattern: "*qwen*coder*",    caps: { reasoning: true, thinkingFormat: "qwen", contextWindow: 1000000 } },
+  { pattern: "*qwq*",           caps: { reasoning: true, thinkingFormat: "qwen", thinkingCanDisable: false, contextWindow: 131072 } },
+  { pattern: "*qwen*",          caps: { reasoning: true, thinkingFormat: "qwen", contextWindow: 262144 } },
+  // ── Kimi (enabled→reasoning_effort; K2.7-code cannot disable) ─────
+  { pattern: "*kimi*k2.7*code*", caps: { vision: true, reasoning: true, thinkingFormat: "kimi", thinkingCanDisable: false, contextWindow: 262144, maxOutput: 262144 } },
+  { pattern: "*kimi*k2*",       caps: { vision: true, reasoning: true, thinkingFormat: "kimi", contextWindow: 262144, maxOutput: 262144 } },
+  { pattern: "*kimi*",          caps: { reasoning: true, thinkingFormat: "kimi", contextWindow: 262144 } },
+  // ── GLM / Z.ai (thinking.enabled; disable via enable_thinking:false) ─
+  { pattern: "*glm-5*",         caps: { reasoning: true, thinkingFormat: "zai", contextWindow: 200000, maxOutput: 128000 } },
+  { pattern: "*glm-4.7*",       caps: { reasoning: true, thinkingFormat: "zai", contextWindow: 200000, maxOutput: 128000 } },
+  { pattern: "*glm-4*",         caps: { reasoning: true, thinkingFormat: "zai", contextWindow: 200000 } },
+  { pattern: "*glm*",           caps: { reasoning: true, thinkingFormat: "zai", contextWindow: 200000 } },
+  // ── DeepSeek (thinking.enabled + reasoning_effort; r1 = thinking-only) ─
+  { pattern: "*deepseek-v4*",   caps: { reasoning: true, thinkingFormat: "deepseek", contextWindow: 1000000, maxOutput: 384000 } },
+  { pattern: "*reasoner*",      caps: { reasoning: true, thinkingFormat: "deepseek", thinkingCanDisable: false, contextWindow: 128000 } },
+  { pattern: "*deepseek-r*",    caps: { reasoning: true, thinkingFormat: "deepseek", thinkingCanDisable: false, contextWindow: 128000 } },
+  { pattern: "*deepseek-chat*", caps: { contextWindow: 128000 } },
+  { pattern: "*deepseek*",      caps: { reasoning: true, thinkingFormat: "deepseek", contextWindow: 128000 } },
+  // ── MiniMax (M3 = adaptive; M2.x cannot disable) ─────────────────
+  { pattern: "*minimax*image*", caps: { imageOutput: true } },
+  { pattern: "*minimax-m3*",    caps: { vision: true, reasoning: true, thinkingFormat: "minimax", contextWindow: 1048576, maxOutput: 512000 } },
+  { pattern: "*minimax-m2.7*",  caps: { reasoning: true, thinkingFormat: "minimax", thinkingCanDisable: false, contextWindow: 204800, maxOutput: 131072 } },
+  { pattern: "*minimax*",       caps: { reasoning: true, thinkingFormat: "minimax", thinkingCanDisable: false, contextWindow: 200000, maxOutput: 131072 } },
+  // ── Xiaomi MiMo (vision, 1M / 262K ctx) ──────────────────────────
+  { pattern: "*mimo*v2.5*",     caps: { vision: true, contextWindow: 1048576, maxOutput: 131072 } },
+  { pattern: "*mimo*omni*",     caps: { vision: true, audioInput: true, contextWindow: 262144, maxOutput: 131072 } },
+  { pattern: "*mimo*",          caps: { vision: true, contextWindow: 262144, maxOutput: 131072 } },
+  // ── Llama (4 = vision/1M; 3.x = text-only/128K) ──────────────────
+  { pattern: "*llama-4*",       caps: { vision: true, contextWindow: 1000000 } },
+  { pattern: "*llama*",         caps: { contextWindow: 128000 } },
+  // ── Mistral (Large 3 = vision/256K; codestral text) ──────────────
+  { pattern: "*codestral*",     caps: { contextWindow: 256000 } },
+  { pattern: "*mistral-large*", caps: { vision: true, contextWindow: 256000 } },
+  { pattern: "*mistral*",       caps: { contextWindow: 128000 } },
+  // ── Cohere (Command A Vision = vision; others text) ──────────────
+  { pattern: "*command-a-vision*", caps: { vision: true, contextWindow: 128000 } },
+  { pattern: "*command*",       caps: { contextWindow: 128000 } },
+  // ── Perplexity (web search native) ───────────────────────────────
+  { pattern: "*sonar*",         caps: { search: true, contextWindow: 128000 } },
+  { pattern: "*pplx*",          caps: { search: true, contextWindow: 128000 } },
+  { pattern: "*perplexity*",    caps: { search: true, contextWindow: 128000 } },
+  // ── Others ───────────────────────────────────────────────────────
+  { pattern: "*hunyuan*",       caps: { reasoning: true, thinkingFormat: "hunyuan", contextWindow: 262144, maxOutput: 262144 } },
+  { pattern: "hy3*",            caps: { reasoning: true, thinkingFormat: "hunyuan", contextWindow: 262144, maxOutput: 262144 } },
+  { pattern: "*step-*",         caps: { reasoning: true, thinkingFormat: "step", contextWindow: 128000 } },
+  { pattern: "*nemotron*",      caps: { reasoning: true, contextWindow: 128000 } },
+  { pattern: "*ling-*",         caps: { reasoning: true, contextWindow: 128000 } },
+];
+/**
+ * Resolve capabilities for a model using the 4-step fallback chain
+ * (provider override -> exact id -> pattern -> floor), merged over
+ * DEFAULT_CAPABILITIES so the result is always complete.
+ *
+ * Table lookups only honour keys declared directly on the tables, so ids such
+ * as "constructor" cannot resolve to members inherited from Object.prototype.
+ * The returned object is a fresh copy (including thinkingRange), so callers
+ * may mutate it without affecting the static tables.
+ *
+ * @param provider - provider alias/id, or null to skip provider overrides
+ * @param model - model id, optionally vendor-prefixed ("anthropic/claude-opus-4.7")
+ * @returns full capabilities object
+ */
+export function getCapabilitiesForModel(provider: string | null, model: string): Caps {
+  // Merge a delta over the floor. thinkingRange is the only nested object in
+  // Caps, so copy it to avoid handing out a reference into the shared tables.
+  const build = (overrides?: Partial<Caps>): Caps => {
+    const merged: Caps = { ...DEFAULT_CAPABILITIES, ...overrides };
+    if (merged.thinkingRange) merged.thinkingRange = { ...merged.thinkingRange };
+    return merged;
+  };
+  // Own-property read: ignore anything inherited through the prototype chain.
+  const own = <T>(table: Record<string, T>, key: string): T | undefined =>
+    Object.prototype.hasOwnProperty.call(table, key) ? table[key] : undefined;
+  if (!model) return build();
+  // 1. Provider-specific override (keyed by the model id exactly as given)
+  const providerTable = provider ? own(PROVIDER_CAPABILITIES, provider) : undefined;
+  const providerCaps = providerTable ? own(providerTable, model) : undefined;
+  if (providerCaps) return build(providerCaps);
+  // 2. Canonical exact (strip vendor prefix: "anthropic/claude-opus-4.7" -> "claude-opus-4.7")
+  const baseModel = (model.includes("/") ? model.split("/").pop() : model) ?? model;
+  const exactCaps = own(MODEL_CAPABILITIES, baseModel) ?? own(MODEL_CAPABILITIES, model);
+  if (exactCaps) return build(exactCaps);
+  // 3. Pattern match (first match wins; tried on the stripped id, then the full id)
+  for (const { pattern, caps } of PATTERN_CAPABILITIES) {
+    if (matchPattern(pattern, baseModel) || matchPattern(pattern, model)) {
+      return build(caps);
+    }
+  }
+  // 4. Floor
+  return build();
+}

package/src/providers/free.ts ADDED Viewed

@@ -0,0 +1,53 @@
+/**
+ * Free passthrough providers (e.g. OpenCode Free). These speak OpenAI format,
+ * need no upstream auth, and expose their catalog at `{base_url}/models`. The
+ * gateway already routes them through the normal pipeline (the key pool hands
+ * out an empty key, the client omits the auth header); this module only adds the
+ * one extra capability they need — fetching the model list at runtime so it
+ * doesn't have to be hand-maintained in config.
+ */
+import { request } from "undici";
+import type { Provider } from "../config.js";
+/** One catalog entry returned by a provider's `/models` endpoint. */
+export interface FetchedModel {
+  id: string;  // model id as reported by the provider
+}
+/** Structured outcome of a catalog fetch; failures are reported here, not thrown. */
+export interface ModelFetchResult {
+  ok: boolean;             // true when the catalog was fetched and parsed
+  models: FetchedModel[];  // fetched entries; empty when ok is false
+  error?: string;          // failure description, set when ok is false
+}
+/**
+ * Fetch a provider's model catalog from `{base_url}/models` (OpenAI shape:
+ * `{ data: [{ id }] }`). Never throws — returns a structured result so the
+ * dashboard's "Connect OpenCode Free" button can surface failures inline.
+ *
+ * Entries without a string `id` (including null or primitive entries) are
+ * skipped rather than failing the whole catalog. A payload that is not an
+ * object, or whose `data` is present but not an array, yields `ok: false`
+ * with an explicit error message.
+ *
+ * @param provider - provider config; `base_url`, `headers`, `api_keys` /
+ *   `api_key` and `free` are read
+ * @returns `{ ok: true, models }` on success, `{ ok: false, models: [], error }` otherwise
+ */
+export async function fetchModels(provider: Provider): Promise<ModelFetchResult> {
+  const base = provider.base_url.replace(/\/$/, "");
+  const headers: Record<string, string> = { ...(provider.headers ?? {}) };
+  // a free provider has no key; a keyed one still gets its bearer for /models.
+  const key = provider.api_keys?.[0] ?? provider.api_key;
+  if (key && !provider.free) headers["authorization"] = `Bearer ${key}`;
+  try {
+    const res = await request(`${base}/models`, {
+      method: "GET",
+      headers,
+      headersTimeout: 15_000,
+      bodyTimeout: 15_000,
+    });
+    if (res.statusCode >= 400) {
+      // Drain the body so the connection can be reused.
+      await res.body.dump();
+      return { ok: false, models: [], error: `models endpoint returned ${res.statusCode}` };
+    }
+    const payload: unknown = await res.body.json();
+    if (typeof payload !== "object" || payload === null) {
+      return { ok: false, models: [], error: "models endpoint returned an unexpected payload" };
+    }
+    const data = (payload as { data?: unknown }).data;
+    if (data != null && !Array.isArray(data)) {
+      return { ok: false, models: [], error: "models endpoint returned an unexpected payload" };
+    }
+    // A missing `data` field is treated as an empty catalog.
+    const models: FetchedModel[] = [];
+    for (const entry of (data ?? []) as unknown[]) {
+      const id = (entry as { id?: unknown } | null | undefined)?.id;
+      if (typeof id === "string") models.push({ id });
+    }
+    return { ok: true, models };
+  } catch (e) {
+    // Anything can be thrown; only Error instances carry a usable message.
+    return { ok: false, models: [], error: e instanceof Error ? e.message : String(e) };
+  }
+}

package/src/providers/pricing.ts ADDED Viewed

@@ -0,0 +1,261 @@
+// Pricing rates for AI models — all rates in $/1M tokens
+//
+// Fallback order (first match wins):
+//   1. PROVIDER_PRICING[provider][model]  — provider-specific override
+//   2. MODEL_PRICING[model]               — canonical model price (provider-agnostic)
+//   3. PATTERN_PRICING                    — glob pattern match (e.g. "codex-*")
+/**
+ * Per-model token rates. All rates are in $/1M tokens.
+ * Only `input` and `output` are required; the remaining rates are optional.
+ */
+export interface Pricing {
+  /** Rate for input tokens. */
+  input: number;
+  /** Rate for output tokens. */
+  output: number;
+  /** Rate for cached tokens — presumably cache reads; TODO confirm against the cost calculator. */
+  cached?: number;
+  /** Rate for reasoning tokens — presumably billed separately from `output`; TODO confirm. */
+  reasoning?: number;
+  /** Rate for cache-creation tokens — presumably cache writes; TODO confirm. */
+  cache_creation?: number;
+}
+/**
+ * Canonical model pricing — provider-agnostic, keyed by exact model id.
+ * Covers all known models; deduplicated across providers.
+ * All rates are in $/1M tokens. Keys are case-sensitive, which is why some
+ * MiniMax ids appear in both casings.
+ */
+export const MODEL_PRICING: Record<string, Pricing> = {
+  // === Anthropic / Claude ===
+  "claude-opus-4-6":              { input: 5.00,  output: 25.00, cached: 0.50,  reasoning: 25.00,  cache_creation: 6.25  },
+  "claude-opus-4-5-20251101":     { input: 5.00,  output: 25.00, cached: 0.50,  reasoning: 25.00,  cache_creation: 6.25  },
+  "claude-sonnet-4-6":            { input: 3.00,  output: 15.00, cached: 0.30,  reasoning: 15.00,  cache_creation: 3.75  },
+  "claude-sonnet-4-5-20250929":   { input: 3.00,  output: 15.00, cached: 0.30,  reasoning: 15.00,  cache_creation: 3.75  },
+  "claude-haiku-4-5-20251001":    { input: 1.00,  output: 5.00,  cached: 0.10,  reasoning: 5.00,   cache_creation: 1.25  },
+  "claude-sonnet-4-20250514":     { input: 3.00,  output: 15.00, cached: 1.50,  reasoning: 15.00,  cache_creation: 3.00  },
+  // Output is 75.00 (was 25.00): matches the published Opus 4 output rate and this
+  // row's own reasoning rate (112.50 = 1.5 x 75.00).
+  "claude-opus-4-20250514":       { input: 15.00, output: 75.00, cached: 7.50,  reasoning: 112.50, cache_creation: 15.00 },
+  "claude-3-5-sonnet-20241022":   { input: 3.00,  output: 15.00, cached: 1.50,  reasoning: 15.00,  cache_creation: 3.00  },
+  "claude-haiku-4.5":             { input: 0.50,  output: 2.50,  cached: 0.05,  reasoning: 3.75,   cache_creation: 0.50  },
+  "claude-opus-4.1":              { input: 5.00,  output: 25.00, cached: 0.50,  reasoning: 37.50,  cache_creation: 5.00  },
+  "claude-opus-4.5":              { input: 5.00,  output: 25.00, cached: 0.50,  reasoning: 37.50,  cache_creation: 5.00  },
+  "claude-opus-4.6":              { input: 5.00,  output: 25.00, cached: 0.50,  reasoning: 37.50,  cache_creation: 5.00  },
+  "claude-sonnet-4":              { input: 3.00,  output: 15.00, cached: 0.30,  reasoning: 22.50,  cache_creation: 3.00  },
+  "claude-sonnet-4.5":            { input: 3.00,  output: 15.00, cached: 0.30,  reasoning: 22.50,  cache_creation: 3.00  },
+  "claude-sonnet-4.6":            { input: 3.00,  output: 15.00, cached: 0.30,  reasoning: 22.50,  cache_creation: 3.00  },
+  "claude-opus-4-5-thinking":     { input: 5.00,  output: 25.00, cached: 0.50,  reasoning: 37.50,  cache_creation: 5.00  },
+  "claude-opus-4-6-thinking":     { input: 5.00,  output: 25.00, cached: 0.50,  reasoning: 37.50,  cache_creation: 5.00  },
+  // === OpenAI / GPT ===
+  "gpt-3.5-turbo":                { input: 0.50,  output: 1.50,  cached: 0.25,  reasoning: 2.25,   cache_creation: 0.50  },
+  "gpt-4":                        { input: 2.50,  output: 10.00, cached: 1.25,  reasoning: 15.00,  cache_creation: 2.50  },
+  "gpt-4-turbo":                  { input: 10.00, output: 30.00, cached: 5.00,  reasoning: 45.00,  cache_creation: 10.00 },
+  "gpt-4o":                       { input: 2.50,  output: 10.00, cached: 1.25,  reasoning: 15.00,  cache_creation: 2.50  },
+  "gpt-4o-mini":                  { input: 0.15,  output: 0.60,  cached: 0.075, reasoning: 0.90,   cache_creation: 0.15  },
+  "gpt-4.1":                      { input: 2.50,  output: 10.00, cached: 1.25,  reasoning: 15.00,  cache_creation: 2.50  },
+  "gpt-5":                        { input: 3.00,  output: 12.00, cached: 1.50,  reasoning: 18.00,  cache_creation: 3.00  },
+  "gpt-5-mini":                   { input: 0.75,  output: 3.00,  cached: 0.375, reasoning: 4.50,   cache_creation: 0.75  },
+  "gpt-5-codex":                  { input: 3.00,  output: 12.00, cached: 1.50,  reasoning: 18.00,  cache_creation: 3.00  },
+  "gpt-5.1":                      { input: 4.00,  output: 16.00, cached: 2.00,  reasoning: 24.00,  cache_creation: 4.00  },
+  "gpt-5.1-codex":                { input: 4.00,  output: 16.00, cached: 2.00,  reasoning: 24.00,  cache_creation: 4.00  },
+  "gpt-5.1-codex-mini":           { input: 1.50,  output: 6.00,  cached: 0.75,  reasoning: 9.00,   cache_creation: 1.50  },
+  "gpt-5.1-codex-mini-high":      { input: 2.00,  output: 8.00,  cached: 1.00,  reasoning: 12.00,  cache_creation: 2.00  },
+  "gpt-5.1-codex-max":            { input: 8.00,  output: 32.00, cached: 4.00,  reasoning: 48.00,  cache_creation: 8.00  },
+  "gpt-5.2":                      { input: 5.00,  output: 20.00, cached: 2.50,  reasoning: 30.00,  cache_creation: 5.00  },
+  "gpt-5.2-codex":                { input: 5.00,  output: 20.00, cached: 2.50,  reasoning: 30.00,  cache_creation: 5.00  },
+  "gpt-5.3-codex":                { input: 6.00,  output: 24.00, cached: 3.00,  reasoning: 36.00,  cache_creation: 6.00  },
+  "gpt-5.3-codex-xhigh":         { input: 10.00, output: 40.00, cached: 5.00,  reasoning: 60.00,  cache_creation: 10.00 },
+  "gpt-5.3-codex-high":          { input: 8.00,  output: 32.00, cached: 4.00,  reasoning: 48.00,  cache_creation: 8.00  },
+  "gpt-5.3-codex-low":           { input: 4.00,  output: 16.00, cached: 2.00,  reasoning: 24.00,  cache_creation: 4.00  },
+  "gpt-5.3-codex-none":          { input: 3.00,  output: 12.00, cached: 1.50,  reasoning: 18.00,  cache_creation: 3.00  },
+  "gpt-5.3-codex-spark":         { input: 3.00,  output: 12.00, cached: 0.30,  reasoning: 12.00,  cache_creation: 3.00  },
+  "o1":                           { input: 15.00, output: 60.00, cached: 7.50,  reasoning: 90.00,  cache_creation: 15.00 },
+  "o1-mini":                      { input: 3.00,  output: 12.00, cached: 1.50,  reasoning: 18.00,  cache_creation: 3.00  },
+  // === Gemini ===
+  "gemini-3-flash-preview":       { input: 0.50,  output: 3.00,  cached: 0.03,  reasoning: 4.50,   cache_creation: 0.50  },
+  "gemini-3-pro-preview":         { input: 2.00,  output: 12.00, cached: 0.25,  reasoning: 18.00,  cache_creation: 2.00  },
+  "gemini-3.1-pro-low":           { input: 2.00,  output: 12.00, cached: 0.25,  reasoning: 18.00,  cache_creation: 2.00  },
+  "gemini-3.1-pro-high":          { input: 4.00,  output: 18.00, cached: 0.50,  reasoning: 27.00,  cache_creation: 4.00  },
+  "gemini-pro-agent":             { input: 4.00,  output: 18.00, cached: 0.50,  reasoning: 27.00,  cache_creation: 4.00  },
+  "gemini-3-flash-agent":         { input: 0.50,  output: 3.00,  cached: 0.03,  reasoning: 4.50,   cache_creation: 0.50  },
+  "gemini-3.5-flash-low":         { input: 0.50,  output: 3.00,  cached: 0.03,  reasoning: 4.50,   cache_creation: 0.50  },
+  "gemini-3.5-flash-extra-low":   { input: 0.50,  output: 3.00,  cached: 0.03,  reasoning: 4.50,   cache_creation: 0.50  },
+  "gemini-3-flash":               { input: 0.50,  output: 3.00,  cached: 0.03,  reasoning: 4.50,   cache_creation: 0.50  },
+  "gemini-2.5-pro":               { input: 2.00,  output: 12.00, cached: 0.25,  reasoning: 18.00,  cache_creation: 2.00  },
+  "gemini-2.5-flash":             { input: 0.30,  output: 2.50,  cached: 0.03,  reasoning: 3.75,   cache_creation: 0.30  },
+  "gemini-2.5-flash-lite":        { input: 0.15,  output: 1.25,  cached: 0.015, reasoning: 1.875,  cache_creation: 0.15  },
+  // === Qwen ===
+  "qwen3-coder-plus":             { input: 1.00,  output: 4.00,  cached: 0.50,  reasoning: 6.00,   cache_creation: 1.00  },
+  "qwen3-coder-flash":            { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  },
+  // === Kimi ===
+  "kimi-k2":                      { input: 1.00,  output: 4.00,  cached: 0.50,  reasoning: 6.00,   cache_creation: 1.00  },
+  "kimi-k2-thinking":             { input: 1.50,  output: 6.00,  cached: 0.75,  reasoning: 9.00,   cache_creation: 1.50  },
+  "kimi-k2.5":                    { input: 1.20,  output: 4.80,  cached: 0.60,  reasoning: 7.20,   cache_creation: 1.20  },
+  "kimi-k2.5-thinking":           { input: 1.80,  output: 7.20,  cached: 0.90,  reasoning: 10.80,  cache_creation: 1.80  },
+  "kimi-latest":                  { input: 1.00,  output: 4.00,  cached: 0.50,  reasoning: 6.00,   cache_creation: 1.00  },
+  // === DeepSeek ===
+  "deepseek-chat":                { input: 0.14,  output: 0.28,  cached: 0.0028, reasoning: 0.28,   cache_creation: 0.14  },
+  "deepseek-reasoner":            { input: 0.14,  output: 0.28,  cached: 0.0028, reasoning: 0.28,   cache_creation: 0.14  },
+  "deepseek-r1":                  { input: 0.14,  output: 0.28,  cached: 0.0028, reasoning: 0.28,   cache_creation: 0.14  },
+  "deepseek-v3.2-chat":           { input: 0.14,  output: 0.28,  cached: 0.0028, reasoning: 0.28,   cache_creation: 0.14  },
+  "deepseek-v3.2-reasoner":       { input: 0.14,  output: 0.28,  cached: 0.0028, reasoning: 0.28,   cache_creation: 0.14  },
+  "deepseek-v4-flash":            { input: 0.14,  output: 0.28,  cached: 0.0028, reasoning: 0.28,   cache_creation: 0.14  },
+  "deepseek-v4-pro":              { input: 0.435, output: 0.87,  cached: 0.003625, reasoning: 0.87,  cache_creation: 0.435 },
+  // === GLM ===
+  "glm-4.6":                      { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  },
+  "glm-4.6v":                     { input: 0.75,  output: 3.00,  cached: 0.375, reasoning: 4.50,   cache_creation: 0.75  },
+  "glm-4.7":                      { input: 0.75,  output: 3.00,  cached: 0.375, reasoning: 4.50,   cache_creation: 0.75  },
+  "glm-5":                        { input: 1.00,  output: 4.00,  cached: 0.50,  reasoning: 6.00,   cache_creation: 1.00  },
+  // === MiniMax ===
+  "MiniMax-M3":                   { input: 0.30,  output: 1.20,  cached: 0.06,  reasoning: 1.80,   cache_creation: 0.30  },
+  "MiniMax-M2.1":                 { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  },
+  "MiniMax-M2.5":                 { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  },
+  "MiniMax-M2.7":                 { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  },
+  "minimax-m2.1":                 { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  },
+  "minimax-m2.5":                 { input: 0.60,  output: 2.40,  cached: 0.30,  reasoning: 3.60,   cache_creation: 0.60  },
+  // === Grok ===
+  "grok-code-fast-1":             { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  },
+  // === OpenRouter fallback ===
+  "auto":                         { input: 2.00,  output: 8.00,  cached: 1.00,  reasoning: 12.00,  cache_creation: 2.00  },
+  // === Misc ===
+  "oswe-vscode-prime":            { input: 1.00,  output: 4.00,  cached: 0.50,  reasoning: 6.00,   cache_creation: 1.00  },
+  "gpt-oss-120b-medium":          { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  },
+  "vision-model":                 { input: 1.50,  output: 6.00,  cached: 0.75,  reasoning: 9.00,   cache_creation: 1.50  },
+  "coder-model":                  { input: 1.50,  output: 6.00,  cached: 0.75,  reasoning: 9.00,   cache_creation: 1.50  },
+};
+/**
+ * Per-provider price overrides, consulted before the canonical table.
+ * An entry belongs here only when a provider's rate differs from MODEL_PRICING.
+ * The outer key is a provider alias (cc, cx, gc, gh, ...) or a provider id
+ * (openai, anthropic, ...); the inner key is the exact model id.
+ */
+export const PROVIDER_PRICING: Record<string, Record<string, Pricing>> = {
+  // GitHub Copilot (gh): gpt-5.3-codex is billed at a different rate than the canonical entry.
+  gh: {
+    "gpt-5.3-codex": {
+      input: 1.75,
+      output: 14.00,
+      cached: 0.175,
+      reasoning: 14.00,
+      cache_creation: 1.75,
+    },
+  },
+};
+/**
+ * Pattern-based pricing fallback — consulted only when no exact model entry is found.
+ * Patterns use a simple glob: "*" matches any substring (including an empty one),
+ * and matching is case-insensitive (see matchPattern).
+ * The list is scanned top to bottom and the first match wins, so within each
+ * family the more specific patterns must stay above the generic ones.
+ */
+export const PATTERN_PRICING: Array<{ pattern: string; pricing: Pricing }> = [
+  // --- Codex variants ---
+  { pattern: "*-codex-xhigh",   pricing: { input: 10.00, output: 40.00, cached: 5.00,  reasoning: 60.00,  cache_creation: 10.00 } },
+  { pattern: "*-codex-high",    pricing: { input: 8.00,  output: 32.00, cached: 4.00,  reasoning: 48.00,  cache_creation: 8.00  } },
+  { pattern: "*-codex-max",     pricing: { input: 8.00,  output: 32.00, cached: 4.00,  reasoning: 48.00,  cache_creation: 8.00  } },
+  { pattern: "*-codex-mini-*",  pricing: { input: 1.50,  output: 6.00,  cached: 0.75,  reasoning: 9.00,   cache_creation: 1.50  } },
+  { pattern: "*-codex-mini",    pricing: { input: 1.50,  output: 6.00,  cached: 0.75,  reasoning: 9.00,   cache_creation: 1.50  } },
+  { pattern: "*-codex-low",     pricing: { input: 4.00,  output: 16.00, cached: 2.00,  reasoning: 24.00,  cache_creation: 4.00  } },
+  { pattern: "*-codex-none",    pricing: { input: 3.00,  output: 12.00, cached: 1.50,  reasoning: 18.00,  cache_creation: 3.00  } },
+  { pattern: "*-codex-spark",   pricing: { input: 3.00,  output: 12.00, cached: 0.30,  reasoning: 12.00,  cache_creation: 3.00  } },
+  { pattern: "codex-*",         pricing: { input: 3.00,  output: 12.00, cached: 1.50,  reasoning: 18.00,  cache_creation: 3.00  } },
+  { pattern: "*-codex",         pricing: { input: 3.00,  output: 12.00, cached: 1.50,  reasoning: 18.00,  cache_creation: 3.00  } },
+  // --- Claude ---
+  { pattern: "claude-opus-*",   pricing: { input: 5.00,  output: 25.00, cached: 0.50,  reasoning: 25.00,  cache_creation: 6.25  } },
+  { pattern: "claude-sonnet-*", pricing: { input: 3.00,  output: 15.00, cached: 0.30,  reasoning: 15.00,  cache_creation: 3.75  } },
+  { pattern: "claude-haiku-*",  pricing: { input: 1.00,  output: 5.00,  cached: 0.10,  reasoning: 5.00,   cache_creation: 1.25  } },
+  { pattern: "claude-*",        pricing: { input: 3.00,  output: 15.00, cached: 0.30,  reasoning: 15.00,  cache_creation: 3.75  } },
+  // --- Gemini (specific first, generic last) ---
+  { pattern: "gemini-*-flash-lite", pricing: { input: 0.15, output: 1.25, cached: 0.015, reasoning: 1.875, cache_creation: 0.15 } },
+  { pattern: "gemini-*-flash",  pricing: { input: 0.30,  output: 2.50,  cached: 0.03,  reasoning: 3.75,   cache_creation: 0.30  } },
+  { pattern: "gemini-*-pro",    pricing: { input: 2.00,  output: 12.00, cached: 0.25,  reasoning: 18.00,  cache_creation: 2.00  } },
+  { pattern: "gemini-3-*",      pricing: { input: 0.50,  output: 3.00,  cached: 0.03,  reasoning: 4.50,   cache_creation: 0.50  } },
+  { pattern: "gemini-2.5-*",    pricing: { input: 0.30,  output: 2.50,  cached: 0.03,  reasoning: 3.75,   cache_creation: 0.30  } },
+  { pattern: "gemini-*",        pricing: { input: 0.50,  output: 3.00,  cached: 0.03,  reasoning: 4.50,   cache_creation: 0.50  } },
+  // --- GPT (specific first, generic last) ---
+  { pattern: "gpt-5.3-*",       pricing: { input: 6.00,  output: 24.00, cached: 3.00,  reasoning: 36.00,  cache_creation: 6.00  } },
+  { pattern: "gpt-5.2-*",       pricing: { input: 5.00,  output: 20.00, cached: 2.50,  reasoning: 30.00,  cache_creation: 5.00  } },
+  { pattern: "gpt-5.1-*",       pricing: { input: 4.00,  output: 16.00, cached: 2.00,  reasoning: 24.00,  cache_creation: 4.00  } },
+  { pattern: "gpt-5-*",         pricing: { input: 3.00,  output: 12.00, cached: 1.50,  reasoning: 18.00,  cache_creation: 3.00  } },
+  { pattern: "gpt-5*",          pricing: { input: 3.00,  output: 12.00, cached: 1.50,  reasoning: 18.00,  cache_creation: 3.00  } },
+  // NOTE(review): "gpt-4o-*" carries the same rates as the exact "gpt-4o-mini" entry, so every
+  // other gpt-4o-<suffix> id that lacks an exact entry is priced at that tier — confirm intended.
+  { pattern: "gpt-4o-*",        pricing: { input: 0.15,  output: 0.60,  cached: 0.075, reasoning: 0.90,   cache_creation: 0.15  } },
+  { pattern: "gpt-4o",          pricing: { input: 2.50,  output: 10.00, cached: 1.25,  reasoning: 15.00,  cache_creation: 2.50  } },
+  { pattern: "gpt-4*",          pricing: { input: 2.50,  output: 10.00, cached: 1.25,  reasoning: 15.00,  cache_creation: 2.50  } },
+  // --- o1 / o-series ---
+  // NOTE(review): "o1-*" carries the same rates as the exact "o1-mini" entry, so every other
+  // o1-<suffix> id is priced at that tier rather than at the "o1" rate — confirm intended.
+  { pattern: "o1-*",            pricing: { input: 3.00,  output: 12.00, cached: 1.50,  reasoning: 18.00,  cache_creation: 3.00  } },
+  { pattern: "o1",              pricing: { input: 15.00, output: 60.00, cached: 7.50,  reasoning: 90.00,  cache_creation: 15.00 } },
+  { pattern: "o3-*",            pricing: { input: 10.00, output: 40.00, cached: 5.00,  reasoning: 60.00,  cache_creation: 10.00 } },
+  { pattern: "o4-*",            pricing: { input: 2.00,  output: 8.00,  cached: 1.00,  reasoning: 12.00,  cache_creation: 2.00  } },
+  // --- Qwen ---
+  { pattern: "qwen3-coder-*",   pricing: { input: 1.00,  output: 4.00,  cached: 0.50,  reasoning: 6.00,   cache_creation: 1.00  } },
+  { pattern: "qwen*-coder-*",   pricing: { input: 1.00,  output: 4.00,  cached: 0.50,  reasoning: 6.00,   cache_creation: 1.00  } },
+  { pattern: "qwen*",           pricing: { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  } },
+  // --- Kimi ---
+  { pattern: "kimi-*-thinking",  pricing: { input: 1.80,  output: 7.20,  cached: 0.90,  reasoning: 10.80,  cache_creation: 1.80  } },
+  { pattern: "kimi-k2*",        pricing: { input: 1.20,  output: 4.80,  cached: 0.60,  reasoning: 7.20,   cache_creation: 1.20  } },
+  { pattern: "kimi-*",          pricing: { input: 1.00,  output: 4.00,  cached: 0.50,  reasoning: 6.00,   cache_creation: 1.00  } },
+  // --- DeepSeek ---
+  { pattern: "deepseek-*reasoner*", pricing: { input: 0.14, output: 0.28, cached: 0.0028, reasoning: 0.28, cache_creation: 0.14 } },
+  { pattern: "deepseek-r*",     pricing: { input: 0.14,  output: 0.28,  cached: 0.0028, reasoning: 0.28,   cache_creation: 0.14  } },
+  { pattern: "deepseek-v*",     pricing: { input: 0.14,  output: 0.28,  cached: 0.0028, reasoning: 0.28,   cache_creation: 0.14  } },
+  { pattern: "deepseek-*",      pricing: { input: 0.14,  output: 0.28,  cached: 0.0028, reasoning: 0.28,   cache_creation: 0.14  } },
+  // --- GLM ---
+  { pattern: "glm-5*",          pricing: { input: 1.00,  output: 4.00,  cached: 0.50,  reasoning: 6.00,   cache_creation: 1.00  } },
+  { pattern: "glm-4*",          pricing: { input: 0.75,  output: 3.00,  cached: 0.375, reasoning: 4.50,   cache_creation: 0.75  } },
+  { pattern: "glm-*",           pricing: { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  } },
+  // --- MiniMax ---
+  { pattern: "MiniMax-*",       pricing: { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  } },
+  { pattern: "minimax-*",       pricing: { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  } },
+  // --- Grok ---
+  { pattern: "grok-code-*",     pricing: { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  } },
+  { pattern: "grok-*",          pricing: { input: 0.50,  output: 2.00,  cached: 0.25,  reasoning: 3.00,   cache_creation: 0.50  } },
+];
+/**
+ * Test whether a model id matches a glob pattern in which "*" stands for any
+ * run of characters (possibly empty) and every other character is literal.
+ * The whole id must match, and the comparison ignores case because registry
+ * ids mix casing (e.g. "MiniMax-M2.5" vs "minimax-m2.5").
+ *
+ * @param pattern - Glob pattern; only "*" is special.
+ * @param model - Model id to test.
+ * @returns `true` when the entire id matches the pattern.
+ */
+export function matchPattern(pattern: string, model: string): boolean {
+  // Escape each literal chunk between wildcards so regex metacharacters such as "." stay literal.
+  const escapedChunks: string[] = [];
+  for (const chunk of pattern.split("*")) {
+    escapedChunks.push(chunk.replace(/[.*+?^${}()|[\]\\]/g, "\\$&"));
+  }
+  // Re-join the chunks with ".*" in place of each "*" and anchor both ends.
+  const source = `^${escapedChunks.join(".*")}$`;
+  return new RegExp(source, "i").test(model);
+}
+/**
+ * Resolve pricing for a model using the 3-step fallback chain:
+ *   1. PROVIDER_PRICING[provider][model]
+ *   2. MODEL_PRICING[model]
+ *   3. PATTERN_PRICING (glob match)
+ *
+ * Table lookups only consider own properties, so ids that collide with
+ * inherited object members (e.g. "constructor", "toString") are treated as
+ * unknown instead of returning a prototype member as if it were pricing.
+ *
+ * @param provider - Provider alias or id used for overrides; `null` skips step 1.
+ * @param model - Model id, optionally vendor-prefixed ("deepseek/deepseek-chat").
+ * @returns The first pricing found, or `null` when the model is empty or nothing matches.
+ */
+export function getPricingForModel(provider: string | null, model: string): Pricing | null {
+  if (!model) return null;
+  // Own-property lookup: a plain `table[key]` would also return inherited members.
+  const lookupOwn = <T>(table: Record<string, T>, key: string): T | undefined =>
+    Object.prototype.hasOwnProperty.call(table, key) ? table[key] : undefined;
+  // 1. Provider-specific override
+  const providerTable = provider ? lookupOwn(PROVIDER_PRICING, provider) : undefined;
+  const override = providerTable ? lookupOwn(providerTable, model) : undefined;
+  if (override) return override;
+  // 2. Canonical model pricing (strip vendor prefix if needed: "deepseek/deepseek-chat" → "deepseek-chat")
+  const baseModel = model.slice(model.lastIndexOf("/") + 1);
+  const canonical = lookupOwn(MODEL_PRICING, baseModel) ?? lookupOwn(MODEL_PRICING, model);
+  if (canonical) return canonical;
+  // 3. Pattern match — list order decides, first match wins
+  for (const { pattern, pricing } of PATTERN_PRICING) {
+    if (matchPattern(pattern, baseModel) || matchPattern(pattern, model)) {
+      return pricing;
+    }
+  }
+  return null;
+}