npm - cost-katana-cli - Versions diffs - 2.2.2 → 2.2.4 - Mend

cost-katana-cli 2.2.2 → 2.2.4

This diff shows the changes between publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the differences between package versions as they appear in their respective public registries.

Files changed (8) hide show

package/dist/constants/models.d.ts +248 -118
package/dist/constants/models.d.ts.map +1 -1
package/dist/constants/models.js +318 -154
package/dist/constants/models.js.map +1 -1
package/dist/utils/models.d.ts.map +1 -1
package/dist/utils/models.js +2476 -754
package/dist/utils/models.js.map +1 -1
package/package.json +1 -1

package/dist/utils/models.js CHANGED Viewed

@@ -18,7 +18,146 @@ function getModelProvider(model) {
 }
 exports.AVAILABLE_MODELS = [
     // === OpenAI Models ===
-    // === GPT-5 Models (Latest) ===
+    // === GPT-5.2 Models (Latest) ===
+    {
+        id: 'gpt-5.2',
+        name: 'GPT-5.2',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.75, output: 14.0 },
+        capabilities: ['text', 'reasoning', 'analysis', 'coding', 'agents'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Latest GPT-5 model. Standard: $1.75/$14.00 per 1M tokens. Batch: $0.875/$7.00. Flex: $0.875/$7.00. Priority: $3.50/$28.00. Cached input: $0.175 (standard), $0.0875 (batch/flex), $0.35 (priority)',
+    },
+    {
+        id: 'gpt-5.2-pro',
+        name: 'GPT-5.2 Pro',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 21.0, output: 168.0 },
+        capabilities: [
+            'text',
+            'reasoning',
+            'analysis',
+            'coding',
+            'agents',
+            'premium',
+        ],
+        category: 'text',
+        isLatest: true,
+        notes: 'Premium version of GPT-5.2. Standard: $21.00/$168.00 per 1M tokens. Batch: $10.50/$84.00',
+    },
+    {
+        id: 'gpt-5.2-codex',
+        name: 'GPT-5.2-Codex',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.75, output: 14.0 },
+        capabilities: ['code', 'programming', 'agents', 'coding'],
+        category: 'code',
+        isLatest: true,
+        notes: 'GPT-5.2 optimized for agentic coding in Codex. Standard: $1.75/$14.00 per 1M tokens. Priority: $3.50/$28.00. Cached input: $0.175 (standard), $0.35 (priority)',
+    },
+    {
+        id: 'gpt-5.2-chat-latest',
+        name: 'GPT-5.2 Chat',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.75, output: 14.0 },
+        capabilities: ['text', 'chat', 'reasoning', 'analysis'],
+        category: 'text',
+        isLatest: true,
+        notes: 'GPT-5.2 model used in ChatGPT. Standard: $1.75/$14.00 per 1M tokens. Cached input: $0.175',
+    },
+    // === GPT-5.1 Models ===
+    {
+        id: 'gpt-5.1',
+        name: 'GPT-5.1',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.25, output: 10.0 },
+        capabilities: ['text', 'reasoning', 'analysis', 'coding', 'agents'],
+        category: 'text',
+        isLatest: true,
+        notes: 'GPT-5.1 model. Standard: $1.25/$10.00 per 1M tokens. Batch: $0.625/$5.00. Flex: $0.625/$5.00. Priority: $2.50/$20.00. Cached input: $0.125 (standard), $0.0625 (batch/flex), $0.25 (priority)',
+    },
+    {
+        id: 'gpt-5.1-codex-max',
+        name: 'GPT-5.1-Codex Max',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.25, output: 10.0 },
+        capabilities: ['code', 'programming', 'agents', 'coding'],
+        category: 'code',
+        isLatest: true,
+        notes: 'GPT-5.1 optimized for agentic coding. Standard: $1.25/$10.00 per 1M tokens. Priority: $2.50/$20.00. Cached input: $0.125 (standard), $0.25 (priority)',
+    },
+    {
+        id: 'gpt-5.1-codex',
+        name: 'GPT-5.1-Codex',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.25, output: 10.0 },
+        capabilities: ['code', 'programming', 'agents', 'coding'],
+        category: 'code',
+        isLatest: true,
+        notes: 'GPT-5.1 optimized for agentic coding in Codex. Standard: $1.25/$10.00 per 1M tokens. Priority: $2.50/$20.00. Cached input: $0.125 (standard), $0.25 (priority)',
+    },
+    {
+        id: 'gpt-5.1-codex-mini',
+        name: 'GPT-5.1-Codex Mini',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.25, output: 2.0 },
+        capabilities: ['code', 'programming', 'agents', 'coding', 'efficient'],
+        category: 'code',
+        isLatest: true,
+        notes: 'Cost-efficient GPT-5.1 Codex variant. Standard: $0.25/$2.00 per 1M tokens. Cached input: $0.025',
+    },
+    {
+        id: 'gpt-5.1-chat-latest',
+        name: 'GPT-5.1 Chat',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.25, output: 10.0 },
+        capabilities: ['text', 'chat', 'reasoning', 'analysis'],
+        category: 'text',
+        isLatest: true,
+        notes: 'GPT-5.1 model used in ChatGPT. Standard: $1.25/$10.00 per 1M tokens. Cached input: $0.125',
+    },
+    {
+        id: 'gpt-5.1-search-api',
+        name: 'GPT-5.1 Search API',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.25, output: 10.0 },
+        capabilities: ['text', 'search', 'multimodal', 'reasoning'],
+        category: 'search',
+        isLatest: true,
+        notes: 'GPT-5.1 with search capabilities. Standard: $1.25/$10.00 per 1M tokens. Cached input: $0.125. Web search: $10.00/1k calls + search content tokens billed at model rates',
+    },
+    // === GPT-5 Models ===
     {
         id: 'gpt-5',
         name: 'GPT-5',
@@ -30,158 +169,835 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'reasoning', 'analysis', 'coding', 'agents'],
         category: 'text',
         isLatest: true,
-        notes: 'The best model for coding and agentic tasks across domains',
+        notes: 'The best model for coding and agentic tasks across domains. Standard: $1.25/$10.00 per 1M tokens. Batch: $0.625/$5.00. Flex: $0.625/$5.00. Priority: $2.50/$20.00. Cached input: $0.125 (standard), $0.0625 (batch/flex), $0.25 (priority)',
+    },
+    {
+        id: 'gpt-5-mini',
+        name: 'GPT-5 mini',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.25, output: 2.0 },
+        capabilities: ['text', 'reasoning', 'analysis', 'efficient'],
+        category: 'text',
+        isLatest: true,
+        notes: 'A faster, cost-efficient version of GPT-5 for well-defined tasks. Standard: $0.25/$2.00 per 1M tokens. Batch: $0.125/$1.00. Flex: $0.125/$1.00. Priority: $0.45/$3.60. Cached input: $0.025 (standard), $0.0125 (batch/flex), $0.045 (priority)',
+    },
+    {
+        id: 'gpt-5-nano',
+        name: 'GPT-5 nano',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.05, output: 0.4 },
+        capabilities: ['text', 'fast', 'cost-effective'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Fastest, most cost-efficient version of GPT-5. Standard: $0.05/$0.40 per 1M tokens. Batch: $0.025/$0.20. Flex: $0.025/$0.20. Cached input: $0.005 (standard), $0.0025 (batch/flex)',
+    },
+    {
+        id: 'gpt-5-pro',
+        name: 'GPT-5 pro',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 15.0, output: 120.0 },
+        capabilities: [
+            'text',
+            'reasoning',
+            'analysis',
+            'coding',
+            'agents',
+            'premium',
+        ],
+        category: 'text',
+        isLatest: true,
+        notes: 'Version of GPT-5 that produces smarter and more precise responses. Standard: $15.00/$120.00 per 1M tokens. Batch: $7.50/$60.00',
+    },
+    {
+        id: 'gpt-5-codex',
+        name: 'GPT-5-Codex',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.25, output: 10.0 },
+        capabilities: ['code', 'programming', 'agents', 'coding'],
+        category: 'code',
+        isLatest: true,
+        notes: 'A version of GPT-5 optimized for agentic coding in Codex. Standard: $1.25/$10.00 per 1M tokens. Priority: $2.50/$20.00. Cached input: $0.125 (standard), $0.25 (priority)',
+    },
+    {
+        id: 'gpt-5-chat-latest',
+        name: 'GPT-5 Chat',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.25, output: 10.0 },
+        capabilities: ['text', 'chat', 'reasoning', 'analysis'],
+        category: 'text',
+        isLatest: true,
+        notes: 'GPT-5 model used in ChatGPT. Standard: $1.25/$10.00 per 1M tokens. Cached input: $0.125',
+    },
+    // === GPT-4.1 Series (Latest) ===
+    {
+        id: 'gpt-4.1',
+        name: 'GPT-4.1',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 2.0, output: 8.0 },
+        capabilities: ['text', 'analysis', 'enhanced'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Smartest non-reasoning model. Standard: $2.00/$8.00 per 1M tokens. Batch: $1.00/$4.00. Priority: $3.50/$14.00. Cached input: $0.50 (standard), $0.875 (priority). Fine-tuning: $25.00 training, $3.00/$0.75/$12.00 (standard), $1.50/$0.50/$6.00 (batch)',
+    },
+    {
+        id: 'gpt-4.1-mini',
+        name: 'GPT-4.1 mini',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.4, output: 1.6 },
+        capabilities: ['text', 'analysis', 'efficient'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Smaller, faster version of GPT-4.1. Standard: $0.40/$1.60 per 1M tokens. Batch: $0.20/$0.80. Priority: $0.70/$2.80. Cached input: $0.10 (standard), $0.175 (priority). Fine-tuning: $5.00 training, $0.80/$0.20/$3.20 (standard), $0.40/$0.10/$1.60 (batch)',
+    },
+    {
+        id: 'gpt-4.1-nano',
+        name: 'GPT-4.1 nano',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.1, output: 0.4 },
+        capabilities: ['text', 'fast', 'cost-effective'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Fastest, most cost-efficient version of GPT-4.1. Standard: $0.10/$0.40 per 1M tokens. Batch: $0.05/$0.20. Priority: $0.20/$0.80. Cached input: $0.025 (standard), $0.05 (priority). Fine-tuning: $1.50 training, $0.20/$0.05/$0.80 (standard), $0.10/$0.025/$0.40 (batch)',
+    },
+    // === GPT-4o Series (Latest) ===
+    {
+        id: 'gpt-4o-2024-08-06',
+        name: 'GPT-4o',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 2.5, output: 10.0 },
+        capabilities: ['text', 'vision', 'multimodal', 'analysis'],
+        category: 'multimodal',
+        isLatest: true,
+        notes: 'Latest GPT-4o model with multimodal capabilities. Standard: $2.50/$10.00 per 1M tokens. Batch: $1.25/$5.00. Priority: $4.25/$17.00. Cached input: $1.25 (standard), $2.125 (priority). Fine-tuning: $25.00 training, $3.75/$1.875/$15.00 (standard), $2.225/$0.90/$12.50 (batch)',
+    },
+    {
+        id: 'gpt-4o-2024-05-13',
+        name: 'GPT-4o (2024-05-13)',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 5.0, output: 15.0 },
+        capabilities: ['text', 'vision', 'multimodal'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'GPT-4o model from May 2024. Standard: $5.00/$15.00 per 1M tokens. Priority: $8.75/$26.25',
+    },
+    {
+        id: 'gpt-4o-audio-preview',
+        name: 'GPT-4o Audio Preview',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 2.5, output: 10.0 },
+        capabilities: ['text', 'audio', 'multimodal'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'GPT-4o with audio input capabilities. Text: $2.50/$10.00 per 1M tokens. Audio: $40.00/$80.00 per 1M tokens',
+    },
+    {
+        id: 'gpt-4o-realtime-preview',
+        name: 'GPT-4o Realtime Preview',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 5.0, output: 20.0 },
+        capabilities: ['text', 'realtime', 'multimodal'],
+        category: 'realtime',
+        isLatest: true,
+        notes: 'GPT-4o with realtime processing capabilities. Text: $5.00/$20.00 per 1M tokens. Cached: $2.50. Audio: $40.00/$80.00 per 1M tokens. Image: $5.00/$0.50 per 1M tokens',
+    },
+    {
+        id: 'gpt-4o-mini-2024-07-18',
+        name: 'GPT-4o Mini',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.15, output: 0.6 },
+        capabilities: ['text', 'vision', 'multimodal', 'efficient'],
+        category: 'multimodal',
+        isLatest: true,
+        notes: 'Efficient GPT-4o variant with multimodal capabilities. Standard: $0.15/$0.60 per 1M tokens. Batch: $0.075/$0.30. Priority: $0.25/$1.00. Cached input: $0.075 (standard), $0.125 (priority). Fine-tuning: $3.00 training, $0.30/$0.15/$1.20 (standard), $0.15/$0.075/$0.60 (batch)',
+    },
+    {
+        id: 'gpt-4o-mini-audio-preview',
+        name: 'GPT-4o Mini Audio Preview',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.15, output: 0.6 },
+        capabilities: ['text', 'audio', 'efficient'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'GPT-4o Mini with audio input capabilities. Text: $0.15/$0.60 per 1M tokens. Audio: $10.00/$20.00 per 1M tokens',
+    },
+    {
+        id: 'gpt-4o-mini-realtime-preview',
+        name: 'GPT-4o Mini Realtime Preview',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.6, output: 2.4 },
+        capabilities: ['text', 'realtime', 'efficient'],
+        category: 'realtime',
+        isLatest: true,
+        notes: 'GPT-4o Mini with realtime processing capabilities. Text: $0.60/$2.40 per 1M tokens. Cached: $0.30. Audio: $10.00/$20.00 per 1M tokens. Image: $0.80/$0.08 per 1M tokens',
+    },
+    {
+        id: 'gpt-4o-mini',
+        name: 'GPT-4o mini',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.15, output: 0.6 },
+        capabilities: ['text', 'vision', 'multimodal'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'Fast, affordable small model for focused tasks. Standard: $0.15/$0.60 per 1M tokens. Batch: $0.075/$0.30',
+    },
+    {
+        id: 'gpt-4o',
+        name: 'GPT-4o',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 2.5, output: 10.0 },
+        capabilities: ['text', 'vision', 'multimodal'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'Fast, intelligent, flexible GPT model. Standard: $2.50/$10.00 per 1M tokens. Batch: $1.25/$5.00',
+    },
+    {
+        id: 'gpt-4-turbo',
+        name: 'GPT-4 Turbo',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 10.0, output: 30.0 },
+        capabilities: ['text', 'vision', 'multimodal'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'Legacy GPT-4 Turbo model. Standard: $10.00/$30.00 per 1M tokens. Batch: $5.00/$15.00',
+    },
+    {
+        id: 'gpt-4',
+        name: 'GPT-4',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 8192,
+        contextLength: 8192,
+        pricing: { input: 30.0, output: 60.0 },
+        capabilities: ['text'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Legacy GPT-4 base model. Standard: $30.00/$60.00 per 1M tokens. Batch: $15.00/$30.00',
+    },
+    {
+        id: 'gpt-3.5-turbo',
+        name: 'GPT-3.5 Turbo',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 16385,
+        contextLength: 16385,
+        pricing: { input: 0.5, output: 1.5 },
+        capabilities: ['text'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Legacy GPT-3.5 Turbo model. Standard: $0.50/$1.50 per 1M tokens. Batch: $0.25/$0.75. Fine-tuning: $8.00 training, $3.00/$6.00 (standard), $1.50/$3.00 (batch)',
+    },
+    // === Audio and Realtime Models ===
+    {
+        id: 'gpt-realtime',
+        name: 'gpt-realtime',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 4.0, output: 16.0 },
+        capabilities: ['text', 'audio', 'realtime', 'multimodal'],
+        category: 'realtime',
+        isLatest: true,
+        notes: 'Model capable of realtime text and audio inputs and outputs. Text: $4.00/$16.00 per 1M tokens (standard). Cached: $0.40. Audio: $32.00/$64.00 per 1M tokens. Image: $5.00/$0.50 per 1M tokens',
+    },
+    {
+        id: 'gpt-realtime-mini',
+        name: 'gpt-realtime-mini',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.6, output: 2.4 },
+        capabilities: ['text', 'audio', 'realtime', 'efficient'],
+        category: 'realtime',
+        isLatest: true,
+        notes: 'A cost-efficient version of GPT Realtime. Text: $0.60/$2.40 per 1M tokens (standard). Cached: $0.06. Audio: $10.00/$20.00 per 1M tokens. Image: $0.80/$0.08 per 1M tokens',
+    },
+    {
+        id: 'gpt-audio',
+        name: 'gpt-audio',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 2.5, output: 10.0 },
+        capabilities: ['text', 'audio', 'multimodal'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'For audio inputs and outputs with Chat Completions API. Text: $2.50/$10.00 per 1M tokens. Audio: $32.00/$64.00 per 1M tokens',
+    },
+    {
+        id: 'gpt-audio-mini',
+        name: 'gpt-audio-mini',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.6, output: 2.4 },
+        capabilities: ['text', 'audio', 'efficient'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'A cost-efficient version of GPT Audio. Text: $0.60/$2.40 per 1M tokens. Audio: $10.00/$20.00 per 1M tokens',
+    },
+    // === Transcription Models ===
+    {
+        id: 'gpt-4o-transcribe',
+        name: 'GPT-4o Transcribe',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 2.5, output: 10.0 },
+        capabilities: ['audio', 'transcription', 'speech-to-text'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'Speech-to-text model powered by GPT-4o. Text tokens: $2.50/$10.00 per 1M tokens. Audio tokens: $6.00 per 1M tokens. Estimated cost: $0.006 per minute',
+    },
+    {
+        id: 'gpt-4o-transcribe-diarize',
+        name: 'GPT-4o Transcribe Diarize',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 2.5, output: 10.0 },
+        capabilities: ['audio', 'transcription', 'speech-to-text', 'diarization'],
+        category: 'audio',
+        isLatest: true,
+        notes: "Transcription model that identifies who's speaking when. Text tokens: $2.50/$10.00 per 1M tokens. Audio tokens: $6.00 per 1M tokens. Estimated cost: $0.006 per minute",
+    },
+    {
+        id: 'gpt-4o-mini-transcribe',
+        name: 'GPT-4o mini Transcribe',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 1.25, output: 5.0 },
+        capabilities: ['audio', 'transcription', 'speech-to-text', 'efficient'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'Speech-to-text model powered by GPT-4o mini. Text tokens: $1.25/$5.00 per 1M tokens. Audio tokens: $3.00 per 1M tokens. Estimated cost: $0.003 per minute',
+    },
+    {
+        id: 'whisper-1',
+        name: 'Whisper',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.006, output: 0.006 },
+        capabilities: [
+            'audio',
+            'transcription',
+            'speech-to-text',
+            'general-purpose',
+        ],
+        category: 'audio',
+        isLatest: true,
+        notes: 'General-purpose speech recognition model. Priced at $0.006 per minute',
+    },
+    // === Text-to-Speech Models ===
+    {
+        id: 'gpt-4o-mini-tts',
+        name: 'GPT-4o mini TTS',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.6, output: 12.0 },
+        capabilities: ['audio', 'text-to-speech', 'tts'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'Text-to-speech model powered by GPT-4o mini. Text tokens: $0.60 per 1M tokens. Audio tokens: $12.00 per 1M tokens. Estimated cost: $0.015 per minute',
+    },
+    {
+        id: 'tts-1',
+        name: 'TTS-1',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.015, output: 0.015 },
+        capabilities: ['audio', 'text-to-speech', 'tts', 'fast'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'Text-to-speech model optimized for speed. Priced at $15.00 per 1M characters',
+    },
+    {
+        id: 'tts-1-hd',
+        name: 'TTS-1 HD',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.03, output: 0.03 },
+        capabilities: ['audio', 'text-to-speech', 'tts', 'high-quality'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'Text-to-speech model optimized for quality. Priced at $30.00 per 1M characters',
+    },
+    // === Open-Weight Models ===
+    {
+        id: 'gpt-oss-120b',
+        name: 'gpt-oss-120b',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 131072,
+        contextLength: 131072,
+        pricing: { input: 2.0, output: 8.0 },
+        capabilities: ['text', 'open-source', 'open-weight'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Most powerful open-weight model, fits into an H100 GPU. Licensed under Apache 2.0',
+    },
+    {
+        id: 'gpt-oss-20b',
+        name: 'gpt-oss-20b',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 131072,
+        contextLength: 131072,
+        pricing: { input: 0.5, output: 2.0 },
+        capabilities: ['text', 'open-source', 'open-weight', 'low-latency'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Medium-sized open-weight model for low latency. Licensed under Apache 2.0',
+    },
+    // === Specialized Models ===
+    {
+        id: 'codex-mini-latest',
+        name: 'codex-mini-latest',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.5, output: 6.0 },
+        capabilities: ['code', 'programming', 'reasoning'],
+        category: 'code',
+        isLatest: true,
+        notes: 'Fast reasoning model optimized for the Codex CLI. Standard: $1.50/$6.00 per 1M tokens. Cached input: $0.375',
+    },
+    {
+        id: 'omni-moderation-latest',
+        name: 'omni-moderation',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 32768,
+        contextLength: 32768,
+        pricing: { input: 0.0, output: 0.0 },
+        capabilities: ['moderation', 'text', 'image', 'harmful-content-detection'],
+        category: 'moderation',
+        isLatest: true,
+        notes: 'Identify potentially harmful content in text and images. Made available free of charge. Built-in tools: Code Interpreter ($0.03-$1.92/container based on memory), File search storage ($0.10/GB per day, 1GB free), File search tool calls ($2.50/1k calls), Web search ($10.00/1k calls for reasoning models, $25.00/1k calls for non-reasoning models) + search content tokens billed at model rates',
+    },
+    {
+        id: 'gpt-4o-mini-search-preview-2025-03-11',
+        name: 'GPT-4o Mini Search Preview',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.15, output: 0.6 },
+        capabilities: ['text', 'search', 'multimodal'],
+        category: 'search',
+        isLatest: true,
+        notes: 'GPT-4o Mini with search capabilities for enhanced information retrieval. Text: $0.15/$0.60 per 1M tokens. Web search: $10.00/1k calls + search content tokens billed at model rates (non-reasoning models: $25.00/1k calls, search content tokens are free)',
+    },
+    {
+        id: 'gpt-4o-search-preview-2025-03-11',
+        name: 'GPT-4o Search Preview',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 2.5, output: 10.0 },
+        capabilities: ['text', 'search', 'multimodal'],
+        category: 'search',
+        isLatest: true,
+        notes: 'GPT-4o with search capabilities for enhanced information retrieval. Text: $2.50/$10.00 per 1M tokens. Web search: $10.00/1k calls + search content tokens billed at model rates (non-reasoning models: $25.00/1k calls, search content tokens are free)',
+    },
+    {
+        id: 'computer-use-preview-2025-03-11',
+        name: 'Computer Use Preview',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 3.0, output: 12.0 },
+        capabilities: ['text', 'computer-use', 'automation'],
+        category: 'computer-use',
+        isLatest: true,
+        notes: 'Model optimized for computer use and automation tasks. Standard: $3.00/$12.00 per 1M tokens. Batch: $1.50/$6.00',
+    },
+    // === Embedding Models ===
+    {
+        id: 'text-embedding-3-small',
+        name: 'Text Embedding 3 Small',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 8191,
+        contextLength: 8191,
+        pricing: { input: 0.02, output: 0.0 },
+        capabilities: ['embedding', 'semantic-search'],
+        category: 'embedding',
+        isLatest: true,
+        notes: 'Latest small embedding model for semantic search and analysis. Online: $0.02 per 1M tokens. Batch: $0.01 per 1M tokens',
+    },
+    {
+        id: 'text-embedding-3-large',
+        name: 'Text Embedding 3 Large',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 8191,
+        contextLength: 8191,
+        pricing: { input: 0.13, output: 0.0 },
+        capabilities: ['embedding', 'semantic-search', 'high-quality'],
+        category: 'embedding',
+        isLatest: true,
+        notes: 'Latest large embedding model with highest quality for semantic search. Online: $0.13 per 1M tokens. Batch: $0.065 per 1M tokens',
+    },
+    {
+        id: 'text-embedding-ada-002',
+        name: 'Text Embedding Ada 002',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 8191,
+        contextLength: 8191,
+        pricing: { input: 0.1, output: 0.0 },
+        capabilities: ['embedding', 'semantic-search'],
+        category: 'embedding',
+        isLatest: false,
+        notes: 'Previous generation embedding model for semantic search. Online: $0.10 per 1M tokens. Batch: $0.05 per 1M tokens',
+    },
+    // === ChatGPT Models ===
+    {
+        id: 'chatgpt-4o-latest',
+        name: 'ChatGPT-4o',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 5.0, output: 15.0 },
+        capabilities: ['text', 'vision', 'multimodal', 'chat'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'GPT-4o model used in ChatGPT (not recommended for API use). Standard: $5.00/$15.00 per 1M tokens. Batch: $5.00/$15.00',
+    },
+    // === Legacy and Deprecated Models ===
+    {
+        id: 'gpt-4.5-preview',
+        name: 'GPT-4.5 Preview',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 10.0, output: 30.0 },
+        capabilities: ['text', 'vision', 'multimodal'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'Deprecated - Large model. Standard: $10.00/$30.00 per 1M tokens. Batch: $5.00/$15.00',
+    },
+    {
+        id: 'o1-preview',
+        name: 'o1 Preview',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 15.0, output: 60.0 },
+        capabilities: ['text', 'reasoning', 'analysis'],
+        category: 'reasoning',
+        isLatest: false,
+        notes: 'Deprecated - Preview of our first o-series reasoning model. Standard: $15.00/$60.00 per 1M tokens. Batch: $7.50/$30.00',
+    },
+    {
+        id: 'text-moderation-latest',
+        name: 'text-moderation',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 32768,
+        contextLength: 32768,
+        pricing: { input: 0.1, output: 0.1 },
+        capabilities: ['moderation', 'text', 'harmful-content-detection'],
+        category: 'moderation',
+        isLatest: false,
+        notes: 'Deprecated - Previous generation text-only moderation model',
+    },
+    {
+        id: 'text-moderation-stable',
+        name: 'text-moderation-stable',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 32768,
+        contextLength: 32768,
+        pricing: { input: 0.1, output: 0.1 },
+        capabilities: ['moderation', 'text', 'harmful-content-detection'],
+        category: 'moderation',
+        isLatest: false,
+        notes: 'Deprecated - Previous generation text-only moderation model',
+    },
+    {
+        id: 'babbage-002',
+        name: 'babbage-002',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 16384,
+        contextLength: 16384,
+        pricing: { input: 0.4, output: 0.4 },
+        capabilities: ['text'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Deprecated - Replacement for the GPT-3 ada and babbage base models. Standard: $0.40/$0.40 per 1M tokens. Batch: $0.20/$0.20. Fine-tuning: $0.40 training, $1.60/$1.60 (standard), $0.80/$0.90 (batch)',
+    },
+    {
+        id: 'davinci-002',
+        name: 'davinci-002',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 16384,
+        contextLength: 16384,
+        pricing: { input: 2.0, output: 2.0 },
+        capabilities: ['text'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Deprecated - Replacement for the GPT-3 curie and davinci base models. Standard: $2.00/$2.00 per 1M tokens. Batch: $1.00/$1.00. Fine-tuning: $6.00 training, $12.00/$12.00 (standard), $6.00/$6.00 (batch)',
+    },
+    {
+        id: 'gpt-4-turbo-2024-04-09',
+        name: 'GPT-4 Turbo (2024-04-09)',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 10.0, output: 30.0 },
+        capabilities: ['text', 'vision', 'multimodal'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'Legacy GPT-4 Turbo model. Standard: $10.00/$30.00 per 1M tokens. Batch: $5.00/$15.00',
+    },
+    {
+        id: 'gpt-4-0125-preview',
+        name: 'GPT-4 (0125 Preview)',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 10.0, output: 30.0 },
+        capabilities: ['text', 'vision', 'multimodal'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'Legacy GPT-4 preview model. Standard: $10.00/$30.00 per 1M tokens. Batch: $5.00/$15.00',
+    },
+    {
+        id: 'gpt-4-1106-preview',
+        name: 'GPT-4 (1106 Preview)',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 10.0, output: 30.0 },
+        capabilities: ['text', 'vision', 'multimodal'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'Legacy GPT-4 preview model. Standard: $10.00/$30.00 per 1M tokens. Batch: $5.00/$15.00',
     },
     {
-        id: 'gpt-5-mini',
-        name: 'GPT-5 mini',
+        id: 'gpt-4-1106-vision-preview',
+        name: 'GPT-4 Vision (1106 Preview)',
         provider: 'OpenAI',
         available: true,
         maxTokens: 128000,
         contextLength: 128000,
-        pricing: { input: 0.25, output: 2.0 },
-        capabilities: ['text', 'reasoning', 'analysis', 'efficient'],
-        category: 'text',
-        isLatest: true,
-        notes: 'A faster, cost-efficient version of GPT-5 for well-defined tasks',
+        pricing: { input: 10.0, output: 30.0 },
+        capabilities: ['text', 'vision', 'multimodal'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'Legacy GPT-4 vision preview model. Standard: $10.00/$30.00 per 1M tokens. Batch: $5.00/$15.00',
     },
     {
-        id: 'gpt-5-nano',
-        name: 'GPT-5 nano',
+        id: 'gpt-4-0613',
+        name: 'GPT-4 (0613)',
         provider: 'OpenAI',
         available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 0.05, output: 0.4 },
-        capabilities: ['text', 'fast', 'cost-effective'],
+        maxTokens: 8192,
+        contextLength: 8192,
+        pricing: { input: 30.0, output: 60.0 },
+        capabilities: ['text'],
         category: 'text',
-        isLatest: true,
-        notes: 'Fastest, most cost-efficient version of GPT-5',
+        isLatest: false,
+        notes: 'Legacy GPT-4 model. Standard: $30.00/$60.00 per 1M tokens. Batch: $15.00/$30.00',
     },
     {
-        id: 'gpt-5-pro',
-        name: 'GPT-5 pro',
+        id: 'gpt-4-0314',
+        name: 'GPT-4 (0314)',
         provider: 'OpenAI',
         available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 2.5, output: 20.0 },
-        capabilities: [
-            'text',
-            'reasoning',
-            'analysis',
-            'coding',
-            'agents',
-            'premium',
-        ],
+        maxTokens: 8192,
+        contextLength: 8192,
+        pricing: { input: 30.0, output: 60.0 },
+        capabilities: ['text'],
         category: 'text',
-        isLatest: true,
-        notes: 'Version of GPT-5 that produces smarter and more precise responses',
+        isLatest: false,
+        notes: 'Legacy GPT-4 model. Standard: $30.00/$60.00 per 1M tokens. Batch: $15.00/$30.00',
     },
     {
-        id: 'gpt-5-codex',
-        name: 'GPT-5-Codex',
+        id: 'gpt-4-32k',
+        name: 'GPT-4 32K',
         provider: 'OpenAI',
         available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 1.25, output: 10.0 },
-        capabilities: ['code', 'programming', 'agents', 'coding'],
-        category: 'code',
-        isLatest: true,
-        notes: 'A version of GPT-5 optimized for agentic coding in Codex',
+        maxTokens: 32768,
+        contextLength: 32768,
+        pricing: { input: 60.0, output: 120.0 },
+        capabilities: ['text'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Legacy GPT-4 model with 32K context. Standard: $60.00/$120.00 per 1M tokens. Batch: $30.00/$60.00',
     },
     {
-        id: 'gpt-5-chat-latest',
-        name: 'GPT-5 Chat',
+        id: 'gpt-4-turbo',
+        name: 'GPT-4 Turbo',
         provider: 'OpenAI',
         available: true,
         maxTokens: 128000,
         contextLength: 128000,
-        pricing: { input: 1.25, output: 10.0 },
-        capabilities: ['text', 'chat', 'reasoning', 'analysis'],
-        category: 'text',
-        isLatest: true,
-        notes: 'GPT-5 model used in ChatGPT (not recommended for API use)',
+        pricing: { input: 10.0, output: 30.0 },
+        capabilities: ['text', 'vision', 'multimodal'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'Legacy GPT-4 Turbo model. Standard: $10.00/$30.00 per 1M tokens. Batch: $5.00/$15.00',
     },
-    // === GPT-4o Models ===
     {
-        id: 'gpt-4o-mini-2024-07-18',
-        name: 'GPT-4o Mini',
+        id: 'gpt-3.5-turbo-0125',
+        name: 'GPT-3.5 Turbo (0125)',
         provider: 'OpenAI',
         available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 0.15, output: 0.6 },
-        capabilities: ['text', 'vision', 'multimodal'],
+        maxTokens: 16385,
+        contextLength: 16385,
+        pricing: { input: 0.5, output: 1.5 },
+        capabilities: ['text'],
         category: 'text',
-        isLatest: true,
-        notes: 'Latest GPT-4o Mini model with vision capabilities',
+        isLatest: false,
+        notes: 'Legacy GPT-3.5 Turbo model. Standard: $0.50/$1.50 per 1M tokens. Batch: $0.25/$0.75. Fine-tuning: $8.00 training, $3.00/$6.00 (standard), $1.50/$3.00 (batch)',
     },
     {
-        id: 'gpt-4o',
-        name: 'GPT-4o',
+        id: 'gpt-3.5-turbo-1106',
+        name: 'GPT-3.5 Turbo (1106)',
         provider: 'OpenAI',
         available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 2.5, output: 10.0 },
-        capabilities: ['text', 'vision', 'multimodal'],
+        maxTokens: 16385,
+        contextLength: 16385,
+        pricing: { input: 1.0, output: 2.0 },
+        capabilities: ['text'],
         category: 'text',
-        isLatest: true,
-        notes: 'Latest GPT-4o model with enhanced capabilities',
+        isLatest: false,
+        notes: 'Legacy GPT-3.5 Turbo model. Standard: $1.00/$2.00 per 1M tokens. Batch: $1.00/$2.00',
     },
     {
-        id: 'gpt-4o-mini',
-        name: 'GPT-4o Mini',
+        id: 'gpt-3.5-turbo-0613',
+        name: 'GPT-3.5 Turbo (0613)',
         provider: 'OpenAI',
         available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 0.15, output: 0.6 },
-        capabilities: ['text', 'vision', 'multimodal'],
+        maxTokens: 16385,
+        contextLength: 16385,
+        pricing: { input: 1.5, output: 2.0 },
+        capabilities: ['text'],
         category: 'text',
-        isLatest: true,
-        notes: 'GPT-4o Mini model with vision capabilities',
+        isLatest: false,
+        notes: 'Legacy GPT-3.5 Turbo model. Standard: $1.50/$2.00 per 1M tokens. Batch: $1.50/$2.00',
     },
     {
-        id: 'gpt-4-turbo',
-        name: 'GPT-4 Turbo',
+        id: 'gpt-3.5-0301',
+        name: 'GPT-3.5 (0301)',
         provider: 'OpenAI',
         available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 10.0, output: 30.0 },
-        capabilities: ['text', 'vision', 'multimodal'],
+        maxTokens: 16385,
+        contextLength: 16385,
+        pricing: { input: 1.5, output: 2.0 },
+        capabilities: ['text'],
         category: 'text',
         isLatest: false,
-        notes: 'GPT-4 Turbo with vision capabilities',
+        notes: 'Legacy GPT-3.5 model. Standard: $1.50/$2.00 per 1M tokens. Batch: $1.50/$2.00',
     },
     {
-        id: 'gpt-4',
-        name: 'GPT-4',
+        id: 'gpt-3.5-turbo-16k-0613',
+        name: 'GPT-3.5 Turbo 16K (0613)',
         provider: 'OpenAI',
         available: true,
-        maxTokens: 8192,
-        contextLength: 8192,
-        pricing: { input: 30.0, output: 60.0 },
+        maxTokens: 16385,
+        contextLength: 16385,
+        pricing: { input: 3.0, output: 4.0 },
         capabilities: ['text'],
         category: 'text',
         isLatest: false,
-        notes: 'GPT-4 base model',
+        notes: 'Legacy GPT-3.5 Turbo model with 16K context. Standard: $3.00/$4.00 per 1M tokens. Batch: $1.50/$2.00',
     },
     {
-        id: 'gpt-3.5-turbo',
-        name: 'GPT-3.5 Turbo',
+        id: 'gpt-3.5-turbo-instruct',
+        name: 'GPT-3.5 Turbo Instruct',
         provider: 'OpenAI',
         available: true,
         maxTokens: 16385,
         contextLength: 16385,
-        pricing: { input: 0.5, output: 1.5 },
+        pricing: { input: 1.5, output: 2.0 },
         capabilities: ['text'],
         category: 'text',
         isLatest: false,
-        notes: 'GPT-3.5 Turbo model',
+        notes: 'Legacy GPT-3.5 Turbo Instruct model. Standard: $1.50/$2.00 per 1M tokens',
     },
     // === O-Series Models (Latest) ===
     {
@@ -195,7 +1011,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'reasoning', 'analysis', 'pro'],
         category: 'reasoning',
         isLatest: true,
-        notes: 'Version of o3 with more compute for better responses',
+        notes: 'Version of o3 with more compute for better responses. Standard: $20.00/$80.00 per 1M tokens. Batch: $10.00/$40.00',
     },
     {
         id: 'o3-deep-research',
@@ -208,7 +1024,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'research', 'analysis', 'deep'],
         category: 'research',
         isLatest: true,
-        notes: 'Our most powerful deep research model',
+        notes: 'Our most powerful deep research model. Standard: $10.00/$40.00 per 1M tokens. Batch: $5.00/$20.00. Cached input: $2.50 (standard)',
     },
     {
         id: 'o4-mini',
@@ -221,7 +1037,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'reasoning', 'efficient'],
         category: 'reasoning',
         isLatest: true,
-        notes: 'Fast, cost-efficient reasoning model, succeeded by GPT-5 mini',
+        notes: 'Fast, cost-efficient reasoning model, succeeded by GPT-5 mini. Standard: $1.10/$4.40 per 1M tokens. Batch: $0.55/$2.20. Flex: $0.55/$2.20. Priority: $2.00/$8.00. Cached input: $0.275 (standard), $0.138 (flex), $0.50 (priority). Fine-tuning: $100.00/hour training, $4.00/$1.00/$16.00 (standard), $2.00/$0.50/$8.00 (batch), $2.00/$0.50/$8.00 (with data sharing)',
     },
     {
         id: 'o4-mini-deep-research',
@@ -234,7 +1050,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'research', 'analysis', 'efficient'],
         category: 'research',
         isLatest: true,
-        notes: 'Faster, more affordable deep research model',
+        notes: 'Faster, more affordable deep research model. Standard: $2.00/$8.00 per 1M tokens. Batch: $1.00/$4.00. Cached input: $0.50 (standard)',
     },
     {
         id: 'o3',
@@ -247,7 +1063,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'reasoning', 'analysis'],
         category: 'reasoning',
         isLatest: true,
-        notes: 'Reasoning model for complex tasks, succeeded by GPT-5',
+        notes: 'Reasoning model for complex tasks, succeeded by GPT-5. Standard: $2.00/$8.00 per 1M tokens. Batch: $1.00/$4.00. Flex: $1.00/$4.00. Priority: $3.50/$14.00. Cached input: $0.50 (standard), $0.25 (flex), $0.875 (priority)',
     },
     {
         id: 'o1-pro',
@@ -260,7 +1076,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'reasoning', 'analysis', 'premium'],
         category: 'reasoning',
         isLatest: true,
-        notes: 'Version of o1 with more compute for better responses',
+        notes: 'Version of o1 with more compute for better responses. Standard: $150.00/$600.00 per 1M tokens. Batch: $75.00/$300.00',
     },
     {
         id: 'o1',
@@ -273,7 +1089,33 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'reasoning', 'analysis', 'advanced'],
         category: 'reasoning',
         isLatest: false,
-        notes: 'Previous full o-series reasoning model',
+        notes: 'Previous full o-series reasoning model. Standard: $15.00/$60.00 per 1M tokens. Batch: $7.50/$30.00. Cached input: $7.50 (standard)',
+    },
+    {
+        id: 'o3-mini',
+        name: 'o3-mini',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.1, output: 4.4 },
+        capabilities: ['text', 'reasoning', 'efficient'],
+        category: 'reasoning',
+        isLatest: false,
+        notes: 'A small model alternative to o3. Standard: $1.10/$4.40 per 1M tokens. Batch: $0.55/$2.20. Cached input: $0.55 (standard)',
+    },
+    {
+        id: 'o1-mini',
+        name: 'o1-mini',
+        provider: 'OpenAI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 1.1, output: 4.4 },
+        capabilities: ['text', 'reasoning', 'efficient'],
+        category: 'reasoning',
+        isLatest: false,
+        notes: 'Deprecated - A small model alternative to o1. Standard: $1.10/$4.40 per 1M tokens. Batch: $0.55/$2.20. Cached input: $0.55 (standard)',
     },
     // === Video Generation Models ===
     {
@@ -283,11 +1125,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.05, output: 0.05 },
+        pricing: { input: 0.1, output: 0.1 },
         capabilities: ['video-generation', 'audio', 'synced-audio'],
         category: 'video',
         isLatest: true,
-        notes: 'Flagship video generation with synced audio (priced per second)',
+        notes: 'Flagship video generation with synced audio. $0.10/sec (720p)',
     },
     {
         id: 'sora-2-pro',
@@ -296,257 +1138,233 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.1, output: 0.1 },
+        pricing: { input: 0.3, output: 0.3 },
         capabilities: ['video-generation', 'audio', 'synced-audio', 'advanced'],
         category: 'video',
         isLatest: true,
-        notes: 'Most advanced synced-audio video generation (priced per second)',
+        notes: 'Most advanced synced-audio video generation. $0.30/sec (720p), $0.50/sec (1024p)',
     },
     // === Image Generation Models ===
     {
-        id: 'gpt-image-1',
-        name: 'GPT Image 1',
+        id: 'gpt-image-1.5',
+        name: 'GPT Image 1.5',
         provider: 'OpenAI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.04, output: 0.04 },
+        pricing: { input: 5.0, output: 10.0 },
         capabilities: ['image-generation', 'text-to-image'],
         category: 'image',
         isLatest: true,
-        notes: 'State-of-the-art image generation model',
+        notes: 'Latest state-of-the-art image generation model. Text tokens: $5.00/$10.00 per 1M tokens (standard), $1.25 cached input. Image tokens: $8.00/$32.00 per 1M tokens (standard), $2.00 cached input. Per image: Low $0.009 (1024x1024), $0.013 (1024x1536/1536x1024); Medium $0.034 (1024x1024), $0.05 (1024x1536/1536x1024); High $0.133 (1024x1024), $0.2 (1024x1536/1536x1024). Text output tokens include model reasoning tokens',
     },
     {
-        id: 'gpt-image-1-mini',
-        name: 'gpt-image-1-mini',
+        id: 'chatgpt-image-latest',
+        name: 'ChatGPT Image Latest',
         provider: 'OpenAI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.02, output: 0.02 },
-        capabilities: ['image-generation', 'text-to-image', 'cost-efficient'],
+        pricing: { input: 5.0, output: 10.0 },
+        capabilities: ['image-generation', 'text-to-image'],
         category: 'image',
         isLatest: true,
-        notes: 'A cost-efficient version of GPT Image 1',
-    },
-    // === Audio and Realtime Models ===
-    {
-        id: 'gpt-realtime',
-        name: 'gpt-realtime',
-        provider: 'OpenAI',
-        available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 5.0, output: 20.0 },
-        capabilities: ['text', 'audio', 'realtime', 'multimodal'],
-        category: 'realtime',
-        isLatest: true,
-        notes: 'Model capable of realtime text and audio inputs and outputs',
-    },
-    {
-        id: 'gpt-realtime-mini',
-        name: 'gpt-realtime-mini',
-        provider: 'OpenAI',
-        available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 0.6, output: 2.4 },
-        capabilities: ['text', 'audio', 'realtime', 'efficient'],
-        category: 'realtime',
-        isLatest: true,
-        notes: 'A cost-efficient version of GPT Realtime',
-    },
-    {
-        id: 'gpt-audio',
-        name: 'gpt-audio',
-        provider: 'OpenAI',
-        available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 2.5, output: 10.0 },
-        capabilities: ['text', 'audio', 'multimodal'],
-        category: 'audio',
-        isLatest: true,
-        notes: 'For audio inputs and outputs with Chat Completions API',
-    },
-    {
-        id: 'gpt-audio-mini',
-        name: 'gpt-audio-mini',
-        provider: 'OpenAI',
-        available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 0.15, output: 0.6 },
-        capabilities: ['text', 'audio', 'efficient'],
-        category: 'audio',
-        isLatest: true,
-        notes: 'A cost-efficient version of GPT Audio',
-    },
-    // === Transcription Models ===
-    {
-        id: 'gpt-4o-transcribe',
-        name: 'GPT-4o Transcribe',
-        provider: 'OpenAI',
-        available: true,
-        maxTokens: 0,
-        contextLength: 0,
-        pricing: { input: 0.15, output: 0.15 },
-        capabilities: ['audio', 'transcription', 'speech-to-text'],
-        category: 'audio',
-        isLatest: true,
-        notes: 'Speech-to-text model powered by GPT-4o',
+        notes: 'GPT Image model used in ChatGPT. Text tokens: $5.00/$10.00 per 1M tokens (standard), $1.25 cached input. Image tokens: $8.00/$32.00 per 1M tokens (standard), $2.00 cached input. Per image: Low $0.009 (1024x1024), $0.013 (1024x1536/1536x1024); Medium $0.034 (1024x1024), $0.05 (1024x1536/1536x1024); High $0.133 (1024x1024), $0.2 (1024x1536/1536x1024)',
     },
     {
-        id: 'gpt-4o-transcribe-diarize',
-        name: 'GPT-4o Transcribe Diarize',
+        id: 'gpt-image-1',
+        name: 'GPT Image 1',
         provider: 'OpenAI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.2, output: 0.2 },
-        capabilities: ['audio', 'transcription', 'speech-to-text', 'diarization'],
-        category: 'audio',
-        isLatest: true,
-        notes: "Transcription model that identifies who's speaking when",
+        pricing: { input: 5.0, output: 0.0 },
+        capabilities: ['image-generation', 'text-to-image'],
+        category: 'image',
+        isLatest: false,
+        notes: 'State-of-the-art image generation model. Text tokens: $5.00 per 1M tokens (standard), $1.25 cached input. Image tokens: $10.00/$40.00 per 1M tokens (standard), $2.50 cached input. Per image: Low $0.011 (1024x1024), $0.016 (1024x1536/1536x1024); Medium $0.042 (1024x1024), $0.063 (1024x1536/1536x1024); High $0.167 (1024x1024), $0.25 (1024x1536/1536x1024)',
     },
     {
-        id: 'gpt-4o-mini-transcribe',
-        name: 'GPT-4o mini Transcribe',
+        id: 'gpt-image-1-mini',
+        name: 'gpt-image-1-mini',
         provider: 'OpenAI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.1, output: 0.1 },
-        capabilities: ['audio', 'transcription', 'speech-to-text', 'efficient'],
-        category: 'audio',
-        isLatest: true,
-        notes: 'Speech-to-text model powered by GPT-4o mini',
+        pricing: { input: 2.0, output: 0.0 },
+        capabilities: ['image-generation', 'text-to-image', 'cost-efficient'],
+        category: 'image',
+        isLatest: false,
+        notes: 'A cost-efficient version of GPT Image 1. Text tokens: $2.00 per 1M tokens (standard), $0.20 cached input. Image tokens: $2.50/$8.00 per 1M tokens (standard), $0.25 cached input. Per image: Low $0.005 (1024x1024), $0.006 (1024x1536/1536x1024); Medium $0.011 (1024x1024), $0.015 (1024x1536/1536x1024); High $0.036 (1024x1024), $0.052 (1024x1536/1536x1024)',
     },
     {
-        id: 'whisper-1',
-        name: 'Whisper',
+        id: 'dall-e-3',
+        name: 'DALL·E 3',
         provider: 'OpenAI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.006, output: 0.006 },
-        capabilities: [
-            'audio',
-            'transcription',
-            'speech-to-text',
-            'general-purpose',
-        ],
-        category: 'audio',
-        isLatest: true,
-        notes: 'General-purpose speech recognition model (priced per minute)',
+        pricing: { input: 0.04, output: 0.08 },
+        capabilities: ['image-generation', 'text-to-image'],
+        category: 'image',
+        isLatest: false,
+        notes: 'Previous generation image generation model. Standard: $0.04 (1024x1024), $0.08 (1024x1536/1536x1024). HD: $0.08 (1024x1024), $0.12 (1024x1536/1536x1024)',
     },
-    // === Text-to-Speech Models ===
     {
-        id: 'gpt-4o-mini-tts',
-        name: 'GPT-4o mini TTS',
+        id: 'dall-e-2',
+        name: 'DALL·E 2',
         provider: 'OpenAI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.15, output: 0.15 },
-        capabilities: ['audio', 'text-to-speech', 'tts'],
-        category: 'audio',
-        isLatest: true,
-        notes: 'Text-to-speech model powered by GPT-4o mini',
+        pricing: { input: 0.016, output: 0.02 },
+        capabilities: ['image-generation', 'text-to-image'],
+        category: 'image',
+        isLatest: false,
+        notes: 'Our first image generation model. Standard: $0.016 (1024x1024), $0.018 (1024x1536), $0.02 (1536x1024)',
     },
     {
-        id: 'tts-1',
-        name: 'TTS-1',
+        id: 'gpt-image-1-mini',
+        name: 'gpt-image-1-mini',
         provider: 'OpenAI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.015, output: 0.015 },
-        capabilities: ['audio', 'text-to-speech', 'tts', 'fast'],
-        category: 'audio',
+        pricing: { input: 0.02, output: 0.02 },
+        capabilities: ['image-generation', 'text-to-image', 'cost-efficient'],
+        category: 'image',
         isLatest: true,
-        notes: 'Text-to-speech model optimized for speed (priced per 1K characters)',
+        notes: 'A cost-efficient version of GPT Image 1',
     },
+    // === Anthropic Models ===
+    // === Claude 4.5 Series (Latest) ===
     {
-        id: 'tts-1-hd',
-        name: 'TTS-1 HD',
-        provider: 'OpenAI',
+        id: 'claude-sonnet-4-5-20250929',
+        name: 'Claude Sonnet 4.5',
+        provider: 'Anthropic',
         available: true,
-        maxTokens: 0,
-        contextLength: 0,
-        pricing: { input: 0.03, output: 0.03 },
-        capabilities: ['audio', 'text-to-speech', 'tts', 'high-quality'],
-        category: 'audio',
+        maxTokens: 64000,
+        contextLength: 200000,
+        pricing: { input: 3.0, output: 15.0 },
+        capabilities: [
+            'text',
+            'vision',
+            'multimodal',
+            'reasoning',
+            'coding',
+            'agents',
+            'extended-thinking',
+            'multilingual',
+        ],
+        category: 'multimodal',
         isLatest: true,
-        notes: 'Text-to-speech model optimized for quality (priced per 1K characters)',
+        notes: 'Latest Claude Sonnet model with enhanced capabilities and 1M context window support (beta). Reliable knowledge cutoff: Jan 2025. Training data cutoff: Jul 2025. Max output: 64K tokens',
     },
-    // === Open-Weight Models ===
     {
-        id: 'gpt-oss-120b',
-        name: 'gpt-oss-120b',
-        provider: 'OpenAI',
+        id: 'claude-sonnet-4-5',
+        name: 'Claude Sonnet 4.5 (Alias)',
+        provider: 'Anthropic',
         available: true,
-        maxTokens: 131072,
-        contextLength: 131072,
-        pricing: { input: 0.0, output: 0.0 },
-        capabilities: ['text', 'open-source', 'open-weight'],
-        category: 'text',
+        maxTokens: 64000,
+        contextLength: 200000,
+        pricing: { input: 3.0, output: 15.0 },
+        capabilities: [
+            'text',
+            'vision',
+            'multimodal',
+            'reasoning',
+            'coding',
+            'agents',
+            'extended-thinking',
+            'multilingual',
+        ],
+        category: 'multimodal',
         isLatest: true,
-        notes: 'Most powerful open-weight model, fits into an H100 GPU. Licensed under Apache 2.0',
+        notes: 'Alias for claude-sonnet-4-5-20250929 - automatically points to latest snapshot',
     },
     {
-        id: 'gpt-oss-20b',
-        name: 'gpt-oss-20b',
-        provider: 'OpenAI',
+        id: 'claude-haiku-4-5-20251001',
+        name: 'Claude Haiku 4.5',
+        provider: 'Anthropic',
         available: true,
-        maxTokens: 131072,
-        contextLength: 131072,
-        pricing: { input: 0.0, output: 0.0 },
-        capabilities: ['text', 'open-source', 'open-weight', 'low-latency'],
-        category: 'text',
+        maxTokens: 64000,
+        contextLength: 200000,
+        pricing: { input: 1.0, output: 5.0 },
+        capabilities: [
+            'text',
+            'vision',
+            'multimodal',
+            'fast',
+            'extended-thinking',
+            'multilingual',
+        ],
+        category: 'multimodal',
         isLatest: true,
-        notes: 'Medium-sized open-weight model for low latency. Licensed under Apache 2.0',
+        notes: 'Latest Claude Haiku model with improved performance and capabilities. Reliable knowledge cutoff: Feb 2025. Training data cutoff: Jul 2025. Max output: 64K tokens',
     },
     {
-        id: 'gpt-4.1',
-        name: 'GPT-4.1',
-        provider: 'OpenAI',
+        id: 'claude-haiku-4-5',
+        name: 'Claude Haiku 4.5 (Alias)',
+        provider: 'Anthropic',
         available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 2.0, output: 8.0 },
-        capabilities: ['text', 'analysis', 'enhanced'],
-        category: 'text',
+        maxTokens: 64000,
+        contextLength: 200000,
+        pricing: { input: 1.0, output: 5.0 },
+        capabilities: [
+            'text',
+            'vision',
+            'multimodal',
+            'fast',
+            'extended-thinking',
+            'multilingual',
+        ],
+        category: 'multimodal',
         isLatest: true,
-        notes: 'Smartest non-reasoning model',
+        notes: 'Alias for claude-haiku-4-5-20251001 - automatically points to latest snapshot',
     },
     {
-        id: 'gpt-4.1-mini',
-        name: 'GPT-4.1 mini',
-        provider: 'OpenAI',
+        id: 'claude-opus-4-5-20251101',
+        name: 'Claude Opus 4.5',
+        provider: 'Anthropic',
         available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 0.4, output: 1.6 },
-        capabilities: ['text', 'analysis', 'efficient'],
-        category: 'text',
+        maxTokens: 64000,
+        contextLength: 200000,
+        pricing: { input: 5.0, output: 25.0 },
+        capabilities: [
+            'text',
+            'vision',
+            'multimodal',
+            'reasoning',
+            'premium',
+            'extended-thinking',
+            'multilingual',
+        ],
+        category: 'multimodal',
         isLatest: true,
-        notes: 'Smaller, faster version of GPT-4.1',
+        notes: 'Latest Claude Opus model with enhanced capabilities. Reliable knowledge cutoff: May 2025. Training data cutoff: Aug 2025. Max output: 64K tokens',
     },
     {
-        id: 'gpt-4.1-nano',
-        name: 'GPT-4.1 nano',
-        provider: 'OpenAI',
+        id: 'claude-opus-4-5',
+        name: 'Claude Opus 4.5 (Alias)',
+        provider: 'Anthropic',
         available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 0.1, output: 0.4 },
-        capabilities: ['text', 'fast', 'cost-effective'],
-        category: 'text',
+        maxTokens: 64000,
+        contextLength: 200000,
+        pricing: { input: 5.0, output: 25.0 },
+        capabilities: [
+            'text',
+            'vision',
+            'multimodal',
+            'reasoning',
+            'premium',
+            'extended-thinking',
+            'multilingual',
+        ],
+        category: 'multimodal',
         isLatest: true,
-        notes: 'Fastest, most cost-efficient version of GPT-4.1',
+        notes: 'Alias for claude-opus-4-5-20251101 - automatically points to latest snapshot',
     },
-    // === Anthropic Models ===
+    // === Claude 4 Series (Legacy) ===
     {
         id: 'claude-opus-4-1-20250805',
         name: 'Claude Opus 4.1',
@@ -564,8 +1382,8 @@ exports.AVAILABLE_MODELS = [
             'multilingual',
         ],
         category: 'multimodal',
-        isLatest: true,
-        notes: 'Most capable and intelligent Claude model yet - superior reasoning and advanced coding (Mar 2025 cutoff)',
+        isLatest: false,
+        notes: 'Legacy model - migrate to Claude Opus 4.5. Reliable knowledge cutoff: Jan 2025. Training data cutoff: Mar 2025. Max output: 32K tokens',
     },
     {
         id: 'claude-opus-4-20250514',
@@ -584,8 +1402,8 @@ exports.AVAILABLE_MODELS = [
             'multilingual',
         ],
         category: 'multimodal',
-        isLatest: true,
-        notes: 'Previous flagship model with very high intelligence and capability (Mar 2025 cutoff)',
+        isLatest: false,
+        notes: 'Legacy model - migrate to Claude Opus 4.5. Reliable knowledge cutoff: Jan 2025. Training data cutoff: Mar 2025. Max output: 32K tokens',
     },
     {
         id: 'claude-sonnet-4-20250514',
@@ -600,13 +1418,15 @@ exports.AVAILABLE_MODELS = [
             'vision',
             'multimodal',
             'reasoning',
+            'coding',
             'extended-thinking',
             'multilingual',
         ],
         category: 'multimodal',
         isLatest: false,
-        notes: 'High-performance model with exceptional reasoning (Mar 2025 cutoff, 1M context beta available). Use Claude Sonnet 4.5 for latest version',
+        notes: 'Legacy model - migrate to Claude Sonnet 4.5. Reliable knowledge cutoff: Jan 2025. Training data cutoff: Mar 2025. Max output: 64K tokens. 1M context beta available',
     },
+    // === Claude 3.7 Series (Deprecated) ===
     {
         id: 'claude-3-7-sonnet-20250219',
         name: 'Claude Sonnet 3.7',
@@ -620,13 +1440,15 @@ exports.AVAILABLE_MODELS = [
             'vision',
             'multimodal',
             'reasoning',
+            'coding',
             'extended-thinking',
             'multilingual',
         ],
         category: 'multimodal',
         isLatest: false,
-        notes: 'High-performance model with early extended thinking (Oct 2024 cutoff, 64k output). Deprecated - use Claude Sonnet 4.5 instead',
+        notes: 'DEPRECATED - migrate to Claude Sonnet 4.5. Reliable knowledge cutoff: Oct 2024. Training data cutoff: Nov 2024. Max output: 64K tokens',
     },
+    // === Claude 3.5 Series ===
     {
         id: 'claude-3-5-sonnet-20241022',
         name: 'Claude Sonnet 3.5 v2',
@@ -641,52 +1463,66 @@ exports.AVAILABLE_MODELS = [
         notes: 'Upgraded Claude 3.5 Sonnet (Apr 2024 cutoff, 8k output)',
     },
     {
-        id: 'claude-sonnet-4-5',
-        name: 'Claude Sonnet 4.5',
+        id: 'claude-3-5-haiku-20241022',
+        name: 'Claude Haiku 3.5',
         provider: 'Anthropic',
         available: true,
-        maxTokens: 200000,
+        maxTokens: 8192,
         contextLength: 200000,
-        pricing: { input: 3.0, output: 15.0 },
+        pricing: { input: 0.8, output: 4.0 },
+        capabilities: ['text', 'vision', 'multimodal', 'fast', 'multilingual'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'Legacy model - migrate to Claude Haiku 4.5. Training data cutoff: July 2024. Max output: 8K tokens',
+    },
+    // === Google AI Models ===
+    // === Gemini 3 Models (Latest) ===
+    {
+        id: 'gemini-3-pro-preview',
+        name: 'Gemini 3 Pro Preview',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 2000000,
+        contextLength: 2000000,
+        pricing: { input: 2.0, output: 12.0 },
         capabilities: [
             'text',
             'vision',
-            'multimodal',
             'reasoning',
-            'extended-thinking',
-            'multilingual',
+            'coding',
+            'agents',
+            'multimodal',
         ],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Latest Claude Sonnet model with enhanced capabilities and 1M context window support (beta)',
+        notes: 'Latest Gemini 3 Pro preview model. Input (text, image, video, audio): $2.00/1M tokens (<=200K), $4.00/1M tokens (>200K). Text output: $12.00/1M tokens (<=200K), $18.00/1M tokens (>200K). Cached input: $0.20/1M tokens (<=200K), $0.40/1M tokens (>200K). Batch API: $1.00/$6.00 (<=200K), $2.00/$9.00 (>200K). Image output: $120/1M tokens (1K/2K image = 1120 tokens = $0.134/image, 4K image = 2000 tokens = $0.24/image)',
     },
     {
-        id: 'claude-haiku-4-5',
-        name: 'Claude Haiku 4.5',
-        provider: 'Anthropic',
+        id: 'gemini-3-pro-image-preview',
+        name: 'Gemini 3 Pro Image Preview',
+        provider: 'Google AI',
         available: true,
-        maxTokens: 200000,
-        contextLength: 200000,
-        pricing: { input: 1.0, output: 5.0 },
-        capabilities: ['text', 'vision', 'multimodal', 'multilingual'],
+        maxTokens: 2000000,
+        contextLength: 2000000,
+        pricing: { input: 2.0, output: 12.0 },
+        capabilities: ['text', 'image', 'vision', 'multimodal'],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Latest Claude Haiku model with improved performance and capabilities',
+        notes: 'Latest Gemini 3 Pro Image preview model with image generation capabilities. Image output: $120/1M tokens (1K/2K image = 1120 tokens = $0.134/image, 4K image = 2000 tokens = $0.24/image)',
     },
     {
-        id: 'claude-3-5-haiku-20241022',
-        name: 'Claude Haiku 3.5',
-        provider: 'Anthropic',
+        id: 'gemini-3-flash-preview',
+        name: 'Gemini 3 Flash Preview',
+        provider: 'Google AI',
         available: true,
-        maxTokens: 8192,
-        contextLength: 200000,
-        pricing: { input: 0.8, output: 4.0 },
-        capabilities: ['text', 'vision', 'multimodal', 'multilingual'],
+        maxTokens: 2000000,
+        contextLength: 2000000,
+        pricing: { input: 0.5, output: 3.0 },
+        capabilities: ['text', 'vision', 'audio', 'fast', 'multimodal'],
         category: 'multimodal',
-        isLatest: false,
-        notes: 'Fastest Claude model (July 2024 cutoff, 8k output)',
+        isLatest: true,
+        notes: 'Latest Gemini 3 Flash preview model. Input (text, image, video): $0.50/1M tokens. Input (audio): $1.00/1M tokens. Text output: $3.00/1M tokens. Cached input: $0.05/1M tokens (text/image/video), $0.10/1M tokens (audio). Batch API: $0.25/1M tokens (text/image/video), $0.50/1M tokens (audio) input, $1.50/1M tokens output',
     },
-    // === Google AI Models ===
     // === Gemini 2.5 Models (Latest) ===
     {
         id: 'gemini-2.5-pro',
@@ -696,17 +1532,30 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 2000000,
         contextLength: 2000000,
         pricing: { input: 1.25, output: 10.0 },
+        capabilities: ['text', 'vision', 'reasoning', 'coding', 'multimodal'],
+        category: 'multimodal',
+        isLatest: true,
+        notes: 'Our state-of-the-art thinking model, capable of reasoning over complex problems in code, math, and STEM, as well as analyzing large datasets, codebases, and documents using long context. Best for multimodal understanding, coding (web development), and complex prompts. Input (text, image, video, audio): $1.25/1M tokens (<=200K), $2.50/1M tokens (>200K). Text output: $10.00/1M tokens (<=200K), $15.00/1M tokens (>200K). Cached: $0.125/1M tokens (<=200K), $0.250/1M tokens (>200K). Batch API: $0.625/$5.00 (<=200K), $1.25/$7.50 (>200K)',
+    },
+    {
+        id: 'gemini-2.5-pro-computer-use-preview',
+        name: 'Gemini 2.5 Pro Computer Use-Preview',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 2000000,
+        contextLength: 2000000,
+        pricing: { input: 1.25, output: 10.0 },
         capabilities: [
             'text',
-            'multimodal',
+            'vision',
             'reasoning',
             'coding',
-            'complex-problems',
-            'thinking',
+            'computer-use',
+            'multimodal',
         ],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Our state-of-the-art thinking model, capable of reasoning over complex problems in code, math, and STEM, as well as analyzing large datasets, codebases, and documents using long context',
+        notes: 'Gemini 2.5 Pro with Computer Use capabilities. Input (text, image, video, audio): $1.25/1M tokens (<=200K), $2.50/1M tokens (>200K). Text output: $10.00/1M tokens (<=200K), $15.00/1M tokens (>200K). Computer Use billing uses the Gemini 2.5 Pro SKU',
     },
     {
         id: 'gemini-2.5-flash',
@@ -718,17 +1567,28 @@ exports.AVAILABLE_MODELS = [
         pricing: { input: 0.3, output: 2.5 },
         capabilities: [
             'text',
-            'image',
-            'video',
+            'vision',
+            'audio',
+            'fast',
             'multimodal',
-            'reasoning',
-            'thinking',
-            'live-api',
-            'agents',
+            'image-generation',
         ],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Our best model in terms of price-performance, offering well-rounded capabilities. Best for large scale processing, low-latency, high volume tasks that require thinking, and agentic use cases',
+        notes: "Our best model in terms of price-performance, offering well-rounded capabilities. Best for large scale processing, low-latency, high volume tasks that require thinking, and agentic use cases. Support for Live API included for some endpoints. See the model's thinking process as part of the response. Input (text, image, video): $0.30/1M tokens. Audio input: $1.00/1M tokens. Text output: $2.50/1M tokens. Image output: $30/1M tokens (1024x1024 image = 1290 tokens). Cached: $0.030/1M tokens. Batch API: $0.15/$1.25 (text/image/video), $0.50/$1.25 (audio)",
+    },
+    {
+        id: 'gemini-2.5-flash-preview-09-2025',
+        name: 'Gemini 2.5 Flash Preview',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 1000000,
+        contextLength: 1000000,
+        pricing: { input: 0.3, output: 2.5 },
+        capabilities: ['text', 'vision', 'audio', 'fast'],
+        category: 'multimodal',
+        isLatest: true,
+        notes: 'Gemini 2.5 Flash preview model. Cached: $0.03',
     },
     {
         id: 'gemini-2.5-flash-lite-preview',
@@ -749,7 +1609,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Our fastest flash model optimized for cost-efficiency and high throughput. Features 1M token context window and multimodal input',
+        notes: 'Our fastest flash model optimized for cost-efficiency and high throughput. Features 1M token context window and multimodal input. Outperforms 2.0 Flash on most evaluation benchmarks. Audio input: $0.50',
     },
     {
         id: 'gemini-2.5-flash-lite',
@@ -759,18 +1619,10 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 1000000,
         contextLength: 1000000,
         pricing: { input: 0.1, output: 0.4 },
-        capabilities: [
-            'text',
-            'image',
-            'video',
-            'multimodal',
-            'reasoning',
-            'thinking',
-            'high-throughput',
-        ],
+        capabilities: ['text', 'vision', 'fast', 'multimodal'],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Our fastest flash model optimized for cost-efficiency and high throughput (stable version)',
+        notes: 'Our fastest flash model optimized for cost-efficiency and high throughput (stable version). Features 1M token context window and multimodal input. Input (text, image, video): $0.10/1M tokens. Audio input: $0.30/1M tokens. Text output: $0.40/1M tokens. Cached: $0.010/1M tokens (text/image/video), $0.030/1M tokens (audio). Batch API: $0.05/$0.20 (text/image/video), $0.15/$0.20 (audio)',
     },
     {
         id: 'gemini-2.5-flash-audio',
@@ -792,11 +1644,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 1000000,
         contextLength: 1000000,
-        pricing: { input: 0.5, output: 0.4 },
+        pricing: { input: 0.3, output: 0.4 },
         capabilities: ['audio', 'multimodal', 'audio-input', 'high-throughput'],
         category: 'audio',
         isLatest: true,
-        notes: 'Gemini 2.5 Flash-Lite with audio input capabilities',
+        notes: 'Gemini 2.5 Flash-Lite with audio input capabilities. Audio input: $0.30/1M tokens. Text output: $0.40/1M tokens',
     },
     {
         id: 'gemini-2.5-flash-native-audio',
@@ -809,7 +1661,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['audio', 'multimodal', 'native-audio'],
         category: 'audio',
         isLatest: true,
-        notes: 'Native audio model optimized for higher quality audio outputs',
+        notes: 'Native audio model optimized for higher quality audio outputs. Audio/video input: $3.00, Audio output: $12.00',
     },
     {
         id: 'gemini-2.5-flash-native-audio-output',
@@ -858,18 +1710,24 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 1000000,
         contextLength: 1000000,
-        pricing: { input: 0.1, output: 0.4 },
-        capabilities: [
-            'text',
-            'image',
-            'video',
-            'multimodal',
-            'agents',
-            'next-generation',
-        ],
+        pricing: { input: 0.15, output: 0.6 },
+        capabilities: ['text', 'vision', 'audio', 'multimodal'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'Our second generation workhorse model, with a 1 million token context window. Most balanced multimodal model built for the era of Agents. Input (text, image, video): $0.15/1M tokens. Audio input: $1.00/1M tokens. Text output: $0.60/1M tokens. Batch API: $0.075/$0.30. Tuning: $3.00/1M training tokens',
+    },
+    {
+        id: 'gemini-2.0-flash-image-generation',
+        name: 'Gemini 2.0 Flash Image Generation',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 1000000,
+        contextLength: 1000000,
+        pricing: { input: 0.15, output: 30.0 },
+        capabilities: ['text', 'vision', 'audio', 'image-generation', 'multimodal'],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Our second generation workhorse model, with a 1 million token context window',
+        notes: 'Gemini 2.0 Flash with image generation capabilities. Input (text, image, video): $0.15/1M tokens. Audio input: $1.00/1M tokens. Video input: $3.00/1M tokens. Text output: $0.60/1M tokens. Image output: $30.00/1M tokens',
     },
     {
         id: 'gemini-2.0-flash-lite',
@@ -879,10 +1737,10 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 1000000,
         contextLength: 1000000,
         pricing: { input: 0.075, output: 0.3 },
-        capabilities: ['text', 'multimodal', 'cost-efficient', 'low-latency'],
+        capabilities: ['text', 'fast', 'multimodal'],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Our second generation small workhorse model, with a 1 million token context window',
+        notes: 'Our second generation small workhorse model, with a 1 million token context window. Optimized for cost efficiency and low latency, built for at scale usage. Input (text, image, video, audio): $0.075/1M tokens. Text output: $0.30/1M tokens. Batch API: $0.0375/$0.15. Tuning: $1.00/1M training tokens',
     },
     {
         id: 'gemini-2.0-flash-audio',
@@ -909,7 +1767,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'image', 'video', 'multimodal'],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Fastest multimodal model for diverse, repetitive tasks',
+        notes: 'Fastest multimodal model for diverse, repetitive tasks. $0.15/$0.60 for prompts > 128k tokens',
     },
     {
         id: 'gemini-1.5-flash-large-context',
@@ -935,7 +1793,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'image', 'video', 'multimodal', 'efficient'],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Smallest model for lower intelligence use cases',
+        notes: 'Smallest model for lower intelligence use cases. $0.075/$0.30 for prompts > 128k tokens',
     },
     {
         id: 'gemini-1.5-flash-8b-large-context',
@@ -968,7 +1826,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'code', 'reasoning', 'multimodal'],
         category: 'text',
         isLatest: false,
-        notes: 'Highest intelligence Gemini 1.5 series model with 2M context',
+        notes: 'Highest intelligence Gemini 1.5 series model with 2M context. $2.50/$10.00 for prompts > 128k tokens',
     },
     {
         id: 'gemini-1.5-pro-large-context',
@@ -1001,7 +1859,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'text',
         isLatest: true,
-        notes: 'The latest open models, designed for efficient execution on low-resource devices, capable of multimodal input (text, image, video, audio), and trained with data in over 140 spoken languages',
+        notes: 'The latest open models, designed for efficient execution on low-resource devices, capable of multimodal input (text, image, video, audio), and trained with data in over 140 spoken languages. Open model built for efficient performance on everyday devices (free tier only)',
     },
     {
         id: 'gemma-3',
@@ -1020,7 +1878,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'text',
         isLatest: true,
-        notes: 'The third generation of our open models, featuring the ability to solve a wide variety of tasks with text and image input, support for over 140 languages, and long 128K context window',
+        notes: 'The third generation of our open models, featuring the ability to solve a wide variety of tasks with text and image input, support for over 140 languages, and long 128K context window (free tier only)',
     },
     {
         id: 'gemma-2',
@@ -1039,7 +1897,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'text',
         isLatest: false,
-        notes: 'The second generation of our open models featuring text generation, summarization, and extraction',
+        notes: 'The second generation of our open models featuring text generation, summarization, and extraction (free tier only)',
     },
     {
         id: 'gemma',
@@ -1059,7 +1917,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'text',
         isLatest: false,
-        notes: 'A small-sized, lightweight open model supporting text generation, summarization, and extraction',
+        notes: 'A small-sized, lightweight open model supporting text generation, summarization, and extraction (free tier only)',
     },
     // === Specialized Gemma Models ===
     {
@@ -1078,7 +1936,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'safety',
         isLatest: true,
-        notes: 'Instruction tuned models for evaluating the safety of text and images against a set of defined safety policies',
+        notes: 'Instruction tuned models for evaluating the safety of text and images against a set of defined safety policies (free tier only)',
     },
     {
         id: 'paligemma',
@@ -1091,7 +1949,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'open-source', 'vision-language', 'siglip', 'gemma'],
         category: 'vision-language',
         isLatest: true,
-        notes: 'Our open vision-language model that combines SigLIP and Gemma',
+        notes: 'Our open vision-language model that combines SigLIP and Gemma (free tier only)',
     },
     {
         id: 'codegemma',
@@ -1111,7 +1969,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'coding',
         isLatest: true,
-        notes: 'Powerful, lightweight open model that can perform a variety of coding tasks like fill-in-the-middle code completion, code generation, natural language understanding, mathematical reasoning, and instruction following',
+        notes: 'Powerful, lightweight open model that can perform a variety of coding tasks like fill-in-the-middle code completion, code generation, natural language understanding, mathematical reasoning, and instruction following (free tier only)',
     },
     {
         id: 'txgemma',
@@ -1131,7 +1989,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'therapeutic',
         isLatest: true,
-        notes: 'Generates predictions, classifications or text based on therapeutic related data and can be used to efficiently build AI models for therapeutic-related tasks with less data and less compute',
+        notes: 'Generates predictions, classifications or text based on therapeutic related data and can be used to efficiently build AI models for therapeutic-related tasks with less data and less compute (free tier only)',
     },
     {
         id: 'medgemma',
@@ -1150,7 +2008,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'medical',
         isLatest: true,
-        notes: 'Collection of Gemma 3 variants that are trained for performance on medical text and image comprehension',
+        notes: 'Collection of Gemma 3 variants that are trained for performance on medical text and image comprehension (free tier only)',
     },
     {
         id: 'medsiglip',
@@ -1169,7 +2027,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'medical',
         isLatest: true,
-        notes: 'SigLIP variant that is trained to encode medical images and text into a common embedding space',
+        notes: 'SigLIP variant that is trained to encode medical images and text into a common embedding space (free tier only)',
     },
     {
         id: 't5gemma',
@@ -1189,9 +2047,22 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'research',
         isLatest: true,
-        notes: 'A family of lightweight yet powerful encoder-decoder research models from Google',
+        notes: 'A family of lightweight yet powerful encoder-decoder research models from Google (free tier only)',
     },
     // === Embeddings Models ===
+    {
+        id: 'gemini-embedding-001',
+        name: 'Gemini Embedding',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 2048,
+        contextLength: 2048,
+        pricing: { input: 0.15, output: 0.0 },
+        capabilities: ['embeddings', 'semantic-search'],
+        category: 'embedding',
+        isLatest: true,
+        notes: 'Gemini embedding model for semantic search and similarity tasks. Online requests: $0.00015 per 1,000 input tokens. Batch requests: $0.00012 per 1,000 input tokens. Output: No charge',
+    },
     {
         id: 'text-embedding-004',
         name: 'Text Embedding 004',
@@ -1206,170 +2077,503 @@ exports.AVAILABLE_MODELS = [
             'classification',
             'clustering',
         ],
-        category: 'embedding',
+        category: 'embedding',
+        isLatest: true,
+        notes: 'State-of-the-art text embedding model for semantic search, classification, clustering, and similar tasks (free tier only)',
+    },
+    {
+        id: 'multimodal-embeddings',
+        name: 'Multimodal Embeddings',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 2048,
+        contextLength: 2048,
+        pricing: { input: 0.0, output: 0.0 },
+        capabilities: [
+            'embedding',
+            'multimodal',
+            'image-classification',
+            'image-search',
+        ],
+        category: 'embedding',
+        isLatest: true,
+        notes: 'Generates vectors based on images, which can be used for downstream tasks like image classification, image search, and more (free tier only)',
+    },
+    // === Imagen Models (Image Generation) ===
+    {
+        id: 'imagen-4-generation',
+        name: 'Imagen 4 for Generation',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.04, output: 0.04 },
+        capabilities: ['image-generation', 'text-to-image', 'higher-quality'],
+        category: 'image',
+        isLatest: true,
+        notes: 'Use text prompts to generate novel images with higher quality than our previous image generation models. Priced at $0.04 per image',
+    },
+    {
+        id: 'imagen-4-fast-generation',
+        name: 'Imagen 4 for Fast Generation',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.02, output: 0.02 },
+        capabilities: [
+            'image-generation',
+            'text-to-image',
+            'higher-quality',
+            'lower-latency',
+        ],
+        category: 'image',
+        isLatest: true,
+        notes: 'Use text prompts to generate novel images with higher quality and lower latency than our previous image generation models. Priced at $0.02 per image',
+    },
+    {
+        id: 'imagen-4-ultra-generation',
+        name: 'Imagen 4 for Ultra Generation',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.06, output: 0.06 },
+        capabilities: [
+            'image-generation',
+            'text-to-image',
+            'higher-quality',
+            'better-prompt-adherence',
+        ],
+        category: 'image',
+        isLatest: true,
+        notes: 'Use text prompts to generate novel images with higher quality and better prompt adherence than our previous image generation models. Priced at $0.06 per image',
+    },
+    {
+        id: 'imagen-4-upscaling',
+        name: 'Imagen 4 for Upscaling',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.06, output: 0.06 },
+        capabilities: ['image-generation', 'upscaling', 'image-enhancement'],
+        category: 'image',
+        isLatest: true,
+        notes: 'Increase resolution of a generated image to 2K, 3K, and 4K. Priced at $0.06 per image',
+    },
+    {
+        id: 'imagen-3-generation',
+        name: 'Imagen 3 for Generation',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.04, output: 0.0 },
+        capabilities: [
+            'image-generation',
+            'text-to-image',
+            'image-editing',
+            'customization',
+        ],
+        category: 'image',
+        isLatest: false,
+        notes: 'Use text prompts to generate novel images, edit an image, or customize an image. Priced at $0.04 per image',
+    },
+    {
+        id: 'imagen-3-editing-customization',
+        name: 'Imagen 3 for Editing and Customization',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.03, output: 0.03 },
+        capabilities: [
+            'image-generation',
+            'text-to-image',
+            'image-editing',
+            'customization',
+            'mask-editing',
+        ],
+        category: 'image',
+        isLatest: false,
+        notes: 'Use text prompts to edit existing input images, or parts of an image with a mask or generate new images based upon the context provided by input reference images',
+    },
+    {
+        id: 'imagen-3-fast-generation',
+        name: 'Imagen 3 for Fast Generation',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.02, output: 0.02 },
+        capabilities: ['image-generation', 'text-to-image', 'lower-latency'],
+        category: 'image',
+        isLatest: false,
+        notes: 'Use text prompts to generate novel images with lower latency than our other image generation models. Priced at $0.02 per image',
+    },
+    {
+        id: 'imagen-2-generation',
+        name: 'Imagen 2 for Generation',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.02, output: 0.02 },
+        capabilities: ['image-generation', 'text-to-image'],
+        category: 'image',
+        isLatest: false,
+        notes: 'Use text prompts to generate novel images. Priced at $0.020 per image',
+    },
+    {
+        id: 'imagen-2-editing',
+        name: 'Imagen 2 for Editing',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.02, output: 0.02 },
+        capabilities: ['image-generation', 'image-editing', 'mask-editing'],
+        category: 'image',
+        isLatest: false,
+        notes: 'Edit an image using mask free or mask approach. Priced at $0.020 per image',
+    },
+    {
+        id: 'imagen-1-generation',
+        name: 'Imagen 1 for Generation',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.02, output: 0.02 },
+        capabilities: ['image-generation', 'text-to-image'],
+        category: 'image',
+        isLatest: false,
+        notes: 'Use text prompts to generate novel images. Priced at $0.020 per image',
+    },
+    {
+        id: 'imagen-1-editing',
+        name: 'Imagen 1 for Editing',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.02, output: 0.02 },
+        capabilities: ['image-generation', 'image-editing', 'mask-editing'],
+        category: 'image',
+        isLatest: false,
+        notes: 'Edit an image using mask free or mask approach. Priced at $0.020 per image',
+    },
+    {
+        id: 'imagen-1-upscaling',
+        name: 'Imagen 1 for Upscaling',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.003, output: 0.003 },
+        capabilities: ['image-generation', 'upscaling', 'image-enhancement'],
+        category: 'image',
+        isLatest: false,
+        notes: 'Increase resolution of a generated image to 2k and 4k. Priced at $0.003 per image',
+    },
+    {
+        id: 'imagen-visual-captioning',
+        name: 'Imagen Visual Captioning',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.0015, output: 0.0 },
+        capabilities: ['image-generation', 'captioning', 'image-analysis'],
+        category: 'image',
+        isLatest: true,
+        notes: 'Generate a short or long text caption for an image. Priced at $0.0015 per image',
+    },
+    {
+        id: 'imagen-visual-qa',
+        name: 'Imagen Visual Q&A',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.0015, output: 0.0 },
+        capabilities: ['image-generation', 'vqa', 'image-analysis'],
+        category: 'image',
+        isLatest: true,
+        notes: 'Provide an answer based on a question referencing an image. Priced at $0.0015 per image',
+    },
+    {
+        id: 'imagen-product-recontext',
+        name: 'Imagen Product Recontext',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.12, output: 0.0 },
+        capabilities: ['image-generation', 'product-recontext', 'scene-generation'],
+        category: 'image',
+        isLatest: true,
+        notes: 'Re-imagine products in a new scene. Requires 1-3 images of the same product and a text prompt describing desired scene. Priced at $0.12 per image',
+    },
+    {
+        id: 'imagen-captioning-vqa',
+        name: 'Imagen for Captioning & VQA',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.03, output: 0.03 },
+        capabilities: [
+            'image-generation',
+            'text-to-image',
+            'image-editing',
+            'mask-editing',
+            'captioning',
+            'vqa',
+        ],
+        category: 'image',
+        isLatest: false,
+        notes: 'Use text prompts to generate novel images, edit existing ones, edit parts of an image with a mask and more',
+    },
+    // === Veo Models (Video Generation) ===
+    // === Veo 3.1 Series (Latest) ===
+    {
+        id: 'veo-3.1-video-audio-720p-1080p',
+        name: 'Veo 3.1 Video + Audio (720p/1080p)',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.4, output: 0.0 },
+        capabilities: [
+            'video-generation',
+            'text-to-video',
+            'image-to-video',
+            'audio-generation',
+            'higher-quality',
+        ],
+        category: 'video',
+        isLatest: true,
+        notes: 'Generate high-quality videos with synchronized speech/sound effects from a text prompt or reference image. Output resolution: 720p, 1080p. Priced at $0.40 per second',
+    },
+    {
+        id: 'veo-3.1-video-audio-4k',
+        name: 'Veo 3.1 Video + Audio (4K)',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.6, output: 0.0 },
+        capabilities: [
+            'video-generation',
+            'text-to-video',
+            'image-to-video',
+            'audio-generation',
+            'higher-quality',
+            '4k',
+        ],
+        category: 'video',
+        isLatest: true,
+        notes: 'Generate high-quality videos with synchronized speech/sound effects from a text prompt or reference image. Output resolution: 4K. Priced at $0.60 per second',
+    },
+    {
+        id: 'veo-3.1-video-720p-1080p',
+        name: 'Veo 3.1 Video (720p/1080p)',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.2, output: 0.0 },
+        capabilities: [
+            'video-generation',
+            'text-to-video',
+            'image-to-video',
+            'higher-quality',
+        ],
+        category: 'video',
         isLatest: true,
-        notes: 'State-of-the-art text embedding model for semantic search, classification, clustering, and similar tasks',
+        notes: 'Generate high-quality videos from a text prompt or reference image. Output resolution: 720p, 1080p. Priced at $0.20 per second',
     },
     {
-        id: 'multimodal-embeddings',
-        name: 'Multimodal Embeddings',
+        id: 'veo-3.1-video-4k',
+        name: 'Veo 3.1 Video (4K)',
         provider: 'Google AI',
         available: true,
-        maxTokens: 2048,
-        contextLength: 2048,
-        pricing: { input: 0.0, output: 0.0 },
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.4, output: 0.0 },
         capabilities: [
-            'embedding',
-            'multimodal',
-            'image-classification',
-            'image-search',
+            'video-generation',
+            'text-to-video',
+            'image-to-video',
+            'higher-quality',
+            '4k',
         ],
-        category: 'embedding',
+        category: 'video',
         isLatest: true,
-        notes: 'Generates vectors based on images, which can be used for downstream tasks like image classification, image search, and more',
+        notes: 'Generate high-quality videos from a text prompt or reference image. Output resolution: 4K. Priced at $0.40 per second',
     },
-    // === Imagen Models (Image Generation) ===
     {
-        id: 'imagen-4-generation',
-        name: 'Imagen 4 for Generation',
+        id: 'veo-3.1-fast-video-audio-720p-1080p',
+        name: 'Veo 3.1 Fast Video + Audio (720p/1080p)',
         provider: 'Google AI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.04, output: 0.04 },
-        capabilities: ['image-generation', 'text-to-image', 'higher-quality'],
-        category: 'image',
+        pricing: { input: 0.15, output: 0.0 },
+        capabilities: [
+            'video-generation',
+            'text-to-video',
+            'image-to-video',
+            'audio-generation',
+            'lower-latency',
+        ],
+        category: 'video',
         isLatest: true,
-        notes: 'Use text prompts to generate novel images with higher quality than our previous image generation models',
+        notes: 'Generate videos with synchronized speech/sound effects from a text prompt or reference image faster. Output resolution: 720p, 1080p. Priced at $0.15 per second',
     },
     {
-        id: 'imagen-4-fast-generation',
-        name: 'Imagen 4 for Fast Generation',
+        id: 'veo-3.1-fast-video-audio-4k',
+        name: 'Veo 3.1 Fast Video + Audio (4K)',
         provider: 'Google AI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.04, output: 0.04 },
+        pricing: { input: 0.35, output: 0.0 },
         capabilities: [
-            'image-generation',
-            'text-to-image',
-            'higher-quality',
+            'video-generation',
+            'text-to-video',
+            'image-to-video',
+            'audio-generation',
             'lower-latency',
+            '4k',
         ],
-        category: 'image',
+        category: 'video',
         isLatest: true,
-        notes: 'Use text prompts to generate novel images with higher quality and lower latency than our previous image generation models',
+        notes: 'Generate videos with synchronized speech/sound effects from a text prompt or reference image faster. Output resolution: 4K. Priced at $0.35 per second',
     },
     {
-        id: 'imagen-4-ultra-generation',
-        name: 'Imagen 4 for Ultra Generation',
+        id: 'veo-3.1-fast-video-720p-1080p',
+        name: 'Veo 3.1 Fast Video (720p/1080p)',
         provider: 'Google AI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.06, output: 0.06 },
+        pricing: { input: 0.1, output: 0.0 },
         capabilities: [
-            'image-generation',
-            'text-to-image',
-            'higher-quality',
-            'better-prompt-adherence',
+            'video-generation',
+            'text-to-video',
+            'image-to-video',
+            'lower-latency',
         ],
-        category: 'image',
+        category: 'video',
         isLatest: true,
-        notes: 'Use text prompts to generate novel images with higher quality and better prompt adherence than our previous image generation models',
+        notes: 'Generate videos from a text prompt or reference image faster. Output resolution: 720p, 1080p. Priced at $0.10 per second',
     },
     {
-        id: 'imagen-3-generation',
-        name: 'Imagen 3 for Generation',
+        id: 'veo-3.1-fast-video-4k',
+        name: 'Veo 3.1 Fast Video (4K)',
         provider: 'Google AI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.03, output: 0.03 },
-        capabilities: ['image-generation', 'text-to-image'],
-        category: 'image',
-        isLatest: false,
-        notes: 'Use text prompts to generate novel images',
+        pricing: { input: 0.3, output: 0.0 },
+        capabilities: [
+            'video-generation',
+            'text-to-video',
+            'image-to-video',
+            'lower-latency',
+            '4k',
+        ],
+        category: 'video',
+        isLatest: true,
+        notes: 'Generate videos from a text prompt or reference image faster. Output resolution: 4K. Priced at $0.30 per second',
     },
+    // === Veo 3 Series ===
     {
-        id: 'imagen-3-editing-customization',
-        name: 'Imagen 3 for Editing and Customization',
+        id: 'veo-3-video-audio',
+        name: 'Veo 3 Video + Audio',
         provider: 'Google AI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.03, output: 0.03 },
+        pricing: { input: 0.4, output: 0.0 },
         capabilities: [
-            'image-generation',
-            'text-to-image',
-            'image-editing',
-            'customization',
-            'mask-editing',
+            'video-generation',
+            'text-to-video',
+            'image-to-video',
+            'audio-generation',
+            'higher-quality',
         ],
-        category: 'image',
-        isLatest: false,
-        notes: 'Use text prompts to edit existing input images, or parts of an image with a mask or generate new images based upon the context provided by input reference images',
+        category: 'video',
+        isLatest: true,
+        notes: 'Generate high-quality videos with synchronized speech/sound effects from a text prompt or reference image. Output resolution: 720p, 1080p. Priced at $0.40 per second',
     },
     {
-        id: 'imagen-3-fast-generation',
-        name: 'Imagen 3 for Fast Generation',
+        id: 'veo-3-video',
+        name: 'Veo 3 Video',
         provider: 'Google AI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.03, output: 0.03 },
-        capabilities: ['image-generation', 'text-to-image', 'lower-latency'],
-        category: 'image',
-        isLatest: false,
-        notes: 'Use text prompts to generate novel images with lower latency than our other image generation models',
+        pricing: { input: 0.2, output: 0.0 },
+        capabilities: [
+            'video-generation',
+            'text-to-video',
+            'image-to-video',
+            'higher-quality',
+        ],
+        category: 'video',
+        isLatest: true,
+        notes: 'Generate high-quality videos from a text prompt or reference image. Output resolution: 720p, 1080p. Priced at $0.20 per second',
     },
     {
-        id: 'imagen-captioning-vqa',
-        name: 'Imagen for Captioning & VQA',
+        id: 'veo-3-fast-video-audio',
+        name: 'Veo 3 Fast Video + Audio',
         provider: 'Google AI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.03, output: 0.03 },
+        pricing: { input: 0.15, output: 0.0 },
         capabilities: [
-            'image-generation',
-            'text-to-image',
-            'image-editing',
-            'mask-editing',
-            'captioning',
-            'vqa',
+            'video-generation',
+            'text-to-video',
+            'image-to-video',
+            'audio-generation',
+            'lower-latency',
         ],
-        category: 'image',
-        isLatest: false,
-        notes: 'Use text prompts to generate novel images, edit existing ones, edit parts of an image with a mask and more',
+        category: 'video',
+        isLatest: true,
+        notes: 'Generate videos with synchronized speech/sound effects from a text prompt or reference image faster. Output resolution: 720p, 1080p. Priced at $0.15 per second',
     },
-    // === Veo Models (Video Generation) ===
     {
-        id: 'veo-2',
-        name: 'Veo 2',
+        id: 'veo-3-fast-video',
+        name: 'Veo 3 Fast Video',
         provider: 'Google AI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.35, output: 0.35 },
+        pricing: { input: 0.1, output: 0.0 },
         capabilities: [
             'video-generation',
             'text-to-video',
             'image-to-video',
-            'higher-quality',
+            'lower-latency',
         ],
         category: 'video',
         isLatest: true,
-        notes: 'Use text prompts and images to generate novel videos with higher quality than our previous video generation model (priced per second)',
+        notes: 'Generate videos from a text prompt or reference image faster. Output resolution: 720p, 1080p. Priced at $0.10 per second',
     },
+    // === Veo 2 Series ===
     {
-        id: 'veo-3',
-        name: 'Veo 3',
+        id: 'veo-2-video',
+        name: 'Veo 2 Video',
         provider: 'Google AI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.35, output: 0.35 },
+        pricing: { input: 0.5, output: 0.0 },
         capabilities: [
             'video-generation',
             'text-to-video',
@@ -1377,27 +2581,27 @@ exports.AVAILABLE_MODELS = [
             'higher-quality',
         ],
         category: 'video',
-        isLatest: true,
-        notes: 'Use text prompts and images to generate novel videos with higher quality than our previous video generation model (priced per second)',
+        isLatest: false,
+        notes: 'Generate videos from a text prompt or reference image. Output resolution: 720p. Priced at $0.50 per second',
     },
     {
-        id: 'veo-3-fast',
-        name: 'Veo 3 Fast',
+        id: 'veo-2-advanced-controls',
+        name: 'Veo 2 Advanced Controls',
         provider: 'Google AI',
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.35, output: 0.35 },
+        pricing: { input: 0.5, output: 0.0 },
         capabilities: [
             'video-generation',
             'text-to-video',
             'image-to-video',
-            'higher-quality',
-            'lower-latency',
+            'interpolation',
+            'camera-controls',
         ],
         category: 'video',
-        isLatest: true,
-        notes: 'Use text prompts and images to generate novel videos with higher quality and lower latency than our previous video generation model (priced per second)',
+        isLatest: false,
+        notes: 'Generate videos through start and end frame interpolation, extend generated videos, and apply camera controls. Output resolution: 720p. Priced at $0.50 per second',
     },
     // === Preview Models ===
     {
@@ -1407,11 +2611,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.0, output: 0.0 },
+        pricing: { input: 0.06, output: 0.0 },
         capabilities: ['image-generation', 'virtual-try-on', 'clothing'],
         category: 'image',
         isLatest: true,
-        notes: 'Generate images of people wearing clothing products (preview model, free tier only)',
+        notes: 'Create images of people wearing different clothes. Requires 1 image of a person and 1 image of clothing. Priced at $0.06 per image',
     },
     {
         id: 'veo-3-preview',
@@ -1420,7 +2624,7 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.35, output: 0.35 },
+        pricing: { input: 0.2, output: 0.0 },
         capabilities: [
             'video-generation',
             'text-to-video',
@@ -1430,7 +2634,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'video',
         isLatest: true,
-        notes: 'Use text prompts and images to generate novel videos with higher quality than our previous video generation model (preview model, priced per second)',
+        notes: 'Use text prompts and images to generate novel videos with higher quality than our previous video generation model (preview model). Output resolution: 720p, 1080p. Priced at $0.20 per second',
     },
     {
         id: 'veo-3-fast-preview',
@@ -1439,7 +2643,7 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.35, output: 0.35 },
+        pricing: { input: 0.1, output: 0.0 },
         capabilities: [
             'video-generation',
             'text-to-video',
@@ -1450,7 +2654,21 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'video',
         isLatest: true,
-        notes: 'Use text prompts and images to generate novel videos with higher quality and lower latency than our previous video generation model (preview model, priced per second)',
+        notes: 'Use text prompts and images to generate novel videos with higher quality and lower latency than our previous video generation model (preview model). Output resolution: 720p, 1080p. Priced at $0.10 per second',
+    },
+    // === Lyria Models (Music Generation) ===
+    {
+        id: 'lyria-2',
+        name: 'Lyria 2',
+        provider: 'Google AI',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.06, output: 0.0 },
+        capabilities: ['music-generation', 'text-to-music', 'instrumental'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'High-quality instrumental music generation ideal for sophisticated composition and detailed creative exploration. Priced at $0.06 per 30 seconds',
     },
     // === Legacy Models for Backward Compatibility ===
     {
@@ -1480,6 +2698,7 @@ exports.AVAILABLE_MODELS = [
         notes: 'Earlier generation Gemini model with vision capabilities (legacy)',
     },
     // === AWS Bedrock Models ===
+    // === AI21 Labs Models ===
     {
         id: 'ai21.jamba-1-5-large-v1:0',
         name: 'Jamba 1.5 Large (Bedrock)',
@@ -1491,7 +2710,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'long-context'],
         category: 'text',
         isLatest: true,
-        notes: 'AI21 Labs Jamba 1.5 Large via AWS Bedrock',
+        notes: 'AI21 Labs Jamba 1.5 Large - advanced AI model for text generation and chat',
     },
     {
         id: 'ai21.jamba-1-5-mini-v1:0',
@@ -1504,98 +2723,232 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'long-context', 'efficient'],
         category: 'text',
         isLatest: true,
-        notes: 'AI21 Labs Jamba 1.5 Mini via AWS Bedrock',
+        notes: 'AI21 Labs Jamba 1.5 Mini - advanced AI model for text generation and chat',
+    },
+    {
+        id: 'ai21.jamba-instruct-v1:0',
+        name: 'Jamba-Instruct (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 256000,
+        contextLength: 256000,
+        pricing: { input: 0.5, output: 0.7 },
+        capabilities: ['text', 'instruct', 'long-context'],
+        category: 'text',
+        isLatest: true,
+        notes: 'AI21 Labs Jamba-Instruct - hybrid architecture for long context tasks',
+    },
+    {
+        id: 'ai21.j2-mid-v1',
+        name: 'Jurassic-2 Mid (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 8192,
+        contextLength: 8192,
+        pricing: { input: 12.5, output: 12.5 },
+        capabilities: ['text'],
+        category: 'text',
+        isLatest: true,
+        notes: 'AI21 Labs Jurassic-2 Mid - advanced AI model for text generation and chat',
+    },
+    {
+        id: 'ai21.j2-ultra-v1',
+        name: 'Jurassic-2 Ultra (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 8192,
+        contextLength: 8192,
+        pricing: { input: 18.8, output: 18.8 },
+        capabilities: ['text'],
+        category: 'text',
+        isLatest: true,
+        notes: 'AI21 Labs Jurassic-2 Ultra - advanced AI model for text generation and chat',
+    },
+    // === Amazon Nova 2.0 Series (Latest) ===
+    {
+        id: 'amazon.nova-2-lite-v1:0',
+        name: 'Nova 2 Lite (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 300000,
+        contextLength: 300000,
+        pricing: { input: 0.3, output: 2.5 },
+        capabilities: ['text', 'vision', 'video', 'multimodal', 'cache-read'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Amazon Nova 2 Lite - Text/Image/Video input: $0.3/1M tokens, Output: $2.5/1M tokens. Cache read: $0.075/1M tokens (75% discount)',
+    },
+    {
+        id: 'amazon.nova-2-omni-v1:0',
+        name: 'Nova 2 Omni Preview (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 300000,
+        contextLength: 300000,
+        pricing: { input: 0.3, output: 2.5 },
+        capabilities: [
+            'text',
+            'vision',
+            'video',
+            'audio',
+            'multimodal',
+            'cache-read',
+        ],
+        category: 'multimodal',
+        isLatest: true,
+        notes: 'Amazon Nova 2 Omni (Preview) - Text/Image/Video input: $0.3/1M tokens, Audio input: $1.0/1M tokens, Text output: $2.5/1M tokens, Image output: $40/1M tokens. Cache read: 75% discount',
+    },
+    {
+        id: 'amazon.nova-2-pro-v1:0',
+        name: 'Nova 2 Pro Preview (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 300000,
+        contextLength: 300000,
+        pricing: { input: 1.25, output: 10.0 },
+        capabilities: [
+            'text',
+            'vision',
+            'video',
+            'audio',
+            'multimodal',
+            'cache-read',
+        ],
+        category: 'multimodal',
+        isLatest: true,
+        notes: 'Amazon Nova 2 Pro (Preview) - Text/Image/Video/Audio input: $1.25/1M tokens, Text output: $10/1M tokens. Cache read: 75% discount',
+    },
+    {
+        id: 'amazon.nova-2-sonic-v1:0',
+        name: 'Nova 2 Sonic (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 300000,
+        contextLength: 300000,
+        pricing: { input: 3.0, output: 12.0 },
+        capabilities: ['speech', 'text', 'multimodal', 'native-audio'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'Amazon Nova 2 Sonic - Speech input: $3.0/1M tokens, Speech output: $12.0/1M tokens. Text input: $0.33/1M tokens, Text output: $2.75/1M tokens',
     },
+    // === Amazon Nova 1.0 Series ===
     {
         id: 'amazon.nova-micro-v1:0',
-        name: 'Amazon Nova Micro (Bedrock)',
+        name: 'Nova Micro (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
         maxTokens: 128000,
         contextLength: 128000,
         pricing: { input: 0.035, output: 0.14 },
-        capabilities: ['text', 'ultra-fast', 'cost-effective'],
+        capabilities: ['text', 'efficient', 'cache-read'],
         category: 'text',
-        isLatest: true,
-        notes: 'Amazon Nova Micro via AWS Bedrock',
+        isLatest: false,
+        notes: 'Amazon Nova Micro - Cache read: $0.00875/1M tokens (75% discount), Batch: $0.0175/$0.07 per 1M tokens',
     },
     {
         id: 'amazon.nova-lite-v1:0',
-        name: 'Amazon Nova Lite (Bedrock)',
+        name: 'Nova Lite (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
         maxTokens: 300000,
         contextLength: 300000,
         pricing: { input: 0.06, output: 0.24 },
-        capabilities: ['text', 'multimodal', 'fast'],
-        category: 'multimodal',
-        isLatest: true,
-        notes: 'Amazon Nova Lite via AWS Bedrock',
+        capabilities: ['text', 'multimodal', 'cache-read'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Amazon Nova Lite - Cache read: $0.015/1M tokens (75% discount), Batch: $0.03/$0.12 per 1M tokens',
     },
     {
         id: 'amazon.nova-pro-v1:0',
-        name: 'Amazon Nova Pro (Bedrock)',
+        name: 'Nova Pro (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
         maxTokens: 300000,
         contextLength: 300000,
         pricing: { input: 0.8, output: 3.2 },
-        capabilities: ['text', 'multimodal', 'reasoning'],
-        category: 'multimodal',
-        isLatest: true,
-        notes: 'Amazon Nova Pro via AWS Bedrock',
+        capabilities: ['text', 'multimodal', 'cache-read'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Amazon Nova Pro - Cache read: $0.2/1M tokens (75% discount), Batch: $0.4/$1.6 per 1M tokens',
     },
     {
         id: 'amazon.nova-premier-v1:0',
-        name: 'Amazon Nova Premier (Bedrock)',
+        name: 'Nova Premier (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
         maxTokens: 300000,
         contextLength: 300000,
         pricing: { input: 2.5, output: 12.5 },
         capabilities: ['text', 'multimodal', 'advanced-reasoning'],
-        category: 'multimodal',
-        isLatest: true,
-        notes: 'Amazon Nova Premier via AWS Bedrock',
+        category: 'text',
+        isLatest: false,
+        notes: 'Amazon Nova Premier - Advanced reasoning capabilities. Batch: $1.25/$6.25 per 1M tokens',
+    },
+    {
+        id: 'amazon.nova-sonic-v1:0',
+        name: 'Nova Sonic (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 300000,
+        contextLength: 300000,
+        pricing: { input: 3.4, output: 13.6 },
+        capabilities: ['speech', 'text', 'multimodal', 'native-audio'],
+        category: 'audio',
+        isLatest: false,
+        notes: 'Amazon Nova Sonic - Speech input: $3.4/1M tokens, Speech output: $13.6/1M tokens. Text input: $0.06/1M tokens, Text output: $0.24/1M tokens',
     },
+    // === Nova Creative Generation Models ===
     {
         id: 'amazon.nova-canvas-v1:0',
-        name: 'Amazon Nova Canvas (Bedrock)',
+        name: 'Nova Canvas (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
-        maxTokens: 4096,
-        contextLength: 4096,
+        maxTokens: 0,
+        contextLength: 0,
         pricing: { input: 0.04, output: 0.04 },
         capabilities: ['image-generation'],
         category: 'image',
         isLatest: true,
-        notes: 'Amazon Nova Canvas via AWS Bedrock - image generation model',
+        notes: 'Amazon Nova Canvas - Standard quality (up to 1024x1024): $0.04/image, Premium quality (up to 1024x1024): $0.06/image, Standard quality (up to 2048x2048): $0.06/image, Premium quality (up to 2048x2048): $0.08/image',
+    },
+    {
+        id: 'amazon.nova-reel-v1:0',
+        name: 'Nova Reel (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.08, output: 0.08 },
+        capabilities: ['video-generation'],
+        category: 'video',
+        isLatest: true,
+        notes: 'Amazon Nova Reel - $0.08 per second of video generated (720p, 24 fps)',
     },
     {
-        id: 'amazon.nova-reel-v1:0',
-        name: 'Amazon Nova Reel (Bedrock)',
+        id: 'amazon.nova-multimodal-embeddings-v1:0',
+        name: 'Nova Multimodal Embeddings (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
-        maxTokens: 4096,
-        contextLength: 4096,
-        pricing: { input: 0.08, output: 0.08 },
-        capabilities: ['video-generation'],
-        category: 'video',
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.135, output: 0.0 },
+        capabilities: ['embedding', 'multimodal'],
+        category: 'embedding',
         isLatest: true,
-        notes: 'Amazon Nova Reel via AWS Bedrock - video generation model',
+        notes: 'Amazon Nova Multimodal Embeddings (On-demand) - Text: $0.135/1M tokens, Standard image: $0.06/image, Document image: $0.6/image, Video: $0.7/second, Audio: $0.14/second. Batch: Text $0.0675/1M tokens, Standard image $0.03/image, Document image $0.48/image, Video $0.56/second, Audio $0.112/second',
     },
     {
-        id: 'amazon.nova-sonic-v1:0',
-        name: 'Amazon Nova Sonic (Bedrock)',
+        id: 'amazon-rerank-v1.0',
+        name: 'Amazon Rerank v1.0 (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
-        maxTokens: 300000,
-        contextLength: 300000,
-        pricing: { input: 3.4, output: 13.6 },
-        capabilities: ['speech', 'multimodal', 'native-audio'],
-        category: 'audio',
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.001, output: 0.0 },
+        capabilities: ['rerank', 'semantic-search', 'retrieval'],
+        category: 'retrieval',
         isLatest: true,
-        notes: 'Amazon Nova Sonic via AWS Bedrock - speech model',
+        notes: 'Amazon Rerank v1.0 - $1.00 per 1,000 queries. A query can contain up to 100 document chunks. If a query contains more than 100 document chunks, it is counted as multiple queries (e.g., 350 documents = 4 queries). Each document can contain up to 512 tokens (inclusive of query and document total tokens). If token length exceeds 512 tokens, it is broken down into multiple documents.',
     },
     {
         id: 'amazon.titan-text-express-v1',
@@ -1637,13 +2990,13 @@ exports.AVAILABLE_MODELS = [
         notes: 'Amazon Titan Text Embeddings V2 via AWS Bedrock',
     },
     {
-        id: 'anthropic.claude-opus-4-1-20250805-v1:0',
-        name: 'Claude Opus 4.1 (Bedrock)',
+        id: 'anthropic.claude-sonnet-4-5-v1:0',
+        name: 'Claude Sonnet 4.5 (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
-        maxTokens: 32000,
+        maxTokens: 64000,
         contextLength: 200000,
-        pricing: { input: 15.0, output: 75.0 },
+        pricing: { input: 3.3, output: 16.5 },
         capabilities: [
             'text',
             'vision',
@@ -1654,16 +3007,29 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Claude Opus 4.1 via AWS Bedrock - most capable and intelligent Claude model yet',
+        notes: 'Claude Sonnet 4.5 on AWS Bedrock (Geo/In-region) - Input: $3.3/1M, Output: $16.5/1M. Batch: $1.65/$8.25 per 1M. Cache (5m write): $4.125/1M, Cache (1h write): $6.6/1M, Cache read: $0.33/1M. Global: $3/$15 per 1M',
     },
     {
-        id: 'anthropic.claude-opus-4-20250514-v1:0',
-        name: 'Claude Opus 4 (Bedrock)',
+        id: 'anthropic.claude-haiku-4-5-v1:0',
+        name: 'Claude Haiku 4.5 (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
-        maxTokens: 32000,
+        maxTokens: 64000,
         contextLength: 200000,
-        pricing: { input: 15.0, output: 75.0 },
+        pricing: { input: 1.1, output: 5.5 },
+        capabilities: ['text', 'vision', 'multimodal', 'multilingual'],
+        category: 'multimodal',
+        isLatest: true,
+        notes: 'Claude Haiku 4.5 on AWS Bedrock (Geo/In-region) - Input: $1.1/1M, Output: $5.5/1M. Batch: $0.55/$2.75 per 1M. Cache (5m write): $1.375/1M, Cache (1h write): $2.2/1M, Cache read: $0.11/1M. Global: $1/$5 per 1M',
+    },
+    {
+        id: 'anthropic.claude-opus-4-5-20251101-v1:0',
+        name: 'Claude Opus 4.5 (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 64000,
+        contextLength: 200000,
+        pricing: { input: 5.0, output: 25.0 },
         capabilities: [
             'text',
             'vision',
@@ -1674,16 +3040,16 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Claude Opus 4 via AWS Bedrock - previous flagship model',
+        notes: 'Claude Opus 4.5 via AWS Bedrock - premium model combining maximum intelligence with practical performance. Reliable knowledge cutoff: May 2025. Training data cutoff: Aug 2025. Max output: 64K tokens',
     },
     {
-        id: 'anthropic.claude-sonnet-4-5-v1:0',
-        name: 'Claude Sonnet 4.5 (Bedrock)',
+        id: 'anthropic.claude-opus-4-1-20250805-v1:0',
+        name: 'Claude Opus 4.1 (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
-        maxTokens: 200000,
+        maxTokens: 32000,
         contextLength: 200000,
-        pricing: { input: 3.0, output: 15.0 },
+        pricing: { input: 15.0, output: 75.0 },
         capabilities: [
             'text',
             'vision',
@@ -1693,21 +3059,28 @@ exports.AVAILABLE_MODELS = [
             'multilingual',
         ],
         category: 'multimodal',
-        isLatest: true,
-        notes: 'Claude Sonnet 4.5 on AWS Bedrock - latest Claude Sonnet model with enhanced capabilities and 1M context window support (beta)',
+        isLatest: false,
+        notes: 'Claude Opus 4.1 via AWS Bedrock - legacy model, migrate to Claude Opus 4.5. Reliable knowledge cutoff: Jan 2025. Training data cutoff: Mar 2025. Max output: 32K tokens',
     },
     {
-        id: 'anthropic.claude-haiku-4-5-v1:0',
-        name: 'Claude Haiku 4.5 (Bedrock)',
+        id: 'anthropic.claude-opus-4-20250514-v1:0',
+        name: 'Claude Opus 4 (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
-        maxTokens: 200000,
+        maxTokens: 32000,
         contextLength: 200000,
-        pricing: { input: 1.0, output: 5.0 },
-        capabilities: ['text', 'vision', 'multimodal', 'multilingual'],
+        pricing: { input: 15.0, output: 75.0 },
+        capabilities: [
+            'text',
+            'vision',
+            'multimodal',
+            'reasoning',
+            'extended-thinking',
+            'multilingual',
+        ],
         category: 'multimodal',
-        isLatest: true,
-        notes: 'Claude Haiku 4.5 on AWS Bedrock - latest Claude Haiku model with improved performance',
+        isLatest: false,
+        notes: 'Claude Opus 4 via AWS Bedrock - legacy model, migrate to Claude Opus 4.5. Reliable knowledge cutoff: Jan 2025. Training data cutoff: Mar 2025. Max output: 32K tokens',
     },
     {
         id: 'anthropic.claude-sonnet-4-20250514-v1:0',
@@ -1727,7 +3100,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Claude Sonnet 4 via AWS Bedrock - high-performance model with exceptional reasoning',
+        notes: 'Claude Sonnet 4 via AWS Bedrock - legacy model, migrate to Claude Sonnet 4.5. Reliable knowledge cutoff: Jan 2025. Training data cutoff: Mar 2025. Max output: 64K tokens. 1M context beta available',
     },
     {
         id: 'anthropic.claude-3-7-sonnet-20250219-v1:0',
@@ -1747,7 +3120,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Claude Sonnet 3.7 via AWS Bedrock - high-performance model with early extended thinking. Deprecated - use Claude Sonnet 4.5 instead',
+        notes: 'Claude Sonnet 3.7 via AWS Bedrock - DEPRECATED, migrate to Claude Sonnet 4.5. Reliable knowledge cutoff: Oct 2024. Training data cutoff: Nov 2024. Max output: 64K tokens',
     },
     {
         id: 'anthropic.claude-3-5-sonnet-20241022-v1:0',
@@ -1772,38 +3145,38 @@ exports.AVAILABLE_MODELS = [
         pricing: { input: 0.8, output: 4.0 },
         capabilities: ['text', 'vision', 'multimodal', 'multilingual'],
         category: 'multimodal',
-        isLatest: true,
-        notes: 'Claude Haiku 3.5 via AWS Bedrock - fastest Claude model',
+        isLatest: false,
+        notes: 'Claude Haiku 3.5 via AWS Bedrock - legacy model, migrate to Claude Haiku 4.5. Training data cutoff: July 2024. Max output: 8K tokens',
     },
     {
         id: 'meta.llama3-70b-instruct-v1:0',
-        name: 'Llama 3 70B Instruct (Bedrock)',
+        name: 'Llama 3 Instruct 70B (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
         maxTokens: 8192,
         contextLength: 8192,
-        pricing: { input: 0.59, output: 0.79 },
+        pricing: { input: 2.65, output: 3.5 },
         capabilities: ['text', 'instruction-following'],
         category: 'text',
-        isLatest: true,
-        notes: 'Meta Llama 3 70B Instruct via AWS Bedrock',
+        isLatest: false,
+        notes: 'Meta Llama 3 Instruct (70B) on AWS Bedrock (US East N. Virginia) - Input: $2.65/1M, Output: $3.5/1M',
     },
     {
         id: 'meta.llama3-8b-instruct-v1:0',
-        name: 'Llama 3 8B Instruct (Bedrock)',
+        name: 'Llama 3 Instruct 8B (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
         maxTokens: 8192,
         contextLength: 8192,
-        pricing: { input: 0.05, output: 0.1 },
+        pricing: { input: 0.3, output: 0.6 },
         capabilities: ['text', 'instruction-following', 'fast'],
         category: 'text',
-        isLatest: true,
-        notes: 'Meta Llama 3 8B Instruct via AWS Bedrock',
+        isLatest: false,
+        notes: 'Meta Llama 3 Instruct (8B) on AWS Bedrock (US East N. Virginia) - Input: $0.3/1M, Output: $0.6/1M',
     },
     {
         id: 'meta.llama3-2-11b-instruct-v1:0',
-        name: 'Llama 3.2 11B Instruct (Bedrock)',
+        name: 'Llama 3.2 Instruct 11B (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
         maxTokens: 128000,
@@ -1811,12 +3184,12 @@ exports.AVAILABLE_MODELS = [
         pricing: { input: 0.16, output: 0.16 },
         capabilities: ['text', 'instruction-following', 'vision'],
         category: 'multimodal',
-        isLatest: true,
-        notes: 'Meta Llama 3.2 11B Instruct via AWS Bedrock',
+        isLatest: false,
+        notes: 'Meta Llama 3.2 Instruct (11B) on AWS Bedrock (US East Ohio) - Input: $0.16/1M, Output: $0.16/1M. Batch not available',
     },
     {
         id: 'meta.llama3-2-90b-instruct-v1:0',
-        name: 'Llama 3.2 90B Instruct (Bedrock)',
+        name: 'Llama 3.2 Instruct 90B (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
         maxTokens: 128000,
@@ -1824,21 +3197,21 @@ exports.AVAILABLE_MODELS = [
         pricing: { input: 0.72, output: 0.72 },
         capabilities: ['text', 'instruction-following', 'vision'],
         category: 'multimodal',
-        isLatest: true,
-        notes: 'Meta Llama 3.2 90B Instruct via AWS Bedrock',
+        isLatest: false,
+        notes: 'Meta Llama 3.2 Instruct (90B) on AWS Bedrock (US East Ohio) - Input: $0.72/1M, Output: $0.72/1M. Batch not available',
     },
     {
         id: 'meta.llama4-scout-17b-instruct-v1:0',
-        name: 'Llama 4 Scout 17B Instruct (Bedrock)',
+        name: 'Llama 4 Scout 17B (Bedrock)',
         provider: 'AWS Bedrock',
         available: true,
         maxTokens: 128000,
         contextLength: 128000,
         pricing: { input: 0.17, output: 0.66 },
-        capabilities: ['text', 'instruction-following', 'vision'],
+        capabilities: ['text', 'instruct', 'vision'],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Meta Llama 4 Scout 17B Instruct via AWS Bedrock',
+        notes: 'Meta Llama 4 Scout 17B on AWS Bedrock (US East Ohio) - Input: $0.17/1M, Output: $0.66/1M. Batch: $0.085/$0.33 per 1M tokens',
     },
     {
         id: 'meta.llama4-maverick-17b-instruct-v1:0',
@@ -1851,8 +3224,219 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'instruction-following', 'vision'],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Meta Llama 4 Maverick 17B Instruct via AWS Bedrock',
+        notes: 'Meta Llama 4 Maverick 17B on AWS Bedrock (US East Ohio) - Input: $0.24/1M, Output: $0.97/1M. Batch: $0.12/$0.485 per 1M tokens',
+    },
+    {
+        id: 'meta.llama3-3-70b-instruct-v1:0',
+        name: 'Llama 3.3 Instruct 70B (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 131072,
+        contextLength: 131072,
+        pricing: { input: 0.72, output: 0.72 },
+        capabilities: ['text', 'instruct'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Meta Llama 3.3 Instruct (70B) on AWS Bedrock (US East Ohio) - Input: $0.72/1M, Output: $0.72/1M. Batch: $0.36/$0.36 per 1M tokens',
+    },
+    {
+        id: 'meta.llama3-2-1b-instruct-v1:0',
+        name: 'Llama 3.2 Instruct 1B (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.1, output: 0.1 },
+        capabilities: ['text', 'instruct'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Meta Llama 3.2 Instruct (1B) on AWS Bedrock (US East Ohio) - Input: $0.1/1M, Output: $0.1/1M. Batch not available',
+    },
+    {
+        id: 'meta.llama3-2-3b-instruct-v1:0',
+        name: 'Llama 3.2 Instruct 3B (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.15, output: 0.15 },
+        capabilities: ['text', 'instruct'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Meta Llama 3.2 Instruct (3B) on AWS Bedrock (US East Ohio) - Input: $0.15/1M, Output: $0.15/1M. Batch not available',
+    },
+    {
+        id: 'meta.llama3-1-8b-instruct-v1:0',
+        name: 'Llama 3.1 Instruct 8B (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 131072,
+        contextLength: 131072,
+        pricing: { input: 0.22, output: 0.22 },
+        capabilities: ['text', 'instruct'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Meta Llama 3.1 Instruct (8B) on AWS Bedrock (US East Ohio) - Input: $0.22/1M, Output: $0.22/1M. Batch: $0.11/$0.11 per 1M tokens',
+    },
+    {
+        id: 'meta.llama3-1-70b-instruct-v1:0',
+        name: 'Llama 3.1 Instruct 70B (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 131072,
+        contextLength: 131072,
+        pricing: { input: 0.72, output: 0.72 },
+        capabilities: ['text', 'instruct'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Meta Llama 3.1 Instruct (70B) on AWS Bedrock (US East Ohio) - Input: $0.72/1M, Output: $0.72/1M. Batch: $0.36/$0.36 per 1M tokens. Latency optimized: $0.9/$0.9 per 1M tokens',
+    },
+    {
+        id: 'meta.llama3-1-405b-instruct-v1:0',
+        name: 'Llama 3.1 Instruct 405B (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 131072,
+        contextLength: 131072,
+        pricing: { input: 2.4, output: 2.4 },
+        capabilities: ['text', 'instruct'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Meta Llama 3.1 Instruct (405B) on AWS Bedrock (US East Ohio) - Input: $2.4/1M, Output: $2.4/1M. Batch: $1.2/$1.2 per 1M tokens. Latency optimized: $3/$3 per 1M tokens',
+    },
+    {
+        id: 'meta.llama2-13b-chat-v1',
+        name: 'Llama 2 Chat 13B (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 4096,
+        contextLength: 4096,
+        pricing: { input: 0.75, output: 1.0 },
+        capabilities: ['text', 'chat'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Meta Llama 2 Chat (13B) on AWS Bedrock (US East N. Virginia, US West Oregon) - Input: $0.75/1M, Output: $1.0/1M',
+    },
+    {
+        id: 'meta.llama2-70b-chat-v1',
+        name: 'Llama 2 Chat 70B (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 4096,
+        contextLength: 4096,
+        pricing: { input: 1.95, output: 2.56 },
+        capabilities: ['text', 'chat'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Meta Llama 2 Chat (70B) on AWS Bedrock (US East N. Virginia, US West Oregon) - Input: $1.95/1M, Output: $2.56/1M',
+    },
+    // === Mistral AI Models on AWS Bedrock ===
+    // Latest Models
+    {
+        id: 'mistral.pixtral-large-2502-v1:0',
+        name: 'Pixtral Large (25.02) (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 2.0, output: 6.0 },
+        capabilities: ['vision', 'multimodal', 'reasoning'],
+        category: 'multimodal',
+        isLatest: true,
+        notes: 'Mistral Pixtral Large (25.02) on AWS Bedrock (US East Ohio) - Input: $2/1M, Output: $6/1M. Batch not available',
+    },
+    {
+        id: 'mistral.magistral-small-1-2-v1:0',
+        name: 'Magistral Small 1.2 (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 40000,
+        contextLength: 40000,
+        pricing: { input: 0.5, output: 1.5 },
+        capabilities: ['text'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Mistral Magistral Small 1.2 on AWS Bedrock (US East N. Virginia, US East Ohio, US West Oregon) - Standard: $0.50/$1.50 per 1M tokens. Asia Pacific (Mumbai), Europe (Ireland), Europe (Milan): $0.59/$1.76. South America (Sao Paulo), Asia Pacific (Tokyo): $0.61/$1.82. Europe (London): $0.78/$2.33. Priority tier: 75% premium. Flex tier: 50% discount',
+    },
+    {
+        id: 'mistral.voxtral-mini-1-0-v1:0',
+        name: 'Voxtral Mini 1.0 (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.04, output: 0.04 },
+        capabilities: ['text', 'audio'],
+        category: 'multimodal',
+        isLatest: true,
+        notes: 'Mistral Voxtral Mini 1.0 on AWS Bedrock (US East N. Virginia, US East Ohio, US West Oregon) - Standard: $0.04/$0.04 per 1M tokens. Asia Pacific (Mumbai), Europe (Ireland), Europe (Milan): $0.05/$0.05. South America (Sao Paulo), Asia Pacific (Tokyo): $0.05/$0.05. Europe (London): $0.06/$0.06. Priority tier: 75% premium. Flex tier: 50% discount',
+    },
+    {
+        id: 'mistral.voxtral-small-1-0-v1:0',
+        name: 'Voxtral Small 1.0 (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.1, output: 0.3 },
+        capabilities: ['text', 'audio'],
+        category: 'multimodal',
+        isLatest: true,
+        notes: 'Mistral Voxtral Small 1.0 on AWS Bedrock (US East N. Virginia, US East Ohio, US West Oregon) - Standard: $0.10/$0.30 per 1M tokens. Asia Pacific (Mumbai), Europe (Ireland), Europe (Milan): $0.12/$0.35. South America (Sao Paulo), Asia Pacific (Tokyo): $0.12/$0.36. Europe (London): $0.16/$0.47. Priority tier: 75% premium. Flex tier: 50% discount',
+    },
+    {
+        id: 'mistral.ministral-3b-3-0-v1:0',
+        name: 'Ministral 3B 3.0 (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.1, output: 0.1 },
+        capabilities: ['text'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Mistral Ministral 3B 3.0 on AWS Bedrock (US East N. Virginia, US East Ohio, US West Oregon) - Standard: $0.10/$0.10 per 1M tokens. Asia Pacific (Mumbai), Europe (Ireland), Europe (Milan): $0.12/$0.12. South America (Sao Paulo), Asia Pacific (Tokyo): $0.12/$0.12. Europe (London): $0.16/$0.16. Priority tier: 75% premium. Flex tier: 50% discount',
+    },
+    {
+        id: 'mistral.ministral-8b-3-0-v1:0',
+        name: 'Ministral 8B 3.0 (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.15, output: 0.15 },
+        capabilities: ['text'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Mistral Ministral 8B 3.0 on AWS Bedrock (US East N. Virginia, US East Ohio, US West Oregon) - Standard: $0.15/$0.15 per 1M tokens. Asia Pacific (Mumbai), Europe (Ireland), Europe (Milan): $0.18/$0.18. South America (Sao Paulo), Asia Pacific (Tokyo): $0.18/$0.18. Europe (London): $0.23/$0.23. Priority tier: 75% premium. Flex tier: 50% discount',
+    },
+    {
+        id: 'mistral.ministral-14b-3-0-v1:0',
+        name: 'Ministral 14B 3.0 (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.2, output: 0.2 },
+        capabilities: ['text'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Mistral Ministral 14B 3.0 on AWS Bedrock (US East N. Virginia, US East Ohio, US West Oregon) - Standard: $0.20/$0.20 per 1M tokens. Asia Pacific (Mumbai), Europe (Ireland), Europe (Milan): $0.24/$0.24. South America (Sao Paulo), Asia Pacific (Tokyo): $0.24/$0.24. Europe (London): $0.31/$0.31. Priority tier: 75% premium. Flex tier: 50% discount',
+    },
+    {
+        id: 'mistral.mistral-large-3-v1:0',
+        name: 'Mistral Large 3 (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.5, output: 1.5 },
+        capabilities: ['text'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Mistral Large 3 on AWS Bedrock (US East N. Virginia, US East Ohio, US West Oregon) - Standard: $0.50/$1.50 per 1M tokens. Asia Pacific (Mumbai), Europe (Ireland), Europe (Milan): $0.59/$1.76. South America (Sao Paulo), Asia Pacific (Tokyo): $0.61/$1.82. Europe (London): $0.78/$2.33. Priority tier: 75% premium. Flex tier: 50% discount',
     },
+    // Legacy Models
     {
         id: 'mistral.mistral-7b-instruct-v0:2',
         name: 'Mistral 7B Instruct (Bedrock)',
@@ -1860,11 +3444,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 32768,
         contextLength: 32768,
-        pricing: { input: 0.15, output: 0.45 },
-        capabilities: ['text', 'instruction-following', 'fast'],
+        pricing: { input: 0.14, output: 0.42 },
+        capabilities: ['text', 'instruct'],
         category: 'text',
-        isLatest: true,
-        notes: 'Mistral 7B Instruct via AWS Bedrock',
+        isLatest: false,
+        notes: 'Mistral 7B Instruct on AWS Bedrock (legacy)',
     },
     {
         id: 'mistral.mixtral-8x7b-instruct-v0:1',
@@ -1873,11 +3457,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 32768,
         contextLength: 32768,
-        pricing: { input: 0.24, output: 0.72 },
-        capabilities: ['text', 'instruction-following', 'mixture-of-experts'],
+        pricing: { input: 0.14, output: 0.42 },
+        capabilities: ['text', 'instruct'],
         category: 'text',
-        isLatest: true,
-        notes: 'Mistral Mixtral 8x7B Instruct via AWS Bedrock',
+        isLatest: false,
+        notes: 'Mistral Mixtral 8x7B Instruct on AWS Bedrock (legacy)',
     },
     {
         id: 'mistral.mistral-large-2402-v1:0',
@@ -1887,10 +3471,10 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 32768,
         contextLength: 32768,
         pricing: { input: 6.5, output: 25.0 },
-        capabilities: ['text', 'instruction-following'],
+        capabilities: ['text', 'instruct'],
         category: 'text',
-        isLatest: true,
-        notes: 'Mistral Large via AWS Bedrock',
+        isLatest: false,
+        notes: 'Mistral Large (24.02) on AWS Bedrock (legacy)',
     },
     {
         id: 'mistral.mistral-small-2402-v1:0',
@@ -1899,24 +3483,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 32768,
         contextLength: 32768,
-        pricing: { input: 2.0, output: 6.0 },
-        capabilities: ['text', 'instruction-following'],
-        category: 'text',
-        isLatest: true,
-        notes: 'Mistral Small via AWS Bedrock',
-    },
-    {
-        id: 'mistral.pixtral-large-2502-v1:0',
-        name: 'Pixtral Large (25.02) (Bedrock)',
-        provider: 'AWS Bedrock',
-        available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 2.0, output: 6.0 },
-        capabilities: ['vision', 'multimodal', 'reasoning'],
-        category: 'multimodal',
-        isLatest: true,
-        notes: 'Mistral Pixtral Large via AWS Bedrock',
+        pricing: { input: 2.0, output: 6.0 },
+        capabilities: ['text', 'instruct'],
+        category: 'text',
+        isLatest: false,
+        notes: 'Mistral Small (24.02) on AWS Bedrock (legacy)',
     },
     {
         id: 'cohere.command-r-plus-v1:0',
@@ -1929,7 +3500,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'multilingual', 'enterprise'],
         category: 'text',
         isLatest: true,
-        notes: 'Cohere Command R+ via AWS Bedrock - updated pricing',
+        notes: 'Cohere Command R+ via AWS Bedrock - advanced AI model for text generation and chat',
     },
     {
         id: 'cohere.command-r-v1:0',
@@ -1942,7 +3513,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'multilingual', 'rag', 'tools'],
         category: 'text',
         isLatest: true,
-        notes: 'Cohere Command R via AWS Bedrock - updated pricing',
+        notes: 'Cohere Command R via AWS Bedrock - advanced AI model for text generation and chat',
     },
     {
         id: 'cohere.embed-english-v3',
@@ -1951,11 +3522,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 512,
         contextLength: 512,
-        pricing: { input: 0.1, output: 0.1 },
+        pricing: { input: 0.1, output: 0.0 },
         capabilities: ['embedding'],
         category: 'embedding',
         isLatest: true,
-        notes: 'Cohere Embed English v3 via AWS Bedrock',
+        notes: 'Cohere Embed English v3 via AWS Bedrock - advanced AI model for text generation and chat',
     },
     {
         id: 'cohere.embed-multilingual-v3',
@@ -1964,13 +3535,39 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 512,
         contextLength: 512,
-        pricing: { input: 0.1, output: 0.1 },
+        pricing: { input: 0.1, output: 0.0 },
         capabilities: ['embedding', 'multilingual'],
         category: 'embedding',
         isLatest: true,
-        notes: 'Cohere Embed Multilingual v3 via AWS Bedrock',
+        notes: 'Cohere Embed Multilingual v3 via AWS Bedrock - advanced AI model for text generation and chat',
+    },
+    {
+        id: 'cohere.embed-4-v1:0',
+        name: 'Embed 4 (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.12, output: 0.0 },
+        capabilities: ['embedding'],
+        category: 'embedding',
+        isLatest: true,
+        notes: 'Cohere Embed 4 on AWS Bedrock - $0.12 per 1M input tokens. Latest embeddings model (no output tokens)',
+    },
+    {
+        id: 'cohere.rerank-3-5-v1:0',
+        name: 'Rerank 3.5 (Bedrock)',
+        provider: 'AWS Bedrock',
+        available: true,
+        maxTokens: 0,
+        contextLength: 0,
+        pricing: { input: 0.002, output: 0.0 },
+        capabilities: ['rerank', 'semantic-search', 'retrieval'],
+        category: 'retrieval',
+        isLatest: true,
+        notes: "Cohere Rerank 3.5 on AWS Bedrock - $2.00 per 1,000 queries ($0.002 per query). A query can contain up to 100 document chunks. If a query contains more than 100 document chunks, it is counted as multiple queries (e.g., 350 documents = 4 queries). Each document can only contain up to 500 tokens (inclusive of the query and document's total tokens), and if the token length is higher than 512 tokens, it is broken down into multiple documents.",
     },
-    // Latest Cohere Models
+    // === Cohere Models ===
     {
         id: 'command-a-03-2025',
         name: 'Command A',
@@ -1979,10 +3576,10 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 256000,
         contextLength: 256000,
         pricing: { input: 2.5, output: 10.0 },
-        capabilities: ['text', 'agentic', 'multilingual', 'human-evaluations'],
+        capabilities: ['text', 'reasoning', 'enterprise', 'agents', 'multilingual'],
         category: 'text',
         isLatest: true,
-        notes: 'Most performant model to date, excelling at tool use, agents, RAG, and multilingual use cases',
+        notes: 'Advanced generative model for advanced agents and multilingual tasks. Most performant model to date, excelling at tool use, agents, RAG, and multilingual use cases. Priced at $2.50 per 1M input tokens and $10.00 per 1M output tokens.',
     },
     {
         id: 'command-r7b-12-2024',
@@ -1992,10 +3589,17 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 128000,
         contextLength: 128000,
         pricing: { input: 0.0375, output: 0.15 },
-        capabilities: ['text', 'rag', 'tool-use', 'agents'],
+        capabilities: [
+            'text',
+            'edge',
+            'commodity-gpu',
+            'rag',
+            'tools',
+            'reasoning',
+        ],
         category: 'text',
         isLatest: true,
-        notes: 'Small, fast update delivered in December 2024, excels at RAG, tool use, and complex reasoning',
+        notes: 'Cost-effective generative model for simpler tasks. Small, fast update delivered in December 2024, excels at RAG, tool use, and complex reasoning. Priced at $0.0375 per 1M input tokens and $0.15 per 1M output tokens.',
     },
     {
         id: 'command-a-reasoning-08-2025',
@@ -2005,10 +3609,16 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 256000,
         contextLength: 256000,
         pricing: { input: 2.5, output: 10.0 },
-        capabilities: ['text', 'reasoning', 'agentic', 'multilingual'],
+        capabilities: [
+            'text',
+            'reasoning',
+            'agentic',
+            'multilingual',
+            'enterprise',
+        ],
         category: 'text',
         isLatest: true,
-        notes: 'First reasoning model, able to think before generating output for nuanced problem-solving and agent-based tasks in 23 languages',
+        notes: 'Advanced generative model for reasoning tasks. First reasoning model, able to think before generating output for nuanced problem-solving and agent-based tasks in 23 languages. Priced at $2.50 per 1M input tokens and $10.00 per 1M output tokens.',
     },
     {
         id: 'command-a-vision-07-2025',
@@ -2021,7 +3631,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'vision', 'multimodal', 'enterprise'],
         category: 'multimodal',
         isLatest: true,
-        notes: 'First model capable of processing images, excelling in enterprise use cases like charts, graphs, diagrams, table understanding, OCR, and object detection',
+        notes: 'Advanced generative model for vision tasks. First model capable of processing images, excelling in enterprise use cases like charts, graphs, diagrams, table understanding, OCR, and object detection. Priced at $2.50 per 1M input tokens and $10.00 per 1M output tokens.',
     },
     {
         id: 'command-r-plus-04-2024',
@@ -2031,23 +3641,30 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 128000,
         contextLength: 128000,
         pricing: { input: 2.5, output: 10.0 },
-        capabilities: ['text', 'enterprise', 'rag', 'tools', 'multilingual'],
+        capabilities: ['text', 'reasoning', 'rag', 'tools', 'enterprise'],
         category: 'text',
         isLatest: true,
-        notes: 'Instruction-following conversational model for complex RAG workflows and multi-step tool use',
+        notes: 'High-performance generative model for complex tasks. Instruction-following conversational model for complex RAG workflows and multi-step tool use. Priced at $2.50 per 1M input tokens and $10.00 per 1M output tokens.',
     },
     {
         id: 'command-r-08-2024',
-        name: 'Command R (08-2024)',
+        name: 'Command R',
         provider: 'Cohere',
         available: true,
         maxTokens: 128000,
         contextLength: 128000,
         pricing: { input: 0.15, output: 0.6 },
-        capabilities: ['text', 'rag', 'tools', 'agents'],
+        capabilities: [
+            'text',
+            'efficiency',
+            'performance',
+            'rag',
+            'tools',
+            'agents',
+        ],
         category: 'text',
         isLatest: true,
-        notes: 'Update of Command R model delivered in August 2024',
+        notes: 'Balanced generative model for Retrieval-Augmented Generation (RAG) and tool use. Update of Command R model delivered in August 2024. Priced at $0.15 per 1M input tokens and $0.60 per 1M output tokens.',
     },
     {
         id: 'command-r-03-2024',
@@ -2095,8 +3712,8 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 4096,
         contextLength: 4096,
-        pricing: { input: 0.15, output: 0.6 },
-        capabilities: ['text', 'lightweight', 'fast'],
+        pricing: { input: 0.3, output: 0.6 },
+        capabilities: ['text', 'fast'],
         category: 'text',
         isLatest: false,
         notes: 'Smaller, faster version of command, almost as capable but much faster',
@@ -2122,10 +3739,10 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 4096,
         contextLength: 4096,
         pricing: { input: 2.0, output: 2.0 },
-        capabilities: ['rerank', 'semantic-search', 'retrieval'],
+        capabilities: ['search', 'reranking', 'multilingual', 'semantic-search'],
         category: 'rerank',
         isLatest: true,
-        notes: 'Provides powerful semantic boost to search quality of any keyword or vector search system, $2.00 per 1K searches',
+        notes: 'Rerank model used to improve search result relevance. Provides powerful semantic boost to search quality of any keyword or vector search system. Priced at $2.00 per 1,000 searches (usage-based pricing).',
     },
     {
         id: 'rerank-english-v3.0',
@@ -2135,10 +3752,10 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 4096,
         contextLength: 4096,
         pricing: { input: 2.0, output: 2.0 },
-        capabilities: ['rerank', 'semantic-search', 'english'],
+        capabilities: ['rerank', 'semantic-search', 'english', 'search'],
         category: 'rerank',
         isLatest: true,
-        notes: 'English language document and semi-structured data reranking model',
+        notes: 'Rerank model used to improve search result relevance. English language document and semi-structured data reranking model. Priced at $2.00 per 1,000 searches (usage-based pricing).',
     },
     {
         id: 'rerank-multilingual-v3.0',
@@ -2148,10 +3765,10 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 4096,
         contextLength: 4096,
         pricing: { input: 2.0, output: 2.0 },
-        capabilities: ['rerank', 'semantic-search', 'multilingual'],
+        capabilities: ['rerank', 'semantic-search', 'multilingual', 'search'],
         category: 'rerank',
         isLatest: true,
-        notes: 'Multilingual document and semi-structured data reranking model',
+        notes: 'Rerank model used to improve search result relevance. Multilingual document and semi-structured data reranking model. Priced at $2.00 per 1,000 searches (usage-based pricing).',
     },
     {
         id: 'embed-v4.0',
@@ -2160,11 +3777,17 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 128000,
         contextLength: 128000,
-        pricing: { input: 0.12, output: 0.12 },
-        capabilities: ['embedding', 'multimodal', 'semantic-search', 'rag'],
+        pricing: { input: 0.12, output: 0.0 },
+        capabilities: [
+            'embedding',
+            'multimodal',
+            'multilingual',
+            'semantic-search',
+            'rag',
+        ],
         category: 'embedding',
         isLatest: true,
-        notes: 'Leading multimodal embedding model for text and images, acts as intelligent retrieval engine for semantic search and RAG systems',
+        notes: 'Embed model for converting text/images to vectors for semantic search. Leading multimodal embedding model for text and images, acts as intelligent retrieval engine for semantic search and RAG systems. Priced at $0.12 per 1M tokens processed.',
     },
     {
         id: 'embed-english-v3.0',
@@ -2173,11 +3796,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 512,
         contextLength: 512,
-        pricing: { input: 0.1, output: 0.1 },
-        capabilities: ['embedding', 'english'],
+        pricing: { input: 0.1, output: 0.0 },
+        capabilities: ['embedding', 'english', 'semantic-search', 'rag'],
         category: 'embedding',
         isLatest: true,
-        notes: 'English-only embedding model for text classification and embeddings',
+        notes: 'Embed model for converting text to vectors for semantic search. English-only embedding model for text classification and embeddings. Priced at $0.10 per 1M tokens processed (usage-based pricing).',
     },
     {
         id: 'embed-english-light-v3.0',
@@ -2186,11 +3809,17 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 512,
         contextLength: 512,
-        pricing: { input: 0.1, output: 0.1 },
-        capabilities: ['embedding', 'english', 'lightweight'],
+        pricing: { input: 0.1, output: 0.0 },
+        capabilities: [
+            'embedding',
+            'english',
+            'lightweight',
+            'semantic-search',
+            'rag',
+        ],
         category: 'embedding',
         isLatest: true,
-        notes: 'Smaller, faster version of embed-english-v3.0, almost as capable but much faster',
+        notes: 'Embed model for converting text to vectors for semantic search. Smaller, faster version of embed-english-v3.0, almost as capable but much faster. Priced at $0.10 per 1M tokens processed (usage-based pricing).',
     },
     {
         id: 'embed-multilingual-v3.0',
@@ -2199,11 +3828,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 512,
         contextLength: 512,
-        pricing: { input: 0.1, output: 0.1 },
-        capabilities: ['embedding', 'multilingual'],
+        pricing: { input: 0.1, output: 0.0 },
+        capabilities: ['embedding', 'multilingual', 'semantic-search', 'rag'],
         category: 'embedding',
         isLatest: true,
-        notes: 'Multilingual embedding model for classification and embeddings in multiple languages',
+        notes: 'Embed model for converting text to vectors for semantic search. Multilingual embedding model for classification and embeddings in multiple languages. Priced at $0.10 per 1M tokens processed (usage-based pricing).',
     },
     {
         id: 'embed-multilingual-light-v3.0',
@@ -2212,11 +3841,17 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 512,
         contextLength: 512,
-        pricing: { input: 0.1, output: 0.1 },
-        capabilities: ['embedding', 'multilingual', 'lightweight'],
+        pricing: { input: 0.1, output: 0.0 },
+        capabilities: [
+            'embedding',
+            'multilingual',
+            'lightweight',
+            'semantic-search',
+            'rag',
+        ],
         category: 'embedding',
         isLatest: true,
-        notes: 'Smaller, faster version of embed-multilingual-v3.0, almost as capable but much faster',
+        notes: 'Embed model for converting text to vectors for semantic search. Smaller, faster version of embed-multilingual-v3.0, almost as capable but much faster. Priced at $0.10 per 1M tokens processed (usage-based pricing).',
     },
     {
         id: 'c4ai-aya-expanse-8b',
@@ -2398,14 +4033,7 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 40000,
         contextLength: 40000,
         pricing: { input: 2.0, output: 5.0 },
-        capabilities: [
-            'text',
-            'reasoning',
-            'thinking',
-            'domain-specific',
-            'multilingual',
-            'multimodal',
-        ],
+        capabilities: ['text', 'reasoning'],
         category: 'reasoning',
         isLatest: true,
         notes: 'Our frontier-class multimodal reasoning model released September 2025 (v25.09).',
@@ -2436,7 +4064,7 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 256000,
         contextLength: 256000,
-        pricing: { input: 0.3, output: 0.9 },
+        pricing: { input: 0.2, output: 0.6 },
         capabilities: [
             'code',
             'programming',
@@ -2447,7 +4075,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'code',
         isLatest: true,
-        notes: 'Our cutting-edge language model for coding released end of July 2025, specializes in low-latency, high-frequency tasks.',
+        notes: 'Coding-focused model. Priced at $0.20 per 1M input tokens and $0.60 per 1M output tokens. Our cutting-edge language model for coding released end of July 2025, specializes in low-latency, high-frequency tasks. Available on La Plateforme API with up to 256K context window. Fine-tuning available.',
     },
     {
         id: 'codestral-latest',
@@ -2456,7 +4084,7 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 256000,
         contextLength: 256000,
-        pricing: { input: 0.3, output: 0.9 },
+        pricing: { input: 0.2, output: 0.6 },
         capabilities: [
             'code',
             'programming',
@@ -2467,7 +4095,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'code',
         isLatest: true,
-        notes: 'Our cutting-edge language model for coding released end of July 2025, specializes in low-latency, high-frequency tasks.',
+        notes: 'Coding-focused model. Priced at $0.20 per 1M input tokens and $0.60 per 1M output tokens. Our cutting-edge language model for coding released end of July 2025, specializes in low-latency, high-frequency tasks. Available on La Plateforme API with up to 256K context window. Fine-tuning available.',
     },
     {
         id: 'voxtral-mini-2507',
@@ -2497,7 +4125,7 @@ exports.AVAILABLE_MODELS = [
     },
     {
         id: 'devstral-medium-2507',
-        name: 'Devstral Medium',
+        name: 'Devstral Medium 1.0',
         provider: 'Mistral AI',
         available: true,
         maxTokens: 128000,
@@ -2509,14 +4137,15 @@ exports.AVAILABLE_MODELS = [
             'advanced-coding',
             'codebase-exploration',
             'multi-file-editing',
+            'swe',
         ],
         category: 'code',
         isLatest: true,
-        notes: 'An enterprise grade text model that excels at using tools to explore codebases, editing multiple files and power software engineering agents.',
+        notes: 'An enterprise grade text model that excels at SWE use cases, released July 2025 (v25.07).',
     },
     {
         id: 'devstral-medium-latest',
-        name: 'Devstral Medium',
+        name: 'Devstral Medium 1.0',
         provider: 'Mistral AI',
         available: true,
         maxTokens: 128000,
@@ -2528,10 +4157,11 @@ exports.AVAILABLE_MODELS = [
             'advanced-coding',
             'codebase-exploration',
             'multi-file-editing',
+            'swe',
         ],
         category: 'code',
         isLatest: true,
-        notes: 'An enterprise grade text model that excels at using tools to explore codebases, editing multiple files and power software engineering agents.',
+        notes: 'An enterprise grade text model that excels at SWE use cases, released July 2025 (v25.07).',
     },
     {
         id: 'mistral-ocr-2505',
@@ -2549,7 +4179,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'document',
         isLatest: true,
-        notes: 'Our OCR service powering our Document AI stack that enables our users to extract interleaved text and images.',
+        notes: 'OCR service powering Document AI stack for extracting interleaved text and images. Priced at $2.00 per 1,000 pages (50% discount with Batch-API). Available on La Plateforme API.',
     },
     {
         id: 'mistral-ocr-latest',
@@ -2559,15 +4189,10 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 0,
         contextLength: 0,
         pricing: { input: 1.0, output: 3.0 },
-        capabilities: [
-            'ocr',
-            'document-understanding',
-            'annotations',
-            'text-extraction',
-        ],
+        capabilities: ['ocr', 'multimodal', 'text'],
         category: 'document',
         isLatest: true,
-        notes: 'Our OCR service powering our Document AI stack that enables our users to extract interleaved text and images.',
+        notes: 'OCR service powering Document AI stack for extracting interleaved text and images. Priced at $2.00 per 1,000 pages (50% discount with Batch-API). Available on La Plateforme API.',
     },
     {
         id: 'mistral-large-2411',
@@ -2577,10 +4202,16 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 128000,
         contextLength: 128000,
         pricing: { input: 2.0, output: 6.0 },
-        capabilities: ['text', 'reasoning', 'complex-tasks', 'high-complexity'],
+        capabilities: [
+            'text',
+            'reasoning',
+            'complex-tasks',
+            'high-complexity',
+            'function-calling',
+        ],
         category: 'text',
         isLatest: true,
-        notes: 'Our top-tier large model for high-complexity tasks with the latest version released November 2024.',
+        notes: 'Top-tier large model for high-complexity tasks. Priced at $2.00 per 1M input tokens and $6.00 per 1M output tokens. Latest version released November 2024 (v24.11). Available on La Plateforme API with up to 128K context window. Supports function calling. Fine-tuning available ($9/1M tokens + storage for Fine-tuned Large 2). Also available on Azure AI Foundry.',
     },
     {
         id: 'mistral-large-latest',
@@ -2590,10 +4221,16 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 128000,
         contextLength: 128000,
         pricing: { input: 2.0, output: 6.0 },
-        capabilities: ['text', 'reasoning', 'complex-tasks', 'high-complexity'],
+        capabilities: [
+            'text',
+            'agentic',
+            'multimodal',
+            'reasoning',
+            'function-calling',
+        ],
         category: 'text',
         isLatest: true,
-        notes: 'Our top-tier large model for high-complexity tasks with the latest version released November 2024.',
+        notes: 'Top-tier large model for high-complexity tasks. Priced at $2.00 per 1M input tokens and $6.00 per 1M output tokens. Latest version released November 2024. Available on La Plateforme API with up to 128K context window. Supports function calling. Fine-tuning available ($9/1M tokens + storage for Fine-tuned Large 2). Also available on Azure AI Foundry.',
     },
     {
         id: 'pixtral-large-2411',
@@ -2621,6 +4258,19 @@ exports.AVAILABLE_MODELS = [
         isLatest: true,
         notes: 'Our first frontier-class multimodal model released November 2024.',
     },
+    {
+        id: 'mistral-small-2409',
+        name: 'Mistral Small 2.0',
+        provider: 'Mistral AI',
+        available: true,
+        maxTokens: 32000,
+        contextLength: 32000,
+        pricing: { input: 0.1, output: 0.3 },
+        capabilities: ['text', 'multimodal', 'multilingual', 'open-source'],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'An update to our efficient small model with open weights under an MRL license, released September 2024 (v24.09).',
+    },
     {
         id: 'mistral-small-2407',
         name: 'Mistral Small 2',
@@ -2632,7 +4282,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'multimodal', 'multilingual', 'open-source'],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Our updated small version, released September 2024.',
+        notes: 'Our updated small version, released September 2024 (v24.07).',
     },
     {
         id: 'mistral-embed',
@@ -2641,11 +4291,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 8192,
         contextLength: 8192,
-        pricing: { input: 0.1, output: 0.1 },
-        capabilities: ['embedding', 'text', 'semantic'],
+        pricing: { input: 0.01, output: 0.0 },
+        capabilities: ['text', 'embedding', 'semantic-search'],
         category: 'embedding',
         isLatest: true,
-        notes: 'Our state-of-the-art semantic for extracting representation of text extracts.',
+        notes: 'Embedding model for extracting semantic representations of text. Priced at $0.01 per 1M tokens. Our state-of-the-art semantic for extracting representation of text extracts. Available on La Plateforme API.',
     },
     {
         id: 'codestral-embed-2505',
@@ -2654,8 +4304,8 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 8192,
         contextLength: 8192,
-        pricing: { input: 0.15, output: 0.15 },
-        capabilities: ['embedding', 'code', 'semantic'],
+        pricing: { input: 0.15, output: 0.0 },
+        capabilities: ['coding', 'embedding'],
         category: 'embedding',
         isLatest: true,
         notes: 'Our state-of-the-art semantic for extracting representation of code extracts.',
@@ -2715,21 +4365,33 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 40000,
         contextLength: 40000,
         pricing: { input: 0.5, output: 1.5 },
+        capabilities: ['text', 'reasoning', 'lightweight'],
+        category: 'reasoning',
+        isLatest: true,
+        notes: 'Our small multimodal reasoning model released September 2025 (v25.09).',
+    },
+    {
+        id: 'magistral-small-2507',
+        name: 'Magistral Small 1.1',
+        provider: 'Mistral AI',
+        available: true,
+        maxTokens: 40000,
+        contextLength: 40000,
+        pricing: { input: 0.5, output: 1.5 },
         capabilities: [
             'text',
             'reasoning',
             'thinking',
             'domain-specific',
             'multilingual',
-            'multimodal',
         ],
         category: 'reasoning',
-        isLatest: true,
-        notes: 'Our small multimodal reasoning model released September 2025 (v25.09).',
+        isLatest: false,
+        notes: 'Our small reasoning model released July 2025 (v25.07). Deprecated October 31, 2025, retirement November 30, 2025. Use Magistral Small 1.2 instead.',
     },
     {
-        id: 'magistral-small-2507',
-        name: 'Magistral Small 1.1',
+        id: 'magistral-small-2506',
+        name: 'Magistral Small 1.0',
         provider: 'Mistral AI',
         available: true,
         maxTokens: 40000,
@@ -2744,7 +4406,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'reasoning',
         isLatest: false,
-        notes: 'Our small reasoning model released July 2025 (v25.07). Deprecated October 31, 2025, retirement November 30, 2025. Use Magistral Small 1.2 instead.',
+        notes: 'Our first small reasoning model released June 2025 (v25.06). Deprecated October 31, 2025, retirement November 30, 2025. Use Magistral Small 1.2 instead.',
     },
     {
         id: 'voxtral-small-2507',
@@ -2767,11 +4429,37 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 32000,
         contextLength: 32000,
         pricing: { input: 0.1, output: 0.1 },
-        capabilities: ['audio', 'instruct', 'multimodal'],
+        capabilities: ['voice', 'text'],
         category: 'audio',
         isLatest: true,
         notes: 'Our first model with audio input capabilities for instruct use cases.',
     },
+    {
+        id: 'voxtral-mini-2507',
+        name: 'Voxtral Mini',
+        provider: 'Mistral AI',
+        available: true,
+        maxTokens: 32000,
+        contextLength: 32000,
+        pricing: { input: 0.1, output: 0.1 },
+        capabilities: ['audio', 'instruct', 'mini'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'A mini version of our first audio input model.',
+    },
+    {
+        id: 'voxtral-mini-latest',
+        name: 'Voxtral Mini',
+        provider: 'Mistral AI',
+        available: true,
+        maxTokens: 32000,
+        contextLength: 32000,
+        pricing: { input: 0.1, output: 0.1 },
+        capabilities: ['voice', 'text'],
+        category: 'audio',
+        isLatest: true,
+        notes: 'A mini version of our first audio input model.',
+    },
     {
         id: 'mistral-small-2506',
         name: 'Mistral Small 3.2',
@@ -2783,10 +4471,49 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'multimodal', 'multilingual', 'open-source'],
         category: 'multimodal',
         isLatest: true,
-        notes: 'An update to our previous small model, released June 2025.',
+        notes: 'An update to our previous small model, released June 2025 (v25.06).',
+    },
+    {
+        id: 'mistral-small-latest',
+        name: 'Mistral Small 3.2',
+        provider: 'Mistral AI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.1, output: 0.3 },
+        capabilities: [
+            'text',
+            'agentic',
+            'multimodal',
+            'lightweight',
+            'function-calling',
+        ],
+        category: 'multimodal',
+        isLatest: true,
+        notes: 'An update to our previous small model, released June 2025. Priced at $0.10 per 1M input tokens and $0.30 per 1M output tokens. Available on La Plateforme API with up to 128K context window. Supports function calling. Fine-tuning available. Also available on Azure AI Foundry.',
     },
     {
         id: 'mistral-small-2503',
+        name: 'Mistral Small 3.1',
+        provider: 'Mistral AI',
+        available: true,
+        maxTokens: 128000,
+        contextLength: 128000,
+        pricing: { input: 0.1, output: 0.3 },
+        capabilities: [
+            'text',
+            'multimodal',
+            'multilingual',
+            'open-source',
+            'image-understanding',
+            'function-calling',
+        ],
+        category: 'multimodal',
+        isLatest: false,
+        notes: 'A new leader in the small models category with image understanding capabilities, released March 2025 (v25.03). Priced at $0.10 per 1M input tokens and $0.30 per 1M output tokens. Available on La Plateforme API with up to 128K context window. Supports function calling. Fine-tuning available. Also available on Azure AI Foundry.',
+    },
+    {
+        id: 'mistral-small-2501',
         name: 'Mistral Small 3.0',
         provider: 'Mistral AI',
         available: true,
@@ -2796,33 +4523,33 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'multimodal', 'multilingual', 'open-source'],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Mistral Small 3.0 model released March 2025.',
+        notes: 'A small efficient and powerful 24B open model for personal or commercial use, released January 2025 (v25.01).',
     },
     {
         id: 'ministral-3b',
         name: 'Ministral 3B',
         provider: 'Mistral AI',
         available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 0.05, output: 0.15 },
-        capabilities: ['text', 'lightweight', 'edge', 'open-source'],
+        maxTokens: 32000,
+        contextLength: 32000,
+        pricing: { input: 0.0, output: 0.0 },
+        capabilities: ['text', 'edge', 'mobile', 'open-source'],
         category: 'text',
         isLatest: true,
-        notes: "World's best edge model. 3B parameter model optimized for edge devices.",
+        notes: "World's best edge model released October 2024 (v24.1).",
     },
     {
         id: 'ministral-8b',
         name: 'Ministral 8B',
         provider: 'Mistral AI',
         available: true,
-        maxTokens: 128000,
-        contextLength: 128000,
-        pricing: { input: 0.1, output: 0.3 },
-        capabilities: ['text', 'edge', 'open-source', 'high-performance'],
+        maxTokens: 32000,
+        contextLength: 32000,
+        pricing: { input: 0.0, output: 0.0 },
+        capabilities: ['text', 'edge', 'mobile', 'open-source', 'high-performance'],
         category: 'text',
         isLatest: true,
-        notes: 'Powerful edge model with extremely high performance/price ratio. 8B parameter model.',
+        notes: 'Powerful edge model with extremely high performance/price ratio, released October 2024 (v24.1).',
     },
     {
         id: 'devstral-small-2507',
@@ -2851,13 +4578,7 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 128000,
         contextLength: 128000,
         pricing: { input: 0.1, output: 0.3 },
-        capabilities: [
-            'code',
-            'agents',
-            'open-source',
-            'codebase-exploration',
-            'multi-file-editing',
-        ],
+        capabilities: ['coding', 'agentic', 'text', 'lightweight'],
         category: 'code',
         isLatest: true,
         notes: 'An update to our open source model that excels at using tools to explore codebases, editing multiple files and power software engineering agents.',
@@ -2896,16 +4617,16 @@ exports.AVAILABLE_MODELS = [
     },
     {
         id: 'devstral-small-2505',
-        name: 'Devstral Small 1',
+        name: 'Devstral Small 1.0',
         provider: 'Mistral AI',
         available: true,
         maxTokens: 128000,
         contextLength: 128000,
         pricing: { input: 0.1, output: 0.3 },
-        capabilities: ['code', 'agents', 'open-source', '24b-parameter'],
+        capabilities: ['code', 'agents', 'open-source', '24b-parameter', 'swe'],
         category: 'code',
         isLatest: false,
-        notes: 'A 24B text model, open source model that excels at using tools to explore codebases, editing multiple files and power software engineering agents.',
+        notes: 'A 24B text model, open source model that excels at SWE use cases, released May 2025 (v25.05). Deprecated October 31, 2025, retirement November 30, 2025. Use Devstral Small 1.1 instead.',
     },
     {
         id: 'pixtral-12b-2409',
@@ -2918,7 +4639,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['vision', 'multimodal', 'small', 'image-understanding'],
         category: 'multimodal',
         isLatest: true,
-        notes: 'A 12B model with image understanding capabilities in addition to text.',
+        notes: 'Multimodal model with image understanding capabilities. Priced at $0.15 per 1M tokens (input/output). A 12B model with image understanding capabilities in addition to text. Available on La Plateforme API with up to 128K context window. Also available on Azure AI Foundry.',
     },
     {
         id: 'pixtral-12b',
@@ -2931,7 +4652,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['vision', 'multimodal', 'small', 'image-understanding'],
         category: 'multimodal',
         isLatest: true,
-        notes: 'A 12B model with image understanding capabilities in addition to text.',
+        notes: 'Multimodal model with image understanding capabilities. Priced at $0.15 per 1M tokens (input/output). A 12B model with image understanding capabilities in addition to text. Available on La Plateforme API with up to 128K context window. Also available on Azure AI Foundry.',
     },
     {
         id: 'open-mistral-nemo-2407',
@@ -2944,7 +4665,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'multilingual', 'open-source', 'best-multilingual'],
         category: 'text',
         isLatest: true,
-        notes: 'Our best multilingual open source model released July 2024.',
+        notes: 'Our best multilingual open source model released July 2024. Priced at $0.15 per 1M tokens (input/output). Available on La Plateforme API with up to 128K context window. Also available on Azure AI Foundry.',
     },
     {
         id: 'open-mistral-nemo',
@@ -2957,7 +4678,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'multilingual', 'open-source', 'best-multilingual'],
         category: 'text',
         isLatest: true,
-        notes: 'Our best multilingual open source model released July 2024.',
+        notes: 'Our best multilingual open source model released July 2024. Priced at $0.15 per 1M tokens (input/output). Available on La Plateforme API with up to 128K context window. Also available on Azure AI Foundry.',
     },
     {
         id: 'mistral-nemo',
@@ -2983,7 +4704,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'open-source', 'fast'],
         category: 'text',
         isLatest: false,
-        notes: 'A 7B transformer model, fast-deployed and easily customisable.',
+        notes: 'A 7B transformer model, fast-deployed and easily customisable. Open-source/open-weights model available for self-hosting (free to use, but requires own infrastructure). Also available on La Plateforme API and Azure AI Foundry.',
     },
     {
         id: 'open-mixtral-8x7b',
@@ -2996,7 +4717,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'mixture-of-experts', 'open-source'],
         category: 'text',
         isLatest: false,
-        notes: 'A 7B sparse Mixture-of-Experts (SMoE). Uses 12.9B active parameters out of 45B total.',
+        notes: 'A 7B sparse Mixture-of-Experts (SMoE). Uses 12.9B active parameters out of 45B total. Open-source/open-weights model available for self-hosting (free to use, but requires own infrastructure). Also available on La Plateforme API and Azure AI Foundry.',
     },
     {
         id: 'open-mixtral-8x22b',
@@ -3017,7 +4738,34 @@ exports.AVAILABLE_MODELS = [
         notes: 'Most performant open model. A 22B sparse Mixture-of-Experts (SMoE). Uses only 39B active parameters out of 141B.',
     },
     // === Grok AI Models ===
-    // === Grok 4 Fast Series (Latest) ===
+    // === Grok 4.1 Fast Series (Latest) ===
+    {
+        id: 'grok-4-1-fast-reasoning',
+        name: 'Grok 4.1 Fast Reasoning',
+        provider: 'xAI',
+        available: true,
+        maxTokens: 2000000,
+        contextLength: 2000000,
+        pricing: { input: 0.2, output: 0.5 },
+        capabilities: ['text', 'vision', 'reasoning', 'agents', 'tools'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Latest cost-efficient reasoning model with 2M context window. Lightning fast, low cost. Priced at $0.20 per 1M input tokens and $0.50 per 1M output tokens. Rate limits: 4M TPM (tokens per minute), 480 RPM (requests per minute)',
+    },
+    {
+        id: 'grok-4-1-fast-non-reasoning',
+        name: 'Grok 4.1 Fast Non-Reasoning',
+        provider: 'xAI',
+        available: true,
+        maxTokens: 2000000,
+        contextLength: 2000000,
+        pricing: { input: 0.2, output: 0.5 },
+        capabilities: ['text', 'vision', 'fast'],
+        category: 'text',
+        isLatest: true,
+        notes: 'Latest cost-efficient non-reasoning model with 2M context window. Lightning fast, low cost. Priced at $0.20 per 1M input tokens and $0.50 per 1M output tokens. Rate limits: 4M TPM (tokens per minute), 480 RPM (requests per minute)',
+    },
+    // === Grok 4 Fast Series ===
     {
         id: 'grok-4-fast-reasoning',
         name: 'Grok 4 Fast Reasoning',
@@ -3026,15 +4774,10 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 2000000,
         contextLength: 2000000,
         pricing: { input: 0.2, output: 0.5 },
-        capabilities: [
-            'text',
-            'reasoning',
-            'function-calling',
-            'structured-outputs',
-        ],
+        capabilities: ['text', 'vision', 'reasoning', 'agents'],
         category: 'text',
         isLatest: true,
-        notes: 'Latest cost-efficient reasoning model with 2M context window. Lightning fast, low cost. 4M TPM, 480 RPM rate limits',
+        notes: 'Cost-efficient reasoning model with 2M context window. Lightning fast, low cost. Priced at $0.20 per 1M input tokens and $0.50 per 1M output tokens. Rate limits: 4M TPM (tokens per minute), 480 RPM (requests per minute)',
     },
     {
         id: 'grok-4-fast-non-reasoning',
@@ -3044,10 +4787,10 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 2000000,
         contextLength: 2000000,
         pricing: { input: 0.2, output: 0.5 },
-        capabilities: ['text', 'function-calling', 'structured-outputs'],
+        capabilities: ['text', 'vision', 'fast'],
         category: 'text',
         isLatest: true,
-        notes: 'Latest cost-efficient non-reasoning model with 2M context window. Lightning fast, low cost. 4M TPM, 480 RPM rate limits',
+        notes: 'Cost-efficient non-reasoning model with 2M context window. Lightning fast, low cost. Priced at $0.20 per 1M input tokens and $0.50 per 1M output tokens. Rate limits: 4M TPM (tokens per minute), 480 RPM (requests per minute)',
     },
     {
         id: 'grok-code-fast-1',
@@ -3057,15 +4800,10 @@ exports.AVAILABLE_MODELS = [
         maxTokens: 256000,
         contextLength: 256000,
         pricing: { input: 0.2, output: 1.5 },
-        capabilities: [
-            'code',
-            'programming',
-            'function-calling',
-            'structured-outputs',
-        ],
+        capabilities: ['text', 'coding', 'function-calling', 'structured-outputs'],
         category: 'code',
         isLatest: true,
-        notes: 'Cost-efficient coding model optimized for code generation and programming tasks. 2M TPM, 480 RPM rate limits',
+        notes: 'Cost-efficient coding model optimized for code generation and programming tasks. Priced at $0.20 per 1M input tokens and $1.50 per 1M output tokens. Context window: 256K tokens. Rate limits: 2M TPM (tokens per minute), 480 RPM (requests per minute)',
     },
     // === Grok 4 Series ===
     {
@@ -3084,7 +4822,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'text',
         isLatest: true,
-        notes: 'Latest Grok 4 reasoning model. Note: Grok 4 is always a reasoning model with no non-reasoning mode. 2M TPM, 480 RPM rate limits. Knowledge cutoff: November 2024',
+        notes: 'Latest Grok 4 reasoning model. Note: Grok 4 is always a reasoning model with no non-reasoning mode. Priced at $3.00 per 1M input tokens and $15.00 per 1M output tokens. Context window: 256K tokens. Rate limits: 2M TPM (tokens per minute), 480 RPM (requests per minute). Knowledge cutoff: November 2024',
     },
     {
         id: 'grok-4',
@@ -3102,7 +4840,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'text',
         isLatest: true,
-        notes: 'Alias for latest stable Grok 4 version. Points to grok-4-0709. 2M TPM, 480 RPM rate limits',
+        notes: 'Alias for latest stable Grok 4 version. Points to grok-4-0709. Priced at $3.00 per 1M input tokens and $15.00 per 1M output tokens. Context window: 256K tokens. Rate limits: 2M TPM (tokens per minute), 480 RPM (requests per minute)',
     },
     {
         id: 'grok-4-latest',
@@ -3120,7 +4858,7 @@ exports.AVAILABLE_MODELS = [
         ],
         category: 'text',
         isLatest: true,
-        notes: 'Alias for latest Grok 4 version (may include preview features). Auto-updates with new releases. 2M TPM, 480 RPM rate limits',
+        notes: 'Alias for latest Grok 4 version (may include preview features). Auto-updates with new releases. Priced at $3.00 per 1M input tokens and $15.00 per 1M output tokens. Context window: 256K tokens. Rate limits: 2M TPM (tokens per minute), 480 RPM (requests per minute)',
     },
     // === Grok 3 Series ===
     {
@@ -3134,7 +4872,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'vision', 'function-calling', 'structured-outputs'],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Standard Grok 3 model. 600 RPM rate limits. Knowledge cutoff: November 2024',
+        notes: 'Standard Grok 3 model. Priced at $3.00 per 1M input tokens and $15.00 per 1M output tokens. Context window: 131K tokens. Rate limits: 600 RPM (requests per minute). Knowledge cutoff: November 2024',
     },
     {
         id: 'grok-3-mini',
@@ -3147,7 +4885,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'vision', 'function-calling', 'structured-outputs'],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Cost-effective Grok 3 Mini model. 480 RPM rate limits. Knowledge cutoff: November 2024',
+        notes: 'Cost-effective Grok 3 Mini model. Priced at $0.30 per 1M input tokens and $0.50 per 1M output tokens. Context window: 131K tokens. Rate limits: 480 RPM (requests per minute). Knowledge cutoff: November 2024',
     },
     // === Grok 2 Vision Series ===
     {
@@ -3161,7 +4899,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'vision', 'image-understanding'],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Grok 2 Vision model for image understanding. 600 RPM rate limits (us-east-1) or 50 RPS (eu-west-1)',
+        notes: 'Grok 2 Vision model for image understanding. Priced at $2.00 per 1M input tokens and $10.00 per 1M output tokens. Context window: 32K tokens. Rate limits: 600 RPM (requests per minute) for us-east-1 region, 50 RPS (requests per second) for eu-west-1 region',
     },
     {
         id: 'grok-2-vision-1212-us-east-1',
@@ -3174,7 +4912,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'vision', 'image-understanding'],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Grok 2 Vision model for us-east-1 region. 600 RPM rate limits',
+        notes: 'Grok 2 Vision model for us-east-1 region. Priced at $2.00 per 1M input tokens and $10.00 per 1M output tokens. Context window: 32K tokens. Rate limits: 600 RPM (requests per minute)',
     },
     {
         id: 'grok-2-vision-1212-eu-west-1',
@@ -3187,7 +4925,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'vision', 'image-understanding'],
         category: 'multimodal',
         isLatest: false,
-        notes: 'Grok 2 Vision model for eu-west-1 region. 50 RPS rate limits',
+        notes: 'Grok 2 Vision model for eu-west-1 region. Priced at $2.00 per 1M input tokens and $10.00 per 1M output tokens. Context window: 32K tokens. Rate limits: 50 RPS (requests per second)',
     },
     // === Grok 2 Image Generation ===
     {
@@ -3197,11 +4935,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.07, output: 0.07 },
-        capabilities: ['image-generation'],
+        pricing: { input: 0.07, output: 0.0 },
+        capabilities: ['image-generation', 'text-to-image'],
         category: 'image',
         isLatest: true,
-        notes: 'Grok 2 image generation model. $0.07 per image output, 300 RPM rate limits',
+        notes: 'Grok 2 image generation model. Priced at $0.07 per image output. Rate limits: 300 RPM (requests per minute)',
     },
     {
         id: 'grok-2-image',
@@ -3210,11 +4948,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.07, output: 0.07 },
-        capabilities: ['image-generation'],
+        pricing: { input: 0.07, output: 0.0 },
+        capabilities: ['image-generation', 'text-to-image'],
         category: 'image',
         isLatest: true,
-        notes: 'Alias for latest stable Grok 2 Image version. Points to grok-2-image-1212. $0.07 per image, 300 RPM rate limits',
+        notes: 'Alias for latest stable Grok 2 Image version. Points to grok-2-image-1212. Priced at $0.07 per image output. Rate limits: 300 RPM (requests per minute)',
     },
     {
         id: 'grok-2-image-latest',
@@ -3223,11 +4961,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 0,
         contextLength: 0,
-        pricing: { input: 0.07, output: 0.07 },
-        capabilities: ['image-generation'],
+        pricing: { input: 0.07, output: 0.0 },
+        capabilities: ['image-generation', 'text-to-image'],
         category: 'image',
         isLatest: true,
-        notes: 'Alias for latest Grok 2 Image version. Auto-updates with new releases. $0.07 per image, 300 RPM rate limits',
+        notes: 'Alias for latest Grok 2 Image version. Auto-updates with new releases. Priced at $0.07 per image output. Rate limits: 300 RPM (requests per minute)',
     },
     // === Meta Llama Models ===
     // === Llama 4 Series (Latest) ===
@@ -3238,18 +4976,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 10000000,
         contextLength: 10000000,
-        pricing: { input: 0.19, output: 0.49 },
-        capabilities: [
-            'text',
-            'vision',
-            'multimodal',
-            'long-context',
-            'multilingual',
-            'image-grounding',
-        ],
+        pricing: { input: 0.15, output: 0.45 },
+        capabilities: ['text', 'vision', 'coding', 'reasoning'],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Class-leading natively multimodal model with superior text and visual intelligence. 17B active params x 16 experts, 109B total params. Includes Llama Guard 4 12B, Llama Prompt Guard 2 22M and 86M. Licensed under Llama 4 Community License Agreement',
+        notes: 'Class-leading natively multimodal model with superior text and visual intelligence. 17B active params x 16 experts, 109B total params. Includes Llama Guard 4 12B, Llama Prompt Guard 2 22M and 86M. Features 10M context window and improved multimodal capabilities. Pricing varies by provider: ~$0.08-$0.18 per 1M input tokens, ~$0.30-$0.59 per 1M output tokens. Available on Azure, AWS Bedrock, Together AI, and DeepInfra. Licensed under Llama 4 Community License Agreement',
     },
     {
         id: 'llama-4-maverick',
@@ -3258,19 +4989,18 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 10000000,
         contextLength: 10000000,
-        pricing: { input: 0.19, output: 0.49 },
+        pricing: { input: 0.25, output: 0.75 },
         capabilities: [
             'text',
             'vision',
-            'multimodal',
-            'long-context',
+            'coding',
+            'reasoning',
             'multilingual',
-            'image-grounding',
-            'fast-responses',
+            'long-context',
         ],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Industry-leading natively multimodal model with groundbreaking intelligence and fast responses at a low cost. 17B active params x 128 experts, 400B total params. Includes Llama Guard 4 12B, Llama Prompt Guard 2 22M and 86M. Licensed under Llama 4 Community License Agreement',
+        notes: 'Industry-leading natively multimodal model with groundbreaking intelligence and fast responses at a low cost. 17B active params x 128 experts, 400B total params. Includes Llama Guard 4 12B, Llama Prompt Guard 2 22M and 86M. Features 10M context window and improved multimodal capabilities. Pricing varies by provider: ~$0.15-$0.27 per 1M input tokens, ~$0.60-$0.85 per 1M output tokens. Available on Azure, AWS Bedrock, Together AI, and DeepInfra. Licensed under Llama 4 Community License Agreement',
     },
     {
         id: 'llama-4-behemoth-preview',
@@ -3279,16 +5009,8 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 10000000,
         contextLength: 10000000,
-        pricing: { input: 0.19, output: 0.49 },
-        capabilities: [
-            'text',
-            'vision',
-            'multimodal',
-            'long-context',
-            'multilingual',
-            'image-grounding',
-            'teacher-model',
-        ],
+        pricing: { input: 0.3, output: 0.3 },
+        capabilities: ['text', 'vision', 'coding', 'reasoning', 'multilingual'],
         category: 'multimodal',
         isLatest: true,
         notes: 'Early preview of the Llama 4 teacher model used to distill Llama 4 Scout and Llama 4 Maverick. Still in training phase. Licensed under Llama 4 Community License Agreement',
@@ -3301,11 +5023,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 131072,
         contextLength: 131072,
-        pricing: { input: 0.59, output: 0.79 },
-        capabilities: ['text', 'multilingual', 'open-source'],
+        pricing: { input: 0.1, output: 0.1 },
+        capabilities: ['text', 'coding'],
         category: 'text',
         isLatest: true,
-        notes: 'Multilingual open source large language model. Experience 405B performance and quality at a fraction of the cost. Licensed under Llama 3.3 Community License Agreement',
+        notes: 'Multilingual open source large language model. Experience 405B performance and quality at a fraction of the cost. Highly cost-efficient model delivering performance comparable to larger models at significantly lower cost. Pricing varies by provider: ~$0.07-$0.88 per 1M tokens (input/output). Available on Azure AI Foundry (~$0.70/1M tokens), AWS Bedrock, Together AI, and DeepInfra. Licensed under Llama 3.3 Community License Agreement',
     },
     // === Llama 3.2 Series ===
     {
@@ -3315,11 +5037,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 128000,
         contextLength: 128000,
-        pricing: { input: 0.16, output: 0.16 },
-        capabilities: ['text', 'vision', 'multimodal', 'open-source'],
+        pricing: { input: 0.08, output: 0.08 },
+        capabilities: ['text', 'vision'],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Open multimodal model that is flexible and can reason on high resolution images and output text. Includes Llama Guard 3 11B Vision. Licensed under Llama 3.2 Community License Agreement',
+        notes: 'Open multimodal model that is flexible and can reason on high resolution images and output text. Includes Llama Guard 3 11B Vision. Pricing varies by provider: ~$0.02-$0.18 per 1M tokens (input/output). Available on Azure, AWS Bedrock, Together AI, and DeepInfra. Licensed under Llama 3.2 Community License Agreement',
     },
     {
         id: 'llama-3.2-90b',
@@ -3332,7 +5054,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'vision', 'multimodal', 'open-source'],
         category: 'multimodal',
         isLatest: true,
-        notes: 'Open multimodal model that is flexible and can reason on high resolution images and output text. Includes Llama Guard 3 11B Vision. Licensed under Llama 3.2 Community License Agreement',
+        notes: 'Open multimodal model that is flexible and can reason on high resolution images and output text. Includes Llama Guard 3 11B Vision. Pricing varies by provider. Available on Azure, AWS Bedrock, Together AI, and DeepInfra. Licensed under Llama 3.2 Community License Agreement',
     },
     {
         id: 'llama-3.2-3b',
@@ -3345,7 +5067,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'lightweight', 'mobile', 'edge', 'open-source'],
         category: 'text',
         isLatest: true,
-        notes: 'Lightweight and most cost-efficient model you can run anywhere on mobile and on edge devices. Includes Llama Guard 3 1B. Quantized models available. Licensed under Llama 3.2 Community License Agreement',
+        notes: 'Lightweight and most cost-efficient model you can run anywhere on mobile and on edge devices. Includes Llama Guard 3 1B. Quantized models available. Pricing varies by provider: ~$0.02-$0.18 per 1M tokens (input/output). Available on Azure, AWS Bedrock, Together AI, and DeepInfra. Licensed under Llama 3.2 Community License Agreement',
     },
     {
         id: 'llama-3.2-1b',
@@ -3358,7 +5080,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'lightweight', 'mobile', 'edge', 'open-source'],
         category: 'text',
         isLatest: true,
-        notes: 'Lightweight and most cost-efficient model you can run anywhere on mobile and on edge devices. Includes Llama Guard 3 1B. Quantized models available. Licensed under Llama 3.2 Community License Agreement',
+        notes: 'Lightweight and most cost-efficient model you can run anywhere on mobile and on edge devices. Includes Llama Guard 3 1B. Quantized models available. Pricing varies by provider: ~$0.02-$0.18 per 1M tokens (input/output). Available on Azure, AWS Bedrock, Together AI, and DeepInfra. Licensed under Llama 3.2 Community License Agreement',
     },
     // === Llama 3.1 Series ===
     {
@@ -3368,11 +5090,11 @@ exports.AVAILABLE_MODELS = [
         available: true,
         maxTokens: 131072,
         contextLength: 131072,
-        pricing: { input: 0.0, output: 0.0 },
-        capabilities: ['text', 'multilingual', 'open-source'],
+        pricing: { input: 2.25, output: 2.25 },
+        capabilities: ['text', 'reasoning'],
         category: 'text',
         isLatest: false,
-        notes: 'Multilingual open source large language model. Includes Llama Guard 3 8B and Llama Prompt Guard 2. Licensed under Llama 3.1 Community License Agreement',
+        notes: 'Multilingual open source large language model. Includes Llama Guard 3 8B and Llama Prompt Guard 2. Pricing varies by provider: ~$1.00-$3.50 per 1M tokens (input/output). Together AI offers at $3.50/1M tokens. Available on Azure, AWS Bedrock, Together AI, and DeepInfra. Licensed under Llama 3.1 Community License Agreement',
     },
     {
         id: 'llama-3.1-8b',
@@ -3385,7 +5107,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'multilingual', 'open-source'],
         category: 'text',
         isLatest: false,
-        notes: 'Multilingual open source large language model. Includes Llama Guard 3 8B and Llama Prompt Guard 2. Licensed under Llama 3.1 Community License Agreement',
+        notes: 'Multilingual open source large language model. Includes Llama Guard 3 8B and Llama Prompt Guard 2. Pricing varies by provider: ~$0.02-$0.18 per 1M tokens (input/output). Together AI offers at $0.18/1M tokens. DeepInfra provides Llama-3.1-8B-Instruct-Turbo at $0.02/$0.03 (input/output) per million tokens. Available on Azure, AWS Bedrock, Together AI, and DeepInfra. Licensed under Llama 3.1 Community License Agreement',
     },
     // === Llama 3 Series (Legacy) ===
     {
@@ -3399,7 +5121,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'open-source'],
         category: 'text',
         isLatest: false,
-        notes: 'Legacy Llama 3 70B model. Licensed under Llama 3 Community License Agreement',
+        notes: 'Legacy Llama 3 70B model. Available on Azure, AWS Bedrock, Together AI, and DeepInfra. Self-hosting requires substantial GPU resources (e.g., H100s). Licensed under Llama 3 Community License Agreement',
     },
     {
         id: 'llama-3-8b',
@@ -3412,7 +5134,7 @@ exports.AVAILABLE_MODELS = [
         capabilities: ['text', 'open-source'],
         category: 'text',
         isLatest: false,
-        notes: 'Legacy Llama 3 8B model. Licensed under Llama 3 Community License Agreement',
+        notes: 'Legacy Llama 3 8B model. Available on Azure, AWS Bedrock, Together AI, and DeepInfra. Models are open-source and can be run for free if you have your own hardware. Licensed under Llama 3 Community License Agreement',
     },
 ];
 const getModelsByProvider = (provider) => {