@sudobility/shapeshyft_types 1.0.21 → 1.0.22

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/dist/index.cjs CHANGED
@@ -4,9 +4,13 @@
  * TypeScript types for ShapeShyft API - LLM structured output platform
  */
 Object.defineProperty(exports, "__esModule", { value: true });
- exports.COST_PER_MILLION_TOKENS = exports.PROVIDER_ALLOWS_CUSTOM_MODEL = exports.DEFAULT_PROVIDER_MODEL = exports.PROVIDER_MODELS = exports.LLM_PROVIDERS = void 0;
+ exports.COST_PER_MILLION_TOKENS = exports.MODEL_CAPABILITIES = exports.PROVIDER_ALLOWS_CUSTOM_MODEL = exports.DEFAULT_PROVIDER_MODEL = exports.PROVIDER_MODELS = exports.LLM_PROVIDERS = void 0;
+ exports.getModelCapabilities = getModelCapabilities;
+ exports.hasInputCapability = hasInputCapability;
+ exports.hasOutputCapability = hasOutputCapability;
 exports.getModelPricing = getModelPricing;
 exports.estimateCost = estimateCost;
+ exports.estimateMultimodalCost = estimateMultimodalCost;
 exports.formatCost = formatCost;
 exports.formatCostPerMillion = formatCostPerMillion;
 exports.successResponse = successResponse;
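
The new exports add a model-capability layer next to the existing pricing helpers. A minimal consumer sketch in TypeScript, assuming the package's typed entry point exposes the same names as this CJS build:

    import {
      getModelCapabilities,
      hasInputCapability,
      hasOutputCapability,
      estimateMultimodalCost,
    } from '@sudobility/shapeshyft_types';

    // Each helper is tri-state: true/false when the model is in
    // MODEL_CAPABILITIES, undefined when the model is unknown.
    hasInputCapability('gpt-4o', 'audio');            // true
    hasOutputCapability('gpt-4o', 'image');           // false
    hasInputCapability('my-custom-model', 'vision');  // undefined
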
@@ -24,30 +28,75 @@ exports.LLM_PROVIDERS = [
  'perplexity',
  'llm_server',
 ];
- /** Models available for each provider */
+ /** Models available for each provider (January 2026) */
 exports.PROVIDER_MODELS = {
- openai: ['gpt-4o', 'gpt-4o-mini', 'gpt-4-turbo', 'gpt-3.5-turbo', 'o1', 'o1-mini', 'o1-pro'],
- anthropic: ['claude-sonnet-4-20250514', 'claude-opus-4-20250514', 'claude-3-5-haiku-20241022'],
- gemini: ['gemini-2.0-flash', 'gemini-2.0-flash-lite', 'gemini-1.5-pro', 'gemini-1.5-flash'],
- mistral: ['mistral-large-latest', 'mistral-medium-latest', 'mistral-small-latest', 'codestral-latest', 'mistral-nemo'],
- cohere: ['command-r-plus', 'command-r', 'command', 'command-light'],
- groq: ['llama-3.3-70b-versatile', 'llama-3.1-8b-instant', 'mixtral-8x7b-32768', 'gemma2-9b-it'],
- xai: ['grok-2', 'grok-2-mini'],
- deepseek: ['deepseek-chat', 'deepseek-coder', 'deepseek-reasoner'],
- perplexity: ['llama-3.1-sonar-small-128k-online', 'llama-3.1-sonar-large-128k-online', 'llama-3.1-sonar-huge-128k-online'],
- llm_server: ['qwen/qwen3-30b-a3b-2507', 'meta-llama-3.1-8b-instruct', 'qwen-32b-everything', 'openai/gpt-oss-20b'],
+ openai: [
+ 'gpt-4.1', 'gpt-4.1-mini', 'gpt-4.1-nano',
+ 'gpt-4o', 'gpt-4o-mini',
+ 'o3', 'o3-pro', 'o4-mini',
+ 'gpt-4-turbo', 'o1',
+ ],
+ anthropic: [
+ 'claude-opus-4-5-20251124', 'claude-sonnet-4-5-20251124',
+ 'claude-opus-4-1-20250805',
+ 'claude-sonnet-4-20250514', 'claude-opus-4-20250514',
+ 'claude-3-5-haiku-20241022',
+ ],
+ gemini: [
+ 'gemini-3-pro-preview', 'gemini-3-flash-preview', 'gemini-3-pro-image-preview',
+ 'gemini-2.5-pro', 'gemini-2.5-flash', 'gemini-2.5-flash-lite', 'gemini-2.5-flash-image', 'gemini-2.5-flash-native-audio-preview',
+ 'gemini-2.0-flash', 'gemini-2.0-flash-lite',
+ ],
+ mistral: [
+ 'mistral-large-2512', 'mistral-large-latest',
+ 'mistral-medium-3.1', 'mistral-medium-latest',
+ 'mistral-small-3.2', 'mistral-small-latest',
+ 'ministral-3b-2512', 'ministral-8b-2512', 'ministral-14b-2512',
+ 'codestral-2501', 'codestral-latest',
+ 'pixtral-large-2411', 'pixtral-large-latest',
+ 'voxtral-small', 'voxtral-mini',
+ 'mistral-ocr-2512',
+ ],
+ cohere: [
+ 'command-a-03-2025', 'command-a-reasoning', 'command-a-vision',
+ 'command-r-plus-08-2024', 'command-r-08-2024',
+ 'command-r-plus', 'command-r',
+ ],
+ groq: [
+ 'llama-3.3-70b-versatile', 'llama-3.1-8b-instant',
+ 'openai/gpt-oss-120b', 'openai/gpt-oss-20b',
+ 'groq/compound', 'groq/compound-mini',
+ 'meta-llama/llama-guard-4-12b',
+ 'whisper-large-v3', 'whisper-large-v3-turbo',
+ ],
+ xai: [
+ 'grok-4', 'grok-4.1-fast',
+ 'grok-3', 'grok-3-mini', 'grok-3-vision',
+ 'grok-2', 'grok-2-vision',
+ ],
+ deepseek: ['deepseek-chat', 'deepseek-reasoner'],
+ perplexity: [
+ 'sonar', 'sonar-pro',
+ 'sonar-reasoning', 'sonar-reasoning-pro',
+ 'sonar-deep-research',
+ ],
+ llm_server: [
+ 'qwen/qwen3-30b-a3b-2507', 'meta-llama-3.1-8b-instruct', 'qwen-32b-everything', 'openai/gpt-oss-20b',
+ 'llava-v1.6-mistral-7b', 'llava-v1.6-vicuna-13b', 'qwen2-vl-7b-instruct', 'phi-3-vision-128k-instruct',
+ 'minicpm-v-2_6', 'moondream2', 'internvl2-8b', 'llama-3.2-11b-vision', 'pixtral-12b',
+ ],
 };
- /** Default model for each provider */
+ /** Default model for each provider (January 2026) */
 exports.DEFAULT_PROVIDER_MODEL = {
- openai: 'gpt-4o-mini',
- anthropic: 'claude-sonnet-4-20250514',
- gemini: 'gemini-2.0-flash',
+ openai: 'gpt-4.1-mini',
+ anthropic: 'claude-sonnet-4-5-20251124',
+ gemini: 'gemini-2.5-flash',
 mistral: 'mistral-small-latest',
- cohere: 'command-r',
+ cohere: 'command-r-08-2024',
 groq: 'llama-3.3-70b-versatile',
- xai: 'grok-2-mini',
+ xai: 'grok-3-mini',
 deepseek: 'deepseek-chat',
- perplexity: 'llama-3.1-sonar-small-128k-online',
+ perplexity: 'sonar',
 llm_server: 'meta-llama-3.1-8b-instruct',
 };
 /** Providers that allow custom model input (user can type any model name) */
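
The lookup pattern for consumers is unchanged; only the data moved forward. A sketch of a typical model-resolution flow, where the resolveModel helper is hypothetical and not part of the package:

    import {
      PROVIDER_MODELS,
      DEFAULT_PROVIDER_MODEL,
      PROVIDER_ALLOWS_CUSTOM_MODEL,
    } from '@sudobility/shapeshyft_types';

    type Provider = keyof typeof PROVIDER_MODELS;

    // Hypothetical helper: accept a requested model if it is listed (or the
    // provider allows free-form names); otherwise fall back to the default.
    function resolveModel(provider: Provider, requested?: string): string {
      if (!requested) return DEFAULT_PROVIDER_MODEL[provider];
      const listed = (PROVIDER_MODELS[provider] as readonly string[]).includes(requested);
      return listed || PROVIDER_ALLOWS_CUSTOM_MODEL[provider]
        ? requested
        : DEFAULT_PROVIDER_MODEL[provider];
    }

    resolveModel('openai');        // 'gpt-4.1-mini' (the new default)
    resolveModel('xai', 'grok-4'); // 'grok-4'
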
@@ -63,84 +112,420 @@ exports.PROVIDER_ALLOWS_CUSTOM_MODEL = {
 perplexity: false,
 llm_server: true, // Users can type any model name for custom LLM servers
 };
+ /**
+ * Model capabilities map (January 2026).
+ * Maps model names to their multimodal capabilities.
+ * Models not in this map have undefined capabilities.
+ */
+ exports.MODEL_CAPABILITIES = {
+ // ===========================================================================
+ // OpenAI (January 2026)
+ // ===========================================================================
+ // GPT-4.1 family
+ 'gpt-4.1': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'gpt-4.1-mini': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'gpt-4.1-nano': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // GPT-4o (omni - multimodal)
+ 'gpt-4o': { visionInput: true, audioInput: true, videoInput: false, imageOutput: false, audioOutput: true, videoOutput: false },
+ 'gpt-4o-mini': { visionInput: true, audioInput: true, videoInput: false, imageOutput: false, audioOutput: true, videoOutput: false },
+ // Reasoning models (o-series)
+ 'o3': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'o3-pro': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'o4-mini': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // Legacy
+ 'gpt-4-turbo': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'o1': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // ===========================================================================
+ // Anthropic (January 2026)
+ // ===========================================================================
+ // Claude 4.5
+ 'claude-opus-4-5-20251124': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'claude-sonnet-4-5-20251124': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // Claude 4.1
+ 'claude-opus-4-1-20250805': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // Claude 4
+ 'claude-sonnet-4-20250514': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'claude-opus-4-20250514': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // Claude 3.5
+ 'claude-3-5-haiku-20241022': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // ===========================================================================
+ // Google Gemini (January 2026)
+ // ===========================================================================
+ // Gemini 3 (latest)
+ 'gemini-3-pro-preview': { visionInput: true, audioInput: true, videoInput: true, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'gemini-3-flash-preview': { visionInput: true, audioInput: true, videoInput: true, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'gemini-3-pro-image-preview': { visionInput: true, audioInput: false, videoInput: false, imageOutput: true, audioOutput: false, videoOutput: false },
+ // Gemini 2.5
+ 'gemini-2.5-pro': { visionInput: true, audioInput: true, videoInput: true, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'gemini-2.5-flash': { visionInput: true, audioInput: true, videoInput: true, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'gemini-2.5-flash-lite': { visionInput: true, audioInput: true, videoInput: true, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'gemini-2.5-flash-image': { visionInput: true, audioInput: false, videoInput: false, imageOutput: true, audioOutput: false, videoOutput: false },
+ 'gemini-2.5-flash-native-audio-preview': { visionInput: true, audioInput: true, videoInput: true, imageOutput: false, audioOutput: true, videoOutput: false },
+ // Gemini 2.0
+ 'gemini-2.0-flash': { visionInput: true, audioInput: true, videoInput: true, imageOutput: true, audioOutput: true, videoOutput: false },
+ 'gemini-2.0-flash-lite': { visionInput: true, audioInput: true, videoInput: true, imageOutput: false, audioOutput: false, videoOutput: false },
+ // ===========================================================================
+ // Mistral AI (January 2026)
+ // ===========================================================================
+ // Large models (Mistral Large 3 has vision)
+ 'mistral-large-2512': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'mistral-large-latest': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // Medium models (vision capable)
+ 'mistral-medium-3.1': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'mistral-medium-latest': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // Small models (vision capable)
+ 'mistral-small-3.2': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'mistral-small-latest': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // Ministral (vision capable)
+ 'ministral-3b-2512': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'ministral-8b-2512': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'ministral-14b-2512': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // Code models
+ 'codestral-2501': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'codestral-latest': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // Vision models (Pixtral)
+ 'pixtral-large-2411': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'pixtral-large-latest': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // Audio models (Voxtral)
+ 'voxtral-small': { visionInput: false, audioInput: true, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'voxtral-mini': { visionInput: false, audioInput: true, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // Document AI
+ 'mistral-ocr-2512': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // ===========================================================================
+ // Cohere (January 2026)
+ // ===========================================================================
+ // Command A family
+ 'command-a-03-2025': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'command-a-reasoning': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'command-a-vision': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // Command R family
+ 'command-r-plus-08-2024': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'command-r-08-2024': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'command-r-plus': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'command-r': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // ===========================================================================
+ // Groq (January 2026)
+ // ===========================================================================
+ 'llama-3.3-70b-versatile': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'llama-3.1-8b-instant': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'openai/gpt-oss-120b': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'openai/gpt-oss-20b': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'groq/compound': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'groq/compound-mini': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'meta-llama/llama-guard-4-12b': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'whisper-large-v3': { visionInput: false, audioInput: true, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'whisper-large-v3-turbo': { visionInput: false, audioInput: true, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // ===========================================================================
+ // xAI Grok (January 2026)
+ // ===========================================================================
+ 'grok-4': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'grok-4.1-fast': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'grok-3': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'grok-3-mini': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'grok-3-vision': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'grok-2': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'grok-2-vision': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // ===========================================================================
+ // DeepSeek (January 2026 - V3.2)
+ // ===========================================================================
+ 'deepseek-chat': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'deepseek-reasoner': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // ===========================================================================
+ // Perplexity (January 2026 - Sonar family)
+ // ===========================================================================
+ 'sonar': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'sonar-pro': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'sonar-reasoning': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'sonar-reasoning-pro': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'sonar-deep-research': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ // ===========================================================================
+ // LM Studio / Local Models (common vision models)
+ // ===========================================================================
+ 'llava-v1.6-mistral-7b': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'llava-v1.6-vicuna-13b': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'qwen2-vl-7b-instruct': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'phi-3-vision-128k-instruct': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'minicpm-v-2_6': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'moondream2': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'internvl2-8b': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'llama-3.2-11b-vision': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ 'pixtral-12b': { visionInput: true, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+ };
+ /**
+ * Get capabilities for a model.
+ * Returns undefined for each capability if model is not in the map (unknown).
+ */
+ function getModelCapabilities(model) {
+ return exports.MODEL_CAPABILITIES[model] ?? {};
+ }
+ /**
+ * Check if a model has a specific input capability.
+ * Returns undefined if unknown, true/false if known.
+ */
+ function hasInputCapability(model, capability) {
+ const caps = exports.MODEL_CAPABILITIES[model];
+ if (!caps)
+ return undefined;
+ switch (capability) {
+ case 'vision': return caps.visionInput;
+ case 'audio': return caps.audioInput;
+ case 'video': return caps.videoInput;
+ }
+ }
+ /**
+ * Check if a model has a specific output capability.
+ * Returns undefined if unknown, true/false if known.
+ */
+ function hasOutputCapability(model, capability) {
+ const caps = exports.MODEL_CAPABILITIES[model];
+ if (!caps)
+ return undefined;
+ switch (capability) {
+ case 'image': return caps.imageOutput;
+ case 'audio': return caps.audioOutput;
+ case 'video': return caps.videoOutput;
+ }
+ }
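
Note the tri-state contract here: the helpers return true or false for models in the map and undefined for everything else, so callers can distinguish "known unsupported" from "unknown". A short TypeScript sketch; the attachment-gating policy is illustrative, not part of the package:

    import { getModelCapabilities, hasInputCapability } from '@sudobility/shapeshyft_types';

    hasInputCapability('claude-sonnet-4-5-20251124', 'vision'); // true
    hasInputCapability('deepseek-chat', 'audio');               // false
    hasInputCapability('my-local-model', 'vision');             // undefined

    // Only hard-disable attachments when support is known-false; for unknown
    // models (e.g., custom llm_server entries) leave the option enabled.
    const disableImages = hasInputCapability('deepseek-chat', 'vision') === false;

    getModelCapabilities('not-a-model'); // {} (every field reads as undefined)
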
 /**
 * Cost estimation per 1M tokens (in cents)
- * Prices sourced from official provider pricing pages as of Jan 2025
+ * Prices sourced from official provider pricing pages as of January 2026
 */
 exports.COST_PER_MILLION_TOKENS = {
 // ==========================================================================
- // OpenAI (https://openai.com/pricing)
+ // OpenAI (https://openai.com/pricing) - January 2026
+ // Images: counted as tokens (~765 tokens per 512x512 image)
+ // Audio: Realtime API pricing
 // ==========================================================================
- 'gpt-4o': { input: 250, output: 1000 },
- 'gpt-4o-mini': { input: 15, output: 60 },
+ // GPT-4.1 family (latest non-reasoning)
+ 'gpt-4.1': { input: 200, output: 800 },
+ 'gpt-4.1-mini': { input: 40, output: 160 },
+ 'gpt-4.1-nano': { input: 10, output: 40 },
+ // GPT-4o (omni - multimodal)
+ 'gpt-4o': {
+ input: 250, output: 1000,
+ audioInput: 600, // ~$6.00 per minute (Realtime API)
+ audioOutput: 1200, // ~$12.00 per minute (Realtime API)
+ },
+ 'gpt-4o-mini': {
+ input: 15, output: 60,
+ audioInput: 60, // ~$0.60 per minute (Realtime API)
+ audioOutput: 120, // ~$1.20 per minute (Realtime API)
+ },
+ // Reasoning models (o-series)
+ 'o3': { input: 1000, output: 4000 },
+ 'o3-pro': { input: 15000, output: 60000 },
+ 'o4-mini': { input: 150, output: 600 },
+ // Legacy
 'gpt-4-turbo': { input: 1000, output: 3000 },
- 'gpt-3.5-turbo': { input: 50, output: 150 },
 'o1': { input: 1500, output: 6000 },
- 'o1-mini': { input: 300, output: 1200 },
- 'o1-pro': { input: 15000, output: 60000 },
 // ==========================================================================
- // Anthropic (https://anthropic.com/pricing)
+ // Anthropic (https://anthropic.com/pricing) - January 2026
 // ==========================================================================
+ // Claude 4.5
+ 'claude-opus-4-5-20251124': { input: 2000, output: 10000 },
+ 'claude-sonnet-4-5-20251124': { input: 400, output: 2000 },
+ // Claude 4.1
+ 'claude-opus-4-1-20250805': { input: 1800, output: 9000 },
+ // Claude 4
 'claude-sonnet-4-20250514': { input: 300, output: 1500 },
 'claude-opus-4-20250514': { input: 1500, output: 7500 },
+ // Claude 3.5
 'claude-3-5-haiku-20241022': { input: 80, output: 400 },
- // Legacy model names (for backwards compatibility)
- 'claude-3-5-sonnet-20241022': { input: 300, output: 1500 },
- 'claude-3-opus-20240229': { input: 1500, output: 7500 },
- 'claude-3-haiku-20240307': { input: 25, output: 125 },
 // ==========================================================================
- // Google Gemini (https://ai.google.dev/pricing)
+ // Google Gemini (https://ai.google.dev/pricing) - January 2026
+ // Images: ~258 tokens/image, Audio: ~32 tokens/sec, Video: ~263 tokens/sec
 // ==========================================================================
- 'gemini-2.0-flash': { input: 10, output: 40 },
+ // Gemini 3 (latest)
+ 'gemini-3-pro-preview': { input: 175, output: 700 },
+ 'gemini-3-flash-preview': { input: 15, output: 60 },
+ 'gemini-3-pro-image-preview': {
+ input: 175, output: 700,
+ imageOutput: 8, // ~$0.08 per generated image
+ },
+ // Gemini 2.5
+ 'gemini-2.5-pro': { input: 125, output: 500 },
+ 'gemini-2.5-flash': { input: 7.5, output: 30 },
+ 'gemini-2.5-flash-lite': { input: 3.75, output: 15 },
+ 'gemini-2.5-flash-image': {
+ input: 10, output: 40,
+ imageOutput: 4, // ~$0.04 per generated image
+ },
+ 'gemini-2.5-flash-native-audio-preview': {
+ input: 10, output: 40,
+ audioInput: 10, // ~$0.10 per minute audio input
+ audioOutput: 60, // ~$0.60 per minute audio output
+ },
+ // Gemini 2.0
+ 'gemini-2.0-flash': {
+ input: 10, output: 40,
+ imageOutput: 4, // ~$0.04 per generated image
+ audioOutput: 60, // ~$0.60 per minute of audio output
+ },
 'gemini-2.0-flash-lite': { input: 5, output: 20 },
- 'gemini-1.5-pro': { input: 125, output: 500 },
- 'gemini-1.5-flash': { input: 7.5, output: 30 },
 // ==========================================================================
- // Mistral AI (https://mistral.ai/technology/#pricing)
+ // Mistral AI (https://mistral.ai/technology/#pricing) - January 2026
 // ==========================================================================
+ // Large models (Mistral Large 3)
+ 'mistral-large-2512': { input: 200, output: 600 },
 'mistral-large-latest': { input: 200, output: 600 },
- 'mistral-medium-latest': { input: 270, output: 810 },
+ // Medium models
+ 'mistral-medium-3.1': { input: 100, output: 300 },
+ 'mistral-medium-latest': { input: 100, output: 300 },
+ // Small models
+ 'mistral-small-3.2': { input: 20, output: 60 },
 'mistral-small-latest': { input: 10, output: 30 },
+ // Ministral family (small, efficient)
+ 'ministral-3b-2512': { input: 4, output: 12 },
+ 'ministral-8b-2512': { input: 10, output: 30 },
+ 'ministral-14b-2512': { input: 15, output: 45 },
+ // Code models
+ 'codestral-2501': { input: 30, output: 90 },
 'codestral-latest': { input: 30, output: 90 },
- 'mistral-nemo': { input: 15, output: 15 },
+ // Vision models (Pixtral)
+ 'pixtral-large-2411': { input: 200, output: 600 },
+ 'pixtral-large-latest': { input: 200, output: 600 },
+ // Audio models (Voxtral)
+ 'voxtral-small': { input: 20, output: 60, audioInput: 15 },
+ 'voxtral-mini': { input: 10, output: 30, audioInput: 8 },
+ // Document AI
+ 'mistral-ocr-2512': { input: 15, output: 45 },
 // ==========================================================================
- // Cohere (https://cohere.com/pricing)
+ // Cohere (https://cohere.com/pricing) - January 2026
 // ==========================================================================
+ // Command A family (latest)
+ 'command-a-03-2025': { input: 250, output: 1000 },
+ 'command-a-reasoning': { input: 400, output: 1600 },
+ 'command-a-vision': { input: 300, output: 1200 },
+ // Command R family
+ 'command-r-plus-08-2024': { input: 250, output: 1000 },
+ 'command-r-08-2024': { input: 15, output: 60 },
 'command-r-plus': { input: 250, output: 1000 },
 'command-r': { input: 15, output: 60 },
- 'command': { input: 100, output: 200 },
- 'command-light': { input: 30, output: 60 },
 // ==========================================================================
- // Groq (https://groq.com/pricing) - Fast inference, competitive pricing
+ // Groq (https://groq.com/pricing) - Fast inference, January 2026
 // ==========================================================================
+ // Llama models
 'llama-3.3-70b-versatile': { input: 59, output: 79 },
 'llama-3.1-8b-instant': { input: 5, output: 8 },
- 'mixtral-8x7b-32768': { input: 24, output: 24 },
- 'gemma2-9b-it': { input: 20, output: 20 },
+ // GPT OSS models
+ 'openai/gpt-oss-120b': { input: 150, output: 200 },
+ 'openai/gpt-oss-20b': { input: 30, output: 40 },
+ // Compound (agentic)
+ 'groq/compound': { input: 100, output: 150 },
+ 'groq/compound-mini': { input: 30, output: 50 },
+ // Safety
+ 'meta-llama/llama-guard-4-12b': { input: 20, output: 20 },
+ // Audio (Whisper - speech-to-text, per minute)
+ 'whisper-large-v3': { input: 11, output: 0, audioInput: 11 },
+ 'whisper-large-v3-turbo': { input: 4, output: 0, audioInput: 4 },
 // ==========================================================================
- // xAI Grok (https://x.ai/api)
+ // xAI Grok (https://x.ai/api) - January 2026
 // ==========================================================================
+ // Grok 4 (latest)
+ 'grok-4': { input: 500, output: 2000 },
+ 'grok-4.1-fast': { input: 100, output: 400 },
+ // Grok 3
+ 'grok-3': { input: 300, output: 1200 },
+ 'grok-3-mini': { input: 30, output: 120 },
+ 'grok-3-vision': { input: 350, output: 1400 },
+ // Grok 2 (legacy)
 'grok-2': { input: 200, output: 1000 },
- 'grok-2-mini': { input: 20, output: 100 },
+ 'grok-2-vision': { input: 200, output: 1000 },
 // ==========================================================================
- // DeepSeek (https://platform.deepseek.com/api-docs/pricing)
+ // DeepSeek (https://platform.deepseek.com/api-docs/pricing) - January 2026
+ // V3.2 pricing (very competitive)
 // ==========================================================================
 'deepseek-chat': { input: 14, output: 28 },
- 'deepseek-coder': { input: 14, output: 28 },
 'deepseek-reasoner': { input: 55, output: 219 },
 // ==========================================================================
- // Perplexity (https://docs.perplexity.ai/guides/pricing)
+ // Perplexity (https://docs.perplexity.ai/guides/pricing) - January 2026
+ // Sonar family (includes search costs)
 // ==========================================================================
- 'llama-3.1-sonar-small-128k-online': { input: 20, output: 20 },
- 'llama-3.1-sonar-large-128k-online': { input: 100, output: 100 },
- 'llama-3.1-sonar-huge-128k-online': { input: 500, output: 500 },
+ 'sonar': { input: 100, output: 100 },
+ 'sonar-pro': { input: 300, output: 300 },
+ 'sonar-reasoning': { input: 500, output: 500 },
+ 'sonar-reasoning-pro': { input: 800, output: 800 },
+ 'sonar-deep-research': { input: 1200, output: 1200 },
 // ==========================================================================
- // LLM Server (custom) - Default/estimated pricing
+ // LLM Server (custom) - Default/estimated pricing for local models
 // ==========================================================================
+ // Text models
 'qwen/qwen3-30b-a3b-2507': { input: 50, output: 100 },
 'meta-llama-3.1-8b-instruct': { input: 20, output: 40 },
 'qwen-32b-everything': { input: 50, output: 100 },
- 'openai/gpt-oss-20b': { input: 30, output: 60 },
+ // Vision models (LM Studio / local) - estimated based on model size
+ 'llava-v1.6-mistral-7b': { input: 25, output: 50 },
+ 'llava-v1.6-vicuna-13b': { input: 40, output: 80 },
+ 'qwen2-vl-7b-instruct': { input: 25, output: 50 },
+ 'phi-3-vision-128k-instruct': { input: 20, output: 40 },
+ 'minicpm-v-2_6': { input: 15, output: 30 },
+ 'moondream2': { input: 10, output: 20 },
+ 'internvl2-8b': { input: 25, output: 50 },
+ 'llama-3.2-11b-vision': { input: 30, output: 60 },
+ 'pixtral-12b': { input: 35, output: 70 },
 // ==========================================================================
 // Default for unknown models
 // ==========================================================================
@@ -156,7 +541,7 @@ function getModelPricing(model) {
 return exports.COST_PER_MILLION_TOKENS[model] ?? DEFAULT_MODEL_PRICING;
 }
 /**
- * Estimate cost in cents for token usage
+ * Estimate cost in cents for token usage (text only, for backwards compatibility)
 */
 function estimateCost(model, inputTokens, outputTokens) {
 const costs = getModelPricing(model);
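
A worked example of the text-only path, using the gpt-4.1-mini rates above (40 cents in / 160 cents out per million tokens):

    import { estimateCost } from '@sudobility/shapeshyft_types';

    // input:  (10_000 / 1_000_000) * 40  = 0.40 cents
    // output: ( 2_000 / 1_000_000) * 160 = 0.32 cents
    estimateCost('gpt-4.1-mini', 10_000, 2_000); // 0.72 (cents)
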
@@ -164,6 +549,42 @@ function estimateCost(model, inputTokens, outputTokens) {
 const outputCost = (outputTokens / 1000000) * costs.output;
 return Math.round((inputCost + outputCost) * 100) / 100; // Round to 2 decimal places
 }
+ /**
+ * Estimate cost in cents for multimodal usage
+ */
+ function estimateMultimodalCost(model, usage) {
+ const pricing = getModelPricing(model);
+ let totalCost = 0;
+ // Text token costs
+ if (usage.inputTokens) {
+ totalCost += (usage.inputTokens / 1000000) * pricing.input;
+ }
+ if (usage.outputTokens) {
+ totalCost += (usage.outputTokens / 1000000) * pricing.output;
+ }
+ // Image costs
+ if (usage.imagesInput && pricing.imageInput) {
+ totalCost += usage.imagesInput * pricing.imageInput;
+ }
+ if (usage.imagesOutput && pricing.imageOutput) {
+ totalCost += usage.imagesOutput * pricing.imageOutput;
+ }
+ // Audio costs
+ if (usage.audioInputMinutes && pricing.audioInput) {
+ totalCost += usage.audioInputMinutes * pricing.audioInput;
+ }
+ if (usage.audioOutputMinutes && pricing.audioOutput) {
+ totalCost += usage.audioOutputMinutes * pricing.audioOutput;
+ }
+ // Video costs
+ if (usage.videoInputMinutes && pricing.videoInput) {
+ totalCost += usage.videoInputMinutes * pricing.videoInput;
+ }
+ if (usage.videoOutputMinutes && pricing.videoOutput) {
+ totalCost += usage.videoOutputMinutes * pricing.videoOutput;
+ }
+ return Math.round(totalCost * 100) / 100; // Round to 2 decimal places
+ }
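
And a worked multimodal example against the gemini-2.0-flash entry above; note the per-image and per-minute fields are charged per unit, not per million:

    import { estimateMultimodalCost } from '@sudobility/shapeshyft_types';

    // text:   (50_000 / 1_000_000) * 10 = 0.5 cents in; (5_000 / 1_000_000) * 40 = 0.2 cents out
    // images: 2 generated * 4 cents    = 8 cents
    // audio:  1.5 minutes out * 60     = 90 cents
    estimateMultimodalCost('gemini-2.0-flash', {
      inputTokens: 50_000,
      outputTokens: 5_000,
      imagesOutput: 2,
      audioOutputMinutes: 1.5,
    }); // 98.7 (cents)
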
 /**
 * Format cost in cents to a readable string (e.g., "$0.0015" or "$1.50")
 */