@sudobility/shapeshyft_types 1.0.21 → 1.0.23

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/dist/index.cjs CHANGED
@@ -4,9 +4,17 @@
   * TypeScript types for ShapeShyft API - LLM structured output platform
   */
  Object.defineProperty(exports, "__esModule", { value: true });
- exports.COST_PER_MILLION_TOKENS = exports.PROVIDER_ALLOWS_CUSTOM_MODEL = exports.DEFAULT_PROVIDER_MODEL = exports.PROVIDER_MODELS = exports.LLM_PROVIDERS = void 0;
+ exports.COST_PER_MILLION_TOKENS = exports.MODEL_CAPABILITIES = exports.PROVIDER_ALLOWS_CUSTOM_MODEL = exports.DEFAULT_PROVIDER_MODEL = exports.PROVIDER_MODELS = exports.LLM_PROVIDERS = void 0;
+ exports.getModelCapabilities = getModelCapabilities;
+ exports.hasInputCapability = hasInputCapability;
+ exports.hasOutputCapability = hasOutputCapability;
+ exports.getMediaFormats = getMediaFormats;
+ exports.supportsMediaFormat = supportsMediaFormat;
+ exports.getDefaultMediaFormat = getDefaultMediaFormat;
+ exports.supportsMediaUrl = supportsMediaUrl;
  exports.getModelPricing = getModelPricing;
  exports.estimateCost = estimateCost;
+ exports.estimateMultimodalCost = estimateMultimodalCost;
  exports.formatCost = formatCost;
  exports.formatCostPerMillion = formatCostPerMillion;
  exports.successResponse = successResponse;
@@ -24,30 +32,75 @@ exports.LLM_PROVIDERS = [
      'perplexity',
      'llm_server',
  ];
- /** Models available for each provider */
+ /** Models available for each provider (January 2026) */
  exports.PROVIDER_MODELS = {
-     openai: ['gpt-4o', 'gpt-4o-mini', 'gpt-4-turbo', 'gpt-3.5-turbo', 'o1', 'o1-mini', 'o1-pro'],
-     anthropic: ['claude-sonnet-4-20250514', 'claude-opus-4-20250514', 'claude-3-5-haiku-20241022'],
-     gemini: ['gemini-2.0-flash', 'gemini-2.0-flash-lite', 'gemini-1.5-pro', 'gemini-1.5-flash'],
-     mistral: ['mistral-large-latest', 'mistral-medium-latest', 'mistral-small-latest', 'codestral-latest', 'mistral-nemo'],
-     cohere: ['command-r-plus', 'command-r', 'command', 'command-light'],
-     groq: ['llama-3.3-70b-versatile', 'llama-3.1-8b-instant', 'mixtral-8x7b-32768', 'gemma2-9b-it'],
-     xai: ['grok-2', 'grok-2-mini'],
-     deepseek: ['deepseek-chat', 'deepseek-coder', 'deepseek-reasoner'],
-     perplexity: ['llama-3.1-sonar-small-128k-online', 'llama-3.1-sonar-large-128k-online', 'llama-3.1-sonar-huge-128k-online'],
-     llm_server: ['qwen/qwen3-30b-a3b-2507', 'meta-llama-3.1-8b-instruct', 'qwen-32b-everything', 'openai/gpt-oss-20b'],
+     openai: [
+         'gpt-4.1', 'gpt-4.1-mini', 'gpt-4.1-nano',
+         'gpt-4o', 'gpt-4o-mini',
+         'o3', 'o3-pro', 'o4-mini',
+         'gpt-4-turbo', 'o1',
+     ],
+     anthropic: [
+         'claude-opus-4-5-20251124', 'claude-sonnet-4-5-20251124',
+         'claude-opus-4-1-20250805',
+         'claude-sonnet-4-20250514', 'claude-opus-4-20250514',
+         'claude-3-5-haiku-20241022',
+     ],
+     gemini: [
+         'gemini-3-pro-preview', 'gemini-3-flash-preview', 'gemini-3-pro-image-preview',
+         'gemini-2.5-pro', 'gemini-2.5-flash', 'gemini-2.5-flash-lite', 'gemini-2.5-flash-image', 'gemini-2.5-flash-native-audio-preview',
+         'gemini-2.0-flash', 'gemini-2.0-flash-lite',
+     ],
+     mistral: [
+         'mistral-large-2512', 'mistral-large-latest',
+         'mistral-medium-3.1', 'mistral-medium-latest',
+         'mistral-small-3.2', 'mistral-small-latest',
+         'ministral-3b-2512', 'ministral-8b-2512', 'ministral-14b-2512',
+         'codestral-2501', 'codestral-latest',
+         'pixtral-large-2411', 'pixtral-large-latest',
+         'voxtral-small', 'voxtral-mini',
+         'mistral-ocr-2512',
+     ],
+     cohere: [
+         'command-a-03-2025', 'command-a-reasoning', 'command-a-vision',
+         'command-r-plus-08-2024', 'command-r-08-2024',
+         'command-r-plus', 'command-r',
+     ],
+     groq: [
+         'llama-3.3-70b-versatile', 'llama-3.1-8b-instant',
+         'openai/gpt-oss-120b', 'openai/gpt-oss-20b',
+         'groq/compound', 'groq/compound-mini',
+         'meta-llama/llama-guard-4-12b',
+         'whisper-large-v3', 'whisper-large-v3-turbo',
+     ],
+     xai: [
+         'grok-4', 'grok-4.1-fast',
+         'grok-3', 'grok-3-mini', 'grok-3-vision',
+         'grok-2', 'grok-2-vision',
+     ],
+     deepseek: ['deepseek-chat', 'deepseek-reasoner'],
+     perplexity: [
+         'sonar', 'sonar-pro',
+         'sonar-reasoning', 'sonar-reasoning-pro',
+         'sonar-deep-research',
+     ],
+     llm_server: [
+         'qwen/qwen3-30b-a3b-2507', 'meta-llama-3.1-8b-instruct', 'qwen-32b-everything', 'openai/gpt-oss-20b',
+         'llava-v1.6-mistral-7b', 'llava-v1.6-vicuna-13b', 'qwen2-vl-7b-instruct', 'phi-3-vision-128k-instruct',
+         'minicpm-v-2_6', 'moondream2', 'internvl2-8b', 'llama-3.2-11b-vision', 'pixtral-12b',
+     ],
  };
- /** Default model for each provider */
+ /** Default model for each provider (January 2026) */
  exports.DEFAULT_PROVIDER_MODEL = {
-     openai: 'gpt-4o-mini',
-     anthropic: 'claude-sonnet-4-20250514',
-     gemini: 'gemini-2.0-flash',
+     openai: 'gpt-4.1-mini',
+     anthropic: 'claude-sonnet-4-5-20251124',
+     gemini: 'gemini-2.5-flash',
      mistral: 'mistral-small-latest',
-     cohere: 'command-r',
+     cohere: 'command-r-08-2024',
      groq: 'llama-3.3-70b-versatile',
-     xai: 'grok-2-mini',
+     xai: 'grok-3-mini',
      deepseek: 'deepseek-chat',
-     perplexity: 'llama-3.1-sonar-small-128k-online',
+     perplexity: 'sonar',
      llm_server: 'meta-llama-3.1-8b-instruct',
  };
  /** Providers that allow custom model input (user can type any model name) */
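
Since the catalogs above are plain data, a consumer can drive a provider/model picker directly from them. A minimal sketch, assuming the package's TypeScript entry point exposes the same named exports as this CJS build (the `buildPickerState` helper is hypothetical, not part of the package):

    import {
      LLM_PROVIDERS,
      PROVIDER_MODELS,
      DEFAULT_PROVIDER_MODEL,
      PROVIDER_ALLOWS_CUSTOM_MODEL,
    } from '@sudobility/shapeshyft_types';

    // Hypothetical helper: one entry per provider for a settings UI.
    function buildPickerState() {
      return LLM_PROVIDERS.map((provider) => ({
        provider,
        models: PROVIDER_MODELS[provider],                    // dropdown options
        selected: DEFAULT_PROVIDER_MODEL[provider],           // preselected default
        allowCustom: PROVIDER_ALLOWS_CUSTOM_MODEL[provider],  // show a free-text input?
      }));
    }
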
@@ -63,84 +116,679 @@ exports.PROVIDER_ALLOWS_CUSTOM_MODEL = {
      perplexity: false,
      llm_server: true, // Users can type any model name for custom LLM servers
  };
+ /**
+  * Model capabilities map (January 2026).
+  * Maps model names to their multimodal capabilities.
+  * Models not in this map have undefined capabilities.
+  */
+ exports.MODEL_CAPABILITIES = {
+     // ===========================================================================
+     // OpenAI (January 2026)
+     // OpenAI supports URL and base64 for images
+     // ===========================================================================
+     // GPT-4.1 family
+     'gpt-4.1': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'gpt-4.1-mini': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'gpt-4.1-nano': {
+         visionInput: false, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+     },
+     // GPT-4o (omni - multimodal)
+     'gpt-4o': {
+         visionInput: true, audioInput: true, videoInput: false,
+         imageOutput: false, audioOutput: true, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'], audioFormats: ['base64', 'file'] },
+     },
+     'gpt-4o-mini': {
+         visionInput: true, audioInput: true, videoInput: false,
+         imageOutput: false, audioOutput: true, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'], audioFormats: ['base64', 'file'] },
+     },
+     // Reasoning models (o-series)
+     'o3': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'o3-pro': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'o4-mini': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     // Legacy
+     'gpt-4-turbo': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'o1': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     // ===========================================================================
+     // Anthropic (January 2026)
+     // Anthropic supports URL and base64 for images
+     // ===========================================================================
+     // Claude 4.5
+     'claude-opus-4-5-20251124': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'claude-sonnet-4-5-20251124': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     // Claude 4.1
+     'claude-opus-4-1-20250805': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     // Claude 4
+     'claude-sonnet-4-20250514': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'claude-opus-4-20250514': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     // Claude 3.5
+     'claude-3-5-haiku-20241022': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     // ===========================================================================
+     // Google Gemini (January 2026)
+     // Gemini supports URL, base64, and GCS URIs for all media types
+     // ===========================================================================
+     // Gemini 3 (latest)
+     'gemini-3-pro-preview': {
+         visionInput: true, audioInput: true, videoInput: true,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: {
+             imageFormats: ['url', 'base64', 'gcs'],
+             audioFormats: ['url', 'base64', 'gcs'],
+             videoFormats: ['url', 'gcs'],
+         },
+     },
+     'gemini-3-flash-preview': {
+         visionInput: true, audioInput: true, videoInput: true,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: {
+             imageFormats: ['url', 'base64', 'gcs'],
+             audioFormats: ['url', 'base64', 'gcs'],
+             videoFormats: ['url', 'gcs'],
+         },
+     },
+     'gemini-3-pro-image-preview': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: true, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64', 'gcs'] },
+     },
+     // Gemini 2.5
+     'gemini-2.5-pro': {
+         visionInput: true, audioInput: true, videoInput: true,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: {
+             imageFormats: ['url', 'base64', 'gcs'],
+             audioFormats: ['url', 'base64', 'gcs'],
+             videoFormats: ['url', 'gcs'],
+         },
+     },
+     'gemini-2.5-flash': {
+         visionInput: true, audioInput: true, videoInput: true,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: {
+             imageFormats: ['url', 'base64', 'gcs'],
+             audioFormats: ['url', 'base64', 'gcs'],
+             videoFormats: ['url', 'gcs'],
+         },
+     },
+     'gemini-2.5-flash-lite': {
+         visionInput: true, audioInput: true, videoInput: true,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: {
+             imageFormats: ['url', 'base64', 'gcs'],
+             audioFormats: ['url', 'base64', 'gcs'],
+             videoFormats: ['url', 'gcs'],
+         },
+     },
+     'gemini-2.5-flash-image': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: true, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64', 'gcs'] },
+     },
+     'gemini-2.5-flash-native-audio-preview': {
+         visionInput: true, audioInput: true, videoInput: true,
+         imageOutput: false, audioOutput: true, videoOutput: false,
+         mediaFormats: {
+             imageFormats: ['url', 'base64', 'gcs'],
+             audioFormats: ['url', 'base64', 'gcs'],
+             videoFormats: ['url', 'gcs'],
+         },
+     },
+     // Gemini 2.0
+     'gemini-2.0-flash': {
+         visionInput: true, audioInput: true, videoInput: true,
+         imageOutput: true, audioOutput: true, videoOutput: false,
+         mediaFormats: {
+             imageFormats: ['url', 'base64', 'gcs'],
+             audioFormats: ['url', 'base64', 'gcs'],
+             videoFormats: ['url', 'gcs'],
+         },
+     },
+     'gemini-2.0-flash-lite': {
+         visionInput: true, audioInput: true, videoInput: true,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: {
+             imageFormats: ['url', 'base64', 'gcs'],
+             audioFormats: ['url', 'base64', 'gcs'],
+             videoFormats: ['url', 'gcs'],
+         },
+     },
+     // ===========================================================================
+     // Mistral AI (January 2026)
+     // Mistral supports URL and base64 for images
+     // ===========================================================================
+     // Large models (Mistral Large 3 has vision)
+     'mistral-large-2512': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'mistral-large-latest': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     // Medium models (vision capable)
+     'mistral-medium-3.1': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'mistral-medium-latest': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     // Small models (vision capable)
+     'mistral-small-3.2': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'mistral-small-latest': {
+         visionInput: false, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+     },
+     // Ministral (vision capable)
+     'ministral-3b-2512': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'ministral-8b-2512': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'ministral-14b-2512': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     // Code models
+     'codestral-2501': {
+         visionInput: false, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+     },
+     'codestral-latest': {
+         visionInput: false, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+     },
+     // Vision models (Pixtral)
+     'pixtral-large-2411': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'pixtral-large-latest': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     // Audio models (Voxtral)
+     'voxtral-small': {
+         visionInput: false, audioInput: true, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { audioFormats: ['base64', 'file'] },
+     },
+     'voxtral-mini': {
+         visionInput: false, audioInput: true, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { audioFormats: ['base64', 'file'] },
+     },
+     // Document AI
+     'mistral-ocr-2512': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     // ===========================================================================
+     // Cohere (January 2026)
+     // ===========================================================================
+     // Command A family
+     'command-a-03-2025': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'command-a-reasoning': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'command-a-vision': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['base64'] },
+     },
+     // Command R family
+     'command-r-plus-08-2024': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'command-r-08-2024': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'command-r-plus': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'command-r': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     // ===========================================================================
+     // Groq (January 2026)
+     // ===========================================================================
+     'llama-3.3-70b-versatile': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'llama-3.1-8b-instant': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'openai/gpt-oss-120b': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'openai/gpt-oss-20b': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'groq/compound': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'groq/compound-mini': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'meta-llama/llama-guard-4-12b': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['base64'] },
+     },
+     'whisper-large-v3': {
+         visionInput: false, audioInput: true, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { audioFormats: ['file'] },
+     },
+     'whisper-large-v3-turbo': {
+         visionInput: false, audioInput: true, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { audioFormats: ['file'] },
+     },
+     // ===========================================================================
+     // xAI Grok (January 2026)
+     // ===========================================================================
+     'grok-4': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'grok-4.1-fast': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'grok-3': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'grok-3-mini': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'grok-3-vision': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     'grok-2': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'grok-2-vision': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['url', 'base64'] },
+     },
+     // ===========================================================================
+     // DeepSeek (January 2026 - V3.2)
+     // ===========================================================================
+     'deepseek-chat': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'deepseek-reasoner': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     // ===========================================================================
+     // Perplexity (January 2026 - Sonar family)
+     // ===========================================================================
+     'sonar': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'sonar-pro': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'sonar-reasoning': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'sonar-reasoning-pro': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     'sonar-deep-research': { visionInput: false, audioInput: false, videoInput: false, imageOutput: false, audioOutput: false, videoOutput: false },
+     // ===========================================================================
+     // LM Studio / Local Models (common vision models)
+     // Local models typically only support base64 as they don't have internet access
+     // ===========================================================================
+     'llava-v1.6-mistral-7b': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['base64'] },
+     },
+     'llava-v1.6-vicuna-13b': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['base64'] },
+     },
+     'qwen2-vl-7b-instruct': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['base64'] },
+     },
+     'phi-3-vision-128k-instruct': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['base64'] },
+     },
+     'minicpm-v-2_6': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['base64'] },
+     },
+     'moondream2': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['base64'] },
+     },
+     'internvl2-8b': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['base64'] },
+     },
+     'llama-3.2-11b-vision': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['base64'] },
+     },
+     'pixtral-12b': {
+         visionInput: true, audioInput: false, videoInput: false,
+         imageOutput: false, audioOutput: false, videoOutput: false,
+         mediaFormats: { imageFormats: ['base64'] },
+     },
+ };
+ /**
+  * Get capabilities for a model.
+  * Returns undefined for each capability if model is not in the map (unknown).
+  */
+ function getModelCapabilities(model) {
+     return exports.MODEL_CAPABILITIES[model] ?? {};
+ }
+ /**
+  * Check if a model has a specific input capability.
+  * Returns undefined if unknown, true/false if known.
+  */
+ function hasInputCapability(model, capability) {
+     const caps = exports.MODEL_CAPABILITIES[model];
+     if (!caps)
+         return undefined;
+     switch (capability) {
+         case 'vision': return caps.visionInput;
+         case 'audio': return caps.audioInput;
+         case 'video': return caps.videoInput;
+     }
+ }
+ /**
+  * Check if a model has a specific output capability.
+  * Returns undefined if unknown, true/false if known.
+  */
+ function hasOutputCapability(model, capability) {
+     const caps = exports.MODEL_CAPABILITIES[model];
+     if (!caps)
+         return undefined;
+     switch (capability) {
+         case 'image': return caps.imageOutput;
+         case 'audio': return caps.audioOutput;
+         case 'video': return caps.videoOutput;
+     }
+ }
+ /**
+  * Get supported media input formats for a specific media type.
+  * Returns the list of supported formats, or undefined if model is unknown.
+  * Returns empty array if model is known but doesn't support that media type.
+  */
+ function getMediaFormats(model, mediaType) {
+     const caps = exports.MODEL_CAPABILITIES[model];
+     if (!caps)
+         return undefined;
+     if (!caps.mediaFormats)
+         return [];
+     switch (mediaType) {
+         case 'image': return caps.mediaFormats.imageFormats ?? [];
+         case 'audio': return caps.mediaFormats.audioFormats ?? [];
+         case 'video': return caps.mediaFormats.videoFormats ?? [];
+     }
+ }
+ /**
+  * Check if a model supports a specific media input format.
+  * Returns undefined if model is unknown, true/false if known.
+  */
+ function supportsMediaFormat(model, mediaType, format) {
+     const formats = getMediaFormats(model, mediaType);
+     if (formats === undefined)
+         return undefined;
+     return formats.includes(format);
+ }
+ /**
+  * Get the preferred/default media input format for a model.
+  * Returns 'url' if supported, otherwise the first supported format.
+  * Returns undefined if model is unknown or doesn't support the media type.
+  */
+ function getDefaultMediaFormat(model, mediaType) {
+     const formats = getMediaFormats(model, mediaType);
+     if (!formats || formats.length === 0)
+         return undefined;
+     // Prefer URL if available (more efficient for providers)
+     if (formats.includes('url'))
+         return 'url';
+     // Otherwise return first available format
+     return formats[0];
+ }
+ /**
+  * Check if a model supports URL-based media input for a specific media type.
+  * This is a convenience function since URL support affects UI behavior.
+  */
+ function supportsMediaUrl(model, mediaType) {
+     return supportsMediaFormat(model, mediaType, 'url');
+ }
  /**
   * Cost estimation per 1M tokens (in cents)
-  * Prices sourced from official provider pricing pages as of Jan 2025
+  * Prices sourced from official provider pricing pages as of January 2026
   */
  exports.COST_PER_MILLION_TOKENS = {
      // ==========================================================================
-     // OpenAI (https://openai.com/pricing)
+     // OpenAI (https://openai.com/pricing) - January 2026
+     // Images: counted as tokens (~765 tokens per 512x512 image)
+     // Audio: Realtime API pricing
      // ==========================================================================
-     'gpt-4o': { input: 250, output: 1000 },
-     'gpt-4o-mini': { input: 15, output: 60 },
+     // GPT-4.1 family (latest non-reasoning)
+     'gpt-4.1': { input: 200, output: 800 },
+     'gpt-4.1-mini': { input: 40, output: 160 },
+     'gpt-4.1-nano': { input: 10, output: 40 },
+     // GPT-4o (omni - multimodal)
+     'gpt-4o': {
+         input: 250, output: 1000,
+         audioInput: 600, // ~$6.00 per minute (Realtime API)
+         audioOutput: 1200, // ~$12.00 per minute (Realtime API)
+     },
+     'gpt-4o-mini': {
+         input: 15, output: 60,
+         audioInput: 60, // ~$0.60 per minute (Realtime API)
+         audioOutput: 120, // ~$1.20 per minute (Realtime API)
+     },
+     // Reasoning models (o-series)
+     'o3': { input: 1000, output: 4000 },
+     'o3-pro': { input: 15000, output: 60000 },
+     'o4-mini': { input: 150, output: 600 },
+     // Legacy
      'gpt-4-turbo': { input: 1000, output: 3000 },
-     'gpt-3.5-turbo': { input: 50, output: 150 },
      'o1': { input: 1500, output: 6000 },
-     'o1-mini': { input: 300, output: 1200 },
-     'o1-pro': { input: 15000, output: 60000 },
      // ==========================================================================
-     // Anthropic (https://anthropic.com/pricing)
+     // Anthropic (https://anthropic.com/pricing) - January 2026
      // ==========================================================================
+     // Claude 4.5
+     'claude-opus-4-5-20251124': { input: 2000, output: 10000 },
+     'claude-sonnet-4-5-20251124': { input: 400, output: 2000 },
+     // Claude 4.1
+     'claude-opus-4-1-20250805': { input: 1800, output: 9000 },
+     // Claude 4
      'claude-sonnet-4-20250514': { input: 300, output: 1500 },
      'claude-opus-4-20250514': { input: 1500, output: 7500 },
+     // Claude 3.5
      'claude-3-5-haiku-20241022': { input: 80, output: 400 },
-     // Legacy model names (for backwards compatibility)
-     'claude-3-5-sonnet-20241022': { input: 300, output: 1500 },
-     'claude-3-opus-20240229': { input: 1500, output: 7500 },
-     'claude-3-haiku-20240307': { input: 25, output: 125 },
      // ==========================================================================
-     // Google Gemini (https://ai.google.dev/pricing)
+     // Google Gemini (https://ai.google.dev/pricing) - January 2026
+     // Images: ~258 tokens/image, Audio: ~32 tokens/sec, Video: ~263 tokens/sec
      // ==========================================================================
-     'gemini-2.0-flash': { input: 10, output: 40 },
+     // Gemini 3 (latest)
+     'gemini-3-pro-preview': { input: 175, output: 700 },
+     'gemini-3-flash-preview': { input: 15, output: 60 },
+     'gemini-3-pro-image-preview': {
+         input: 175, output: 700,
+         imageOutput: 8, // ~$0.08 per generated image
+     },
+     // Gemini 2.5
+     'gemini-2.5-pro': { input: 125, output: 500 },
+     'gemini-2.5-flash': { input: 7.5, output: 30 },
+     'gemini-2.5-flash-lite': { input: 3.75, output: 15 },
+     'gemini-2.5-flash-image': {
+         input: 10, output: 40,
+         imageOutput: 4, // ~$0.04 per generated image
+     },
+     'gemini-2.5-flash-native-audio-preview': {
+         input: 10, output: 40,
+         audioInput: 10, // ~$0.10 per minute audio input
+         audioOutput: 60, // ~$0.60 per minute audio output
+     },
+     // Gemini 2.0
+     'gemini-2.0-flash': {
+         input: 10, output: 40,
+         imageOutput: 4, // ~$0.04 per generated image
+         audioOutput: 60, // ~$0.60 per minute of audio output
+     },
      'gemini-2.0-flash-lite': { input: 5, output: 20 },
-     'gemini-1.5-pro': { input: 125, output: 500 },
-     'gemini-1.5-flash': { input: 7.5, output: 30 },
      // ==========================================================================
-     // Mistral AI (https://mistral.ai/technology/#pricing)
+     // Mistral AI (https://mistral.ai/technology/#pricing) - January 2026
      // ==========================================================================
+     // Large models (Mistral Large 3)
+     'mistral-large-2512': { input: 200, output: 600 },
      'mistral-large-latest': { input: 200, output: 600 },
-     'mistral-medium-latest': { input: 270, output: 810 },
+     // Medium models
+     'mistral-medium-3.1': { input: 100, output: 300 },
+     'mistral-medium-latest': { input: 100, output: 300 },
+     // Small models
+     'mistral-small-3.2': { input: 20, output: 60 },
      'mistral-small-latest': { input: 10, output: 30 },
+     // Ministral family (small, efficient)
+     'ministral-3b-2512': { input: 4, output: 12 },
+     'ministral-8b-2512': { input: 10, output: 30 },
+     'ministral-14b-2512': { input: 15, output: 45 },
+     // Code models
+     'codestral-2501': { input: 30, output: 90 },
      'codestral-latest': { input: 30, output: 90 },
-     'mistral-nemo': { input: 15, output: 15 },
+     // Vision models (Pixtral)
+     'pixtral-large-2411': { input: 200, output: 600 },
+     'pixtral-large-latest': { input: 200, output: 600 },
+     // Audio models (Voxtral)
+     'voxtral-small': { input: 20, output: 60, audioInput: 15 },
+     'voxtral-mini': { input: 10, output: 30, audioInput: 8 },
+     // Document AI
+     'mistral-ocr-2512': { input: 15, output: 45 },
      // ==========================================================================
-     // Cohere (https://cohere.com/pricing)
+     // Cohere (https://cohere.com/pricing) - January 2026
      // ==========================================================================
+     // Command A family (latest)
+     'command-a-03-2025': { input: 250, output: 1000 },
+     'command-a-reasoning': { input: 400, output: 1600 },
+     'command-a-vision': { input: 300, output: 1200 },
+     // Command R family
+     'command-r-plus-08-2024': { input: 250, output: 1000 },
+     'command-r-08-2024': { input: 15, output: 60 },
      'command-r-plus': { input: 250, output: 1000 },
      'command-r': { input: 15, output: 60 },
-     'command': { input: 100, output: 200 },
-     'command-light': { input: 30, output: 60 },
      // ==========================================================================
-     // Groq (https://groq.com/pricing) - Fast inference, competitive pricing
+     // Groq (https://groq.com/pricing) - Fast inference, January 2026
      // ==========================================================================
+     // Llama models
      'llama-3.3-70b-versatile': { input: 59, output: 79 },
      'llama-3.1-8b-instant': { input: 5, output: 8 },
-     'mixtral-8x7b-32768': { input: 24, output: 24 },
-     'gemma2-9b-it': { input: 20, output: 20 },
+     // GPT OSS models
+     'openai/gpt-oss-120b': { input: 150, output: 200 },
+     'openai/gpt-oss-20b': { input: 30, output: 40 },
+     // Compound (agentic)
+     'groq/compound': { input: 100, output: 150 },
+     'groq/compound-mini': { input: 30, output: 50 },
+     // Safety
+     'meta-llama/llama-guard-4-12b': { input: 20, output: 20 },
+     // Audio (Whisper - speech-to-text, per minute)
+     'whisper-large-v3': { input: 11, output: 0, audioInput: 11 },
+     'whisper-large-v3-turbo': { input: 4, output: 0, audioInput: 4 },
      // ==========================================================================
-     // xAI Grok (https://x.ai/api)
+     // xAI Grok (https://x.ai/api) - January 2026
      // ==========================================================================
+     // Grok 4 (latest)
+     'grok-4': { input: 500, output: 2000 },
+     'grok-4.1-fast': { input: 100, output: 400 },
+     // Grok 3
+     'grok-3': { input: 300, output: 1200 },
+     'grok-3-mini': { input: 30, output: 120 },
+     'grok-3-vision': { input: 350, output: 1400 },
+     // Grok 2 (legacy)
      'grok-2': { input: 200, output: 1000 },
-     'grok-2-mini': { input: 20, output: 100 },
+     'grok-2-vision': { input: 200, output: 1000 },
      // ==========================================================================
-     // DeepSeek (https://platform.deepseek.com/api-docs/pricing)
+     // DeepSeek (https://platform.deepseek.com/api-docs/pricing) - January 2026
+     // V3.2 pricing (very competitive)
      // ==========================================================================
      'deepseek-chat': { input: 14, output: 28 },
-     'deepseek-coder': { input: 14, output: 28 },
      'deepseek-reasoner': { input: 55, output: 219 },
      // ==========================================================================
-     // Perplexity (https://docs.perplexity.ai/guides/pricing)
+     // Perplexity (https://docs.perplexity.ai/guides/pricing) - January 2026
+     // Sonar family (includes search costs)
      // ==========================================================================
-     'llama-3.1-sonar-small-128k-online': { input: 20, output: 20 },
-     'llama-3.1-sonar-large-128k-online': { input: 100, output: 100 },
-     'llama-3.1-sonar-huge-128k-online': { input: 500, output: 500 },
+     'sonar': { input: 100, output: 100 },
+     'sonar-pro': { input: 300, output: 300 },
+     'sonar-reasoning': { input: 500, output: 500 },
+     'sonar-reasoning-pro': { input: 800, output: 800 },
+     'sonar-deep-research': { input: 1200, output: 1200 },
      // ==========================================================================
-     // LLM Server (custom) - Default/estimated pricing
+     // LLM Server (custom) - Default/estimated pricing for local models
      // ==========================================================================
+     // Text models
      'qwen/qwen3-30b-a3b-2507': { input: 50, output: 100 },
      'meta-llama-3.1-8b-instruct': { input: 20, output: 40 },
      'qwen-32b-everything': { input: 50, output: 100 },
-     'openai/gpt-oss-20b': { input: 30, output: 60 },
+     // Vision models (LM Studio / local) - estimated based on model size
+     'llava-v1.6-mistral-7b': { input: 25, output: 50 },
+     'llava-v1.6-vicuna-13b': { input: 40, output: 80 },
+     'qwen2-vl-7b-instruct': { input: 25, output: 50 },
+     'phi-3-vision-128k-instruct': { input: 20, output: 40 },
+     'minicpm-v-2_6': { input: 15, output: 30 },
+     'moondream2': { input: 10, output: 20 },
+     'internvl2-8b': { input: 25, output: 50 },
+     'llama-3.2-11b-vision': { input: 30, output: 60 },
+     'pixtral-12b': { input: 35, output: 70 },
      // ==========================================================================
      // Default for unknown models
      // ==========================================================================
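
The capability helpers added in the hunk above are deliberately tri-state: they return true or false for models listed in MODEL_CAPABILITIES and undefined for unknown models (for example, custom llm_server entries), so callers can distinguish "unsupported" from "unknown". A minimal usage sketch, assuming the package's TypeScript build exposes the same named exports as this CJS output:

    import {
      hasInputCapability,
      getDefaultMediaFormat,
      supportsMediaUrl,
    } from '@sudobility/shapeshyft_types';

    // Known models resolve to true/false; unknown models resolve to undefined.
    hasInputCapability('gpt-4.1', 'vision');          // true
    hasInputCapability('my-custom-model', 'vision');  // undefined (not in the map)

    // Pick an upload strategy per model: URL when the provider accepts it,
    // otherwise fall back to base64 (local models are listed as base64-only).
    getDefaultMediaFormat('gemini-2.5-flash', 'image');      // 'url'
    getDefaultMediaFormat('llava-v1.6-mistral-7b', 'image'); // 'base64'
    supportsMediaUrl('command-a-vision', 'image');           // false
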
@@ -156,7 +804,7 @@ function getModelPricing(model) {
      return exports.COST_PER_MILLION_TOKENS[model] ?? DEFAULT_MODEL_PRICING;
  }
  /**
-  * Estimate cost in cents for token usage
+  * Estimate cost in cents for token usage (text only, for backwards compatibility)
   */
  function estimateCost(model, inputTokens, outputTokens) {
      const costs = getModelPricing(model);
@@ -164,6 +812,42 @@ function estimateCost(model, inputTokens, outputTokens) {
      const outputCost = (outputTokens / 1000000) * costs.output;
      return Math.round((inputCost + outputCost) * 100) / 100; // Round to 2 decimal places
  }
+ /**
+  * Estimate cost in cents for multimodal usage
+  */
+ function estimateMultimodalCost(model, usage) {
+     const pricing = getModelPricing(model);
+     let totalCost = 0;
+     // Text token costs
+     if (usage.inputTokens) {
+         totalCost += (usage.inputTokens / 1000000) * pricing.input;
+     }
+     if (usage.outputTokens) {
+         totalCost += (usage.outputTokens / 1000000) * pricing.output;
+     }
+     // Image costs
+     if (usage.imagesInput && pricing.imageInput) {
+         totalCost += usage.imagesInput * pricing.imageInput;
+     }
+     if (usage.imagesOutput && pricing.imageOutput) {
+         totalCost += usage.imagesOutput * pricing.imageOutput;
+     }
+     // Audio costs
+     if (usage.audioInputMinutes && pricing.audioInput) {
+         totalCost += usage.audioInputMinutes * pricing.audioInput;
+     }
+     if (usage.audioOutputMinutes && pricing.audioOutput) {
+         totalCost += usage.audioOutputMinutes * pricing.audioOutput;
+     }
+     // Video costs
+     if (usage.videoInputMinutes && pricing.videoInput) {
+         totalCost += usage.videoInputMinutes * pricing.videoInput;
+     }
+     if (usage.videoOutputMinutes && pricing.videoOutput) {
+         totalCost += usage.videoOutputMinutes * pricing.videoOutput;
+     }
+     return Math.round(totalCost * 100) / 100; // Round to 2 decimal places
+ }
  /**
   * Format cost in cents to a readable string (e.g., "$0.0015" or "$1.50")
   */
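
All prices are expressed in cents per million tokens, plus per-minute and per-image rates for media, so the two estimators compose as follows. A minimal worked sketch, assuming the TypeScript build exposes the same named exports as this CJS output, using the gpt-4o-mini rates above (input 15, output 60, audioInput 60):

    import { estimateCost, estimateMultimodalCost } from '@sudobility/shapeshyft_types';

    // Text-only path: (10_000 / 1e6) * 15 + (2_000 / 1e6) * 60
    //               = 0.15 + 0.12 = 0.27 cents.
    const textCents = estimateCost('gpt-4o-mini', 10_000, 2_000); // 0.27

    // Multimodal path adds one minute of audio input at 60 cents/minute:
    // 0.27 + 60 = 60.27 cents.
    const totalCents = estimateMultimodalCost('gpt-4o-mini', {
      inputTokens: 10_000,
      outputTokens: 2_000,
      audioInputMinutes: 1,
    });
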