RubyGems - ruby_llm - Versions diffs - 1.9.2 → 1.10.0 - Mend

ruby_llm 1.9.2 → 1.10.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (44) hide show

checksums.yaml +4 -4
data/README.md +3 -2
data/lib/generators/ruby_llm/install/templates/create_messages_migration.rb.tt +3 -0
data/lib/generators/ruby_llm/install/templates/create_tool_calls_migration.rb.tt +1 -0
data/lib/generators/ruby_llm/upgrade_to_v1_10/templates/add_v1_10_message_columns.rb.tt +19 -0
data/lib/generators/ruby_llm/upgrade_to_v1_10/upgrade_to_v1_10_generator.rb +50 -0
data/lib/ruby_llm/active_record/acts_as_legacy.rb +5 -1
data/lib/ruby_llm/active_record/chat_methods.rb +12 -0
data/lib/ruby_llm/active_record/message_methods.rb +41 -8
data/lib/ruby_llm/aliases.json +0 -12
data/lib/ruby_llm/chat.rb +10 -7
data/lib/ruby_llm/configuration.rb +1 -1
data/lib/ruby_llm/message.rb +37 -11
data/lib/ruby_llm/models.json +1059 -857
data/lib/ruby_llm/models.rb +134 -12
data/lib/ruby_llm/provider.rb +4 -3
data/lib/ruby_llm/providers/anthropic/chat.rb +128 -13
data/lib/ruby_llm/providers/anthropic/streaming.rb +25 -1
data/lib/ruby_llm/providers/bedrock/chat.rb +58 -15
data/lib/ruby_llm/providers/bedrock/streaming/content_extraction.rb +59 -2
data/lib/ruby_llm/providers/bedrock/streaming/payload_processing.rb +5 -0
data/lib/ruby_llm/providers/gemini/chat.rb +69 -3
data/lib/ruby_llm/providers/gemini/streaming.rb +32 -1
data/lib/ruby_llm/providers/gemini/tools.rb +16 -3
data/lib/ruby_llm/providers/gpustack/chat.rb +1 -1
data/lib/ruby_llm/providers/mistral/chat.rb +58 -1
data/lib/ruby_llm/providers/ollama/chat.rb +1 -1
data/lib/ruby_llm/providers/openai/capabilities.rb +6 -2
data/lib/ruby_llm/providers/openai/chat.rb +87 -3
data/lib/ruby_llm/providers/openai/streaming.rb +11 -3
data/lib/ruby_llm/providers/openai/temperature.rb +28 -0
data/lib/ruby_llm/providers/openai.rb +1 -1
data/lib/ruby_llm/providers/openrouter/chat.rb +154 -0
data/lib/ruby_llm/providers/openrouter/streaming.rb +74 -0
data/lib/ruby_llm/providers/openrouter.rb +2 -0
data/lib/ruby_llm/providers/vertexai.rb +5 -1
data/lib/ruby_llm/stream_accumulator.rb +111 -14
data/lib/ruby_llm/streaming.rb +54 -51
data/lib/ruby_llm/thinking.rb +49 -0
data/lib/ruby_llm/tokens.rb +47 -0
data/lib/ruby_llm/tool_call.rb +6 -3
data/lib/ruby_llm/version.rb +1 -1
data/lib/tasks/models.rake +19 -12
metadata +12 -5

data/lib/ruby_llm/models.json CHANGED Viewed

@@ -1680,12 +1680,12 @@
   },
   {
     "id": "anthropic.claude-3-5-sonnet-20240620-v1:0:18k",
-    "name": "Claude 3.5 Sonnet",
+    "name": "Claude Sonnet 3.5",
     "provider": "bedrock",
-    "family": "claude3_sonnet",
-    "created_at": null,
-    "context_window": 200000,
-    "max_output_tokens": 4096,
+    "family": "claude-sonnet",
+    "created_at": "2024-06-20 00:00:00 +0200",
+    "context_window": 18000,
+    "max_output_tokens": 8192,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
@@ -1698,18 +1698,16 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 3.0,
-          "output_per_million": 15.0
-        },
-        "batch": {
-          "input_per_million": 1.5,
-          "output_per_million": 7.5
+          "input_per_million": 3,
+          "output_per_million": 15,
+          "cached_input_per_million": 0.3
         }
       }
     },
@@ -1725,17 +1723,34 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-06-20",
+      "cost": {
+        "input": 3,
+        "output": 15,
+        "cache_read": 0.3,
+        "cache_write": 3.75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 8192
+      },
+      "knowledge": "2024-04"
     }
   },
   {
     "id": "anthropic.claude-3-5-sonnet-20240620-v1:0:200k",
-    "name": "Claude 3.5 Sonnet",
+    "name": "Claude Sonnet 3.5",
     "provider": "bedrock",
-    "family": "claude3_sonnet",
-    "created_at": null,
+    "family": "claude-sonnet",
+    "created_at": "2024-06-20 00:00:00 +0200",
     "context_window": 200000,
-    "max_output_tokens": 4096,
+    "max_output_tokens": 8192,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
@@ -1748,18 +1763,16 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 3.0,
-          "output_per_million": 15.0
-        },
-        "batch": {
-          "input_per_million": 1.5,
-          "output_per_million": 7.5
+          "input_per_million": 3,
+          "output_per_million": 15,
+          "cached_input_per_million": 0.3
         }
       }
     },
@@ -1775,17 +1788,34 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-06-20",
+      "cost": {
+        "input": 3,
+        "output": 15,
+        "cache_read": 0.3,
+        "cache_write": 3.75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 8192
+      },
+      "knowledge": "2024-04"
     }
   },
   {
     "id": "anthropic.claude-3-5-sonnet-20240620-v1:0:51k",
-    "name": "Claude 3.5 Sonnet",
+    "name": "Claude Sonnet 3.5",
     "provider": "bedrock",
-    "family": "claude3_sonnet",
-    "created_at": null,
-    "context_window": 200000,
-    "max_output_tokens": 4096,
+    "family": "claude-sonnet",
+    "created_at": "2024-06-20 00:00:00 +0200",
+    "context_window": 51000,
+    "max_output_tokens": 8192,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
@@ -1798,18 +1828,16 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 3.0,
-          "output_per_million": 15.0
-        },
-        "batch": {
-          "input_per_million": 1.5,
-          "output_per_million": 7.5
+          "input_per_million": 3,
+          "output_per_million": 15,
+          "cached_input_per_million": 0.3
         }
       }
     },
@@ -1825,7 +1853,24 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-06-20",
+      "cost": {
+        "input": 3,
+        "output": 15,
+        "cache_read": 0.3,
+        "cache_write": 3.75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 8192
+      },
+      "knowledge": "2024-04"
     }
   },
   {
@@ -1895,12 +1940,12 @@
   },
   {
     "id": "anthropic.claude-3-5-sonnet-20241022-v2:0:18k",
-    "name": "Claude 3.5 Sonnet v2",
+    "name": "Claude Sonnet 3.5 v2",
     "provider": "bedrock",
-    "family": "claude3_sonnet",
-    "created_at": null,
-    "context_window": 200000,
-    "max_output_tokens": 4096,
+    "family": "claude-sonnet",
+    "created_at": "2024-10-22 00:00:00 +0200",
+    "context_window": 18000,
+    "max_output_tokens": 8192,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
@@ -1913,18 +1958,16 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 3.0,
-          "output_per_million": 15.0
-        },
-        "batch": {
-          "input_per_million": 1.5,
-          "output_per_million": 7.5
+          "input_per_million": 3,
+          "output_per_million": 15,
+          "cached_input_per_million": 0.3
         }
       }
     },
@@ -1940,17 +1983,34 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-10-22",
+      "cost": {
+        "input": 3,
+        "output": 15,
+        "cache_read": 0.3,
+        "cache_write": 3.75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 8192
+      },
+      "knowledge": "2024-04"
     }
   },
   {
     "id": "anthropic.claude-3-5-sonnet-20241022-v2:0:200k",
-    "name": "Claude 3.5 Sonnet v2",
+    "name": "Claude Sonnet 3.5 v2",
     "provider": "bedrock",
-    "family": "claude3_sonnet",
-    "created_at": null,
+    "family": "claude-sonnet",
+    "created_at": "2024-10-22 00:00:00 +0200",
     "context_window": 200000,
-    "max_output_tokens": 4096,
+    "max_output_tokens": 8192,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
@@ -1963,18 +2023,16 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 3.0,
-          "output_per_million": 15.0
-        },
-        "batch": {
-          "input_per_million": 1.5,
-          "output_per_million": 7.5
+          "input_per_million": 3,
+          "output_per_million": 15,
+          "cached_input_per_million": 0.3
         }
       }
     },
@@ -1990,17 +2048,34 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-10-22",
+      "cost": {
+        "input": 3,
+        "output": 15,
+        "cache_read": 0.3,
+        "cache_write": 3.75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 8192
+      },
+      "knowledge": "2024-04"
     }
   },
   {
     "id": "anthropic.claude-3-5-sonnet-20241022-v2:0:51k",
-    "name": "Claude 3.5 Sonnet v2",
+    "name": "Claude Sonnet 3.5 v2",
     "provider": "bedrock",
-    "family": "claude3_sonnet",
-    "created_at": null,
-    "context_window": 200000,
-    "max_output_tokens": 4096,
+    "family": "claude-sonnet",
+    "created_at": "2024-10-22 00:00:00 +0200",
+    "context_window": 51000,
+    "max_output_tokens": 8192,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
@@ -2013,18 +2088,16 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 3.0,
-          "output_per_million": 15.0
-        },
-        "batch": {
-          "input_per_million": 1.5,
-          "output_per_million": 7.5
+          "input_per_million": 3,
+          "output_per_million": 15,
+          "cached_input_per_million": 0.3
         }
       }
     },
@@ -2040,7 +2113,24 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-10-22",
+      "cost": {
+        "input": 3,
+        "output": 15,
+        "cache_read": 0.3,
+        "cache_write": 3.75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 8192
+      },
+      "knowledge": "2024-04"
     }
   },
   {
@@ -2159,10 +2249,10 @@
   },
   {
     "id": "anthropic.claude-3-haiku-20240307-v1:0:200k",
-    "name": "Claude 3 Haiku",
+    "name": "Claude Haiku 3",
     "provider": "bedrock",
-    "family": "claude3_haiku",
-    "created_at": null,
+    "family": "claude-haiku",
+    "created_at": "2024-03-13 00:00:00 +0100",
     "context_window": 200000,
     "max_output_tokens": 4096,
     "knowledge_cutoff": null,
@@ -2177,18 +2267,15 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
           "input_per_million": 0.25,
           "output_per_million": 1.25
-        },
-        "batch": {
-          "input_per_million": 0.125,
-          "output_per_million": 0.625
         }
       }
     },
@@ -2204,16 +2291,31 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-03-13",
+      "cost": {
+        "input": 0.25,
+        "output": 1.25
+      },
+      "limit": {
+        "context": 200000,
+        "output": 4096
+      },
+      "knowledge": "2024-02"
     }
   },
   {
     "id": "anthropic.claude-3-haiku-20240307-v1:0:48k",
-    "name": "Claude 3 Haiku",
+    "name": "Claude Haiku 3",
     "provider": "bedrock",
-    "family": "claude3_haiku",
-    "created_at": null,
-    "context_window": 200000,
+    "family": "claude-haiku",
+    "created_at": "2024-03-13 00:00:00 +0100",
+    "context_window": 48000,
     "max_output_tokens": 4096,
     "knowledge_cutoff": null,
     "modalities": {
@@ -2227,18 +2329,15 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
           "input_per_million": 0.25,
           "output_per_million": 1.25
-        },
-        "batch": {
-          "input_per_million": 0.125,
-          "output_per_million": 0.625
         }
       }
     },
@@ -2254,7 +2353,22 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-03-13",
+      "cost": {
+        "input": 0.25,
+        "output": 1.25
+      },
+      "limit": {
+        "context": 200000,
+        "output": 4096
+      },
+      "knowledge": "2024-02"
     }
   },
   {
@@ -2321,11 +2435,11 @@
   },
   {
     "id": "anthropic.claude-3-opus-20240229-v1:0:12k",
-    "name": "Claude 3 Opus",
+    "name": "Claude Opus 3",
     "provider": "bedrock",
-    "family": "claude3_opus",
-    "created_at": null,
-    "context_window": 200000,
+    "family": "claude-opus",
+    "created_at": "2024-02-29 00:00:00 +0100",
+    "context_window": 12000,
     "max_output_tokens": 4096,
     "knowledge_cutoff": null,
     "modalities": {
@@ -2339,18 +2453,15 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 15.0,
-          "output_per_million": 75.0
-        },
-        "batch": {
-          "input_per_million": 7.5,
-          "output_per_million": 37.5
+          "input_per_million": 15,
+          "output_per_million": 75
         }
       }
     },
@@ -2364,15 +2475,30 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-02-29",
+      "cost": {
+        "input": 15,
+        "output": 75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 4096
+      },
+      "knowledge": "2023-08"
     }
   },
   {
     "id": "anthropic.claude-3-opus-20240229-v1:0:200k",
-    "name": "Claude 3 Opus",
+    "name": "Claude Opus 3",
     "provider": "bedrock",
-    "family": "claude3_opus",
-    "created_at": null,
+    "family": "claude-opus",
+    "created_at": "2024-02-29 00:00:00 +0100",
     "context_window": 200000,
     "max_output_tokens": 4096,
     "knowledge_cutoff": null,
@@ -2387,18 +2513,15 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 15.0,
-          "output_per_million": 75.0
-        },
-        "batch": {
-          "input_per_million": 7.5,
-          "output_per_million": 37.5
+          "input_per_million": 15,
+          "output_per_million": 75
         }
       }
     },
@@ -2412,16 +2535,31 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-02-29",
+      "cost": {
+        "input": 15,
+        "output": 75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 4096
+      },
+      "knowledge": "2023-08"
     }
   },
   {
     "id": "anthropic.claude-3-opus-20240229-v1:0:28k",
-    "name": "Claude 3 Opus",
+    "name": "Claude Opus 3",
     "provider": "bedrock",
-    "family": "claude3_opus",
-    "created_at": null,
-    "context_window": 200000,
+    "family": "claude-opus",
+    "created_at": "2024-02-29 00:00:00 +0100",
+    "context_window": 28000,
     "max_output_tokens": 4096,
     "knowledge_cutoff": null,
     "modalities": {
@@ -2435,18 +2573,15 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 15.0,
-          "output_per_million": 75.0
-        },
-        "batch": {
-          "input_per_million": 7.5,
-          "output_per_million": 37.5
+          "input_per_million": 15,
+          "output_per_million": 75
         }
       }
     },
@@ -2460,7 +2595,22 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-02-29",
+      "cost": {
+        "input": 15,
+        "output": 75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 4096
+      },
+      "knowledge": "2023-08"
     }
   },
   {
@@ -2527,10 +2677,10 @@
   },
   {
     "id": "anthropic.claude-3-sonnet-20240229-v1:0:200k",
-    "name": "Claude 3 Sonnet",
+    "name": "Claude Sonnet 3",
     "provider": "bedrock",
-    "family": "claude3_sonnet",
-    "created_at": null,
+    "family": "claude-sonnet",
+    "created_at": "2024-03-04 00:00:00 +0100",
     "context_window": 200000,
     "max_output_tokens": 4096,
     "knowledge_cutoff": null,
@@ -2545,18 +2695,15 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 3.0,
-          "output_per_million": 15.0
-        },
-        "batch": {
-          "input_per_million": 1.5,
-          "output_per_million": 7.5
+          "input_per_million": 3,
+          "output_per_million": 15
         }
       }
     },
@@ -2572,16 +2719,31 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-03-04",
+      "cost": {
+        "input": 3,
+        "output": 15
+      },
+      "limit": {
+        "context": 200000,
+        "output": 4096
+      },
+      "knowledge": "2023-08"
     }
   },
   {
     "id": "anthropic.claude-3-sonnet-20240229-v1:0:28k",
-    "name": "Claude 3 Sonnet",
+    "name": "Claude Sonnet 3",
     "provider": "bedrock",
-    "family": "claude3_sonnet",
-    "created_at": null,
-    "context_window": 200000,
+    "family": "claude-sonnet",
+    "created_at": "2024-03-04 00:00:00 +0100",
+    "context_window": 28000,
     "max_output_tokens": 4096,
     "knowledge_cutoff": null,
     "modalities": {
@@ -2595,18 +2757,15 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 3.0,
-          "output_per_million": 15.0
-        },
-        "batch": {
-          "input_per_million": 1.5,
-          "output_per_million": 7.5
+          "input_per_million": 3,
+          "output_per_million": 15
         }
       }
     },
@@ -2622,7 +2781,22 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2024-03-04",
+      "cost": {
+        "input": 3,
+        "output": 15
+      },
+      "limit": {
+        "context": 200000,
+        "output": 4096
+      },
+      "knowledge": "2023-08"
     }
   },
   {
@@ -2906,7 +3080,7 @@
         "standard": {
           "input_per_million": 5,
           "output_per_million": 25,
-          "cached_input_per_million": 1.5
+          "cached_input_per_million": 0.5
         }
       }
     },
@@ -2920,8 +3094,8 @@
       "cost": {
         "input": 5,
         "output": 25,
-        "cache_read": 1.5,
-        "cache_write": 18.75
+        "cache_read": 0.5,
+        "cache_write": 6.25
       },
       "limit": {
         "context": 200000,
@@ -3224,18 +3398,16 @@
   },
   {
     "id": "anthropic.claude-v2:1:18k",
-    "name": "Claude",
+    "name": "Claude 2.1",
     "provider": "bedrock",
-    "family": "claude2",
-    "created_at": null,
-    "context_window": 200000,
+    "family": "claude",
+    "created_at": "2023-11-21 00:00:00 +0100",
+    "context_window": 18000,
     "max_output_tokens": 4096,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
-        "text",
-        "image",
-        "pdf"
+        "text"
       ],
       "output": [
         "text"
@@ -3248,12 +3420,8 @@
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 8.0,
-          "output_per_million": 24.0
-        },
-        "batch": {
-          "input_per_million": 4.0,
-          "output_per_million": 12.0
+          "input_per_million": 8,
+          "output_per_million": 24
         }
       }
     },
@@ -3268,23 +3436,36 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": false,
+      "temperature": true,
+      "last_updated": "2023-11-21",
+      "cost": {
+        "input": 8,
+        "output": 24
+      },
+      "limit": {
+        "context": 200000,
+        "output": 4096
+      },
+      "knowledge": "2023-08"
     }
   },
   {
     "id": "anthropic.claude-v2:1:200k",
-    "name": "Claude",
+    "name": "Claude 2.1",
     "provider": "bedrock",
-    "family": "claude2",
-    "created_at": null,
+    "family": "claude",
+    "created_at": "2023-11-21 00:00:00 +0100",
     "context_window": 200000,
     "max_output_tokens": 4096,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
-        "text",
-        "image",
-        "pdf"
+        "text"
       ],
       "output": [
         "text"
@@ -3297,12 +3478,8 @@
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 8.0,
-          "output_per_million": 24.0
-        },
-        "batch": {
-          "input_per_million": 4.0,
-          "output_per_million": 12.0
+          "input_per_million": 8,
+          "output_per_million": 24
         }
       }
     },
@@ -3317,7 +3494,22 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": false,
+      "temperature": true,
+      "last_updated": "2023-11-21",
+      "cost": {
+        "input": 8,
+        "output": 24
+      },
+      "limit": {
+        "context": 200000,
+        "output": 4096
+      },
+      "knowledge": "2023-08"
     }
   },
   {
@@ -3623,7 +3815,7 @@
         "standard": {
           "input_per_million": 5,
           "output_per_million": 25,
-          "cached_input_per_million": 1.5
+          "cached_input_per_million": 0.5
         }
       }
     },
@@ -3637,8 +3829,8 @@
       "cost": {
         "input": 5,
         "output": 25,
-        "cache_read": 1.5,
-        "cache_write": 18.75
+        "cache_read": 0.5,
+        "cache_write": 6.25
       },
       "limit": {
         "context": 200000,
@@ -5263,12 +5455,12 @@
   },
   {
     "id": "us.anthropic.claude-3-7-sonnet-20250219-v1:0",
-    "name": "Claude 3.7 Sonnet",
+    "name": "Claude Sonnet 3.7",
     "provider": "bedrock",
-    "family": "claude3_sonnet",
-    "created_at": null,
+    "family": "claude-sonnet",
+    "created_at": "2025-02-19 00:00:00 +0100",
     "context_window": 200000,
-    "max_output_tokens": 4096,
+    "max_output_tokens": 8192,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
@@ -5281,8 +5473,9 @@
       ]
     },
     "capabilities": [
-      "streaming",
       "function_calling",
+      "vision",
+      "streaming",
       "reasoning",
       "batch",
       "citations"
@@ -5290,12 +5483,9 @@
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 3.0,
-          "output_per_million": 15.0
-        },
-        "batch": {
-          "input_per_million": 1.5,
-          "output_per_million": 7.5
+          "input_per_million": 3,
+          "output_per_million": 15,
+          "cached_input_per_million": 0.3
         }
       }
     },
@@ -5311,18 +5501,35 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2025-02-19",
+      "cost": {
+        "input": 3,
+        "output": 15,
+        "cache_read": 0.3,
+        "cache_write": 3.75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 8192
+      },
+      "knowledge": "2024-04"
     }
   },
   {
     "id": "us.anthropic.claude-haiku-4-5-20251001-v1:0",
     "name": "Claude Haiku 4.5",
     "provider": "bedrock",
-    "family": "other",
-    "created_at": null,
+    "family": "claude-haiku",
+    "created_at": "2025-10-15 00:00:00 +0200",
     "context_window": 200000,
-    "max_output_tokens": 4096,
-    "knowledge_cutoff": null,
+    "max_output_tokens": 64000,
+    "knowledge_cutoff": "2025-02-28",
     "modalities": {
       "input": [
         "text",
@@ -5334,18 +5541,17 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "reasoning",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 0.1,
-          "output_per_million": 0.2
-        },
-        "batch": {
-          "input_per_million": 0.05,
-          "output_per_million": 0.1
+          "input_per_million": 1,
+          "output_per_million": 5,
+          "cached_input_per_million": 0.1
         }
       }
     },
@@ -5361,18 +5567,35 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2025-10-15",
+      "cost": {
+        "input": 1,
+        "output": 5,
+        "cache_read": 0.1,
+        "cache_write": 1.25
+      },
+      "limit": {
+        "context": 200000,
+        "output": 64000
+      },
+      "knowledge": "2025-02-28"
     }
   },
   {
     "id": "us.anthropic.claude-opus-4-1-20250805-v1:0",
     "name": "Claude Opus 4.1",
     "provider": "bedrock",
-    "family": "other",
-    "created_at": null,
+    "family": "claude-opus",
+    "created_at": "2025-08-05 00:00:00 +0200",
     "context_window": 200000,
-    "max_output_tokens": 4096,
-    "knowledge_cutoff": null,
+    "max_output_tokens": 32000,
+    "knowledge_cutoff": "2025-03-31",
     "modalities": {
       "input": [
         "text",
@@ -5384,18 +5607,17 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "reasoning",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 0.1,
-          "output_per_million": 0.2
-        },
-        "batch": {
-          "input_per_million": 0.05,
-          "output_per_million": 0.1
+          "input_per_million": 15,
+          "output_per_million": 75,
+          "cached_input_per_million": 1.5
         }
       }
     },
@@ -5411,17 +5633,34 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2025-08-05",
+      "cost": {
+        "input": 15,
+        "output": 75,
+        "cache_read": 1.5,
+        "cache_write": 18.75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 32000
+      },
+      "knowledge": "2025-03-31"
     }
   },
   {
     "id": "us.anthropic.claude-opus-4-20250514-v1:0",
     "name": "Claude Opus 4",
     "provider": "bedrock",
-    "family": "other",
-    "created_at": null,
+    "family": "claude-opus",
+    "created_at": "2025-05-22 00:00:00 +0200",
     "context_window": 200000,
-    "max_output_tokens": 4096,
+    "max_output_tokens": 32000,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
@@ -5434,18 +5673,17 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "reasoning",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 0.1,
-          "output_per_million": 0.2
-        },
-        "batch": {
-          "input_per_million": 0.05,
-          "output_per_million": 0.1
+          "input_per_million": 15,
+          "output_per_million": 75,
+          "cached_input_per_million": 1.5
         }
       }
     },
@@ -5461,18 +5699,35 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2025-05-22",
+      "cost": {
+        "input": 15,
+        "output": 75,
+        "cache_read": 1.5,
+        "cache_write": 18.75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 32000
+      },
+      "knowledge": "2024-04"
     }
   },
   {
     "id": "us.anthropic.claude-opus-4-5-20251101-v1:0",
     "name": "Claude Opus 4.5",
     "provider": "bedrock",
-    "family": "other",
-    "created_at": null,
+    "family": "claude-opus",
+    "created_at": "2025-11-24 00:00:00 +0100",
     "context_window": 200000,
-    "max_output_tokens": 4096,
-    "knowledge_cutoff": null,
+    "max_output_tokens": 64000,
+    "knowledge_cutoff": "2025-03-31",
     "modalities": {
       "input": [
         "text",
@@ -5484,18 +5739,17 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "reasoning",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 0.1,
-          "output_per_million": 0.2
-        },
-        "batch": {
-          "input_per_million": 0.05,
-          "output_per_million": 0.1
+          "input_per_million": 5,
+          "output_per_million": 25,
+          "cached_input_per_million": 0.5
         }
       }
     },
@@ -5511,17 +5765,34 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2025-08-01",
+      "cost": {
+        "input": 5,
+        "output": 25,
+        "cache_read": 0.5,
+        "cache_write": 6.25
+      },
+      "limit": {
+        "context": 200000,
+        "output": 64000
+      },
+      "knowledge": "2025-03-31"
     }
   },
   {
     "id": "us.anthropic.claude-sonnet-4-20250514-v1:0",
     "name": "Claude Sonnet 4",
     "provider": "bedrock",
-    "family": "other",
-    "created_at": null,
+    "family": "claude-sonnet",
+    "created_at": "2025-05-22 00:00:00 +0200",
     "context_window": 200000,
-    "max_output_tokens": 4096,
+    "max_output_tokens": 64000,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
@@ -5534,18 +5805,17 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "reasoning",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 0.1,
-          "output_per_million": 0.2
-        },
-        "batch": {
-          "input_per_million": 0.05,
-          "output_per_million": 0.1
+          "input_per_million": 3,
+          "output_per_million": 15,
+          "cached_input_per_million": 0.3
         }
       }
     },
@@ -5561,18 +5831,35 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2025-05-22",
+      "cost": {
+        "input": 3,
+        "output": 15,
+        "cache_read": 0.3,
+        "cache_write": 3.75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 64000
+      },
+      "knowledge": "2024-04"
     }
   },
   {
     "id": "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
     "name": "Claude Sonnet 4.5",
     "provider": "bedrock",
-    "family": "other",
-    "created_at": null,
+    "family": "claude-sonnet",
+    "created_at": "2025-09-29 00:00:00 +0200",
     "context_window": 200000,
-    "max_output_tokens": 4096,
-    "knowledge_cutoff": null,
+    "max_output_tokens": 64000,
+    "knowledge_cutoff": "2025-07-31",
     "modalities": {
       "input": [
         "text",
@@ -5584,18 +5871,17 @@
       ]
     },
     "capabilities": [
-      "streaming",
-      "function_calling"
+      "function_calling",
+      "reasoning",
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 0.1,
-          "output_per_million": 0.2
-        },
-        "batch": {
-          "input_per_million": 0.05,
-          "output_per_million": 0.1
+          "input_per_million": 3,
+          "output_per_million": 15,
+          "cached_input_per_million": 0.3
         }
       }
     },
@@ -5611,7 +5897,24 @@
       ],
       "output_modalities": [
         "TEXT"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "amazon-bedrock",
+      "open_weights": false,
+      "attachment": true,
+      "temperature": true,
+      "last_updated": "2025-09-29",
+      "cost": {
+        "input": 3,
+        "output": 15,
+        "cache_read": 0.3,
+        "cache_write": 3.75
+      },
+      "limit": {
+        "context": 200000,
+        "output": 64000
+      },
+      "knowledge": "2025-07-31"
     }
   },
   {
@@ -7499,7 +7802,7 @@
         "text"
       ],
       "output": [
-        "text"
+        "embeddings"
       ]
     },
     "capabilities": [
@@ -15867,7 +16170,7 @@
         "text"
       ],
       "output": [
-        "text"
+        "embeddings"
       ]
     },
     "capabilities": [
@@ -15914,7 +16217,7 @@
         "text"
       ],
       "output": [
-        "text"
+        "embeddings"
       ]
     },
     "capabilities": [
@@ -15961,7 +16264,7 @@
         "text"
       ],
       "output": [
-        "text"
+        "embeddings"
       ]
     },
     "capabilities": [
@@ -16584,6 +16887,66 @@
       ]
     }
   },
+  {
+    "id": "allenai/molmo-2-8b:free",
+    "name": "AllenAI: Molmo2 8B (free)",
+    "provider": "openrouter",
+    "family": "allenai",
+    "created_at": "2026-01-09 23:11:12 +0100",
+    "context_window": 36864,
+    "max_output_tokens": 36864,
+    "knowledge_cutoff": null,
+    "modalities": {
+      "input": [
+        "text",
+        "image",
+        "video"
+      ],
+      "output": [
+        "text"
+      ]
+    },
+    "capabilities": [
+      "streaming",
+      "predicted_outputs"
+    ],
+    "pricing": {},
+    "metadata": {
+      "description": "Molmo2-8B is an open vision-language model developed by the Allen Institute for AI (Ai2) as part of the Molmo2 family, supporting image, video, and multi-image understanding and grounding. It is based on Qwen3-8B and uses SigLIP 2 as its vision backbone, outperforming other open-weight, open-data models on short videos, counting, and captioning, while remaining competitive on long-video tasks.",
+      "architecture": {
+        "modality": "text+image->text",
+        "input_modalities": [
+          "text",
+          "image",
+          "video"
+        ],
+        "output_modalities": [
+          "text"
+        ],
+        "tokenizer": "Other",
+        "instruct_type": null
+      },
+      "top_provider": {
+        "context_length": 36864,
+        "max_completion_tokens": 36864,
+        "is_moderated": false
+      },
+      "per_request_limits": null,
+      "supported_parameters": [
+        "frequency_penalty",
+        "logit_bias",
+        "max_tokens",
+        "min_p",
+        "presence_penalty",
+        "repetition_penalty",
+        "seed",
+        "stop",
+        "temperature",
+        "top_k",
+        "top_p"
+      ]
+    }
+  },
   {
     "id": "allenai/olmo-2-0325-32b-instruct",
     "name": "AllenAI: Olmo 2 32B Instruct",
@@ -18057,7 +18420,7 @@
       },
       "top_provider": {
         "context_length": 200000,
-        "max_completion_tokens": null,
+        "max_completion_tokens": 32000,
         "is_moderated": true
       },
       "per_request_limits": null,
@@ -18145,7 +18508,7 @@
       },
       "top_provider": {
         "context_length": 200000,
-        "max_completion_tokens": 32000,
+        "max_completion_tokens": 64000,
         "is_moderated": true
       },
       "per_request_limits": null,
@@ -20016,7 +20379,14 @@
       "structured_output",
       "predicted_outputs"
     ],
-    "pricing": {},
+    "pricing": {
+      "text_tokens": {
+        "standard": {
+          "input_per_million": 0.19,
+          "output_per_million": 0.87
+        }
+      }
+    },
     "metadata": {
       "description": "DeepSeek V3, a 685B-parameter, mixture-of-experts model, is the latest iteration of the flagship chat model family from the DeepSeek team.\n\nIt succeeds the [DeepSeek V3](/deepseek/deepseek-chat-v3) model and performs really well on a variety of tasks.",
       "architecture": {
@@ -20299,8 +20669,8 @@
     "provider": "openrouter",
     "family": "deepseek",
     "created_at": "2025-05-28 19:59:30 +0200",
-    "context_window": 163840,
-    "max_output_tokens": 65536,
+    "context_window": 131072,
+    "max_output_tokens": 32768,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
@@ -20319,8 +20689,8 @@
     "pricing": {
       "text_tokens": {
         "standard": {
-          "input_per_million": 0.39999999999999997,
-          "output_per_million": 1.75
+          "input_per_million": 0.44999999999999996,
+          "output_per_million": 2.1500000000000004
         }
       }
     },
@@ -20338,8 +20708,8 @@
         "instruct_type": "deepseek-r1"
       },
       "top_provider": {
-        "context_length": 163840,
-        "max_completion_tokens": 65536,
+        "context_length": 131072,
+        "max_completion_tokens": 32768,
         "is_moderated": false
       },
       "per_request_limits": null,
@@ -20560,7 +20930,14 @@
       "structured_output",
       "predicted_outputs"
     ],
-    "pricing": {},
+    "pricing": {
+      "text_tokens": {
+        "standard": {
+          "input_per_million": 0.03,
+          "output_per_million": 0.11
+        }
+      }
+    },
     "metadata": {
       "description": "DeepSeek R1 Distill Llama 70B is a distilled large language model based on [Llama-3.3-70B-Instruct](/meta-llama/llama-3.3-70b-instruct), using outputs from [DeepSeek R1](/deepseek/deepseek-r1). The model combines advanced distillation techniques to achieve high performance across multiple benchmarks, including:\n\n- AIME 2024 pass@1: 70.0\n- MATH-500 pass@1: 94.5\n- CodeForces Rating: 1633\n\nThe model leverages fine-tuning from DeepSeek R1's outputs, enabling competitive performance comparable to larger frontier models.",
       "architecture": {
@@ -20638,7 +21015,14 @@
       "streaming",
       "structured_output"
     ],
-    "pricing": {},
+    "pricing": {
+      "text_tokens": {
+        "standard": {
+          "input_per_million": 0.15,
+          "output_per_million": 0.15
+        }
+      }
+    },
     "metadata": {
       "description": "DeepSeek R1 Distill Qwen 14B is a distilled large language model based on [Qwen 2.5 14B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B), using outputs from [DeepSeek R1](/deepseek/deepseek-r1). It outperforms OpenAI's o1-mini across various benchmarks, achieving new state-of-the-art results for dense models.\n\nOther benchmark results include:\n\n- AIME 2024 pass@1: 69.7\n- MATH-500 pass@1: 93.9\n- CodeForces Rating: 1481\n\nThe model leverages fine-tuning from DeepSeek R1's outputs, enabling competitive performance comparable to larger frontier models.",
       "architecture": {
@@ -22867,7 +23251,14 @@
       "structured_output",
       "predicted_outputs"
     ],
-    "pricing": {},
+    "pricing": {
+      "text_tokens": {
+        "standard": {
+          "input_per_million": 0.03,
+          "output_per_million": 0.09999999999999999
+        }
+      }
+    },
     "metadata": {
       "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3 12B is the second largest in the family of Gemma 3 models after [Gemma 3 27B](google/gemma-3-27b-it)",
       "architecture": {
@@ -22965,6 +23356,7 @@
       "supported_parameters": [
         "max_tokens",
         "seed",
+        "stop",
         "temperature",
         "top_p"
       ]
@@ -22995,7 +23387,14 @@
       "structured_output",
       "predicted_outputs"
     ],
-    "pricing": {},
+    "pricing": {
+      "text_tokens": {
+        "standard": {
+          "input_per_million": 0.04,
+          "output_per_million": 0.15
+        }
+      }
+    },
     "metadata": {
       "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3 27B is Google's latest open source model, successor to [Gemma 2](google/gemma-2-27b-it)",
       "architecture": {
@@ -23102,7 +23501,6 @@
         "response_format",
         "seed",
         "stop",
-        "structured_outputs",
         "temperature",
         "tool_choice",
         "tools",
@@ -23222,7 +23620,7 @@
         "max_tokens",
         "response_format",
         "seed",
-        "structured_outputs",
+        "stop",
         "temperature",
         "top_p"
       ]
@@ -23305,7 +23703,14 @@
       "streaming",
       "predicted_outputs"
     ],
-    "pricing": {},
+    "pricing": {
+      "text_tokens": {
+        "standard": {
+          "input_per_million": 0.02,
+          "output_per_million": 0.04
+        }
+      }
+    },
     "metadata": {
       "description": "Gemma 3n E4B-it is optimized for efficient execution on mobile and low-resource devices, such as phones, laptops, and tablets. It supports multimodal inputs—including text, visual data, and audio—enabling diverse tasks such as text generation, speech recognition, translation, and image analysis. Leveraging innovations like Per-Layer Embedding (PLE) caching and the MatFormer architecture, Gemma 3n dynamically manages memory usage and computational load by selectively activating model parameters, significantly reducing runtime resource requirements.\n\nThis model supports a wide linguistic range (trained in over 140 languages) and features a flexible 32K token context window. Gemma 3n can selectively load parameters, optimizing memory and computational efficiency based on the task or device capabilities, making it well-suited for privacy-focused, offline-capable applications and on-device AI solutions. [Read more in the blog post](https://developers.googleblog.com/en/introducing-gemma-3n/)",
       "architecture": {
@@ -23877,45 +24282,10 @@
       ]
     },
     "capabilities": [
-      "function_calling",
-      "streaming",
-      "structured_output"
+      "function_calling"
     ],
     "pricing": {},
     "metadata": {
-      "description": "KAT-Coder-Pro V1 is KwaiKAT's most advanced agentic coding model in the KAT-Coder series. Designed specifically for agentic coding tasks, it excels in real-world software engineering scenarios, achieving 73.4% solve rate on the SWE-Bench Verified benchmark. \n\nThe model has been optimized for tool-use capability, multi-turn interaction, instruction following, generalization, and comprehensive capabilities through a multi-stage training process, including mid-training, supervised fine-tuning (SFT), reinforcement fine-tuning (RFT), and scalable agentic RL.",
-      "architecture": {
-        "modality": "text->text",
-        "input_modalities": [
-          "text"
-        ],
-        "output_modalities": [
-          "text"
-        ],
-        "tokenizer": "Other",
-        "instruct_type": null
-      },
-      "top_provider": {
-        "context_length": 256000,
-        "max_completion_tokens": 128000,
-        "is_moderated": false
-      },
-      "per_request_limits": null,
-      "supported_parameters": [
-        "frequency_penalty",
-        "max_tokens",
-        "presence_penalty",
-        "repetition_penalty",
-        "response_format",
-        "seed",
-        "stop",
-        "structured_outputs",
-        "temperature",
-        "tool_choice",
-        "tools",
-        "top_k",
-        "top_p"
-      ],
       "source": "models.dev",
       "provider_id": "openrouter",
       "open_weights": false,
@@ -24658,7 +25028,14 @@
       "structured_output",
       "predicted_outputs"
     ],
-    "pricing": {},
+    "pricing": {
+      "text_tokens": {
+        "standard": {
+          "input_per_million": 0.049,
+          "output_per_million": 0.049
+        }
+      }
+    },
     "metadata": {
       "description": "Llama 3.2 11B Vision is a multimodal model with 11 billion parameters, designed to handle tasks combining visual and textual data. It excels in tasks such as image captioning and visual question answering, bridging the gap between language generation and visual reasoning. Pre-trained on a massive dataset of image-text pairs, it performs well in complex, high-accuracy image analysis.\n\nIts ability to integrate visual understanding with language processing makes it an ideal solution for industries requiring comprehensive visual-linguistic AI applications, such as content creation, AI-driven customer service, and research.\n\nClick here for the [original model card](https://github.com/meta-llama/llama-models/blob/main/models/llama3_2/MODEL_CARD_VISION.md).\n\nUsage of this model is subject to [Meta's Acceptable Use Policy](https://www.llama.com/llama3/use-policy/).",
       "architecture": {
@@ -26057,7 +26434,7 @@
       },
       "top_provider": {
         "context_length": 196608,
-        "max_completion_tokens": null,
+        "max_completion_tokens": 65536,
         "is_moderated": false
       },
       "per_request_limits": null,
@@ -28015,7 +28392,14 @@
       "streaming",
       "structured_output"
     ],
-    "pricing": {},
+    "pricing": {
+      "text_tokens": {
+        "standard": {
+          "input_per_million": 0.03,
+          "output_per_million": 0.11
+        }
+      }
+    },
     "metadata": {
       "description": "Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal capabilities. It provides state-of-the-art performance in text-based reasoning and vision tasks, including image analysis, programming, mathematical reasoning, and multilingual support across dozens of languages. Equipped with an extensive 128k token context window and optimized for efficient local inference, it supports use cases such as conversational agents, function calling, long-document comprehension, and privacy-sensitive deployments. The updated version is [Mistral Small 3.2](mistralai/mistral-small-3.2-24b-instruct)",
       "architecture": {
@@ -28152,7 +28536,14 @@
       "structured_output",
       "predicted_outputs"
     ],
-    "pricing": {},
+    "pricing": {
+      "text_tokens": {
+        "standard": {
+          "input_per_million": 0.06,
+          "output_per_million": 0.18
+        }
+      }
+    },
     "metadata": {
       "description": "Mistral-Small-3.2-24B-Instruct-2506 is an updated 24B parameter model from Mistral optimized for instruction following, repetition reduction, and improved function calling. Compared to the 3.1 release, version 3.2 significantly improves accuracy on WildBench and Arena Hard, reduces infinite generations, and delivers gains in tool use and structured output tasks.\n\nIt supports image and text inputs with structured outputs, function/tool calling, and strong performance across coding (HumanEval+, MBPP), STEM (MMLU, MATH, GPQA), and vision benchmarks (ChartQA, DocVQA).",
       "architecture": {
@@ -29445,8 +29836,8 @@
     }
   },
   {
-    "id": "nex-agi/deepseek-v3.1-nex-n1:free",
-    "name": "Nex AGI: DeepSeek V3.1 Nex N1 (free)",
+    "id": "nex-agi/deepseek-v3.1-nex-n1",
+    "name": "Nex AGI: DeepSeek V3.1 Nex N1",
     "provider": "openrouter",
     "family": "nex-agi",
     "created_at": "2025-12-08 15:33:13 +0100",
@@ -29466,7 +29857,14 @@
       "function_calling",
       "structured_output"
     ],
-    "pricing": {},
+    "pricing": {
+      "text_tokens": {
+        "standard": {
+          "input_per_million": 0.27,
+          "output_per_million": 1.0
+        }
+      }
+    },
     "metadata": {
       "description": "DeepSeek V3.1 Nex-N1 is the flagship release of the Nex-N1 series — a post-trained model designed to highlight agent autonomy, tool use, and real-world productivity. \n\nNex-N1 demonstrates competitive performance across all evaluation scenarios, showing particularly strong results in practical coding and HTML generation tasks.",
       "architecture": {
@@ -35479,7 +35877,14 @@
       "structured_output",
       "predicted_outputs"
     ],
-    "pricing": {},
+    "pricing": {
+      "text_tokens": {
+        "standard": {
+          "input_per_million": 0.03,
+          "output_per_million": 0.11
+        }
+      }
+    },
     "metadata": {
       "description": "Qwen2.5-Coder is the latest series of Code-Specific Qwen large language models (formerly known as CodeQwen). Qwen2.5-Coder brings the following improvements upon CodeQwen1.5:\n\n- Significantly improvements in **code generation**, **code reasoning** and **code fixing**. \n- A more comprehensive foundation for real-world applications such as **Code Agents**. Not only enhancing coding capabilities but also maintaining its strengths in mathematics and general competencies.\n\nTo read more about its evaluation results, check out [Qwen 2.5 Coder's blog](https://qwenlm.github.io/blog/qwen2.5-coder-family/).",
       "architecture": {
@@ -36279,7 +36684,14 @@
       "structured_output",
       "predicted_outputs"
     ],
-    "pricing": {},
+    "pricing": {
+      "text_tokens": {
+        "standard": {
+          "input_per_million": 0.15,
+          "output_per_million": 0.6
+        }
+      }
+    },
     "metadata": {
       "description": "Qwen2.5-VL is proficient in recognizing common objects such as flowers, birds, fish, and insects. It is also highly capable of analyzing texts, charts, icons, graphics, and layouts within images.",
       "architecture": {
@@ -37485,12 +37897,12 @@
   },
   {
     "id": "qwen/qwen3-coder-30b-a3b-instruct",
-    "name": "Qwen: Qwen3 Coder 30B A3B Instruct",
+    "name": "Qwen3 Coder 30B A3B Instruct",
     "provider": "openrouter",
-    "family": "qwen",
-    "created_at": "2025-07-31 16:32:59 +0200",
+    "family": "qwen3-coder",
+    "created_at": "2025-07-31 00:00:00 +0200",
     "context_window": 160000,
-    "max_output_tokens": 32768,
+    "max_output_tokens": 65536,
     "knowledge_cutoff": null,
     "modalities": {
       "input": [
@@ -37501,8 +37913,8 @@
       ]
     },
     "capabilities": [
-      "streaming",
       "function_calling",
+      "streaming",
       "structured_output"
     ],
     "pricing": {
@@ -37546,7 +37958,22 @@
         "tools",
         "top_k",
         "top_p"
-      ]
+      ],
+      "source": "models.dev",
+      "provider_id": "openrouter",
+      "open_weights": true,
+      "attachment": false,
+      "temperature": true,
+      "last_updated": "2025-07-31",
+      "cost": {
+        "input": 0.07,
+        "output": 0.27
+      },
+      "limit": {
+        "context": 160000,
+        "output": 65536
+      },
+      "knowledge": "2025-04"
     }
   },
   {
@@ -41790,7 +42217,7 @@
     "name": "Sonar Deep Research",
     "provider": "perplexity",
     "family": "sonar_deep_research",
-    "created_at": "2026-01-09 17:47:54 +0100",
+    "created_at": "2026-01-13 19:17:42 +0100",
     "context_window": 128000,
     "max_output_tokens": 4096,
     "knowledge_cutoff": null,
@@ -41874,7 +42301,7 @@
     "name": "Sonar Reasoning",
     "provider": "perplexity",
     "family": "sonar_reasoning",
-    "created_at": "2026-01-09 17:47:54 +0100",
+    "created_at": "2026-01-13 19:17:42 +0100",
     "context_window": 128000,
     "max_output_tokens": 4096,
     "knowledge_cutoff": null,
@@ -41951,115 +42378,6 @@
       "knowledge": "2025-09-01"
     }
   },
-  {
-    "id": "chat-bison",
-    "name": "chat-bison",
-    "provider": "vertexai",
-    "family": "palm",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "002",
-      "open_source_category": "PROPRIETARY",
-      "launch_stage": "GA",
-      "supported_actions": {
-        "openGenie": {
-          "references": {
-            "us-central1": {
-              "uri": "https://console.cloud.google.com/vertex-ai/generative/language/create/chat"
-            }
-          },
-          "title": "Open Prompt Design"
-        }
-      },
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/chat-bison@002"
-    }
-  },
-  {
-    "id": "code-bison",
-    "name": "code-bison",
-    "provider": "vertexai",
-    "family": "palm",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "002",
-      "open_source_category": null,
-      "launch_stage": "GA",
-      "supported_actions": null,
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/code-bison@002"
-    }
-  },
-  {
-    "id": "code-gecko",
-    "name": "code-gecko",
-    "provider": "vertexai",
-    "family": "gemini",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "002",
-      "open_source_category": null,
-      "launch_stage": "GA",
-      "supported_actions": null,
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/code-gecko@002"
-    }
-  },
-  {
-    "id": "codechat-bison",
-    "name": "codechat-bison",
-    "provider": "vertexai",
-    "family": "palm",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "002",
-      "open_source_category": null,
-      "launch_stage": "GA",
-      "supported_actions": null,
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/codechat-bison@002"
-    }
-  },
   {
     "id": "gemini-1.5-flash",
     "name": "Gemini 1.5 Flash",
@@ -42132,7 +42450,55 @@
     ],
     "pricing": {},
     "metadata": {
-      "source": "known_models"
+      "version_id": "default",
+      "open_source_category": "PROPRIETARY",
+      "launch_stage": "GA",
+      "supported_actions": {
+        "openNotebook": {
+          "references": {
+            "global": {
+              "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/gemini/getting-started/intro_gemini_1_5_flash.ipynb"
+            }
+          },
+          "title": "Open Notebook"
+        },
+        "openGenerationAiStudio": {
+          "references": {
+            "global": {
+              "uri": "https://console.cloud.google.com/vertex-ai/studio/freeform?model=gemini-1.5-flash-002"
+            }
+          }
+        },
+        "openEvaluationPipeline": {
+          "references": {
+            "global": {
+              "uri": "https://console.cloud.google.com/vertex-ai/pipelines/vertex-ai-templates/autosxs-template"
+            }
+          },
+          "title": "Evaluate"
+        },
+        "openNotebooks": {
+          "notebooks": [
+            {
+              "references": {
+                "global": {
+                  "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/gemini/getting-started/intro_gemini_1_5_flash.ipynb"
+                }
+              },
+              "title": "Open Notebook"
+            },
+            {
+              "references": {
+                "global": {
+                  "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/gemini/getting-started/intro_gemini_1_5_flash.ipynb"
+                }
+              },
+              "title": "Open Notebook"
+            }
+          ]
+        }
+      },
+      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/gemini-1.5-flash-002@default"
     }
   },
   {
@@ -42260,7 +42626,72 @@
     ],
     "pricing": {},
     "metadata": {
-      "source": "known_models"
+      "version_id": "default",
+      "open_source_category": "PROPRIETARY",
+      "launch_stage": "GA",
+      "supported_actions": {
+        "openNotebook": {
+          "references": {
+            "us-central1": {
+              "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/gemini/use-cases/retail/product_attributes_extraction.ipynb"
+            }
+          },
+          "title": "Open Notebook",
+          "resourceTitle": "Notebook",
+          "resourceUseCase": "Product Attributes Extraction",
+          "resourceDescription": "Extract product descriptions and attribute json from images using Gemini 1.5 Pro. This notebook also shows the use of self-correcting prompt to improve the quality of the output."
+        },
+        "openGenerationAiStudio": {
+          "references": {
+            "us-central1": {
+              "uri": "https://console.cloud.google.com/vertex-ai/studio/freeform?model=gemini-1.5-pro-002"
+            }
+          }
+        },
+        "openEvaluationPipeline": {
+          "references": {
+            "us-central1": {
+              "uri": "https://console.cloud.google.com/vertex-ai/pipelines/vertex-ai-templates/autosxs-template"
+            }
+          },
+          "title": "Evaluate"
+        },
+        "openNotebooks": {
+          "notebooks": [
+            {
+              "references": {
+                "us-central1": {
+                  "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/gemini/getting-started/intro_gemini_1_5_pro.ipynb"
+                }
+              },
+              "title": "Open Notebook"
+            },
+            {
+              "references": {
+                "us-central1": {
+                  "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/gemini/getting-started/intro_gemini_1_5_pro.ipynb"
+                }
+              },
+              "title": "Open Notebook",
+              "resourceTitle": "Notebook",
+              "resourceUseCase": "Vertex AI Gemini API 1.5 Pro",
+              "resourceDescription": "Use the Vertex AI Gemini API 1.5 Pro model to process images, video, audio, and text simultaneously."
+            },
+            {
+              "references": {
+                "us-central1": {
+                  "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/gemini/use-cases/retail/product_attributes_extraction.ipynb"
+                }
+              },
+              "title": "Open Notebook",
+              "resourceTitle": "Notebook",
+              "resourceUseCase": "Product Attributes Extraction",
+              "resourceDescription": "Extract product descriptions and attribute json from images using Gemini 1.5 Pro. This notebook also shows the use of self-correcting prompt to improve the quality of the output."
+            }
+          ]
+        }
+      },
+      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/gemini-1.5-pro-002@default"
     }
   },
   {
@@ -42336,7 +42767,43 @@
     ],
     "pricing": {},
     "metadata": {
-      "source": "known_models"
+      "version_id": "default",
+      "open_source_category": null,
+      "launch_stage": "GA",
+      "supported_actions": {
+        "openNotebook": {
+          "references": {
+            "us-central1": {
+              "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/gemini/getting-started/intro_gemini_2_0_flash.ipynb"
+            }
+          },
+          "resourceTitle": "Notebook",
+          "resourceUseCase": "Vertex Serving",
+          "resourceDescription": "Intro to Gemini 2.0 Flash."
+        },
+        "openGenerationAiStudio": {
+          "references": {
+            "us-central1": {
+              "uri": "https://console.cloud.google.com/vertex-ai/generative/multimodal/create/text?model=gemini-2.0-flash-001"
+            }
+          }
+        },
+        "openNotebooks": {
+          "notebooks": [
+            {
+              "references": {
+                "us-central1": {
+                  "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/gemini/getting-started/intro_gemini_2_0_flash.ipynb"
+                }
+              },
+              "resourceTitle": "Notebook",
+              "resourceUseCase": "Vertex Serving",
+              "resourceDescription": "Intro to Gemini 2.0 Flash."
+            }
+          ]
+        }
+      },
+      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/gemini-2.0-flash-001@default"
     }
   },
   {
@@ -42431,7 +42898,37 @@
     ],
     "pricing": {},
     "metadata": {
-      "source": "known_models"
+      "version_id": "default",
+      "open_source_category": null,
+      "launch_stage": "GA",
+      "supported_actions": null,
+      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/gemini-2.0-flash-lite-001@default"
+    }
+  },
+  {
+    "id": "gemini-2.0-flash-preview-image-generation",
+    "name": "gemini-2.0-flash-preview-image-generation",
+    "provider": "vertexai",
+    "family": "gemini-2",
+    "created_at": null,
+    "context_window": null,
+    "max_output_tokens": null,
+    "knowledge_cutoff": null,
+    "modalities": {
+      "input": [],
+      "output": []
+    },
+    "capabilities": [
+      "streaming",
+      "function_calling"
+    ],
+    "pricing": {},
+    "metadata": {
+      "version_id": "default",
+      "open_source_category": null,
+      "launch_stage": null,
+      "supported_actions": null,
+      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/gemini-2.0-flash-preview-image-generation@default"
     }
   },
   {
@@ -42471,6 +42968,11 @@
       }
     },
     "metadata": {
+      "version_id": "default",
+      "open_source_category": null,
+      "launch_stage": "GA",
+      "supported_actions": null,
+      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/gemini-2.5-flash@default",
       "source": "models.dev",
       "provider_id": "google-vertex",
       "open_weights": false,
@@ -42527,6 +43029,11 @@
       }
     },
     "metadata": {
+      "version_id": "default",
+      "open_source_category": null,
+      "launch_stage": "GA",
+      "supported_actions": null,
+      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/gemini-2.5-flash-lite@default",
       "source": "models.dev",
       "provider_id": "google-vertex",
       "open_weights": false,
@@ -42677,7 +43184,8 @@
     "capabilities": [
       "function_calling",
       "reasoning",
-      "vision"
+      "vision",
+      "streaming"
     ],
     "pricing": {
       "text_tokens": {
@@ -42689,6 +43197,19 @@
       }
     },
     "metadata": {
+      "version_id": "default",
+      "open_source_category": null,
+      "launch_stage": "PUBLIC_PREVIEW",
+      "supported_actions": {
+        "openGenerationAiStudio": {
+          "references": {
+            "us-central1": {
+              "uri": "https://console.cloud.google.com/vertex-ai/generative/multimodal/create/text?model=gemini-2.5-flash-preview-04-17"
+            }
+          }
+        }
+      },
+      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/gemini-2.5-flash-preview-04-17@default",
       "source": "models.dev",
       "provider_id": "google-vertex",
       "open_weights": false,
@@ -42853,6 +43374,11 @@
       }
     },
     "metadata": {
+      "version_id": "default",
+      "open_source_category": null,
+      "launch_stage": "GA",
+      "supported_actions": null,
+      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/gemini-2.5-pro@default",
       "source": "models.dev",
       "provider_id": "google-vertex",
       "open_weights": false,
@@ -42871,6 +43397,64 @@
       "knowledge": "2025-01"
     }
   },
+  {
+    "id": "gemini-2.5-pro-exp-03-25",
+    "name": "gemini-2.5-pro-exp-03-25",
+    "provider": "vertexai",
+    "family": "gemini-2",
+    "created_at": null,
+    "context_window": null,
+    "max_output_tokens": null,
+    "knowledge_cutoff": null,
+    "modalities": {
+      "input": [],
+      "output": []
+    },
+    "capabilities": [
+      "streaming",
+      "function_calling"
+    ],
+    "pricing": {},
+    "metadata": {
+      "version_id": "default",
+      "open_source_category": null,
+      "launch_stage": "EXPERIMENTAL",
+      "supported_actions": {
+        "openNotebook": {
+          "references": {
+            "us-central1": {
+              "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/gemini/getting-started/intro_gemini_2_5_pro.ipynb"
+            }
+          },
+          "resourceTitle": "Notebook",
+          "resourceUseCase": "Vertex Serving",
+          "resourceDescription": "Intro to Gemini 2.5 Pro."
+        },
+        "openGenerationAiStudio": {
+          "references": {
+            "us-central1": {
+              "uri": "https://console.cloud.google.com/vertex-ai/generative/multimodal/create/text?model=gemini-2.5-pro-exp-03-25"
+            }
+          }
+        },
+        "openNotebooks": {
+          "notebooks": [
+            {
+              "references": {
+                "us-central1": {
+                  "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/gemini/getting-started/intro_gemini_2_5_pro.ipynb"
+                }
+              },
+              "resourceTitle": "Notebook",
+              "resourceUseCase": "Vertex Serving",
+              "resourceDescription": "Intro to Gemini 2.5 Pro."
+            }
+          ]
+        }
+      },
+      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/gemini-2.5-pro-exp-03-25@default"
+    }
+  },
   {
     "id": "gemini-2.5-pro-preview-05-06",
     "name": "Gemini 2.5 Pro Preview 05-06",
@@ -43113,7 +43697,7 @@
         "text"
       ],
       "output": [
-        "text"
+        "embeddings"
       ]
     },
     "capabilities": [
@@ -43342,279 +43926,6 @@
       "source": "known_models"
     }
   },
-  {
-    "id": "image-segmentation-001",
-    "name": "image-segmentation-001",
-    "provider": "vertexai",
-    "family": "gemini",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "default",
-      "open_source_category": null,
-      "launch_stage": "PUBLIC_PREVIEW",
-      "supported_actions": {
-        "openNotebook": {
-          "references": {
-            "europe-west1": {
-              "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/vision/getting-started/image_segmentation.ipynb"
-            }
-          },
-          "title": "Open Notebook"
-        },
-        "requestAccess": {
-          "references": {
-            "europe-west1": {
-              "uri": "https://docs.google.com/forms/d/e/1FAIpQLSdzIR1EeQGFcMsqd9nPip5e9ovDKSjfWRd58QVjo1zLpfdvEg/viewform?resourcekey=0-Pvqc66u-0Z1QmuzHq4wLKg"
-            }
-          }
-        },
-        "openNotebooks": {
-          "notebooks": [
-            {
-              "references": {
-                "europe-west1": {
-                  "uri": "https://colab.research.google.com/github/GoogleCloudPlatform/generative-ai/blob/main/vision/getting-started/image_segmentation.ipynb"
-                }
-              },
-              "title": "Open Notebook"
-            }
-          ]
-        }
-      },
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/image-segmentation-001@default"
-    }
-  },
-  {
-    "id": "imagegeneration",
-    "name": "imagegeneration",
-    "provider": "vertexai",
-    "family": "gemini",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "006",
-      "open_source_category": "PROPRIETARY",
-      "launch_stage": "PUBLIC_PREVIEW",
-      "supported_actions": {
-        "openGenerationAiStudio": {
-          "references": {
-            "europe-west1": {
-              "uri": "https://cloud.google.com/console/vertex-ai/generative/vision"
-            }
-          },
-          "title": "Open Vertex AI Studio"
-        }
-      },
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/imagegeneration@006"
-    }
-  },
-  {
-    "id": "imagen-3.0-capability-002",
-    "name": "imagen-3.0-capability-002",
-    "provider": "vertexai",
-    "family": "gemini",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "default",
-      "open_source_category": null,
-      "launch_stage": "GA",
-      "supported_actions": null,
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/imagen-3.0-capability-002@default"
-    }
-  },
-  {
-    "id": "imagen-4.0-fast-generate-001",
-    "name": "imagen-4.0-fast-generate-001",
-    "provider": "vertexai",
-    "family": "gemini",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "default",
-      "open_source_category": null,
-      "launch_stage": "GA",
-      "supported_actions": {
-        "openGenerationAiStudio": {
-          "references": {
-            "europe-west1": {
-              "uri": "https://console.cloud.google.com/vertex-ai/studio/media/generate"
-            }
-          },
-          "title": "Open Vertex AI Studio"
-        }
-      },
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/imagen-4.0-fast-generate-001@default"
-    }
-  },
-  {
-    "id": "imagen-4.0-generate-001",
-    "name": "imagen-4.0-generate-001",
-    "provider": "vertexai",
-    "family": "gemini",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "default",
-      "open_source_category": null,
-      "launch_stage": "GA",
-      "supported_actions": {
-        "openGenerationAiStudio": {
-          "references": {
-            "europe-west1": {
-              "uri": "https://console.cloud.google.com/vertex-ai/studio/media/generate"
-            }
-          },
-          "title": "Open Vertex AI Studio"
-        }
-      },
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/imagen-4.0-generate-001@default"
-    }
-  },
-  {
-    "id": "imagen-4.0-ultra-generate-001",
-    "name": "imagen-4.0-ultra-generate-001",
-    "provider": "vertexai",
-    "family": "gemini",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "default",
-      "open_source_category": null,
-      "launch_stage": "GA",
-      "supported_actions": {
-        "openGenerationAiStudio": {
-          "references": {
-            "europe-west1": {
-              "uri": "https://console.cloud.google.com/vertex-ai/studio/media/generate"
-            }
-          },
-          "title": "Open Vertex AI Studio"
-        }
-      },
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/imagen-4.0-ultra-generate-001@default"
-    }
-  },
-  {
-    "id": "imagetext",
-    "name": "imagetext",
-    "provider": "vertexai",
-    "family": "gemini",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "001",
-      "open_source_category": "PROPRIETARY",
-      "launch_stage": "GA",
-      "supported_actions": {
-        "openGenerationAiStudio": {
-          "references": {
-            "us-central1": {
-              "uri": "https://cloud.google.com/console/vertex-ai/generative/vision"
-            }
-          },
-          "title": "Open Vertex AI Studio"
-        }
-      },
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/imagetext@001"
-    }
-  },
-  {
-    "id": "multimodalembedding",
-    "name": "multimodalembedding",
-    "provider": "vertexai",
-    "family": "gemini",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "001",
-      "open_source_category": "PROPRIETARY",
-      "launch_stage": "GA",
-      "supported_actions": null,
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/multimodalembedding@001"
-    }
-  },
   {
     "id": "openai/gpt-oss-120b-maas",
     "name": "GPT OSS 120B",
@@ -43707,48 +44018,6 @@
       }
     }
   },
-  {
-    "id": "text-bison",
-    "name": "text-bison",
-    "provider": "vertexai",
-    "family": "palm",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "002",
-      "open_source_category": "PROPRIETARY",
-      "launch_stage": "GA",
-      "supported_actions": {
-        "openGenie": {
-          "references": {
-            "us-central1": {
-              "uri": "https://console.cloud.google.com/vertex-ai/generative/language/create/text"
-            }
-          },
-          "title": "Open Prompt Design"
-        },
-        "openEvaluationPipeline": {
-          "references": {
-            "us-central1": {
-              "uri": "https://console.cloud.google.com/vertex-ai/pipelines/vertex-ai-templates/evaluation-llm-text-generation-pipeline"
-            }
-          },
-          "title": "Evaluate"
-        }
-      },
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/text-bison@002"
-    }
-  },
   {
     "id": "text-embedding-004",
     "name": "text-embedding-004",
@@ -43814,72 +44083,5 @@
     "metadata": {
       "source": "known_models"
     }
-  },
-  {
-    "id": "text-unicorn",
-    "name": "text-unicorn",
-    "provider": "vertexai",
-    "family": "gemini",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "001",
-      "open_source_category": "PROPRIETARY",
-      "launch_stage": "GA",
-      "supported_actions": {
-        "openGenie": {
-          "references": {
-            "europe-west1": {
-              "uri": "https://console.cloud.google.com/vertex-ai/generative/language/create/text"
-            }
-          },
-          "title": "Open in Vertex AI Studio"
-        },
-        "openEvaluationPipeline": {
-          "references": {
-            "europe-west1": {
-              "uri": "https://console.cloud.google.com/vertex-ai/pipelines/vertex-ai-templates/evaluation-llm-text-generation-pipeline"
-            }
-          },
-          "title": "Evaluate"
-        }
-      },
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/text-unicorn@001"
-    }
-  },
-  {
-    "id": "textembedding-gecko",
-    "name": "textembedding-gecko",
-    "provider": "vertexai",
-    "family": "gemini",
-    "created_at": null,
-    "context_window": null,
-    "max_output_tokens": null,
-    "knowledge_cutoff": null,
-    "modalities": {
-      "input": [],
-      "output": []
-    },
-    "capabilities": [
-      "streaming"
-    ],
-    "pricing": {},
-    "metadata": {
-      "version_id": "003",
-      "open_source_category": "PROPRIETARY",
-      "launch_stage": "GA",
-      "supported_actions": null,
-      "publisher_model_template": "projects/{project}/locations/{location}/publishers/google/models/textembedding-gecko@003"
-    }
   }
 ]