PyPI - model-library - Versions diffs - 0.1.3__py3-none-any.whl → 0.1.5__py3-none-any.whl - Mend

model-library 0.1.3__py3-none-any.whl → 0.1.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

model_library/base/base.py +2 -0
model_library/base/output.py +24 -9
model_library/base/utils.py +27 -5
model_library/config/README.md +169 -0
model_library/config/ai21labs_models.yaml +11 -11
model_library/config/alibaba_models.yaml +21 -22
model_library/config/all_models.json +4623 -2599
model_library/config/amazon_models.yaml +100 -102
model_library/config/anthropic_models.yaml +43 -52
model_library/config/cohere_models.yaml +25 -24
model_library/config/deepseek_models.yaml +28 -25
model_library/config/dummy_model.yaml +9 -7
model_library/config/fireworks_models.yaml +86 -56
model_library/config/google_models.yaml +146 -126
model_library/config/inception_models.yaml +6 -6
model_library/config/kimi_models.yaml +13 -14
model_library/config/minimax_models.yaml +37 -0
model_library/config/mistral_models.yaml +85 -29
model_library/config/openai_models.yaml +192 -150
model_library/config/perplexity_models.yaml +10 -23
model_library/config/together_models.yaml +115 -104
model_library/config/xai_models.yaml +47 -79
model_library/config/zai_models.yaml +23 -15
model_library/exceptions.py +7 -16
model_library/providers/amazon.py +32 -17
model_library/providers/minimax.py +33 -0
model_library/providers/mistral.py +10 -1
model_library/providers/openai.py +2 -6
model_library/register_models.py +36 -36
model_library/registry_utils.py +78 -16
model_library/utils.py +2 -2
{model_library-0.1.3.dist-info → model_library-0.1.5.dist-info}/METADATA +2 -2
model_library-0.1.5.dist-info/RECORD +64 -0
model_library-0.1.3.dist-info/RECORD +0 -61
{model_library-0.1.3.dist-info → model_library-0.1.5.dist-info}/WHEEL +0 -0
{model_library-0.1.3.dist-info → model_library-0.1.5.dist-info}/licenses/LICENSE +0 -0
{model_library-0.1.3.dist-info → model_library-0.1.5.dist-info}/top_level.txt +0 -0

model_library/config/google_models.yaml CHANGED Viewed

@@ -2,7 +2,14 @@ base-config:
   company: Google
   documentation_url: https://ai.google.dev/gemini-api/docs/models
   open_source: false
-  class_properties:
+  supports:
+    images: false
+    videos: false
+    files: false
+    batch: false
+    temperature: false
+    tools: false
+  metadata:
     available_for_everyone: true
     available_as_evaluator: false
     ignored_for_cost: false
@@ -21,30 +28,25 @@ gemma-models:
       use such as phones and tablets, capable of handling text, audio, and vision
       inputs with efficient parameter caching techniques.
     release_date: 2025-03-12
-    class_properties:
+    metadata:
       deprecated: true
     properties:
       context_window: 131_072
-      max_token_output: 8_192
+      max_tokens: 8_192
       training_cutoff: "2023-09"
     costs_per_million_token:
       input: 0.00
       output: 0.00
 gemini-3-models:
   base-config:
-    properties:
-      context_window: 1_048_576
-      max_token_output: 8_192
-      training_cutoff: "2025-01"
-    class_properties:
-      supports_images: true
-      supports_files: true
-      supports_videos: true
-      supports_tools: true
-      supports_batch_requests: true
-      supports_temperature: true
+    supports:
+      images: true
+      files: true
+      videos: true
+      tools: true
+      batch: true
+      temperature: true
     costs_per_million_token:
       cache:
         read_discount: 0.1
@@ -52,47 +54,55 @@ gemini-3-models:
       temperature: 1
       reasoning_effort: "high"
+  google/gemini-3-flash-preview:
+    label: Gemini 3 Flash (12/25)
+    description: Google's newest budget workhorse model
+    release_date: 2025-12-17
+    properties:
+      context_window: 1048576
+      max_tokens: 65536
+      reasoning_model: true
+    costs_per_million_token:
+      input: 0.50
+      output: 3.00
+    default_parameters:
+      temperature: 1
+      reasoning_effort: "high"
   google/gemini-3-pro-preview:
     label: Gemini 3 Pro (11/25)
     description: Gemini 3 Pro, Google's most powerful model.
     release_date: 2025-11-18
     properties:
       context_window: 1048576
-      max_token_output: 65536
+      max_tokens: 65536
       training_cutoff: "2025-01"
       reasoning_model: true
-    class_properties:
-      supports_images: true
-      supports_files: true
-      supports_videos: true
-      supports_tools: true
-      supports_batch_requests: true
-      supports_temperature: true
     costs_per_million_token:
-      input: 2
-      output: 12
+      input: 2.0
+      output: 12.0
       cache:
         read: 0.20
       context:
         threshold: 200_000
-        input: 2.5
-        output: 15.0
+        input: 4.0
+        output: 18.0
         cache:
           read: 0.40
 gemini-2.5-models:
   base-config:
+    supports:
+      images: true
+      files: true
+      videos: true
+      tools: true
+      batch: true
+      temperature: true
     properties:
       context_window: 1_048_576
-      max_token_output: 8_192
+      max_tokens: 8_192
       training_cutoff: "2024-05"
-    class_properties:
-      supports_images: true
-      supports_files: true
-      supports_videos: true
-      supports_tools: true
-      supports_batch_requests: true
-      supports_temperature: true
     costs_per_million_token:
       cache:
         read_discount: 0.1
@@ -107,12 +117,12 @@ gemini-2.5-models:
       using multimodal inputs including audio, images, video, and PDFs with a context
       window exceeding 1 million tokens.
     release_date: 2025-07-17
+    metadata:
+      available_as_evaluator: true
     properties:
       context_window: 1_048_576
-      max_token_output: 65_536
+      max_tokens: 65_536
       reasoning_model: true
-    class_properties:
-      available_as_evaluator: true
     costs_per_million_token:
       input: 1.25
       output: 10.0
@@ -132,12 +142,12 @@ gemini-2.5-models:
       large scale processing with support for multiple modalities, a 1 million token
       context window, and strong reasoning capabilities.
     release_date: 2025-07-17
+    metadata:
+      available_as_evaluator: true
     properties:
       context_window: 1_048_576
-      max_token_output: 65_536
+      max_tokens: 65_536
       reasoning_model: false
-    class_properties:
-      available_as_evaluator: true
     costs_per_million_token:
       input: 0.30
       output: 2.50
@@ -156,7 +166,7 @@ gemini-2.5-models:
     release_date: 2025-09-25
     properties:
       context_window: 1_048_576
-      max_token_output: 65_535
+      max_tokens: 65_535
       reasoning_model: false
     costs_per_million_token:
       input: 0.30
@@ -177,7 +187,7 @@ gemini-2.5-models:
     release_date: 2025-07-22
     properties:
       context_window: 1_048_576
-      max_token_output: 65_535
+      max_tokens: 65_535
       reasoning_model: false
     costs_per_million_token:
       input: 0.10
@@ -198,7 +208,7 @@ gemini-2.5-models:
     release_date: 2025-09-25
     properties:
       context_window: 1_048_576
-      max_token_output: 65_535
+      max_tokens: 65_535
       reasoning_model: false
     costs_per_million_token:
       input: 0.10
@@ -217,12 +227,12 @@ gemini-2.5-models:
       at scale, with support for text, images, video, and audio input modalities and
       large context length.
     release_date: 2025-06-17
+    metadata:
+      deprecated: true
     properties:
       context_window: 1_048_576
-      max_token_output: 65_535
+      max_tokens: 65_535
       reasoning_model: false
-    class_properties:
-      deprecated: true
     costs_per_million_token:
       input: 0.10
       output: 0.40
@@ -240,13 +250,13 @@ gemini-2.5-models:
       large scale processing with support for multiple modalities, a 1 million token
       context window, and strong reasoning capabilities.
     release_date: 2025-05-20
+    metadata:
+      deprecated: true
     properties:
       context_window: 1_048_576
-      max_token_output: 65_536
+      max_tokens: 65_536
       training_cutoff: "2025-01"
       reasoning_model: false
-    class_properties:
-      deprecated: true
     costs_per_million_token:
       input: 0.15
       output: 0.60
@@ -265,14 +275,15 @@ gemini-2.5-models:
       using multimodal inputs including audio, images, video, and PDFs with a context
       window exceeding 1 million tokens.
     release_date: 2025-06-05
+    supports:
+      batch: false
+    metadata:
+      deprecated: true
     properties:
       context_window: 1_048_576
-      max_token_output: 65_536
+      max_tokens: 65_536
       training_cutoff: "2025-01"
       reasoning_model: true
-    class_properties:
-      supports_batch_requests: false
-      deprecated: true
     costs_per_million_token:
       input: 1.25
       output: 10.0
@@ -287,14 +298,14 @@ gemini-2.5-models:
       using multimodal inputs including audio, images, video, and PDFs with a context
       window exceeding 1 million tokens.
     release_date: 2025-05-06
+    metadata:
+      available_for_everyone: false
+      deprecated: true
     properties:
       context_window: 1_048_576
-      max_token_output: 65_536
+      max_tokens: 65_536
       training_cutoff: "2025-01"
-      available_for_everyone: false
       reasoning_model: true
-    class_properties:
-      deprecated: true
     costs_per_million_token:
       input: 1.25
       output: 10.0
@@ -308,13 +319,13 @@ gemini-2.5-models:
       large scale processing with support for multiple modalities, a 1 million token
       context window, and strong reasoning capabilities.
     release_date: 2025-04-17
+    metadata:
+      deprecated: true
     properties:
       context_window: 1_048_576
-      max_token_output: 65_536
+      max_tokens: 65_536
       training_cutoff: "2025-01"
       reasoning_model: false
-    class_properties:
-      deprecated: true
     costs_per_million_token:
       input: 0.3
       output: 2.5
@@ -333,14 +344,14 @@ gemini-2.5-models:
       using multimodal inputs including audio, images, video, and PDFs with a context
       window exceeding 1 million tokens.
     release_date: 2025-03-25
+    metadata:
+      available_for_everyone: false
+      deprecated: true
     properties:
       context_window: 1_048_576
-      max_token_output: 65_536
+      max_tokens: 65_536
       training_cutoff: "2025-01"
-      available_for_everyone: false
       reasoning_model: true
-    class_properties:
-      deprecated: true
     costs_per_million_token:
       input: 1.25
       output: 10.0
@@ -355,14 +366,14 @@ gemini-2.5-models:
       using multimodal inputs including audio, images, video, and PDFs with a context
       window exceeding 1 million tokens.
     release_date: 2025-04-05
+    metadata:
+      available_for_everyone: false
+      deprecated: true
     properties:
       context_window: 1_048_576
-      max_token_output: 65_536
+      max_tokens: 65_536
       training_cutoff: "2025-01"
-      available_for_everyone: false
       reasoning_model: true
-    class_properties:
-      deprecated: true
     costs_per_million_token:
       input: 1.25
       output: 10.0
@@ -371,12 +382,12 @@ gemini-2.5-models:
 old-gemini-models:
   base-config:
+    metadata:
+      deprecated: true
     properties:
       context_window: 2_097_152
-      max_token_output: 8_192
+      max_tokens: 8_192
       training_cutoff: "2024-05"
-    class_properties:
-      deprecated: true
     costs_per_million_token:
       cache:
         read_discount: 0.25
@@ -388,17 +399,18 @@ old-gemini-models:
       large context processing and multimodal inputs, with strengths in speed, native
       tool use, and dataset comprehension.
     release_date: 2025-02-05
+    supports:
+      images: true
+      files: true
+      videos: true
+    metadata:
+      available_for_everyone: false
+      deprecated: true
     properties:
       context_window: 2_097_152
-      max_token_output: 8_192
+      max_tokens: 8_192
       training_cutoff: "2024-06"
       reasoning_model: true
-      available_for_everyone: false
-    class_properties:
-      deprecated: true
-      supports_images: true
-      supports_files: true
-      supports_videos: true
     costs_per_million_token:
       input: 1.25
       output: 5.00
@@ -410,17 +422,18 @@ old-gemini-models:
       reasoning and longer contextual memory in multimodal scenarios including text,
       images, video, and audio.
     release_date: 2025-01-21
+    supports:
+      images: true
+      files: true
+      videos: true
+    metadata:
+      available_for_everyone: false
+      deprecated: true
     properties:
       context_window: 1_048_576
-      max_token_output: 65_536
+      max_tokens: 65_536
       training_cutoff: "2024-05"
       reasoning_model: true
-      available_for_everyone: false
-    class_properties:
-      deprecated: true
-      supports_images: true
-      supports_files: true
-      supports_videos: true
     costs_per_million_token:
       input: 0.10
       output: 0.70
@@ -432,18 +445,19 @@ old-gemini-models:
       with a 1 million token context window and support for text, image, video, and
       audio inputs.
     release_date: 2025-02-05
+    supports:
+      images: true
+      files: true
+      videos: true
     properties:
-      properties: null
       context_window: 1_048_576
-      max_token_output: 8_192
+      max_tokens: 8_192
       training_cutoff: "2024-08"
     costs_per_million_token:
       input: 0.10
       output: 0.40
-    class_properties:
-      supports_images: true
-      supports_files: true
-      supports_videos: true
+      cache:
+        read: 0.025
   google/gemini-2.0-flash-exp:
     label: Gemini 2.0 Flash Exp
@@ -451,15 +465,16 @@ old-gemini-models:
       Gemini 2.0 Flash Experimental is a developer preview for advanced
       use cases requiring extended context and multimodal reasoning capabilities.
     release_date: 2024-12-11
+    supports:
+      images: true
+      files: true
+      videos: true
+    metadata:
+      deprecated: true
     properties:
       context_window: 1_048_576
-      max_token_output: 8_192
+      max_tokens: 8_192
       training_cutoff: "2024-05"
-    class_properties:
-      deprecated: true
-      supports_images: true
-      supports_files: true
-      supports_videos: true
     costs_per_million_token:
       input: 0.075
       output: 0.30
@@ -470,15 +485,16 @@ old-gemini-models:
       Gemini 1.5 Flash is an efficient and speedy version of Gemini 1.5
       with support for multiple data types and large contexts.
     release_date: 2024-09-24
+    supports:
+      images: true
+      files: true
+      videos: true
+    metadata:
+      deprecated: true
     properties:
       context_window: 1_048_576
-      max_token_output: 8_192
+      max_tokens: 8_192
       training_cutoff: "2024-05"
-    class_properties:
-      deprecated: true
-      supports_images: true
-      supports_files: true
-      supports_videos: true
     costs_per_million_token:
       input: 0.075
       output: 0.30
@@ -489,15 +505,16 @@ old-gemini-models:
       Gemini 1.5 Flash (early release) provides fast processing with vision
       and audio capabilities along with text understanding.
     release_date: 2024-05-24
+    supports:
+      images: true
+      files: true
+      videos: true
+    metadata:
+      deprecated: true
     properties:
       context_window: 1_048_576
-      max_token_output: 8_192
+      max_tokens: 8_192
       training_cutoff: "2023-11"
-    class_properties:
-      deprecated: true
-      supports_images: true
-      supports_files: true
-      supports_videos: true
     costs_per_million_token:
       input: 0.075
       output: 0.30
@@ -508,15 +525,16 @@ old-gemini-models:
       Gemini 1.5 Pro is a high-performance model with multimodal capabilities
       useful for complex reasoning tasks and dataset analysis.
     release_date: 2024-09-24
+    supports:
+      images: true
+      files: true
+      videos: true
+    metadata:
+      deprecated: true
     properties:
       context_window: 2_097_152
-      max_token_output: 8_192
+      max_tokens: 8_192
       training_cutoff: "2024-05"
-    class_properties:
-      deprecated: true
-      supports_images: true
-      supports_files: true
-      supports_videos: true
     costs_per_million_token:
       input: 1.25
       output: 5.0
@@ -530,15 +548,16 @@ old-gemini-models:
       Gemini 1.5 Pro (early release) supports multimodal inputs and advanced
       reasoning on moderate context lengths.
     release_date: 2024-05-24
+    supports:
+      images: true
+      files: true
+      videos: true
+    metadata:
+      deprecated: true
     properties:
       context_window: 1_048_576
-      max_token_output: 8_192
+      max_tokens: 8_192
       training_cutoff: "2023-11"
-    class_properties:
-      deprecated: true
-      supports_images: true
-      supports_files: true
-      supports_videos: true
     costs_per_million_token:
       input: 1.25
       output: 5.0
@@ -549,13 +568,14 @@ old-gemini-models:
       Gemini 1.0 Pro is an earlier generation multimodal model supporting
       text, image, and audio inputs with foundational reasoning abilities.
     release_date: 2024-02-14
+    supports:
+      images: false
+    metadata:
+      deprecated: true
     properties:
       context_window: 32_760
-      max_token_output: 8_192
+      max_tokens: 8_192
       training_cutoff: "2023-02"
-    class_properties:
-      supports_images: false
-      deprecated: true
     costs_per_million_token:
       input: 0.50
       output: 1.50

model_library/config/inception_models.yaml CHANGED Viewed

@@ -2,11 +2,12 @@ base-config:
   company: Inception
   documentation_url: https://docs.inceptionlabs.ai/get-started/models
   open_source: false
-  class_properties:
-    supports_images: false
-    supports_tools: true
+  supports:
+    images: false
+    tools: true
+    files: false
+  metadata:
     available_as_evaluator: false
-    supports_files: false
     available_for_everyone: true
     ignored_for_cost: false
@@ -17,8 +18,7 @@ inception-models:
     properties:
       reasoning_model: false
       context_window: 128_000
-    default_parameters:
-      max_output_tokens: 16_400 # number lifted from https://openrouter.ai/inception/mercury
+      max_tokens: 16_384 # rounded down
     costs_per_million_token:
       input: 0.25
       output: 1

model_library/config/kimi_models.yaml CHANGED Viewed

@@ -2,33 +2,32 @@ base-config:
   company: Kimi
   documentation_url: https://platform.moonshot.ai/docs
   open_source: true
-  class_properties:
-    supports_images: false
-    supports_tools: true
+  supports:
+    images: false
+    tools: true
+    files: false
+  metadata:
     available_as_evaluator: false
-    supports_files: false
     available_for_everyone: true
     ignored_for_cost: false
 kimi-k2-models:
   kimi/kimi-k2-thinking:
     label: Kimi K2 Thinking
     release_date: 2025-11-06
     properties:
       reasoning_model: true
-      context_window: 128_000
-      max_token_output: 128_000
+      context_window: 256_000
+      max_tokens: 32_000
     default_parameters:
       temperature: 1.0
-      max_output_tokens: 128_000
     costs_per_million_token:
-      input: 0.60
-      output: 2.50
+      input: 0.6
+      output: 2.5
+      cache:
+        read: 0.15
     alternative_keys:
       - fireworks/kimi-k2-thinking:
           costs_per_million_token:
-            input: 0.50
-            output: 0.50
-            cache:
-              read_discount: 1
+            input: 0.6
+            output: 2.5

model_library/config/minimax_models.yaml ADDED Viewed

@@ -0,0 +1,37 @@
+base-config:
+  company: MiniMax
+  documentation_url: https://platform.minimax.io/docs
+  open_source: true
+  supports:
+    images: false
+    files: false
+    tools: true
+    temperature: true
+  metadata:
+    available_as_evaluator: false
+    available_for_everyone: true
+    ignored_for_cost: false
+  properties:
+    reasoning_model: false
+minimax-m2-models:
+  minimax/MiniMax-M2:
+    label: MiniMax-M2
+    description: MiniMax-M2 is a cost-efficient open-source model optimized for agentic applications and coding in particular.
+    release_date: 2025-10-26
+    properties:
+      context_window: 204_800
+      max_tokens: 131_000
+      reasoning_model: true
+      training_cutoff: null
+    default_parameters:
+      temperature: 1.0
+      top_p: 0.95
+    costs_per_million_token:
+      input: 0.30
+      output: 1.20
+      cache:
+        read: 0.03
+        write: 0.375

model-library 0.1.3__py3-none-any.whl → 0.1.5__py3-none-any.whl

model-library 0.1.3__py3-none-any.whl → 0.1.5__py3-none-any.whl