PyPI - model-library - Versions diffs - 0.1.2__py3-none-any.whl → 0.1.4__py3-none-any.whl - Mend

model-library 0.1.2__py3-none-any.whl → 0.1.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (41) [hide / show]

model_library/base/base.py +13 -6
model_library/base/output.py +55 -0
model_library/base/utils.py +3 -2
model_library/config/README.md +169 -0
model_library/config/ai21labs_models.yaml +11 -10
model_library/config/alibaba_models.yaml +21 -22
model_library/config/all_models.json +4708 -2471
model_library/config/amazon_models.yaml +100 -102
model_library/config/anthropic_models.yaml +59 -45
model_library/config/cohere_models.yaml +25 -24
model_library/config/deepseek_models.yaml +28 -25
model_library/config/dummy_model.yaml +9 -7
model_library/config/fireworks_models.yaml +86 -56
model_library/config/google_models.yaml +156 -102
model_library/config/inception_models.yaml +6 -6
model_library/config/kimi_models.yaml +13 -14
model_library/config/minimax_models.yaml +37 -0
model_library/config/mistral_models.yaml +85 -29
model_library/config/openai_models.yaml +192 -159
model_library/config/perplexity_models.yaml +8 -23
model_library/config/together_models.yaml +115 -103
model_library/config/xai_models.yaml +85 -57
model_library/config/zai_models.yaml +23 -15
model_library/exceptions.py +12 -17
model_library/file_utils.py +1 -1
model_library/providers/amazon.py +32 -17
model_library/providers/anthropic.py +2 -6
model_library/providers/google/google.py +35 -29
model_library/providers/minimax.py +33 -0
model_library/providers/mistral.py +10 -1
model_library/providers/openai.py +10 -8
model_library/providers/together.py +18 -211
model_library/register_models.py +36 -38
model_library/registry_utils.py +18 -16
model_library/utils.py +2 -2
{model_library-0.1.2.dist-info → model_library-0.1.4.dist-info}/METADATA +3 -4
model_library-0.1.4.dist-info/RECORD +64 -0
model_library-0.1.2.dist-info/RECORD +0 -61
{model_library-0.1.2.dist-info → model_library-0.1.4.dist-info}/WHEEL +0 -0
{model_library-0.1.2.dist-info → model_library-0.1.4.dist-info}/licenses/LICENSE +0 -0
{model_library-0.1.2.dist-info → model_library-0.1.4.dist-info}/top_level.txt +0 -0

model_library/config/cohere_models.yaml CHANGED Viewed

@@ -2,11 +2,12 @@ base-config:
   company: Cohere
   open_source: false
   documentation_url: https://docs.cohere.com/v2/docs/models
-  class_properties:
+  supports:
+    images: false
+    files: false
+    tools: true
+  metadata:
     available_as_evaluator: false
-    supports_images: false
-    supports_files: false
-    supports_tools: true
     available_for_everyone: true
     ignored_for_cost: false
   properties:
@@ -16,8 +17,8 @@ command-models:
   base-config:
     properties:
       context_window: 128000
-    class_properties:
-      supports_temperature: true
+    supports:
+      temperature: true
     default_parameters:
       temperature: 0.3
@@ -30,7 +31,7 @@ command-models:
     release_date: 2025-03-13
     properties:
       context_window: 256000
-      max_token_output: 8000
+      max_tokens: 8000
     costs_per_million_token:
       input: 2.5
       output: 10.0
@@ -43,8 +44,8 @@ command-models:
     release_date: 2024-04-24
     properties:
       context_window: 4000
-      max_token_output: 4000
-    class_properties:
+      max_tokens: 4000
+    metadata:
       deprecated: true
     costs_per_million_token:
       input: 0.3
@@ -58,8 +59,8 @@ command-models:
     release_date: 2024-03-24
     properties:
       context_window: 4000
-      max_token_output: 4000
-    class_properties:
+      max_tokens: 4000
+    metadata:
       deprecated: true
     costs_per_million_token:
       input: 1.0
@@ -73,8 +74,8 @@ command-models:
     release_date: 2024-04-24
     properties:
       context_window: 128000
-      max_token_output: 4000
-    class_properties:
+      max_tokens: 4000
+    metadata:
       available_for_everyone: false
       deprecated: true
     costs_per_million_token:
@@ -90,8 +91,8 @@ command-models:
     release_date: 2024-03-24
     properties:
       context_window: 128000
-      max_token_output: 4000
-    class_properties:
+      max_tokens: 4000
+    metadata:
       available_for_everyone: false
       deprecated: true
     costs_per_million_token:
@@ -107,8 +108,8 @@ command-models:
     release_date: 2024-08-30
     properties:
       context_window: 128000
-      max_token_output: 4000
-    class_properties:
+      max_tokens: 4000
+    metadata:
       available_for_everyone: false
       deprecated: true
     costs_per_million_token:
@@ -124,8 +125,8 @@ command-models:
     release_date: 2024-04-24
     properties:
       context_window: 128000
-      max_token_output: 4000
-    class_properties:
+      max_tokens: 4000
+    metadata:
       deprecated: true
     costs_per_million_token:
       input: 2.5
@@ -140,8 +141,8 @@ command-models:
     release_date: 2024-04-24
     properties:
       context_window: 128000
-      max_token_output: 4000
-    class_properties:
+      max_tokens: 4000
+    metadata:
       deprecated: true
     costs_per_million_token:
       input: 2.5
@@ -155,8 +156,8 @@ command-models:
     release_date: 2024-08-30
     properties:
       context_window: 128000
-      max_token_output: 4000
-    class_properties:
+      max_tokens: 4000
+    metadata:
       deprecated: true
     costs_per_million_token:
       input: 2.5
@@ -171,7 +172,7 @@ command-models:
     release_date: 2024-12-13
     properties:
       context_window: 128000
-      max_token_output: 4000
+      max_tokens: 4000
     costs_per_million_token:
       input: 0.0375
       output: 0.15

model_library/config/deepseek_models.yaml CHANGED Viewed

@@ -2,48 +2,51 @@ base-config:
   company: DeepSeek
   documentation_url: https://api-docs.deepseek.com/
   open_source: true
-  class_properties:
-    supports_images: false
+  supports:
+    images: false
+    files: false
+  metadata:
     available_as_evaluator: false
-    supports_files: false
     available_for_everyone: true
     ignored_for_cost: false
   properties:
     reasoning_model: false
-deepseek-v3p2-exp-models:
+deepseek-endpoints:
   base-config:
-    class_properties:
-      supports_images: false
-      supports_files: false
-      supports_batch_requests: false
-      supports_temperature: true
+    supports:
+      images: false
+      files: false
+      tools: true
+      batch: false
+      temperature: true
     default_parameters:
       temperature: 1
-    costs_per_million_token:
-      input: 0.28
-      output: 0.42
-      cache:
-        read_discount: 0.1
   deepseek/deepseek-chat:
-    label: DeepSeek V3.2-Exp (Nonthinking)
-    description: DeepSeek V3.2-Exp model for general conversation
+    label: DeepSeek Chat
+    description: DeepSeek's latest chat model
     release_date: 2025-09-29
     properties:
       context_window: 128_000
-      max_token_output: 8_000
+      max_tokens: 8_000
       reasoning_model: false
-    class_properties:
-      supports_tools: true
+    costs_per_million_token:
+      input: 0.27
+      output: 1.10
+      cache:
+        read: 0.07
   deepseek/deepseek-reasoner:
-    label: DeepSeek V3.2-Exp (Thinking)
-    description: DeepSeek V3.2-Exp model with thinking mode for complex reasoning
+    label: DeepSeek Reasoner
+    description: DeepSeek's latest reasoning model
     release_date: 2025-09-29
     properties:
       context_window: 128_000
-      max_token_output: 64_000
+      max_tokens: 64_000
       reasoning_model: true
-    class_properties:
-      supports_tools: false
+    costs_per_million_token:
+      input: 0.55
+      output: 2.19
+      cache:
+        read: 0.14

model_library/config/dummy_model.yaml CHANGED Viewed

@@ -2,11 +2,11 @@ vals-models:
   base-config:
     company: Vals AI
     documentation_url: ""
-    class_properties:
-      supports_batch_requests: true
+    supports:
+      batch: true
     properties:
       context_window: 128_000
-      max_token_output: 16_384
+      max_tokens: 16_384
       training_cutoff: ""
   vals/dumbmar-5o-ultra-thinking:
@@ -14,8 +14,9 @@ vals-models:
     open_source: false
     description: Vals Dummy Model for testing
     release_date: null
-    class_properties:
-      supports_images: false
+    supports:
+      images: false
+    metadata:
       available_as_evaluator: false
     costs_per_million_token:
       input: 0.15
@@ -28,8 +29,9 @@ vals-models:
     open_source: false
     description: Vals Dummy Model for evaluating
     release_date: null
-    class_properties:
-      supports_images: false
+    supports:
+      images: false
+    metadata:
       available_as_evaluator: true
     costs_per_million_token:
       input: 0.15

model_library/config/fireworks_models.yaml CHANGED Viewed

@@ -2,12 +2,13 @@ base-config:
   company: Fireworks
   documentation_url: https://fireworks.ai/models
   open_source: false
-  class_properties:
+  supports:
+    files: false
+    tools: true
+  metadata:
     available_as_evaluator: false
-    supports_files: false
     available_for_everyone: true
     ignored_for_cost: false
-    supports_tools: true
   properties:
     reasoning_model: false
   costs_per_million_token:
@@ -21,8 +22,8 @@ qwen-models:
   base-config:
     company: Alibaba
     open_source: true
-    class_properties:
-      supports_temperature: true
+    supports:
+      temperature: true
     default_parameters:
       temperature: 0.7
@@ -32,11 +33,11 @@ qwen-models:
     release_date: 2025-04-28
     properties:
       context_window: 128_000
-      max_token_output: 32_768
+      max_tokens: 32_768
       training_cutoff: "2024-08"
       reasoning_model: true
-    class_properties:
-      supports_images: false
+    supports:
+      images: false
     costs_per_million_token:
       input: 0.22
       output: 0.88
@@ -52,13 +53,14 @@ llama-4-models:
     release_date: 2025-04-05
     properties:
       context_window: 1_000_000
-      max_token_output: 16_384
+      max_tokens: 16_384
       training_cutoff: "2024-08"
     costs_per_million_token:
       input: 0.22
       output: 0.88
-    class_properties:
-      supports_images: true
+    supports:
+      images: true
+    metadata:
       deprecated: true
   fireworks/llama4-scout-instruct-basic:
@@ -67,23 +69,23 @@ llama-4-models:
     release_date: 2025-04-05
     properties:
       context_window: 10_000_000
-      max_token_output: 16_384
+      max_tokens: 16_384
       training_cutoff: "2024-08"
     costs_per_million_token:
-      input: 0.18
-      output: 0.59
-    class_properties:
-      supports_images: true
+      input: 0.15
+      output: 0.6
+    supports:
+      images: true
+    metadata:
       deprecated: true
 deepseek-models:
   base-config:
     company: DeepSeek
     open_source: true
-    class_properties:
-      supports_images: false
-      supports_temperature: true
-      deprecated: true
+    supports:
+      images: false
+      temperature: true
     default_parameters:
       temperature: 1
@@ -93,12 +95,14 @@ deepseek-models:
     release_date: 2025-01-20
     properties:
       context_window: 163_840
-      max_token_output: 163_840
+      max_tokens: 163_840
       training_cutoff: null
       reasoning_model: true
+    metadata:
+      deprecated: true
     costs_per_million_token:
-      input: 3.00
-      output: 8.00
+      input: 1.35
+      output: 5.4
   fireworks/deepseek-v3-0324:
     label: DeepSeek V3 (03/24/2025)
@@ -106,10 +110,12 @@ deepseek-models:
     release_date: 2025-03-24
     properties:
       context_window: 131_072
-      max_token_output: 131_072
+      max_tokens: 131_072
+    metadata:
+      deprecated: true
     costs_per_million_token:
-      input: 1.20
-      output: 1.20
+      input: 0.9
+      output: 0.9
   fireworks/deepseek-v3:
     label: DeepSeek V3
@@ -117,10 +123,12 @@ deepseek-models:
     release_date: 2024-12-26
     properties:
       context_window: 131_072
-      max_token_output: 131_072
+      max_tokens: 131_072
+    metadata:
+      deprecated: true
     costs_per_million_token:
-      input: 0.90
-      output: 0.90
+      input: 0.9
+      output: 0.9
   fireworks/deepseek-v3p1:
     label: DeepSeek V3.1
@@ -128,19 +136,39 @@ deepseek-models:
     release_date: 2025-08-21
     properties:
       context_window: 163_840
-      max_token_output: 163_840
-      reasoning_model: false # actually hybrid
-      deprecated: false # still using this one
+      max_tokens: 163_840
+      reasoning_model: false
+    costs_per_million_token:
+      input: 0.56
+      output: 1.68
+  fireworks/deepseek-v3p2:
+    label: DeepSeek V3.2 (Nonthinking)
+    description: ""
+    release_date: 2025-12-01
+    properties:
+      context_window: 160_000
+      max_tokens: 20_480
+      reasoning_model: false
     costs_per_million_token:
       input: 0.56
       output: 1.68
+      cache:
+        read: 0.28
+    alternative_keys:
+      - fireworks/deepseek-v3p2-thinking:
+          label: DeepSeek V3.2 (Thinking)
+          properties:
+            reasoning_model: true
+          default_parameters:
+            reasoning_effort: "high"
 openai-models:
   base-config:
     company: OpenAI
     open_source: true
-    class_properties:
-      supports_images: false
+    supports:
+      images: false
   fireworks/gpt-oss-120b:
     label: GPT OSS 120B
@@ -148,7 +176,7 @@ openai-models:
     release_date: 2025-08-05
     properties:
       context_window: 128_000
-      max_token_output: 32_768
+      max_tokens: 32_768
       training_cutoff: null
       reasoning_model: true
     costs_per_million_token:
@@ -161,20 +189,20 @@ openai-models:
     release_date: 2025-08-05
     properties:
       context_window: 128_000
-      max_token_output: 32_768
+      max_tokens: 32_768
       training_cutoff: null
       reasoning_model: true
     costs_per_million_token:
-      input: 0.05
-      output: 0.20
+      input: 0.07
+      output: 0.3
 kimi-models:
   base-config:
     company: Kimi
     open_source: true
     documentation_url: https://www.kimi.com/
-    class_properties:
-      supports_images: false
+    supports:
+      images: false
   fireworks/kimi-k2-instruct-0905:
     label: Kimi K2 Instruct 0905
@@ -182,11 +210,11 @@ kimi-models:
     release_date: 2025-09-04
     properties:
       context_window: 256_000
-      max_token_output: 256_000
+      max_tokens: 256_000
       training_cutoff: null
       reasoning_model: false
-    class_properties:
-      supports_images: false
+    supports:
+      images: false
     costs_per_million_token:
       input: 0.60
       output: 2.50
@@ -196,33 +224,35 @@ minimax-models:
     company: MiniMax AI
     documentation_url: https://platform.minimax.io/docs
     open_source: true
-    class_properties:
+    supports:
+      images: false
+      files: false
+      tools: true
+      temperature: true
+    metadata:
       available_as_evaluator: false
-      supports_images: false
-      supports_files: false
-      supports_tools: true
       available_for_everyone: true
       ignored_for_cost: false
-      supports_temperature: true
+    default_parameters:
+      temperature: 1.0
+      top_p: 0.95
+      top_k: 40
   fireworks/minimax-m2:
     label: MiniMax-M2
     description: MiniMax-M2 is a cost-efficient open-source model optimized for agentic applications and coding in particular.
     release_date: 2025-10-26
     properties:
-      context_window: 204_800
-      max_token_output: 131_000
+      context_window: 204_800
+      max_tokens: 131_000
       reasoning_model: true
       training_cutoff: null
-    class_properties:
-      supports_tools: true
-      supports_temperature: true
+    supports:
+      tools: true
+      temperature: true
     default_parameters: # taken from https://huggingface.co/MiniMaxAI/MiniMax-M2#inference-parameters
       temperature: 1.0
       top_p: 0.95
-      top_k: 40
     costs_per_million_token:
       input: 0.30
       output: 1.20

model-library 0.1.2__py3-none-any.whl → 0.1.4__py3-none-any.whl

model-library 0.1.2__py3-none-any.whl → 0.1.4__py3-none-any.whl