PyPI - model-library - Versions diffs - 0.1.2__py3-none-any.whl → 0.1.4__py3-none-any.whl - Mend

model-library 0.1.2__py3-none-any.whl → 0.1.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (41)

model_library/base/base.py +13 -6
model_library/base/output.py +55 -0
model_library/base/utils.py +3 -2
model_library/config/README.md +169 -0
model_library/config/ai21labs_models.yaml +11 -10
model_library/config/alibaba_models.yaml +21 -22
model_library/config/all_models.json +4708 -2471
model_library/config/amazon_models.yaml +100 -102
model_library/config/anthropic_models.yaml +59 -45
model_library/config/cohere_models.yaml +25 -24
model_library/config/deepseek_models.yaml +28 -25
model_library/config/dummy_model.yaml +9 -7
model_library/config/fireworks_models.yaml +86 -56
model_library/config/google_models.yaml +156 -102
model_library/config/inception_models.yaml +6 -6
model_library/config/kimi_models.yaml +13 -14
model_library/config/minimax_models.yaml +37 -0
model_library/config/mistral_models.yaml +85 -29
model_library/config/openai_models.yaml +192 -159
model_library/config/perplexity_models.yaml +8 -23
model_library/config/together_models.yaml +115 -103
model_library/config/xai_models.yaml +85 -57
model_library/config/zai_models.yaml +23 -15
model_library/exceptions.py +12 -17
model_library/file_utils.py +1 -1
model_library/providers/amazon.py +32 -17
model_library/providers/anthropic.py +2 -6
model_library/providers/google/google.py +35 -29
model_library/providers/minimax.py +33 -0
model_library/providers/mistral.py +10 -1
model_library/providers/openai.py +10 -8
model_library/providers/together.py +18 -211
model_library/register_models.py +36 -38
model_library/registry_utils.py +18 -16
model_library/utils.py +2 -2
{model_library-0.1.2.dist-info → model_library-0.1.4.dist-info}/METADATA +3 -4
model_library-0.1.4.dist-info/RECORD +64 -0
model_library-0.1.2.dist-info/RECORD +0 -61
{model_library-0.1.2.dist-info → model_library-0.1.4.dist-info}/WHEEL +0 -0
{model_library-0.1.2.dist-info → model_library-0.1.4.dist-info}/licenses/LICENSE +0 -0
{model_library-0.1.2.dist-info → model_library-0.1.4.dist-info}/top_level.txt +0 -0

model_library/config/together_models.yaml CHANGED Viewed

@@ -2,15 +2,17 @@
 base-config:
   open_source: true
   documentation_url: https://docs.together.ai/docs/serverless-models
-  class_properties:
-    supports_images: true
+  supports:
+    images: true
+    files: false
+    tools: false
+  metadata:
     available_as_evaluator: false
-    supports_files: false
     available_for_everyone: true
     ignored_for_cost: false
-    supports_tools: false
   properties:
     reasoning_model: false
+  costs_per_million_token:
     cache:
       read_discount: 1
     batch:
@@ -23,9 +25,9 @@ kimi-models:
     company: Kimi
     open_source: true
     documentation_url: https://www.kimi.com/
-    class_properties:
-      supports_tools: true
-      supports_temperature: true
+    supports:
+      tools: true
+      temperature: true
     default_parameters:
       temperature: 0.3
@@ -35,11 +37,11 @@ kimi-models:
     release_date: 2025-07-11
     properties:
       context_window: 128_000
-      max_token_output: 16_384
+      max_tokens: 16_384
       training_cutoff: null
       reasoning_model: false
-    class_properties:
-      supports_images: false
+    supports:
+      images: false
     costs_per_million_token:
       input: 1.00
       output: 3.00
@@ -49,9 +51,9 @@ llama-4-models:
   base-config:
     company: Meta
     open_source: true
-    class_properties:
-      supports_tools: true
-      supports_images: true
+    supports:
+      tools: true
+      images: true
   together/meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8:
     label: Llama 4 Maverick
@@ -60,7 +62,7 @@ llama-4-models:
     release_date: 2025-04-05
     properties:
       context_window: 1_000_000
-      max_token_output: 16_384
+      max_tokens: 16_384
       training_cutoff: "2024-08"
     costs_per_million_token:
       input: 0.27
@@ -74,7 +76,7 @@ llama-4-models:
     release_date: 2025-04-05
     properties:
       context_window: 10_000_000
-      max_token_output: 16_384
+      max_tokens: 16_384
       training_cutoff: "2024-08"
     costs_per_million_token:
       input: 0.18
@@ -83,7 +85,7 @@ llama-4-models:
 old-llama-models:
   base-config:
     company: Meta
-    class_properties:
+    metadata:
       deprecated: true
   together/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo:
@@ -92,7 +94,7 @@ old-llama-models:
     release_date: 2024-07-23
     properties:
       context_window: 131_072
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.18
@@ -106,9 +108,9 @@ old-llama-models:
     release_date: 2024-07-23
     properties:
       context_window: 131_072
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
-    class_properties:
+    metadata:
       available_as_evaluator: true
     costs_per_million_token:
       input: 0.88
@@ -122,7 +124,7 @@ old-llama-models:
     release_date: 2024-07-23
     properties:
       context_window: 130_815
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 3.50
@@ -136,7 +138,7 @@ old-llama-models:
     release_date: 2024-04-18
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-03"
     costs_per_million_token:
       input: 0.20
@@ -150,7 +152,7 @@ old-llama-models:
     release_date: 2024-04-18
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.90
@@ -164,7 +166,7 @@ old-llama-models:
     release_date: 2024-04-18
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.90
@@ -178,7 +180,7 @@ old-llama-models:
     release_date: 2024-04-18
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.90
@@ -192,7 +194,7 @@ old-llama-models:
     release_date: 2024-04-18
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.18
@@ -206,7 +208,7 @@ old-llama-models:
     release_date: 2024-04-18
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.88
@@ -220,7 +222,7 @@ old-llama-models:
     release_date: 2024-04-18
     properties:
       context_window: 131_072
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.06
@@ -234,13 +236,13 @@ old-llama-models:
     release_date: 2024-04-18
     properties:
       context_window: 131_072
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.18
       output: 0.18
-    class_properties:
-      supports_images: true
+    supports:
+      images: true
     alternative_keys:
       - together/llama-3.2-11b-instruct
@@ -250,13 +252,14 @@ old-llama-models:
     release_date: 2024-04-18
     properties:
       context_window: 131_072
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 1.2
       output: 1.2
-    class_properties:
-      supports_images: true
+    supports:
+      images: true
+    metadata:
       deprecated: true
     alternative_keys:
       - together/llama-3.2-90b-instruct
@@ -267,10 +270,10 @@ old-llama-models:
     release_date: 2024-12-06
     properties:
       context_window: 128_000
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
-    class_properties:
-      supports_images: false
+    supports:
+      images: false
     costs_per_million_token:
       input: 0.88
       output: 0.88
@@ -283,7 +286,7 @@ old-llama-models:
     release_date: 2024-04-18
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.10
@@ -295,7 +298,7 @@ old-llama-models:
     release_date: 2024-04-18
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.54
@@ -307,7 +310,7 @@ old-llama-models:
     release_date: 2024-04-18
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.20
@@ -321,7 +324,7 @@ old-llama-models:
     release_date: 2023-07-18
     properties:
       context_window: 4_096
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2022-09"
     costs_per_million_token:
       input: 0.20
@@ -333,7 +336,7 @@ old-llama-models:
     release_date: 2023-07-18
     properties:
       context_window: 4_096
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2022-09"
     costs_per_million_token:
       input: 0.20
@@ -347,7 +350,7 @@ old-llama-models:
     release_date: 2023-07-18
     properties:
       context_window: 4_096
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2022-09"
     costs_per_million_token:
       input: 0.30
@@ -359,7 +362,7 @@ old-llama-models:
     release_date: 2023-07-18
     properties:
       context_window: 4_096
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2022-09"
     costs_per_million_token:
       input: 0.30
@@ -373,7 +376,7 @@ old-llama-models:
     release_date: 2023-07-18
     properties:
       context_window: 4_096
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2022-09"
     costs_per_million_token:
       input: 0.90
@@ -385,9 +388,9 @@ old-llama-models:
     release_date: 2023-07-18
     properties:
       context_window: 4_096
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2022-09"
-    class_properties:
+    metadata:
       deprecated: true
     costs_per_million_token:
       input: 0.90
@@ -401,7 +404,7 @@ old-llama-models:
     release_date: 2023-07-18
     properties:
       context_window: 4_096
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2022-09"
     costs_per_million_token:
       input: 0.20
@@ -413,9 +416,9 @@ old-llama-models:
     release_date: 2023-07-18
     properties:
       context_window: 4_096
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2022-09"
-    class_properties:
+    metadata:
       deprecated: true
     costs_per_million_token:
       input: 0.20
@@ -429,9 +432,9 @@ old-llama-models:
     release_date: 2023-07-18
     properties:
       context_window: 4_096
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2022-09"
-    class_properties:
+    metadata:
       deprecated: true
     costs_per_million_token:
       input: 0.30
@@ -443,7 +446,7 @@ old-llama-models:
     release_date: 2023-07-18
     properties:
       context_window: 4_096
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2022-09"
     costs_per_million_token:
       input: 0.20
@@ -457,7 +460,7 @@ old-llama-models:
     release_date: 2023-07-18
     properties:
       context_window: 4_096
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2022-09"
     costs_per_million_token:
       input: 0.90
@@ -469,7 +472,7 @@ old-llama-models:
 nvidia-models:
   base-config:
     company: NVIDIA
-    class_properties:
+    metadata:
       deprecated: true
   together/nvidia/Llama-3.1-Nemotron-70B-Instruct-HF:
@@ -478,7 +481,7 @@ nvidia-models:
     release_date: 2024-04-18
     properties:
       context_window: 32_768
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.90
@@ -487,9 +490,10 @@ nvidia-models:
 qwen-models:
   base-config:
     company: Alibaba
-    class_properties:
+    supports:
+      temperature: true
+    metadata:
       deprecated: true
-      supports_temperature: true
     default_parameters:
       temperature: 0.7
@@ -499,14 +503,15 @@ qwen-models:
     release_date: 2024-04-18
     properties:
       context_window: 32_768
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.80
       output: 0.80
-    class_properties:
+    supports:
+      images: false
+    metadata:
       available_for_everyone: false
-      supports_images: false
   together/Qwen/Qwen2.5-7B-Instruct-Turbo:
     label: Qwen 2.5 Instruct Turbo (7B)
@@ -514,14 +519,15 @@ qwen-models:
     release_date: 2024-04-18
     properties:
       context_window: 32_768
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.30
       output: 0.30
-    class_properties:
+    supports:
+      images: false
+    metadata:
       available_for_everyone: false
-      supports_images: false
     alternative_keys:
       - together/qwen-2.5-7b-instruct
@@ -531,14 +537,15 @@ qwen-models:
     release_date: 2024-04-18
     properties:
       context_window: 32_768
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 1.20
       output: 1.20
-    class_properties:
+    supports:
+      images: false
+    metadata:
       available_for_everyone: false
-      supports_images: false
     alternative_keys:
       - together/qwen-2.5-72b-instruct
@@ -546,9 +553,10 @@ qwen-models:
 mistralai-models:
   base-config:
     company: Mistral
-    class_properties:
+    supports:
+      images: false
+    metadata:
       deprecated: true
-      supports_images: false
   together/mistralai/Mistral-7B-v0.1:
     label: Mistral (7B)
@@ -556,7 +564,7 @@ mistralai-models:
     release_date: 2023-09-27
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-06"
     costs_per_million_token:
       input: 0.18
@@ -570,7 +578,7 @@ mistralai-models:
     release_date: 2023-09-27
     properties:
       context_window: 32_768
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-06"
     costs_per_million_token:
       input: 0.18
@@ -584,11 +592,11 @@ mistralai-models:
     release_date: 2023-12-15
     properties:
       context_window: 32_768
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-09"
     costs_per_million_token:
-      input: 0.18
-      output: 0.18
+      input: 0.2
+      output: 0.2
     alternative_keys:
       - together/Mistral-7B-Instruct-v0.2
@@ -598,7 +606,7 @@ mistralai-models:
     release_date: 2024-04-18
     properties:
       context_window: 32_768
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.18
@@ -612,7 +620,7 @@ mistralai-models:
     release_date: 2023-12-15
     properties:
       context_window: 32_768
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-09"
     costs_per_million_token:
       input: 0.60
@@ -626,7 +634,7 @@ mistralai-models:
     release_date: 2023-12-15
     properties:
       context_window: 32_768
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-09"
     costs_per_million_token:
       input: 0.60
@@ -640,9 +648,9 @@ mistralai-models:
     release_date: 2024-02-15
     properties:
       context_window: 65_536
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
-    class_properties:
+    metadata:
       available_as_evaluator: true
     costs_per_million_token:
       input: 1.20
@@ -660,10 +668,11 @@ meta-llama-vision:
     release_date: 2024-04-18
     properties:
       context_window: 131_072
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
-    class_properties:
-      supports_images: true
+    supports:
+      images: true
+    metadata:
       available_for_everyone: false
       deprecated: true
@@ -674,10 +683,11 @@ meta-llama-vision:
     release_date: 2024-04-18
     properties:
       context_window: 131_072
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
-    class_properties:
-      supports_images: true
+    supports:
+      images: true
+    metadata:
       available_for_everyone: true
       deprecated: true
     costs_per_million_token:
@@ -693,10 +703,11 @@ meta-llama-vision:
     release_date: 2024-04-18
     properties:
       context_window: 131_072
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
-    class_properties:
-      supports_images: true
+    supports:
+      images: true
+    metadata:
       available_for_everyone: true
       deprecated: true
     costs_per_million_token:
@@ -714,15 +725,16 @@ google-models:
     release_date: 2024-02-21
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.50
       output: 0.50
-    class_properties:
+    metadata:
       available_for_everyone: false
       deprecated: true
-      supports_images: false
+    supports:
+      images: false
     alternative_keys:
       - together/gemma-2-27b-instruct
@@ -733,12 +745,12 @@ google-models:
     release_date: 2024-02-21
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.20
       output: 0.20
-    class_properties:
+    metadata:
       available_for_everyone: false
       deprecated: true
     alternative_keys:
@@ -751,12 +763,12 @@ google-models:
     release_date: 2024-02-21
     properties:
       context_window: 8_192
-      max_token_output: 4_096
+      max_tokens: 4_096
       training_cutoff: "2023-12"
     costs_per_million_token:
       input: 0.10
       output: 0.10
-    class_properties:
+    metadata:
       available_for_everyone: false
       deprecated: true
     alternative_keys:
@@ -766,7 +778,7 @@ google-models:
 falcon-models:
   base-config:
     company: Technology Innovation Institute
-    class_properties:
+    metadata:
       deprecated: true
   together/togethercomputer/falcon-7b-instruct:
@@ -819,7 +831,7 @@ alpaca-models:
     costs_per_million_token:
       input: 0.20
       output: 0.20
-    class_properties:
+    metadata:
       deprecated: true
     alternative_keys:
       - together/alpaca-7b
@@ -829,9 +841,9 @@ deepseek-models:
   base-config:
     company: DeepSeek
     open_source: true
-    class_properties:
-      supports_images: false
-      supports_temperature: true
+    supports:
+      images: false
+      temperature: true
     default_parameters:
       temperature: 1
@@ -841,9 +853,9 @@ deepseek-models:
     release_date: 2024-12-26
     properties:
       context_window: 131_072
-      max_token_output: null
+      max_tokens: null
       training_cutoff: null
-    class_properties:
+    metadata:
       deprecated: true
     costs_per_million_token:
       input: 1.25
@@ -856,10 +868,10 @@ deepseek-models:
     release_date: 2025-01-20
     properties:
       context_window: 163_840
-      max_token_output: null
+      max_tokens: null
       training_cutoff: null
       reasoning_model: true
-    class_properties:
+    metadata:
       deprecated: true
     costs_per_million_token:
       input: 3.00

model-library 0.1.2__py3-none-any.whl → 0.1.4__py3-none-any.whl

model-library 0.1.2__py3-none-any.whl → 0.1.4__py3-none-any.whl