PyPI - model-library - Versions diffs - 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl - Mend

model-library 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (48) hide show

model_library/base/base.py +237 -62
model_library/base/delegate_only.py +86 -9
model_library/base/input.py +10 -7
model_library/base/output.py +48 -0
model_library/base/utils.py +56 -7
model_library/config/alibaba_models.yaml +44 -57
model_library/config/all_models.json +253 -126
model_library/config/kimi_models.yaml +30 -3
model_library/config/openai_models.yaml +15 -23
model_library/config/zai_models.yaml +24 -3
model_library/exceptions.py +14 -77
model_library/logging.py +6 -2
model_library/providers/ai21labs.py +30 -14
model_library/providers/alibaba.py +17 -8
model_library/providers/amazon.py +119 -64
model_library/providers/anthropic.py +184 -104
model_library/providers/azure.py +22 -10
model_library/providers/cohere.py +7 -7
model_library/providers/deepseek.py +8 -8
model_library/providers/fireworks.py +7 -8
model_library/providers/google/batch.py +17 -13
model_library/providers/google/google.py +130 -73
model_library/providers/inception.py +7 -7
model_library/providers/kimi.py +18 -8
model_library/providers/minimax.py +30 -13
model_library/providers/mistral.py +61 -35
model_library/providers/openai.py +219 -93
model_library/providers/openrouter.py +34 -0
model_library/providers/perplexity.py +7 -7
model_library/providers/together.py +7 -8
model_library/providers/vals.py +16 -9
model_library/providers/xai.py +157 -144
model_library/providers/zai.py +38 -8
model_library/register_models.py +4 -2
model_library/registry_utils.py +39 -15
model_library/retriers/__init__.py +0 -0
model_library/retriers/backoff.py +73 -0
model_library/retriers/base.py +225 -0
model_library/retriers/token.py +427 -0
model_library/retriers/utils.py +11 -0
model_library/settings.py +1 -1
model_library/utils.py +13 -35
{model_library-0.1.6.dist-info → model_library-0.1.8.dist-info}/METADATA +4 -3
model_library-0.1.8.dist-info/RECORD +70 -0
{model_library-0.1.6.dist-info → model_library-0.1.8.dist-info}/WHEEL +1 -1
model_library-0.1.6.dist-info/RECORD +0 -64
{model_library-0.1.6.dist-info → model_library-0.1.8.dist-info}/licenses/LICENSE +0 -0
{model_library-0.1.6.dist-info → model_library-0.1.8.dist-info}/top_level.txt +0 -0

model_library/config/all_models.json CHANGED Viewed

@@ -1,4 +1,184 @@
 {
+    "kimi/kimi-k2.5-thinking": {
+        "company": "Moonshot AI",
+        "label": "Kimi K2.5",
+        "description": null,
+        "release_date": "2026-01-26",
+        "open_source": true,
+        "documentation_url": "https://platform.moonshot.ai/docs",
+        "properties": {
+            "context_window": 262144,
+            "max_tokens": 128000,
+            "training_cutoff": null,
+            "reasoning_model": true
+        },
+        "supports": {
+            "images": true,
+            "files": false,
+            "temperature": false,
+            "tools": true
+        },
+        "metadata": {
+            "deprecated": false,
+            "available_for_everyone": true,
+            "available_as_evaluator": false,
+            "ignored_for_cost": false
+        },
+        "provider_properties": {},
+        "costs_per_million_token": {
+            "input": 0.6,
+            "output": 3.0,
+            "cache": {
+                "read": 0.1,
+                "write_markup": 1.0
+            }
+        },
+        "alternative_keys": [],
+        "default_parameters": {
+            "temperature": 1.0,
+            "top_p": 0.95
+        },
+        "provider_endpoint": "kimi-k2.5",
+        "provider_name": "kimi",
+        "full_key": "kimi/kimi-k2.5-thinking",
+        "slug": "kimi_kimi-k2.5-thinking"
+    },
+    "kimi/kimi-k2.5": {
+        "company": "Moonshot AI",
+        "label": "Kimi K2.5",
+        "description": null,
+        "release_date": "2026-01-26",
+        "open_source": true,
+        "documentation_url": "https://platform.moonshot.ai/docs",
+        "properties": {
+            "context_window": 262144,
+            "max_tokens": 128000,
+            "training_cutoff": null,
+            "reasoning_model": false
+        },
+        "supports": {
+            "images": true,
+            "files": false,
+            "temperature": false,
+            "tools": true
+        },
+        "metadata": {
+            "deprecated": false,
+            "available_for_everyone": true,
+            "available_as_evaluator": false,
+            "ignored_for_cost": false
+        },
+        "provider_properties": {},
+        "costs_per_million_token": {
+            "input": 0.6,
+            "output": 3.0,
+            "cache": {
+                "read": 0.1,
+                "write_markup": 1.0
+            }
+        },
+        "alternative_keys": [
+            {
+                "kimi/kimi-k2.5-thinking": {
+                    "properties": {
+                        "reasoning_model": true
+                    },
+                    "default_parameters": {
+                        "temperature": 1.0
+                    }
+                }
+            }
+        ],
+        "default_parameters": {
+            "temperature": 0.6,
+            "top_p": 0.95
+        },
+        "provider_endpoint": "kimi-k2.5",
+        "provider_name": "kimi",
+        "full_key": "kimi/kimi-k2.5",
+        "slug": "kimi_kimi-k2.5"
+    },
+    "alibaba/qwen3-max-2026-01-23": {
+        "company": "Alibaba",
+        "label": "Qwen 3 Max Thinking",
+        "description": "Qwen 3 Max with enhanced reasoning capabilities",
+        "release_date": "2026-01-23",
+        "open_source": false,
+        "properties": {
+            "context_window": 256000,
+            "max_tokens": 32000,
+            "training_cutoff": null,
+            "reasoning_model": true
+        },
+        "supports": {
+            "images": false,
+            "temperature": true,
+            "tools": true
+        },
+        "metadata": {
+            "deprecated": false,
+            "available_for_everyone": false,
+            "available_as_evaluator": false,
+            "ignored_for_cost": false
+        },
+        "provider_properties": {},
+        "costs_per_million_token": {},
+        "alternative_keys": [],
+        "default_parameters": {
+            "temperature": 0.7
+        },
+        "provider_endpoint": "qwen3-max-2026-01-23",
+        "provider_name": "alibaba",
+        "full_key": "alibaba/qwen3-max-2026-01-23",
+        "slug": "alibaba_qwen3-max-2026-01-23"
+    },
+    "zai/glm-4.7-flashx": {
+        "company": "zAI",
+        "label": "GLM 4.7 Flash",
+        "description": "z.AI lightweight fast model",
+        "release_date": "2026-01-19",
+        "open_source": true,
+        "documentation_url": "https://docs.z.ai/",
+        "properties": {
+            "context_window": 200000,
+            "max_tokens": 128000,
+            "training_cutoff": null,
+            "reasoning_model": true
+        },
+        "supports": {
+            "images": false,
+            "files": false,
+            "temperature": true,
+            "tools": true
+        },
+        "metadata": {
+            "deprecated": false,
+            "available_for_everyone": true,
+            "available_as_evaluator": false,
+            "ignored_for_cost": false
+        },
+        "provider_properties": {
+            "clear_thinking": false
+        },
+        "costs_per_million_token": {
+            "input": 0.07,
+            "output": 0.4,
+            "cache": {
+                "read": 0.01,
+                "read_discount": 1.0,
+                "write_markup": 1.0
+            }
+        },
+        "alternative_keys": [],
+        "default_parameters": {
+            "temperature": 1.0,
+            "top_p": 0.95
+        },
+        "provider_endpoint": "glm-4.7-flashx",
+        "provider_name": "zai",
+        "full_key": "zai/glm-4.7-flashx",
+        "slug": "zai_glm-4.7-flashx"
+    },
     "minimax/MiniMax-M2.1": {
         "company": "MiniMax",
         "label": "MiniMax-M2.1",
@@ -229,6 +409,54 @@
         "full_key": "openai/gpt-5.2-pro",
         "slug": "openai_gpt-5.2-pro"
     },
+    "openai/gpt-5.2-codex": {
+        "company": "OpenAI",
+        "label": "GPT 5.2 Codex",
+        "description": "GPT 5.2 optimized for code",
+        "release_date": "2025-12-11",
+        "open_source": false,
+        "documentation_url": "https://platform.openai.com/docs/models/gpt-5.2-codex",
+        "properties": {
+            "context_window": 400000,
+            "max_tokens": 128000,
+            "training_cutoff": "2024-09",
+            "reasoning_model": true
+        },
+        "supports": {
+            "images": true,
+            "files": true,
+            "batch": true,
+            "temperature": false,
+            "tools": true
+        },
+        "metadata": {
+            "deprecated": false,
+            "available_for_everyone": false,
+            "available_as_evaluator": false,
+            "ignored_for_cost": false
+        },
+        "provider_properties": {},
+        "costs_per_million_token": {
+            "input": 1.75,
+            "output": 14.0,
+            "cache": {
+                "read": 0.175,
+                "write_markup": 1.0
+            },
+            "batch": {
+                "input_discount": 0.5,
+                "output_discount": 0.5
+            }
+        },
+        "alternative_keys": [],
+        "default_parameters": {
+            "reasoning_effort": "high"
+        },
+        "provider_endpoint": "gpt-5.2-codex",
+        "provider_name": "openai",
+        "full_key": "openai/gpt-5.2-codex",
+        "slug": "openai_gpt-5.2-codex"
+    },
     "openai/gpt-5.2-2025-12-11": {
         "company": "OpenAI",
         "label": "GPT 5.2",
@@ -408,7 +636,7 @@
     "openai/gpt-5.1-codex-max": {
         "company": "OpenAI",
         "label": "GPT 5.1 Codex Max",
-        "description": "OpenAI's frontier agentic coding model. Good at long-running coding tasks.",
+        "description": "GPT 5.1 optimized for code",
         "release_date": "2025-12-04",
         "open_source": false,
         "documentation_url": "",
@@ -921,7 +1149,7 @@
     "openai/gpt-5.1-codex": {
         "company": "OpenAI",
         "label": "GPT 5.1 Codex",
-        "description": "OpenAI's latest coding model",
+        "description": "GPT 5.1 optimized for code",
         "release_date": "2025-11-13",
         "open_source": false,
         "documentation_url": "https://platform.openai.com/docs/models/gpt-5.1-codex",
@@ -1015,7 +1243,7 @@
         "slug": "openai_gpt-5.1-2025-11-13"
     },
     "kimi/kimi-k2-thinking": {
-        "company": "Kimi",
+        "company": "Moonshot AI",
         "label": "Kimi K2 Thinking",
         "description": null,
         "release_date": "2025-11-06",
@@ -1025,7 +1253,7 @@
             "context_window": 256000,
             "max_tokens": 32000,
             "training_cutoff": null,
-            "reasoning_model": true
+            "reasoning_model": false
         },
         "supports": {
             "images": false,
@@ -1058,7 +1286,7 @@
             }
         ],
         "default_parameters": {
-            "temperature": 1.0
+            "temperature": 0.6
         },
         "provider_endpoint": "kimi-k2-thinking",
         "provider_name": "kimi",
@@ -1102,7 +1330,7 @@
         "slug": "inception_mercury"
     },
     "fireworks/kimi-k2-thinking": {
-        "company": "Kimi",
+        "company": "Moonshot AI",
         "label": "Kimi K2 Thinking",
         "description": null,
         "release_date": "2025-11-06",
@@ -1112,7 +1340,7 @@
             "context_window": 256000,
             "max_tokens": 32000,
             "training_cutoff": null,
-            "reasoning_model": true
+            "reasoning_model": false
         },
         "supports": {
             "images": false,
@@ -1136,7 +1364,7 @@
         },
         "alternative_keys": [],
         "default_parameters": {
-            "temperature": 1.0
+            "temperature": 0.6
         },
         "provider_endpoint": "kimi-k2-thinking",
         "provider_name": "fireworks",
@@ -1939,7 +2167,7 @@
             "temperature": true
         },
         "metadata": {
-            "deprecated": false,
+            "deprecated": true,
             "available_for_everyone": false,
             "available_as_evaluator": false,
             "ignored_for_cost": false
@@ -1982,10 +2210,7 @@
             "ignored_for_cost": false
         },
         "provider_properties": {},
-        "costs_per_million_token": {
-            "input": 1.2,
-            "output": 6.0
-        },
+        "costs_per_million_token": {},
         "alternative_keys": [],
         "default_parameters": {
             "temperature": 0.7
@@ -2019,19 +2244,7 @@
             "ignored_for_cost": false
         },
         "provider_properties": {},
-        "costs_per_million_token": {
-            "input": 1.2,
-            "output": 6.0,
-            "cache": {
-                "read_discount": 0.8,
-                "write_markup": 1.0
-            },
-            "context": {
-                "threshold": 32000.0,
-                "input": 2.4,
-                "output": 12.0
-            }
-        },
+        "costs_per_million_token": {},
         "alternative_keys": [],
         "default_parameters": {
             "temperature": 0.7
@@ -2383,8 +2596,8 @@
         "properties": {
             "context_window": 262144,
             "max_tokens": 65536,
-            "training_cutoff": "",
-            "reasoning_model": false
+            "training_cutoff": null,
+            "reasoning_model": true
         },
         "supports": {
             "images": false,
@@ -2398,10 +2611,7 @@
             "ignored_for_cost": false
         },
         "provider_properties": {},
-        "costs_per_million_token": {
-            "input": 1.2,
-            "output": 6.0
-        },
+        "costs_per_million_token": {},
         "alternative_keys": [],
         "default_parameters": {
             "temperature": 0.7
@@ -3305,9 +3515,14 @@
         },
         "alternative_keys": [
             {
-                "costs_per_million_token": {
-                    "input": 0.55,
-                    "output": 2.19
+                "fireworks/glm-4p5": {
+                    "metadata": {
+                        "deprecated": true
+                    },
+                    "costs_per_million_token": {
+                        "input": 0.55,
+                        "output": 2.19
+                    }
                 }
             }
         ],
@@ -3385,15 +3600,15 @@
             "tools": true
         },
         "metadata": {
-            "deprecated": false,
+            "deprecated": true,
             "available_for_everyone": true,
             "available_as_evaluator": false,
             "ignored_for_cost": false
         },
         "provider_properties": {},
         "costs_per_million_token": {
-            "input": 0.6,
-            "output": 2.2,
+            "input": 0.55,
+            "output": 2.19,
             "cache": {
                 "read": 0.11,
                 "read_discount": 1.0,
@@ -12286,94 +12501,6 @@
         "full_key": "azure/gpt-4-turbo-2024-04-09",
         "slug": "azure_gpt-4-turbo-2024-04-09"
     },
-    "databricks/dbrx-instruct": {
-        "company": "Databricks",
-        "label": "DBRX Instruct",
-        "description": "Databricks Instruct model.",
-        "release_date": "2024-03-27",
-        "open_source": false,
-        "properties": {
-            "context_window": 32768,
-            "max_tokens": 4096,
-            "training_cutoff": "2023-12",
-            "reasoning_model": false
-        },
-        "supports": {
-            "images": false,
-            "files": false,
-            "batch": true,
-            "temperature": true,
-            "tools": true
-        },
-        "metadata": {
-            "deprecated": true,
-            "available_for_everyone": false,
-            "available_as_evaluator": false,
-            "ignored_for_cost": false
-        },
-        "provider_properties": {},
-        "costs_per_million_token": {
-            "input": 2.25,
-            "output": 6.75,
-            "batch": {
-                "input_discount": 0.5,
-                "output_discount": 0.5
-            }
-        },
-        "alternative_keys": [],
-        "default_parameters": {
-            "reasoning_effort": "high"
-        },
-        "provider_endpoint": "databricks-dbrx-instruct",
-        "provider_name": "databricks",
-        "full_key": "databricks/dbrx-instruct",
-        "slug": "databricks_dbrx-instruct"
-    },
-    "databricks/databricks-dbrx-instruct": {
-        "company": "Databricks",
-        "label": "DBRX Instruct",
-        "description": "Databricks Instruct model.",
-        "release_date": "2024-03-27",
-        "open_source": false,
-        "properties": {
-            "context_window": 32768,
-            "max_tokens": 4096,
-            "training_cutoff": "2023-12",
-            "reasoning_model": false
-        },
-        "supports": {
-            "images": false,
-            "files": false,
-            "batch": true,
-            "temperature": true,
-            "tools": true
-        },
-        "metadata": {
-            "deprecated": true,
-            "available_for_everyone": false,
-            "available_as_evaluator": false,
-            "ignored_for_cost": false
-        },
-        "provider_properties": {},
-        "costs_per_million_token": {
-            "input": 2.25,
-            "output": 6.75,
-            "batch": {
-                "input_discount": 0.5,
-                "output_discount": 0.5
-            }
-        },
-        "alternative_keys": [
-            "databricks/dbrx-instruct"
-        ],
-        "default_parameters": {
-            "reasoning_effort": "high"
-        },
-        "provider_endpoint": "databricks-dbrx-instruct",
-        "provider_name": "databricks",
-        "full_key": "databricks/databricks-dbrx-instruct",
-        "slug": "databricks_databricks-dbrx-instruct"
-    },
     "cohere/command-r-03-2024": {
         "company": "Cohere",
         "label": "Command R (03/2024)",

model_library/config/kimi_models.yaml CHANGED Viewed

@@ -1,5 +1,5 @@
 base-config:
-  company: Kimi
+  company: Moonshot AI
   documentation_url: https://platform.moonshot.ai/docs
   open_source: true
   supports:
@@ -11,16 +11,43 @@ base-config:
     available_for_everyone: true
     ignored_for_cost: false
+kimi-k2.5-models:
+  kimi/kimi-k2.5:
+    label: Kimi K2.5
+    release_date: 2026-01-26
+    supports:
+      images: true
+      temperature: false
+    properties:
+      reasoning_model: false
+      context_window: 262_144
+      max_tokens: 128_000
+    default_parameters:
+      temperature: 0.6
+      top_p: 0.95
+    costs_per_million_token:
+      input: 0.6
+      output: 3.0
+      cache:
+        read: 0.1
+    alternative_keys:
+      - kimi/kimi-k2.5-thinking:
+          properties:
+            reasoning_model: true
+          default_parameters:
+            temperature: 1.0
 kimi-k2-models:
   kimi/kimi-k2-thinking:
     label: Kimi K2 Thinking
     release_date: 2025-11-06
     properties:
-      reasoning_model: true
+      reasoning_model: false
       context_window: 256_000
       max_tokens: 32_000
     default_parameters:
-      temperature: 1.0
+      temperature: 0.6
     costs_per_million_token:
       input: 0.6
       output: 2.5

model_library/config/openai_models.yaml CHANGED Viewed

@@ -35,6 +35,19 @@ gpt-5-models:
       training_cutoff: "2024-09"
       reasoning_model: true
+  openai/gpt-5.2-codex:
+    label: GPT 5.2 Codex
+    documentation_url: https://platform.openai.com/docs/models/gpt-5.2-codex
+    description: GPT 5.2 optimized for code
+    release_date: 2025-12-11
+    properties:
+      context_window: 400_000
+    costs_per_million_token:
+      input: 1.75
+      output: 14
+      cache:
+        read: 0.175
   openai/gpt-5.2-2025-12-11:
     label: GPT 5.2
     documentation_url: https://platform.openai.com/docs/models/gpt-5.2
@@ -70,7 +83,7 @@ gpt-5-models:
   openai/gpt-5.1-codex-max:
     label: GPT 5.1 Codex Max
     release_date: 2025-12-04
-    description: OpenAI's frontier agentic coding model. Good at long-running coding tasks.
+    description: GPT 5.1 optimized for code
     costs_per_million_token:
       input: 1.25
       output: 10.0
@@ -79,7 +92,7 @@ gpt-5-models:
   openai/gpt-5.1-codex:
     label: GPT 5.1 Codex
     documentation_url: https://platform.openai.com/docs/models/gpt-5.1-codex
-    description: OpenAI's latest coding model
+    description: GPT 5.1 optimized for code
     release_date: 2025-11-13
     costs_per_million_token:
       input: 1.25
@@ -841,24 +854,3 @@ gpt-3.5-models:
       input: 1.5
       output: 2.0
     documentation_url: https://platform.openai.com/docs/models/gpt-3.5-turbo-instruct
-databricks-models:
-  base-config:
-    company: Databricks
-  databricks/databricks-dbrx-instruct:
-    label: DBRX Instruct
-    description: Databricks Instruct model.
-    release_date: 2024-03-27
-    properties:
-      context_window: 32_768
-      max_tokens: 4_096
-      training_cutoff: "2023-12"
-    metadata:
-      available_for_everyone: false
-      deprecated: true
-    costs_per_million_token:
-      input: 2.25
-      output: 6.75
-    alternative_keys:
-      - databricks/dbrx-instruct

model_library/config/zai_models.yaml CHANGED Viewed

@@ -18,6 +18,25 @@ base-config:
       write_markup: 1
 zai-models:
+  zai/glm-4.7-flashx:
+    label: GLM 4.7 Flash
+    description: "z.AI lightweight fast model"
+    release_date: 2026-01-19
+    properties:
+      context_window: 200_000
+      max_tokens: 128_000
+    costs_per_million_token:
+      input: 0.07
+      output: 0.4
+      cache:
+        read: 0.01
+    default_parameters:
+      # from https://huggingface.co/zai-org/GLM-4.7-Flash
+      temperature: 1
+      top_p: 0.95
+    provider_properties:
+      clear_thinking: false
   zai/glm-4.7:
     label: GLM 4.7
     description: "Latest model from ZAI"
@@ -46,9 +65,11 @@ zai-models:
         read: 0.11
     alternative_keys:
       - fireworks/glm-4p5:
-        costs_per_million_token:
-          input: 0.55
-          output: 2.19
+          metadata:
+            deprecated: true
+          costs_per_million_token:
+            input: 0.55
+            output: 2.19
   zai/glm-4.5-air:
     label: GLM 4.5 Air

model-library 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl

model-library 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl