PyPI - model-library - Versions diffs - 0.1.7__py3-none-any.whl → 0.1.9__py3-none-any.whl - Mend

model-library 0.1.7__py3-none-any.whl → 0.1.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (52) hide show

model_library/base/base.py +141 -62
model_library/base/delegate_only.py +77 -10
model_library/base/output.py +43 -0
model_library/base/utils.py +35 -0
model_library/config/alibaba_models.yaml +49 -57
model_library/config/all_models.json +353 -120
model_library/config/anthropic_models.yaml +2 -1
model_library/config/kimi_models.yaml +30 -3
model_library/config/mistral_models.yaml +2 -0
model_library/config/openai_models.yaml +15 -23
model_library/config/together_models.yaml +2 -0
model_library/config/xiaomi_models.yaml +43 -0
model_library/config/zai_models.yaml +27 -3
model_library/exceptions.py +3 -77
model_library/providers/ai21labs.py +12 -8
model_library/providers/alibaba.py +17 -8
model_library/providers/amazon.py +49 -16
model_library/providers/anthropic.py +128 -48
model_library/providers/azure.py +22 -10
model_library/providers/cohere.py +7 -7
model_library/providers/deepseek.py +8 -8
model_library/providers/fireworks.py +7 -8
model_library/providers/google/batch.py +14 -10
model_library/providers/google/google.py +57 -30
model_library/providers/inception.py +7 -7
model_library/providers/kimi.py +18 -8
model_library/providers/minimax.py +15 -17
model_library/providers/mistral.py +20 -8
model_library/providers/openai.py +99 -22
model_library/providers/openrouter.py +34 -0
model_library/providers/perplexity.py +7 -7
model_library/providers/together.py +7 -8
model_library/providers/vals.py +12 -6
model_library/providers/vercel.py +34 -0
model_library/providers/xai.py +47 -42
model_library/providers/xiaomi.py +34 -0
model_library/providers/zai.py +38 -8
model_library/register_models.py +5 -0
model_library/registry_utils.py +48 -17
model_library/retriers/__init__.py +0 -0
model_library/retriers/backoff.py +73 -0
model_library/retriers/base.py +225 -0
model_library/retriers/token.py +427 -0
model_library/retriers/utils.py +11 -0
model_library/settings.py +1 -1
model_library/utils.py +17 -7
{model_library-0.1.7.dist-info → model_library-0.1.9.dist-info}/METADATA +2 -1
model_library-0.1.9.dist-info/RECORD +73 -0
{model_library-0.1.7.dist-info → model_library-0.1.9.dist-info}/WHEEL +1 -1
model_library-0.1.7.dist-info/RECORD +0 -64
{model_library-0.1.7.dist-info → model_library-0.1.9.dist-info}/licenses/LICENSE +0 -0
{model_library-0.1.7.dist-info → model_library-0.1.9.dist-info}/top_level.txt +0 -0

model_library/config/all_models.json CHANGED Viewed

@@ -1,4 +1,187 @@
 {
+    "kimi/kimi-k2.5-thinking": {
+        "company": "Moonshot AI",
+        "label": "Kimi K2.5",
+        "description": null,
+        "release_date": "2026-01-26",
+        "open_source": true,
+        "documentation_url": "https://platform.moonshot.ai/docs",
+        "properties": {
+            "context_window": 262144,
+            "max_tokens": 128000,
+            "training_cutoff": null,
+            "reasoning_model": true
+        },
+        "supports": {
+            "images": true,
+            "files": false,
+            "temperature": false,
+            "tools": true
+        },
+        "metadata": {
+            "deprecated": false,
+            "available_for_everyone": true,
+            "available_as_evaluator": false,
+            "ignored_for_cost": false
+        },
+        "provider_properties": {},
+        "costs_per_million_token": {
+            "input": 0.6,
+            "output": 3.0,
+            "cache": {
+                "read": 0.1,
+                "write_markup": 1.0
+            }
+        },
+        "alternative_keys": [],
+        "default_parameters": {
+            "temperature": 1.0,
+            "top_p": 0.95
+        },
+        "provider_endpoint": "kimi-k2.5",
+        "provider_name": "kimi",
+        "full_key": "kimi/kimi-k2.5-thinking",
+        "slug": "kimi_kimi-k2.5-thinking"
+    },
+    "kimi/kimi-k2.5": {
+        "company": "Moonshot AI",
+        "label": "Kimi K2.5",
+        "description": null,
+        "release_date": "2026-01-26",
+        "open_source": true,
+        "documentation_url": "https://platform.moonshot.ai/docs",
+        "properties": {
+            "context_window": 262144,
+            "max_tokens": 128000,
+            "training_cutoff": null,
+            "reasoning_model": false
+        },
+        "supports": {
+            "images": true,
+            "files": false,
+            "temperature": false,
+            "tools": true
+        },
+        "metadata": {
+            "deprecated": false,
+            "available_for_everyone": true,
+            "available_as_evaluator": false,
+            "ignored_for_cost": false
+        },
+        "provider_properties": {},
+        "costs_per_million_token": {
+            "input": 0.6,
+            "output": 3.0,
+            "cache": {
+                "read": 0.1,
+                "write_markup": 1.0
+            }
+        },
+        "alternative_keys": [
+            {
+                "kimi/kimi-k2.5-thinking": {
+                    "properties": {
+                        "reasoning_model": true
+                    },
+                    "default_parameters": {
+                        "temperature": 1.0
+                    }
+                }
+            }
+        ],
+        "default_parameters": {
+            "temperature": 0.6,
+            "top_p": 0.95
+        },
+        "provider_endpoint": "kimi-k2.5",
+        "provider_name": "kimi",
+        "full_key": "kimi/kimi-k2.5",
+        "slug": "kimi_kimi-k2.5"
+    },
+    "alibaba/qwen3-max-2026-01-23": {
+        "company": "Alibaba",
+        "label": "Qwen 3 Max Thinking",
+        "description": "Qwen 3 Max with enhanced reasoning capabilities",
+        "release_date": "2026-01-23",
+        "open_source": false,
+        "properties": {
+            "context_window": 256000,
+            "max_tokens": 32000,
+            "training_cutoff": null,
+            "reasoning_model": true
+        },
+        "supports": {
+            "images": false,
+            "temperature": true,
+            "tools": true
+        },
+        "metadata": {
+            "deprecated": false,
+            "available_for_everyone": false,
+            "available_as_evaluator": false,
+            "ignored_for_cost": false
+        },
+        "provider_properties": {},
+        "costs_per_million_token": {
+            "input": 1.2,
+            "output": 6.0
+        },
+        "alternative_keys": [],
+        "default_parameters": {
+            "temperature": 0.7
+        },
+        "provider_endpoint": "qwen3-max-2026-01-23",
+        "provider_name": "alibaba",
+        "full_key": "alibaba/qwen3-max-2026-01-23",
+        "slug": "alibaba_qwen3-max-2026-01-23"
+    },
+    "zai/glm-4.7-flashx": {
+        "company": "zAI",
+        "label": "GLM 4.7 Flash",
+        "description": "z.AI lightweight fast model",
+        "release_date": "2026-01-19",
+        "open_source": true,
+        "documentation_url": "https://docs.z.ai/",
+        "properties": {
+            "context_window": 200000,
+            "max_tokens": 128000,
+            "training_cutoff": null,
+            "reasoning_model": true
+        },
+        "supports": {
+            "images": false,
+            "files": false,
+            "temperature": true,
+            "tools": true
+        },
+        "metadata": {
+            "deprecated": false,
+            "available_for_everyone": true,
+            "available_as_evaluator": false,
+            "ignored_for_cost": false
+        },
+        "provider_properties": {
+            "clear_thinking": false
+        },
+        "costs_per_million_token": {
+            "input": 0.07,
+            "output": 0.4,
+            "cache": {
+                "read": 0.01,
+                "read_discount": 1.0,
+                "write_markup": 1.0
+            }
+        },
+        "alternative_keys": [],
+        "default_parameters": {
+            "temperature": 1.0,
+            "top_p": 0.95
+        },
+        "provider_endpoint": "glm-4.7-flashx",
+        "provider_name": "zai",
+        "full_key": "zai/glm-4.7-flashx",
+        "slug": "zai_glm-4.7-flashx"
+    },
     "minimax/MiniMax-M2.1": {
         "company": "MiniMax",
         "label": "MiniMax-M2.1",
@@ -79,7 +262,9 @@
                 "write_markup": 1.0
             }
         },
-        "alternative_keys": [],
+        "alternative_keys": [
+            "vercel/zai/glm-4.7"
+        ],
         "default_parameters": {
             "temperature": 1.0,
             "top_p": 1.0
@@ -89,6 +274,94 @@
         "full_key": "zai/glm-4.7",
         "slug": "zai_glm-4.7"
     },
+    "vercel/zai/glm-4.7": {
+        "company": "zAI",
+        "label": "GLM 4.7",
+        "description": "Latest model from ZAI",
+        "release_date": "2025-12-22",
+        "open_source": true,
+        "documentation_url": "https://docs.z.ai/",
+        "properties": {
+            "context_window": 200000,
+            "max_tokens": 128000,
+            "training_cutoff": null,
+            "reasoning_model": true
+        },
+        "supports": {
+            "images": false,
+            "files": false,
+            "temperature": true,
+            "tools": true
+        },
+        "metadata": {
+            "deprecated": false,
+            "available_for_everyone": true,
+            "available_as_evaluator": false,
+            "ignored_for_cost": false
+        },
+        "provider_properties": {},
+        "costs_per_million_token": {
+            "input": 0.6,
+            "output": 2.2,
+            "cache": {
+                "read": 0.11,
+                "read_discount": 1.0,
+                "write_markup": 1.0
+            }
+        },
+        "alternative_keys": [],
+        "default_parameters": {
+            "temperature": 1.0,
+            "top_p": 1.0
+        },
+        "provider_endpoint": "zai/glm-4.7",
+        "provider_name": "vercel",
+        "full_key": "vercel/zai/glm-4.7",
+        "slug": "vercel_zai_glm-4.7"
+    },
+    "xiaomi/mimo-v2-flash": {
+        "company": "Xiaomi",
+        "label": "MiMo V2 Flash",
+        "description": "MiMo V2 Flash is Xiaomi's Mixture-of-Experts (MoE) language model with 309B total parameters and 15B active parameters. Designed for high-speed reasoning and agentic workflows, it utilizes a novel hybrid attention architecture and Multi-Token Prediction (MTP) to achieve state-of-the-art performance while significantly reducing inference costs.",
+        "release_date": "2025-12-17",
+        "open_source": true,
+        "documentation_url": "https://platform.xiaomimimo.com/#/docs/",
+        "properties": {
+            "context_window": 256000,
+            "max_tokens": 64000,
+            "training_cutoff": "December 2024"
+        },
+        "supports": {
+            "images": false,
+            "files": false,
+            "temperature": true,
+            "tools": true
+        },
+        "metadata": {
+            "deprecated": false,
+            "available_for_everyone": true,
+            "available_as_evaluator": false,
+            "ignored_for_cost": false
+        },
+        "provider_properties": {},
+        "costs_per_million_token": {
+            "input": 0.1,
+            "output": 0.3,
+            "cache": {
+                "read": 0.01,
+                "write_markup": 1.0
+            }
+        },
+        "alternative_keys": [],
+        "default_parameters": {
+            "temperature": 0.3,
+            "top_p": 0.95
+        },
+        "provider_endpoint": "mimo-v2-flash",
+        "provider_name": "xiaomi",
+        "full_key": "xiaomi/mimo-v2-flash",
+        "slug": "xiaomi_mimo-v2-flash"
+    },
     "google/gemini-3-flash-preview": {
         "company": "Google",
         "label": "Gemini 3 Flash (12/25)",
@@ -229,6 +502,54 @@
         "full_key": "openai/gpt-5.2-pro",
         "slug": "openai_gpt-5.2-pro"
     },
+    "openai/gpt-5.2-codex": {
+        "company": "OpenAI",
+        "label": "GPT 5.2 Codex",
+        "description": "GPT 5.2 optimized for code",
+        "release_date": "2025-12-11",
+        "open_source": false,
+        "documentation_url": "https://platform.openai.com/docs/models/gpt-5.2-codex",
+        "properties": {
+            "context_window": 400000,
+            "max_tokens": 128000,
+            "training_cutoff": "2024-09",
+            "reasoning_model": true
+        },
+        "supports": {
+            "images": true,
+            "files": true,
+            "batch": true,
+            "temperature": false,
+            "tools": true
+        },
+        "metadata": {
+            "deprecated": false,
+            "available_for_everyone": false,
+            "available_as_evaluator": false,
+            "ignored_for_cost": false
+        },
+        "provider_properties": {},
+        "costs_per_million_token": {
+            "input": 1.75,
+            "output": 14.0,
+            "cache": {
+                "read": 0.175,
+                "write_markup": 1.0
+            },
+            "batch": {
+                "input_discount": 0.5,
+                "output_discount": 0.5
+            }
+        },
+        "alternative_keys": [],
+        "default_parameters": {
+            "reasoning_effort": "high"
+        },
+        "provider_endpoint": "gpt-5.2-codex",
+        "provider_name": "openai",
+        "full_key": "openai/gpt-5.2-codex",
+        "slug": "openai_gpt-5.2-codex"
+    },
     "openai/gpt-5.2-2025-12-11": {
         "company": "OpenAI",
         "label": "GPT 5.2",
@@ -408,7 +729,7 @@
     "openai/gpt-5.1-codex-max": {
         "company": "OpenAI",
         "label": "GPT 5.1 Codex Max",
-        "description": "OpenAI's frontier agentic coding model. Good at long-running coding tasks.",
+        "description": "GPT 5.1 optimized for code",
         "release_date": "2025-12-04",
         "open_source": false,
         "documentation_url": "",
@@ -628,7 +949,9 @@
             "available_as_evaluator": false,
             "ignored_for_cost": false
         },
-        "provider_properties": {},
+        "provider_properties": {
+            "supports_compute_effort": true
+        },
         "costs_per_million_token": {
             "input": 5.0,
             "output": 25.0,
@@ -678,7 +1001,9 @@
             "available_as_evaluator": false,
             "ignored_for_cost": false
         },
-        "provider_properties": {},
+        "provider_properties": {
+            "supports_compute_effort": true
+        },
         "costs_per_million_token": {
             "input": 5.0,
             "output": 25.0,
@@ -921,7 +1246,7 @@
     "openai/gpt-5.1-codex": {
         "company": "OpenAI",
         "label": "GPT 5.1 Codex",
-        "description": "OpenAI's latest coding model",
+        "description": "GPT 5.1 optimized for code",
         "release_date": "2025-11-13",
         "open_source": false,
         "documentation_url": "https://platform.openai.com/docs/models/gpt-5.1-codex",
@@ -1015,7 +1340,7 @@
         "slug": "openai_gpt-5.1-2025-11-13"
     },
     "kimi/kimi-k2-thinking": {
-        "company": "Kimi",
+        "company": "Moonshot AI",
         "label": "Kimi K2 Thinking",
         "description": null,
         "release_date": "2025-11-06",
@@ -1025,7 +1350,7 @@
             "context_window": 256000,
             "max_tokens": 32000,
             "training_cutoff": null,
-            "reasoning_model": true
+            "reasoning_model": false
         },
         "supports": {
             "images": false,
@@ -1058,7 +1383,7 @@
             }
         ],
         "default_parameters": {
-            "temperature": 1.0
+            "temperature": 0.6
         },
         "provider_endpoint": "kimi-k2-thinking",
         "provider_name": "kimi",
@@ -1102,7 +1427,7 @@
         "slug": "inception_mercury"
     },
     "fireworks/kimi-k2-thinking": {
-        "company": "Kimi",
+        "company": "Moonshot AI",
         "label": "Kimi K2 Thinking",
         "description": null,
         "release_date": "2025-11-06",
@@ -1112,7 +1437,7 @@
             "context_window": 256000,
             "max_tokens": 32000,
             "training_cutoff": null,
-            "reasoning_model": true
+            "reasoning_model": false
         },
         "supports": {
             "images": false,
@@ -1136,7 +1461,7 @@
         },
         "alternative_keys": [],
         "default_parameters": {
-            "temperature": 1.0
+            "temperature": 0.6
         },
         "provider_endpoint": "kimi-k2-thinking",
         "provider_name": "fireworks",
@@ -1939,7 +2264,7 @@
             "temperature": true
         },
         "metadata": {
-            "deprecated": false,
+            "deprecated": true,
             "available_for_everyone": false,
             "available_as_evaluator": false,
             "ignored_for_cost": false
@@ -2021,16 +2346,7 @@
         "provider_properties": {},
         "costs_per_million_token": {
             "input": 1.2,
-            "output": 6.0,
-            "cache": {
-                "read_discount": 0.8,
-                "write_markup": 1.0
-            },
-            "context": {
-                "threshold": 32000.0,
-                "input": 2.4,
-                "output": 12.0
-            }
+            "output": 6.0
         },
         "alternative_keys": [],
         "default_parameters": {
@@ -2383,8 +2699,8 @@
         "properties": {
             "context_window": 262144,
             "max_tokens": 65536,
-            "training_cutoff": "",
-            "reasoning_model": false
+            "training_cutoff": null,
+            "reasoning_model": true
         },
         "supports": {
             "images": false,
@@ -3305,9 +3621,14 @@
         },
         "alternative_keys": [
             {
-                "costs_per_million_token": {
-                    "input": 0.55,
-                    "output": 2.19
+                "fireworks/glm-4p5": {
+                    "metadata": {
+                        "deprecated": true
+                    },
+                    "costs_per_million_token": {
+                        "input": 0.55,
+                        "output": 2.19
+                    }
                 }
             }
         ],
@@ -3385,15 +3706,15 @@
             "tools": true
         },
         "metadata": {
-            "deprecated": false,
+            "deprecated": true,
             "available_for_everyone": true,
             "available_as_evaluator": false,
             "ignored_for_cost": false
         },
         "provider_properties": {},
         "costs_per_million_token": {
-            "input": 0.6,
-            "output": 2.2,
+            "input": 0.55,
+            "output": 2.19,
             "cache": {
                 "read": 0.11,
                 "read_discount": 1.0,
@@ -3705,7 +4026,7 @@
             "tools": true
         },
         "metadata": {
-            "deprecated": false,
+            "deprecated": true,
             "available_for_everyone": true,
             "available_as_evaluator": false,
             "ignored_for_cost": false
@@ -4335,7 +4656,7 @@
             "tools": true
         },
         "metadata": {
-            "deprecated": false,
+            "deprecated": true,
             "available_for_everyone": true,
             "available_as_evaluator": false,
             "ignored_for_cost": false
@@ -12286,94 +12607,6 @@
         "full_key": "azure/gpt-4-turbo-2024-04-09",
         "slug": "azure_gpt-4-turbo-2024-04-09"
     },
-    "databricks/dbrx-instruct": {
-        "company": "Databricks",
-        "label": "DBRX Instruct",
-        "description": "Databricks Instruct model.",
-        "release_date": "2024-03-27",
-        "open_source": false,
-        "properties": {
-            "context_window": 32768,
-            "max_tokens": 4096,
-            "training_cutoff": "2023-12",
-            "reasoning_model": false
-        },
-        "supports": {
-            "images": false,
-            "files": false,
-            "batch": true,
-            "temperature": true,
-            "tools": true
-        },
-        "metadata": {
-            "deprecated": true,
-            "available_for_everyone": false,
-            "available_as_evaluator": false,
-            "ignored_for_cost": false
-        },
-        "provider_properties": {},
-        "costs_per_million_token": {
-            "input": 2.25,
-            "output": 6.75,
-            "batch": {
-                "input_discount": 0.5,
-                "output_discount": 0.5
-            }
-        },
-        "alternative_keys": [],
-        "default_parameters": {
-            "reasoning_effort": "high"
-        },
-        "provider_endpoint": "databricks-dbrx-instruct",
-        "provider_name": "databricks",
-        "full_key": "databricks/dbrx-instruct",
-        "slug": "databricks_dbrx-instruct"
-    },
-    "databricks/databricks-dbrx-instruct": {
-        "company": "Databricks",
-        "label": "DBRX Instruct",
-        "description": "Databricks Instruct model.",
-        "release_date": "2024-03-27",
-        "open_source": false,
-        "properties": {
-            "context_window": 32768,
-            "max_tokens": 4096,
-            "training_cutoff": "2023-12",
-            "reasoning_model": false
-        },
-        "supports": {
-            "images": false,
-            "files": false,
-            "batch": true,
-            "temperature": true,
-            "tools": true
-        },
-        "metadata": {
-            "deprecated": true,
-            "available_for_everyone": false,
-            "available_as_evaluator": false,
-            "ignored_for_cost": false
-        },
-        "provider_properties": {},
-        "costs_per_million_token": {
-            "input": 2.25,
-            "output": 6.75,
-            "batch": {
-                "input_discount": 0.5,
-                "output_discount": 0.5
-            }
-        },
-        "alternative_keys": [
-            "databricks/dbrx-instruct"
-        ],
-        "default_parameters": {
-            "reasoning_effort": "high"
-        },
-        "provider_endpoint": "databricks-dbrx-instruct",
-        "provider_name": "databricks",
-        "full_key": "databricks/databricks-dbrx-instruct",
-        "slug": "databricks_databricks-dbrx-instruct"
-    },
     "cohere/command-r-03-2024": {
         "company": "Cohere",
         "label": "Command R (03/2024)",

model_library/config/anthropic_models.yaml CHANGED Viewed

@@ -22,7 +22,6 @@ base-config:
   documentation_url: https://docs.claude.com/en/docs/about-claude/models/overview
   default_parameters:
     temperature: 1
 claude-4-models:
   base-config:
     supports:
@@ -40,6 +39,8 @@ claude-4-models:
       cache:
         read: 0.5
         write: 6.25
+    provider_properties:
+      supports_compute_effort: true
     alternative_keys:
       - anthropic/claude-opus-4-5-20251101-thinking:
           properties:

model_library/config/kimi_models.yaml CHANGED Viewed

@@ -1,5 +1,5 @@
 base-config:
-  company: Kimi
+  company: Moonshot AI
   documentation_url: https://platform.moonshot.ai/docs
   open_source: true
   supports:
@@ -11,16 +11,43 @@ base-config:
     available_for_everyone: true
     ignored_for_cost: false
+kimi-k2.5-models:
+  kimi/kimi-k2.5:
+    label: Kimi K2.5
+    release_date: 2026-01-26
+    supports:
+      images: true
+      temperature: false
+    properties:
+      reasoning_model: false
+      context_window: 262_144
+      max_tokens: 128_000
+    default_parameters:
+      temperature: 0.6
+      top_p: 0.95
+    costs_per_million_token:
+      input: 0.6
+      output: 3.0
+      cache:
+        read: 0.1
+    alternative_keys:
+      - kimi/kimi-k2.5-thinking:
+          properties:
+            reasoning_model: true
+          default_parameters:
+            temperature: 1.0
 kimi-k2-models:
   kimi/kimi-k2-thinking:
     label: Kimi K2 Thinking
     release_date: 2025-11-06
     properties:
-      reasoning_model: true
+      reasoning_model: false
       context_window: 256_000
       max_tokens: 32_000
     default_parameters:
-      temperature: 1.0
+      temperature: 0.6
     costs_per_million_token:
       input: 0.6
       output: 2.5

model-library 0.1.7__py3-none-any.whl → 0.1.9__py3-none-any.whl

model-library 0.1.7__py3-none-any.whl → 0.1.9__py3-none-any.whl