lm-deluge 0.0.67__py3-none-any.whl → 0.0.90__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of lm-deluge might be problematic. Click here for more details.

Files changed (108)
  1. lm_deluge/__init__.py +1 -2
  2. lm_deluge/api_requests/anthropic.py +117 -22
  3. lm_deluge/api_requests/base.py +84 -11
  4. lm_deluge/api_requests/bedrock.py +30 -6
  5. lm_deluge/api_requests/chat_reasoning.py +4 -0
  6. lm_deluge/api_requests/gemini.py +166 -20
  7. lm_deluge/api_requests/openai.py +145 -25
  8. lm_deluge/batches.py +15 -45
  9. lm_deluge/client.py +309 -50
  10. lm_deluge/config.py +15 -3
  11. lm_deluge/models/__init__.py +14 -1
  12. lm_deluge/models/anthropic.py +29 -14
  13. lm_deluge/models/arcee.py +16 -0
  14. lm_deluge/models/deepseek.py +36 -4
  15. lm_deluge/models/google.py +42 -0
  16. lm_deluge/models/grok.py +24 -0
  17. lm_deluge/models/kimi.py +36 -0
  18. lm_deluge/models/minimax.py +18 -0
  19. lm_deluge/models/openai.py +100 -0
  20. lm_deluge/models/openrouter.py +133 -7
  21. lm_deluge/models/together.py +11 -0
  22. lm_deluge/models/zai.py +50 -0
  23. lm_deluge/pipelines/gepa/__init__.py +95 -0
  24. lm_deluge/pipelines/gepa/core.py +354 -0
  25. lm_deluge/pipelines/gepa/docs/samples.py +705 -0
  26. lm_deluge/pipelines/gepa/examples/01_synthetic_keywords.py +140 -0
  27. lm_deluge/pipelines/gepa/examples/02_gsm8k_math.py +261 -0
  28. lm_deluge/pipelines/gepa/examples/03_hotpotqa_multihop.py +300 -0
  29. lm_deluge/pipelines/gepa/examples/04_batch_classification.py +271 -0
  30. lm_deluge/pipelines/gepa/examples/simple_qa.py +129 -0
  31. lm_deluge/pipelines/gepa/optimizer.py +435 -0
  32. lm_deluge/pipelines/gepa/proposer.py +235 -0
  33. lm_deluge/pipelines/gepa/util.py +165 -0
  34. lm_deluge/{llm_tools → pipelines}/score.py +2 -2
  35. lm_deluge/{llm_tools → pipelines}/translate.py +5 -3
  36. lm_deluge/prompt.py +537 -88
  37. lm_deluge/request_context.py +7 -2
  38. lm_deluge/server/__init__.py +24 -0
  39. lm_deluge/server/__main__.py +144 -0
  40. lm_deluge/server/adapters.py +369 -0
  41. lm_deluge/server/app.py +388 -0
  42. lm_deluge/server/auth.py +71 -0
  43. lm_deluge/server/model_policy.py +215 -0
  44. lm_deluge/server/models_anthropic.py +172 -0
  45. lm_deluge/server/models_openai.py +175 -0
  46. lm_deluge/tool/__init__.py +1130 -0
  47. lm_deluge/tool/builtin/anthropic/__init__.py +300 -0
  48. lm_deluge/tool/builtin/anthropic/bash.py +0 -0
  49. lm_deluge/tool/builtin/anthropic/computer_use.py +0 -0
  50. lm_deluge/tool/builtin/gemini.py +59 -0
  51. lm_deluge/tool/builtin/openai.py +74 -0
  52. lm_deluge/tool/cua/__init__.py +173 -0
  53. lm_deluge/tool/cua/actions.py +148 -0
  54. lm_deluge/tool/cua/base.py +27 -0
  55. lm_deluge/tool/cua/batch.py +215 -0
  56. lm_deluge/tool/cua/converters.py +466 -0
  57. lm_deluge/tool/cua/kernel.py +702 -0
  58. lm_deluge/tool/cua/trycua.py +989 -0
  59. lm_deluge/tool/prefab/__init__.py +45 -0
  60. lm_deluge/tool/prefab/batch_tool.py +156 -0
  61. lm_deluge/tool/prefab/docs.py +1119 -0
  62. lm_deluge/tool/prefab/email.py +294 -0
  63. lm_deluge/tool/prefab/filesystem.py +1711 -0
  64. lm_deluge/tool/prefab/full_text_search/__init__.py +285 -0
  65. lm_deluge/tool/prefab/full_text_search/tantivy_index.py +396 -0
  66. lm_deluge/tool/prefab/memory.py +458 -0
  67. lm_deluge/tool/prefab/otc/__init__.py +165 -0
  68. lm_deluge/tool/prefab/otc/executor.py +281 -0
  69. lm_deluge/tool/prefab/otc/parse.py +188 -0
  70. lm_deluge/tool/prefab/random.py +212 -0
  71. lm_deluge/tool/prefab/rlm/__init__.py +296 -0
  72. lm_deluge/tool/prefab/rlm/executor.py +349 -0
  73. lm_deluge/tool/prefab/rlm/parse.py +144 -0
  74. lm_deluge/tool/prefab/sandbox/__init__.py +19 -0
  75. lm_deluge/tool/prefab/sandbox/daytona_sandbox.py +483 -0
  76. lm_deluge/tool/prefab/sandbox/docker_sandbox.py +609 -0
  77. lm_deluge/tool/prefab/sandbox/fargate_sandbox.py +546 -0
  78. lm_deluge/tool/prefab/sandbox/modal_sandbox.py +469 -0
  79. lm_deluge/tool/prefab/sandbox/seatbelt_sandbox.py +827 -0
  80. lm_deluge/tool/prefab/sheets.py +385 -0
  81. lm_deluge/tool/prefab/skills.py +0 -0
  82. lm_deluge/tool/prefab/subagents.py +233 -0
  83. lm_deluge/tool/prefab/todos.py +342 -0
  84. lm_deluge/tool/prefab/tool_search.py +169 -0
  85. lm_deluge/tool/prefab/web_search.py +199 -0
  86. lm_deluge/tracker.py +16 -13
  87. lm_deluge/util/schema.py +412 -0
  88. lm_deluge/warnings.py +8 -0
  89. {lm_deluge-0.0.67.dist-info → lm_deluge-0.0.90.dist-info}/METADATA +23 -9
  90. lm_deluge-0.0.90.dist-info/RECORD +132 -0
  91. lm_deluge/built_in_tools/anthropic/__init__.py +0 -128
  92. lm_deluge/built_in_tools/openai.py +0 -28
  93. lm_deluge/presets/cerebras.py +0 -17
  94. lm_deluge/presets/meta.py +0 -13
  95. lm_deluge/tool.py +0 -849
  96. lm_deluge-0.0.67.dist-info/RECORD +0 -72
  97. lm_deluge/{llm_tools → pipelines}/__init__.py +1 -1
  98. /lm_deluge/{llm_tools → pipelines}/classify.py +0 -0
  99. /lm_deluge/{llm_tools → pipelines}/extract.py +0 -0
  100. /lm_deluge/{llm_tools → pipelines}/locate.py +0 -0
  101. /lm_deluge/{llm_tools → pipelines}/ocr.py +0 -0
  102. /lm_deluge/{built_in_tools/anthropic/bash.py → skills/anthropic.py} +0 -0
  103. /lm_deluge/{built_in_tools/anthropic/computer_use.py → skills/compat.py} +0 -0
  104. /lm_deluge/{built_in_tools → tool/builtin}/anthropic/editor.py +0 -0
  105. /lm_deluge/{built_in_tools → tool/builtin}/base.py +0 -0
  106. {lm_deluge-0.0.67.dist-info → lm_deluge-0.0.90.dist-info}/WHEEL +0 -0
  107. {lm_deluge-0.0.67.dist-info → lm_deluge-0.0.90.dist-info}/licenses/LICENSE +0 -0
  108. {lm_deluge-0.0.67.dist-info → lm_deluge-0.0.90.dist-info}/top_level.txt +0 -0
@@ -4,9 +4,10 @@ import random
4
4
  from dataclasses import dataclass, field
5
5
 
6
6
  from ..request_context import RequestContext
7
+ from .anthropic import ANTHROPIC_MODELS
7
8
 
8
9
  # Import and register all provider models
9
- from .anthropic import ANTHROPIC_MODELS
10
+ from .arcee import ARCEE_MODELS
10
11
  from .bedrock import BEDROCK_MODELS
11
12
  from .cerebras import CEREBRAS_MODELS
12
13
  from .cohere import COHERE_MODELS
@@ -15,11 +16,14 @@ from .fireworks import FIREWORKS_MODELS
15
16
  from .google import GOOGLE_MODELS
16
17
  from .grok import XAI_MODELS
17
18
  from .groq import GROQ_MODELS
19
+ from .kimi import KIMI_MODELS
18
20
  from .meta import META_MODELS
21
+ from .minimax import MINIMAX_MODELS
19
22
  from .mistral import MISTRAL_MODELS
20
23
  from .openai import OPENAI_MODELS
21
24
  from .openrouter import OPENROUTER_MODELS
22
25
  from .together import TOGETHER_MODELS
26
+ from .zai import ZAI_MODELS
23
27
 
24
28
 
25
29
  @dataclass
@@ -37,6 +41,9 @@ class APIModel:
37
41
  supports_logprobs: bool = False
38
42
  supports_responses: bool = False
39
43
  reasoning_model: bool = False
44
+ supports_xhigh: bool = (
45
+ False # supports xhigh reasoning_effort (gpt-5.2, gpt-5.1-codex-max)
46
+ )
40
47
  regions: list[str] | dict[str, int] = field(default_factory=list)
41
48
  # tokens_per_minute: int | None = None
42
49
  # requests_per_minute: int | None = None
@@ -96,6 +103,7 @@ def register_model(
96
103
  supports_logprobs: bool = False,
97
104
  supports_responses: bool = False,
98
105
  reasoning_model: bool = False,
106
+ supports_xhigh: bool = False,
99
107
  regions: list[str] | dict[str, int] = field(default_factory=list),
100
108
  # tokens_per_minute: int | None = None,
101
109
  # requests_per_minute: int | None = None,
@@ -115,6 +123,7 @@ def register_model(
115
123
  supports_logprobs=supports_logprobs,
116
124
  supports_responses=supports_responses,
117
125
  reasoning_model=reasoning_model,
126
+ supports_xhigh=supports_xhigh,
118
127
  regions=regions,
119
128
  # tokens_per_minute=tokens_per_minute,
120
129
  # requests_per_minute=requests_per_minute,
@@ -126,13 +135,17 @@ def register_model(
126
135
  # Register all models from all providers
127
136
  for model_dict in [
128
137
  ANTHROPIC_MODELS,
138
+ ZAI_MODELS,
139
+ ARCEE_MODELS,
129
140
  BEDROCK_MODELS,
130
141
  COHERE_MODELS,
131
142
  DEEPSEEK_MODELS,
132
143
  FIREWORKS_MODELS,
133
144
  GOOGLE_MODELS,
134
145
  XAI_MODELS,
146
+ KIMI_MODELS,
135
147
  META_MODELS,
148
+ MINIMAX_MODELS,
136
149
  MISTRAL_MODELS,
137
150
  OPENAI_MODELS,
138
151
  OPENROUTER_MODELS,
@@ -10,6 +10,19 @@ ANTHROPIC_MODELS = {
10
10
  # ░███
11
11
  # █████
12
12
  #
13
+ "claude-4.5-opus": {
14
+ "id": "claude-4.5-opus",
15
+ "name": "claude-opus-4-5-20251101",
16
+ "api_base": "https://api.anthropic.com/v1",
17
+ "api_key_env_var": "ANTHROPIC_API_KEY",
18
+ "supports_json": False,
19
+ "api_spec": "anthropic",
20
+ "input_cost": 5.0,
21
+ "cached_input_cost": 0.50,
22
+ "cache_write_cost": 6.25,
23
+ "output_cost": 25.0,
24
+ "reasoning_model": True,
25
+ },
13
26
  "claude-4.5-haiku": {
14
27
  "id": "claude-4.5-haiku",
15
28
  "name": "claude-haiku-4-5-20251001",
@@ -21,25 +34,27 @@ ANTHROPIC_MODELS = {
21
34
  "cached_input_cost": 0.10,
22
35
  "cache_write_cost": 1.25,
23
36
  "output_cost": 3.0,
37
+ "reasoning_model": True,
24
38
  },
25
39
  "claude-4.5-sonnet": {
26
40
  "id": "claude-4.5-sonnet",
27
41
  "name": "claude-sonnet-4-5-20250929",
28
42
  "api_base": "https://api.anthropic.com/v1",
29
43
  "api_key_env_var": "ANTHROPIC_API_KEY",
30
- "supports_json": False,
44
+ "supports_json": True,
31
45
  "api_spec": "anthropic",
32
46
  "input_cost": 3.0,
33
47
  "cached_input_cost": 0.30,
34
48
  "cache_write_cost": 3.75,
35
49
  "output_cost": 15.0,
50
+ "reasoning_model": True,
36
51
  },
37
52
  "claude-4.1-opus": {
38
53
  "id": "claude-4.1-opus",
39
54
  "name": "claude-opus-4-1-20250805",
40
55
  "api_base": "https://api.anthropic.com/v1",
41
56
  "api_key_env_var": "ANTHROPIC_API_KEY",
42
- "supports_json": False,
57
+ "supports_json": True,
43
58
  "api_spec": "anthropic",
44
59
  "input_cost": 15.0,
45
60
  "cached_input_cost": 1.50,
@@ -97,18 +112,18 @@ ANTHROPIC_MODELS = {
97
112
  "cache_write_cost": 3.75,
98
113
  "output_cost": 15.0,
99
114
  },
100
- "claude-3.5-sonnet": {
101
- "id": "claude-3.5-sonnet",
102
- "name": "claude-3-5-sonnet-20240620",
103
- "api_base": "https://api.anthropic.com/v1",
104
- "api_key_env_var": "ANTHROPIC_API_KEY",
105
- "supports_json": False,
106
- "api_spec": "anthropic",
107
- "input_cost": 3.0,
108
- "cached_input_cost": 0.30,
109
- "cache_write_cost": 3.75,
110
- "output_cost": 15.0,
111
- },
115
+ # "claude-3.5-sonnet": {
116
+ # "id": "claude-3.5-sonnet",
117
+ # "name": "claude-3-5-sonnet-20240620",
118
+ # "api_base": "https://api.anthropic.com/v1",
119
+ # "api_key_env_var": "ANTHROPIC_API_KEY",
120
+ # "supports_json": False,
121
+ # "api_spec": "anthropic",
122
+ # "input_cost": 3.0,
123
+ # "cached_input_cost": 0.30,
124
+ # "cache_write_cost": 3.75,
125
+ # "output_cost": 15.0,
126
+ # },
112
127
  "claude-3-opus": {
113
128
  "id": "claude-3-opus",
114
129
  "name": "claude-3-opus-20240229",
@@ -0,0 +1,16 @@
1
+ ARCEE_MODELS = {
2
+ "trinity-mini": {
3
+ "id": "trinity-mini",
4
+ "name": "trinity-mini",
5
+ "api_base": "https://api.arcee.ai/api/v1",
6
+ "api_key_env_var": "ARCEE_API_KEY",
7
+ "supports_json": True,
8
+ "supports_logprobs": False,
9
+ "supports_responses": False,
10
+ "api_spec": "openai",
11
+ "input_cost": 0.045,
12
+ "cached_input_cost": 0.045,
13
+ "output_cost": 0.15,
14
+ "reasoning_model": True,
15
+ }
16
+ }
@@ -12,8 +12,9 @@ DEEPSEEK_MODELS = {
12
12
  "api_base": "https://api.deepseek.com/v1",
13
13
  "api_key_env_var": "DEEPSEEK_API_KEY",
14
14
  "api_spec": "openai",
15
- "input_cost": 0.27,
16
- "output_cost": 1.10,
15
+ "input_cost": 0.28,
16
+ "cached_input_cost": 0.028,
17
+ "output_cost": 0.42,
17
18
  },
18
19
  "deepseek-r1": {
19
20
  "id": "deepseek-r1",
@@ -21,7 +22,38 @@ DEEPSEEK_MODELS = {
21
22
  "api_base": "https://api.deepseek.com/v1",
22
23
  "api_key_env_var": "DEEPSEEK_API_KEY",
23
24
  "api_spec": "openai",
24
- "input_cost": 0.55,
25
- "output_cost": 2.19,
25
+ "input_cost": 0.28,
26
+ "cached_input_cost": 0.028,
27
+ "output_cost": 0.42,
28
+ },
29
+ "deepseek-reasoner": {
30
+ "id": "deepseek-reasoner",
31
+ "name": "deepseek-reasoner",
32
+ "api_base": "https://api.deepseek.com/v1",
33
+ "api_key_env_var": "DEEPSEEK_API_KEY",
34
+ "api_spec": "openai",
35
+ "input_cost": 0.28,
36
+ "cached_input_cost": 0.028,
37
+ "output_cost": 0.42,
38
+ },
39
+ "deepseek-reasoner-anthropic-compat": {
40
+ "id": "deepseek-reasoner-anthropic-compat",
41
+ "name": "deepseek-reasoner",
42
+ "api_base": "https://api.deepseek.com/anthropic",
43
+ "api_key_env_var": "DEEPSEEK_API_KEY",
44
+ "api_spec": "anthropic",
45
+ "input_cost": 0.28,
46
+ "cached_input_cost": 0.028,
47
+ "output_cost": 0.42,
48
+ },
49
+ "deepseek-speciale": {
50
+ "id": "deepseek-speciale",
51
+ "name": "deepseek-reasoner",
52
+ "api_base": "https://api.deepseek.com/v3.2_speciale_expires_on_20251215/v1",
53
+ "api_key_env_var": "DEEPSEEK_API_KEY",
54
+ "api_spec": "openai",
55
+ "input_cost": 0.28,
56
+ "cached_input_cost": 0.028,
57
+ "output_cost": 0.42,
26
58
  },
27
59
  }
@@ -138,4 +138,46 @@ GOOGLE_MODELS = {
138
138
  "output_cost": 0.4,
139
139
  "reasoning_model": True,
140
140
  },
141
+ # Gemini 3 models - advanced reasoning with thought signatures
142
+ "gemini-3-pro-preview": {
143
+ "id": "gemini-3-pro-preview",
144
+ "name": "gemini-3-pro-preview",
145
+ "api_base": "https://generativelanguage.googleapis.com/v1alpha",
146
+ "api_key_env_var": "GEMINI_API_KEY",
147
+ "supports_json": True,
148
+ "supports_logprobs": False,
149
+ "api_spec": "gemini",
150
+ "input_cost": 2.0, # <200k tokens
151
+ "cached_input_cost": 0.5, # estimated
152
+ "output_cost": 12.0, # <200k tokens
153
+ # Note: >200k tokens pricing is $4/$18 per million
154
+ "reasoning_model": True,
155
+ },
156
+ "gemini-3-flash-preview": {
157
+ "id": "gemini-3-flash-preview",
158
+ "name": "gemini-3-flash-preview",
159
+ "api_base": "https://generativelanguage.googleapis.com/v1alpha",
160
+ "api_key_env_var": "GEMINI_API_KEY",
161
+ "supports_json": True,
162
+ "supports_logprobs": False,
163
+ "api_spec": "gemini",
164
+ "input_cost": 0.5,
165
+ "cached_input_cost": 0.125, # estimated
166
+ "output_cost": 3.0,
167
+ "reasoning_model": True,
168
+ },
169
+ # Gemini 2.5 Computer Use model
170
+ "gemini-2.5-computer-use": {
171
+ "id": "gemini-2.5-computer-use",
172
+ "name": "gemini-2.5-computer-use-preview-10-2025",
173
+ "api_base": "https://generativelanguage.googleapis.com/v1beta",
174
+ "api_key_env_var": "GEMINI_API_KEY",
175
+ "supports_json": True,
176
+ "supports_logprobs": False,
177
+ "api_spec": "gemini",
178
+ "input_cost": 1.25, # same as gemini-2.5-pro for now
179
+ "cached_input_cost": 0.31,
180
+ "output_cost": 10.0,
181
+ "reasoning_model": True,
182
+ },
141
183
  }
lm_deluge/models/grok.py CHANGED
@@ -7,6 +7,30 @@ XAI_MODELS = {
7
7
  # 888 888 888 888 888 888888K
8
8
  # Y88b d88P 888 Y88..88P 888 "88b
9
9
  # "Y8888P88 888 "Y88P" 888 888
10
+ "grok-4.1-fast-reasoning": {
11
+ "id": "grok-4.1-fast-reasoning",
12
+ "name": "grok-4-1-fast-reasoning",
13
+ "api_base": "https://api.x.ai/v1",
14
+ "api_key_env_var": "GROK_API_KEY",
15
+ "supports_json": True,
16
+ "supports_logprobs": True,
17
+ "api_spec": "openai",
18
+ "input_cost": 0.2,
19
+ "output_cost": 1.5,
20
+ "reasoning_model": False,
21
+ },
22
+ "grok-4.1-fast": {
23
+ "id": "grok-4.1-fast",
24
+ "name": "grok-4-1-fast-non-reasoning",
25
+ "api_base": "https://api.x.ai/v1",
26
+ "api_key_env_var": "GROK_API_KEY",
27
+ "supports_json": True,
28
+ "supports_logprobs": True,
29
+ "api_spec": "openai",
30
+ "input_cost": 0.2,
31
+ "output_cost": 1.5,
32
+ "reasoning_model": False,
33
+ },
10
34
  "grok-code-fast-1": {
11
35
  "id": "grok-code-fast-1",
12
36
  "name": "grok-code-fast-1",
@@ -0,0 +1,36 @@
1
+ KIMI_MODELS = {
2
+ "kimi-k2": {
3
+ "id": "kimi-k2",
4
+ "name": "kimi-k2-0905-preview",
5
+ "api_base": "https://api.moonshot.ai/anthropic/v1",
6
+ "api_key_env_var": "MOONSHOT_API_KEY",
7
+ "supports_json": True,
8
+ "api_spec": "anthropic",
9
+ },
10
+ "kimi-k2-turbo": {
11
+ "id": "kimi-k2-turbo",
12
+ "name": "kimi-k2-turbo-preview",
13
+ "api_base": "https://api.moonshot.ai/anthropic/v1",
14
+ "api_key_env_var": "MOONSHOT_API_KEY",
15
+ "supports_json": True,
16
+ "api_spec": "anthropic",
17
+ },
18
+ "kimi-k2-thinking": {
19
+ "id": "kimi-k2-thinking",
20
+ "name": "kimi-k2-thinking",
21
+ "api_base": "https://api.moonshot.ai/anthropic/v1",
22
+ "api_key_env_var": "MOONSHOT_API_KEY",
23
+ "supports_json": True,
24
+ "api_spec": "anthropic",
25
+ "reasoning_model": True,
26
+ },
27
+ "kimi-k2-thinking-turbo": {
28
+ "id": "kimi-k2-thinking-turbo",
29
+ "name": "kimi-k2-thinking-turbo",
30
+ "api_base": "https://api.moonshot.ai/anthropic/v1",
31
+ "api_key_env_var": "MOONSHOT_API_KEY",
32
+ "supports_json": True,
33
+ "api_spec": "anthropic",
34
+ "reasoning_model": True,
35
+ },
36
+ }
@@ -0,0 +1,18 @@
1
+ MINIMAX_MODELS = {
2
+ "minimax-m2.1": {
3
+ "id": "minimax-m2.1",
4
+ "name": "MiniMax-M2.1",
5
+ "api_base": "https://api.minimax.io/anthropic/v1",
6
+ "api_key_env_var": "MINIMAX_API_KEY",
7
+ "supports_json": False,
8
+ "api_spec": "anthropic",
9
+ },
10
+ "minimax-m2": {
11
+ "id": "minimax-m2",
12
+ "name": "MiniMax-M2",
13
+ "api_base": "https://api.minimax.io/anthropic/v1",
14
+ "api_key_env_var": "MINIMAX_API_KEY",
15
+ "supports_json": False,
16
+ "api_spec": "anthropic",
17
+ },
18
+ }
@@ -10,6 +10,78 @@ OPENAI_MODELS = {
10
10
  # ░███
11
11
  # █████
12
12
  # ░░░░░
13
+ "gpt-5.2": {
14
+ "id": "gpt-5.2",
15
+ "name": "gpt-5.2",
16
+ "api_base": "https://api.openai.com/v1",
17
+ "api_key_env_var": "OPENAI_API_KEY",
18
+ "supports_json": True,
19
+ "supports_logprobs": False,
20
+ "supports_responses": True,
21
+ "api_spec": "openai",
22
+ "input_cost": 1.75,
23
+ "cached_input_cost": 0.175,
24
+ "output_cost": 14.0,
25
+ "reasoning_model": True,
26
+ "supports_xhigh": True,
27
+ },
28
+ "gpt-5.1-codex-max": {
29
+ "id": "gpt-5.1-codex-max",
30
+ "name": "gpt-5.1-codex-max",
31
+ "api_base": "https://api.openai.com/v1",
32
+ "api_key_env_var": "OPENAI_API_KEY",
33
+ "supports_json": True,
34
+ "supports_logprobs": False,
35
+ "supports_responses": True,
36
+ "api_spec": "openai",
37
+ "input_cost": 1.25,
38
+ "cached_input_cost": 0.125,
39
+ "output_cost": 10.0,
40
+ "reasoning_model": True,
41
+ "supports_xhigh": True,
42
+ },
43
+ "gpt-5.1": {
44
+ "id": "gpt-5.1",
45
+ "name": "gpt-5.1",
46
+ "api_base": "https://api.openai.com/v1",
47
+ "api_key_env_var": "OPENAI_API_KEY",
48
+ "supports_json": True,
49
+ "supports_logprobs": True,
50
+ "supports_responses": True,
51
+ "api_spec": "openai",
52
+ "input_cost": 1.25,
53
+ "cached_input_cost": 0.125,
54
+ "output_cost": 10.0,
55
+ "reasoning_model": True,
56
+ },
57
+ "gpt-5.1-codex": {
58
+ "id": "gpt-5.1-codex",
59
+ "name": "gpt-5.1-codex",
60
+ "api_base": "https://api.openai.com/v1",
61
+ "api_key_env_var": "OPENAI_API_KEY",
62
+ "supports_json": False,
63
+ "supports_logprobs": True,
64
+ "supports_responses": True,
65
+ "api_spec": "openai",
66
+ "input_cost": 1.25,
67
+ "cached_input_cost": 0.125,
68
+ "output_cost": 10.0,
69
+ "reasoning_model": True,
70
+ },
71
+ "gpt-5.1-codex-mini": {
72
+ "id": "gpt-5.1-codex-mini",
73
+ "name": "gpt-5.1-codex-mini",
74
+ "api_base": "https://api.openai.com/v1",
75
+ "api_key_env_var": "OPENAI_API_KEY",
76
+ "supports_json": False,
77
+ "supports_logprobs": True,
78
+ "supports_responses": True,
79
+ "api_spec": "openai",
80
+ "input_cost": 0.25,
81
+ "cached_input_cost": 0.025,
82
+ "output_cost": 2.0,
83
+ "reasoning_model": True,
84
+ },
13
85
  "gpt-5-codex": {
14
86
  "id": "gpt-5-codex",
15
87
  "name": "gpt-5-codex",
@@ -107,6 +179,34 @@ OPENAI_MODELS = {
107
179
  "output_cost": 6.0,
108
180
  "reasoning_model": True,
109
181
  },
182
+ "o4-mini-deep-research": {
183
+ "id": "o4-mini-deep-research",
184
+ "name": "o4-mini-deep-research",
185
+ "api_base": "https://api.openai.com/v1",
186
+ "api_key_env_var": "OPENAI_API_KEY",
187
+ "supports_json": True,
188
+ "supports_logprobs": False,
189
+ "supports_responses": True,
190
+ "api_spec": "openai",
191
+ "input_cost": 2,
192
+ "cached_input_cost": 0.5,
193
+ "output_cost": 8.0,
194
+ "reasoning_model": True,
195
+ },
196
+ "o3-deep-research": {
197
+ "id": "o3-deep-research",
198
+ "name": "o3-deep-research",
199
+ "api_base": "https://api.openai.com/v1",
200
+ "api_key_env_var": "OPENAI_API_KEY",
201
+ "supports_json": True,
202
+ "supports_logprobs": False,
203
+ "supports_responses": True,
204
+ "api_spec": "openai",
205
+ "input_cost": 10,
206
+ "cached_input_cost": 2.50,
207
+ "output_cost": 40.0,
208
+ "reasoning_model": True,
209
+ },
110
210
  "o3": {
111
211
  "id": "o3",
112
212
  "name": "o3-2025-04-16",
@@ -1,13 +1,25 @@
1
1
  OPENROUTER_MODELS = {
2
+ "intellect-3-openrouter": {
3
+ "id": "intellect-3-openrouter",
4
+ "name": "prime-intellect/intellect-3",
5
+ "api_base": "https://openrouter.ai/api/v1",
6
+ "api_key_env_var": "OPENROUTER_API_KEY",
7
+ "supports_json": True,
8
+ "api_spec": "openai",
9
+ "input_cost": 0.2,
10
+ "cached_input_cost": 0.2,
11
+ "cache_write_cost": 0.2,
12
+ "output_cost": 1.10,
13
+ },
2
14
  "glm-4.6-openrouter": {
3
15
  "id": "glm-4.6-openrouter",
4
- "name": "z-ai/glm-4.6",
16
+ "name": "z-ai/glm-4.6:exacto",
5
17
  "api_base": "https://openrouter.ai/api/v1",
6
18
  "api_key_env_var": "OPENROUTER_API_KEY",
7
19
  "supports_json": True,
8
20
  "api_spec": "openai",
9
21
  "input_cost": 0.6,
10
- "cached_input_cost": 0.11,
22
+ "cached_input_cost": 0.6,
11
23
  "cache_write_cost": 0.6,
12
24
  "output_cost": 2.20,
13
25
  },
@@ -35,9 +47,21 @@ OPENROUTER_MODELS = {
35
47
  "cache_write_cost": 0.23,
36
48
  "output_cost": 0.9,
37
49
  },
50
+ "deepseek-3.2-exp-openrouter": {
51
+ "id": "deepseek-3.2-exp-openrouter",
52
+ "name": "deepseek/deepseek-v3.2-exp",
53
+ "api_base": "https://openrouter.ai/api/v1",
54
+ "api_key_env_var": "OPENROUTER_API_KEY",
55
+ "supports_json": True,
56
+ "api_spec": "openai",
57
+ "input_cost": 0.27,
58
+ "cached_input_cost": 0.27,
59
+ "cache_write_cost": 0.27,
60
+ "output_cost": 0.4,
61
+ },
38
62
  "deepseek-3.2-openrouter": {
39
63
  "id": "deepseek-3.2-openrouter",
40
- "name": "deepseek/deepseek-v3.2-exp",
64
+ "name": "deepseek/deepseek-v3.2",
41
65
  "api_base": "https://openrouter.ai/api/v1",
42
66
  "api_key_env_var": "OPENROUTER_API_KEY",
43
67
  "supports_json": True,
@@ -47,18 +71,120 @@ OPENROUTER_MODELS = {
47
71
  "cache_write_cost": 0.27,
48
72
  "output_cost": 0.4,
49
73
  },
50
- # "gpt-oss-20b-openrouter": {},
51
- # "gpt-oss-120b-openrouter": {},
74
+ "gpt-oss-20b-openrouter": {
75
+ "id": "gpt-oss-20b-openrouter",
76
+ "name": "openai/gpt-oss-20b",
77
+ "api_base": "https://openrouter.ai/api/v1",
78
+ "api_key_env_var": "OPENROUTER_API_KEY",
79
+ "supports_json": True,
80
+ "api_spec": "openai",
81
+ "input_cost": 0.04,
82
+ "cached_input_cost": 0.04,
83
+ "cache_write_cost": 0.04,
84
+ "output_cost": 0.18,
85
+ },
86
+ "gpt-oss-20b-free-openrouter": {
87
+ "id": "gpt-oss-20b-openrouter",
88
+ "name": "openai/gpt-oss-20b:free",
89
+ "api_base": "https://openrouter.ai/api/v1",
90
+ "api_key_env_var": "OPENROUTER_API_KEY",
91
+ "supports_json": True,
92
+ "api_spec": "openai",
93
+ "input_cost": 0.0,
94
+ "cached_input_cost": 0.0,
95
+ "cache_write_cost": 0.0,
96
+ "output_cost": 0.0,
97
+ },
98
+ "gpt-oss-120b-openrouter": {
99
+ "id": "gpt-oss-120b-openrouter",
100
+ "name": "openai/gpt-oss-120b",
101
+ "api_base": "https://openrouter.ai/api/v1",
102
+ "api_key_env_var": "OPENROUTER_API_KEY",
103
+ "supports_json": True,
104
+ "api_spec": "openai",
105
+ "input_cost": 0.05,
106
+ "cached_input_cost": 0.05,
107
+ "cache_write_cost": 0.05,
108
+ "output_cost": 0.45,
109
+ },
110
+ "gpt-oss-120b-free-openrouter": {
111
+ "id": "gpt-oss-120b-free-openrouter",
112
+ "name": "openai/gpt-oss-120b:free",
113
+ "api_base": "https://openrouter.ai/api/v1",
114
+ "api_key_env_var": "OPENROUTER_API_KEY",
115
+ "supports_json": True,
116
+ "api_spec": "openai",
117
+ "input_cost": 0.00,
118
+ "cached_input_cost": 0.00,
119
+ "cache_write_cost": 0.00,
120
+ "output_cost": 0.0,
121
+ },
52
122
  "kimi-k2-openrouter": {
53
123
  "id": "kimi-k2-openrouter",
54
- "name": "z-ai/glm-4.6",
124
+ "name": "moonshotai/kimi-k2-0905:exacto",
125
+ "api_base": "https://openrouter.ai/api/v1",
126
+ "api_key_env_var": "OPENROUTER_API_KEY",
127
+ "supports_json": True,
128
+ "api_spec": "openai",
129
+ "input_cost": 1,
130
+ "cached_input_cost": 1,
131
+ "cache_write_cost": 1,
132
+ "output_cost": 3,
133
+ },
134
+ "kimi-k2-thinking-openrouter": {
135
+ "id": "kimi-k2-thinking-openrouter",
136
+ "name": "moonshotai/kimi-k2-thinking",
55
137
  "api_base": "https://openrouter.ai/api/v1",
56
138
  "api_key_env_var": "OPENROUTER_API_KEY",
57
139
  "supports_json": True,
58
140
  "api_spec": "openai",
59
141
  "input_cost": 0.6,
60
- "cached_input_cost": 0.11,
142
+ "cached_input_cost": 0.6,
143
+ "cache_write_cost": 0.6,
144
+ "output_cost": 2.5,
145
+ },
146
+ "olmo-3-32b-think-openrouter": {
147
+ "id": "olmo-3-32b-think-openrouter",
148
+ "name": "allenai/olmo-3-32b-think",
149
+ "api_base": "https://openrouter.ai/api/v1",
150
+ "api_key_env_var": "OPENROUTER_API_KEY",
151
+ "supports_json": True,
152
+ "api_spec": "openai",
153
+ "input_cost": 0.2,
154
+ "output_cost": 35,
155
+ },
156
+ "trinity-mini-openrouter": {
157
+ "id": "trinity-mini-openrouter",
158
+ "name": "arcee-ai/trinity-mini:free",
159
+ "api_base": "https://openrouter.ai/api/v1",
160
+ "api_key_env_var": "OPENROUTER_API_KEY",
161
+ "supports_json": True,
162
+ "api_spec": "openai",
163
+ "input_cost": 0.045,
164
+ "output_cost": 0.15,
165
+ },
166
+ "glm-4.7-openrouter": {
167
+ "id": "glm-4.7-openrouter",
168
+ "name": "z-ai/glm-4.7",
169
+ "api_base": "https://openrouter.ai/api/v1",
170
+ "api_key_env_var": "OPENROUTER_API_KEY",
171
+ "supports_json": True,
172
+ "api_spec": "openai",
173
+ "input_cost": 0.6,
174
+ "cached_input_cost": 0.6,
61
175
  "cache_write_cost": 0.6,
62
176
  "output_cost": 2.20,
63
177
  },
178
+ "minimax-m2.1-openrouter": {
179
+ "id": "minimax-m2.1-openrouter",
180
+ "name": "minimax/minimax-m2.1",
181
+ "api_base": "https://openrouter.ai/api/v1",
182
+ "api_key_env_var": "OPENROUTER_API_KEY",
183
+ "supports_json": True,
184
+ "api_spec": "openai",
185
+ "input_cost": 0.3,
186
+ "cached_input_cost": 0.3,
187
+ "cache_write_cost": 0.3,
188
+ "output_cost": 1.20,
189
+ },
64
190
  }
@@ -93,4 +93,15 @@ TOGETHER_MODELS = {
93
93
  "output_cost": 0.59,
94
94
  "reasoning_model": True,
95
95
  },
96
+ "trinity-mini-together": {
97
+ "id": "trinity-mini-together",
98
+ "name": "arcee-ai/trinity-mini",
99
+ "api_base": "https://api.together.xyz/v1",
100
+ "api_key_env_var": "TOGETHER_API_KEY",
101
+ "supports_json": False,
102
+ "api_spec": "openai",
103
+ "input_cost": 0.18,
104
+ "output_cost": 0.59,
105
+ "reasoning_model": True,
106
+ },
96
107
  }