PyPI - lm-deluge - Versions diffs - 0.0.89__py3-none-any.whl → 0.0.91__py3-none-any.whl - Mend

lm-deluge 0.0.89__py3-none-any.whl → 0.0.91__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (88) hide show

lm_deluge/__init__.py +3 -27
lm_deluge/api_requests/anthropic.py +29 -7
lm_deluge/api_requests/base.py +38 -1
lm_deluge/api_requests/bedrock.py +29 -3
lm_deluge/{request_context.py → api_requests/context.py} +4 -4
lm_deluge/api_requests/gemini.py +30 -14
lm_deluge/api_requests/mistral.py +1 -1
lm_deluge/api_requests/openai.py +34 -5
lm_deluge/batches.py +19 -49
lm_deluge/cache.py +1 -1
lm_deluge/cli.py +672 -300
lm_deluge/{client.py → client/__init__.py} +42 -13
lm_deluge/config.py +9 -31
lm_deluge/embed.py +2 -6
lm_deluge/models/__init__.py +138 -29
lm_deluge/models/anthropic.py +32 -24
lm_deluge/models/bedrock.py +9 -0
lm_deluge/models/cerebras.py +2 -0
lm_deluge/models/cohere.py +2 -0
lm_deluge/models/google.py +13 -0
lm_deluge/models/grok.py +4 -0
lm_deluge/models/groq.py +2 -0
lm_deluge/models/meta.py +2 -0
lm_deluge/models/minimax.py +9 -1
lm_deluge/models/openai.py +24 -1
lm_deluge/models/openrouter.py +155 -1
lm_deluge/models/together.py +3 -0
lm_deluge/models/zai.py +50 -1
lm_deluge/pipelines/extract.py +4 -5
lm_deluge/pipelines/gepa/__init__.py +1 -1
lm_deluge/pipelines/gepa/docs/samples.py +19 -10
lm_deluge/pipelines/gepa/examples/01_synthetic_keywords.py +1 -1
lm_deluge/pipelines/gepa/examples/02_gsm8k_math.py +1 -1
lm_deluge/pipelines/gepa/examples/03_hotpotqa_multihop.py +1 -1
lm_deluge/pipelines/gepa/examples/04_batch_classification.py +1 -1
lm_deluge/pipelines/gepa/examples/simple_qa.py +1 -1
lm_deluge/prompt/__init__.py +45 -0
lm_deluge/{prompt.py → prompt/conversation.py} +165 -869
lm_deluge/{image.py → prompt/image.py} +0 -10
lm_deluge/prompt/message.py +571 -0
lm_deluge/prompt/serialization.py +21 -0
lm_deluge/prompt/signatures.py +77 -0
lm_deluge/prompt/text.py +47 -0
lm_deluge/prompt/thinking.py +55 -0
lm_deluge/prompt/tool_calls.py +245 -0
lm_deluge/server/__init__.py +24 -0
lm_deluge/server/__main__.py +144 -0
lm_deluge/server/adapters.py +369 -0
lm_deluge/server/app.py +388 -0
lm_deluge/server/auth.py +71 -0
lm_deluge/server/model_policy.py +215 -0
lm_deluge/server/models_anthropic.py +172 -0
lm_deluge/server/models_openai.py +175 -0
lm_deluge/skills/anthropic.py +0 -0
lm_deluge/skills/compat.py +0 -0
lm_deluge/tool/__init__.py +78 -19
lm_deluge/tool/builtin/anthropic/__init__.py +1 -1
lm_deluge/tool/cua/actions.py +26 -26
lm_deluge/tool/cua/batch.py +1 -2
lm_deluge/tool/cua/kernel.py +1 -1
lm_deluge/tool/prefab/filesystem.py +2 -2
lm_deluge/tool/prefab/full_text_search/__init__.py +3 -2
lm_deluge/tool/prefab/memory.py +3 -1
lm_deluge/tool/prefab/otc/executor.py +3 -3
lm_deluge/tool/prefab/random.py +30 -54
lm_deluge/tool/prefab/rlm/__init__.py +2 -2
lm_deluge/tool/prefab/rlm/executor.py +1 -1
lm_deluge/tool/prefab/sandbox/__init__.py +19 -0
lm_deluge/tool/prefab/sandbox/daytona_sandbox.py +483 -0
lm_deluge/tool/prefab/sandbox/docker_sandbox.py +609 -0
lm_deluge/tool/prefab/sandbox/fargate_sandbox.py +546 -0
lm_deluge/tool/prefab/sandbox/modal_sandbox.py +469 -0
lm_deluge/tool/prefab/sandbox/seatbelt_sandbox.py +829 -0
lm_deluge/tool/prefab/skills.py +0 -0
lm_deluge/tool/prefab/subagents.py +1 -1
lm_deluge/util/logprobs.py +4 -4
lm_deluge/util/schema.py +6 -6
lm_deluge/util/validation.py +14 -9
{lm_deluge-0.0.89.dist-info → lm_deluge-0.0.91.dist-info}/METADATA +12 -12
lm_deluge-0.0.91.dist-info/RECORD +140 -0
lm_deluge-0.0.91.dist-info/entry_points.txt +3 -0
lm_deluge/mock_openai.py +0 -643
lm_deluge/tool/prefab/sandbox.py +0 -1621
lm_deluge-0.0.89.dist-info/RECORD +0 -117
lm_deluge/{file.py → prompt/file.py} +0 -0
{lm_deluge-0.0.89.dist-info → lm_deluge-0.0.91.dist-info}/WHEEL +0 -0
{lm_deluge-0.0.89.dist-info → lm_deluge-0.0.91.dist-info}/licenses/LICENSE +0 -0
{lm_deluge-0.0.89.dist-info → lm_deluge-0.0.91.dist-info}/top_level.txt +0 -0

lm_deluge/models/google.py CHANGED Viewed

@@ -21,6 +21,7 @@ GOOGLE_MODELS = {
         "cached_input_cost": 0.025,
         "output_cost": 0.4,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "gemini-2.0-flash-lite-compat": {
         "id": "gemini-2.0-flash-lite-compat",
@@ -33,6 +34,7 @@ GOOGLE_MODELS = {
         "input_cost": 0.075,
         "output_cost": 0.3,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "gemini-2.5-pro-compat": {
         "id": "gemini-2.5-pro-compat",
@@ -46,6 +48,7 @@ GOOGLE_MODELS = {
         "cached_input_cost": 0.31,
         "output_cost": 10.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "gemini-2.5-flash-compat": {
         "id": "gemini-2.5-flash-compat",
@@ -59,6 +62,7 @@ GOOGLE_MODELS = {
         "cached_input_cost": 0.075,
         "output_cost": 2.5,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "gemini-2.5-flash-lite-compat": {
         "id": "gemini-2.5-flash-lite-compat",
@@ -72,6 +76,7 @@ GOOGLE_MODELS = {
         "cached_input_cost": 0.025,
         "output_cost": 0.4,
         "reasoning_model": True,
+        "supports_images": True,
     },
     # Native Gemini API versions with file support
     "gemini-2.0-flash": {
@@ -86,6 +91,7 @@ GOOGLE_MODELS = {
         "cached_input_cost": 0.025,
         "output_cost": 0.4,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "gemini-2.0-flash-lite": {
         "id": "gemini-2.0-flash-lite",
@@ -98,6 +104,7 @@ GOOGLE_MODELS = {
         "input_cost": 0.075,
         "output_cost": 0.3,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "gemini-2.5-pro": {
         "id": "gemini-2.5-pro",
@@ -111,6 +118,7 @@ GOOGLE_MODELS = {
         "cached_input_cost": 0.31,
         "output_cost": 10.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "gemini-2.5-flash": {
         "id": "gemini-2.5-flash",
@@ -124,6 +132,7 @@ GOOGLE_MODELS = {
         "cached_input_cost": 0.075,
         "output_cost": 2.5,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "gemini-2.5-flash-lite": {
         "id": "gemini-2.5-flash-lite",
@@ -137,6 +146,7 @@ GOOGLE_MODELS = {
         "cached_input_cost": 0.025,
         "output_cost": 0.4,
         "reasoning_model": True,
+        "supports_images": True,
     },
     # Gemini 3 models - advanced reasoning with thought signatures
     "gemini-3-pro-preview": {
@@ -152,6 +162,7 @@ GOOGLE_MODELS = {
         "output_cost": 12.0,  # <200k tokens
         # Note: >200k tokens pricing is $4/$18 per million
         "reasoning_model": True,
+        "supports_images": True,
     },
     "gemini-3-flash-preview": {
         "id": "gemini-3-flash-preview",
@@ -165,6 +176,7 @@ GOOGLE_MODELS = {
         "cached_input_cost": 0.125,  # estimated
         "output_cost": 3.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     # Gemini 2.5 Computer Use model
     "gemini-2.5-computer-use": {
@@ -179,5 +191,6 @@ GOOGLE_MODELS = {
         "cached_input_cost": 0.31,
         "output_cost": 10.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
 }

lm_deluge/models/grok.py CHANGED Viewed

@@ -18,6 +18,7 @@ XAI_MODELS = {
         "input_cost": 0.2,
         "output_cost": 1.5,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "grok-4.1-fast": {
         "id": "grok-4.1-fast",
@@ -30,6 +31,7 @@ XAI_MODELS = {
         "input_cost": 0.2,
         "output_cost": 1.5,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "grok-code-fast-1": {
         "id": "grok-code-fast-1",
@@ -54,6 +56,7 @@ XAI_MODELS = {
         "input_cost": 0.2,
         "output_cost": 0.5,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "grok-4-fast-non-reasoning": {
         "id": "grok-4-fast-non-reasoning",
@@ -66,6 +69,7 @@ XAI_MODELS = {
         "input_cost": 0.2,
         "output_cost": 0.5,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "grok-4": {
         "id": "grok-4",

lm_deluge/models/groq.py CHANGED Viewed

@@ -30,6 +30,7 @@ GROQ_MODELS = {
         "api_key_env_var": "GROQ_API_KEY",
         "supports_json": False,
         "api_spec": "openai",
+        "supports_images": True,
     },
     "llama-4-scout-groq": {
         "id": "llama-4-scout-groq",
@@ -38,6 +39,7 @@ GROQ_MODELS = {
         "api_key_env_var": "GROQ_API_KEY",
         "supports_json": False,
         "api_spec": "openai",
+        "supports_images": True,
     },
     "kimi-k2-groq": {
         "id": "kimi-k2-groq",

lm_deluge/models/meta.py CHANGED Viewed

@@ -17,6 +17,7 @@ META_MODELS = {
         "input_cost": 0.0,
         "output_cost": 0.0,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "llama-4-maverick": {
         "id": "llama-4-maverick",
@@ -29,6 +30,7 @@ META_MODELS = {
         "input_cost": 0.0,
         "output_cost": 0.0,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "llama-3.3-70b": {
         "id": "llama-3.3-70b",

lm_deluge/models/minimax.py CHANGED Viewed

@@ -1,4 +1,12 @@
 MINIMAX_MODELS = {
+    "minimax-m2.1": {
+        "id": "minimax-m2.1",
+        "name": "MiniMax-M2.1",
+        "api_base": "https://api.minimax.io/anthropic/v1",
+        "api_key_env_var": "MINIMAX_API_KEY",
+        "supports_json": False,
+        "api_spec": "anthropic",
+    },
     "minimax-m2": {
         "id": "minimax-m2",
         "name": "MiniMax-M2",
@@ -6,5 +14,5 @@ MINIMAX_MODELS = {
         "api_key_env_var": "MINIMAX_API_KEY",
         "supports_json": False,
         "api_spec": "anthropic",
-    }
+    },
 }

lm_deluge/models/openai.py CHANGED Viewed

@@ -24,6 +24,7 @@ OPENAI_MODELS = {
         "output_cost": 14.0,
         "reasoning_model": True,
         "supports_xhigh": True,
+        "supports_images": True,
     },
     "gpt-5.1-codex-max": {
         "id": "gpt-5.1-codex-max",
@@ -31,7 +32,6 @@ OPENAI_MODELS = {
         "api_base": "https://api.openai.com/v1",
         "api_key_env_var": "OPENAI_API_KEY",
         "supports_json": True,
-        "supports_logprobs": False,
         "supports_responses": True,
         "api_spec": "openai",
         "input_cost": 1.25,
@@ -39,6 +39,7 @@ OPENAI_MODELS = {
         "output_cost": 10.0,
         "reasoning_model": True,
         "supports_xhigh": True,
+        "supports_images": True,
     },
     "gpt-5.1": {
         "id": "gpt-5.1",
@@ -53,6 +54,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.125,
         "output_cost": 10.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "gpt-5.1-codex": {
         "id": "gpt-5.1-codex",
@@ -67,6 +69,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.125,
         "output_cost": 10.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "gpt-5.1-codex-mini": {
         "id": "gpt-5.1-codex-mini",
@@ -95,6 +98,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.125,
         "output_cost": 10.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "gpt-5": {
         "id": "gpt-5",
@@ -109,6 +113,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.125,
         "output_cost": 10.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "gpt-5-chat": {
         "id": "gpt-5-chat",
@@ -123,6 +128,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.125,
         "output_cost": 10.0,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "gpt-5-mini": {
         "id": "gpt-5-mini",
@@ -137,6 +143,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.025,
         "output_cost": 2.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "gpt-5-nano": {
         "id": "gpt-5-nano",
@@ -151,6 +158,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.005,
         "output_cost": 0.40,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "openai-computer-use-preview": {
         "id": "openai-computer-use-preview",
@@ -178,6 +186,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.375,
         "output_cost": 6.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "o4-mini-deep-research": {
         "id": "o4-mini-deep-research",
@@ -192,6 +201,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.5,
         "output_cost": 8.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "o3-deep-research": {
         "id": "o3-deep-research",
@@ -206,6 +216,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 2.50,
         "output_cost": 40.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "o3": {
         "id": "o3",
@@ -220,6 +231,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.50,
         "output_cost": 8.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "o4-mini": {
         "id": "o4-mini",
@@ -234,6 +246,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.275,
         "output_cost": 4.4,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "gpt-4.1": {
         "id": "gpt-4.1",
@@ -248,6 +261,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.50,
         "output_cost": 8.0,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "gpt-4.1-mini": {
         "id": "gpt-4.1-mini",
@@ -262,6 +276,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.10,
         "output_cost": 1.6,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "gpt-4.1-nano": {
         "id": "gpt-4.1-nano",
@@ -276,6 +291,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 0.025,
         "output_cost": 0.4,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "gpt-4.5": {
         "id": "gpt-4.5",
@@ -289,6 +305,7 @@ OPENAI_MODELS = {
         "input_cost": 75.0,
         "output_cost": 150.0,
         "reasoning_model": False,
+        "supports_images": True,
     },
     "o3-mini": {
         "id": "o3-mini",
@@ -317,6 +334,7 @@ OPENAI_MODELS = {
         "cached_input_cost": 7.50,
         "output_cost": 60.0,
         "reasoning_model": True,
+        "supports_images": True,
     },
     "o1-preview": {
         "id": "o1-preview",
@@ -357,6 +375,7 @@ OPENAI_MODELS = {
         "input_cost": 2.50,
         "cached_input_cost": 1.25,
         "output_cost": 10.0,
+        "supports_images": True,
     },
     "gpt-4o-mini": {
         "id": "gpt-4o-mini",
@@ -370,6 +389,7 @@ OPENAI_MODELS = {
         "input_cost": 0.15,
         "cached_input_cost": 0.075,
         "output_cost": 0.6,
+        "supports_images": True,
     },
     "gpt-3.5-turbo": {
         "id": "gpt-3.5-turbo",
@@ -394,6 +414,7 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 10.0,
         "output_cost": 30.0,
+        "supports_images": True,
     },
     "gpt-4": {
         "id": "gpt-4",
@@ -406,6 +427,7 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 30.0,
         "output_cost": 60.0,
+        "supports_images": True,
     },
     "gpt-4-32k": {
         "id": "gpt-4-32k",
@@ -418,5 +440,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 60.0,
         "output_cost": 120.0,
+        "supports_images": True,
     },
 }

lm_deluge/models/openrouter.py CHANGED Viewed

@@ -1,4 +1,90 @@
 OPENROUTER_MODELS = {
+    "nemotron-3-nano-30b-a3b-free": {
+        "id": "nemotron-3-nano-30b-a3b-free",
+        "name": "nvidia/nemotron-3-nano-30b-a3b:free",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.0,
+        "cached_input_cost": 0.0,
+        "cache_write_cost": 0.0,
+        "output_cost": 0.0,
+    },
+    "nemotron-3-nano-30b-a3b": {
+        "id": "nemotron-3-nano-30b-a3b",
+        "name": "nvidia/nemotron-3-nano-30b-a3b",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.06,
+        "cached_input_cost": 0.06,
+        "cache_write_cost": 0.06,
+        "output_cost": 0.24,
+    },
+    "nemotron-nano-12b-2-vl-free": {
+        "id": "nemotron-nano-12b-2-vl-free",
+        "name": "nvidia/nemotron-nano-12b-v2-vl:free",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.0,
+        "cached_input_cost": 0.0,
+        "cache_write_cost": 0.0,
+        "output_cost": 0.0,
+        "supports_images": True,
+    },
+    "nemotron-nano-12b-2-vl": {
+        "id": "nemotron-nano-12b-2-vl",
+        "name": "nvidia/nemotron-nano-12b-v2-vl",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.0,
+        "cached_input_cost": 0.0,
+        "cache_write_cost": 0.0,
+        "output_cost": 0.0,
+        "supports_images": True,
+    },
+    "devstral-2-free-openrouter": {
+        "id": "devstral-2-free-openrouter",
+        "name": "mistralai/devstral-2512:free",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.0,
+        "cached_input_cost": 0.0,
+        "cache_write_cost": 0.0,
+        "output_cost": 0.0,
+    },
+    "devstral-2-openrouter": {
+        "id": "devstral-2-openrouter",
+        "name": "mistralai/devstral-2512",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.05,
+        "cached_input_cost": 0.05,
+        "cache_write_cost": 0.05,
+        "output_cost": 0.22,
+    },
+    "mimo-flash-v2-free-openrouter": {
+        "id": "mimo-flash-v2-free-openrouter",
+        "name": "xiaomi/mimo-v2-flash:free",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.0,
+        "cached_input_cost": 0.0,
+        "cache_write_cost": 0.0,
+        "output_cost": 0.0,
+    },
     "intellect-3-openrouter": {
         "id": "intellect-3-openrouter",
         "name": "prime-intellect/intellect-3",
@@ -83,6 +169,18 @@ OPENROUTER_MODELS = {
         "cache_write_cost": 0.04,
         "output_cost": 0.18,
     },
+    "gpt-oss-20b-free-openrouter": {
+        "id": "gpt-oss-20b-openrouter",
+        "name": "openai/gpt-oss-20b:free",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.0,
+        "cached_input_cost": 0.0,
+        "cache_write_cost": 0.0,
+        "output_cost": 0.0,
+    },
     "gpt-oss-120b-openrouter": {
         "id": "gpt-oss-120b-openrouter",
         "name": "openai/gpt-oss-120b",
@@ -95,6 +193,18 @@ OPENROUTER_MODELS = {
         "cache_write_cost": 0.05,
         "output_cost": 0.45,
     },
+    "gpt-oss-120b-free-openrouter": {
+        "id": "gpt-oss-120b-free-openrouter",
+        "name": "openai/gpt-oss-120b:free",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.00,
+        "cached_input_cost": 0.00,
+        "cache_write_cost": 0.00,
+        "output_cost": 0.0,
+    },
     "kimi-k2-openrouter": {
         "id": "kimi-k2-openrouter",
         "name": "moonshotai/kimi-k2-0905:exacto",
@@ -129,9 +239,29 @@ OPENROUTER_MODELS = {
         "input_cost": 0.2,
         "output_cost": 35,
     },
+    "olmo-3.1-32b-think-openrouter": {
+        "id": "olmo-3.1-32b-think-openrouter",
+        "name": "allenai/olmo-3.1-32b-think:free",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.2,
+        "output_cost": 35,
+    },
+    "trinity-mini-free-openrouter": {
+        "id": "trinity-mini-free-openrouter",
+        "name": "arcee-ai/trinity-mini:free",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.045,
+        "output_cost": 0.15,
+    },
     "trinity-mini-openrouter": {
         "id": "trinity-mini-openrouter",
-        "name": "arcee-ai/trinity-mini:free",
+        "name": "arcee-ai/trinity-mini",
         "api_base": "https://openrouter.ai/api/v1",
         "api_key_env_var": "OPENROUTER_API_KEY",
         "supports_json": True,
@@ -139,4 +269,28 @@ OPENROUTER_MODELS = {
         "input_cost": 0.045,
         "output_cost": 0.15,
     },
+    "glm-4.7-openrouter": {
+        "id": "glm-4.7-openrouter",
+        "name": "z-ai/glm-4.7",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.6,
+        "cached_input_cost": 0.6,
+        "cache_write_cost": 0.6,
+        "output_cost": 2.20,
+    },
+    "minimax-m2.1-openrouter": {
+        "id": "minimax-m2.1-openrouter",
+        "name": "minimax/minimax-m2.1",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.3,
+        "cached_input_cost": 0.3,
+        "cache_write_cost": 0.3,
+        "output_cost": 1.20,
+    },
 }

lm_deluge/models/together.py CHANGED Viewed

@@ -50,6 +50,7 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 1.95,
         "output_cost": 8.0,
+        "supports_images": True,
     },
     "llama-4-maverick-together": {
         "id": "llama-4-maverick-together",
@@ -60,6 +61,7 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.27,
         "output_cost": 0.85,
+        "supports_images": True,
     },
     "llama-4-scout-together": {
         "id": "llama-4-scout-together",
@@ -70,6 +72,7 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.18,
         "output_cost": 0.59,
+        "supports_images": True,
     },
     "gpt-oss-120b-together": {
         "id": "gpt-oss-120b-together",

lm_deluge/models/zai.py CHANGED Viewed

@@ -1 +1,50 @@
-ZAI_MODELS = {}
+ZAI_MODELS = {
+    "glm-4.7": {
+        "id": "glm-4.7",
+        "name": "glm-4.7",
+        "api_base": "https://api.z.ai/api/anthropic/v1",
+        "api_key_env_var": "ZAI_API_KEY",
+        "supports_json": True,
+        "api_spec": "anthropic",
+        "input_cost": 0.6,
+        "cached_input_cost": 0.6,
+        "cache_write_cost": 0.6,
+        "output_cost": 2.20,
+    },
+    "glm-4.6": {
+        "id": "glm-4.6",
+        "name": "glm-4.6",
+        "api_base": "https://api.z.ai/api/anthropic/v1",
+        "api_key_env_var": "ZAI_API_KEY",
+        "supports_json": True,
+        "api_spec": "anthropic",
+        "input_cost": 0.6,
+        "cached_input_cost": 0.6,
+        "cache_write_cost": 0.6,
+        "output_cost": 2.20,
+    },
+    "glm-4.5": {
+        "id": "glm-4.5",
+        "name": "glm-4.5",
+        "api_base": "https://api.z.ai/api/anthropic/v1",
+        "api_key_env_var": "ZAI_API_KEY",
+        "supports_json": True,
+        "api_spec": "anthropic",
+        "input_cost": 0.6,
+        "cached_input_cost": 0.6,
+        "cache_write_cost": 0.6,
+        "output_cost": 2.20,
+    },
+    "glm-4.5-air": {
+        "id": "glm-4.5-air",
+        "name": "glm-4.5-air",
+        "api_base": "https://api.z.ai/api/anthropic/v1",
+        "api_key_env_var": "ZAI_API_KEY",
+        "supports_json": True,
+        "api_spec": "anthropic",
+        "input_cost": 0.6,
+        "cached_input_cost": 0.6,
+        "cache_write_cost": 0.6,
+        "output_cost": 2.20,
+    },
+}

lm_deluge/pipelines/extract.py CHANGED Viewed

@@ -5,15 +5,14 @@ import os
 from typing import Any
 from lm_deluge.client import _LLMClient
-from lm_deluge.file import File
-from ..prompt import Conversation
+from ..prompt import Conversation, File
 from ..util.json import load_json
 try:
     from PIL import Image as PILImage
 except ImportError:
-    PILImage = None
+    PILImage: Any = None
 async def extract_async(
@@ -86,13 +85,13 @@ async def extract_async(
             buffer = io.BytesIO()
             input.save(buffer, format="PNG")
             prompts.append(
-                Conversation.user(text=image_only_prompt, image=buffer.getvalue())
+                Conversation().user(text=image_only_prompt, image=buffer.getvalue())
             )
         elif isinstance(input, File):
             data = input.data
             if isinstance(data, io.BytesIO):
                 data = data.getvalue()
-            prompts.append(Conversation.user(text=file_prompt, file=data))
+            prompts.append(Conversation().user(text=file_prompt, file=data))
         else:
             raise ValueError(
                 "inputs must be a list of strings or PIL images or a File object."

lm_deluge/pipelines/gepa/__init__.py CHANGED Viewed

@@ -21,7 +21,7 @@ Example usage:
     # Define how to evaluate one example
     def evaluate(client: LLMClient, values: dict[str, str], example: dict) -> EvalResult:
         # Build prompt with current component values
-        conv = Conversation.system(values["system_prompt"])
+        conv = Conversation().system(values["system_prompt"])
         conv = conv.add(Message.user(example["question"]))
         # Run inference

lm-deluge 0.0.89__py3-none-any.whl → 0.0.91__py3-none-any.whl

lm-deluge 0.0.89__py3-none-any.whl → 0.0.91__py3-none-any.whl