lm-deluge 0.0.56-py3-none-any.whl → 0.0.58-py3-none-any.whl
- lm_deluge/__init__.py +2 -1
- lm_deluge/api_requests/anthropic.py +1 -1
- lm_deluge/client.py +34 -21
- lm_deluge/models/__init__.py +7 -7
- lm_deluge/models/anthropic.py +12 -20
- lm_deluge/models/bedrock.py +0 -14
- lm_deluge/models/cohere.py +0 -16
- lm_deluge/models/google.py +0 -20
- lm_deluge/models/grok.py +48 -4
- lm_deluge/models/groq.py +2 -2
- lm_deluge/models/meta.py +0 -8
- lm_deluge/models/openai.py +0 -34
- lm_deluge/models/openrouter.py +64 -1
- lm_deluge/models/together.py +0 -16
- lm_deluge/prompt.py +6 -7
- lm_deluge/tool.py +338 -18
- lm_deluge/tracker.py +11 -5
- {lm_deluge-0.0.56.dist-info → lm_deluge-0.0.58.dist-info}/METADATA +1 -1
- {lm_deluge-0.0.56.dist-info → lm_deluge-0.0.58.dist-info}/RECORD +22 -24
- lm_deluge/agent.py +0 -0
- lm_deluge/gemini_limits.py +0 -65
- {lm_deluge-0.0.56.dist-info → lm_deluge-0.0.58.dist-info}/WHEEL +0 -0
- {lm_deluge-0.0.56.dist-info → lm_deluge-0.0.58.dist-info}/licenses/LICENSE +0 -0
- {lm_deluge-0.0.56.dist-info → lm_deluge-0.0.58.dist-info}/top_level.txt +0 -0
lm_deluge/models/openai.py
CHANGED
@@ -77,8 +77,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 3.0,
         "output_cost": 12.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "o3": {
@@ -93,8 +91,6 @@ OPENAI_MODELS = {
         "input_cost": 2.0,
         "cached_input_cost": 0.50,
         "output_cost": 8.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "o4-mini": {
@@ -109,8 +105,6 @@ OPENAI_MODELS = {
         "input_cost": 1.1,
         "cached_input_cost": 0.275,
         "output_cost": 4.4,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "gpt-4.1": {
@@ -125,8 +119,6 @@ OPENAI_MODELS = {
         "input_cost": 2.0,
         "cached_input_cost": 0.50,
         "output_cost": 8.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "gpt-4.1-mini": {
@@ -141,8 +133,6 @@ OPENAI_MODELS = {
         "input_cost": 0.4,
         "cached_input_cost": 0.10,
         "output_cost": 1.6,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "gpt-4.1-nano": {
@@ -157,8 +147,6 @@ OPENAI_MODELS = {
         "input_cost": 0.1,
         "cached_input_cost": 0.025,
         "output_cost": 0.4,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "gpt-4.5": {
@@ -172,8 +160,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 75.0,
         "output_cost": 150.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "o3-mini": {
@@ -188,8 +174,6 @@ OPENAI_MODELS = {
         "input_cost": 1.1,
         "cached_input_cost": 0.55,
         "output_cost": 4.4,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "o1": {
@@ -204,8 +188,6 @@ OPENAI_MODELS = {
         "input_cost": 15.0,
         "cached_input_cost": 7.50,
         "output_cost": 60.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "o1-preview": {
@@ -219,8 +201,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 15.0,
         "output_cost": 60.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "o1-mini": {
@@ -235,8 +215,6 @@ OPENAI_MODELS = {
         "input_cost": 1.1,
         "cached_input_cost": 0.55,
         "output_cost": 4.4,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "gpt-4o": {
@@ -251,8 +229,6 @@ OPENAI_MODELS = {
         "input_cost": 2.50,
         "cached_input_cost": 1.25,
         "output_cost": 10.0,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": 30_000_000,
     },
     "gpt-4o-mini": {
         "id": "gpt-4o-mini",
@@ -266,8 +242,6 @@ OPENAI_MODELS = {
         "input_cost": 0.15,
         "cached_input_cost": 0.075,
         "output_cost": 0.6,
-        "requests_per_minute": 60_000,
-        "tokens_per_minute": 250_000_000,
     },
     "gpt-3.5-turbo": {
         "id": "gpt-3.5-turbo",
@@ -280,8 +254,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.5,
         "output_cost": 1.5,
-        "requests_per_minute": 40_000,
-        "tokens_per_minute": 75_000_000,
     },
     "gpt-4-turbo": {
         "id": "gpt-4-turbo",
@@ -294,8 +266,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 10.0,
         "output_cost": 30.0,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": 1_500_000,
     },
     "gpt-4": {
         "id": "gpt-4",
@@ -308,8 +278,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 30.0,
         "output_cost": 60.0,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": 300_000,
     },
     "gpt-4-32k": {
         "id": "gpt-4-32k",
@@ -322,7 +290,5 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 60.0,
         "output_cost": 120.0,
-        "requests_per_minute": 1_000,
-        "tokens_per_minute": 150_000,
     },
 }
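The removals above are all the same two keys, and the pure-deletion counts for bedrock.py, cohere.py, google.py, meta.py, and together.py in the file list are consistent with the same change landing in every provider registry: 0.0.58 stops shipping per-model requests_per_minute / tokens_per_minute defaults. Together with the client.py and tracker.py changes, rate limiting appears to move wholly to the client. A minimal sketch of the resulting call site, assuming LLMClient accepts client-level limit keywords (the parameter names are an assumption, not confirmed by this diff):

# Hypothetical post-0.0.58 usage; max_requests_per_minute and
# max_tokens_per_minute are assumed client-level parameters, since
# per-model defaults no longer exist in the registry.
from lm_deluge import LLMClient

client = LLMClient(
    "gpt-4.1-mini",
    max_requests_per_minute=5_000,
    max_tokens_per_minute=1_000_000,
)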
lm_deluge/models/openrouter.py
CHANGED
@@ -1 +1,64 @@
-OPENROUTER_MODELS = {
+OPENROUTER_MODELS = {
+    "glm-4.6-openrouter": {
+        "id": "glm-4.6-openrouter",
+        "name": "z-ai/glm-4.6",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.6,
+        "cached_input_cost": 0.11,
+        "cache_write_cost": 0.6,
+        "output_cost": 2.20,
+    },
+    "deepseek-r1-openrouter": {
+        "id": "deepseek-r1-openrouter",
+        "name": "deepseek/deepseek-r1-0528",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.40,
+        "cached_input_cost": 0.40,
+        "cache_write_cost": 0.40,
+        "output_cost": 1.75,
+    },
+    "deepseek-3.1-openrouter": {
+        "id": "deepseek-3.1-openrouter",
+        "name": "deepseek/deepseek-v3.1-terminus",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.23,
+        "cached_input_cost": 0.23,
+        "cache_write_cost": 0.23,
+        "output_cost": 0.9,
+    },
+    "deepseek-3.2-openrouter": {
+        "id": "deepseek-3.2-openrouter",
+        "name": "deepseek/deepseek-v3.2-exp",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.27,
+        "cached_input_cost": 0.27,
+        "cache_write_cost": 0.27,
+        "output_cost": 0.4,
+    },
+    # "gpt-oss-20b-openrouter": {},
+    # "gpt-oss-120b-openrouter": {},
+    "kimi-k2-openrouter": {
+        "id": "kimi-k2-openrouter",
+        "name": "z-ai/glm-4.6",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.6,
+        "cached_input_cost": 0.11,
+        "cache_write_cost": 0.6,
+        "output_cost": 2.20,
+    },
+}
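OPENROUTER_MODELS grows from a bare opening brace to five concrete routes, all sharing the OpenAI-compatible endpoint and the OPENROUTER_API_KEY environment variable. Note that "kimi-k2-openrouter" carries "name": "z-ai/glm-4.6" and GLM pricing, which looks like a copy-paste slip in the published wheel rather than an intentional alias. Because of "api_spec": "openai", each entry reduces to a standard chat-completions request; a stdlib-only sketch of that mapping (illustrative, independent of lm_deluge's own request machinery):

import json
import os
import urllib.request

# Fields copied from one registry entry above.
entry = {
    "name": "z-ai/glm-4.6",
    "api_base": "https://openrouter.ai/api/v1",
    "api_key_env_var": "OPENROUTER_API_KEY",
}

req = urllib.request.Request(
    f"{entry['api_base']}/chat/completions",
    data=json.dumps({
        "model": entry["name"],  # the OpenRouter route, not the lm_deluge id
        "messages": [{"role": "user", "content": "hello"}],
    }).encode(),
    headers={
        "Authorization": f"Bearer {os.environ[entry['api_key_env_var']]}",
        "Content-Type": "application/json",
    },
)
with urllib.request.urlopen(req) as resp:
    print(json.load(resp)["choices"][0]["message"]["content"])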
lm_deluge/models/together.py
CHANGED
@@ -20,8 +20,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 3.0,
         "output_cost": 7.0,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
     },
     "deepseek-v3-together": {
         "id": "deepseek-v3-together",
@@ -32,8 +30,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 1.25,
         "output_cost": 1.25,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
     },
     "qwen-3-235b-together": {
         "id": "qwen-3-235b-together",
@@ -44,8 +40,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.2,
         "output_cost": 0.6,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
     },
     "qwen-2.5-vl-together": {
         "id": "qwen-2.5-vl-together",
@@ -56,8 +50,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 1.95,
         "output_cost": 8.0,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
     },
     "llama-4-maverick-together": {
         "id": "llama-4-maverick-together",
@@ -68,8 +60,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.27,
         "output_cost": 0.85,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
     },
     "llama-4-scout-together": {
         "id": "llama-4-scout-together",
@@ -80,8 +70,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.18,
         "output_cost": 0.59,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
     },
     "gpt-oss-120b-together": {
         "id": "gpt-oss-120b-together",
@@ -92,8 +80,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.18,
         "output_cost": 0.59,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
         "reasoning_model": True,
     },
     "gpt-oss-20b-together": {
@@ -105,8 +91,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.18,
         "output_cost": 0.59,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
         "reasoning_model": True,
     },
 }
lm_deluge/prompt.py
CHANGED
@@ -144,8 +144,8 @@ class ToolResult:
     def oa_chat(
         self,
     ) -> dict:  # OpenAI Chat Completions - tool results are separate messages
-        print("serializing toolresult with oa_chat...")
-        print("typeof self.result:", type(self.result))
+        # print("serializing toolresult with oa_chat...")
+        # print("typeof self.result:", type(self.result))
         if isinstance(self.result, str):
             return {
                 "role": "tool",
@@ -174,8 +174,7 @@ class ToolResult:
         raise ValueError("result type not supported")

     def oa_resp(self) -> dict:  # OpenAI Responses
-        print("
-        print("typeof self.result:", type(self.result))
+        # print("typeof self.result:", type(self.result))
         # if normal (not built-in just return the regular output
         if not self.built_in:
             result = (
@@ -466,7 +465,7 @@ class Message:
         self.parts.append(ToolCall(id=id, name=name, arguments=arguments))
         return self

-    def
+    def with_tool_result(
         self, tool_call_id: str, result: str | list[ToolResultPart]
     ) -> "Message":
         """Append a tool result block and return self for chaining."""
@@ -1189,11 +1188,11 @@ class Conversation:
         """
         if self.messages and self.messages[-1].role == "tool":
             # Append to existing tool message (parallel tool calls)
-            self.messages[-1].
+            self.messages[-1].with_tool_result(tool_call_id, result)
         else:
             # Create new tool message
             tool_msg = Message("tool", [])
-            tool_msg.
+            tool_msg.with_tool_result(tool_call_id, result)
             self.messages.append(tool_msg)
         return self
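Net effect of the prompt.py hunks: the debug prints in ToolResult.oa_chat and oa_resp are commented out, and the Message helper whose old name is truncated in the code view above is completed as with_tool_result, which appends a tool-result block and returns self for chaining; Conversation.add_tool_result calls it, extending the last message when it is already a tool message (parallel tool calls) and creating a fresh one otherwise. A usage sketch built only from the signatures visible in this diff:

from lm_deluge.prompt import Message

# with_tool_result returns the message itself, so a tool message can be
# built and populated in one chained expression (ids are illustrative):
tool_msg = Message("tool", []).with_tool_result("call_123", "first result")
tool_msg.with_tool_result("call_456", "second result")  # parallel tool call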