lm-deluge 0.0.57__tar.gz → 0.0.58__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of lm-deluge might be problematic.

Files changed (80)
  1. {lm_deluge-0.0.57/src/lm_deluge.egg-info → lm_deluge-0.0.58}/PKG-INFO +1 -1
  2. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/pyproject.toml +1 -1
  3. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/anthropic.py +1 -1
  4. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/client.py +25 -9
  5. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/__init__.py +7 -7
  6. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/anthropic.py +12 -20
  7. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/bedrock.py +0 -14
  8. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/cohere.py +0 -16
  9. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/google.py +0 -20
  10. lm_deluge-0.0.58/src/lm_deluge/models/grok.py +82 -0
  11. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/groq.py +2 -2
  12. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/meta.py +0 -8
  13. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/openai.py +0 -34
  14. lm_deluge-0.0.58/src/lm_deluge/models/openrouter.py +64 -0
  15. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/together.py +0 -16
  16. {lm_deluge-0.0.57 → lm_deluge-0.0.58/src/lm_deluge.egg-info}/PKG-INFO +1 -1
  17. lm_deluge-0.0.57/src/lm_deluge/models/grok.py +0 -38
  18. lm_deluge-0.0.57/src/lm_deluge/models/openrouter.py +0 -1
  19. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/LICENSE +0 -0
  20. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/README.md +0 -0
  21. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/setup.cfg +0 -0
  22. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/__init__.py +0 -0
  23. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/__init__.py +0 -0
  24. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/base.py +0 -0
  25. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/bedrock.py +0 -0
  26. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/common.py +0 -0
  27. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/deprecated/bedrock.py +0 -0
  28. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/deprecated/cohere.py +0 -0
  29. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/deprecated/deepseek.py +0 -0
  30. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/deprecated/mistral.py +0 -0
  31. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/deprecated/vertex.py +0 -0
  32. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/gemini.py +0 -0
  33. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/mistral.py +0 -0
  34. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/openai.py +0 -0
  35. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/response.py +0 -0
  36. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/batches.py +0 -0
  37. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/built_in_tools/anthropic/__init__.py +0 -0
  38. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/built_in_tools/anthropic/bash.py +0 -0
  39. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/built_in_tools/anthropic/computer_use.py +0 -0
  40. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/built_in_tools/anthropic/editor.py +0 -0
  41. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/built_in_tools/base.py +0 -0
  42. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/built_in_tools/openai.py +0 -0
  43. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/cache.py +0 -0
  44. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/cli.py +0 -0
  45. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/config.py +0 -0
  46. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/embed.py +0 -0
  47. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/errors.py +0 -0
  48. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/file.py +0 -0
  49. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/image.py +0 -0
  50. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/llm_tools/__init__.py +0 -0
  51. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/llm_tools/classify.py +0 -0
  52. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/llm_tools/extract.py +0 -0
  53. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/llm_tools/locate.py +0 -0
  54. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/llm_tools/ocr.py +0 -0
  55. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/llm_tools/score.py +0 -0
  56. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/llm_tools/translate.py +0 -0
  57. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/cerebras.py +0 -0
  58. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/deepseek.py +0 -0
  59. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/fireworks.py +0 -0
  60. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/mistral.py +0 -0
  61. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/presets/cerebras.py +0 -0
  62. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/presets/meta.py +0 -0
  63. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/prompt.py +0 -0
  64. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/request_context.py +0 -0
  65. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/rerank.py +0 -0
  66. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/tool.py +0 -0
  67. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/tracker.py +0 -0
  68. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/usage.py +0 -0
  69. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/util/harmony.py +0 -0
  70. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/util/json.py +0 -0
  71. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/util/logprobs.py +0 -0
  72. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/util/spatial.py +0 -0
  73. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/util/validation.py +0 -0
  74. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/util/xml.py +0 -0
  75. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge.egg-info/SOURCES.txt +0 -0
  76. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge.egg-info/dependency_links.txt +0 -0
  77. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge.egg-info/requires.txt +0 -0
  78. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge.egg-info/top_level.txt +0 -0
  79. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/tests/test_builtin_tools.py +0 -0
  80. {lm_deluge-0.0.57 → lm_deluge-0.0.58}/tests/test_native_mcp_server.py +0 -0

{lm_deluge-0.0.57/src/lm_deluge.egg-info → lm_deluge-0.0.58}/PKG-INFO
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: lm_deluge
-Version: 0.0.57
+Version: 0.0.58
 Summary: Python utility for using LLM API models.
 Author-email: Benjamin Anderson <ben@trytaylor.ai>
 Requires-Python: >=3.10

{lm_deluge-0.0.57 → lm_deluge-0.0.58}/pyproject.toml
@@ -3,7 +3,7 @@ requires = ["setuptools", "wheel"]

 [project]
 name = "lm_deluge"
-version = "0.0.57"
+version = "0.0.58"
 authors = [{ name = "Benjamin Anderson", email = "ben@trytaylor.ai" }]
 description = "Python utility for using LLM API models."
 readme = "README.md"

{lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/api_requests/anthropic.py
@@ -72,7 +72,7 @@ def _build_anthropic_request(
         request_json["system"] = system_message

     # handle temp + top_p for opus 4.1/sonnet 4.5
-    if model.name in ["claude-sonnet-4-5-20250929", "claude-opus-4-1-20250805"]:
+    if "4-1" in model.name or "4-5" in model.name:
         if "temperature" in request_json and "top_p" in request_json:
             request_json.pop("top_p")

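The rewritten condition matches on substrings of the dated model name instead of two hard-coded ids, so it also covers the newly added claude-haiku-4-5-20251001. A self-contained sketch of the same logic (the helper name is illustrative, not from the package):

```python
# Sketch of the 0.0.58 behavior: Anthropic models whose dated names contain
# "4-1" or "4-5" reject temperature and top_p together, so top_p is dropped
# whenever both are present in the request body.
def drop_top_p_if_conflicting(model_name: str, request_json: dict) -> None:
    if "4-1" in model_name or "4-5" in model_name:
        if "temperature" in request_json and "top_p" in request_json:
            request_json.pop("top_p")

request = {"model": "claude-haiku-4-5-20251001", "temperature": 0.7, "top_p": 0.9}
drop_top_p_if_conflicting(request["model"], request)
assert "top_p" not in request
```
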
{lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/client.py
@@ -369,7 +369,7 @@ class _LLMClient(BaseModel):
         tools: list[Tool | dict | MCPServer] | None = ...,
         cache: CachePattern | None = ...,
         use_responses_api: bool = ...,
-    ) -> list[APIResponse | None]: ...
+    ) -> list[APIResponse]: ...

     async def process_prompts_async(
         self,
@@ -380,7 +380,7 @@ class _LLMClient(BaseModel):
         tools: list[Tool | dict | MCPServer] | None = None,
         cache: CachePattern | None = None,
         use_responses_api: bool = False,
-    ) -> list[APIResponse | None] | list[str | None] | dict[str, int]:
+    ) -> list[APIResponse] | list[str | None] | dict[str, int]:
         """Process multiple prompts asynchronously using the start_nowait/wait_for_all backend.

         This implementation creates all tasks upfront and waits for them to complete,
@@ -516,28 +516,40 @@ class _LLMClient(BaseModel):
         tools: list[Tool | dict | MCPServer] | None = None,
         cache: CachePattern | None = None,
         use_responses_api: bool = False,
-    ) -> APIResponse | None:
+    ) -> APIResponse:
         task_id = self.start_nowait(
             prompt, tools=tools, cache=cache, use_responses_api=use_responses_api
         )
         return await self.wait_for(task_id)

-    async def wait_for(self, task_id: int) -> APIResponse | None:
+    async def wait_for(self, task_id: int) -> APIResponse:
         task = self._tasks.get(task_id)
         if task:
             return await task
-        return self._results.get(task_id)
+        res = self._results.get(task_id)
+        if res:
+            return res
+        else:
+            return APIResponse(
+                id=-1,
+                model_internal="",
+                prompt=Conversation([]),
+                sampling_params=SamplingParams(),
+                status_code=500,
+                is_error=True,
+                error_message="Task not found",
+            )

     async def wait_for_all(
         self, task_ids: Sequence[int] | None = None
-    ) -> list[APIResponse | None]:
+    ) -> list[APIResponse]:
         if task_ids is None:
             task_ids = list(self._tasks.keys())
         return [await self.wait_for(tid) for tid in task_ids]

     async def as_completed(
         self, task_ids: Sequence[int] | None = None
-    ) -> AsyncGenerator[tuple[int, APIResponse | None], None]:
+    ) -> AsyncGenerator[tuple[int, APIResponse], None]:
         """Yield ``(task_id, result)`` pairs as tasks complete.

         Args:
@@ -561,7 +573,9 @@ class _LLMClient(BaseModel):
         for task in list(tasks_map.keys()):
             if task.done():
                 tid = tasks_map.pop(task)
-                yield tid, self._results.get(tid, await task)
+                task_result = self._results.get(tid, await task)
+                assert task_result
+                yield tid, task_result

         while tasks_map:
             done, _ = await asyncio.wait(
@@ -569,7 +583,9 @@
             )
             for task in done:
                 tid = tasks_map.pop(task)
-                yield tid, self._results.get(tid, await task)
+                task_result = self._results.get(tid, await task)
+                assert task_result
+                yield tid, task_result

     async def stream(
         self,

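Taken together, the client.py changes tighten the return types: wait_for, wait_for_all, as_completed, and the single-prompt path never return None anymore; an unknown task id instead yields a synthetic APIResponse with status_code=500, is_error=True, and error_message="Task not found". A hedged usage sketch (assuming LLMClient is the public class exported by lm_deluge, that it can be constructed from a registry id, and that start_nowait accepts a plain string prompt):

```python
# Sketch, not from the package docs: with 0.0.58, callers can drop their
# None checks and branch on is_error instead.
import asyncio
from lm_deluge import LLMClient  # public export, assumed

async def main() -> None:
    client = LLMClient("gpt-4o-mini")  # registry id; constructor form assumed
    task_id = client.start_nowait("Say hello.")
    resp = await client.wait_for(task_id)
    if resp.is_error:  # now also covers "task not found" (status_code=500)
        print(f"failed ({resp.status_code}): {resp.error_message}")
    else:
        print(resp)

asyncio.run(main())
```
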
{lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/__init__.py
@@ -38,9 +38,9 @@ class APIModel:
     supports_responses: bool = False
     reasoning_model: bool = False
     regions: list[str] | dict[str, int] = field(default_factory=list)
-    tokens_per_minute: int | None = None
-    requests_per_minute: int | None = None
-    gpus: list[str] | None = None
+    # tokens_per_minute: int | None = None
+    # requests_per_minute: int | None = None
+    # gpus: list[str] | None = None

     @classmethod
     def from_registry(cls, name: str):
@@ -97,8 +97,8 @@ def register_model(
     supports_responses: bool = False,
     reasoning_model: bool = False,
     regions: list[str] | dict[str, int] = field(default_factory=list),
-    tokens_per_minute: int | None = None,
-    requests_per_minute: int | None = None,
+    # tokens_per_minute: int | None = None,
+    # requests_per_minute: int | None = None,
 ) -> APIModel:
     """Register a model configuration and return the created APIModel."""
     model = APIModel(
@@ -116,8 +116,8 @@ def register_model(
         supports_responses=supports_responses,
         reasoning_model=reasoning_model,
         regions=regions,
-        tokens_per_minute=tokens_per_minute,
-        requests_per_minute=requests_per_minute,
+        # tokens_per_minute=tokens_per_minute,
+        # requests_per_minute=requests_per_minute,
     )
     registry[model.id] = model
     return model

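The rate-limit metadata (tokens_per_minute, requests_per_minute, gpus) is commented out of both APIModel and register_model, which is why every model file below drops those keys. A hypothetical registration call under that reading; the remaining keyword names are inferred from the APIModel(...) construction above, and the id, URL, and costs are invented for illustration:

```python
# Hypothetical sketch: registering a custom OpenAI-compatible endpoint in
# 0.0.58. Passing tokens_per_minute= or requests_per_minute= would now raise
# a TypeError, since those parameters were removed from register_model.
from lm_deluge.models import register_model  # import path assumed

model = register_model(
    id="my-gateway-model",                      # illustrative values throughout
    name="gpt-4o-mini",
    api_base="https://gateway.example.com/v1",
    api_key_env_var="MY_GATEWAY_KEY",
    api_spec="openai",
    supports_json=True,
    input_cost=0.15,   # $ per million input tokens
    output_cost=0.60,  # $ per million output tokens
)
print(model.id)  # "my-gateway-model"
```
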
{lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/anthropic.py
@@ -10,6 +10,18 @@ ANTHROPIC_MODELS = {
     # ░███
     # █████
     #
+    "claude-4.5-haiku": {
+        "id": "claude-4.5-haiku",
+        "name": "claude-haiku-4-5-20251001",
+        "api_base": "https://api.anthropic.com/v1",
+        "api_key_env_var": "ANTHROPIC_API_KEY",
+        "supports_json": False,
+        "api_spec": "anthropic",
+        "input_cost": 1.0,
+        "cached_input_cost": 0.10,
+        "cache_write_cost": 1.25,
+        "output_cost": 3.0,
+    },
     "claude-4.5-sonnet": {
         "id": "claude-4.5-sonnet",
         "name": "claude-sonnet-4-5-20250929",
@@ -21,8 +33,6 @@ ANTHROPIC_MODELS = {
         "cached_input_cost": 0.30,
         "cache_write_cost": 3.75,
         "output_cost": 15.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
     },
     "claude-4.1-opus": {
         "id": "claude-4.1-opus",
@@ -35,8 +45,6 @@ ANTHROPIC_MODELS = {
         "cached_input_cost": 1.50,
         "cache_write_cost": 18.75,
         "output_cost": 75.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
         "reasoning_model": True,
     },
     "claude-4-opus": {
@@ -50,8 +58,6 @@ ANTHROPIC_MODELS = {
         "cached_input_cost": 1.50,
         "cache_write_cost": 18.75,
         "output_cost": 75.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
         "reasoning_model": True,
     },
     "claude-4-sonnet": {
@@ -65,8 +71,6 @@ ANTHROPIC_MODELS = {
         "cached_input_cost": 0.30,
         "cache_write_cost": 3.75,
         "output_cost": 15.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
     },
     "claude-3.7-sonnet": {
         "id": "claude-3.7-sonnet",
@@ -79,8 +83,6 @@ ANTHROPIC_MODELS = {
         "cached_input_cost": 0.30,
         "cache_write_cost": 3.75,
         "output_cost": 15.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
         "reasoning_model": True,
     },
     "claude-3.6-sonnet": {
@@ -94,8 +96,6 @@ ANTHROPIC_MODELS = {
         "cached_input_cost": 0.30,
         "cache_write_cost": 3.75,
         "output_cost": 15.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
     },
     "claude-3.5-sonnet": {
         "id": "claude-3.5-sonnet",
@@ -108,8 +108,6 @@ ANTHROPIC_MODELS = {
         "cached_input_cost": 0.30,
         "cache_write_cost": 3.75,
         "output_cost": 15.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
     },
     "claude-3-opus": {
         "id": "claude-3-opus",
@@ -120,8 +118,6 @@ ANTHROPIC_MODELS = {
         "api_spec": "anthropic",
         "input_cost": 15.0,
         "output_cost": 75.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
     },
     "claude-3.5-haiku": {
         "id": "claude-3.5-haiku",
@@ -134,8 +130,6 @@ ANTHROPIC_MODELS = {
         "cached_input_cost": 0.08,
         "cache_write_cost": 1.00,
         "output_cost": 4.00,
-        "requests_per_minute": 20_000,
-        "tokens_per_minute": 4_000_000,  # supposed to be this but they fucked up
     },
     "claude-3-haiku": {
         "id": "claude-3-haiku",
@@ -148,7 +142,5 @@ ANTHROPIC_MODELS = {
         "cache_write_cost": 0.30,
         "cached_input_cost": 0.03,
         "output_cost": 1.25,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": 4_000_000,  # supposed to be this but they fucked up
     },
 }

{lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/bedrock.py
@@ -16,8 +16,6 @@ BEDROCK_MODELS = {
         "api_spec": "bedrock",
         "input_cost": 0.25,
         "output_cost": 1.25,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 8_000_000,
     },
     "claude-3.5-haiku-bedrock": {
         "id": "claude-3.5-haiku-bedrock",
@@ -28,8 +26,6 @@ BEDROCK_MODELS = {
         "api_spec": "bedrock",
         "input_cost": 0.25,
         "output_cost": 1.25,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 8_000_000,
     },
     "claude-3.5-sonnet-bedrock": {
         "id": "claude-3.5-sonnet-bedrock",
@@ -40,8 +36,6 @@ BEDROCK_MODELS = {
         "api_spec": "bedrock",
         "input_cost": 3.0,
         "output_cost": 15.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
         "reasoning_model": False,
     },
     "claude-3.6-sonnet-bedrock": {
@@ -53,8 +47,6 @@ BEDROCK_MODELS = {
         "api_spec": "bedrock",
         "input_cost": 3.0,
         "output_cost": 15.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
         "reasoning_model": False,
     },
     "claude-3.7-sonnet-bedrock": {
@@ -66,8 +58,6 @@ BEDROCK_MODELS = {
         "api_spec": "bedrock",
         "input_cost": 3.0,
         "output_cost": 15.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
         "reasoning_model": True,
     },
     "claude-4-sonnet-bedrock": {
@@ -79,8 +69,6 @@ BEDROCK_MODELS = {
         "api_spec": "bedrock",
         "input_cost": 3.0,
         "output_cost": 15.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
         "reasoning_model": True,
     },
     "claude-4-opus-bedrock": {
@@ -92,8 +80,6 @@ BEDROCK_MODELS = {
         "api_spec": "bedrock",
         "input_cost": 3.0,
         "output_cost": 15.0,
-        "requests_per_minute": 4_000,
-        "tokens_per_minute": 400_000,
         "reasoning_model": True,
     },
     # GPT-OSS on AWS Bedrock

{lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/cohere.py
@@ -15,8 +15,6 @@ COHERE_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.5,
         "output_cost": 1.5,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": None,
     },
     "aya-expanse-32b": {
         "id": "aya-expanse-32b",
@@ -26,8 +24,6 @@ COHERE_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.5,
         "output_cost": 1.5,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": None,
     },
     "aya-vision-8b": {
         "id": "aya-vision-8b",
@@ -37,8 +33,6 @@ COHERE_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.5,
         "output_cost": 1.5,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": None,
     },
     "aya-vision-32b": {
         "id": "aya-vision-32b",
@@ -48,8 +42,6 @@ COHERE_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.5,
         "output_cost": 1.5,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": None,
     },
     "command-a": {
         "id": "command-a",
@@ -59,8 +51,6 @@ COHERE_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.5,
         "output_cost": 1.5,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": None,
     },
     "command-r-7b": {
         "id": "command-r-cohere",
@@ -70,8 +60,6 @@ COHERE_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.5,
         "output_cost": 1.5,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": None,
     },
     "command-r": {
         "id": "command-r",
@@ -81,8 +69,6 @@ COHERE_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.5,
         "output_cost": 1.5,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": None,
     },
     "command-r-plus": {
         "id": "command-r-plus",
@@ -92,7 +78,5 @@ COHERE_MODELS = {
         "api_spec": "openai",
         "input_cost": 3.0,
         "output_cost": 15.0,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": None,
     },
 }

{lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/google.py
@@ -20,8 +20,6 @@ GOOGLE_MODELS = {
         "input_cost": 0.1,
         "cached_input_cost": 0.025,
         "output_cost": 0.4,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "gemini-2.0-flash-lite-compat": {
@@ -34,8 +32,6 @@ GOOGLE_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.075,
         "output_cost": 0.3,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "gemini-2.5-pro-compat": {
@@ -49,8 +45,6 @@ GOOGLE_MODELS = {
         "input_cost": 1.25,
         "cached_input_cost": 0.31,
         "output_cost": 10.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "gemini-2.5-flash-compat": {
@@ -64,8 +58,6 @@ GOOGLE_MODELS = {
         "input_cost": 0.3,
         "cached_input_cost": 0.075,
         "output_cost": 2.5,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "gemini-2.5-flash-lite-compat": {
@@ -79,8 +71,6 @@ GOOGLE_MODELS = {
         "input_cost": 0.1,
         "cached_input_cost": 0.025,
         "output_cost": 0.4,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     # Native Gemini API versions with file support
@@ -95,8 +85,6 @@ GOOGLE_MODELS = {
         "input_cost": 0.1,
         "cached_input_cost": 0.025,
         "output_cost": 0.4,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "gemini-2.0-flash-lite": {
@@ -109,8 +97,6 @@ GOOGLE_MODELS = {
         "api_spec": "gemini",
         "input_cost": 0.075,
         "output_cost": 0.3,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "gemini-2.5-pro": {
@@ -124,8 +110,6 @@ GOOGLE_MODELS = {
         "input_cost": 1.25,
         "cached_input_cost": 0.31,
         "output_cost": 10.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "gemini-2.5-flash": {
@@ -139,8 +123,6 @@ GOOGLE_MODELS = {
         "input_cost": 0.3,
         "cached_input_cost": 0.075,
         "output_cost": 2.5,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "gemini-2.5-flash-lite": {
@@ -154,8 +136,6 @@ GOOGLE_MODELS = {
         "input_cost": 0.1,
         "cached_input_cost": 0.025,
         "output_cost": 0.4,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
 }

lm_deluge-0.0.58/src/lm_deluge/models/grok.py
@@ -0,0 +1,82 @@
+XAI_MODELS = {
+    #  .d8888b.                  888
+    # d88P  Y88b                 888
+    # 888    888                 888
+    # 888        888d888 .d88b.  888  888
+    # 888  88888 888P"  d88""88b 888 .88P
+    # 888    888 888    888  888 888888K
+    # Y88b  d88P 888    Y88..88P 888 "88b
+    #  "Y8888P88 888     "Y88P"  888  888
+    "grok-code-fast-1": {
+        "id": "grok-code-fast-1",
+        "name": "grok-code-fast-1",
+        "api_base": "https://api.x.ai/v1",
+        "api_key_env_var": "GROK_API_KEY",
+        "supports_json": True,
+        "supports_logprobs": True,
+        "api_spec": "openai",
+        "input_cost": 0.2,
+        "output_cost": 1.5,
+        "reasoning_model": False,
+    },
+    "grok-4-fast-reasoning": {
+        "id": "grok-4-fast-reasoning",
+        "name": "grok-4-fast-reasoning",
+        "api_base": "https://api.x.ai/v1",
+        "api_key_env_var": "GROK_API_KEY",
+        "supports_json": True,
+        "supports_logprobs": True,
+        "api_spec": "openai",
+        "input_cost": 0.2,
+        "output_cost": 0.5,
+        "reasoning_model": False,
+    },
+    "grok-4-fast-non-reasoning": {
+        "id": "grok-4-fast-non-reasoning",
+        "name": "grok-4-fast-non-reasoning",
+        "api_base": "https://api.x.ai/v1",
+        "api_key_env_var": "GROK_API_KEY",
+        "supports_json": True,
+        "supports_logprobs": True,
+        "api_spec": "openai",
+        "input_cost": 0.2,
+        "output_cost": 0.5,
+        "reasoning_model": False,
+    },
+    "grok-4": {
+        "id": "grok-4",
+        "name": "grok-4-0709",
+        "api_base": "https://api.x.ai/v1",
+        "api_key_env_var": "GROK_API_KEY",
+        "supports_json": True,
+        "supports_logprobs": True,
+        "api_spec": "openai",
+        "input_cost": 2.0,
+        "output_cost": 8.0,
+        "reasoning_model": False,
+    },
+    "grok-3": {
+        "id": "grok-3",
+        "name": "grok-3-latest",
+        "api_base": "https://api.x.ai/v1",
+        "api_key_env_var": "GROK_API_KEY",
+        "supports_json": True,
+        "supports_logprobs": True,
+        "api_spec": "openai",
+        "input_cost": 2.0,
+        "output_cost": 8.0,
+        "reasoning_model": False,
+    },
+    "grok-3-mini": {
+        "id": "grok-3-mini",
+        "name": "grok-3-mini-latest",
+        "api_base": "https://api.x.ai/v1",
+        "api_key_env_var": "GROK_API_KEY",
+        "supports_json": True,
+        "supports_logprobs": True,
+        "api_spec": "openai",
+        "input_cost": 2.0,
+        "output_cost": 8.0,
+        "reasoning_model": True,
+    },
+}

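The new grok.py grows the xAI registry from two entries to six (grok-code-fast-1, the grok-4-fast pair, grok-4, and the grok-3 pair), all routed through the OpenAI-compatible spec at https://api.x.ai/v1 with GROK_API_KEY. A short sketch under the same assumptions as above (public LLMClient export, constructor-from-id, and a prompt list as the first argument of process_prompts_async):

```python
# Sketch: the new xAI ids behave like any other registry entry; only
# GROK_API_KEY needs to be set in the environment.
import asyncio
from lm_deluge import LLMClient  # public export, assumed

async def main() -> None:
    client = LLMClient("grok-4-fast-reasoning")  # new id in 0.0.58
    responses = await client.process_prompts_async(["Summarize this diff."])
    print(responses[0])

asyncio.run(main())
```

Note that grok-4-fast-reasoning ships with "reasoning_model": False in this release, exactly as the diff was published.
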
{lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/groq.py
@@ -41,10 +41,10 @@ GROQ_MODELS = {
     },
     "kimi-k2-groq": {
         "id": "kimi-k2-groq",
-        "name": "moonshotai/kimi-k2-instruct",
+        "name": "moonshotai/kimi-k2-instruct-0905",
         "api_base": "https://api.groq.com/openai/v1",
         "api_key_env_var": "GROQ_API_KEY",
-        "supports_json": False,
+        "supports_json": True,
         "api_spec": "openai",
     },
     "gpt-oss-120b-groq": {

{lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/meta.py
@@ -16,8 +16,6 @@ META_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.0,
         "output_cost": 0.0,
-        "requests_per_minute": 3_000,
-        "tokens_per_minute": 1_000_000,
         "reasoning_model": False,
     },
     "llama-4-maverick": {
@@ -30,8 +28,6 @@ META_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.0,
         "output_cost": 0.0,
-        "requests_per_minute": 3_000,
-        "tokens_per_minute": 1_000_000,
         "reasoning_model": False,
     },
     "llama-3.3-70b": {
@@ -44,8 +40,6 @@ META_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.0,
         "output_cost": 0.0,
-        "requests_per_minute": 3_000,
-        "tokens_per_minute": 1_000_000,
         "reasoning_model": False,
     },
     "llama-3.3-8b": {
@@ -58,8 +52,6 @@ META_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.0,
         "output_cost": 0.0,
-        "requests_per_minute": 3_000,
-        "tokens_per_minute": 1_000_000,
         "reasoning_model": False,
     },
 }

{lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/openai.py
@@ -77,8 +77,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 3.0,
         "output_cost": 12.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "o3": {
@@ -93,8 +91,6 @@ OPENAI_MODELS = {
         "input_cost": 2.0,
         "cached_input_cost": 0.50,
         "output_cost": 8.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "o4-mini": {
@@ -109,8 +105,6 @@ OPENAI_MODELS = {
         "input_cost": 1.1,
         "cached_input_cost": 0.275,
         "output_cost": 4.4,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "gpt-4.1": {
@@ -125,8 +119,6 @@ OPENAI_MODELS = {
         "input_cost": 2.0,
         "cached_input_cost": 0.50,
         "output_cost": 8.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "gpt-4.1-mini": {
@@ -141,8 +133,6 @@ OPENAI_MODELS = {
         "input_cost": 0.4,
         "cached_input_cost": 0.10,
         "output_cost": 1.6,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "gpt-4.1-nano": {
@@ -157,8 +147,6 @@ OPENAI_MODELS = {
         "input_cost": 0.1,
         "cached_input_cost": 0.025,
         "output_cost": 0.4,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "gpt-4.5": {
@@ -172,8 +160,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 75.0,
         "output_cost": 150.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": False,
     },
     "o3-mini": {
@@ -188,8 +174,6 @@ OPENAI_MODELS = {
         "input_cost": 1.1,
         "cached_input_cost": 0.55,
         "output_cost": 4.4,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "o1": {
@@ -204,8 +188,6 @@ OPENAI_MODELS = {
         "input_cost": 15.0,
         "cached_input_cost": 7.50,
         "output_cost": 60.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "o1-preview": {
@@ -219,8 +201,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 15.0,
         "output_cost": 60.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "o1-mini": {
@@ -235,8 +215,6 @@ OPENAI_MODELS = {
         "input_cost": 1.1,
         "cached_input_cost": 0.55,
         "output_cost": 4.4,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
         "reasoning_model": True,
     },
     "gpt-4o": {
@@ -251,8 +229,6 @@ OPENAI_MODELS = {
         "input_cost": 2.50,
         "cached_input_cost": 1.25,
         "output_cost": 10.0,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": 30_000_000,
     },
     "gpt-4o-mini": {
         "id": "gpt-4o-mini",
@@ -266,8 +242,6 @@ OPENAI_MODELS = {
         "input_cost": 0.15,
         "cached_input_cost": 0.075,
         "output_cost": 0.6,
-        "requests_per_minute": 60_000,
-        "tokens_per_minute": 250_000_000,
     },
     "gpt-3.5-turbo": {
         "id": "gpt-3.5-turbo",
@@ -280,8 +254,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.5,
         "output_cost": 1.5,
-        "requests_per_minute": 40_000,
-        "tokens_per_minute": 75_000_000,
     },
     "gpt-4-turbo": {
         "id": "gpt-4-turbo",
@@ -294,8 +266,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 10.0,
         "output_cost": 30.0,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": 1_500_000,
     },
     "gpt-4": {
         "id": "gpt-4",
@@ -308,8 +278,6 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 30.0,
         "output_cost": 60.0,
-        "requests_per_minute": 10_000,
-        "tokens_per_minute": 300_000,
     },
     "gpt-4-32k": {
         "id": "gpt-4-32k",
@@ -322,7 +290,5 @@ OPENAI_MODELS = {
         "api_spec": "openai",
         "input_cost": 60.0,
         "output_cost": 120.0,
-        "requests_per_minute": 1_000,
-        "tokens_per_minute": 150_000,
     },
 }

lm_deluge-0.0.58/src/lm_deluge/models/openrouter.py
@@ -0,0 +1,64 @@
+OPENROUTER_MODELS = {
+    "glm-4.6-openrouter": {
+        "id": "glm-4.6-openrouter",
+        "name": "z-ai/glm-4.6",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.6,
+        "cached_input_cost": 0.11,
+        "cache_write_cost": 0.6,
+        "output_cost": 2.20,
+    },
+    "deepseek-r1-openrouter": {
+        "id": "deepseek-r1-openrouter",
+        "name": "deepseek/deepseek-r1-0528",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.40,
+        "cached_input_cost": 0.40,
+        "cache_write_cost": 0.40,
+        "output_cost": 1.75,
+    },
+    "deepseek-3.1-openrouter": {
+        "id": "deepseek-3.1-openrouter",
+        "name": "deepseek/deepseek-v3.1-terminus",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.23,
+        "cached_input_cost": 0.23,
+        "cache_write_cost": 0.23,
+        "output_cost": 0.9,
+    },
+    "deepseek-3.2-openrouter": {
+        "id": "deepseek-3.2-openrouter",
+        "name": "deepseek/deepseek-v3.2-exp",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.27,
+        "cached_input_cost": 0.27,
+        "cache_write_cost": 0.27,
+        "output_cost": 0.4,
+    },
+    # "gpt-oss-20b-openrouter": {},
+    # "gpt-oss-120b-openrouter": {},
+    "kimi-k2-openrouter": {
+        "id": "kimi-k2-openrouter",
+        "name": "z-ai/glm-4.6",
+        "api_base": "https://openrouter.ai/api/v1",
+        "api_key_env_var": "OPENROUTER_API_KEY",
+        "supports_json": True,
+        "api_spec": "openai",
+        "input_cost": 0.6,
+        "cached_input_cost": 0.11,
+        "cache_write_cost": 0.6,
+        "output_cost": 2.20,
+    },
+}

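One oddity in the new OpenRouter registry is visible above: kimi-k2-openrouter reuses the route name "z-ai/glm-4.6" (and GLM's prices) rather than a Moonshot Kimi route, which looks like a copy-paste slip in the release. A quick way to spot such collisions, using only the dict shown above:

```python
# Illustrative check, not part of the package: find registry entries that
# share the same upstream route name.
from collections import Counter

route_counts = Counter(
    entry["name"]
    for entry in OPENROUTER_MODELS.values()
    if isinstance(entry, dict) and "name" in entry
)
print({route: n for route, n in route_counts.items() if n > 1})
# -> {'z-ai/glm-4.6': 2}
```
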
{lm_deluge-0.0.57 → lm_deluge-0.0.58}/src/lm_deluge/models/together.py
@@ -20,8 +20,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 3.0,
         "output_cost": 7.0,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
     },
     "deepseek-v3-together": {
         "id": "deepseek-v3-together",
@@ -32,8 +30,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 1.25,
         "output_cost": 1.25,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
     },
     "qwen-3-235b-together": {
         "id": "qwen-3-235b-together",
@@ -44,8 +40,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.2,
         "output_cost": 0.6,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
     },
     "qwen-2.5-vl-together": {
         "id": "qwen-2.5-vl-together",
@@ -56,8 +50,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 1.95,
         "output_cost": 8.0,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
     },
     "llama-4-maverick-together": {
         "id": "llama-4-maverick-together",
@@ -68,8 +60,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.27,
         "output_cost": 0.85,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
     },
     "llama-4-scout-together": {
         "id": "llama-4-scout-together",
@@ -80,8 +70,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.18,
         "output_cost": 0.59,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
     },
     "gpt-oss-120b-together": {
         "id": "gpt-oss-120b-together",
@@ -92,8 +80,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.18,
         "output_cost": 0.59,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
         "reasoning_model": True,
     },
     "gpt-oss-20b-together": {
@@ -105,8 +91,6 @@ TOGETHER_MODELS = {
         "api_spec": "openai",
         "input_cost": 0.18,
         "output_cost": 0.59,
-        "requests_per_minute": None,
-        "tokens_per_minute": None,
         "reasoning_model": True,
     },
 }

{lm_deluge-0.0.57 → lm_deluge-0.0.58/src/lm_deluge.egg-info}/PKG-INFO
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: lm_deluge
-Version: 0.0.57
+Version: 0.0.58
 Summary: Python utility for using LLM API models.
 Author-email: Benjamin Anderson <ben@trytaylor.ai>
 Requires-Python: >=3.10

lm_deluge-0.0.57/src/lm_deluge/models/grok.py
@@ -1,38 +0,0 @@
-XAI_MODELS = {
-    #  .d8888b.                  888
-    # d88P  Y88b                 888
-    # 888    888                 888
-    # 888        888d888 .d88b.  888  888
-    # 888  88888 888P"  d88""88b 888 .88P
-    # 888    888 888    888  888 888888K
-    # Y88b  d88P 888    Y88..88P 888 "88b
-    #  "Y8888P88 888     "Y88P"  888  888
-    "grok-3": {
-        "id": "grok-3",
-        "name": "grok-3-latest",
-        "api_base": "https://api.x.ai/v1",
-        "api_key_env_var": "GROK_API_KEY",
-        "supports_json": True,
-        "supports_logprobs": True,
-        "api_spec": "openai",
-        "input_cost": 2.0,
-        "output_cost": 8.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
-        "reasoning_model": False,
-    },
-    "grok-3-mini": {
-        "id": "grok-3-mini",
-        "name": "grok-3-mini-latest",
-        "api_base": "https://api.x.ai/v1",
-        "api_key_env_var": "GROK_API_KEY",
-        "supports_json": True,
-        "supports_logprobs": True,
-        "api_spec": "openai",
-        "input_cost": 2.0,
-        "output_cost": 8.0,
-        "requests_per_minute": 20,
-        "tokens_per_minute": 100_000,
-        "reasoning_model": True,
-    },
-}

lm_deluge-0.0.57/src/lm_deluge/models/openrouter.py
@@ -1 +0,0 @@
-OPENROUTER_MODELS = {}