lm-deluge 0.0.43__tar.gz → 0.0.45__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.



Files changed (78)
  1. {lm_deluge-0.0.43/src/lm_deluge.egg-info → lm_deluge-0.0.45}/PKG-INFO +1 -1
  2. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/pyproject.toml +1 -1
  3. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/client.py +41 -42
  4. {lm_deluge-0.0.43 → lm_deluge-0.0.45/src/lm_deluge.egg-info}/PKG-INFO +1 -1
  5. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/LICENSE +0 -0
  6. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/README.md +0 -0
  7. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/setup.cfg +0 -0
  8. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/__init__.py +0 -0
  9. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/agent.py +0 -0
  10. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/__init__.py +0 -0
  11. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/anthropic.py +0 -0
  12. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/base.py +0 -0
  13. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/bedrock.py +0 -0
  14. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/common.py +0 -0
  15. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/deprecated/bedrock.py +0 -0
  16. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/deprecated/cohere.py +0 -0
  17. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/deprecated/deepseek.py +0 -0
  18. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/deprecated/mistral.py +0 -0
  19. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/deprecated/vertex.py +0 -0
  20. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/gemini.py +0 -0
  21. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/mistral.py +0 -0
  22. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/openai.py +0 -0
  23. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/api_requests/response.py +0 -0
  24. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/batches.py +0 -0
  25. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/built_in_tools/anthropic/__init__.py +0 -0
  26. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/built_in_tools/anthropic/bash.py +0 -0
  27. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/built_in_tools/anthropic/computer_use.py +0 -0
  28. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/built_in_tools/anthropic/editor.py +0 -0
  29. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/built_in_tools/base.py +0 -0
  30. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/built_in_tools/openai.py +0 -0
  31. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/cache.py +0 -0
  32. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/cli.py +0 -0
  33. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/config.py +0 -0
  34. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/embed.py +0 -0
  35. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/errors.py +0 -0
  36. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/file.py +0 -0
  37. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/gemini_limits.py +0 -0
  38. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/image.py +0 -0
  39. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/llm_tools/__init__.py +0 -0
  40. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/llm_tools/classify.py +0 -0
  41. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/llm_tools/extract.py +0 -0
  42. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/llm_tools/locate.py +0 -0
  43. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/llm_tools/ocr.py +0 -0
  44. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/llm_tools/score.py +0 -0
  45. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/llm_tools/translate.py +0 -0
  46. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/__init__.py +0 -0
  47. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/anthropic.py +0 -0
  48. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/bedrock.py +0 -0
  49. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/cerebras.py +0 -0
  50. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/cohere.py +0 -0
  51. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/deepseek.py +0 -0
  52. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/fireworks.py +0 -0
  53. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/google.py +0 -0
  54. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/grok.py +0 -0
  55. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/groq.py +0 -0
  56. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/meta.py +0 -0
  57. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/mistral.py +0 -0
  58. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/openai.py +0 -0
  59. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/openrouter.py +0 -0
  60. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/models/together.py +0 -0
  61. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/prompt.py +0 -0
  62. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/request_context.py +0 -0
  63. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/rerank.py +0 -0
  64. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/tool.py +0 -0
  65. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/tracker.py +0 -0
  66. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/usage.py +0 -0
  67. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/util/harmony.py +0 -0
  68. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/util/json.py +0 -0
  69. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/util/logprobs.py +0 -0
  70. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/util/spatial.py +0 -0
  71. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/util/validation.py +0 -0
  72. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/util/xml.py +0 -0
  73. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge.egg-info/SOURCES.txt +0 -0
  74. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge.egg-info/dependency_links.txt +0 -0
  75. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge.egg-info/requires.txt +0 -0
  76. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge.egg-info/top_level.txt +0 -0
  77. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/tests/test_builtin_tools.py +0 -0
  78. {lm_deluge-0.0.43 → lm_deluge-0.0.45}/tests/test_native_mcp_server.py +0 -0
{lm_deluge-0.0.43/src/lm_deluge.egg-info → lm_deluge-0.0.45}/PKG-INFO

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: lm_deluge
-Version: 0.0.43
+Version: 0.0.45
 Summary: Python utility for using LLM API models.
 Author-email: Benjamin Anderson <ben@trytaylor.ai>
 Requires-Python: >=3.10
{lm_deluge-0.0.43 → lm_deluge-0.0.45}/pyproject.toml

@@ -3,7 +3,7 @@ requires = ["setuptools", "wheel"]
 
 [project]
 name = "lm_deluge"
-version = "0.0.43"
+version = "0.0.45"
 authors = [{ name = "Benjamin Anderson", email = "ben@trytaylor.ai" }]
 description = "Python utility for using LLM API models."
 readme = "README.md"
{lm_deluge-0.0.43 → lm_deluge-0.0.45}/src/lm_deluge/client.py

@@ -1,5 +1,4 @@
 import asyncio
-import random
 from typing import Any, AsyncGenerator, Callable, Literal, Self, Sequence, overload
 
 import numpy as np
@@ -218,16 +217,19 @@ class _LLMClient(BaseModel):
         self, num_tokens: int, tracker: StatusTracker, *, retry: bool = False
     ):
         while True:
+            # Enforce cooldown first, regardless of current capacity.
+            cooldown = tracker.seconds_to_pause
+            if cooldown > 0:
+                print(f"Pausing for {cooldown} seconds to cool down.")
+                await asyncio.sleep(cooldown)
+                continue
+
             async with self._capacity_lock:
                 if tracker.check_capacity(num_tokens, retry=retry):
                     tracker.set_limiting_factor(None)
                     return
-            seconds_to_pause = tracker.seconds_to_pause
-
-            if seconds_to_pause > 0:
-                await asyncio.sleep(seconds_to_pause)
-            else:
-                await asyncio.sleep(random.random())
+            # Idle wait before next capacity check. Aim for ~RPM spacing.
+            await asyncio.sleep(max(60.0 / self.max_requests_per_minute, 0.01))
 
     async def _execute_request(self, context: RequestContext) -> APIResponse:
         """Create and send a single API request using the provided context."""
@@ -363,7 +365,7 @@ class _LLMClient(BaseModel):
         # Create retry queue for failed requests
         retry_queue: asyncio.Queue[RequestContext] = asyncio.Queue()
 
-        # Calculate sleep time for rate limiting
+        # Calculate sleep time for rate limiting (legacy; gating happens in _wait_for_capacity)
         seconds_to_sleep_each_loop = (60.0 * 0.9) / tracker.max_requests_per_minute
 
         # Main dispatch loop - using original pattern but with all prompts
@@ -403,40 +405,37 @@ class _LLMClient(BaseModel):
                 except StopIteration:
                     prompts_not_finished = False
 
-            # Update capacity - original logic
-            tracker.update_capacity()
-
-            # Dispatch if capacity available - original logic
+            # Dispatch using shared capacity gate (consistent with start_nowait)
             if next_context:
-                if tracker.check_capacity(next_context.num_tokens, retry=next_is_retry):
-                    tracker.set_limiting_factor(None)
+                # Wait here until we have capacity to launch this context
+                await self._wait_for_capacity(
+                    next_context.num_tokens, tracker, retry=next_is_retry
+                )
+
+                # Launch simplified request processing
+                async def process_and_store(ctx: RequestContext):
+                    try:
+                        response = await self.process_single_request(ctx, retry_queue)
+                        results[ctx.task_id] = response
+                    except Exception as e:
+                        # Create an error response for validation errors and other exceptions
+                        error_response = APIResponse(
+                            id=ctx.task_id,
+                            model_internal=ctx.model_name,
+                            prompt=ctx.prompt,
+                            sampling_params=ctx.sampling_params,
+                            status_code=None,
+                            is_error=True,
+                            error_message=str(e),
+                        )
+                        results[ctx.task_id] = error_response
+                        # Mark task as completed so the main loop can finish
+                        if ctx.status_tracker:
+                            ctx.status_tracker.task_failed(ctx.task_id)
 
-                    # Launch simplified request processing
-                    async def process_and_store(ctx: RequestContext):
-                        try:
-                            response = await self.process_single_request(
-                                ctx, retry_queue
-                            )
-                            results[ctx.task_id] = response
-                        except Exception as e:
-                            # Create an error response for validation errors and other exceptions
-                            error_response = APIResponse(
-                                id=ctx.task_id,
-                                model_internal=ctx.model_name,
-                                prompt=ctx.prompt,
-                                sampling_params=ctx.sampling_params,
-                                status_code=None,
-                                is_error=True,
-                                error_message=str(e),
-                            )
-                            results[ctx.task_id] = error_response
-                            # Mark task as completed so the main loop can finish
-                            if ctx.status_tracker:
-                                ctx.status_tracker.task_failed(ctx.task_id)
-
-                    asyncio.create_task(process_and_store(next_context))
-                    next_context = None  # Reset after successful dispatch
-                    next_is_retry = False
+                asyncio.create_task(process_and_store(next_context))
+                next_context = None  # Reset after successful dispatch
+                next_is_retry = False
 
             # Update progress - original logic
             tracker.update_pbar()
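
The dispatch path above now routes every launch through the shared capacity gate and runs each request as a fire-and-forget asyncio task whose failures are converted into error results, so the main loop always sees the task finish. In isolation the pattern looks roughly like this; send_request, dispatch_all, and the integer task ids are made up for illustration, not lm-deluge's actual types.

import asyncio

async def send_request(task_id: int) -> str:
    # Placeholder for the real API call.
    return f"response for task {task_id}"

async def dispatch_all(task_ids: list[int]) -> dict[int, str]:
    results: dict[int, str] = {}

    async def process_and_store(task_id: int) -> None:
        try:
            results[task_id] = await send_request(task_id)
        except Exception as e:
            # Record the failure as a result so no task is lost silently.
            results[task_id] = f"error: {e}"

    # Fire-and-forget launches; references are kept so they can be awaited.
    tasks = [asyncio.create_task(process_and_store(t)) for t in task_ids]
    await asyncio.gather(*tasks)
    return results

print(asyncio.run(dispatch_all([1, 2, 3])))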
@@ -448,8 +447,8 @@ class _LLMClient(BaseModel):
             ) and retry_queue.empty():
                 break
 
-            # Sleep - original logic
-            await asyncio.sleep(seconds_to_sleep_each_loop + tracker.seconds_to_pause)
+            # Yield briefly to allow in-flight tasks to progress
+            await asyncio.sleep(min(0.01, seconds_to_sleep_each_loop))
 
         if not tracker_preopened:
             self.close()
{lm_deluge-0.0.43 → lm_deluge-0.0.45/src/lm_deluge.egg-info}/PKG-INFO

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: lm_deluge
-Version: 0.0.43
+Version: 0.0.45
 Summary: Python utility for using LLM API models.
 Author-email: Benjamin Anderson <ben@trytaylor.ai>
 Requires-Python: >=3.10