lm-deluge 0.0.53__tar.gz → 0.0.54__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (80)
  1. {lm_deluge-0.0.53/src/lm_deluge.egg-info → lm_deluge-0.0.54}/PKG-INFO +1 -1
  2. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/pyproject.toml +1 -1
  3. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/__init__.py +3 -4
  4. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/client.py +54 -124
  5. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/llm_tools/extract.py +7 -5
  6. {lm_deluge-0.0.53 → lm_deluge-0.0.54/src/lm_deluge.egg-info}/PKG-INFO +1 -1
  7. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/LICENSE +0 -0
  8. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/README.md +0 -0
  9. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/setup.cfg +0 -0
  10. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/agent.py +0 -0
  11. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/__init__.py +0 -0
  12. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/anthropic.py +0 -0
  13. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/base.py +0 -0
  14. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/bedrock.py +0 -0
  15. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/common.py +0 -0
  16. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/deprecated/bedrock.py +0 -0
  17. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/deprecated/cohere.py +0 -0
  18. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/deprecated/deepseek.py +0 -0
  19. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/deprecated/mistral.py +0 -0
  20. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/deprecated/vertex.py +0 -0
  21. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/gemini.py +0 -0
  22. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/mistral.py +0 -0
  23. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/openai.py +0 -0
  24. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/api_requests/response.py +0 -0
  25. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/batches.py +0 -0
  26. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/built_in_tools/anthropic/__init__.py +0 -0
  27. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/built_in_tools/anthropic/bash.py +0 -0
  28. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/built_in_tools/anthropic/computer_use.py +0 -0
  29. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/built_in_tools/anthropic/editor.py +0 -0
  30. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/built_in_tools/base.py +0 -0
  31. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/built_in_tools/openai.py +0 -0
  32. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/cache.py +0 -0
  33. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/cli.py +0 -0
  34. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/config.py +0 -0
  35. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/embed.py +0 -0
  36. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/errors.py +0 -0
  37. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/file.py +0 -0
  38. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/gemini_limits.py +0 -0
  39. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/image.py +0 -0
  40. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/llm_tools/__init__.py +0 -0
  41. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/llm_tools/classify.py +0 -0
  42. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/llm_tools/locate.py +0 -0
  43. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/llm_tools/ocr.py +0 -0
  44. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/llm_tools/score.py +0 -0
  45. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/llm_tools/translate.py +0 -0
  46. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/__init__.py +0 -0
  47. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/anthropic.py +0 -0
  48. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/bedrock.py +0 -0
  49. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/cerebras.py +0 -0
  50. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/cohere.py +0 -0
  51. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/deepseek.py +0 -0
  52. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/fireworks.py +0 -0
  53. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/google.py +0 -0
  54. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/grok.py +0 -0
  55. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/groq.py +0 -0
  56. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/meta.py +0 -0
  57. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/mistral.py +0 -0
  58. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/openai.py +0 -0
  59. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/openrouter.py +0 -0
  60. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/models/together.py +0 -0
  61. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/presets/cerebras.py +0 -0
  62. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/presets/meta.py +0 -0
  63. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/prompt.py +0 -0
  64. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/request_context.py +0 -0
  65. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/rerank.py +0 -0
  66. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/tool.py +0 -0
  67. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/tracker.py +0 -0
  68. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/usage.py +0 -0
  69. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/util/harmony.py +0 -0
  70. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/util/json.py +0 -0
  71. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/util/logprobs.py +0 -0
  72. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/util/spatial.py +0 -0
  73. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/util/validation.py +0 -0
  74. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/util/xml.py +0 -0
  75. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge.egg-info/SOURCES.txt +0 -0
  76. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge.egg-info/dependency_links.txt +0 -0
  77. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge.egg-info/requires.txt +0 -0
  78. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge.egg-info/top_level.txt +0 -0
  79. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/tests/test_builtin_tools.py +0 -0
  80. {lm_deluge-0.0.53 → lm_deluge-0.0.54}/tests/test_native_mcp_server.py +0 -0

{lm_deluge-0.0.53/src/lm_deluge.egg-info → lm_deluge-0.0.54}/PKG-INFO
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: lm_deluge
-Version: 0.0.53
+Version: 0.0.54
 Summary: Python utility for using LLM API models.
 Author-email: Benjamin Anderson <ben@trytaylor.ai>
 Requires-Python: >=3.10

{lm_deluge-0.0.53 → lm_deluge-0.0.54}/pyproject.toml
@@ -3,7 +3,7 @@ requires = ["setuptools", "wheel"]
 
 [project]
 name = "lm_deluge"
-version = "0.0.53"
+version = "0.0.54"
 authors = [{ name = "Benjamin Anderson", email = "ben@trytaylor.ai" }]
 description = "Python utility for using LLM API models."
 readme = "README.md"

{lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/__init__.py
@@ -1,10 +1,9 @@
-from .client import LLMClient, SamplingParams, APIResponse
+from .client import APIResponse, LLMClient, SamplingParams
+from .file import File
 from .prompt import Conversation, Message
 from .tool import Tool
-from .file import File
-import dotenv
 
-dotenv.load_dotenv()
+# dotenv.load_dotenv() - don't do this, fucks with other packages
 
 __all__ = [
     "LLMClient",

{lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/client.py
@@ -80,6 +80,22 @@ class _LLMClient(BaseModel):
         self._tracker.log_final_status()
         self._tracker = None
 
+    def reset_tracker(self):
+        """Reset tracker by closing and reopening with fresh state.
+
+        Useful when reusing a client across multiple batches and you want
+        the progress bar to start from 0 instead of showing cumulative totals.
+        """
+        if self._tracker is None:
+            return
+
+        # Close existing tracker (including progress bar)
+        show_progress = self._tracker.use_progress_bar
+        self.close()
+
+        # Create fresh tracker
+        self.open(total=0, show_progress=show_progress)
+
     # NEW! Builder methods
     def with_model(self, model: str):
         self.model_names = [model]
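
For context on reset_tracker, here is a usage sketch that reuses one client across two batches with a persistent tracker. The model name and prompts are hypothetical and the LLMClient constructor call is an assumption, not taken from this diff; open(), close(), reset_tracker() and process_prompts_async() are the methods shown in these hunks.

import asyncio

from lm_deluge import LLMClient


async def main():
    client = LLMClient("gpt-4o-mini")  # hypothetical construction; build your client as usual
    client.open(total=0, show_progress=True)  # keep one tracker alive across batches

    # First batch: the progress bar counts up to the size of this batch.
    await client.process_prompts_async(["What is 2 + 2?", "Name a prime number."])

    # Start the progress bar at 0 for the next batch instead of showing cumulative totals.
    client.reset_tracker()

    await client.process_prompts_async(["Translate 'hello' to French."])
    client.close()


asyncio.run(main())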

{lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/client.py (continued)
@@ -353,147 +369,61 @@ class _LLMClient(BaseModel):
         cache: CachePattern | None = None,
         use_responses_api: bool = False,
     ) -> list[APIResponse | None] | list[str | None] | dict[str, int]:
-        # Convert prompts to Conversations - no upfront cache checking for dynamic caching!
-        prompts = prompts_to_conversations(prompts)
-        ids = list(range(len(prompts)))
-        results: list[APIResponse | None] = [None for _ in range(len(prompts))]
-        contexts: list[RequestContext | None] = [None for _ in range(len(prompts))]
-        inflight_tasks: set[asyncio.Task[None]] = set()
-        # Use existing tracker if client has been opened; otherwise open/close automatically
-        tracker: StatusTracker
-        tracker_preopened = self._tracker is not None
-        if tracker_preopened:
-            tracker = self._tracker  # type: ignore[assignment]
-            tracker.add_to_total(len(prompts))
-        else:
-            self.open(total=len(prompts), show_progress=show_progress)
-            tracker = self._tracker  # type: ignore[assignment]
-        assert tracker is not None
+        """Process multiple prompts asynchronously using the start_nowait/wait_for_all backend.
 
-        # Create retry queue for failed requests
-        retry_queue: asyncio.Queue[RequestContext] = asyncio.Queue()
-
-        # Calculate sleep time for rate limiting (legacy; gating happens in _wait_for_capacity)
-        seconds_to_sleep_each_loop = (60.0 * 0.9) / tracker.max_requests_per_minute
-
-        # Main dispatch loop - using original pattern but with all prompts
-        next_context = None  # Persist across iterations like original
-        next_is_retry = False  # Track whether next_context is a retry
-        prompts_not_finished = True
-        prompts_iter = iter(zip(ids, prompts))
-
-        while True:
-            # Get next context (retry or new) - only if we don't already have one waiting
-            if next_context is None:
-                if not retry_queue.empty():
-                    next_context = retry_queue.get_nowait()
-                    next_is_retry = True
-                    print(f"Retrying request {next_context.task_id}.")
-                elif prompts_not_finished:
-                    try:
-                        task_id, prompt = next(prompts_iter)
-                        model, sampling_params = self._select_model()
-                        assert isinstance(prompt, Conversation)
-                        next_context = RequestContext(
-                            task_id=task_id,
-                            model_name=model,
-                            prompt=prompt,
-                            sampling_params=sampling_params,
-                            attempts_left=self.max_attempts,
-                            request_timeout=self.request_timeout,
-                            status_tracker=tracker,
-                            tools=tools,
-                            cache=cache,
-                            use_responses_api=use_responses_api,
-                            extra_headers=self.extra_headers,
-                            force_local_mcp=self.force_local_mcp,
-                        )
-
-                        next_is_retry = False
-                    except StopIteration:
-                        prompts_not_finished = False
-
-            # Dispatch using shared capacity gate (consistent with start_nowait)
-            if next_context:
-                # Wait here until we have capacity to launch this context
-                await self._wait_for_capacity(
-                    next_context.num_tokens, tracker, retry=next_is_retry
-                )
-
-                # Launch simplified request processing
-                contexts[next_context.task_id] = next_context
-
-                async def process_and_store(ctx: RequestContext):
-                    try:
-                        response = await self.process_single_request(ctx, retry_queue)
-                        results[ctx.task_id] = response
-                    except BaseException as exc:
-                        # Capture cancellations and other BaseExceptions before fallback response fires.
-                        error_response = APIResponse(
-                            id=ctx.task_id,
-                            model_internal=ctx.model_name,
-                            prompt=ctx.prompt,
-                            sampling_params=ctx.sampling_params,
-                            status_code=None,
-                            is_error=True,
-                            error_message=f"{type(exc).__name__}: {exc}",
-                            raw_response={"exception_repr": repr(exc)},
-                        )
-                        results[ctx.task_id] = error_response
-                        if ctx.status_tracker:
-                            ctx.status_tracker.task_failed(ctx.task_id)
-                        raise
-
-                task = asyncio.create_task(process_and_store(next_context))
-                inflight_tasks.add(task)
-                task.add_done_callback(inflight_tasks.discard)
-                next_context = None  # Reset after successful dispatch
-                next_is_retry = False
-
-            # Update progress - original logic
-            tracker.update_pbar()
-
-            # Check completion: consider final outcomes, not in-progress count
-            # This avoids rare hangs if in-progress is miscounted (e.g., double-increment).
-            if (tracker.num_tasks_succeeded + tracker.num_tasks_failed) >= len(
-                prompts
-            ) and retry_queue.empty():
-                break
+        This implementation creates all tasks upfront and waits for them to complete,
+        avoiding issues with tracker state accumulating across multiple calls.
+        """
+        # Convert prompts to Conversations
+        prompts = prompts_to_conversations(prompts)
 
-            # Yield briefly to allow in-flight tasks to progress
-            await asyncio.sleep(min(0.01, seconds_to_sleep_each_loop))
+        # Ensure tracker exists (start_nowait will call add_to_total for each task)
+        if self._tracker is None:
+            self.open(total=0, show_progress=show_progress)
+            tracker_preopened = False
+        else:
+            tracker_preopened = True
+
+        # Start all tasks using start_nowait - tasks will coordinate via shared capacity lock
+        task_ids = []
+        for prompt in prompts:
+            assert isinstance(prompt, Conversation)
+            task_id = self.start_nowait(
+                prompt,
+                tools=tools,
+                cache=cache,
+                use_responses_api=use_responses_api,
+            )
+            task_ids.append(task_id)
 
-        if inflight_tasks:
-            await asyncio.gather(*inflight_tasks, return_exceptions=True)
+        # Wait for all tasks to complete
+        results = await self.wait_for_all(task_ids)
 
+        # Close tracker if we opened it
         if not tracker_preopened:
             self.close()
 
+        # Defensive check: This should rarely happen, but provides a safety net
         for idx, response in enumerate(results):
             if response is None:
-                ctx = contexts[idx]
-                prompt = ctx.prompt if ctx else prompts[idx]
-                sampling_params = (
-                    ctx.sampling_params
-                    if ctx
-                    else self.sampling_params[0]
-                    if self.sampling_params
-                    else SamplingParams()
+                # This should only happen if there's a bug in _run_context
+                print(
+                    f"WARNING: result[{idx}] is None! Creating defensive error response. "
+                    f"Please report this bug."
                 )
-                model_name = ctx.model_name if ctx else self.model_names[0]
-                assert isinstance(
-                    prompt, Conversation
-                ), "expected prompt to be a conversation"
                 results[idx] = APIResponse(
                     id=idx,
-                    model_internal=model_name,
-                    prompt=prompt,
-                    sampling_params=sampling_params,
+                    model_internal=self.model_names[0],
+                    prompt=prompts[idx],  # type: ignore
+                    sampling_params=self.sampling_params[0]
+                    if self.sampling_params
+                    else SamplingParams(),
                     status_code=None,
                     is_error=True,
                     error_message="Internal error: no response produced.",
                 )
 
+        # Handle return format
         if return_completions_only:
             return [r.completion if r is not None else None for r in results]
 
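
The rewrite above routes process_prompts_async through the same primitives it exposes for incremental submission. A sketch of using them directly, under the same assumptions as the previous example (hypothetical model name and constructor; start_nowait() and wait_for_all() are the calls shown in the new implementation):

import asyncio

from lm_deluge import LLMClient


async def main():
    client = LLMClient("gpt-4o-mini")  # hypothetical construction
    client.open(total=0, show_progress=True)

    # Each start_nowait call registers a request and returns a task id immediately;
    # throttling happens through the client's shared capacity gate.
    task_ids = [client.start_nowait(p) for p in ["First prompt", "Second prompt"]]

    # wait_for_all returns APIResponse objects in the same order as the task ids,
    # which is how the new process_prompts_async pairs results with prompts.
    for resp in await client.wait_for_all(task_ids):
        if resp is not None and not resp.is_error:
            print(resp.completion)

    client.close()


asyncio.run(main())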

{lm_deluge-0.0.53 → lm_deluge-0.0.54}/src/lm_deluge/llm_tools/extract.py
@@ -1,11 +1,12 @@
 import asyncio
 import io
 import json
+import os
 from typing import Any
 
+from lm_deluge.client import _LLMClient
 from lm_deluge.file import File
 
-from ..client import LLMClient
 from ..prompt import Conversation
 from ..util.json import load_json
 
@@ -18,7 +19,7 @@ except ImportError:
 async def extract_async(
     inputs: list[str | Any],
     schema: Any,
-    client: LLMClient,
+    client: _LLMClient,
     document_name: str | None = None,
     object_name: str | None = None,
     show_progress: bool = True,
@@ -32,12 +33,13 @@ async def extract_async(
         raise ValueError("schema must be a pydantic model or a dict.")
 
     # warn if json_mode is not True
+    has_warned = os.environ.get("LM_DELUGE_WARN_JSON_MODE", False)
     for sp in client.sampling_params:
-        if sp.json_mode is False:
+        if sp.json_mode is False and not has_warned:
             print(
                 "Warning: json_mode is False for one or more sampling params. You may get invalid output."
             )
-            break
+            os.environ["LM_DELUGE_WARN_JSON_MODE"] = "True"
     # check_schema(schema_dict) -- figure out later
     if document_name is None:
         document_name = "text"
@@ -111,7 +113,7 @@ async def extract_async(
 def extract(
     inputs: list[str | Any],
     schema: Any,
-    client: LLMClient,
+    client: _LLMClient,
     document_name: str | None = None,
     object_name: str | None = None,
     show_progress: bool = True,
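
Because the warning guard is an environment variable, later extract()/extract_async() calls in the same process skip the json_mode warning once the flag has been set. Setting the same flag up front suppresses it entirely; the variable name is taken directly from the diff above:

import os

# Pre-set the flag that extract_async sets after warning, so the json_mode warning is never printed.
os.environ["LM_DELUGE_WARN_JSON_MODE"] = "True"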

{lm_deluge-0.0.53 → lm_deluge-0.0.54/src/lm_deluge.egg-info}/PKG-INFO
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: lm_deluge
-Version: 0.0.53
+Version: 0.0.54
 Summary: Python utility for using LLM API models.
 Author-email: Benjamin Anderson <ben@trytaylor.ai>
 Requires-Python: >=3.10