lm-deluge 0.0.76__py3-none-any.whl → 0.0.79__py3-none-any.whl

This diff compares publicly available package versions released to a supported registry. It is provided for informational purposes only and reflects the changes between the two versions as they appear in the public registry.
@@ -23,6 +23,21 @@ async def _build_gemini_request(
 ) -> dict:
     system_message, messages = prompt.to_gemini()
 
+    # For Gemini 3, inject dummy signatures when missing for function calls
+    is_gemini_3 = "gemini-3" in model.name.lower()
+    if is_gemini_3:
+        dummy_sig = "context_engineering_is_the_way_to_go"
+        for msg in messages:
+            if "parts" in msg:
+                for part in msg["parts"]:
+                    # For function calls, inject dummy signature if missing
+                    if "functionCall" in part and "thoughtSignature" not in part:
+                        part["thoughtSignature"] = dummy_sig
+                        maybe_warn(
+                            "WARN_GEMINI3_MISSING_SIGNATURE",
+                            part_type="function call",
+                        )
+
     request_json = {
         "contents": messages,
         "generationConfig": {
@@ -40,17 +55,44 @@ async def _build_gemini_request(
     if model.reasoning_model:
         thinking_config: dict[str, Any] | None = None
         effort = sampling_params.reasoning_effort
-        if effort is None or effort == "none":
-            budget = 128 if "2.5-pro" in model.id else 0
-            # Explicitly disable thoughts when no effort is requested
-            thinking_config = {"includeThoughts": False, "thinkingBudget": budget}
+        is_gemini_3 = "gemini-3" in model.name.lower()
+
+        if is_gemini_3:
+            # Gemini 3 uses thinkingLevel instead of thinkingBudget
+            if effort in {"none", "minimal"}:
+                thinking_config = {"thinkingLevel": "low"}
+            elif effort is None:
+                # Default to high when reasoning is enabled but no preference was provided
+                thinking_config = {"thinkingLevel": "high"}
+            else:
+                # Map reasoning_effort to thinkingLevel
+                level_map = {
+                    "minimal": "low",
+                    "low": "low",
+                    "medium": "medium",  # Will work when supported
+                    "high": "high",
+                }
+                thinking_level = level_map.get(effort, "high")
+                thinking_config = {"thinkingLevel": thinking_level}
         else:
-            thinking_config = {"includeThoughts": True}
-            if effort in {"minimal", "low", "medium", "high"} and "flash" in model.id:
-                budget = {"minimal": 256, "low": 1024, "medium": 4096, "high": 16384}[
-                    effort
-                ]
-                thinking_config["thinkingBudget"] = budget
+            # Gemini 2.5 uses thinkingBudget (legacy)
+            if effort is None or effort == "none":
+                budget = 128 if "2.5-pro" in model.id else 0
+                # Explicitly disable thoughts when no effort is requested
+                thinking_config = {"includeThoughts": False, "thinkingBudget": budget}
+            else:
+                thinking_config = {"includeThoughts": True}
+                if (
+                    effort in {"minimal", "low", "medium", "high"}
+                    and "flash" in model.id
+                ):
+                    budget = {
+                        "minimal": 256,
+                        "low": 1024,
+                        "medium": 4096,
+                        "high": 16384,
+                    }[effort]
+                    thinking_config["thinkingBudget"] = budget
         request_json["generationConfig"]["thinkingConfig"] = thinking_config
 
     else:
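A hedged restatement of the mapping this branch produces, assuming only the model-name checks shown above (a "gemini-3" substring selects the thinkingLevel path; otherwise the 2.5-era thinkingBudget path runs). The real code operates on model/sampling_params objects rather than bare arguments:

```python
# Standalone sketch of the branch above for reference.
def sketch_thinking_config(effort: str | None, gemini_3: bool, flash: bool) -> dict:
    if gemini_3:
        # Gemini 3 does not fully disable thinking; "none" is clamped to "low"
        if effort in {"none", "minimal"}:
            return {"thinkingLevel": "low"}
        if effort is None:
            return {"thinkingLevel": "high"}
        return {"thinkingLevel": {"low": "low", "medium": "medium", "high": "high"}.get(effort, "high")}
    if effort is None or effort == "none":
        # (the real code keeps a 128-token floor for 2.5 Pro)
        return {"includeThoughts": False, "thinkingBudget": 0}
    cfg: dict = {"includeThoughts": True}
    if flash and effort in {"minimal", "low", "medium", "high"}:
        cfg["thinkingBudget"] = {"minimal": 256, "low": 1024, "medium": 4096, "high": 16384}[effort]
    return cfg

assert sketch_thinking_config("medium", gemini_3=True, flash=False) == {"thinkingLevel": "medium"}
assert sketch_thinking_config("low", gemini_3=False, flash=True) == {
    "includeThoughts": True,
    "thinkingBudget": 1024,
}
```

Note that in the Gemini 3 branch the "minimal" entry of level_map is unreachable, since "minimal" is already caught by the first check.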
@@ -66,6 +108,21 @@ async def _build_gemini_request(
     if sampling_params.json_mode and model.supports_json:
         request_json["generationConfig"]["responseMimeType"] = "application/json"
 
+    # Handle media_resolution for Gemini 3 (requires v1alpha)
+    if sampling_params.media_resolution is not None:
+        is_gemini_3 = "gemini-3" in model.name.lower()
+        if is_gemini_3:
+            # Add global media resolution to generationConfig
+            request_json["generationConfig"]["mediaResolution"] = {
+                "level": sampling_params.media_resolution
+            }
+        else:
+            # Warn if trying to use media_resolution on non-Gemini-3 models
+            maybe_warn(
+                "WARN_MEDIA_RESOLUTION_UNSUPPORTED",
+                model_name=model.name,
+            )
+
     return request_json
 
 
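For illustration, the generationConfig fragment the block above emits for a Gemini 3 request at medium resolution (a sketch with other keys omitted, not captured output):

```python
# Resulting request shape when media_resolution is set on a Gemini 3
# model; on other models the field is dropped with a warning instead.
request_json = {
    "contents": [],  # messages elided
    "generationConfig": {
        "mediaResolution": {"level": "media_resolution_medium"},
    },
}
```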
@@ -137,10 +194,19 @@ class GeminiRequest(APIRequestBase):
         candidate = data["candidates"][0]
         if "content" in candidate and "parts" in candidate["content"]:
             for part in candidate["content"]["parts"]:
+                # Extract thought signature if present
+                thought_sig = part.get("thoughtSignature")
+
                 if "text" in part:
                     parts.append(Text(part["text"]))
                 elif "thought" in part:
-                    parts.append(Thinking(part["thought"]))
+                    # Thought with optional signature
+                    parts.append(
+                        Thinking(
+                            content=part["thought"],
+                            thought_signature=thought_sig,
+                        )
+                    )
                 elif "functionCall" in part:
                     func_call = part["functionCall"]
                     # Generate a unique ID since Gemini doesn't provide one
@@ -152,6 +218,7 @@ class GeminiRequest(APIRequestBase):
                         id=tool_id,
                         name=func_call["name"],
                         arguments=func_call.get("args", {}),
+                        thought_signature=thought_sig,
                     )
                 )
 
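Taken together, the two response-side changes let signatures round-trip: the signature captured from a part is attached to both Thinking and ToolCall, so it can be replayed on the next request. A self-contained sketch with stand-in dataclasses (the real Thinking/ToolCall classes live elsewhere in lm-deluge; only the keyword names are taken from the diff):

```python
import uuid
from dataclasses import dataclass

# Stand-ins that are keyword-compatible with the constructor calls in
# the diff; the real classes are defined elsewhere in lm-deluge.
@dataclass
class Thinking:
    content: str
    thought_signature: str | None = None

@dataclass
class ToolCall:
    id: str
    name: str
    arguments: dict
    thought_signature: str | None = None

raw_parts = [
    {"thought": "plan the call", "thoughtSignature": "sig-abc"},
    {"functionCall": {"name": "search", "args": {"q": "weather"}}, "thoughtSignature": "sig-abc"},
]
parsed = []
for part in raw_parts:
    sig = part.get("thoughtSignature")
    if "thought" in part:
        parsed.append(Thinking(content=part["thought"], thought_signature=sig))
    elif "functionCall" in part:
        fc = part["functionCall"]
        # Gemini doesn't return tool-call IDs, so one is generated locally
        parsed.append(
            ToolCall(
                id=str(uuid.uuid4()),
                name=fc["name"],
                arguments=fc.get("args", {}),
                thought_signature=sig,
            )
        )
assert parsed[1].thought_signature == "sig-abc"
```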
lm_deluge/client.py CHANGED
@@ -262,6 +262,7 @@ class _LLMClient(BaseModel):
         self.max_tokens_per_minute = max_tokens_per_minute
         if max_concurrent_requests:
             self.max_concurrent_requests = max_concurrent_requests
+        return self
 
     def _get_tracker(self) -> StatusTracker:
         if self._tracker is None:
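The added `return self` makes this setter fluent. A hypothetical sketch, since the enclosing method's `def` line falls outside the hunk and its real name is unknown:

```python
class ClientSketch:
    # Illustrative method name; only the body and the new `return self`
    # come from the diff.
    def set_limits(self, max_tokens_per_minute=None, max_concurrent_requests=None):
        self.max_tokens_per_minute = max_tokens_per_minute
        if max_concurrent_requests:
            self.max_concurrent_requests = max_concurrent_requests
        return self  # new in 0.0.79: enables chaining

client = ClientSketch().set_limits(max_tokens_per_minute=100_000, max_concurrent_requests=32)
```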
lm_deluge/config.py CHANGED
@@ -12,6 +12,13 @@ class SamplingParams(BaseModel):
     logprobs: bool = False
     top_logprobs: int | None = None
     strict_tools: bool = True
+    # Gemini 3 only - controls multimodal vision processing fidelity
+    media_resolution: (
+        Literal[
+            "media_resolution_low", "media_resolution_medium", "media_resolution_high"
+        ]
+        | None
+    ) = None
 
     def to_vllm(self):
         try:
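Usage sketch for the new field, assuming the import path implied by the file header (lm_deluge/config.py) and that the model's other fields all carry defaults; on non-Gemini-3 models the request builder warns and ignores it, per the hunk above:

```python
from lm_deluge.config import SamplingParams  # path assumed from the file header

# High-fidelity vision processing; only honored on Gemini 3 models.
params = SamplingParams(media_resolution="media_resolution_high")
assert params.media_resolution == "media_resolution_high"
```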