PyPI - lm-deluge - Versions diffs - 0.0.67__py3-none-any.whl → 0.0.90__py3-none-any.whl - Mend

lm-deluge 0.0.67__py3-none-any.whl → 0.0.90__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of lm-deluge might be problematic. Click here for more details.

Files changed (108) hide show

lm_deluge/__init__.py +1 -2
lm_deluge/api_requests/anthropic.py +117 -22
lm_deluge/api_requests/base.py +84 -11
lm_deluge/api_requests/bedrock.py +30 -6
lm_deluge/api_requests/chat_reasoning.py +4 -0
lm_deluge/api_requests/gemini.py +166 -20
lm_deluge/api_requests/openai.py +145 -25
lm_deluge/batches.py +15 -45
lm_deluge/client.py +309 -50
lm_deluge/config.py +15 -3
lm_deluge/models/__init__.py +14 -1
lm_deluge/models/anthropic.py +29 -14
lm_deluge/models/arcee.py +16 -0
lm_deluge/models/deepseek.py +36 -4
lm_deluge/models/google.py +42 -0
lm_deluge/models/grok.py +24 -0
lm_deluge/models/kimi.py +36 -0
lm_deluge/models/minimax.py +18 -0
lm_deluge/models/openai.py +100 -0
lm_deluge/models/openrouter.py +133 -7
lm_deluge/models/together.py +11 -0
lm_deluge/models/zai.py +50 -0
lm_deluge/pipelines/gepa/__init__.py +95 -0
lm_deluge/pipelines/gepa/core.py +354 -0
lm_deluge/pipelines/gepa/docs/samples.py +705 -0
lm_deluge/pipelines/gepa/examples/01_synthetic_keywords.py +140 -0
lm_deluge/pipelines/gepa/examples/02_gsm8k_math.py +261 -0
lm_deluge/pipelines/gepa/examples/03_hotpotqa_multihop.py +300 -0
lm_deluge/pipelines/gepa/examples/04_batch_classification.py +271 -0
lm_deluge/pipelines/gepa/examples/simple_qa.py +129 -0
lm_deluge/pipelines/gepa/optimizer.py +435 -0
lm_deluge/pipelines/gepa/proposer.py +235 -0
lm_deluge/pipelines/gepa/util.py +165 -0
lm_deluge/{llm_tools → pipelines}/score.py +2 -2
lm_deluge/{llm_tools → pipelines}/translate.py +5 -3
lm_deluge/prompt.py +537 -88
lm_deluge/request_context.py +7 -2
lm_deluge/server/__init__.py +24 -0
lm_deluge/server/__main__.py +144 -0
lm_deluge/server/adapters.py +369 -0
lm_deluge/server/app.py +388 -0
lm_deluge/server/auth.py +71 -0
lm_deluge/server/model_policy.py +215 -0
lm_deluge/server/models_anthropic.py +172 -0
lm_deluge/server/models_openai.py +175 -0
lm_deluge/tool/__init__.py +1130 -0
lm_deluge/tool/builtin/anthropic/__init__.py +300 -0
lm_deluge/tool/builtin/anthropic/bash.py +0 -0
lm_deluge/tool/builtin/anthropic/computer_use.py +0 -0
lm_deluge/tool/builtin/gemini.py +59 -0
lm_deluge/tool/builtin/openai.py +74 -0
lm_deluge/tool/cua/__init__.py +173 -0
lm_deluge/tool/cua/actions.py +148 -0
lm_deluge/tool/cua/base.py +27 -0
lm_deluge/tool/cua/batch.py +215 -0
lm_deluge/tool/cua/converters.py +466 -0
lm_deluge/tool/cua/kernel.py +702 -0
lm_deluge/tool/cua/trycua.py +989 -0
lm_deluge/tool/prefab/__init__.py +45 -0
lm_deluge/tool/prefab/batch_tool.py +156 -0
lm_deluge/tool/prefab/docs.py +1119 -0
lm_deluge/tool/prefab/email.py +294 -0
lm_deluge/tool/prefab/filesystem.py +1711 -0
lm_deluge/tool/prefab/full_text_search/__init__.py +285 -0
lm_deluge/tool/prefab/full_text_search/tantivy_index.py +396 -0
lm_deluge/tool/prefab/memory.py +458 -0
lm_deluge/tool/prefab/otc/__init__.py +165 -0
lm_deluge/tool/prefab/otc/executor.py +281 -0
lm_deluge/tool/prefab/otc/parse.py +188 -0
lm_deluge/tool/prefab/random.py +212 -0
lm_deluge/tool/prefab/rlm/__init__.py +296 -0
lm_deluge/tool/prefab/rlm/executor.py +349 -0
lm_deluge/tool/prefab/rlm/parse.py +144 -0
lm_deluge/tool/prefab/sandbox/__init__.py +19 -0
lm_deluge/tool/prefab/sandbox/daytona_sandbox.py +483 -0
lm_deluge/tool/prefab/sandbox/docker_sandbox.py +609 -0
lm_deluge/tool/prefab/sandbox/fargate_sandbox.py +546 -0
lm_deluge/tool/prefab/sandbox/modal_sandbox.py +469 -0
lm_deluge/tool/prefab/sandbox/seatbelt_sandbox.py +827 -0
lm_deluge/tool/prefab/sheets.py +385 -0
lm_deluge/tool/prefab/skills.py +0 -0
lm_deluge/tool/prefab/subagents.py +233 -0
lm_deluge/tool/prefab/todos.py +342 -0
lm_deluge/tool/prefab/tool_search.py +169 -0
lm_deluge/tool/prefab/web_search.py +199 -0
lm_deluge/tracker.py +16 -13
lm_deluge/util/schema.py +412 -0
lm_deluge/warnings.py +8 -0
{lm_deluge-0.0.67.dist-info → lm_deluge-0.0.90.dist-info}/METADATA +23 -9
lm_deluge-0.0.90.dist-info/RECORD +132 -0
lm_deluge/built_in_tools/anthropic/__init__.py +0 -128
lm_deluge/built_in_tools/openai.py +0 -28
lm_deluge/presets/cerebras.py +0 -17
lm_deluge/presets/meta.py +0 -13
lm_deluge/tool.py +0 -849
lm_deluge-0.0.67.dist-info/RECORD +0 -72
lm_deluge/{llm_tools → pipelines}/__init__.py +1 -1
/lm_deluge/{llm_tools → pipelines}/classify.py +0 -0
/lm_deluge/{llm_tools → pipelines}/extract.py +0 -0
/lm_deluge/{llm_tools → pipelines}/locate.py +0 -0
/lm_deluge/{llm_tools → pipelines}/ocr.py +0 -0
/lm_deluge/{built_in_tools/anthropic/bash.py → skills/anthropic.py} +0 -0
/lm_deluge/{built_in_tools/anthropic/computer_use.py → skills/compat.py} +0 -0
/lm_deluge/{built_in_tools → tool/builtin}/anthropic/editor.py +0 -0
/lm_deluge/{built_in_tools → tool/builtin}/base.py +0 -0
{lm_deluge-0.0.67.dist-info → lm_deluge-0.0.90.dist-info}/WHEEL +0 -0
{lm_deluge-0.0.67.dist-info → lm_deluge-0.0.90.dist-info}/licenses/LICENSE +0 -0
{lm_deluge-0.0.67.dist-info → lm_deluge-0.0.90.dist-info}/top_level.txt +0 -0

lm_deluge/tool/cua/actions.py ADDED Viewed

@@ -0,0 +1,148 @@
+from typing import Any, List, Literal, TypedDict, Union
+Coord = tuple[int, int]  # pair of ints, presumably (x, y); element type of Drag.path
+class CUActionBase(TypedDict):  # Common base for every computer-use action TypedDict in this module.
+    kind: str | Any  # discriminator; each subclass narrows it to one Literal string
+class Click(CUActionBase):  # Single click with a selectable mouse button.
+    kind: Literal["click"]
+    x: int | None  # if missing (None), current cursor position
+    y: int | None  # same convention as x
+    button: Literal["left", "right", "middle", "back", "forward"]  # which mouse button to click
+class DoubleClick(CUActionBase):  # Double click; unlike Click it carries no button field.
+    kind: Literal["double_click"]
+    x: int | None  # if missing (None), current cursor position
+    y: int | None  # same convention as x
+class Move(CUActionBase):  # Move the cursor; both coordinates are mandatory ints (no None allowed).
+    kind: Literal["move"]
+    x: int  # target x coordinate
+    y: int  # target y coordinate
+class Drag(CUActionBase):  # Drag gesture: optional start point plus a list of Coord waypoints.
+    kind: Literal["drag"]
+    start_x: int | None  # if missing (None), current cursor position
+    start_y: int | None  # if missing (None), current cursor position
+    path: List[Coord]  # path to drag after mousedown
+class Scroll(CUActionBase):  # Scroll by (dx, dy) at an optional position.
+    kind: Literal["scroll"]
+    x: int | None  # if not provided (None), current cursor position
+    y: int | None  # if not provided (None), current cursor position
+    dx: int  # horizontal scroll amount; scroll_x in OpenAI
+    dy: int  # vertical scroll amount; scroll_y in OpenAI
+class Keypress(CUActionBase):  # Press one or more keys.
+    kind: Literal["keypress"]
+    keys: List[str]  # key names; presumably pressed together as a combo — confirm with the executor
+class Type(CUActionBase):  # Type a string of text.
+    kind: Literal["type"]
+    text: str  # the text to type
+class Wait(CUActionBase):  # Pause before the next action.
+    kind: Literal["wait"]
+    ms: int  # wait duration, presumably in milliseconds (field name) — confirm with the executor
+class Screenshot(CUActionBase):  # Request a screen capture; carries no fields besides kind.
+    kind: Literal["screenshot"]
+class MouseDown(CUActionBase):  # Press a mouse button; MouseUp is the matching release.
+    kind: Literal["mouse_down"]
+    button: Literal["left", "right", "middle", "back", "forward"]  # which mouse button to press
+class MouseUp(CUActionBase):  # Release a mouse button; counterpart of MouseDown.
+    kind: Literal["mouse_up"]
+    button: Literal["left", "right", "middle", "back", "forward"]  # which mouse button to release
+class CursorPos(CUActionBase):  # Cursor-position query (per its kind); carries no fields besides kind.
+    kind: Literal["cursor_position"]
+class HoldKey(CUActionBase):  # Hold a single key down for a duration.
+    kind: Literal["hold_key"]
+    key: str  # the key to hold
+    ms: int  # duration, presumably in milliseconds (field name) — confirm with the executor
+class TripleClick(CUActionBase):  # Triple click; same fields as DoubleClick.
+    kind: Literal["triple_click"]
+    x: int | None  # if missing (None), current cursor position
+    y: int | None  # same convention as x
+# ── Browser‑level actions ────────────────────────────────────────────
+class Navigate(CUActionBase):  # Browser-level action: navigate to a URL.
+    kind: Literal["navigate"]
+    url: str  # destination URL
+class GoBack(CUActionBase):  # Browser-level "go back" action; carries no fields besides kind.
+    kind: Literal["go_back"]
+class GoForward(CUActionBase):  # Browser-level "go forward" action; carries no fields besides kind.
+    kind: Literal["go_forward"]
+class Search(CUActionBase):  # Browser-level search action.
+    kind: Literal["search"]
+    query: str  # search text; how it is submitted is up to the executor
+# ── Bash / Editor (provider‑independent) ────────────────────────────
+class Bash(CUActionBase):  # Shell action; both payload fields may be None.
+    kind: Literal["bash"]
+    command: str | None  # command text; NOTE(review): presumably None when only restart is requested — confirm
+    restart: bool | None  # NOTE(review): presumably asks the executor to restart the shell — confirm
+class Edit(CUActionBase):  # File view/edit action; field names follow the Anthropic spec (see comment below).
+    kind: Literal["edit"]
+    command: Literal["view", "create", "str_replace", "insert", "undo_edit"]  # which editor operation to run
+    path: str  # file the operation applies to
+    # optional, keep names identical to Anthropic spec
+    file_text: str | None  # presumably the content for "create" — confirm against the Anthropic spec
+    view_range: List[int] | None  # presumably a line range for "view" — confirm against the Anthropic spec
+    old_str: str | None  # presumably the text to find for "str_replace" — confirm
+    new_str: str | None  # presumably the replacement / inserted text — confirm
+    insert_line: int | None  # presumably the line position for "insert" — confirm
+CUAction = Union[  # every concrete action TypedDict defined above; CUActionBase itself is not a member
+    Click,
+    DoubleClick,
+    TripleClick,
+    MouseDown,
+    MouseUp,
+    Drag,
+    Move,
+    Scroll,
+    Keypress,
+    Type,
+    HoldKey,
+    Wait,
+    Screenshot,
+    CursorPos,
+    Navigate,
+    GoBack,
+    GoForward,
+    Search,
+    Bash,
+    Edit,
+]

lm_deluge/tool/cua/base.py ADDED Viewed

@@ -0,0 +1,27 @@
+import abc
+from typing import TypedDict
+from .actions import CUAction
+class Screenshot(TypedDict):  # Captured image payload; NOTE(review): shares its name with the Screenshot action in actions.py
+    media_type: str  # media type of the image; not validated here
+    content: bytes  # raw image bytes
+class CUActionResult(TypedDict):  # Return value of ComputerExecutor.execute.
+    screenshot: Screenshot | None  # image payload, or None when the result carries no image
+    data: dict  # for structured metadata
+class ComputerExecutor(abc.ABC):  # NOTE(review): execute is not an @abc.abstractmethod, so this base class is instantiable
+    """
+    A computer executor is any class that can take an action (from actions.py)
+    and "execute" it. This allows us to plug any API provider (OpenAI, Anthropic)
+    into any computer-use backend (BrowserBase, Kernel, Modal sandbox) by:
+    - Mapping each provider's tools to some (sub)set of CUActions
+    - Defining how to run each CUAction on that backend
+    """
+    def execute(self, action: CUAction) -> CUActionResult:  # synchronous signature; default body always raises
+        raise NotImplementedError("Subclasses must implement execute method")

lm_deluge/tool/cua/batch.py ADDED Viewed

@@ -0,0 +1,215 @@
+"""
+Batch tool for computer use actions.
+Allows Claude to submit multiple computer actions in a single tool call,
+executing them sequentially and returning only one screenshot at the end.
+This dramatically reduces roundtrips for common action sequences like:
+- Ctrl+L → type URL → Return → wait → screenshot
+"""
+from __future__ import annotations
+import base64
+from typing import Any
+from .. import Tool
+from .converters import anthropic_tool_call_to_action
+# Define the action schema matching Anthropic's computer tool
+ACTION_SCHEMA = {  # JSON Schema for ONE action object; used as the "items" schema of the batch tool's "actions" array
+    "type": "object",
+    "properties": {
+        "action": {
+            "type": "string",
+            "enum": [
+                "screenshot",
+                "key",
+                "type",
+                "mouse_move",
+                "left_click",
+                "left_click_drag",  # NOTE(review): no start-coordinate property is declared below — confirm how the drag start is supplied
+                "right_click",
+                "middle_click",
+                "double_click",
+                "triple_click",
+                "scroll",
+                "wait",
+                "cursor_position",
+            ],
+            "description": "The action to perform",
+        },
+        "text": {  # shared by the 'key' and 'type' actions
+            "type": "string",
+            "description": "For 'key' action: key combo like 'Return', 'ctrl+l'. For 'type' action: text to type.",
+        },
+        "coordinate": {  # exactly two integers, [x, y]
+            "type": "array",
+            "items": {"type": "integer"},
+            "minItems": 2,
+            "maxItems": 2,
+            "description": "For click/move actions: [x, y] coordinates",
+        },
+        "scroll_direction": {
+            "type": "string",
+            "enum": ["up", "down", "left", "right"],
+            "description": "For scroll action: direction to scroll",
+        },
+        "scroll_amount": {
+            "type": "integer",
+            "description": "For scroll action: number of scroll clicks",
+        },
+        "duration": {  # "number", so fractional seconds are allowed
+            "type": "number",
+            "description": "For wait action: seconds to wait",
+        },
+    },
+    "required": ["action"],  # all other properties are optional at the schema level
+}
+def create_computer_batch_tool(
+    executor,  # AsyncKernelExecutor or similar
+    *,
+    tool_name: str = "computer_batch",
+    include_final_screenshot: bool = True,
+) -> Tool:
+    """
+    Create a batch tool for computer use actions.
+    This tool allows Claude to submit multiple actions in one call:
+    - Actions execute sequentially
+    - Only one screenshot is returned at the end (if requested)
+    - Dramatically reduces API roundtrips
+    Args:
+        executor: The computer executor (e.g., AsyncKernelExecutor)
+        tool_name: Name for the batch tool
+        include_final_screenshot: Whether to always include a screenshot at the end
+    Returns:
+        A Tool that can be passed to the LLM
+    Example:
+        executor = AsyncKernelExecutor(session_id)
+        batch_tool = create_computer_batch_tool(executor)
+        # Claude can now call:
+        # computer_batch(actions=[
+        #     {"action": "key", "text": "ctrl+l"},
+        #     {"action": "type", "text": "https://example.com"},
+        #     {"action": "key", "text": "Return"},
+        #     {"action": "wait", "duration": 2},
+        #     {"action": "screenshot"}
+        # ])
+    """
+    async def run_batch(actions: list[dict[str, Any]]) -> str | list:
+        """Execute a batch of computer actions and return results."""
+        from ...image import Image
+        from ...prompt import Text
+        results = []
+        final_screenshot = None
+        for i, action_args in enumerate(actions):
+            action_name = action_args.get("action", "unknown")
+            try:
+                # Convert Anthropic format to CUAction
+                cu_action = anthropic_tool_call_to_action(action_args)
+                # Execute the action
+                result = await executor.execute(cu_action)
+                # Track if this was a screenshot
+                if result.get("screenshot"):
+                    final_screenshot = result["screenshot"]
+                    results.append(
+                        {
+                            "action": action_name,
+                            "status": "ok",
+                            "has_screenshot": True,
+                        }
+                    )
+                else:
+                    results.append(
+                        {
+                            "action": action_name,
+                            "status": "ok",
+                        }
+                    )
+            except Exception as e:
+                results.append(
+                    {
+                        "action": action_name,
+                        "status": "error",
+                        "error": str(e),
+                    }
+                )
+                # Stop on error
+                break
+        # If we should include a final screenshot and don't have one yet, take one
+        if include_final_screenshot and final_screenshot is None:
+            try:
+                from .actions import Screenshot
+                result = await executor.execute(Screenshot(kind="screenshot"))
+                if result.get("screenshot"):
+                    final_screenshot = result["screenshot"]
+            except Exception:
+                pass
+        # Build the response
+        summary = f"Executed {len(results)} actions. "
+        errors = [r for r in results if r.get("status") == "error"]
+        if errors:
+            summary += f"{len(errors)} failed: {errors[0].get('error', 'unknown')}"
+        else:
+            summary += "All succeeded."
+        if final_screenshot:
+            # Return Text + Image (proper ToolResultPart types)
+            screenshot_bytes = final_screenshot["content"]
+            b64 = base64.b64encode(screenshot_bytes).decode()
+            img = Image(data=f"data:image/png;base64,{b64}")
+            return [Text(summary), img]
+        else:
+            # Just return text summary
+            return summary
+    description = """Execute multiple computer actions in a single call.
+This is much faster than calling actions one at a time.
+Actions run sequentially. A screenshot is taken at the end.
+Common patterns:
+- Navigate to URL: [{"action":"key","text":"ctrl+l"}, {"action":"type","text":"https://..."}, {"action":"key","text":"Return"}, {"action":"wait","duration":2}]
+- Click and type: [{"action":"left_click","coordinate":[x,y]}, {"action":"type","text":"..."}]
+- Scroll and screenshot: [{"action":"scroll","coordinate":[x,y],"scroll_direction":"down","scroll_amount":3}]
+Available actions:
+- screenshot: Capture the screen
+- key: Press key combo (text="Return", "ctrl+l", "ctrl+a", etc.)
+- type: Type text (text="hello world")
+- left_click, right_click, middle_click, double_click, triple_click: Click at coordinate=[x,y]
+- mouse_move: Move cursor to coordinate=[x,y]
+- scroll: Scroll at coordinate=[x,y] with scroll_direction and scroll_amount
+- wait: Pause for duration seconds
+"""
+    return Tool(
+        name=tool_name,
+        description=description,
+        parameters={
+            "actions": {
+                "type": "array",
+                "description": "List of actions to execute in order",
+                "items": ACTION_SCHEMA,
+                "minItems": 1,
+            }
+        },
+        required=["actions"],
+        run=run_batch,
+    )

lm-deluge 0.0.67__py3-none-any.whl → 0.0.90__py3-none-any.whl

Potentially problematic release.

lm-deluge 0.0.67__py3-none-any.whl → 0.0.90__py3-none-any.whl