PyPI - cua-agent - Versions diffs - 0.3.2__py3-none-any.whl → 0.4.0b2__py3-none-any.whl - Mend

cua-agent 0.3.2__py3-none-any.whl → 0.4.0b2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of cua-agent might be problematic. Click here for more details.

Files changed (111) hide show

agent/__init__.py +15 -51
agent/__main__.py +21 -0
agent/adapters/__init__.py +9 -0
agent/adapters/huggingfacelocal_adapter.py +229 -0
agent/agent.py +577 -0
agent/callbacks/__init__.py +17 -0
agent/callbacks/base.py +153 -0
agent/callbacks/budget_manager.py +44 -0
agent/callbacks/image_retention.py +139 -0
agent/callbacks/logging.py +247 -0
agent/callbacks/pii_anonymization.py +259 -0
agent/callbacks/trajectory_saver.py +305 -0
agent/cli.py +290 -0
agent/computer_handler.py +107 -0
agent/decorators.py +90 -0
agent/loops/__init__.py +11 -0
agent/loops/anthropic.py +728 -0
agent/loops/omniparser.py +339 -0
agent/loops/openai.py +95 -0
agent/loops/uitars.py +688 -0
agent/responses.py +207 -0
agent/types.py +79 -0
agent/ui/__init__.py +7 -1
agent/ui/gradio/__init__.py +6 -19
agent/ui/gradio/app.py +80 -1299
agent/ui/gradio/ui_components.py +703 -0
cua_agent-0.4.0b2.dist-info/METADATA +424 -0
cua_agent-0.4.0b2.dist-info/RECORD +30 -0
agent/core/__init__.py +0 -27
agent/core/agent.py +0 -210
agent/core/base.py +0 -217
agent/core/callbacks.py +0 -200
agent/core/experiment.py +0 -249
agent/core/factory.py +0 -122
agent/core/messages.py +0 -332
agent/core/provider_config.py +0 -21
agent/core/telemetry.py +0 -142
agent/core/tools/__init__.py +0 -21
agent/core/tools/base.py +0 -74
agent/core/tools/bash.py +0 -52
agent/core/tools/collection.py +0 -46
agent/core/tools/computer.py +0 -113
agent/core/tools/edit.py +0 -67
agent/core/tools/manager.py +0 -56
agent/core/tools.py +0 -32
agent/core/types.py +0 -88
agent/core/visualization.py +0 -197
agent/providers/__init__.py +0 -4
agent/providers/anthropic/__init__.py +0 -6
agent/providers/anthropic/api/client.py +0 -360
agent/providers/anthropic/api/logging.py +0 -150
agent/providers/anthropic/api_handler.py +0 -140
agent/providers/anthropic/callbacks/__init__.py +0 -5
agent/providers/anthropic/callbacks/manager.py +0 -65
agent/providers/anthropic/loop.py +0 -568
agent/providers/anthropic/prompts.py +0 -23
agent/providers/anthropic/response_handler.py +0 -226
agent/providers/anthropic/tools/__init__.py +0 -33
agent/providers/anthropic/tools/base.py +0 -88
agent/providers/anthropic/tools/bash.py +0 -66
agent/providers/anthropic/tools/collection.py +0 -34
agent/providers/anthropic/tools/computer.py +0 -396
agent/providers/anthropic/tools/edit.py +0 -326
agent/providers/anthropic/tools/manager.py +0 -54
agent/providers/anthropic/tools/run.py +0 -42
agent/providers/anthropic/types.py +0 -16
agent/providers/anthropic/utils.py +0 -381
agent/providers/omni/__init__.py +0 -8
agent/providers/omni/api_handler.py +0 -42
agent/providers/omni/clients/anthropic.py +0 -103
agent/providers/omni/clients/base.py +0 -35
agent/providers/omni/clients/oaicompat.py +0 -195
agent/providers/omni/clients/ollama.py +0 -122
agent/providers/omni/clients/openai.py +0 -155
agent/providers/omni/clients/utils.py +0 -25
agent/providers/omni/image_utils.py +0 -34
agent/providers/omni/loop.py +0 -990
agent/providers/omni/parser.py +0 -307
agent/providers/omni/prompts.py +0 -64
agent/providers/omni/tools/__init__.py +0 -30
agent/providers/omni/tools/base.py +0 -29
agent/providers/omni/tools/bash.py +0 -74
agent/providers/omni/tools/computer.py +0 -179
agent/providers/omni/tools/manager.py +0 -61
agent/providers/omni/utils.py +0 -236
agent/providers/openai/__init__.py +0 -6
agent/providers/openai/api_handler.py +0 -456
agent/providers/openai/loop.py +0 -472
agent/providers/openai/response_handler.py +0 -205
agent/providers/openai/tools/__init__.py +0 -15
agent/providers/openai/tools/base.py +0 -79
agent/providers/openai/tools/computer.py +0 -326
agent/providers/openai/tools/manager.py +0 -106
agent/providers/openai/types.py +0 -36
agent/providers/openai/utils.py +0 -98
agent/providers/uitars/__init__.py +0 -1
agent/providers/uitars/clients/base.py +0 -35
agent/providers/uitars/clients/mlxvlm.py +0 -263
agent/providers/uitars/clients/oaicompat.py +0 -214
agent/providers/uitars/loop.py +0 -660
agent/providers/uitars/prompts.py +0 -63
agent/providers/uitars/tools/__init__.py +0 -1
agent/providers/uitars/tools/computer.py +0 -283
agent/providers/uitars/tools/manager.py +0 -60
agent/providers/uitars/utils.py +0 -264
agent/telemetry.py +0 -21
agent/ui/__main__.py +0 -15
cua_agent-0.3.2.dist-info/METADATA +0 -295
cua_agent-0.3.2.dist-info/RECORD +0 -87
{cua_agent-0.3.2.dist-info → cua_agent-0.4.0b2.dist-info}/WHEEL +0 -0
{cua_agent-0.3.2.dist-info → cua_agent-0.4.0b2.dist-info}/entry_points.txt +0 -0

agent/providers/anthropic/response_handler.py DELETED Viewed

@@ -1,226 +0,0 @@
-"""Response and tool handling for Anthropic provider."""
-import logging
-from typing import Any, Dict, List, Tuple, cast
-from anthropic.types.beta import (
-    BetaMessage,
-    BetaTextBlock,
-    BetaContentBlockParam,
-)
-from .tools import ToolResult
-logger = logging.getLogger(__name__)
-class AnthropicResponseHandler:
-    """Handles Anthropic API responses and tool execution results."""
-    def __init__(self, loop):
-        """Initialize the response handler.
-        Args:
-            loop: Reference to the parent loop instance that provides context
-        """
-        self.loop = loop  # read later for loop.callback_manager and loop.tool_manager
-    async def handle_response(
-        self, response: BetaMessage, messages: List[Dict[str, Any]]
-    ) -> Tuple[List[Dict[str, Any]], bool]:
-        """Handle the Anthropic API response.
-        Args:
-            response: API response
-            messages: List of messages for context
-        Returns:
-            Tuple containing:
-            - List of new messages to be added
-            - Boolean indicating if the loop should continue
-        """
-        try:
-            new_messages = []  # first statement in the try, so the except handler below can always append to it
-            # Convert response to parameter format
-            response_params = self.response_to_params(response)
-            # Collect all existing tool_use IDs from previous messages for validation
-            existing_tool_use_ids = set()
-            for msg in messages:
-                if msg.get("role") == "assistant" and isinstance(msg.get("content"), list):
-                    for block in msg.get("content", []):
-                        if (
-                            isinstance(block, dict)
-                            and block.get("type") == "tool_use"
-                            and "id" in block
-                        ):
-                            existing_tool_use_ids.add(block["id"])
-            # Also add new tool_use IDs from the current response
-            current_tool_use_ids = set()
-            for block in response_params:
-                if isinstance(block, dict) and block.get("type") == "tool_use" and "id" in block:
-                    current_tool_use_ids.add(block["id"])
-                    existing_tool_use_ids.add(block["id"])  # merged in, so the membership check further down passes for every tool_use block that has an "id"
-            logger.info(f"Existing tool_use IDs in conversation: {existing_tool_use_ids}")
-            logger.info(f"New tool_use IDs in current response: {current_tool_use_ids}")
-            # Create assistant message
-            new_messages.append(
-                {
-                    "role": "assistant",
-                    "content": response_params,
-                }
-            )
-            if self.loop.callback_manager is None:
-                raise RuntimeError(  # raised inside the try, so it is caught by the except at the end of this method
-                    "Callback manager not initialized. Call initialize_client() first."
-                )
-            # Handle tool use blocks and collect results
-            tool_result_content = []
-            for content_block in response_params:
-                # Notify callback of content
-                self.loop.callback_manager.on_content(cast(BetaContentBlockParam, content_block))  # cast() is typing-only; the dict is passed unchanged
-                # Handle tool use
-                if content_block.get("type") == "tool_use":
-                    if self.loop.tool_manager is None:
-                        raise RuntimeError(  # also caught by the except at the end of this method
-                            "Tool manager not initialized. Call initialize_client() first."
-                        )
-                    # Execute the tool
-                    result = await self.loop.tool_manager.execute_tool(  # the tool runs before the ID check below
-                        name=content_block["name"],
-                        tool_input=cast(Dict[str, Any], content_block["input"]),
-                    )
-                    # Verify the tool_use ID exists in the conversation (which it should now)
-                    tool_use_id = content_block["id"]
-                    if tool_use_id in existing_tool_use_ids:
-                        # Create tool result and add to content
-                        tool_result = self.make_tool_result(cast(ToolResult, result), tool_use_id)
-                        tool_result_content.append(tool_result)
-                        # Notify callback of tool result
-                        self.loop.callback_manager.on_tool_result(
-                            cast(ToolResult, result), content_block["id"]
-                        )
-                    else:
-                        logger.warning(  # the tool has already been executed at this point; only its result is dropped
-                            f"Tool use ID {tool_use_id} not found in previous messages. Skipping tool result."
-                        )
-            # If no tool results, we're done
-            if not tool_result_content:
-                # Signal completion
-                self.loop.callback_manager.on_content({"type": "text", "text": "<DONE>"})
-                return new_messages, False  # False: no tool results were collected, so the loop should not continue
-            # Add tool results as user message
-            new_messages.append({"content": tool_result_content, "role": "user"})
-            return new_messages, True  # True: tool results were appended as a user message
-        except Exception as e:  # any failure above is reported as an assistant message instead of propagating
-            logger.error(f"Error handling response: {str(e)}")
-            new_messages.append(
-                {
-                    "role": "assistant",
-                    "content": f"Error: {str(e)}",
-                }
-            )
-            return new_messages, False  # may also hold the assistant message appended before the failure
-    def response_to_params(
-        self,
-        response: BetaMessage,
-    ) -> List[Dict[str, Any]]:
-        """Convert API response to message parameters.
-        Args:
-            response: API response message
-        Returns:
-            List of content blocks
-        """
-        result = []
-        for block in response.content:
-            if isinstance(block, BetaTextBlock):
-                result.append({"type": "text", "text": block.text})  # text blocks keep only "type" and "text"
-            else:
-                result.append(cast(Dict[str, Any], block.model_dump()))  # every other block type is passed through as its model_dump() output
-        return result
-    def make_tool_result(self, result: ToolResult, tool_use_id: str) -> Dict[str, Any]:
-        """Convert a tool result to API format.
-        Args:
-            result: Tool execution result
-            tool_use_id: ID of the tool use
-        Returns:
-            Formatted tool result
-        """
-        if result.content:  # pre-built content is returned as-is; output, base64_image and system are not consulted on this path
-            return {
-                "type": "tool_result",
-                "content": result.content,
-                "tool_use_id": tool_use_id,
-                "is_error": bool(result.error),
-            }
-        tool_result_content = []
-        is_error = False
-        if result.error:  # when error is set, neither output nor base64_image is included
-            is_error = True
-            tool_result_content = [
-                {
-                    "type": "text",
-                    "text": self.maybe_prepend_system_tool_result(result, result.error),
-                }
-            ]
-        else:
-            if result.output:
-                tool_result_content.append(
-                    {
-                        "type": "text",
-                        "text": self.maybe_prepend_system_tool_result(result, result.output),
-                    }
-                )
-            if result.base64_image:
-                tool_result_content.append(
-                    {
-                        "type": "image",
-                        "source": {
-                            "type": "base64",
-                            "media_type": "image/png",  # hard-coded; the image data itself is not inspected here
-                            "data": result.base64_image,
-                        },
-                    }
-                )
-        return {
-            "type": "tool_result",
-            "content": tool_result_content,  # may be an empty list when output and base64_image are both falsy
-            "tool_use_id": tool_use_id,
-            "is_error": is_error,
-        }
-    def maybe_prepend_system_tool_result(self, result: ToolResult, result_text: str) -> str:
-        """Prepend system information to tool result if available.
-        Args:
-            result: Tool execution result
-            result_text: Text to prepend to
-        Returns:
-            Text with system information prepended if available
-        """
-        if result.system:
-            result_text = f"<s>{result.system}</s>\n{result_text}"  # system text first, wrapped in <s>...</s>, then a newline and the original text
-        return result_text

agent/providers/anthropic/tools/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-"""Anthropic-specific tools for agent."""
-from .base import (
-    BaseAnthropicTool,
-    ToolResult,
-    ToolError,
-    ToolFailure,
-    CLIResult,
-    AnthropicToolResult,
-    AnthropicToolError,
-    AnthropicToolFailure,
-    AnthropicCLIResult,
-)
-from .bash import BashTool
-from .computer import ComputerTool
-from .edit import EditTool
-from .manager import ToolManager
-__all__ = [  # lists exactly the names imported above from .base, .bash, .computer, .edit and .manager
-    "BaseAnthropicTool",
-    "ToolResult",
-    "ToolError",
-    "ToolFailure",
-    "CLIResult",
-    "AnthropicToolResult",
-    "AnthropicToolError",
-    "AnthropicToolFailure",
-    "AnthropicCLIResult",
-    "BashTool",
-    "ComputerTool",
-    "EditTool",
-    "ToolManager",
-]

agent/providers/anthropic/tools/base.py DELETED Viewed

@@ -1,88 +0,0 @@
-"""Anthropic-specific tool base classes."""
-from abc import ABCMeta, abstractmethod
-from dataclasses import dataclass, fields, replace
-from typing import Any, Dict
-from anthropic.types.beta import BetaToolUnionParam
-from ....core.tools.base import BaseTool
-class BaseAnthropicTool(BaseTool, metaclass=ABCMeta):  # BaseTool is imported from core.tools.base, which is not shown in this section
-    """Abstract base class for Anthropic-defined tools."""
-    def __init__(self):
-        """Initialize the base Anthropic tool."""
-        # No specific initialization needed yet, but included for future extensibility
-        pass
-    @abstractmethod
-    async def __call__(self, **kwargs) -> Any:
-        """Executes the tool with the given arguments."""
-        ...
-    @abstractmethod
-    def to_params(self) -> Dict[str, Any]:
-        """Convert tool to Anthropic-specific API parameters.
-        Returns:
-            Dictionary with tool parameters for Anthropic API
-        """
-        raise NotImplementedError  # subclasses must override this abstract method; this body only runs if one delegates to it via super()
-@dataclass(kw_only=True, frozen=True)  # kw_only requires Python 3.10+; frozen blocks attribute assignment after construction
-class ToolResult:
-    """Represents the result of a tool execution."""
-    output: str | None = None
-    error: str | None = None
-    base64_image: str | None = None
-    system: str | None = None
-    content: list[dict] | None = None
-    def __bool__(self):
-        return any(getattr(self, field.name) for field in fields(self))  # truthy when at least one field holds a truthy value
-    def __add__(self, other: "ToolResult"):
-        def combine_fields(field: str | None, other_field: str | None, concatenate: bool = True):
-            if field and other_field:
-                if concatenate:
-                    return field + other_field
-                raise ValueError("Cannot combine tool results")  # both sides set with concatenate=False (only base64_image is combined that way below)
-            return field or other_field  # reached unless both are truthy: returns field if truthy, otherwise other_field
-        return ToolResult(  # always builds a plain ToolResult, even when self or other is a subclass instance
-            output=combine_fields(self.output, other.output),
-            error=combine_fields(self.error, other.error),
-            base64_image=combine_fields(self.base64_image, other.base64_image, False),
-            system=combine_fields(self.system, other.system),
-            content=self.content or other.content,  # Use first non-None content
-        )
-    def replace(self, **kwargs):
-        """Returns a new ToolResult with the given fields replaced."""
-        return replace(self, **kwargs)  # resolves to dataclasses.replace: the class-level method name is not in scope inside the method body
-class CLIResult(ToolResult):  # adds no fields or methods; exists as a distinct type only
-    """A ToolResult that can be rendered as a CLI output."""
-class ToolFailure(ToolResult):  # adds no fields or methods; exists as a distinct type only
-    """A ToolResult that represents a failure."""
-class ToolError(Exception):
-    """Raised when a tool encounters an error."""
-    def __init__(self, message):  # super().__init__() is not called here
-        self.message = message  # ToolCollection.run in collection.py reads this back as e.message
-# Aliases for the classes defined above in this module, under Anthropic-prefixed names, kept for backward compatibility
-AnthropicToolResult = ToolResult
-AnthropicToolError = ToolError
-AnthropicToolFailure = ToolFailure
-AnthropicCLIResult = CLIResult

agent/providers/anthropic/tools/bash.py DELETED Viewed

@@ -1,66 +0,0 @@
-import asyncio
-import os
-from typing import ClassVar, Literal, Dict, Any
-from computer.computer import Computer
-from .base import BaseAnthropicTool, CLIResult, ToolError, ToolResult
-from ....core.tools.bash import BaseBashTool
-class BashTool(BaseBashTool, BaseAnthropicTool):
-    """
-    A tool that allows the agent to run bash commands.
-    The tool parameters are defined by Anthropic and are not editable.
-    """
-    name: ClassVar[Literal["bash"]] = "bash"
-    api_type: ClassVar[Literal["bash_20250124"]] = "bash_20250124"
-    _timeout: float = 120.0  # seconds
-    def __init__(self, computer: Computer):
-        """Initialize the bash tool.
-        Args:
-            computer: Computer instance for executing commands
-        """
-        # Initialize the base bash tool first
-        BaseBashTool.__init__(self, computer)
-        # Then initialize the Anthropic tool
-        BaseAnthropicTool.__init__(self)
-        # NOTE: no bash session is set up here; __call__ sends each command through self.computer.interface.run_command
-    async def __call__(self, command: str | None = None, restart: bool = False, **kwargs):  # extra keyword arguments are accepted and ignored
-        """Execute a bash command.
-        Args:
-            command: The command to execute
-            restart: Whether to restart the shell (not used with computer interface)
-        Returns:
-            Tool execution result
-        Raises:
-            ToolError: If command execution fails
-        """
-        if restart:
-            return ToolResult(system="Restart not needed with computer interface.")  # returned before command is looked at
-        if command is None:
-            raise ToolError("no command provided.")  # raised outside the try below, so it is not re-wrapped
-        try:
-            async with asyncio.timeout(self._timeout):  # asyncio.timeout requires Python 3.11+
-                result = await self.computer.interface.run_command(command)
-                return CLIResult(output=result.stdout or "", error=result.stderr or "")  # falsy stdout/stderr become ""; nothing else on result is read here
-        except asyncio.TimeoutError as e:
-            raise ToolError(f"Command timed out after {self._timeout} seconds") from e
-        except Exception as e:
-            raise ToolError(f"Failed to execute command: {str(e)}")  # no explicit "from e" here, unlike the timeout branch; the cause is attached only as implicit context
-    def to_params(self) -> Dict[str, Any]:
-        """Convert tool to API parameters.
-        Returns:
-            Dictionary with tool parameters
-        """
-        return {"name": self.name, "type": self.api_type}

agent/providers/anthropic/tools/collection.py DELETED Viewed

@@ -1,34 +0,0 @@
-"""Collection classes for managing multiple tools."""
-from typing import Any, cast
-from anthropic.types.beta import BetaToolUnionParam
-from .base import (
-    BaseAnthropicTool,
-    ToolError,
-    ToolFailure,
-    ToolResult,
-)
-class ToolCollection:
-    """A collection of anthropic-defined tools."""
-    def __init__(self, *tools: BaseAnthropicTool):
-        self.tools = tools
-        self.tool_map = {tool.to_params()["name"]: tool for tool in tools}  # keyed by the "name" entry of to_params(); a later tool with the same name replaces an earlier one
-    def to_params(
-        self,
-    ) -> list[BetaToolUnionParam]:
-        return cast(list[BetaToolUnionParam], [tool.to_params() for tool in self.tools])  # cast() is typing-only; the list is returned unchanged
-    async def run(self, *, name: str, tool_input: dict[str, Any]) -> ToolResult:
-        tool = self.tool_map.get(name)
-        if not tool:
-            return ToolFailure(error=f"Tool {name} is invalid")  # an unknown name yields a failure result rather than an exception
-        try:
-            return await tool(**tool_input)  # tool_input keys are passed as keyword arguments to the tool's __call__
-        except ToolError as e:  # only ToolError is converted; any other exception propagates to the caller
-            return ToolFailure(error=e.message)

cua-agent 0.3.2__py3-none-any.whl → 0.4.0b2__py3-none-any.whl

Potentially problematic release.

cua-agent 0.3.2__py3-none-any.whl → 0.4.0b2__py3-none-any.whl