PyPI - cua-agent - Versions diffs - 0.3.2__py3-none-any.whl → 0.4.0__py3-none-any.whl - Mend

cua-agent 0.3.2__py3-none-any.whl → 0.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of cua-agent might be problematic. Click here for more details.

Files changed (112) hide show

agent/__init__.py +21 -12
agent/__main__.py +21 -0
agent/adapters/__init__.py +9 -0
agent/adapters/huggingfacelocal_adapter.py +229 -0
agent/agent.py +594 -0
agent/callbacks/__init__.py +19 -0
agent/callbacks/base.py +153 -0
agent/callbacks/budget_manager.py +44 -0
agent/callbacks/image_retention.py +139 -0
agent/callbacks/logging.py +247 -0
agent/callbacks/pii_anonymization.py +259 -0
agent/callbacks/telemetry.py +210 -0
agent/callbacks/trajectory_saver.py +305 -0
agent/cli.py +297 -0
agent/computer_handler.py +107 -0
agent/decorators.py +90 -0
agent/loops/__init__.py +11 -0
agent/loops/anthropic.py +728 -0
agent/loops/omniparser.py +339 -0
agent/loops/openai.py +95 -0
agent/loops/uitars.py +688 -0
agent/responses.py +207 -0
agent/telemetry.py +135 -14
agent/types.py +79 -0
agent/ui/__init__.py +7 -1
agent/ui/__main__.py +2 -13
agent/ui/gradio/__init__.py +6 -19
agent/ui/gradio/app.py +94 -1313
agent/ui/gradio/ui_components.py +721 -0
cua_agent-0.4.0.dist-info/METADATA +424 -0
cua_agent-0.4.0.dist-info/RECORD +33 -0
agent/core/__init__.py +0 -27
agent/core/agent.py +0 -210
agent/core/base.py +0 -217
agent/core/callbacks.py +0 -200
agent/core/experiment.py +0 -249
agent/core/factory.py +0 -122
agent/core/messages.py +0 -332
agent/core/provider_config.py +0 -21
agent/core/telemetry.py +0 -142
agent/core/tools/__init__.py +0 -21
agent/core/tools/base.py +0 -74
agent/core/tools/bash.py +0 -52
agent/core/tools/collection.py +0 -46
agent/core/tools/computer.py +0 -113
agent/core/tools/edit.py +0 -67
agent/core/tools/manager.py +0 -56
agent/core/tools.py +0 -32
agent/core/types.py +0 -88
agent/core/visualization.py +0 -197
agent/providers/__init__.py +0 -4
agent/providers/anthropic/__init__.py +0 -6
agent/providers/anthropic/api/client.py +0 -360
agent/providers/anthropic/api/logging.py +0 -150
agent/providers/anthropic/api_handler.py +0 -140
agent/providers/anthropic/callbacks/__init__.py +0 -5
agent/providers/anthropic/callbacks/manager.py +0 -65
agent/providers/anthropic/loop.py +0 -568
agent/providers/anthropic/prompts.py +0 -23
agent/providers/anthropic/response_handler.py +0 -226
agent/providers/anthropic/tools/__init__.py +0 -33
agent/providers/anthropic/tools/base.py +0 -88
agent/providers/anthropic/tools/bash.py +0 -66
agent/providers/anthropic/tools/collection.py +0 -34
agent/providers/anthropic/tools/computer.py +0 -396
agent/providers/anthropic/tools/edit.py +0 -326
agent/providers/anthropic/tools/manager.py +0 -54
agent/providers/anthropic/tools/run.py +0 -42
agent/providers/anthropic/types.py +0 -16
agent/providers/anthropic/utils.py +0 -381
agent/providers/omni/__init__.py +0 -8
agent/providers/omni/api_handler.py +0 -42
agent/providers/omni/clients/anthropic.py +0 -103
agent/providers/omni/clients/base.py +0 -35
agent/providers/omni/clients/oaicompat.py +0 -195
agent/providers/omni/clients/ollama.py +0 -122
agent/providers/omni/clients/openai.py +0 -155
agent/providers/omni/clients/utils.py +0 -25
agent/providers/omni/image_utils.py +0 -34
agent/providers/omni/loop.py +0 -990
agent/providers/omni/parser.py +0 -307
agent/providers/omni/prompts.py +0 -64
agent/providers/omni/tools/__init__.py +0 -30
agent/providers/omni/tools/base.py +0 -29
agent/providers/omni/tools/bash.py +0 -74
agent/providers/omni/tools/computer.py +0 -179
agent/providers/omni/tools/manager.py +0 -61
agent/providers/omni/utils.py +0 -236
agent/providers/openai/__init__.py +0 -6
agent/providers/openai/api_handler.py +0 -456
agent/providers/openai/loop.py +0 -472
agent/providers/openai/response_handler.py +0 -205
agent/providers/openai/tools/__init__.py +0 -15
agent/providers/openai/tools/base.py +0 -79
agent/providers/openai/tools/computer.py +0 -326
agent/providers/openai/tools/manager.py +0 -106
agent/providers/openai/types.py +0 -36
agent/providers/openai/utils.py +0 -98
agent/providers/uitars/__init__.py +0 -1
agent/providers/uitars/clients/base.py +0 -35
agent/providers/uitars/clients/mlxvlm.py +0 -263
agent/providers/uitars/clients/oaicompat.py +0 -214
agent/providers/uitars/loop.py +0 -660
agent/providers/uitars/prompts.py +0 -63
agent/providers/uitars/tools/__init__.py +0 -1
agent/providers/uitars/tools/computer.py +0 -283
agent/providers/uitars/tools/manager.py +0 -60
agent/providers/uitars/utils.py +0 -264
cua_agent-0.3.2.dist-info/METADATA +0 -295
cua_agent-0.3.2.dist-info/RECORD +0 -87
{cua_agent-0.3.2.dist-info → cua_agent-0.4.0.dist-info}/WHEEL +0 -0
{cua_agent-0.3.2.dist-info → cua_agent-0.4.0.dist-info}/entry_points.txt +0 -0

agent/core/tools/base.py DELETED Viewed

@@ -1,74 +0,0 @@
-"""Abstract base classes for tools that can be used with any provider."""
-from abc import ABCMeta, abstractmethod
-from dataclasses import dataclass, fields, replace
-from typing import Any, Dict
-class BaseTool(metaclass=ABCMeta):
-    """Abstract base class for provider-agnostic tools."""
-    name: str
-    @abstractmethod
-    async def __call__(self, **kwargs) -> Any:
-        """Executes the tool with the given arguments."""
-        ...
-    @abstractmethod
-    def to_params(self) -> Dict[str, Any]:
-        """Convert tool to provider-specific API parameters.
-        Returns:
-            Dictionary with tool parameters specific to the LLM provider
-        """
-        raise NotImplementedError
-@dataclass(kw_only=True, frozen=True)
-class ToolResult:
-    """Represents the result of a tool execution."""
-    output: str | None = None
-    error: str | None = None
-    base64_image: str | None = None
-    system: str | None = None
-    content: list[dict] | None = None
-    def __bool__(self):
-        return any(getattr(self, field.name) for field in fields(self))
-    def __add__(self, other: "ToolResult"):
-        def combine_fields(field: str | None, other_field: str | None, concatenate: bool = True):
-            if field and other_field:
-                if concatenate:
-                    return field + other_field
-                raise ValueError("Cannot combine tool results")
-            return field or other_field
-        return ToolResult(
-            output=combine_fields(self.output, other.output),
-            error=combine_fields(self.error, other.error),
-            base64_image=combine_fields(self.base64_image, other.base64_image, False),
-            system=combine_fields(self.system, other.system),
-            content=self.content or other.content,  # Use first non-None content
-        )
-    def replace(self, **kwargs):
-        """Returns a new ToolResult with the given fields replaced."""
-        return replace(self, **kwargs)
-class CLIResult(ToolResult):
-    """A ToolResult that can be rendered as a CLI output."""
-class ToolFailure(ToolResult):
-    """A ToolResult that represents a failure."""
-class ToolError(Exception):
-    """Raised when a tool encounters an error."""
-    def __init__(self, message):
-        self.message = message

agent/core/tools/bash.py DELETED Viewed

@@ -1,52 +0,0 @@
-"""Abstract base bash/shell tool implementation."""
-import asyncio
-import logging
-from abc import abstractmethod
-from typing import Any, Dict, Tuple
-from computer.computer import Computer
-from .base import BaseTool, ToolResult
-class BaseBashTool(BaseTool):
-    """Base class for bash/shell command execution tools across different providers."""
-    name = "bash"
-    logger = logging.getLogger(__name__)
-    computer: Computer
-    def __init__(self, computer: Computer):
-        """Initialize the BashTool.
-        Args:
-            computer: Computer instance, may be used for related operations
-        """
-        self.computer = computer
-    async def run_command(self, command: str) -> Tuple[int, str, str]:
-        """Run a shell command and return exit code, stdout, and stderr.
-        Args:
-            command: Shell command to execute
-        Returns:
-            Tuple containing (exit_code, stdout, stderr)
-        """
-        try:
-            process = await asyncio.create_subprocess_shell(
-                command,
-                stdout=asyncio.subprocess.PIPE,
-                stderr=asyncio.subprocess.PIPE,
-            )
-            stdout, stderr = await process.communicate()
-            return process.returncode or 0, stdout.decode(), stderr.decode()
-        except Exception as e:
-            self.logger.error(f"Error running command: {str(e)}")
-            return 1, "", str(e)
-    @abstractmethod
-    async def __call__(self, **kwargs) -> ToolResult:
-        """Execute the tool with the provided arguments."""
-        raise NotImplementedError

agent/core/tools/collection.py DELETED Viewed

@@ -1,46 +0,0 @@
-"""Collection classes for managing multiple tools."""
-from typing import Any, Dict, List, Type
-from .base import (
-    BaseTool,
-    ToolError,
-    ToolFailure,
-    ToolResult,
-)
-class ToolCollection:
-    """A collection of tools that can be used with any provider."""
-    def __init__(self, *tools: BaseTool):
-        self.tools = tools
-        self.tool_map = {tool.name: tool for tool in tools}
-    def to_params(self) -> List[Dict[str, Any]]:
-        """Convert all tools to provider-specific parameters.
-        Returns:
-            List of dictionaries with tool parameters
-        """
-        return [tool.to_params() for tool in self.tools]
-    async def run(self, *, name: str, tool_input: Dict[str, Any]) -> ToolResult:
-        """Run a tool with the given input.
-        Args:
-            name: Name of the tool to run
-            tool_input: Input parameters for the tool
-        Returns:
-            Result of the tool execution
-        """
-        tool = self.tool_map.get(name)
-        if not tool:
-            return ToolFailure(error=f"Tool {name} is invalid")
-        try:
-            return await tool(**tool_input)
-        except ToolError as e:
-            return ToolFailure(error=e.message)
-        except Exception as e:
-            return ToolFailure(error=f"Unexpected error in tool {name}: {str(e)}")

agent/core/tools/computer.py DELETED Viewed

@@ -1,113 +0,0 @@
-"""Abstract base computer tool implementation."""
-import asyncio
-import base64
-import io
-import logging
-from abc import abstractmethod
-from typing import Any, Dict, Optional, Tuple
-from PIL import Image
-from computer.computer import Computer
-from .base import BaseTool, ToolError, ToolResult
-class BaseComputerTool(BaseTool):
-    """Base class for computer interaction tools across different providers."""
-    name = "computer"
-    logger = logging.getLogger(__name__)
-    width: Optional[int] = None
-    height: Optional[int] = None
-    display_num: Optional[int] = None
-    computer: Computer
-    _screenshot_delay = 1.0  # Default delay for most platforms
-    _scaling_enabled = True
-    def __init__(self, computer: Computer):
-        """Initialize the ComputerTool.
-        Args:
-            computer: Computer instance for screen interactions
-        """
-        self.computer = computer
-    async def initialize_dimensions(self):
-        """Initialize screen dimensions from the computer interface."""
-        display_size = await self.computer.interface.get_screen_size()
-        self.width = display_size["width"]
-        self.height = display_size["height"]
-        self.logger.info(f"Initialized screen dimensions to {self.width}x{self.height}")
-    @property
-    def options(self) -> Dict[str, Any]:
-        """Get the options for the tool.
-        Returns:
-            Dictionary with tool options
-        """
-        if self.width is None or self.height is None:
-            raise RuntimeError(
-                "Screen dimensions not initialized. Call initialize_dimensions() first."
-            )
-        return {
-            "display_width_px": self.width,
-            "display_height_px": self.height,
-            "display_number": self.display_num,
-        }
-    async def resize_screenshot_if_needed(self, screenshot: bytes) -> bytes:
-        """Resize a screenshot to match the expected dimensions.
-        Args:
-            screenshot: Raw screenshot data
-        Returns:
-            Resized screenshot data
-        """
-        if self.width is None or self.height is None:
-            raise ToolError("Screen dimensions not initialized")
-        try:
-            img = Image.open(io.BytesIO(screenshot))
-            if img.mode in ("RGBA", "LA") or (img.mode == "P" and "transparency" in img.info):
-                img = img.convert("RGB")
-            # Resize if dimensions don't match
-            if img.size != (self.width, self.height):
-                self.logger.info(
-                    f"Scaling image from {img.size} to {self.width}x{self.height} to match screen dimensions"
-                )
-                img = img.resize((self.width, self.height), Image.Resampling.LANCZOS)
-                # Save back to bytes
-                buffer = io.BytesIO()
-                img.save(buffer, format="PNG")
-                return buffer.getvalue()
-            return screenshot
-        except Exception as e:
-            self.logger.error(f"Error during screenshot resizing: {str(e)}")
-            raise ToolError(f"Failed to resize screenshot: {str(e)}")
-    async def screenshot(self) -> ToolResult:
-        """Take a screenshot and return it as a ToolResult with base64-encoded image.
-        Returns:
-            ToolResult with the screenshot
-        """
-        try:
-            screenshot = await self.computer.interface.screenshot()
-            screenshot = await self.resize_screenshot_if_needed(screenshot)
-            return ToolResult(base64_image=base64.b64encode(screenshot).decode())
-        except Exception as e:
-            self.logger.error(f"Error taking screenshot: {str(e)}")
-            return ToolResult(error=f"Failed to take screenshot: {str(e)}")
-    @abstractmethod
-    async def __call__(self, **kwargs) -> ToolResult:
-        """Execute the tool with the provided arguments."""
-        raise NotImplementedError

agent/core/tools/edit.py DELETED Viewed

@@ -1,67 +0,0 @@
-"""Abstract base edit tool implementation."""
-import asyncio
-import logging
-import os
-from abc import abstractmethod
-from pathlib import Path
-from typing import Any, Dict, Optional
-from computer.computer import Computer
-from .base import BaseTool, ToolError, ToolResult
-class BaseEditTool(BaseTool):
-    """Base class for text editor tools across different providers."""
-    name = "edit"
-    logger = logging.getLogger(__name__)
-    computer: Computer
-    def __init__(self, computer: Computer):
-        """Initialize the EditTool.
-        Args:
-            computer: Computer instance, may be used for related operations
-        """
-        self.computer = computer
-    async def read_file(self, path: str) -> str:
-        """Read a file and return its contents.
-        Args:
-            path: Path to the file to read
-        Returns:
-            File contents as a string
-        """
-        try:
-            path_obj = Path(path)
-            if not path_obj.exists():
-                raise ToolError(f"File does not exist: {path}")
-            return path_obj.read_text()
-        except Exception as e:
-            self.logger.error(f"Error reading file: {str(e)}")
-            raise ToolError(f"Failed to read file: {str(e)}")
-    async def write_file(self, path: str, content: str) -> None:
-        """Write content to a file.
-        Args:
-            path: Path to the file to write
-            content: Content to write to the file
-        """
-        try:
-            path_obj = Path(path)
-            # Create parent directories if they don't exist
-            path_obj.parent.mkdir(parents=True, exist_ok=True)
-            path_obj.write_text(content)
-        except Exception as e:
-            self.logger.error(f"Error writing file: {str(e)}")
-            raise ToolError(f"Failed to write file: {str(e)}")
-    @abstractmethod
-    async def __call__(self, **kwargs) -> ToolResult:
-        """Execute the tool with the provided arguments."""
-        raise NotImplementedError

agent/core/tools/manager.py DELETED Viewed

@@ -1,56 +0,0 @@
-"""Tool manager for initializing and running tools."""
-from abc import ABC, abstractmethod
-from typing import Any, Dict, List
-from computer.computer import Computer
-from .base import BaseTool, ToolResult
-from .collection import ToolCollection
-class BaseToolManager(ABC):
-    """Base class for tool managers across different providers."""
-    def __init__(self, computer: Computer):
-        """Initialize the tool manager.
-        Args:
-            computer: Computer instance for computer-related tools
-        """
-        self.computer = computer
-        self.tools: ToolCollection | None = None
-    @abstractmethod
-    def _initialize_tools(self) -> ToolCollection:
-        """Initialize all available tools."""
-        ...
-    async def initialize(self) -> None:
-        """Initialize tool-specific requirements and create tool collection."""
-        await self._initialize_tools_specific()
-        self.tools = self._initialize_tools()
-    @abstractmethod
-    async def _initialize_tools_specific(self) -> None:
-        """Initialize provider-specific tool requirements."""
-        ...
-    @abstractmethod
-    def get_tool_params(self) -> List[Dict[str, Any]]:
-        """Get tool parameters for API calls."""
-        ...
-    async def execute_tool(self, name: str, tool_input: Dict[str, Any]) -> ToolResult:
-        """Execute a tool with the given input.
-        Args:
-            name: Name of the tool to execute
-            tool_input: Input parameters for the tool
-        Returns:
-            Result of the tool execution
-        """
-        if self.tools is None:
-            raise RuntimeError("Tools not initialized. Call initialize() first.")
-        return await self.tools.run(name=name, tool_input=tool_input)

agent/core/tools.py DELETED Viewed

@@ -1,32 +0,0 @@
-"""Tool-related type definitions."""
-from enum import StrEnum
-from typing import Dict, Any, Optional
-from pydantic import BaseModel, ConfigDict
-class ToolInvocationState(StrEnum):
-    """States for tool invocation."""
-    CALL = 'call'
-    PARTIAL_CALL = 'partial-call'
-    RESULT = 'result'
-class ToolInvocation(BaseModel):
-    """Tool invocation type."""
-    model_config = ConfigDict(extra='forbid')
-    state: Optional[str] = None
-    toolCallId: str
-    toolName: Optional[str] = None
-    args: Optional[Dict[str, Any]] = None
-class ClientAttachment(BaseModel):
-    """Client attachment type."""
-    name: str
-    contentType: str
-    url: str
-class ToolResult(BaseModel):
-    """Result of a tool execution."""
-    model_config = ConfigDict(extra='forbid')
-    output: Optional[str] = None
-    error: Optional[str] = None
-    metadata: Optional[Dict[str, Any]] = None

agent/core/types.py DELETED Viewed

@@ -1,88 +0,0 @@
-"""Core type definitions."""
-from typing import Any, Dict, List, Optional, TypedDict, Union
-from enum import StrEnum
-from dataclasses import dataclass
-class AgentLoop(StrEnum):
-    """Enumeration of available loop types."""
-    ANTHROPIC = "anthropic"  # Anthropic implementation
-    OMNI = "omni"  # OmniLoop implementation
-    OPENAI = "openai"  # OpenAI implementation
-    OLLAMA = "ollama"  # OLLAMA implementation
-    UITARS = "uitars"  # UI-TARS implementation
-    # Add more loop types as needed
-class LLMProvider(StrEnum):
-    """Supported LLM providers."""
-    ANTHROPIC = "anthropic"
-    OPENAI = "openai"
-    OLLAMA = "ollama"
-    OAICOMPAT = "oaicompat"
-    MLXVLM= "mlxvlm"
-@dataclass
-class LLM:
-    """Configuration for LLM model and provider."""
-    provider: LLMProvider
-    name: Optional[str] = None
-    provider_base_url: Optional[str] = None
-    def __post_init__(self):
-        """Set default model name if not provided."""
-        if self.name is None:
-            from .provider_config import DEFAULT_MODELS
-            self.name = DEFAULT_MODELS.get(self.provider)
-        # Set default provider URL if none provided
-        if self.provider_base_url is None and self.provider == LLMProvider.OAICOMPAT:
-            # Default for vLLM
-            self.provider_base_url = "http://localhost:8000/v1"
-            # Common alternatives:
-            # - LM Studio: "http://localhost:1234/v1"
-            # - LocalAI: "http://localhost:8080/v1"
-            # - Ollama with OpenAI compatible API: "http://localhost:11434/v1"
-# For backward compatibility
-LLMModel = LLM
-Model = LLM
-class AgentResponse(TypedDict, total=False):
-    """Agent response format."""
-    id: str
-    object: str
-    created_at: int
-    status: str
-    error: Optional[str]
-    incomplete_details: Optional[Any]
-    instructions: Optional[Any]
-    max_output_tokens: Optional[int]
-    model: str
-    output: List[Dict[str, Any]]
-    parallel_tool_calls: bool
-    previous_response_id: Optional[str]
-    reasoning: Dict[str, str]
-    store: bool
-    temperature: float
-    text: Dict[str, Dict[str, str]]
-    tool_choice: str
-    tools: List[Dict[str, Union[str, int]]]
-    top_p: float
-    truncation: str
-    usage: Dict[str, Any]
-    user: Optional[str]
-    metadata: Dict[str, Any]
-    response: Dict[str, List[Dict[str, Any]]]
-    # Additional fields for error responses
-    role: str
-    content: Union[str, List[Dict[str, Any]]]

cua-agent 0.3.2__py3-none-any.whl → 0.4.0__py3-none-any.whl

Potentially problematic release.

cua-agent 0.3.2__py3-none-any.whl → 0.4.0__py3-none-any.whl