PyPI - cua-computer - Versions diffs - 0.4.3__py3-none-any.whl → 0.4.5__py3-none-any.whl - Mend

cua-computer 0.4.3-py3-none-any.whl → 0.4.5-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8)

computer/__init__.py +0 -4
computer/computer.py +13 -3
computer/diorama_computer.py +139 -0
{cua_computer-0.4.3.dist-info → cua_computer-0.4.5.dist-info}/METADATA +10 -81
{cua_computer-0.4.3.dist-info → cua_computer-0.4.5.dist-info}/RECORD +7 -8
computer/telemetry.py +0 -116
{cua_computer-0.4.3.dist-info → cua_computer-0.4.5.dist-info}/WHEEL +0 -0
{cua_computer-0.4.3.dist-info → cua_computer-0.4.5.dist-info}/entry_points.txt +0 -0

computer/__init__.py CHANGED Viewed

@@ -12,7 +12,6 @@ logger = logging.getLogger("computer")
 try:
     # Import from core telemetry
     from core.telemetry import (
-        flush,
         is_telemetry_enabled,
         record_event,
     )
@@ -30,9 +29,6 @@ try:
                 "python_version": sys.version,
             },
         )
-        # Flush events to ensure they're sent
-        flush()
     else:
         logger.info("Telemetry is disabled")
 except ImportError as e:

computer/computer.py CHANGED Viewed

@@ -9,10 +9,18 @@ import re
 from .logger import Logger, LogLevel
 import json
 import logging
-from .telemetry import record_computer_initialization
+from core.telemetry import is_telemetry_enabled, record_event
 import os
 from . import helpers
+import platform
+SYSTEM_INFO = {
+    "os": platform.system().lower(),
+    "os_version": platform.release(),
+    "python_version": platform.python_version(),
+}
 # Import provider related modules
 from .providers.base import VMProviderType
 from .providers.factory import VMProviderFactory
@@ -152,6 +160,8 @@ class Computer:
             if not name:
                 # Normalize the name to be used for the VM
                 name = image.replace(":", "_")
+                # Remove any forward slashes
+                name = name.replace("/", "_")
             # Convert display parameter to Display object
             if isinstance(display, str):
@@ -190,8 +200,8 @@ class Computer:
         self.use_host_computer_server = use_host_computer_server
         # Record initialization in telemetry (if enabled)
-        if telemetry_enabled:
-            record_computer_initialization()
+        if telemetry_enabled and is_telemetry_enabled():
+            record_event("computer_initialized", SYSTEM_INFO)
         else:
             self.logger.debug("Telemetry disabled - skipping initialization tracking")

computer/diorama_computer.py CHANGED Viewed

@@ -6,16 +6,35 @@ class DioramaComputer:
     A Computer-compatible proxy for Diorama that sends commands over the ComputerInterface.
     """
     def __init__(self, computer, apps):
+        """
+        Initialize the DioramaComputer with a computer instance and list of apps.
+        Args:
+            computer: The computer instance to proxy commands through
+            apps: List of applications available in the diorama environment
+        """
         self.computer = computer
         self.apps = apps
         self.interface = DioramaComputerInterface(computer, apps)
         self._initialized = False
     async def __aenter__(self):
+        """
+        Async context manager entry point.
+        Returns:
+            self: The DioramaComputer instance
+        """
         self._initialized = True
         return self
     async def run(self):
+        """
+        Initialize and run the DioramaComputer if not already initialized.
+        Returns:
+            self: The DioramaComputer instance
+        """
         if not self._initialized:
             await self.__aenter__()
         return self
@@ -25,11 +44,31 @@ class DioramaComputerInterface:
     Diorama Interface proxy that sends diorama_cmds via the Computer's interface.
     """
     def __init__(self, computer, apps):
+        """
+        Initialize the DioramaComputerInterface.
+        Args:
+            computer: The computer instance to send commands through
+            apps: List of applications available in the diorama environment
+        """
         self.computer = computer
         self.apps = apps
         self._scene_size = None
     async def _send_cmd(self, action, arguments=None):
+        """
+        Send a command to the diorama interface through the computer.
+        Args:
+            action (str): The action/command to execute
+            arguments (dict, optional): Additional arguments for the command
+        Returns:
+            The result from the diorama command execution
+        Raises:
+            RuntimeError: If the computer interface is not initialized or command fails
+        """
         arguments = arguments or {}
         arguments = {"app_list": self.apps, **arguments}
         # Use the computer's interface (must be initialized)
@@ -42,6 +81,15 @@ class DioramaComputerInterface:
         return result.get("result")
     async def screenshot(self, as_bytes=True):
+        """
+        Take a screenshot of the diorama scene.
+        Args:
+            as_bytes (bool): If True, return image as bytes; if False, return PIL Image object
+        Returns:
+            bytes or PIL.Image: Screenshot data in the requested format
+        """
         from PIL import Image
         import base64
         result = await self._send_cmd("screenshot")
@@ -53,41 +101,122 @@ class DioramaComputerInterface:
         return img_bytes if as_bytes else img
     async def get_screen_size(self):
+        """
+        Get the dimensions of the diorama scene.
+        Returns:
+            dict: Dictionary containing 'width' and 'height' keys with pixel dimensions
+        """
         if not self._scene_size:
             await self.screenshot(as_bytes=False)
         return {"width": self._scene_size[0], "height": self._scene_size[1]}
     async def move_cursor(self, x, y):
+        """
+        Move the cursor to the specified coordinates.
+        Args:
+            x (int): X coordinate to move cursor to
+            y (int): Y coordinate to move cursor to
+        """
         await self._send_cmd("move_cursor", {"x": x, "y": y})
     async def left_click(self, x=None, y=None):
+        """
+        Perform a left mouse click at the specified coordinates or current cursor position.
+        Args:
+            x (int, optional): X coordinate to click at. If None, clicks at current cursor position
+            y (int, optional): Y coordinate to click at. If None, clicks at current cursor position
+        """
         await self._send_cmd("left_click", {"x": x, "y": y})
     async def right_click(self, x=None, y=None):
+        """
+        Perform a right mouse click at the specified coordinates or current cursor position.
+        Args:
+            x (int, optional): X coordinate to click at. If None, clicks at current cursor position
+            y (int, optional): Y coordinate to click at. If None, clicks at current cursor position
+        """
         await self._send_cmd("right_click", {"x": x, "y": y})
     async def double_click(self, x=None, y=None):
+        """
+        Perform a double mouse click at the specified coordinates or current cursor position.
+        Args:
+            x (int, optional): X coordinate to double-click at. If None, clicks at current cursor position
+            y (int, optional): Y coordinate to double-click at. If None, clicks at current cursor position
+        """
         await self._send_cmd("double_click", {"x": x, "y": y})
     async def scroll_up(self, clicks=1):
+        """
+        Scroll up by the specified number of clicks.
+        Args:
+            clicks (int): Number of scroll clicks to perform upward. Defaults to 1
+        """
         await self._send_cmd("scroll_up", {"clicks": clicks})
     async def scroll_down(self, clicks=1):
+        """
+        Scroll down by the specified number of clicks.
+        Args:
+            clicks (int): Number of scroll clicks to perform downward. Defaults to 1
+        """
         await self._send_cmd("scroll_down", {"clicks": clicks})
     async def drag_to(self, x, y, duration=0.5):
+        """
+        Drag from the current cursor position to the specified coordinates.
+        Args:
+            x (int): X coordinate to drag to
+            y (int): Y coordinate to drag to
+            duration (float): Duration of the drag operation in seconds. Defaults to 0.5
+        """
         await self._send_cmd("drag_to", {"x": x, "y": y, "duration": duration})
     async def get_cursor_position(self):
+        """
+        Get the current cursor position.
+        Returns:
+            dict: Dictionary containing the current cursor coordinates
+        """
         return await self._send_cmd("get_cursor_position")
     async def type_text(self, text):
+        """
+        Type the specified text at the current cursor position.
+        Args:
+            text (str): The text to type
+        """
         await self._send_cmd("type_text", {"text": text})
     async def press_key(self, key):
+        """
+        Press a single key.
+        Args:
+            key: The key to press
+        """
         await self._send_cmd("press_key", {"key": key})
     async def hotkey(self, *keys):
+        """
+        Press multiple keys simultaneously as a hotkey combination.
+        Args:
+            *keys: Variable number of keys to press together. Can be Key enum instances or strings
+        Raises:
+            ValueError: If any key is not a Key enum or string type
+        """
         actual_keys = []
         for key in keys:
             if isinstance(key, Key):
@@ -101,4 +230,14 @@ class DioramaComputerInterface:
         await self._send_cmd("hotkey", {"keys": actual_keys})
     async def to_screen_coordinates(self, x, y):
+        """
+        Convert coordinates to screen coordinates.
+        Args:
+            x (int): X coordinate to convert
+            y (int): Y coordinate to convert
+        Returns:
+            dict: Dictionary containing the converted screen coordinates
+        """
         return await self._send_cmd("to_screen_coordinates", {"x": x, "y": y})

{cua_computer-0.4.3.dist-info → cua_computer-0.4.5.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: cua-computer
-Version: 0.4.3
+Version: 0.4.5
 Summary: Computer-Use Interface (CUI) framework powering Cua
 Author-Email: TryCua <gh@trycua.com>
 Requires-Python: >=3.11
@@ -26,8 +26,8 @@ Description-Content-Type: text/markdown
 <h1>
   <div class="image-wrapper" style="display: inline-block;">
     <picture>
-      <source media="(prefers-color-scheme: dark)" alt="logo" height="150" srcset="../../img/logo_white.png" style="display: block; margin: auto;">
-      <source media="(prefers-color-scheme: light)" alt="logo" height="150" srcset="../../img/logo_black.png" style="display: block; margin: auto;">
+      <source media="(prefers-color-scheme: dark)" alt="logo" height="150" srcset="https://raw.githubusercontent.com/trycua/cua/main/img/logo_white.png" style="display: block; margin: auto;">
+      <source media="(prefers-color-scheme: light)" alt="logo" height="150" srcset="https://raw.githubusercontent.com/trycua/cua/main/img/logo_black.png" style="display: block; margin: auto;">
       <img alt="Shows my svg">
     </picture>
   </div>
@@ -44,7 +44,7 @@ Description-Content-Type: text/markdown
 ### Get started with Computer
 <div align="center">
-    <img src="../../img/computer.png"/>
+    <img src="https://raw.githubusercontent.com/trycua/cua/main/img/computer.png"/>
 </div>
 ```python
@@ -87,82 +87,11 @@ The `cua-computer` PyPi package pulls automatically the latest executable versio
 Refer to this notebook for a step-by-step guide on how to use the Computer-Use Interface (CUI):
-- [Computer-Use Interface (CUI)](../../notebooks/computer_nb.ipynb)
+- [Computer-Use Interface (CUI)](https://github.com/trycua/cua/blob/main/notebooks/computer_nb.ipynb)
-## Using the Gradio Computer UI
-The computer module includes a Gradio UI for creating and sharing demonstration data. We make it easy for people to build community datasets for better computer use models with an upload to Huggingface feature.
-```bash
-# Install with UI support
-pip install "cua-computer[ui]"
-```
-> **Note:** For precise control of the computer, we recommend using VNC or Screen Sharing instead of the Computer Gradio UI.
-### Building and Sharing Demonstrations with Huggingface
-Follow these steps to contribute your own demonstrations:
-#### 1. Set up Huggingface Access
-Set your HF_TOKEN in a .env file or in your environment variables:
-```bash
-# In .env file
-HF_TOKEN=your_huggingface_token
-```
-#### 2. Launch the Computer UI
-```python
-# launch_ui.py
-from computer.ui.gradio.app import create_gradio_ui
-from dotenv import load_dotenv
-load_dotenv('.env')
-app = create_gradio_ui()
-app.launch(share=False)
-```
-For examples, see [Computer UI Examples](../../examples/computer_ui_examples.py)
-#### 3. Record Your Tasks
-<details open>
-<summary>View demonstration video</summary>
-<video src="https://github.com/user-attachments/assets/de3c3477-62fe-413c-998d-4063e48de176" controls width="600"></video>
-</details>
-Record yourself performing various computer tasks using the UI.
-#### 4. Save Your Demonstrations
-<details open>
-<summary>View demonstration video</summary>
-<video src="https://github.com/user-attachments/assets/5ad1df37-026a-457f-8b49-922ae805faef" controls width="600"></video>
-</details>
-Save each task by picking a descriptive name and adding relevant tags (e.g., "office", "web-browsing", "coding").
-#### 5. Record Additional Demonstrations
-Repeat steps 3 and 4 until you have a good amount of demonstrations covering different tasks and scenarios.
-#### 6. Upload to Huggingface
-<details open>
-<summary>View demonstration video</summary>
-<video src="https://github.com/user-attachments/assets/c586d460-3877-4b5f-a736-3248886d2134" controls width="600"></video>
-</details>
-Upload your dataset to Huggingface by:
-- Naming it as `{your_username}/{dataset_name}`
-- Choosing public or private visibility
-- Optionally selecting specific tags to upload only tasks with certain tags
-#### Examples and Resources
-- Example Dataset: [ddupont/test-dataset](https://huggingface.co/datasets/ddupont/test-dataset)
-- Find Community Datasets: 🔍 [Browse CUA Datasets on Huggingface](https://huggingface.co/datasets?other=cua)
+## Docs
+- [Computers](https://trycua.com/docs/computer-sdk/computers)
+- [Commands](https://trycua.com/docs/computer-sdk/commands)
+- [Computer UI](https://trycua.com/docs/computer-sdk/computer-ui)
+- [Sandboxed Python](https://trycua.com/docs/computer-sdk/sandboxed-python)

{cua_computer-0.4.3.dist-info → cua_computer-0.4.5.dist-info}/RECORD RENAMED Viewed

@@ -1,6 +1,6 @@
-computer/__init__.py,sha256=44ZBq815dMihgAHmBKn1S_GFNbElCXyZInh3hle1k9Y,1237
-computer/computer.py,sha256=u-M9pZM3Tc0PEtV13M6Dj8_yaW6HqMHJwlJLVbA7XtQ,42398
-computer/diorama_computer.py,sha256=jOP7_eXxxU6SMIoE25ni0YXPK0E7p5sZeLKmkYLh6G8,3871
+computer/__init__.py,sha256=HG8dhCmSPjuQ4G-NGAoiXEhzhO37kwrHHmyboNhGWOA,1159
+computer/computer.py,sha256=AjPqUAv1hF2AgK1eODRrQCvMikyxeuE6gxlwsnwNB-s,42701
+computer/diorama_computer.py,sha256=3JaXKpcSi_OAVXtwlmNwQgrcnvqP1AxdlKEQ0XRJ0aQ,8569
 computer/helpers.py,sha256=iHkO2WhuCLc15g67kfMnpQWxfNRlz2YeJNEvYaL9jlM,1826
 computer/interface/__init__.py,sha256=xQvYjq5PMn9ZJOmRR5mWtONTl_0HVd8ACvW6AQnzDdw,262
 computer/interface/base.py,sha256=1beR4T0z5anb9NaNgKJrMJTF0BFIKyiHlokMLesOV5Q,15131
@@ -27,13 +27,12 @@ computer/providers/lumier/provider.py,sha256=BDgnTuik42H9OuCmnd-1TxM8p4vl_ahfrhN
 computer/providers/winsandbox/__init__.py,sha256=WsMVBBa_qFfqVHPQzg6j4PegQwLiIudkzUedpYkrfXU,244
 computer/providers/winsandbox/provider.py,sha256=vduDKUB1OuimvjJdUus9RQY8gv3XQfFgVS8fKOzHVME,19306
 computer/providers/winsandbox/setup_script.ps1,sha256=8aGwR7PEvqnYzCNyXTDKIwJ6pYrwyWYLRjmNT_jYIwQ,4623
-computer/telemetry.py,sha256=jHM3LJAgO2ltN3wlQ6mqCPUcmlS8F955KI70no-T3xA,3730
 computer/ui/__init__.py,sha256=pmo05ek9qiB_x7DPeE6Vf_8RsIOqTD0w1dBLMHfoOnY,45
 computer/ui/__main__.py,sha256=Jwy2oC_mGZLN0fX7WLqpjaQkbXMeM3ISrUc8WSRUG0c,284
 computer/ui/gradio/__init__.py,sha256=5_KimixM48-X74FCsLw7LbSt39MQfUMEL8-M9amK3Cw,117
 computer/ui/gradio/app.py,sha256=_V6FI-g0GJGMEk-C2iPFtxPO1Gn0juCaeCrWsBtjC4E,70395
 computer/utils.py,sha256=zY50NXB7r51GNLQ6l7lhG_qv0_ufpQ8n0-SDhCei8m4,2838
-cua_computer-0.4.3.dist-info/METADATA,sha256=ACsrn0_9Eyqrev62IeSun_AYPWO1mOtx-iHQCkmkIUM,5802
-cua_computer-0.4.3.dist-info/WHEEL,sha256=9P2ygRxDrTJz3gsagc0Z96ukrxjr-LFBGOgv3AuKlCA,90
-cua_computer-0.4.3.dist-info/entry_points.txt,sha256=6OYgBcLyFCUgeqLgnvMyOJxPCWzgy7se4rLPKtNonMs,34
-cua_computer-0.4.3.dist-info/RECORD,,
+cua_computer-0.4.5.dist-info/METADATA,sha256=jhHrPllu_5B85qOHCO75bkc6vGSg9gtq_O7RiRxak6M,3776
+cua_computer-0.4.5.dist-info/WHEEL,sha256=9P2ygRxDrTJz3gsagc0Z96ukrxjr-LFBGOgv3AuKlCA,90
+cua_computer-0.4.5.dist-info/entry_points.txt,sha256=6OYgBcLyFCUgeqLgnvMyOJxPCWzgy7se4rLPKtNonMs,34
+cua_computer-0.4.5.dist-info/RECORD,,

computer/telemetry.py DELETED Viewed

@@ -1,116 +0,0 @@
-"""Computer telemetry for tracking anonymous usage and feature usage."""
-import logging
-import platform
-from typing import Any
-# Import the core telemetry module
-TELEMETRY_AVAILABLE = False
-try:
-    from core.telemetry import (
-        increment,
-        is_telemetry_enabled,
-        is_telemetry_globally_disabled,
-        record_event,
-    )
-    def increment_counter(counter_name: str, value: int = 1) -> None:
-        """Wrapper for increment to maintain backward compatibility."""
-        if is_telemetry_enabled():
-            increment(counter_name, value)
-    def set_dimension(name: str, value: Any) -> None:
-        """Set a dimension that will be attached to all events."""
-        logger = logging.getLogger("computer.telemetry")
-        logger.debug(f"Setting dimension {name}={value}")
-    TELEMETRY_AVAILABLE = True
-    logger = logging.getLogger("computer.telemetry")
-    logger.info("Successfully imported telemetry")
-except ImportError as e:
-    logger = logging.getLogger("computer.telemetry")
-    logger.warning(f"Could not import telemetry: {e}")
-    TELEMETRY_AVAILABLE = False
-# Local fallbacks in case core telemetry isn't available
-def _noop(*args: Any, **kwargs: Any) -> None:
-    """No-op function for when telemetry is not available."""
-    pass
-logger = logging.getLogger("computer.telemetry")
-# If telemetry isn't available, use no-op functions
-if not TELEMETRY_AVAILABLE:
-    logger.debug("Telemetry not available, using no-op functions")
-    record_event = _noop  # type: ignore
-    increment_counter = _noop  # type: ignore
-    set_dimension = _noop  # type: ignore
-    get_telemetry_client = lambda: None  # type: ignore
-    flush = _noop  # type: ignore
-    is_telemetry_enabled = lambda: False  # type: ignore
-    is_telemetry_globally_disabled = lambda: True  # type: ignore
-# Get system info once to use in telemetry
-SYSTEM_INFO = {
-    "os": platform.system().lower(),
-    "os_version": platform.release(),
-    "python_version": platform.python_version(),
-}
-def enable_telemetry() -> bool:
-    """Enable telemetry if available.
-    Returns:
-        bool: True if telemetry was successfully enabled, False otherwise
-    """
-    global TELEMETRY_AVAILABLE
-    # Check if globally disabled using core function
-    if TELEMETRY_AVAILABLE and is_telemetry_globally_disabled():
-        logger.info("Telemetry is globally disabled via environment variable - cannot enable")
-        return False
-    # Already enabled
-    if TELEMETRY_AVAILABLE:
-        return True
-    # Try to import and enable
-    try:
-        # Verify we can import core telemetry
-        from core.telemetry import record_event  # type: ignore
-        TELEMETRY_AVAILABLE = True
-        logger.info("Telemetry successfully enabled")
-        return True
-    except ImportError as e:
-        logger.warning(f"Could not enable telemetry: {e}")
-        return False
-def is_telemetry_enabled() -> bool:
-    """Check if telemetry is enabled.
-    Returns:
-        bool: True if telemetry is enabled, False otherwise
-    """
-    # Use the core function if available, otherwise use our local flag
-    if TELEMETRY_AVAILABLE:
-        from core.telemetry import is_telemetry_enabled as core_is_enabled
-        return core_is_enabled()
-    return False
-def record_computer_initialization() -> None:
-    """Record when a computer instance is initialized."""
-    if TELEMETRY_AVAILABLE and is_telemetry_enabled():
-        record_event("computer_initialized", SYSTEM_INFO)
-        # Set dimensions that will be attached to all events
-        set_dimension("os", SYSTEM_INFO["os"])
-        set_dimension("os_version", SYSTEM_INFO["os_version"])
-        set_dimension("python_version", SYSTEM_INFO["python_version"])

{cua_computer-0.4.3.dist-info → cua_computer-0.4.5.dist-info}/WHEEL RENAMED Viewed

File without changes

{cua_computer-0.4.3.dist-info → cua_computer-0.4.5.dist-info}/entry_points.txt RENAMED Viewed

File without changes

cua-computer 0.4.3__py3-none-any.whl → 0.4.5__py3-none-any.whl

cua-computer 0.4.3-py3-none-any.whl → 0.4.5-py3-none-any.whl