PyPI - lybic-guiagents - Versions diffs - 0.1.0__py3-none-any.whl → 0.2.1__py3-none-any.whl - Mend

lybic-guiagents 0.1.0__py3-none-any.whl → 0.2.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of lybic-guiagents might be problematic. Click here for more details.

Files changed (38) hide show

gui_agents/__init__.py +63 -0
gui_agents/agents/Action.py +3 -3
gui_agents/agents/Backend/ADBBackend.py +62 -0
gui_agents/agents/Backend/Backend.py +28 -0
gui_agents/agents/Backend/LybicBackend.py +354 -0
gui_agents/agents/Backend/PyAutoGUIBackend.py +183 -0
gui_agents/agents/Backend/PyAutoGUIVMwareBackend.py +250 -0
gui_agents/agents/Backend/__init__.py +0 -0
gui_agents/agents/agent_s.py +0 -2
gui_agents/agents/grounding.py +1 -6
gui_agents/agents/hardware_interface.py +24 -7
gui_agents/agents/manager.py +0 -3
gui_agents/agents/translator.py +1 -1
gui_agents/agents/worker.py +1 -2
gui_agents/cli_app.py +143 -8
gui_agents/core/engine.py +0 -2
gui_agents/core/knowledge.py +0 -2
gui_agents/lybic_client/__init__.py +0 -0
gui_agents/lybic_client/lybic_client.py +88 -0
gui_agents/prompts/__init__.py +0 -0
gui_agents/prompts/prompts.py +869 -0
gui_agents/service/__init__.py +19 -0
gui_agents/service/agent_service.py +527 -0
gui_agents/service/api_models.py +136 -0
gui_agents/service/config.py +241 -0
gui_agents/service/exceptions.py +35 -0
gui_agents/store/__init__.py +0 -0
gui_agents/store/registry.py +22 -0
gui_agents/tools/tools.py +0 -4
gui_agents/unit_test/test_manager.py +0 -2
gui_agents/unit_test/test_worker.py +0 -2
gui_agents/utils/analyze_display.py +1 -1
gui_agents/utils/common_utils.py +0 -2
{lybic_guiagents-0.1.0.dist-info → lybic_guiagents-0.2.1.dist-info}/METADATA +203 -75
{lybic_guiagents-0.1.0.dist-info → lybic_guiagents-0.2.1.dist-info}/RECORD +38 -21
{lybic_guiagents-0.1.0.dist-info → lybic_guiagents-0.2.1.dist-info}/WHEEL +0 -0
{lybic_guiagents-0.1.0.dist-info → lybic_guiagents-0.2.1.dist-info}/licenses/LICENSE +0 -0
{lybic_guiagents-0.1.0.dist-info → lybic_guiagents-0.2.1.dist-info}/top_level.txt +0 -0

gui_agents/cli_app.py CHANGED Viewed

@@ -4,13 +4,11 @@ import io
 import logging
 import os
 import platform
-import pyautogui
 import sys
 import time
 import datetime
 from pathlib import Path
 from dotenv import load_dotenv
-from gui_agents.agents.Backend.PyAutoGUIBackend import PyAutoGUIBackend
 env_path = Path(os.path.dirname(os.path.abspath(__file__))) / '.env'
 if env_path.exists():
@@ -35,6 +33,80 @@ from gui_agents.utils.analyze_display import analyze_display_json, aggregate_res
 current_platform = platform.system().lower()
+# Display environment detection and backend compatibility validation
+def check_display_environment():
+    """
+    Check if the current environment supports GUI operations.
+    Returns (has_display, pyautogui_available, error_message)
+    """
+    has_display = False
+    pyautogui_available = False
+    error_message = None
+    # Check DISPLAY environment variable (Linux/Unix)
+    if current_platform == "linux":
+        display_env = os.environ.get('DISPLAY')
+        if display_env:
+            has_display = True
+        else:
+            error_message = "No DISPLAY environment variable found. Running in headless/containerized environment."
+    elif current_platform == "darwin":
+        # macOS typically has display available unless running in special contexts
+        has_display = True
+    elif current_platform == "windows":
+        # Windows typically has display available
+        has_display = True
+    # Try to import and initialize pyautogui if display is available
+    if has_display:
+        try:
+            import pyautogui
+            # Test if pyautogui can actually work
+            pyautogui.size()  # This will fail if no display is available
+            pyautogui_available = True
+        except Exception as e:
+            pyautogui_available = False
+            error_message = f"PyAutoGUI not available: {str(e)}"
+    return has_display, pyautogui_available, error_message
+def get_compatible_backends(has_display, pyautogui_available):
+    """
+    Get list of backends compatible with current environment.
+    """
+    compatible_backends = []
+    incompatible_backends = []
+    # Lybic backend works in headless environments (cloud-based)
+    compatible_backends.append("lybic")
+    # ADB backend works without display (for Android devices)
+    compatible_backends.append("adb")
+    # PyAutoGUI-based backends require display
+    if has_display and pyautogui_available:
+        compatible_backends.extend(["pyautogui", "pyautogui_vmware"])
+    else:
+        incompatible_backends.extend(["pyautogui", "pyautogui_vmware"])
+    return compatible_backends, incompatible_backends
+def validate_backend_compatibility(backend, compatible_backends, incompatible_backends):
+    """
+    Validate if the requested backend is compatible with current environment.
+    Returns (is_compatible, recommended_backend, warning_message)
+    """
+    if backend in compatible_backends:
+        return True, backend, None
+    elif backend in incompatible_backends:
+        # Recommend lybic as the primary fallback for headless environments
+        recommended = "lybic"
+        warning = f"Backend '{backend}' is not compatible with current environment (no display/GUI). Recommending '{recommended}' backend instead."
+        return False, recommended, warning
+    else:
+        # Unknown backend, let it fail naturally
+        return True, backend, f"Unknown backend '{backend}', compatibility cannot be determined."
 logger = logging.getLogger()
 logger.setLevel(logging.DEBUG)
@@ -172,10 +244,18 @@ def show_permission_dialog(code: str, action_description: str):
 def scale_screenshot_dimensions(screenshot: Image.Image, hwi_para: HardwareInterface):
     screenshot_high = screenshot.height
     screenshot_width = screenshot.width
-    if isinstance(hwi_para.backend, PyAutoGUIBackend):
-        screen_width, screen_height = pyautogui.size()
-        if screen_width != screenshot_width or screen_height != screenshot_high:
-            screenshot = screenshot.resize((screen_width, screen_height), Image.Resampling.LANCZOS)
+    # Only try to scale if we have a PyAutoGUI backend and pyautogui is available
+    try:
+        from gui_agents.agents.Backend.PyAutoGUIBackend import PyAutoGUIBackend
+        if isinstance(hwi_para.backend, PyAutoGUIBackend):
+            import pyautogui
+            screen_width, screen_height = pyautogui.size()
+            if screen_width != screenshot_width or screen_height != screenshot_high:
+                screenshot = screenshot.resize((screen_width, screen_height), Image.Resampling.LANCZOS)
+    except Exception as e:
+        # Any error (e.g., no display, import error), skip scaling
+        logger.warning(f"Could not scale screenshot dimensions: {e}")
     return screenshot
@@ -453,8 +533,37 @@ def main():
         type=str,
         default=None,
         help='Lybic precreated sandbox ID (if not provided, will use LYBIC_PRECREATE_SID environment variable)')
+    parser.add_argument(
+        '--force-backend',
+        action='store_true',
+        help='Force the use of specified backend even if incompatible with current environment')
     args = parser.parse_args()
+    # Check environment compatibility
+    has_display, pyautogui_available, env_error = check_display_environment()
+    compatible_backends, incompatible_backends = get_compatible_backends(has_display, pyautogui_available)
+    # Log environment status
+    logger.info(f"Environment check: Display available={has_display}, PyAutoGUI available={pyautogui_available}")
+    if env_error:
+        logger.info(f"Environment note: {env_error}")
+    logger.info(f"Compatible backends: {compatible_backends}")
+    if incompatible_backends:
+        logger.info(f"Incompatible backends: {incompatible_backends}")
+    # Validate backend compatibility
+    is_compatible, recommended_backend, warning = validate_backend_compatibility(
+        args.backend, compatible_backends, incompatible_backends)
+    if not is_compatible and not args.force_backend:
+        logger.warning(warning)
+        logger.info(f"Switching from '{args.backend}' to '{recommended_backend}' backend")
+        args.backend = recommended_backend
+    elif not is_compatible and args.force_backend:
+        logger.warning(f"Forcing incompatible backend '{args.backend}' - this may cause errors")
+    elif warning:
+        logger.info(warning)
     # Ensure necessary directory structure exists
     timestamp_dir = os.path.join(log_dir, datetime_str)
     cache_dir = os.path.join(timestamp_dir, "cache", "screens")
@@ -515,7 +624,7 @@ def main():
     else:
         logger.info("Web search functionality is ENABLED")
-    # Initialize hardware interface
+    # Initialize hardware interface with error handling
     backend_kwargs = {"platform": platform_os}
     if args.lybic_sid is not None:
         backend_kwargs["precreate_sid"] = args.lybic_sid
@@ -523,7 +632,25 @@ def main():
     else:
         logger.info("Using Lybic SID from environment variable LYBIC_PRECREATE_SID")
-    hwi = HardwareInterface(backend=args.backend, **backend_kwargs)
+    try:
+        hwi = HardwareInterface(backend=args.backend, **backend_kwargs)
+        logger.info(f"Successfully initialized hardware interface with backend: {args.backend}")
+    except Exception as e:
+        logger.error(f"Failed to initialize hardware interface with backend '{args.backend}': {e}")
+        # If the backend failed and it's a GUI-dependent backend, suggest alternatives
+        if args.backend in incompatible_backends and not args.force_backend:
+            logger.info("Attempting to initialize with lybic backend as fallback...")
+            try:
+                hwi = HardwareInterface(backend="lybic", **backend_kwargs)
+                logger.info("Successfully initialized with lybic backend")
+                args.backend = "lybic"
+            except Exception as fallback_error:
+                logger.error(f"Fallback to lybic backend also failed: {fallback_error}")
+                sys.exit(1)
+        else:
+            logger.error("Hardware interface initialization failed. Please check your environment and backend configuration.")
+            sys.exit(1)
     # if query is provided, run the agent on the query
     if args.query:
@@ -547,6 +674,13 @@ def main():
 if __name__ == "__main__":
     """
+    GUI Agent CLI Application with environment compatibility checking.
+    The application automatically detects the current environment and recommends compatible backends:
+    - In headless/containerized environments: uses 'lybic' or 'adb' backends
+    - In GUI environments: supports all backends including 'pyautogui' and 'pyautogui_vmware'
+    Examples:
     python gui_agents/cli_app.py --backend lybic
     python gui_agents/cli_app.py --backend pyautogui --mode fast
     python gui_agents/cli_app.py --backend pyautogui_vmware
@@ -556,5 +690,6 @@ if __name__ == "__main__":
     python gui_agents/cli_app.py --backend pyautogui --mode fast --disable-search
     python gui_agents/cli_app.py --backend lybic --lybic-sid SBX-01K1X6ZKAERXAN73KTJ1XXJXAF
     python gui_agents/cli_app.py --backend lybic --mode fast --lybic-sid SBX-01K1X6ZKAERXAN73KTJ1XXJXAF
+    python gui_agents/cli_app.py --backend pyautogui --force-backend  # Force incompatible backend
     """
     main()

gui_agents/core/engine.py CHANGED Viewed

@@ -2,7 +2,6 @@ import os
 import json
 import backoff
 import requests
-from typing import List, Dict, Any, Optional, Union
 import numpy as np
 from anthropic import Anthropic
 from openai import (
@@ -18,7 +17,6 @@ from google.genai import types
 from zhipuai import ZhipuAI
 from groq import Groq
 import boto3
-import exa_py
 from typing import List, Dict, Any, Optional, Union, Tuple
 class ModelPricing:

gui_agents/core/knowledge.py CHANGED Viewed

@@ -9,8 +9,6 @@ from gui_agents.utils.common_utils import (
     save_embeddings,
 )
 from gui_agents.tools.tools import Tools
-from gui_agents.agents.global_state import GlobalState
-from gui_agents.store.registry import Registry
 from gui_agents.core.mllm import CostManager
 def get_embedding_dim(model_name):

gui_agents/lybic_client/__init__.py ADDED Viewed

File without changes

gui_agents/lybic_client/lybic_client.py ADDED Viewed

@@ -0,0 +1,88 @@
+import httpx
+from typing import Optional, Dict, Any
+class LybicClient:
+    """Light-weight async wrapper for Lybic REST API."""
+    # ---------- life-cycle ----------
+    def __init__(self, api_key: str, base_url: str, org_id: str) -> None:
+        self.base     = base_url.rstrip("/")
+        self.org_id   = org_id
+        self.http     = httpx.AsyncClient(
+            headers={"X-Api-Key": api_key, "Content-Type": "application/json"},
+            timeout=30,
+        )
+        # runtime cache (set by create_sandbox)
+        self.sandbox: Optional[Dict[str, Any]] = None
+        # self.connect_details: Optional[Dict[str, Any]] = None
+    async def close(self) -> None:
+        await self.http.aclose()
+    # ---------- low-level ----------
+    async def _req(self, path: str, method: str = "GET", json: Any = None):
+        r = await self.http.request(method, f"{self.base}{path}", json=json)
+        # ▶ 打印调试信息
+        req = r.request                        # httpx.Request 对象
+        print(
+            "[HTTP]", req.method, req.url,     # 完整 URL（含 querystring）
+            "json=",   json,
+            "status=", r.status_code,
+        )
+        r.raise_for_status()
+        return r.json()
+    # ---------- high-level ----------
+    async def create_sandbox(self, **opts) -> Dict[str, Any]:
+        """
+        Create a new sandbox and cache its metadata / connectDetails.
+        Returns the full response dict.
+        """
+        resp = await self._req(
+            f"/api/orgs/{self.org_id}/sandboxes", "POST", opts or {}
+        )
+        # cache
+        self.sandbox          = resp
+        # self.connect_details  = resp.get("connectDetails")
+        return resp
+    def _require_sandbox_id(self, sid: Optional[str]) -> str:
+        if sid:
+            return sid
+        if self.sandbox:
+            return self.sandbox["id"]
+        raise RuntimeError("No sandbox_id specified and none cached — "
+                           "call create_sandbox() first.")
+    async def preview(self, sid: Optional[str] = None):
+        sid = self._require_sandbox_id(sid)
+        return await self._req(
+            f"/api/orgs/{self.org_id}/sandboxes/{sid}/preview", "POST"
+        )
+    async def exec_action(self, action: dict, sid: Optional[str] = None):
+        """
+        Execute a single GUI action. `sid` optional if sandbox already cached.
+        """
+        sid = self._require_sandbox_id(sid)
+        return await self._req(
+            f"/api/orgs/{self.org_id}/sandboxes/{sid}/actions/computer-use",
+            "POST",
+            {"action": action},
+        )
+    async def parse_nl(self, text: str, model: str = "ui-tars"):
+        return await self._req(
+            "/api/computer-use/parse",
+            "POST",
+            {"model": model, "textContent": text},
+        )
+    # ---------- helpers ----------
+    @property
+    def sandbox_id(self) -> Optional[str]:
+        return self.sandbox["id"] if self.sandbox else None

gui_agents/prompts/__init__.py ADDED Viewed

File without changes

lybic-guiagents 0.1.0__py3-none-any.whl → 0.2.1__py3-none-any.whl

Potentially problematic release.

lybic-guiagents 0.1.0__py3-none-any.whl → 0.2.1__py3-none-any.whl