autoglm-gui 1.4.0__py3-none-any.whl → 1.5.0__py3-none-any.whl

This diff shows the content of publicly available package versions released to a supported registry. It is provided for informational purposes only and reflects the changes between package versions as they appear in the public registry.
Files changed (120)
  1. AutoGLM_GUI/__init__.py +11 -0
  2. AutoGLM_GUI/__main__.py +26 -8
  3. AutoGLM_GUI/actions/__init__.py +6 -0
  4. AutoGLM_GUI/actions/handler.py +196 -0
  5. AutoGLM_GUI/actions/types.py +15 -0
  6. AutoGLM_GUI/adb/__init__.py +53 -0
  7. AutoGLM_GUI/adb/apps.py +227 -0
  8. AutoGLM_GUI/adb/connection.py +323 -0
  9. AutoGLM_GUI/adb/device.py +171 -0
  10. AutoGLM_GUI/adb/input.py +67 -0
  11. AutoGLM_GUI/adb/screenshot.py +11 -0
  12. AutoGLM_GUI/adb/timing.py +167 -0
  13. AutoGLM_GUI/adb_plus/keyboard_installer.py +4 -2
  14. AutoGLM_GUI/adb_plus/qr_pair.py +8 -8
  15. AutoGLM_GUI/adb_plus/screenshot.py +22 -1
  16. AutoGLM_GUI/adb_plus/serial.py +38 -20
  17. AutoGLM_GUI/adb_plus/touch.py +4 -9
  18. AutoGLM_GUI/agents/__init__.py +51 -0
  19. AutoGLM_GUI/agents/events.py +19 -0
  20. AutoGLM_GUI/agents/factory.py +153 -0
  21. AutoGLM_GUI/agents/glm/__init__.py +7 -0
  22. AutoGLM_GUI/agents/glm/agent.py +292 -0
  23. AutoGLM_GUI/agents/glm/message_builder.py +81 -0
  24. AutoGLM_GUI/agents/glm/parser.py +110 -0
  25. AutoGLM_GUI/agents/glm/prompts_en.py +77 -0
  26. AutoGLM_GUI/agents/glm/prompts_zh.py +75 -0
  27. AutoGLM_GUI/agents/mai/__init__.py +28 -0
  28. AutoGLM_GUI/agents/mai/agent.py +405 -0
  29. AutoGLM_GUI/agents/mai/parser.py +254 -0
  30. AutoGLM_GUI/agents/mai/prompts.py +103 -0
  31. AutoGLM_GUI/agents/mai/traj_memory.py +91 -0
  32. AutoGLM_GUI/agents/protocols.py +27 -0
  33. AutoGLM_GUI/agents/stream_runner.py +188 -0
  34. AutoGLM_GUI/api/__init__.py +71 -11
  35. AutoGLM_GUI/api/agents.py +190 -229
  36. AutoGLM_GUI/api/control.py +9 -6
  37. AutoGLM_GUI/api/devices.py +112 -28
  38. AutoGLM_GUI/api/health.py +13 -0
  39. AutoGLM_GUI/api/history.py +78 -0
  40. AutoGLM_GUI/api/layered_agent.py +306 -181
  41. AutoGLM_GUI/api/mcp.py +11 -10
  42. AutoGLM_GUI/api/media.py +64 -1
  43. AutoGLM_GUI/api/scheduled_tasks.py +98 -0
  44. AutoGLM_GUI/api/version.py +23 -10
  45. AutoGLM_GUI/api/workflows.py +2 -1
  46. AutoGLM_GUI/config.py +72 -14
  47. AutoGLM_GUI/config_manager.py +98 -27
  48. AutoGLM_GUI/device_adapter.py +263 -0
  49. AutoGLM_GUI/device_manager.py +248 -29
  50. AutoGLM_GUI/device_protocol.py +266 -0
  51. AutoGLM_GUI/devices/__init__.py +49 -0
  52. AutoGLM_GUI/devices/adb_device.py +200 -0
  53. AutoGLM_GUI/devices/mock_device.py +185 -0
  54. AutoGLM_GUI/devices/remote_device.py +177 -0
  55. AutoGLM_GUI/exceptions.py +3 -3
  56. AutoGLM_GUI/history_manager.py +164 -0
  57. AutoGLM_GUI/i18n.py +81 -0
  58. AutoGLM_GUI/metrics.py +13 -20
  59. AutoGLM_GUI/model/__init__.py +5 -0
  60. AutoGLM_GUI/model/message_builder.py +69 -0
  61. AutoGLM_GUI/model/types.py +24 -0
  62. AutoGLM_GUI/models/__init__.py +10 -0
  63. AutoGLM_GUI/models/history.py +96 -0
  64. AutoGLM_GUI/models/scheduled_task.py +71 -0
  65. AutoGLM_GUI/parsers/__init__.py +22 -0
  66. AutoGLM_GUI/parsers/base.py +50 -0
  67. AutoGLM_GUI/parsers/phone_parser.py +58 -0
  68. AutoGLM_GUI/phone_agent_manager.py +118 -367
  69. AutoGLM_GUI/platform_utils.py +31 -2
  70. AutoGLM_GUI/prompt_config.py +15 -0
  71. AutoGLM_GUI/prompts/__init__.py +32 -0
  72. AutoGLM_GUI/scheduler_manager.py +304 -0
  73. AutoGLM_GUI/schemas.py +272 -63
  74. AutoGLM_GUI/scrcpy_stream.py +159 -37
  75. AutoGLM_GUI/server.py +3 -1
  76. AutoGLM_GUI/socketio_server.py +114 -29
  77. AutoGLM_GUI/state.py +10 -30
  78. AutoGLM_GUI/static/assets/{about-DeclntHg.js → about-BQm96DAl.js} +1 -1
  79. AutoGLM_GUI/static/assets/alert-dialog-B42XxGPR.js +1 -0
  80. AutoGLM_GUI/static/assets/chat-C0L2gQYG.js +129 -0
  81. AutoGLM_GUI/static/assets/circle-alert-D4rSJh37.js +1 -0
  82. AutoGLM_GUI/static/assets/dialog-DZ78cEcj.js +45 -0
  83. AutoGLM_GUI/static/assets/history-DFBv7TGc.js +1 -0
  84. AutoGLM_GUI/static/assets/index-Bzyv2yQ2.css +1 -0
  85. AutoGLM_GUI/static/assets/{index-zQ4KKDHt.js → index-CmZSnDqc.js} +1 -1
  86. AutoGLM_GUI/static/assets/index-CssG-3TH.js +11 -0
  87. AutoGLM_GUI/static/assets/label-BCUzE_nm.js +1 -0
  88. AutoGLM_GUI/static/assets/logs-eoFxn5of.js +1 -0
  89. AutoGLM_GUI/static/assets/popover-DLsuV5Sx.js +1 -0
  90. AutoGLM_GUI/static/assets/scheduled-tasks-MyqGJvy_.js +1 -0
  91. AutoGLM_GUI/static/assets/square-pen-zGWYrdfj.js +1 -0
  92. AutoGLM_GUI/static/assets/textarea-BX6y7uM5.js +1 -0
  93. AutoGLM_GUI/static/assets/workflows-CYFs6ssC.js +1 -0
  94. AutoGLM_GUI/static/index.html +2 -2
  95. AutoGLM_GUI/types.py +142 -0
  96. {autoglm_gui-1.4.0.dist-info → autoglm_gui-1.5.0.dist-info}/METADATA +178 -92
  97. autoglm_gui-1.5.0.dist-info/RECORD +157 -0
  98. mai_agent/base.py +137 -0
  99. mai_agent/mai_grounding_agent.py +263 -0
  100. mai_agent/mai_naivigation_agent.py +526 -0
  101. mai_agent/prompt.py +148 -0
  102. mai_agent/unified_memory.py +67 -0
  103. mai_agent/utils.py +73 -0
  104. AutoGLM_GUI/api/dual_model.py +0 -311
  105. AutoGLM_GUI/dual_model/__init__.py +0 -53
  106. AutoGLM_GUI/dual_model/decision_model.py +0 -664
  107. AutoGLM_GUI/dual_model/dual_agent.py +0 -917
  108. AutoGLM_GUI/dual_model/protocols.py +0 -354
  109. AutoGLM_GUI/dual_model/vision_model.py +0 -442
  110. AutoGLM_GUI/mai_ui_adapter/agent_wrapper.py +0 -291
  111. AutoGLM_GUI/phone_agent_patches.py +0 -146
  112. AutoGLM_GUI/static/assets/chat-Iut2yhSw.js +0 -125
  113. AutoGLM_GUI/static/assets/dialog-BfdcBs1x.js +0 -45
  114. AutoGLM_GUI/static/assets/index-5hCCwHA7.css +0 -1
  115. AutoGLM_GUI/static/assets/index-DHF1NZh0.js +0 -12
  116. AutoGLM_GUI/static/assets/workflows-xiplap-r.js +0 -1
  117. autoglm_gui-1.4.0.dist-info/RECORD +0 -100
  118. {autoglm_gui-1.4.0.dist-info → autoglm_gui-1.5.0.dist-info}/WHEEL +0 -0
  119. {autoglm_gui-1.4.0.dist-info → autoglm_gui-1.5.0.dist-info}/entry_points.txt +0 -0
  120. {autoglm_gui-1.4.0.dist-info → autoglm_gui-1.5.0.dist-info}/licenses/LICENSE +0 -0
@@ -1,291 +0,0 @@
- """MAI-UI PhoneAgent wrapper for compatibility with AutoGLM-GUI interface."""
-
- from dataclasses import dataclass
- from typing import Any, Callable, Optional
-
- from phone_agent.agent import AgentConfig, StepResult
- from phone_agent.actions.handler import ActionHandler
- from phone_agent.model import ModelConfig
-
- from AutoGLM_GUI.logger import logger
- from AutoGLM_GUI.mai_ui.mai_navigation_agent import MAIUINaivigationAgent
- from AutoGLM_GUI.mai_ui_adapter.action_adapter import MAIUIActionAdapter
-
-
- @dataclass
- class MAIUIConfig:
-     """MAI-UI specific configuration."""
-
-     history_n: int = 3
-     temperature: float = 0.0
-     top_k: int = -1
-     top_p: float = 1.0
-     max_tokens: int = 2048
-
-
- class MAIUIPhoneAgent:
-     """
-     MAI-UI Agent wrapper that implements the PhoneAgent interface.
-
-     This wrapper allows MAI-UI agents to be used transparently in place of
-     the standard PhoneAgent, providing compatibility with the existing
-     PhoneAgentManager and API infrastructure.
-
-     Usage:
-         agent = MAIUIPhoneAgent(
-             model_config=model_config,
-             agent_config=agent_config,
-         )
-         result = agent.run("Open WeChat")
-     """
-
-     def __init__(
-         self,
-         model_config: ModelConfig,
-         agent_config: AgentConfig,
-         mai_config: Optional[MAIUIConfig] = None,
-         takeover_callback: Optional[Callable[[str], None]] = None,
-     ):
-         """
-         Initialize MAI-UI PhoneAgent wrapper.
-
-         Args:
-             model_config: Model configuration (base_url, api_key, model_name).
-             agent_config: Agent configuration (device_id, max_steps, etc.).
-             mai_config: MAI-UI specific configuration.
-             takeover_callback: Callback for takeover requests.
-         """
-         self.model_config = model_config
-         self.agent_config = agent_config
-         self.mai_config = mai_config or MAIUIConfig()
-
-         # Create MAI-UI navigation agent
-         self._mai_agent = MAIUINaivigationAgent(
-             llm_base_url=model_config.base_url,
-             model_name=model_config.model_name,
-             api_key=model_config.api_key,
-             runtime_conf={
-                 "history_n": self.mai_config.history_n,
-                 "temperature": self.mai_config.temperature,
-                 "top_k": self.mai_config.top_k,
-                 "top_p": self.mai_config.top_p,
-                 "max_tokens": self.mai_config.max_tokens,
-             },
-         )
-
-         # Action adapter and handler
-         self._action_adapter = MAIUIActionAdapter()
-         self.action_handler = ActionHandler(
-             device_id=agent_config.device_id,
-             takeover_callback=takeover_callback,
-         )
-
-         # PhoneAgent-compatible state
-         self._context: list[dict[str, Any]] = []
-         self._step_count = 0
-         self._current_task: str = ""
-
-         # For model_client compatibility (used by streaming patches)
-         self.model_client = _DummyModelClient()
-
-         # Debug: Print model configuration for troubleshooting
-         logger.info("=" * 60)
-         logger.info("[MAI-UI Agent] Initialization")
-         logger.info(f" Device ID: {agent_config.device_id}")
-         logger.info(f" Base URL: {model_config.base_url}")
-         logger.info(f" Model: {model_config.model_name}")
-         logger.info("=" * 60)
-
-     def run(self, task: str) -> str:
-         """
-         Execute a complete task.
-
-         Args:
-             task: Natural language task description.
-
-         Returns:
-             Final message from the agent.
-         """
-         self.reset()
-         self._current_task = task
-
-         # First step
-         result = self._execute_step(task, is_first=True)
-
-         if result.finished:
-             return result.message or "Task completed"
-
-         # Continue until finished or max steps reached
-         while self._step_count < self.agent_config.max_steps:
-             result = self._execute_step(is_first=False)
-
-             if result.finished:
-                 return result.message or "Task completed"
-
-         return "Max steps reached"
-
-     def step(self, task: Optional[str] = None) -> StepResult:
-         """
-         Execute a single step.
-
-         Args:
-             task: Task description (required for first step).
-
-         Returns:
-             StepResult with step details.
-         """
-         is_first = len(self._context) == 0
-
-         if is_first:
-             if not task:
-                 raise ValueError("Task is required for the first step")
-             self._current_task = task
-
-         return self._execute_step(task, is_first)
-
-     def _execute_step(
-         self, user_prompt: Optional[str] = None, is_first: bool = False
-     ) -> StepResult:
-         """Execute a single step of the agent loop."""
-         from phone_agent.device_factory import get_device_factory
-         from PIL import Image
-         from io import BytesIO
-
-         self._step_count += 1
-         logger.info(f"[MAI-UI] Executing step {self._step_count}")
-
-         # Get screenshot
-         device_factory = get_device_factory()
-         screenshot = device_factory.get_screenshot(self.agent_config.device_id)
-
-         # Convert base64 to PIL Image
-         import base64
-
-         image_bytes = base64.b64decode(screenshot.base64_data)
-         pil_image = Image.open(BytesIO(image_bytes))
-
-         # Build observation
-         obs = {
-             "screenshot": pil_image,
-             "accessibility_tree": None,
-         }
-
-         # Get instruction
-         instruction = user_prompt or self._current_task
-
-         # Call MAI-UI predict
-         try:
-             raw_response, action_json = self._mai_agent.predict(
-                 instruction=instruction,
-                 obs=obs,
-             )
-         except Exception as e:
-             logger.error(f"[MAI-UI] Predict failed: {e}")
-             return StepResult(
-                 success=False,
-                 finished=True,
-                 action=None,
-                 thinking="",
-                 message=f"Prediction failed: {e}",
-             )
-
-         # Check for error
-         if action_json.get("action") is None:
-             logger.error("[MAI-UI] Invalid action returned")
-             return StepResult(
-                 success=False,
-                 finished=True,
-                 action=None,
-                 thinking="",
-                 message="Invalid action from model",
-             )
-
-         # Get thinking from trajectory
-         thinking = ""
-         if self._mai_agent.traj_memory.steps:
-             last_step = self._mai_agent.traj_memory.steps[-1]
-             thinking = last_step.thought or ""
-
-         # Convert action to AutoGLM-GUI format
-         converted_action = self._action_adapter.convert(action_json)
-         logger.debug(f"[MAI-UI] Converted action: {converted_action}")
-
-         # Check if finished (terminate action)
-         if converted_action.get("_metadata") == "finish":
-             return StepResult(
-                 success=True,
-                 finished=True,
-                 action=converted_action,
-                 thinking=thinking,
-                 message=converted_action.get("message", "Task completed"),
-             )
-
-         # Execute action
-         try:
-             result = self.action_handler.execute(
-                 converted_action,
-                 screenshot.width,
-                 screenshot.height,
-             )
-         except Exception as e:
-             logger.error(f"[MAI-UI] Action execution failed: {e}")
-             return StepResult(
-                 success=False,
-                 finished=False,
-                 action=converted_action,
-                 thinking=thinking,
-                 message=f"Action failed: {e}",
-             )
-
-         # Update context for compatibility
-         self._context.append(
-             {
-                 "step": self._step_count,
-                 "action": action_json,
-                 "converted_action": converted_action,
-                 "result": result.success,
-                 "thinking": thinking,
-             }
-         )
-
-         return StepResult(
-             success=result.success,
-             finished=result.should_finish,
-             action=converted_action,
-             thinking=thinking,
-             message=result.message,
-         )
-
-     def reset(self) -> None:
-         """Reset agent state for a new task."""
-         self._context = []
-         self._step_count = 0
-         self._current_task = ""
-         self._mai_agent.reset()
-         logger.debug("[MAI-UI] Agent reset")
-
-     @property
-     def step_count(self) -> int:
-         """Get current step count."""
-         return self._step_count
-
-     @property
-     def context(self) -> list[dict[str, Any]]:
-         """Get conversation context (for compatibility)."""
-         return self._context.copy()
-
-
- class _DummyModelClient:
-     """
-     Dummy model client for compatibility with streaming patches.
-
-     The actual model calls are handled by MAI-UI agent internally.
-     This exists to satisfy code that expects model_client attribute.
-     """
-
-     def request(self, messages: list, **kwargs) -> Any:
-         """Dummy request method - should not be called directly."""
-         raise NotImplementedError(
-             "MAIUIPhoneAgent handles model calls internally. "
-             "Do not call model_client.request() directly."
-         )
@@ -1,146 +0,0 @@
- """
- Monkey patches for phone_agent to add streaming functionality.
-
- This module patches the upstream phone_agent code without modifying the original files.
- """
-
- from typing import Any, Callable
-
- from phone_agent.model import ModelClient
-
-
- # Store original methods
- _original_model_request = ModelClient.request
-
-
- def _patched_model_request(
-     self,
-     messages: list[dict[str, Any]],
-     on_thinking_chunk: Callable[[str], None] | None = None,
- ) -> Any:
-     """
-     Patched version of ModelClient.request that supports streaming thinking chunks.
-
-     This wraps the original request method and adds callback support for thinking chunks.
-     """
-     import time
-
-     from phone_agent.model.client import ModelResponse
-
-     # Start timing
-     start_time = time.time()
-     time_to_first_token = None
-     time_to_thinking_end = None
-
-     stream = self.client.chat.completions.create(
-         messages=messages,
-         model=self.config.model_name,
-         max_tokens=self.config.max_tokens,
-         temperature=self.config.temperature,
-         top_p=self.config.top_p,
-         frequency_penalty=self.config.frequency_penalty,
-         extra_body=self.config.extra_body,
-         stream=True,
-     )
-
-     raw_content = ""
-     buffer = ""  # Buffer to hold content that might be part of a marker
-     action_markers = ["finish(message=", "do(action="]
-     in_action_phase = False  # Track if we've entered the action phase
-     first_token_received = False
-
-     for chunk in stream:
-         if len(chunk.choices) == 0:
-             continue
-         if chunk.choices[0].delta.content is not None:
-             content = chunk.choices[0].delta.content
-             raw_content += content
-
-             # Record time to first token
-             if not first_token_received:
-                 time_to_first_token = time.time() - start_time
-                 first_token_received = True
-
-             if in_action_phase:
-                 # Already in action phase, just accumulate content without printing
-                 continue
-
-             buffer += content
-
-             # Check if any marker is fully present in buffer
-             marker_found = False
-             for marker in action_markers:
-                 if marker in buffer:
-                     # Marker found, print everything before it
-                     thinking_part = buffer.split(marker, 1)[0]
-                     print(thinking_part, end="", flush=True)
-                     if on_thinking_chunk:
-                         on_thinking_chunk(thinking_part)
-                     print()  # Print newline after thinking is complete
-                     in_action_phase = True
-                     marker_found = True
-
-                     # Record time to thinking end
-                     if time_to_thinking_end is None:
-                         time_to_thinking_end = time.time() - start_time
-
-                     break
-
-             if marker_found:
-                 continue  # Continue to collect remaining content
-
-             # Check if buffer ends with a prefix of any marker
-             # If so, don't print yet (wait for more content)
-             is_potential_marker = False
-             for marker in action_markers:
-                 for i in range(1, len(marker)):
-                     if buffer.endswith(marker[:i]):
-                         is_potential_marker = True
-                         break
-                 if is_potential_marker:
-                     break
-
-             if not is_potential_marker:
-                 # Safe to print the buffer
-                 print(buffer, end="", flush=True)
-                 if on_thinking_chunk:
-                     on_thinking_chunk(buffer)
-                 buffer = ""
-
-     # Calculate total time
-     total_time = time.time() - start_time
-
-     # Parse thinking and action from response
-     thinking, action = self._parse_response(raw_content)
-
-     # Print performance metrics
-     from phone_agent.config.i18n import get_message
-
-     lang = self.config.lang
-     print()
-     print("=" * 50)
-     print(f"⏱️ {get_message('performance_metrics', lang)}:")
-     print("-" * 50)
-     if time_to_first_token is not None:
-         print(f"{get_message('time_to_first_token', lang)}: {time_to_first_token:.3f}s")
-     if time_to_thinking_end is not None:
-         print(
-             f"{get_message('time_to_thinking_end', lang)}: {time_to_thinking_end:.3f}s"
-         )
-     print(f"{get_message('total_inference_time', lang)}: {total_time:.3f}s")
-     print("=" * 50)
-
-     return ModelResponse(
-         thinking=thinking,
-         action=action,
-         raw_content=raw_content,
-         time_to_first_token=time_to_first_token,
-         time_to_thinking_end=time_to_thinking_end,
-         total_time=total_time,
-     )
-
-
- def apply_patches():
-     """Apply all monkey patches to phone_agent."""
-     # Patch ModelClient.request to support streaming callbacks
-     ModelClient.request = _patched_model_request