PyPI - autoglm-gui - Versions diffs - 1.4.0__py3-none-any.whl → 1.5.0__py3-none-any.whl - Mend

autoglm-gui 1.4.0__py3-none-any.whl → 1.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (120) hide show

AutoGLM_GUI/__init__.py +11 -0
AutoGLM_GUI/__main__.py +26 -8
AutoGLM_GUI/actions/__init__.py +6 -0
AutoGLM_GUI/actions/handler.py +196 -0
AutoGLM_GUI/actions/types.py +15 -0
AutoGLM_GUI/adb/__init__.py +53 -0
AutoGLM_GUI/adb/apps.py +227 -0
AutoGLM_GUI/adb/connection.py +323 -0
AutoGLM_GUI/adb/device.py +171 -0
AutoGLM_GUI/adb/input.py +67 -0
AutoGLM_GUI/adb/screenshot.py +11 -0
AutoGLM_GUI/adb/timing.py +167 -0
AutoGLM_GUI/adb_plus/keyboard_installer.py +4 -2
AutoGLM_GUI/adb_plus/qr_pair.py +8 -8
AutoGLM_GUI/adb_plus/screenshot.py +22 -1
AutoGLM_GUI/adb_plus/serial.py +38 -20
AutoGLM_GUI/adb_plus/touch.py +4 -9
AutoGLM_GUI/agents/__init__.py +51 -0
AutoGLM_GUI/agents/events.py +19 -0
AutoGLM_GUI/agents/factory.py +153 -0
AutoGLM_GUI/agents/glm/__init__.py +7 -0
AutoGLM_GUI/agents/glm/agent.py +292 -0
AutoGLM_GUI/agents/glm/message_builder.py +81 -0
AutoGLM_GUI/agents/glm/parser.py +110 -0
AutoGLM_GUI/agents/glm/prompts_en.py +77 -0
AutoGLM_GUI/agents/glm/prompts_zh.py +75 -0
AutoGLM_GUI/agents/mai/__init__.py +28 -0
AutoGLM_GUI/agents/mai/agent.py +405 -0
AutoGLM_GUI/agents/mai/parser.py +254 -0
AutoGLM_GUI/agents/mai/prompts.py +103 -0
AutoGLM_GUI/agents/mai/traj_memory.py +91 -0
AutoGLM_GUI/agents/protocols.py +27 -0
AutoGLM_GUI/agents/stream_runner.py +188 -0
AutoGLM_GUI/api/__init__.py +71 -11
AutoGLM_GUI/api/agents.py +190 -229
AutoGLM_GUI/api/control.py +9 -6
AutoGLM_GUI/api/devices.py +112 -28
AutoGLM_GUI/api/health.py +13 -0
AutoGLM_GUI/api/history.py +78 -0
AutoGLM_GUI/api/layered_agent.py +306 -181
AutoGLM_GUI/api/mcp.py +11 -10
AutoGLM_GUI/api/media.py +64 -1
AutoGLM_GUI/api/scheduled_tasks.py +98 -0
AutoGLM_GUI/api/version.py +23 -10
AutoGLM_GUI/api/workflows.py +2 -1
AutoGLM_GUI/config.py +72 -14
AutoGLM_GUI/config_manager.py +98 -27
AutoGLM_GUI/device_adapter.py +263 -0
AutoGLM_GUI/device_manager.py +248 -29
AutoGLM_GUI/device_protocol.py +266 -0
AutoGLM_GUI/devices/__init__.py +49 -0
AutoGLM_GUI/devices/adb_device.py +200 -0
AutoGLM_GUI/devices/mock_device.py +185 -0
AutoGLM_GUI/devices/remote_device.py +177 -0
AutoGLM_GUI/exceptions.py +3 -3
AutoGLM_GUI/history_manager.py +164 -0
AutoGLM_GUI/i18n.py +81 -0
AutoGLM_GUI/metrics.py +13 -20
AutoGLM_GUI/model/__init__.py +5 -0
AutoGLM_GUI/model/message_builder.py +69 -0
AutoGLM_GUI/model/types.py +24 -0
AutoGLM_GUI/models/__init__.py +10 -0
AutoGLM_GUI/models/history.py +96 -0
AutoGLM_GUI/models/scheduled_task.py +71 -0
AutoGLM_GUI/parsers/__init__.py +22 -0
AutoGLM_GUI/parsers/base.py +50 -0
AutoGLM_GUI/parsers/phone_parser.py +58 -0
AutoGLM_GUI/phone_agent_manager.py +118 -367
AutoGLM_GUI/platform_utils.py +31 -2
AutoGLM_GUI/prompt_config.py +15 -0
AutoGLM_GUI/prompts/__init__.py +32 -0
AutoGLM_GUI/scheduler_manager.py +304 -0
AutoGLM_GUI/schemas.py +272 -63
AutoGLM_GUI/scrcpy_stream.py +159 -37
AutoGLM_GUI/server.py +3 -1
AutoGLM_GUI/socketio_server.py +114 -29
AutoGLM_GUI/state.py +10 -30
AutoGLM_GUI/static/assets/{about-DeclntHg.js → about-BQm96DAl.js} +1 -1
AutoGLM_GUI/static/assets/alert-dialog-B42XxGPR.js +1 -0
AutoGLM_GUI/static/assets/chat-C0L2gQYG.js +129 -0
AutoGLM_GUI/static/assets/circle-alert-D4rSJh37.js +1 -0
AutoGLM_GUI/static/assets/dialog-DZ78cEcj.js +45 -0
AutoGLM_GUI/static/assets/history-DFBv7TGc.js +1 -0
AutoGLM_GUI/static/assets/index-Bzyv2yQ2.css +1 -0
AutoGLM_GUI/static/assets/{index-zQ4KKDHt.js → index-CmZSnDqc.js} +1 -1
AutoGLM_GUI/static/assets/index-CssG-3TH.js +11 -0
AutoGLM_GUI/static/assets/label-BCUzE_nm.js +1 -0
AutoGLM_GUI/static/assets/logs-eoFxn5of.js +1 -0
AutoGLM_GUI/static/assets/popover-DLsuV5Sx.js +1 -0
AutoGLM_GUI/static/assets/scheduled-tasks-MyqGJvy_.js +1 -0
AutoGLM_GUI/static/assets/square-pen-zGWYrdfj.js +1 -0
AutoGLM_GUI/static/assets/textarea-BX6y7uM5.js +1 -0
AutoGLM_GUI/static/assets/workflows-CYFs6ssC.js +1 -0
AutoGLM_GUI/static/index.html +2 -2
AutoGLM_GUI/types.py +142 -0
{autoglm_gui-1.4.0.dist-info → autoglm_gui-1.5.0.dist-info}/METADATA +178 -92
autoglm_gui-1.5.0.dist-info/RECORD +157 -0
mai_agent/base.py +137 -0
mai_agent/mai_grounding_agent.py +263 -0
mai_agent/mai_naivigation_agent.py +526 -0
mai_agent/prompt.py +148 -0
mai_agent/unified_memory.py +67 -0
mai_agent/utils.py +73 -0
AutoGLM_GUI/api/dual_model.py +0 -311
AutoGLM_GUI/dual_model/__init__.py +0 -53
AutoGLM_GUI/dual_model/decision_model.py +0 -664
AutoGLM_GUI/dual_model/dual_agent.py +0 -917
AutoGLM_GUI/dual_model/protocols.py +0 -354
AutoGLM_GUI/dual_model/vision_model.py +0 -442
AutoGLM_GUI/mai_ui_adapter/agent_wrapper.py +0 -291
AutoGLM_GUI/phone_agent_patches.py +0 -146
AutoGLM_GUI/static/assets/chat-Iut2yhSw.js +0 -125
AutoGLM_GUI/static/assets/dialog-BfdcBs1x.js +0 -45
AutoGLM_GUI/static/assets/index-5hCCwHA7.css +0 -1
AutoGLM_GUI/static/assets/index-DHF1NZh0.js +0 -12
AutoGLM_GUI/static/assets/workflows-xiplap-r.js +0 -1
autoglm_gui-1.4.0.dist-info/RECORD +0 -100
{autoglm_gui-1.4.0.dist-info → autoglm_gui-1.5.0.dist-info}/WHEEL +0 -0
{autoglm_gui-1.4.0.dist-info → autoglm_gui-1.5.0.dist-info}/entry_points.txt +0 -0
{autoglm_gui-1.4.0.dist-info → autoglm_gui-1.5.0.dist-info}/licenses/LICENSE +0 -0

AutoGLM_GUI/api/layered_agent.py CHANGED Viewed

@@ -6,9 +6,13 @@ a decision model for planning and autoglm-phone for execution.
 import asyncio
 import json
-from typing import Any
+import threading
+from typing import TYPE_CHECKING, Any
 from agents import Agent, Runner, SQLiteSession, function_tool
+if TYPE_CHECKING:
+    from agents.result import RunResultStreaming
 from agents.models.openai_chatcompletions import OpenAIChatCompletionsModel
 from fastapi import APIRouter
 from fastapi.responses import StreamingResponse
@@ -24,6 +28,11 @@ router = APIRouter()
 # 存储每个 session_id 对应的 SQLiteSession（内存模式）
 _sessions: dict[str, SQLiteSession] = {}
+# ==================== 活跃运行管理 ====================
+# 存储每个 session_id 对应的活跃 RunResultStreaming 实例，用于 abort
+_active_runs: dict[str, "RunResultStreaming"] = {}
+_active_runs_lock = threading.Lock()
 def _get_or_create_session(session_id: str) -> SQLiteSession:
     """获取或创建指定 session_id 的内存 session."""
@@ -44,9 +53,20 @@ def _clear_session(session_id: str) -> bool:
 def get_planner_model() -> str:
-    """获取规划层使用的模型名称，从配置读取."""
-    config = config_manager.get_effective_config()
-    return config.decision_model_name or "glm-4.7"
+    """获取规划层使用的模型名称."""
+    config_manager.load_file_config()
+    effective_config = config_manager.get_effective_config()
+    model_name = effective_config.decision_model_name
+    if not model_name:
+        raise ValueError(
+            "决策模型未配置。使用分层代理模式需要配置决策模型。\n"
+            "请在全局配置中设置决策模型的 Base URL、模型名称和 API Key。"
+        )
+    logger.info(f"[LayeredAgent] Using decision model: {model_name}")
+    return model_name
 PLANNER_INSTRUCTIONS = """## 核心目标
@@ -146,7 +166,9 @@ def _sync_list_devices() -> str:
         _build_device_response_with_agent(d, agent_manager) for d in managed_devices
     ]
-    return json.dumps(devices_with_agents, ensure_ascii=False, indent=2)
+    # Convert DeviceResponse Pydantic models to dicts before JSON serialization
+    devices_dict = [device.model_dump() for device in devices_with_agents]
+    return json.dumps(devices_dict, ensure_ascii=False, indent=2)
 @function_tool
@@ -271,20 +293,31 @@ async def chat(device_id: str, message: str) -> str:
 def _setup_openai_client() -> AsyncOpenAI:
-    """设置 OpenAI 客户端，使用 AutoGLM 的配置"""
+    """设置 OpenAI 客户端，使用决策模型配置"""
     config_manager.load_file_config()
     effective_config = config_manager.get_effective_config()
-    if not effective_config.base_url:
-        raise ValueError("base_url not configured")
+    # 检查决策模型配置
+    decision_base_url = effective_config.decision_base_url
+    decision_api_key = effective_config.decision_api_key
-    planner_model = get_planner_model()
-    logger.info(f"[LayeredAgent] API Base URL: {effective_config.base_url}")
-    logger.info(f"[LayeredAgent] Planner Model: {planner_model}")
+    if not decision_base_url:
+        raise ValueError(
+            "决策模型 Base URL 未配置。使用分层代理模式需要配置决策模型。\n"
+            "请在全局配置中设置决策模型的 Base URL、模型名称和 API Key。"
+        )
+    # decision_api_key 可以为 None（某些本地模型不需要）
+    planner_model = get_planner_model()  # 这里会再次检查 model_name
+    logger.info("[LayeredAgent] Decision model config:")
+    logger.info(f"  - Base URL: {decision_base_url}")
+    logger.info(f"  - Model: {planner_model}")
+    logger.info(f"  - API Key: {'***' if decision_api_key else 'None'}")
     return AsyncOpenAI(
-        base_url=effective_config.base_url,
-        api_key=effective_config.api_key,
+        base_url=decision_base_url,
+        api_key=decision_api_key or "EMPTY",  # 某些本地模型需要非空字符串
     )
@@ -307,14 +340,35 @@ def _create_planner_agent(client: AsyncOpenAI) -> Agent[Any]:
 # Global agent instance (lazy initialized)
 _client: AsyncOpenAI | None = None
 _agent: Agent[Any] | None = None
+_cached_config_hash: str | None = None
+def _compute_config_hash() -> str:
+    import hashlib
+    config = config_manager.get_effective_config()
+    config_str = config.model_dump_json()
+    return hashlib.md5(config_str.encode()).hexdigest()
 def _ensure_agent() -> Agent[Any]:
-    """Ensure the planner agent is initialized."""
-    global _client, _agent
-    if _agent is None:
+    global _client, _agent, _cached_config_hash
+    current_hash = _compute_config_hash()
+    if _agent is None or _cached_config_hash != current_hash:
+        if _agent is not None and _cached_config_hash != current_hash:
+            logger.info(
+                f"[LayeredAgent] Config changed (hash: {_cached_config_hash} -> {current_hash}), reloading agent..."
+            )
         _client = _setup_openai_client()
         _agent = _create_planner_agent(_client)
+        _cached_config_hash = current_hash
+        logger.info(
+            f"[LayeredAgent] Agent initialized/reloaded with config hash: {current_hash}"
+        )
     return _agent
@@ -343,18 +397,24 @@ async def layered_agent_chat(request: LayeredAgentRequest):
     - done: Final response
     - error: Error occurred
     """
+    from datetime import datetime
     from agents.stream_events import (
         RawResponsesStreamEvent,
         RunItemStreamEvent,
     )
+    from AutoGLM_GUI.history_manager import history_manager
+    from AutoGLM_GUI.models.history import ConversationRecord
     async def event_generator():
+        start_time = datetime.now()
+        final_output = ""
+        final_success = False
         try:
-            # Ensure agent is initialized
             agent = _ensure_agent()
-            # 获取或创建 session 以保持对话上下文
-            # 优先使用 session_id，其次使用 device_id，最后使用默认值
             session_id = request.session_id or request.device_id or "default"
             session = _get_or_create_session(session_id)
@@ -366,179 +426,186 @@ async def layered_agent_chat(request: LayeredAgentRequest):
                 session=session,
             )
+            # 保存活跃运行实例，用于 abort
+            with _active_runs_lock:
+                _active_runs[session_id] = result
             current_tool_call: dict[str, Any] | None = None
-            async for event in result.stream_events():
-                if isinstance(event, RawResponsesStreamEvent):
-                    # Raw response chunk - could contain thinking
-                    pass
-                elif isinstance(event, RunItemStreamEvent):
-                    item = event.item
-                    # Handle different item types
-                    item_type = getattr(item, "type", None)
-                    if item_type == "tool_call_item":
-                        # Tool call started - extract name from raw_item
-                        tool_name = "unknown"
-                        tool_args: dict[str, Any] = {}
-                        # Try to get from raw_item
-                        if hasattr(item, "raw_item") and item.raw_item:
-                            raw = item.raw_item
-                            # Handle dict format (sometimes returned as dict)
-                            if isinstance(raw, dict):
-                                tool_name = raw.get(
-                                    "name",
-                                    raw.get("function", {}).get("name", "unknown"),
-                                )
-                                args_str = raw.get(
-                                    "arguments",
-                                    raw.get("function", {}).get("arguments", "{}"),
-                                )
-                                try:
-                                    tool_args = (
-                                        json.loads(args_str)
-                                        if isinstance(args_str, str)
-                                        else args_str
+            try:
+                async for event in result.stream_events():
+                    if isinstance(event, RawResponsesStreamEvent):
+                        # Raw response chunk - could contain thinking
+                        pass
+                    elif isinstance(event, RunItemStreamEvent):
+                        item = event.item
+                        # Handle different item types
+                        item_type = getattr(item, "type", None)
+                        if item_type == "tool_call_item":
+                            # Tool call started - extract name from raw_item
+                            tool_name = "unknown"
+                            tool_args: dict[str, Any] = {}
+                            # Try to get from raw_item
+                            if hasattr(item, "raw_item") and item.raw_item:
+                                raw = item.raw_item
+                                # Handle dict format (sometimes returned as dict)
+                                if isinstance(raw, dict):
+                                    tool_name = raw.get(
+                                        "name",
+                                        raw.get("function", {}).get("name", "unknown"),
                                     )
-                                except Exception:
-                                    tool_args = {"raw": str(args_str)}
-                            else:
-                                # Chat Completions API format: raw_item.function.name
-                                if hasattr(raw, "function") and raw.function:
-                                    func = raw.function
-                                    if hasattr(func, "name"):
-                                        tool_name = func.name
-                                    if hasattr(func, "arguments"):
-                                        try:
-                                            tool_args = (
-                                                json.loads(func.arguments)
-                                                if isinstance(func.arguments, str)
-                                                else func.arguments
-                                            )
-                                        except Exception:
-                                            tool_args = {"raw": str(func.arguments)}
-                                # Responses API format: raw_item.name directly
-                                elif hasattr(raw, "name") and raw.name:
-                                    tool_name = raw.name
-                                    if hasattr(raw, "arguments"):
-                                        try:
-                                            tool_args = (
-                                                json.loads(raw.arguments)
-                                                if isinstance(raw.arguments, str)
-                                                else raw.arguments
-                                            )
-                                        except Exception:
-                                            tool_args = {"raw": str(raw.arguments)}
-                        # Fallback to direct item attributes
-                        if tool_name == "unknown":
-                            if hasattr(item, "name") and item.name:
-                                tool_name = item.name
-                            elif hasattr(item, "call") and item.call:
-                                call = item.call
-                                if hasattr(call, "function") and call.function:
-                                    if hasattr(call.function, "name"):
-                                        tool_name = call.function.name
-                                    if hasattr(call.function, "arguments"):
-                                        try:
-                                            tool_args = (
-                                                json.loads(call.function.arguments)
-                                                if isinstance(
-                                                    call.function.arguments, str
+                                    args_str = raw.get(
+                                        "arguments",
+                                        raw.get("function", {}).get("arguments", "{}"),
+                                    )
+                                    try:
+                                        tool_args = (
+                                            json.loads(args_str)
+                                            if isinstance(args_str, str)
+                                            else args_str
+                                        )
+                                    except Exception:
+                                        tool_args = {"raw": str(args_str)}
+                                else:
+                                    func = getattr(raw, "function", None)
+                                    if func:
+                                        tool_name = getattr(func, "name", "unknown")
+                                        args_val = getattr(func, "arguments", None)
+                                        if args_val:
+                                            try:
+                                                tool_args = (
+                                                    json.loads(args_val)
+                                                    if isinstance(args_val, str)
+                                                    else args_val
+                                                )
+                                            except Exception:
+                                                tool_args = {"raw": str(args_val)}
+                                    else:
+                                        name_val = getattr(raw, "name", None)
+                                        if name_val:
+                                            tool_name = name_val
+                                            args_val = getattr(raw, "arguments", None)
+                                            if args_val:
+                                                try:
+                                                    tool_args = (
+                                                        json.loads(args_val)
+                                                        if isinstance(args_val, str)
+                                                        else args_val
+                                                    )
+                                                except Exception:
+                                                    tool_args = {"raw": str(args_val)}
+                            # Fallback to direct item attributes
+                            if tool_name == "unknown":
+                                if hasattr(item, "name") and item.name:
+                                    tool_name = item.name
+                                elif hasattr(item, "call") and item.call:
+                                    call = item.call
+                                    if hasattr(call, "function") and call.function:
+                                        if hasattr(call.function, "name"):
+                                            tool_name = call.function.name
+                                        if hasattr(call.function, "arguments"):
+                                            try:
+                                                tool_args = (
+                                                    json.loads(call.function.arguments)
+                                                    if isinstance(
+                                                        call.function.arguments, str
+                                                    )
+                                                    else call.function.arguments
+                                                )
+                                            except Exception:
+                                                tool_args = {
+                                                    "raw": str(call.function.arguments)
+                                                }
+                                    elif hasattr(call, "name"):
+                                        tool_name = call.name
+                                        if hasattr(call, "arguments"):
+                                            try:
+                                                tool_args = (
+                                                    json.loads(call.arguments)
+                                                    if isinstance(call.arguments, str)
+                                                    else call.arguments
                                                 )
-                                                else call.function.arguments
-                                            )
-                                        except Exception:
-                                            tool_args = {
-                                                "raw": str(call.function.arguments)
-                                            }
-                                elif hasattr(call, "name"):
-                                    tool_name = call.name
-                                    if hasattr(call, "arguments"):
-                                        try:
-                                            tool_args = (
-                                                json.loads(call.arguments)
-                                                if isinstance(call.arguments, str)
-                                                else call.arguments
-                                            )
-                                        except Exception:
-                                            tool_args = {"raw": str(call.arguments)}
-                        logger.info(
-                            f"[LayeredAgent] Tool call: {tool_name}, args keys: {list(tool_args.keys()) if isinstance(tool_args, dict) else 'not dict'}"
-                        )
-                        current_tool_call = {
-                            "name": tool_name,
-                            "args": tool_args,
-                        }
-                        event_data = {
-                            "type": "tool_call",
-                            "tool_name": tool_name,
-                            "tool_args": tool_args,
-                        }
-                        yield f"data: {json.dumps(event_data, ensure_ascii=False)}\n\n"
-                    elif item_type == "tool_call_output_item":
-                        # Tool call result
-                        output = getattr(item, "output", "")
-                        # Get tool name from current_tool_call or try to extract from item
-                        tool_name = (
-                            current_tool_call["name"]
-                            if current_tool_call
-                            else "unknown"
-                        )
-                        # Try to get tool name from raw_item if available
-                        if (
-                            tool_name == "unknown"
-                            and hasattr(item, "raw_item")
-                            and item.raw_item
-                        ):
-                            if hasattr(item.raw_item, "name"):
-                                tool_name = item.raw_item.name
-                        logger.info(
-                            f"[LayeredAgent] Tool result for {tool_name}: {str(output)[:100] if output else 'empty'}..."
-                        )
-                        event_data = {
-                            "type": "tool_result",
-                            "tool_name": tool_name,
-                            "result": output,
-                        }
-                        yield f"data: {json.dumps(event_data, ensure_ascii=False)}\n\n"
-                        current_tool_call = None
-                    elif item_type == "message_output_item":
-                        # Final message
-                        content = ""
-                        if hasattr(item, "raw_item") and item.raw_item:
-                            if (
-                                hasattr(item.raw_item, "content")
-                                and item.raw_item.content
-                            ):
-                                for c in item.raw_item.content:
-                                    if hasattr(c, "text"):
-                                        content += c.text
-                        if content:
+                                            except Exception:
+                                                tool_args = {"raw": str(call.arguments)}
+                            logger.info(
+                                f"[LayeredAgent] Tool call: {tool_name}, args keys: {list(tool_args.keys()) if isinstance(tool_args, dict) else 'not dict'}"
+                            )
+                            current_tool_call = {
+                                "name": tool_name,
+                                "args": tool_args,
+                            }
                             event_data = {
-                                "type": "message",
-                                "content": content,
+                                "type": "tool_call",
+                                "tool_name": tool_name,
+                                "tool_args": tool_args,
                             }
                             yield f"data: {json.dumps(event_data, ensure_ascii=False)}\n\n"
-            # Final result
+                        elif item_type == "tool_call_output_item":
+                            # Tool call result
+                            output = getattr(item, "output", "")
+                            # Get tool name from current_tool_call or try to extract from item
+                            tool_name = (
+                                current_tool_call["name"]
+                                if current_tool_call
+                                else "unknown"
+                            )
+                            raw_item = getattr(item, "raw_item", None)
+                            if tool_name == "unknown" and raw_item:
+                                name_val = getattr(raw_item, "name", None)
+                                if name_val:
+                                    tool_name = name_val
+                            logger.info(
+                                f"[LayeredAgent] Tool result for {tool_name}: {str(output)[:100] if output else 'empty'}..."
+                            )
+                            event_data = {
+                                "type": "tool_result",
+                                "tool_name": tool_name,
+                                "result": output,
+                            }
+                            yield f"data: {json.dumps(event_data, ensure_ascii=False)}\n\n"
+                            current_tool_call = None
+                        elif item_type == "message_output_item":
+                            content = ""
+                            raw_item = getattr(item, "raw_item", None)
+                            if raw_item:
+                                raw_content = getattr(raw_item, "content", None)
+                                if raw_content:
+                                    for c in raw_content:
+                                        text_val = getattr(c, "text", None)
+                                        if text_val:
+                                            content += text_val
+                            if content:
+                                event_data = {
+                                    "type": "message",
+                                    "content": content,
+                                }
+                                yield f"data: {json.dumps(event_data, ensure_ascii=False)}\n\n"
+            finally:
+                # 清理活跃运行实例
+                with _active_runs_lock:
+                    _active_runs.pop(session_id, None)
             final_output = (
                 result.final_output if hasattr(result, "final_output") else ""
             )
+            final_success = True
             event_data = {
                 "type": "done",
                 "content": final_output,
@@ -548,12 +615,36 @@ async def layered_agent_chat(request: LayeredAgentRequest):
         except Exception as e:
             logger.exception(f"[LayeredAgent] Error: {e}")
+            final_output = str(e)
+            final_success = False
             event_data = {
                 "type": "error",
                 "message": str(e),
             }
             yield f"data: {json.dumps(event_data, ensure_ascii=False)}\n\n"
+        finally:
+            if request.device_id and final_output:
+                from AutoGLM_GUI.device_manager import DeviceManager
+                device_manager = DeviceManager.get_instance()
+                serialno = device_manager.get_serial_by_device_id(request.device_id)
+                if serialno:
+                    end_time = datetime.now()
+                    record = ConversationRecord(
+                        task_text=request.message,
+                        final_message=final_output,
+                        success=final_success,
+                        steps=0,
+                        start_time=start_time,
+                        end_time=end_time,
+                        duration_ms=int((end_time - start_time).total_seconds() * 1000),
+                        source="layered",
+                        source_detail=request.session_id or "",
+                        error_message=None if final_success else final_output,
+                    )
+                    history_manager.add_record(serialno, record)
     return StreamingResponse(
         event_generator(),
         media_type="text/event-stream",
@@ -565,6 +656,40 @@ async def layered_agent_chat(request: LayeredAgentRequest):
     )
+class AbortSessionRequest(BaseModel):
+    """Request for aborting a running session."""
+    session_id: str
+@router.post("/api/layered-agent/abort")
+def abort_session(request: AbortSessionRequest):
+    """
+    Abort a running layered agent session.
+    Uses the OpenAI agents SDK's native cancel() method to stop execution.
+    """
+    session_id = request.session_id
+    with _active_runs_lock:
+        if session_id in _active_runs:
+            result = _active_runs[session_id]
+            result.cancel(mode="immediate")
+            logger.info(f"[LayeredAgent] Aborted session: {session_id}")
+            return {
+                "success": True,
+                "message": f"Session {session_id} abort signal sent",
+            }
+        else:
+            logger.warning(
+                f"[LayeredAgent] No active run found for session: {session_id}"
+            )
+            return {
+                "success": False,
+                "message": f"No active run found for session {session_id}",
+            }
 class ResetSessionRequest(BaseModel):
     """Request for resetting a session."""

AutoGLM_GUI/api/mcp.py CHANGED Viewed

@@ -1,11 +1,19 @@
 """MCP (Model Context Protocol) tools for AutoGLM-GUI."""
-from typing import Any, Dict, List
+from typing_extensions import TypedDict
 from fastmcp import FastMCP
 from AutoGLM_GUI.logger import logger
 from AutoGLM_GUI.prompts import MCP_SYSTEM_PROMPT_ZH
+from AutoGLM_GUI.schemas import DeviceResponse
+class ChatResult(TypedDict):
+    result: str
+    steps: int
+    success: bool
 # 创建 MCP 服务器实例
 mcp = FastMCP("AutoGLM-GUI MCP Server")
@@ -15,7 +23,7 @@ MCP_MAX_STEPS = 5
 @mcp.tool()
-def chat(device_id: str, message: str) -> Dict[str, Any]:
+def chat(device_id: str, message: str) -> ChatResult:
     """
     Send a task to the AutoGLM Phone Agent for execution.
@@ -26,13 +34,6 @@ def chat(device_id: str, message: str) -> Dict[str, Any]:
     Args:
         device_id: Device identifier (e.g., "192.168.1.100:5555" or serial)
         message: Natural language task (e.g., "打开微信", "发送消息")
-    Returns:
-        {
-            "result": str,    # Task execution result
-            "steps": int,     # Number of steps taken
-            "success": bool   # Success flag
-        }
     """
     from AutoGLM_GUI.exceptions import DeviceBusyError
     from AutoGLM_GUI.phone_agent_manager import PhoneAgentManager
@@ -84,7 +85,7 @@ def chat(device_id: str, message: str) -> Dict[str, Any]:
 @mcp.tool()
-def list_devices() -> List[Dict[str, Any]]:
+def list_devices() -> list[DeviceResponse]:
     """
     List all connected ADB devices and their agent status.

autoglm-gui 1.4.0__py3-none-any.whl → 1.5.0__py3-none-any.whl

autoglm-gui 1.4.0__py3-none-any.whl → 1.5.0__py3-none-any.whl