PyPI - aury-agent - Versions diffs - 0.0.4__py3-none-any.whl → 0.0.5__py3-none-any.whl - Mend

aury-agent: aury_agent-0.0.4-py3-none-any.whl → aury_agent-0.0.5-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (34)

aury/agents/context_providers/message.py +8 -5
aury/agents/core/base.py +11 -0
aury/agents/core/factory.py +8 -0
aury/agents/core/parallel.py +26 -4
aury/agents/core/state.py +25 -0
aury/agents/core/types/tool.py +1 -0
aury/agents/hitl/ask_user.py +44 -0
aury/agents/llm/adapter.py +55 -26
aury/agents/llm/openai.py +5 -1
aury/agents/memory/manager.py +33 -2
aury/agents/messages/store.py +27 -1
aury/agents/middleware/base.py +57 -0
aury/agents/middleware/chain.py +81 -18
aury/agents/react/agent.py +161 -1484
aury/agents/react/context.py +309 -0
aury/agents/react/factory.py +301 -0
aury/agents/react/pause.py +241 -0
aury/agents/react/persistence.py +182 -0
aury/agents/react/step.py +680 -0
aury/agents/react/tools.py +318 -0
aury/agents/tool/builtin/bash.py +11 -0
aury/agents/tool/builtin/delegate.py +38 -3
aury/agents/tool/builtin/edit.py +16 -0
aury/agents/tool/builtin/plan.py +19 -0
aury/agents/tool/builtin/read.py +13 -0
aury/agents/tool/builtin/thinking.py +10 -4
aury/agents/tool/builtin/yield_result.py +9 -6
aury/agents/tool/set.py +23 -0
aury/agents/workflow/adapter.py +22 -3
aury/agents/workflow/executor.py +51 -7
{aury_agent-0.0.4.dist-info → aury_agent-0.0.5.dist-info}/METADATA +1 -1
{aury_agent-0.0.4.dist-info → aury_agent-0.0.5.dist-info}/RECORD +34 -28
{aury_agent-0.0.4.dist-info → aury_agent-0.0.5.dist-info}/WHEEL +0 -0
{aury_agent-0.0.4.dist-info → aury_agent-0.0.5.dist-info}/entry_points.txt +0 -0

aury/agents/react/agent.py CHANGED

@@ -9,31 +9,33 @@ All services (llm, tools, storage, etc.) are accessed through ctx.
 from __future__ import annotations
 import asyncio
-import json
-from dataclasses import asdict
 from datetime import datetime
 from typing import Any, AsyncIterator, ClassVar, Literal, TYPE_CHECKING
-from ..core.base import AgentConfig, BaseAgent, ToolInjectionMode
+from ..core.base import AgentConfig, BaseAgent
 from ..core.context import InvocationContext
 from ..core.logging import react_logger as logger
 from ..core.event_bus import Events
-from ..context_providers import ContextProvider, AgentContext
+from ..context_providers import AgentContext
 from ..core.types.block import BlockEvent, BlockKind, BlockOp
-from ..llm import LLMMessage, ToolDefinition
+from ..llm import LLMMessage
 from ..middleware import HookAction
 from ..core.types import (
     Invocation,
     InvocationState,
     PromptInput,
-    ToolContext,
-    ToolResult,
     ToolInvocation,
-    ToolInvocationState,
     generate_id,
 )
-from ..core.state import State
-from ..core.signals import SuspendSignal, HITLSuspend
+from ..core.signals import SuspendSignal
+# Import helper modules
+from . import context as ctx_helpers
+from . import step as step_helpers
+from . import tools as tool_helpers
+from . import persistence as persist_helpers
+from . import pause as pause_helpers
+from .factory import SessionNotFoundError, create_react_agent, restore_react_agent
 if TYPE_CHECKING:
     from ..llm import LLMProvider
@@ -41,17 +43,12 @@ if TYPE_CHECKING:
     from ..core.types.tool import BaseTool
     from ..core.types.session import Session
     from ..backends import Backends
-    from ..backends.state import StateBackend
     from ..backends.snapshot import SnapshotBackend
     from ..backends.subagent import AgentConfig as SubAgentConfig
     from ..core.event_bus import Bus
     from ..middleware import MiddlewareChain, Middleware
     from ..memory import MemoryManager
-class SessionNotFoundError(Exception):
-    """Raised when session is not found in storage."""
-    pass
+    from ..context_providers import ContextProvider
 class ReactAgent(BaseAgent):
@@ -76,6 +73,8 @@ class ReactAgent(BaseAgent):
     # Class-level config
     agent_type: ClassVar[Literal["react", "workflow"]] = "react"
+    # ========== Factory methods (delegate to factory.py) ==========
     @classmethod
     def create(
         cls,
@@ -90,145 +89,28 @@ class ReactAgent(BaseAgent):
         subagents: "list[SubAgentConfig] | None" = None,
         memory: "MemoryManager | None" = None,
         snapshot: "SnapshotBackend | None" = None,
-        # ContextProvider system
         context_providers: "list[ContextProvider] | None" = None,
         enable_history: bool = True,
         history_limit: int = 50,
-        # Tool customization
         delegate_tool_class: "type[BaseTool] | None" = None,
     ) -> "ReactAgent":
-        """Create ReactAgent with minimal boilerplate.
-        This is the recommended way to create a ReactAgent for simple use cases.
-        Session, Storage, and Bus are auto-created if not provided.
-        Args:
-            llm: LLM provider (required)
-            tools: Tool registry or list of tools (optional)
-            config: Agent configuration (optional)
-            backends: Backends container (recommended, auto-created if None)
-            session: Session object (auto-created if None)
-            bus: Event bus (auto-created if None)
-            middlewares: List of middlewares (auto-creates chain)
-            subagents: List of sub-agent configs (auto-creates SubAgentManager)
-            memory: Memory manager (optional)
-            snapshot: Snapshot backend (optional)
-            context_providers: Additional custom context providers (optional)
-            enable_history: Enable message history (default True)
-            history_limit: Max conversation turns to keep (default 50)
-            delegate_tool_class: Custom DelegateTool class (optional)
-        Returns:
-            Configured ReactAgent ready to run
-        Example:
-            # Minimal
-            agent = ReactAgent.create(llm=my_llm)
-            # With backends
-            agent = ReactAgent.create(
-                llm=my_llm,
-                backends=Backends.create_default(),
-            )
-            # With tools and middlewares
-            agent = ReactAgent.create(
-                llm=my_llm,
-                tools=[tool1, tool2],
-                middlewares=[MessageContainerMiddleware()],
-            )
-            # With sub-agents
-            agent = ReactAgent.create(
-                llm=my_llm,
-                subagents=[
-                    AgentConfig(key="researcher", agent=researcher_agent),
-                ],
-            )
-            # With custom context providers
-            agent = ReactAgent.create(
-                llm=my_llm,
-                tools=[tool1],
-                context_providers=[MyRAGProvider(), MyProjectProvider()],
-            )
-        """
-        from ..core.event_bus import EventBus
-        from ..core.types.session import Session, generate_id
-        from ..backends import Backends
-        from ..backends.subagent import ListSubAgentBackend
-        from ..tool import ToolSet
-        from ..tool.builtin import DelegateTool
-        from ..middleware import MiddlewareChain, MessageBackendMiddleware
-        from ..context_providers import MessageContextProvider
-        # Auto-create backends if not provided
-        if backends is None:
-            backends = Backends.create_default()
-        # Auto-create missing components
-        if session is None:
-            session = Session(id=generate_id("sess"))
-        if bus is None:
-            bus = EventBus()
-        # Create middleware chain (add MessageBackendMiddleware if history enabled)
-        middleware_chain: MiddlewareChain | None = None
-        if middlewares or enable_history:
-            middleware_chain = MiddlewareChain()
-            # Add message persistence middleware first (uses backends.message)
-            if enable_history and backends.message is not None:
-                middleware_chain.use(MessageBackendMiddleware(max_history=history_limit))
-            # Add user middlewares
-            if middlewares:
-                for mw in middlewares:
-                    middleware_chain.use(mw)
-        # === Build tools list (direct, no provider) ===
-        tool_list: list["BaseTool"] = []
-        if tools is not None:
-            if isinstance(tools, ToolSet):
-                tool_list = list(tools.all())
-            else:
-                tool_list = list(tools)
-        # Handle subagents - create DelegateTool directly
-        if subagents:
-            backend = ListSubAgentBackend(subagents)
-            tool_cls = delegate_tool_class or DelegateTool
-            delegate_tool = tool_cls(backend, middleware=middleware_chain)
-            tool_list.append(delegate_tool)
-        # === Build providers ===
-        default_providers: list["ContextProvider"] = []
-        # MessageContextProvider - for fetching history (uses backends.message)
-        if enable_history:
-            message_provider = MessageContextProvider(max_messages=history_limit * 2)
-            default_providers.append(message_provider)
-        # Combine default + custom context_providers
-        all_providers = default_providers + (context_providers or [])
-        # Build context
-        ctx = InvocationContext(
-            session=session,
-            invocation_id=generate_id("inv"),
-            agent_id=config.name if config else "react_agent",
+        """Create ReactAgent with minimal boilerplate. See factory.create_react_agent for details."""
+        return create_react_agent(
+            llm=llm,
+            tools=tools,
+            config=config,
             backends=backends,
+            session=session,
             bus=bus,
-            llm=llm,
-            middleware=middleware_chain,
+            middlewares=middlewares,
+            subagents=subagents,
             memory=memory,
             snapshot=snapshot,
+            context_providers=context_providers,
+            enable_history=enable_history,
+            history_limit=history_limit,
+            delegate_tool_class=delegate_tool_class,
         )
-        agent = cls(ctx, config)
-        agent._tools = tool_list  # Direct tools (not from context_provider)
-        agent._context_providers = all_providers
-        agent._delegate_tool_class = delegate_tool_class or DelegateTool
-        agent._middleware_chain = middleware_chain
-        return agent
     @classmethod
     async def restore(
@@ -244,113 +126,18 @@ class ReactAgent(BaseAgent):
         memory: "MemoryManager | None" = None,
         snapshot: "SnapshotBackend | None" = None,
     ) -> "ReactAgent":
-        """Restore agent from persisted state.
-        Use this to resume an agent after:
-        - Page refresh
-        - Process restart
-        - Cross-process recovery
-        Args:
-            session_id: Session ID to restore
-            llm: LLM provider
-            backends: Backends container (recommended, auto-created if None)
-            tools: Tool registry or list of tools
-            config: Agent configuration
-            bus: Event bus (auto-created if None)
-            middleware: Middleware chain
-            memory: Memory manager
-            snapshot: Snapshot backend
-        Returns:
-            Restored ReactAgent ready to continue
-        Raises:
-            SessionNotFoundError: If session not found
-        Example:
-            agent = await ReactAgent.restore(
-                session_id="sess_xxx",
-                backends=my_backends,
-                llm=my_llm,
-            )
-            # Check if waiting for HITL response
-            if agent.is_suspended:
-                print(f"Waiting for: {agent.pending_request}")
-            else:
-                # Continue conversation
-                await agent.run("Continue...")
-        """
-        from ..core.event_bus import Bus
-        from ..core.types.session import Session, Invocation, InvocationState, generate_id
-        from ..core.state import State
-        from ..tool import ToolSet
-        from ..backends import Backends
-        # Auto-create backends if not provided
-        if backends is None:
-            backends = Backends.create_default()
-        # Validate storage backend is available
-        if backends.state is None:
-            raise ValueError("Cannot restore: no storage backend available (backends.state is None)")
-        storage = backends.state
-        # 1. Load session
-        session_data = await storage.get("sessions", session_id)
-        if not session_data:
-            raise SessionNotFoundError(f"Session not found: {session_id}")
-        session = Session.from_dict(session_data)
-        # 2. Load current invocation
-        invocation: Invocation | None = None
-        if session_data.get("current_invocation_id"):
-            inv_data = await storage.get("invocations", session_data["current_invocation_id"])
-            if inv_data:
-                invocation = Invocation.from_dict(inv_data)
-        # 3. Load state
-        state = State(storage, session_id)
-        await state.restore()
-        # 4. Handle tools
-        tool_set: ToolSet | None = None
-        if tools is not None:
-            if isinstance(tools, ToolSet):
-                tool_set = tools
-            else:
-                tool_set = ToolSet()
-                for tool in tools:
-                    tool_set.add(tool)
-        else:
-            tool_set = ToolSet()
-        # 5. Create bus if needed
-        if bus is None:
-            bus = Bus()
-        # 6. Build context
-        ctx = InvocationContext(
-            session=session,
-            invocation_id=invocation.id if invocation else generate_id("inv"),
-            agent_id=config.name if config else "react_agent",
+        """Restore agent from persisted state. See factory.restore_react_agent for details."""
+        return await restore_react_agent(
+            session_id=session_id,
+            llm=llm,
             backends=backends,
+            tools=tools,
+            config=config,
             bus=bus,
-            llm=llm,
-            tools=tool_set,
             middleware=middleware,
             memory=memory,
             snapshot=snapshot,
         )
-        # 7. Create agent
-        agent = cls(ctx, config)
-        agent._restored_invocation = invocation
-        agent._state = state
-        return agent
     def __init__(
         self,
@@ -364,7 +151,7 @@ class ReactAgent(BaseAgent):
             config: Agent configuration
         Raises:
-            ValueError: If ctx.llm or ctx.tools is None
+            ValueError: If ctx.llm is None
         """
         super().__init__(ctx, config)
@@ -393,13 +180,13 @@ class ReactAgent(BaseAgent):
         # Restore support
         self._restored_invocation: "Invocation | None" = None
-        self._state: "State | None" = None
+        self._state: "Any | None" = None  # State object for checkpoint
         # Direct tools (passed to create())
         self._tools: list["BaseTool"] = []
         # ContextProviders for context engineering
-        self._context_providers: list[ContextProvider] = []
+        self._context_providers: list["ContextProvider"] = []
         # DelegateTool class and middleware for dynamic subagent handling
         self._delegate_tool_class: type | None = None
@@ -418,7 +205,7 @@ class ReactAgent(BaseAgent):
         return False
     @property
-    def state(self) -> "State | None":
+    def state(self) -> "Any | None":
         """Get session state (for checkpoint/restore)."""
         return self._state
@@ -457,6 +244,8 @@ class ReactAgent(BaseAgent):
             return self._run_config["stream_thinking"]
         return self.config.stream_thinking
+    # ========== Main execution ==========
     async def _execute(self, input: PromptInput | str) -> None:
         """Execute the React loop.
@@ -467,10 +256,6 @@ class ReactAgent(BaseAgent):
         if isinstance(input, str):
             input = PromptInput(text=input)
-        # NOTE: 如果需要 HITL 恢复到同一个 invocation（而不是创建新的），
-        # 可以检查 self._restored_invocation.state == SUSPENDED 并恢复精确状态。
-        # 当前设计：每次 run() 都创建新 invocation，HITL 回复也是新 invocation。
         self.reset()
         self._running = True
@@ -488,7 +273,7 @@ class ReactAgent(BaseAgent):
             "session_id": self.session.id,
             "agent_id": self.name,
             "agent_type": self.agent_type,
-            "emit": global_emit,  # For middleware to emit ActionEvent
+            "emit": global_emit,
             "backends": self.ctx.backends,
         }
@@ -502,15 +287,19 @@ class ReactAgent(BaseAgent):
             )
             mw_context["invocation_id"] = self._current_invocation.id
-            logger.debug("Created invocation", extra={"invocation_id": self._current_invocation.id})
+            logger.info("Created invocation", extra={"invocation_id": self._current_invocation.id})
             # === Middleware: on_agent_start ===
             if self.middleware:
+                logger.info(
+                    "Calling middleware: on_agent_start",
+                    extra={"invocation_id": self._current_invocation.id},
+                )
                 hook_result = await self.middleware.process_agent_start(
                     self.name, input, mw_context
                 )
                 if hook_result.action == HookAction.STOP:
-                    logger.info("Agent stopped by middleware on_agent_start")
+                    logger.warning("Agent stopped by middleware on_agent_start", extra={"invocation_id": self._current_invocation.id})
                     await self.ctx.emit(BlockEvent(
                         kind=BlockKind.ERROR,
                         op=BlockOp.APPLY,
@@ -518,7 +307,7 @@ class ReactAgent(BaseAgent):
                     ))
                     return
                 elif hook_result.action == HookAction.SKIP:
-                    logger.info("Agent skipped by middleware on_agent_start")
+                    logger.warning("Agent skipped by middleware on_agent_start", extra={"invocation_id": self._current_invocation.id})
                     return
             await self.bus.publish(
@@ -529,18 +318,49 @@ class ReactAgent(BaseAgent):
                 },
             )
-            # Build initial messages (loads history from storage)
-            self._message_history = await self._build_messages(input)
+            # Fetch context from providers
+            logger.info("Fetching agent context", extra={"invocation_id": self._current_invocation.id})
+            self._agent_context = await ctx_helpers.fetch_agent_context(
+                self._ctx,
+                input,
+                self._context_providers,
+                self._tools,
+                self._delegate_tool_class,
+                self._middleware_chain,
+            )
+            # Build initial messages
+            logger.info("Building message history", extra={"invocation_id": self._current_invocation.id})
+            self._message_history = await ctx_helpers.build_messages(
+                input,
+                self._agent_context,
+                self.config.system_prompt,
+            )
             self._current_step = 0
+            logger.info(
+                "Built message history",
+                extra={
+                    "invocation_id": self._current_invocation.id,
+                    "message_count": len(self._message_history),
+                },
+            )
             # Save user message (real-time persistence)
-            await self._save_user_message(input)
+            logger.info("Saving user message", extra={"invocation_id": self._current_invocation.id})
+            await persist_helpers.save_user_message(self, input)
-            # 3. Main loop
+            # Main loop
             finish_reason = None
             while not await self._check_abort():
                 self._current_step += 1
+                logger.info(
+                    "Starting step",
+                    extra={
+                        "invocation_id": self._current_invocation.id,
+                        "step": self._current_step,
+                    },
+                )
                 # Check step limit
                 if self._current_step > self.config.max_steps:
@@ -564,14 +384,30 @@ class ReactAgent(BaseAgent):
                     snapshot_id = await self.snapshot.track()
                 # Execute step
-                finish_reason = await self._execute_step()
+                logger.info(
+                    "Executing LLM request",
+                    extra={
+                        "invocation_id": self._current_invocation.id,
+                        "step": self._current_step,
+                    },
+                )
+                finish_reason = await step_helpers.execute_step(self)
+                logger.info(
+                    "LLM response received",
+                    extra={
+                        "invocation_id": self._current_invocation.id,
+                        "step": self._current_step,
+                        "finish_reason": finish_reason,
+                        "tool_count": len(self._tool_invocations),
+                    },
+                )
                 # Save assistant message (real-time persistence)
-                await self._save_assistant_message()
+                await persist_helpers.save_assistant_message(self)
                 # Save message_history to state and checkpoint
                 if self._state:
-                    self._save_messages_to_state()
+                    persist_helpers.save_messages_to_state(self)
                     await self._state.checkpoint()
                 # Check if we should exit
@@ -580,26 +416,57 @@ class ReactAgent(BaseAgent):
                 # Process tool results and continue
                 if self._tool_invocations:
-                    await self._process_tool_results()
+                    logger.info(
+                        "Processing tool invocations",
+                        extra={
+                            "invocation_id": self._current_invocation.id,
+                            "step": self._current_step,
+                            "tool_count": len(self._tool_invocations),
+                            "tools": ", ".join([inv.tool_name for inv in self._tool_invocations]),
+                        },
+                    )
+                    await tool_helpers.process_tool_results(self)
+                    logger.info(
+                        "Tool results processed",
+                        extra={
+                            "invocation_id": self._current_invocation.id,
+                            "step": self._current_step,
+                        },
+                    )
                     # Save tool messages (real-time persistence)
-                    await self._save_tool_messages()
+                    await persist_helpers.save_tool_messages(self)
                     self._tool_invocations.clear()
                     # Save message_history to state and checkpoint
                     if self._state:
-                        self._save_messages_to_state()
+                        persist_helpers.save_messages_to_state(self)
                         await self._state.checkpoint()
-            # 4. Check if aborted
+            # Check if aborted
             is_aborted = self.is_cancelled
-            # 5. Complete invocation
+            # Complete invocation
             if is_aborted:
                 self._current_invocation.state = InvocationState.ABORTED
+                logger.info(
+                    "Invocation aborted by user",
+                    extra={
+                        "invocation_id": self._current_invocation.id,
+                        "steps": self._current_step,
+                    },
+                )
             else:
                 self._current_invocation.state = InvocationState.COMPLETED
+                logger.info(
+                    "Invocation completed successfully",
+                    extra={
+                        "invocation_id": self._current_invocation.id,
+                        "steps": self._current_step,
+                        "finish_reason": finish_reason,
+                    },
+                )
             self._current_invocation.finished_at = datetime.now()
             # Save to invocation backend
@@ -638,20 +505,19 @@ class ReactAgent(BaseAgent):
             )
             # Clear message_history from State after successful completion
-            # Historical messages are already persisted (truncated) via MessageStore
-            self._clear_messages_from_state()
+            persist_helpers.clear_messages_from_state(self)
             if self._state:
                 await self._state.checkpoint()
         except SuspendSignal as e:
             # HITL/Suspend signal - invocation waits for user input
-            logger.info(
-                "Agent suspended",
+            logger.warning(
+                "Agent suspended (HITL)",
                 extra={
-                    "invocation_id": self._current_invocation.id
-                    if self._current_invocation
-                    else None,
+                    "invocation_id": self._current_invocation.id if self._current_invocation else None,
                     "signal_type": type(e).__name__,
+                    "request_type": getattr(e, "request_type", None),
+                    "request_id": getattr(e, "request_id", None),
                 },
             )
@@ -668,10 +534,9 @@ class ReactAgent(BaseAgent):
             # Save pending_request to execution state
             if self._state:
                 self._state.execution["pending_request"] = e.to_dict()
-                self._save_messages_to_state()
+                persist_helpers.save_messages_to_state(self)
                 await self._state.checkpoint()
-            # Don't raise - just return to exit cleanly
             return
         except Exception as e:
@@ -679,9 +544,7 @@ class ReactAgent(BaseAgent):
                 "ReactAgent run failed",
                 extra={
                     "error": str(e),
-                    "invocation_id": self._current_invocation.id
-                    if self._current_invocation
-                    else None,
+                    "invocation_id": self._current_invocation.id if self._current_invocation else None,
                 },
                 exc_info=True,
             )
@@ -690,8 +553,10 @@ class ReactAgent(BaseAgent):
             if self.middleware:
                 processed_error = await self.middleware.process_error(e, mw_context)
                 if processed_error is None:
-                    # Error suppressed by middleware
-                    logger.info("Error suppressed by middleware")
+                    logger.warning(
+                        "Error suppressed by middleware",
+                        extra={"invocation_id": self._current_invocation.id if self._current_invocation else None},
+                    )
                     return
             if self._current_invocation:
@@ -709,1214 +574,26 @@ class ReactAgent(BaseAgent):
             self._running = False
             self._restored_invocation = None
-    async def pause(self) -> str:
-        """Suspend the active invocation and return its ID.
-        Snapshots the step counter, the message history (role and content of
-        each message), the text buffer and the IDs of tool calls still in the
-        CALL state onto the invocation, stores it through the invocation
-        backend when one is configured, and publishes Events.INVOCATION_PAUSE.
-        Returns:
-            Invocation ID for resuming
-        Raises:
-            RuntimeError: If there is no active invocation.
-        """
-        invocation = self._current_invocation
-        if not invocation:
-            raise RuntimeError("No active invocation to pause")
-        # Flip the paused flag on both the agent and the invocation record.
-        self._paused = True
-        invocation.mark_paused()
-        # Snapshot what is needed to continue later.
-        step = self._current_step
-        history = []
-        for message in self._message_history:
-            history.append({"role": message.role, "content": message.content})
-        invocation.agent_state = {
-            "step": step,
-            "message_history": history,
-            "text_buffer": self._text_buffer,
-        }
-        invocation.step_count = step
-        # Tool calls that were issued but have no result yet.
-        pending_ids = []
-        for tool_inv in self._tool_invocations:
-            if tool_inv.state == ToolInvocationState.CALL:
-                pending_ids.append(tool_inv.tool_call_id)
-        invocation.pending_tool_ids = pending_ids
-        # Persist only when an invocation backend is available.
-        backends = self.ctx.backends
-        if backends and backends.invocation:
-            await backends.invocation.update(invocation.id, invocation.to_dict())
-        # Agent attributes are read again from self after the await above.
-        await self.bus.publish(
-            Events.INVOCATION_PAUSE,
-            {
-                "invocation_id": self._current_invocation.id,
-                "step": self._current_step,
-            },
-        )
-        return self._current_invocation.id
+    # ========== Pause/resume (delegate to pause.py) ==========
-    async def _resume_internal(self, invocation_id: str) -> None:
-        """Reload a paused invocation and continue the step loop, reporting via emit.
-        Args:
-            invocation_id: ID of the stored invocation to continue.
-        Raises:
-            ValueError: If no invocation backend is configured, the invocation
-                is not found, or its state is not PAUSED.
-            Exception: Anything raised inside the step loop is re-raised after
-                the invocation is marked FAILED and an ERROR block is emitted.
-        """
-        # Load invocation
-        if not self.ctx.backends or not self.ctx.backends.invocation:
-            raise ValueError("No invocation backend available")
-        inv_data = await self.ctx.backends.invocation.get(invocation_id)
-        if not inv_data:
-            raise ValueError(f"Invocation not found: {invocation_id}")
-        invocation = Invocation.from_dict(inv_data)
-        if invocation.state != InvocationState.PAUSED:
-            raise ValueError(f"Invocation is not paused: {invocation.state}")
-        # Restore state
-        self._current_invocation = invocation
-        self._paused = False
-        # NOTE(review): _running is set here, before the try/finally below, so a
-        # failure in the publish call would leave it True - confirm intended.
-        self._running = True
-        agent_state = invocation.agent_state or {}
-        self._current_step = agent_state.get("step", 0)
-        self._text_buffer = agent_state.get("text_buffer", "")
-        # Restore message history (only role and content are read back)
-        self._message_history = [
-            LLMMessage(role=m["role"], content=m["content"])
-            for m in agent_state.get("message_history", [])
-        ]
-        # Mark as running (in memory; no backend update is issued in this method)
-        invocation.state = InvocationState.RUNNING
-        await self.bus.publish(
-            Events.INVOCATION_RESUME,
-            {
-                "invocation_id": invocation_id,
-                "step": self._current_step,
-            },
-        )
-        # Continue execution loop
-        try:
-            finish_reason = None
-            # Loop until aborted, paused again, finished, or out of steps.
-            while not await self._check_abort() and not self._paused:
-                self._current_step += 1
-                if self._current_step > self.config.max_steps:
-                    await self.ctx.emit(BlockEvent(
-                        kind=BlockKind.ERROR,
-                        op=BlockOp.APPLY,
-                        data={"message": f"Max steps ({self.config.max_steps}) exceeded"},
-                    ))
-                    break
-                finish_reason = await self._execute_step()
-                # Save assistant message (real-time persistence)
-                await self._save_assistant_message()
-                # Done when the model ended its turn without requesting tools.
-                if finish_reason == "end_turn" and not self._tool_invocations:
-                    break
-                if self._tool_invocations:
-                    await self._process_tool_results()
-                    # Save tool messages (real-time persistence)
-                    await self._save_tool_messages()
-                    self._tool_invocations.clear()
-            # NOTE(review): every non-paused exit lands here, including the
-            # max-steps break and an abort, so those are marked COMPLETED too.
-            if not self._paused:
-                self._current_invocation.state = InvocationState.COMPLETED
-                self._current_invocation.finished_at = datetime.now()
-        except Exception as e:
-            # Record the failure and surface it as an ERROR block, then propagate.
-            self._current_invocation.state = InvocationState.FAILED
-            await self.ctx.emit(BlockEvent(
-                kind=BlockKind.ERROR,
-                op=BlockOp.APPLY,
-                data={"message": str(e)},
-            ))
-            raise
-        finally:
-            self._running = False
+    async def pause(self) -> str:
+        """Pause execution by delegating to pause_helpers.pause_agent.
+        Returns:
+            The value produced by pause_helpers.pause_agent(self).
+        """
+        invocation_id = await pause_helpers.pause_agent(self)
+        return invocation_id
     async def resume(self, invocation_id: str) -> AsyncIterator[BlockEvent]:
-        """Resume paused execution.
-        Runs _resume_internal as a background task and yields the BlockEvents
-        that arrive on a queue installed in _emit_queue_var for the duration
-        of the call.
-        Args:
-            invocation_id: ID from pause()
-        Yields:
-            BlockEvent streaming events
-        """
-        from ..core.context import _emit_queue_var
-        queue: asyncio.Queue[BlockEvent] = asyncio.Queue()
-        # Install the queue in the context variable; it is reset in the finally below.
-        token = _emit_queue_var.set(queue)
-        try:
-            exec_task = asyncio.create_task(self._resume_internal(invocation_id))
-            get_task: asyncio.Task | None = None
-            # Event-driven processing - no timeout delays
-            while True:
-                # First drain any pending items from queue (non-blocking)
-                while True:
-                    try:
-                        block = queue.get_nowait()
-                        yield block
-                    except asyncio.QueueEmpty:
-                        break
-                # Exit if task is done and queue is empty
-                if exec_task.done() and queue.empty():
-                    break
-                # Create get_task if needed
-                if get_task is None or get_task.done():
-                    get_task = asyncio.create_task(queue.get())
-                # Wait for EITHER: queue item OR exec_task completion
-                done, _ = await asyncio.wait(
-                    {get_task, exec_task},
-                    return_when=asyncio.FIRST_COMPLETED,
-                )
-                if get_task in done:
-                    try:
-                        block = get_task.result()
-                        yield block
-                        # Cleared so the next iteration creates a fresh queue.get() task.
-                        get_task = None
-                    except asyncio.CancelledError:
-                        pass
-            # Cancel pending get_task if any
-            if get_task and not get_task.done():
-                get_task.cancel()
-                try:
-                    await get_task
-                except asyncio.CancelledError:
-                    pass
-            # Final drain after task completion
-            while not queue.empty():
-                try:
-                    block = queue.get_nowait()
-                    yield block
-                except asyncio.QueueEmpty:
-                    break
-            # Awaiting the finished task re-raises any exception it ended with.
-            await exec_task
-        finally:
-            # NOTE(review): only the context variable is restored here; exec_task
-            # and get_task are not cancelled if the consumer stops iterating
-            # early - confirm whether that is intended.
-            _emit_queue_var.reset(token)
-    async def _fetch_agent_context(self, input: PromptInput) -> AgentContext:
-        """Collect provider contexts and combine them with the directly supplied tools.
-        Steps:
-        1. Store ``input`` on the context so providers can read it
-        2. Fetch from every provider (a failing provider is logged and skipped) and merge
-        3. Start from the direct tools, then append provider tools with unseen names
-        4. If the merge produced subagents and no tool is named "delegate", add one
-        """
-        from ..tool.builtin import DelegateTool
-        from ..backends.subagent import ListSubAgentBackend
-        # Providers read the current input from the context
-        self._ctx.input = input
-        provider_contexts: list[AgentContext] = []
-        for provider in self._context_providers:
-            try:
-                provider_contexts.append(await provider.fetch(self._ctx))
-            except Exception as exc:
-                logger.warning(f"Provider {provider.name} fetch failed: {exc}")
-        merged = AgentContext.merge(provider_contexts)
-        # Direct tools come first; a provider tool is added only under a new name
-        combined_tools = list(self._tools)
-        known_names = {tool.name for tool in combined_tools}
-        for candidate in merged.tools:
-            if candidate.name in known_names:
-                continue
-            known_names.add(candidate.name)
-            combined_tools.append(candidate)
-        # Subagents are exposed through a delegate tool unless one already exists
-        if merged.subagents and all(tool.name != "delegate" for tool in combined_tools):
-            subagent_backend = ListSubAgentBackend(merged.subagents)
-            delegate_cls = self._delegate_tool_class or DelegateTool
-            combined_tools.append(
-                delegate_cls(subagent_backend, middleware=self._middleware_chain)
-            )
-        return AgentContext(
-            system_content=merged.system_content,
-            user_content=merged.user_content,
-            tools=combined_tools,
-            messages=merged.messages,
-            subagents=merged.subagents,
-            skills=merged.skills,
-        )
-    async def _build_messages(self, input: PromptInput) -> list[LLMMessage]:
-        """Assemble the LLM message list for a new prompt.
-        Refreshes ``self._agent_context`` via ``_fetch_agent_context`` and then
-        produces, in order: the system message, the messages carried by the
-        agent context, and the current user message.
-        """
-        self._agent_context = await self._fetch_agent_context(input)
-        agent_ctx = self._agent_context
-        # System message: configured prompt (or the generated default) plus context additions
-        system_text = self.config.system_prompt or self._default_system_prompt()
-        if agent_ctx.system_content:
-            system_text = system_text + "\n\n" + agent_ctx.system_content
-        messages = [LLMMessage(role="system", content=system_text)]
-        # Historical messages from the agent context
-        messages.extend(
-            LLMMessage(role=entry.get("role", "user"), content=entry.get("content", ""))
-            for entry in agent_ctx.messages
-        )
-        # Current user turn, prefixed with context-supplied user content when present
-        user_content = input.text
-        if agent_ctx.user_content:
-            user_content = agent_ctx.user_content + "\n\n" + user_content
-        if input.attachments:
-            # Multimodal form: one text part followed by the attachments as given
-            user_content = [{"type": "text", "text": user_content}, *input.attachments]
-        messages.append(LLMMessage(role="user", content=user_content))
-        return messages
-    def _default_system_prompt(self) -> str:
-        """Build the fallback system prompt, listing each tool as "- name: description"."""
-        # Tools come from the agent context; none are listed when it is not set
-        available = self._agent_context.tools if self._agent_context else []
-        infos = [tool.get_info() for tool in available]
-        bullet_lines = [f"- {info.name}: {info.description}" for info in infos]
-        if bullet_lines:
-            tools_desc = "\n".join(bullet_lines)
-        else:
-            tools_desc = "No tools available."
-        return f"""You are a helpful AI assistant with access to tools.
-Available tools:
-{tools_desc}
-When you need to use a tool, make a tool call. After receiving the tool result, continue reasoning or provide your final response.
-Think step by step and use tools when necessary to complete the user's request."""
-    def _get_effective_tool_mode(self) -> ToolInjectionMode:
-        """Resolve the tool injection mode to use for the next LLM call.
-        Returns:
-            PROMPT when the config requests it or the model reports no tool
-            support; FUNCTION_CALL otherwise.
-        """
-        # An explicit PROMPT setting always wins
-        if self.config.tool_mode == ToolInjectionMode.PROMPT:
-            return ToolInjectionMode.PROMPT
-        # Otherwise the model's reported capabilities decide
-        if self.llm.capabilities.supports_tools:
-            return ToolInjectionMode.FUNCTION_CALL
-        logger.info(
-            f"Model {self.llm.model} does not support function calling, "
-            "auto-switching to PROMPT mode for tools"
-        )
-        return ToolInjectionMode.PROMPT
-    def _build_tool_prompt(self, tools: list) -> str:
-        """Render the tool catalogue injected into the system message in PROMPT mode.
-        Args:
-            tools: Tool objects exposing ``get_info()``
-        Returns:
-            The prompt text, or an empty string when ``tools`` is empty
-        """
-        if not tools:
-            return ""
-        sections = []
-        for tool in tools:
-            info = tool.get_info()
-            spec = info.parameters
-            param_block = ""
-            if spec and "properties" in spec:
-                required_names = spec.get("required", [])
-                # One indented bullet per parameter: name, type, required/optional, description
-                param_lines = [
-                    f"    - {param_name} ({param_schema.get('type', 'any')}, "
-                    f"{'required' if param_name in required_names else 'optional'}): "
-                    f"{param_schema.get('description', '')}"
-                    for param_name, param_schema in spec.get("properties", {}).items()
-                ]
-                if param_lines:
-                    param_block = "\n" + "\n".join(param_lines)
-            sections.append(f"### {info.name}\n{info.description}{param_block}")
-        rendered_tools = "\n".join(sections)
-        return f"""## Available Tools
-You have access to the following tools. To use a tool, output a JSON block in this exact format:
-```tool_call
-{{
-  "tool": "tool_name",
-  "arguments": {{
-    "param1": "value1",
-    "param2": "value2"
-  }}
-}}
-```
-IMPORTANT:
-- Use the exact format above with ```tool_call code block
-- You can make multiple tool calls in one response
-- Wait for tool results before continuing
-{rendered_tools}
-"""
-    def _parse_tool_calls_from_text(self, text: str) -> list[dict]:
-        """Parse tool calls from LLM text output (for PROMPT mode).
-        Looks for ```tool_call blocks in the format:
-        ```tool_call
-        {"tool": "name", "arguments": {...}}
-        ```
-        A block whose payload is not valid JSON is logged and skipped. A block
-        whose payload is valid JSON but is not an object with a "tool" key
-        (for example a bare number, string, list or null) is skipped.
-        Args:
-            text: LLM output text
-        Returns:
-            List of parsed tool calls: [{"name": str, "arguments": dict}, ...]
-            ("arguments" is passed through as parsed and defaults to {})
-        """
-        import re
-        tool_calls = []
-        # Match ```tool_call ... ``` blocks
-        pattern = r"```tool_call\s*\n?(.+?)\n?```"
-        for payload in re.findall(pattern, text, re.DOTALL):
-            try:
-                data = json.loads(payload.strip())
-            except json.JSONDecodeError as e:
-                logger.warning(f"Failed to parse tool call JSON: {e}")
-                continue
-            # json.loads can return any JSON value, not just an object. The key
-            # test and lookup below are only valid on a dict, so anything else
-            # is skipped rather than allowed to raise TypeError.
-            if not isinstance(data, dict) or "tool" not in data:
-                continue
-            tool_calls.append({
-                "name": data["tool"],
-                "arguments": data.get("arguments", {}),
-            })
-        return tool_calls
-    async def _execute_step(self) -> str | None:
-        """Execute a single LLM step with middleware hooks.
-        Returns:
-            finish_reason from LLM
-        """
-        # Get tools from AgentContext (from providers)
-        all_tools = self._agent_context.tools if self._agent_context else []
-        # Determine effective tool mode (auto-detect based on capabilities)
-        effective_tool_mode = self._get_effective_tool_mode()
-        # Get tool definitions (only for FUNCTION_CALL mode)
-        tool_defs = None
-        if effective_tool_mode == ToolInjectionMode.FUNCTION_CALL and all_tools:
-            tool_defs = [
-                ToolDefinition(
-                    name=t.name,
-                    description=t.description,
-                    input_schema=t.parameters,
-                )
-                for t in all_tools
-            ]
-        # For PROMPT mode, inject tools into system message
-        if effective_tool_mode == ToolInjectionMode.PROMPT and all_tools:
-            tool_prompt = self._build_tool_prompt(all_tools)
-            # Inject into first system message
-            if self._message_history and self._message_history[0].role == "system":
-                original_content = self._message_history[0].content
-                self._message_history[0] = LLMMessage(
-                    role="system",
-                    content=f"{original_content}\n\n{tool_prompt}",
-                )
-        # Reset buffers
-        self._text_buffer = ""
-        self._thinking_buffer = ""  # Buffer for non-streaming thinking
-        self._tool_invocations = []
-        current_tool_invocation: ToolInvocation | None = None
-        # Reset block IDs for this step (each step gets fresh block IDs)
-        self._current_text_block_id = None
-        self._current_thinking_block_id = None
-        # Reset tool call tracking
-        self._call_id_to_tool = {}
-        self._tool_call_blocks = {}
-        # Build middleware context for this step
-        from ..core.context import emit as global_emit
-        mw_context = {
-            "session_id": self.session.id,
-            "invocation_id": self._current_invocation.id if self._current_invocation else "",
-            "step": self._current_step,
-            "agent_id": self.name,
-            "emit": global_emit,  # For middleware to emit BlockEvent/ActionEvent
-            "backends": self.ctx.backends,
-            "tool_mode": effective_tool_mode.value,  # Add tool mode to context
-        }
-        # Build LLM call kwargs
-        # Note: temperature, max_tokens, timeout, retries are configured on LLMProvider
-        llm_kwargs: dict[str, Any] = {
-            "messages": self._message_history,
-            "tools": tool_defs,  # None for PROMPT mode
-        }
-        # Get model capabilities
-        caps = self.llm.capabilities
-        # Add thinking configuration (use runtime override if set)
-        # Only if model supports thinking
-        enable_thinking = self._get_enable_thinking()
-        reasoning_effort = self._get_reasoning_effort()
-        if enable_thinking:
-            if caps.supports_thinking:
-                llm_kwargs["enable_thinking"] = True
-                if reasoning_effort:
-                    llm_kwargs["reasoning_effort"] = reasoning_effort
-            else:
-                logger.debug(
-                    f"Model {self.llm.model} does not support thinking, "
-                    "enable_thinking will be ignored"
-                )
-        # === Middleware: on_request ===
-        if self.middleware:
-            llm_kwargs = await self.middleware.process_request(llm_kwargs, mw_context)
-            if llm_kwargs is None:
-                logger.info("LLM request cancelled by middleware")
-                return None
-        # Debug: log message history before LLM call
-        logger.debug(
-            f"LLM call - Step {self._current_step}, messages: {len(self._message_history)}, "
-            f"tools: {len(tool_defs) if tool_defs else 0}"
-        )
-        # Detailed message log (for debugging model issues like repeated calls)
-        for i, msg in enumerate(self._message_history):
-            content_preview = str(msg.content)[:300] if msg.content else "<empty>"
-            tool_call_id = getattr(msg, 'tool_call_id', None)
-            logger.debug(
-                f"  msg[{i}] role={msg.role}"
-                f"{f', tool_call_id={tool_call_id}' if tool_call_id else ''}"
-                f", content={content_preview}"
-            )
-        # Call LLM
-        await self.bus.publish(
-            Events.LLM_START,
-            {
-                "provider": self.llm.provider,
-                "model": self.llm.model,
-                "step": self._current_step,
-                "enable_thinking": enable_thinking,
-            },
-        )
-        finish_reason = None
-        llm_response_data: dict[str, Any] = {}  # Collect response for middleware
-        # Reset middleware stream state
-        if self.middleware:
-            self.middleware.reset_stream_state()
-        async for event in self.llm.complete(**llm_kwargs):
-            if await self._check_abort():
-                break
-            if event.type == "content":
-                # Text content
-                if event.delta:
-                    # === Middleware: on_model_stream ===
-                    stream_chunk = {"delta": event.delta, "type": "content"}
-                    if self.middleware:
-                        stream_chunk = await self.middleware.process_stream_chunk(
-                            stream_chunk, mw_context
-                        )
-                        if stream_chunk is None:
-                            continue  # Skip this chunk
-                    delta = stream_chunk.get("delta", event.delta)
-                    self._text_buffer += delta
-                    # Reuse or create block_id for text streaming
-                    if self._current_text_block_id is None:
-                        self._current_text_block_id = generate_id("blk")
-                    await self.ctx.emit(BlockEvent(
-                        block_id=self._current_text_block_id,
-                        kind=BlockKind.TEXT,
-                        op=BlockOp.DELTA,
-                        data={"content": delta},
-                    ))
-                    await self.bus.publish(
-                        Events.LLM_STREAM,
-                        {
-                            "delta": delta,
-                            "step": self._current_step,
-                        },
-                    )
-            elif event.type == "thinking":
-                # Thinking content - only emit if thinking is enabled
-                stream_thinking = self._get_stream_thinking()
-                if event.delta and enable_thinking:
-                    if stream_thinking:
-                        # Reuse or create block_id for thinking streaming
-                        if self._current_thinking_block_id is None:
-                            self._current_thinking_block_id = generate_id("blk")
-                        # Stream thinking in real-time
-                        await self.ctx.emit(BlockEvent(
-                            block_id=self._current_thinking_block_id,
-                            kind=BlockKind.THINKING,
-                            op=BlockOp.DELTA,
-                            data={"content": event.delta},
-                        ))
-                    else:
-                        # Buffer thinking for batch output
-                        self._thinking_buffer += event.delta
-            elif event.type == "tool_call_start":
-                # Tool call started (name known, arguments pending)
-                if event.tool_call:
-                    tc = event.tool_call
-                    self._call_id_to_tool[tc.id] = tc.name
-                    # Always emit start notification (privacy-safe, no arguments)
-                    block_id = generate_id("blk")
-                    self._tool_call_blocks[tc.id] = block_id
-                    await self.ctx.emit(BlockEvent(
-                        block_id=block_id,
-                        kind=BlockKind.TOOL_USE,
-                        op=BlockOp.APPLY,
-                        data={
-                            "name": tc.name,
-                            "call_id": tc.id,
-                            "status": "streaming",  # Indicate arguments are streaming
-                        },
-                    ))
-            elif event.type == "tool_call_delta":
-                # Tool arguments delta (streaming)
-                if event.tool_call_delta:
-                    call_id = event.tool_call_delta.get("call_id")
-                    arguments_delta = event.tool_call_delta.get("arguments_delta")
-                    if call_id and arguments_delta:
-                        tool_name = self._call_id_to_tool.get(call_id)
-                        if tool_name:
-                            tool = self._get_tool(tool_name)
-                            # Check if tool allows streaming arguments
-                            if tool and tool.config.stream_arguments:
-                                block_id = self._tool_call_blocks.get(call_id)
-                                if block_id:
-                                    await self.ctx.emit(BlockEvent(
-                                        block_id=block_id,
-                                        kind=BlockKind.TOOL_USE,
-                                        op=BlockOp.DELTA,
-                                        data={
-                                            "call_id": call_id,
-                                            "arguments_delta": arguments_delta,
-                                        },
-                                    ))
-            elif event.type == "tool_call_progress":
-                # Tool arguments progress (bytes received)
-                if event.tool_call_progress:
-                    call_id = event.tool_call_progress.get("call_id")
-                    bytes_received = event.tool_call_progress.get("bytes_received")
-                    if call_id and bytes_received is not None:
-                        block_id = self._tool_call_blocks.get(call_id)
-                        if block_id:
-                            # Always emit progress (privacy-safe, no content)
-                            await self.ctx.emit(BlockEvent(
-                                block_id=block_id,
-                                kind=BlockKind.TOOL_USE,
-                                op=BlockOp.PATCH,
-                                data={
-                                    "call_id": call_id,
-                                    "bytes_received": bytes_received,
-                                    "status": "receiving",
-                                },
-                            ))
-            elif event.type == "tool_call":
-                # Tool call complete (arguments fully received)
-                if event.tool_call:
-                    tc = event.tool_call
-                    invocation = ToolInvocation(
-                        tool_call_id=tc.id,
-                        tool_name=tc.name,
-                        args_raw=tc.arguments,
-                        state=ToolInvocationState.CALL,
-                    )
-                    # Parse arguments
-                    try:
-                        invocation.args = json.loads(tc.arguments)
-                    except json.JSONDecodeError:
-                        invocation.args = {}
-                    self._tool_invocations.append(invocation)
-                    # Strict mode: require tool_call_start to be received first
-                    # TODO: Uncomment below for compatibility with providers that don't send tool_call_start
-                    # block_id = self._tool_call_blocks.get(tc.id)
-                    # if block_id is None:
-                    #     # No streaming start event, create block now
-                    #     block_id = generate_id("blk")
-                    #     self._tool_call_blocks[tc.id] = block_id
-                    #     self._call_id_to_tool[tc.id] = tc.name
-                    #
-                    #     # Emit APPLY with full data
-                    #     await self.ctx.emit(BlockEvent(
-                    #         block_id=block_id,
-                    #         kind=BlockKind.TOOL_USE,
-                    #         op=BlockOp.APPLY,
-                    #         data={
-                    #             "name": tc.name,
-                    #             "call_id": tc.id,
-                    #             "arguments": invocation.args,
-                    #             "status": "ready",
-                    #         },
-                    #     ))
-                    # else:
-                    #     # Update existing block with complete arguments
-                    #     await self.ctx.emit(BlockEvent(
-                    #         block_id=block_id,
-                    #         kind=BlockKind.TOOL_USE,
-                    #         op=BlockOp.PATCH,
-                    #         data={
-                    #             "call_id": tc.id,
-                    #             "arguments": invocation.args,
-                    #             "status": "ready",
-                    #         },
-                    #     ))
-                    # Strict mode: tool_call_start must have been received
-                    block_id = self._tool_call_blocks[tc.id]  # Will raise KeyError if not found
-                    await self.ctx.emit(BlockEvent(
-                        block_id=block_id,
-                        kind=BlockKind.TOOL_USE,
-                        op=BlockOp.PATCH,
-                        data={
-                            "call_id": tc.id,
-                            "arguments": invocation.args,
-                            "status": "ready",
-                        },
-                    ))
-                    await self.bus.publish(
-                        Events.TOOL_START,
-                        {
-                            "call_id": tc.id,
-                            "tool": tc.name,
-                            "arguments": invocation.args,
-                        },
-                    )
-            elif event.type == "completed":
-                finish_reason = event.finish_reason
-            elif event.type == "usage":
-                if event.usage:
-                    await self.bus.publish(
-                        Events.USAGE_RECORDED,
-                        {
-                            "provider": self.llm.provider,
-                            "model": self.llm.model,
-                            "input_tokens": event.usage.input_tokens,
-                            "output_tokens": event.usage.output_tokens,
-                            "cache_read_tokens": event.usage.cache_read_tokens,
-                            "cache_write_tokens": event.usage.cache_write_tokens,
-                            "reasoning_tokens": event.usage.reasoning_tokens,
-                        },
-                    )
-            elif event.type == "error":
-                await self.ctx.emit(BlockEvent(
-                    kind=BlockKind.ERROR,
-                    op=BlockOp.APPLY,
-                    data={"message": event.error or "Unknown LLM error"},
-                ))
-        # If thinking was buffered, emit it now
-        if self._thinking_buffer and not self.config.stream_thinking:
-            await self.ctx.emit(BlockEvent(
-                kind=BlockKind.THINKING,
-                op=BlockOp.APPLY,
-                data={"content": self._thinking_buffer},
-            ))
-        # PROMPT mode: parse tool calls from text output
-        if effective_tool_mode == ToolInjectionMode.PROMPT and self._text_buffer:
-            parsed_calls = self._parse_tool_calls_from_text(self._text_buffer)
-            for i, call in enumerate(parsed_calls):
-                call_id = generate_id("call")
-                invocation = ToolInvocation(
-                    tool_call_id=call_id,
-                    tool_name=call["name"],
-                    args_raw=json.dumps(call["arguments"]),
-                    args=call["arguments"],
-                    state=ToolInvocationState.CALL,
-                )
-                self._tool_invocations.append(invocation)
-                # Create block for tool call (no streaming events in PROMPT mode)
-                block_id = generate_id("blk")
-                self._tool_call_blocks[call_id] = block_id
-                self._call_id_to_tool[call_id] = call["name"]
-                await self.ctx.emit(BlockEvent(
-                    block_id=block_id,
-                    kind=BlockKind.TOOL_USE,
-                    op=BlockOp.APPLY,
-                    data={
-                        "name": call["name"],
-                        "call_id": call_id,
-                        "arguments": call["arguments"],
-                        "status": "ready",
-                        "source": "prompt",  # Indicate parsed from text
-                    },
-                ))
-                await self.bus.publish(
-                    Events.TOOL_START,
-                    {
-                        "call_id": call_id,
-                        "tool": call["name"],
-                        "arguments": call["arguments"],
-                        "source": "prompt",
-                    },
-                )
-            if parsed_calls:
-                logger.debug(f"PROMPT mode: parsed {len(parsed_calls)} tool calls from text")
-        # === Middleware: on_response ===
-        llm_response_data = {
-            "text": self._text_buffer,
-            "thinking": self._thinking_buffer,
-            "tool_calls": len(self._tool_invocations),
-            "finish_reason": finish_reason,
-        }
-        if self.middleware:
-            llm_response_data = await self.middleware.process_response(
-                llm_response_data, mw_context
-            )
-        await self.bus.publish(
-            Events.LLM_END,
-            {
-                "step": self._current_step,
-                "finish_reason": finish_reason,
-                "text_length": len(self._text_buffer),
-                "thinking_length": len(self._thinking_buffer),
-                "tool_calls": len(self._tool_invocations),
-            },
-        )
-        # Add assistant message to history
-        if self._text_buffer or self._tool_invocations:
-            assistant_content: Any = self._text_buffer
-            if self._tool_invocations:
-                # Build content with tool calls
-                content_parts = []
-                if self._text_buffer:
-                    content_parts.append({"type": "text", "text": self._text_buffer})
-                for inv in self._tool_invocations:
-                    content_parts.append(
-                        {
-                            "type": "tool_use",
-                            "id": inv.tool_call_id,
-                            "name": inv.tool_name,
-                            "input": inv.args,
-                        }
-                    )
-                assistant_content = content_parts
-            self._message_history.append(
-                LLMMessage(
-                    role="assistant",
-                    content=assistant_content,
-                )
-            )
-        return finish_reason
-    async def _process_tool_results(self) -> None:
-        """Execute tool calls and add results to history.
-        Executes tools in parallel or sequentially based on config.
-        """
-        if not self._tool_invocations:
-            return
-        # Execute tools based on configuration
-        if self.config.parallel_tool_execution:
-            # Parallel execution using asyncio.gather with create_task
-            # create_task ensures each task gets its own ContextVar copy
-            tasks = [asyncio.create_task(self._execute_tool(inv)) for inv in self._tool_invocations]
-            results = await asyncio.gather(*tasks, return_exceptions=True)
-        else:
-            # Sequential execution
-            results = []
-            for inv in self._tool_invocations:
-                try:
-                    result = await self._execute_tool(inv)
-                    results.append(result)
-                except Exception as e:
-                    results.append(e)
-        # Check for SuspendSignal first - must propagate
-        for result in results:
-            if isinstance(result, SuspendSignal):
-                raise result
-        # Process results
-        tool_results = []
-        for invocation, result in zip(self._tool_invocations, results):
-            # Handle exceptions from gather
-            if isinstance(result, Exception):
-                error_msg = f"Tool execution error: {str(result)}"
-                invocation.mark_result(error_msg, is_error=True)
-                result = ToolResult.error(error_msg)
-            # Get parent block_id from tool_call mapping
-            parent_block_id = self._tool_call_blocks.get(invocation.tool_call_id)
-            await self.ctx.emit(BlockEvent(
-                kind=BlockKind.TOOL_RESULT,
-                op=BlockOp.APPLY,
-                parent_id=parent_block_id,
-                data={
-                    "call_id": invocation.tool_call_id,
-                    "content": result.output,
-                    "is_error": invocation.is_error,
-                },
-            ))
+        """Resume paused execution."""
+        async for block in pause_helpers.resume_agent(self, invocation_id):
+            yield block
-            await self.bus.publish(
-                Events.TOOL_END,
-                {
-                    "call_id": invocation.tool_call_id,
-                    "tool": invocation.tool_name,
-                    "result": result.output[:500],  # Truncate for event
-                    "is_error": invocation.is_error,
-                    "duration_ms": invocation.duration_ms,
-                },
-            )
-            tool_results.append(
-                {
-                    "type": "tool_result",
-                    "tool_use_id": invocation.tool_call_id,
-                    "content": result.output,
-                    "is_error": invocation.is_error,
-                }
-            )
-        # Add tool results as tool messages (OpenAI format)
-        for tr in tool_results:
-            print(f"[DEBUG _process_tool_results] Adding tool_result to history: {tr}")
-            self._message_history.append(
-                LLMMessage(
-                    role="tool",
-                    content=tr["content"],
-                    tool_call_id=tr["tool_use_id"],
-                )
-            )
-    def _save_messages_to_state(self) -> None:
-        """Save execution state for recovery.
-        This saves to state.execution namespace:
-        - step: current step number
-        - message_ids: references to raw messages (if using RawMessageMiddleware)
-        - For legacy/fallback: message_history as serialized data
-        Note: With RawMessageMiddleware, message_ids are automatically populated
-        by the middleware. This method saves additional execution state.
-        """
-        if not self._state:
-            return
-        # Save step to execution namespace
-        self._state.execution["step"] = self._current_step
-        # Save invocation_id for recovery context
-        if self._current_invocation:
-            self._state.execution["invocation_id"] = self._current_invocation.id
-        # Fallback: if message_ids not populated by middleware, save full history
-        # This ensures backward compatibility when RawMessageMiddleware is not used
-        if "message_ids" not in self._state.execution:
-            messages_data = []
-            for msg in self._message_history:
-                msg_dict = {"role": msg.role, "content": msg.content}
-                if hasattr(msg, "tool_call_id") and msg.tool_call_id:
-                    msg_dict["tool_call_id"] = msg.tool_call_id
-                messages_data.append(msg_dict)
-            self._state.execution["message_history"] = messages_data
-    def _clear_messages_from_state(self) -> None:
-        """Clear execution state after invocation completes.
-        Called when invocation completes normally. Historical messages
-        are already persisted (truncated) via MessageStore.
-        """
-        if not self._state:
-            return
-        # Clear execution namespace
-        self._state.execution.clear()
-    async def _trigger_message_save(self, message: dict) -> dict | None:
-        """Trigger on_message_save hook via middleware.
-        Message persistence is handled by MessageBackendMiddleware.
-        Agent only triggers the hook, doesn't save directly.
-        Args:
-            message: Message dict with role, content, etc.
-        Returns:
-            Modified message or None if blocked
-        """
-        # Check if message saving is disabled (e.g., for sub-agents with record_messages=False)
-        if getattr(self, '_disable_message_save', False):
-            return message
-        if not self.middleware:
-            return message
-        namespace = getattr(self, '_message_namespace', None)
-        mw_context = {
-            "session_id": self.session.id,
-            "agent_id": self.name,
-            "namespace": namespace,
-        }
-        return await self.middleware.process_message_save(message, mw_context)
-    async def _save_user_message(self, input: PromptInput) -> None:
-        """Trigger save for user message."""
-        # Build user content
-        content: str | list[dict] = input.text
-        if self._agent_context and self._agent_context.user_content:
-            content = self._agent_context.user_content + "\n\n" + input.text
-        if input.attachments:
-            content_parts: list[dict] = [{"type": "text", "text": content}]
-            for attachment in input.attachments:
-                content_parts.append(attachment)
-            content = content_parts
-        # Build message and trigger hook
-        message = {
-            "role": "user",
-            "content": content,
-            "invocation_id": self._current_invocation.id if self._current_invocation else "",
-        }
-        await self._trigger_message_save(message)
-    async def _save_assistant_message(self) -> None:
-        """Trigger save for assistant message."""
-        if not self._text_buffer and not self._tool_invocations:
-            return
-        # Build assistant content
-        content: str | list[dict] = self._text_buffer
-        if self._tool_invocations:
-            content_parts: list[dict] = []
-            if self._text_buffer:
-                content_parts.append({"type": "text", "text": self._text_buffer})
-            for inv in self._tool_invocations:
-                content_parts.append({
-                    "type": "tool_use",
-                    "id": inv.tool_call_id,
-                    "name": inv.tool_name,
-                    "input": inv.args,
-                })
-            content = content_parts
-        # Build message and trigger hook
-        message = {
-            "role": "assistant",
-            "content": content,
-            "invocation_id": self._current_invocation.id if self._current_invocation else "",
-        }
-        await self._trigger_message_save(message)
-    async def _save_tool_messages(self) -> None:
-        """Trigger save for tool result messages."""
-        for inv in self._tool_invocations:
-            if inv.result is not None:
-                # Build tool result message
-                content: list[dict] = [{
-                    "type": "tool_result",
-                    "tool_use_id": inv.tool_call_id,
-                    "content": inv.result,
-                    "is_error": inv.is_error,
-                }]
-                message = {
-                    "role": "tool",
-                    "content": content,
-                    "tool_call_id": inv.tool_call_id,
-                    "invocation_id": self._current_invocation.id if self._current_invocation else "",
-                }
-                await self._trigger_message_save(message)
+    # ========== Helper methods used by other modules ==========
     def _get_tool(self, tool_name: str) -> "BaseTool | None":
         """Get tool by name from agent context."""
-        if self._agent_context:
-            for tool in self._agent_context.tools:
-                if tool.name == tool_name:
-                    return tool
-        return None
+        return tool_helpers.get_tool(self, tool_name)
-    async def _execute_tool(self, invocation: ToolInvocation) -> ToolResult:
-        """Execute a single tool call."""
-        invocation.mark_call_complete()
-        # Build middleware context
-        mw_context = {
-            "session_id": self.session.id,
-            "invocation_id": self._current_invocation.id if self._current_invocation else "",
-            "tool_call_id": invocation.tool_call_id,
-            "agent_id": self.name,
-        }
-        try:
-            # Get tool from agent context
-            tool = self._get_tool(invocation.tool_name)
-            if tool is None:
-                error_msg = f"Unknown tool: {invocation.tool_name}"
-                invocation.mark_result(error_msg, is_error=True)
-                return ToolResult.error(error_msg)
-            # === Middleware: on_tool_call ===
-            if self.middleware:
-                hook_result = await self.middleware.process_tool_call(
-                    tool, invocation.args, mw_context
-                )
-                if hook_result.action == HookAction.SKIP:
-                    logger.info(f"Tool {invocation.tool_name} skipped by middleware")
-                    return ToolResult(
-                        output=hook_result.message or "Skipped by middleware",
-                        is_error=False,
-                    )
-                elif hook_result.action == HookAction.RETRY and hook_result.modified_data:
-                    invocation.args = hook_result.modified_data
-            # Create ToolContext
-            tool_ctx = ToolContext(
-                session_id=self.session.id,
-                invocation_id=self._current_invocation.id if self._current_invocation else "",
-                block_id="",
-                call_id=invocation.tool_call_id,
-                agent=self.config.name,
-                abort_signal=self._abort,
-                update_metadata=self._noop_update_metadata,
-                middleware=self.middleware,
-            )
-            # Execute tool (with optional timeout from tool.config)
-            timeout = tool.config.timeout
-            if timeout is not None:
-                result = await asyncio.wait_for(
-                    tool.execute(invocation.args, tool_ctx),
-                    timeout=timeout,
-                )
-            else:
-                # No timeout - tool runs until completion
-                result = await tool.execute(invocation.args, tool_ctx)
-            # === Middleware: on_tool_end ===
-            if self.middleware:
-                hook_result = await self.middleware.process_tool_end(tool, result, mw_context)
-                if hook_result.action == HookAction.RETRY:
-                    logger.info(f"Tool {invocation.tool_name} retry requested by middleware")
-            invocation.mark_result(result.output, is_error=result.is_error)
-            return result
-        except asyncio.TimeoutError:
-            timeout = tool.config.timeout if tool else None
-            error_msg = f"Tool {invocation.tool_name} timed out after {timeout}s"
-            invocation.mark_result(error_msg, is_error=True)
-            return ToolResult.error(error_msg)
-        except SuspendSignal:
-            # HITL/Suspend signal must propagate up
-            raise
-        except Exception as e:
-            error_msg = f"Tool execution error: {str(e)}"
-            invocation.mark_result(error_msg, is_error=True)
-            return ToolResult.error(error_msg)
+    async def _save_tool_messages(self) -> None:
+        """Trigger save for tool result messages."""
+        await persist_helpers.save_tool_messages(self)
     async def _noop_update_metadata(self, metadata: dict[str, Any]) -> None:
         """No-op metadata updater."""

aury-agent 0.0.4__py3-none-any.whl → 0.0.5__py3-none-any.whl

aury-agent 0.0.4py3-none-any.whl → 0.0.5py3-none-any.whl