flowly-code 1.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- flowly_code/__init__.py +30 -0
- flowly_code/__main__.py +8 -0
- flowly_code/activity/__init__.py +1 -0
- flowly_code/activity/bus.py +91 -0
- flowly_code/activity/events.py +40 -0
- flowly_code/agent/__init__.py +8 -0
- flowly_code/agent/context.py +485 -0
- flowly_code/agent/loop.py +1349 -0
- flowly_code/agent/memory.py +109 -0
- flowly_code/agent/skills.py +259 -0
- flowly_code/agent/subagent.py +249 -0
- flowly_code/agent/tools/__init__.py +6 -0
- flowly_code/agent/tools/base.py +55 -0
- flowly_code/agent/tools/delegate.py +194 -0
- flowly_code/agent/tools/dispatch.py +840 -0
- flowly_code/agent/tools/docker.py +609 -0
- flowly_code/agent/tools/filesystem.py +280 -0
- flowly_code/agent/tools/mcp.py +85 -0
- flowly_code/agent/tools/message.py +235 -0
- flowly_code/agent/tools/registry.py +257 -0
- flowly_code/agent/tools/screenshot.py +444 -0
- flowly_code/agent/tools/shell.py +166 -0
- flowly_code/agent/tools/spawn.py +65 -0
- flowly_code/agent/tools/system.py +917 -0
- flowly_code/agent/tools/trello.py +420 -0
- flowly_code/agent/tools/web.py +139 -0
- flowly_code/agent/tools/x.py +399 -0
- flowly_code/bus/__init__.py +6 -0
- flowly_code/bus/events.py +37 -0
- flowly_code/bus/queue.py +81 -0
- flowly_code/channels/__init__.py +6 -0
- flowly_code/channels/base.py +121 -0
- flowly_code/channels/manager.py +135 -0
- flowly_code/channels/telegram.py +1132 -0
- flowly_code/cli/__init__.py +1 -0
- flowly_code/cli/commands.py +1831 -0
- flowly_code/cli/setup.py +1356 -0
- flowly_code/compaction/__init__.py +39 -0
- flowly_code/compaction/estimator.py +88 -0
- flowly_code/compaction/pruning.py +223 -0
- flowly_code/compaction/service.py +297 -0
- flowly_code/compaction/summarizer.py +384 -0
- flowly_code/compaction/types.py +71 -0
- flowly_code/config/__init__.py +6 -0
- flowly_code/config/loader.py +102 -0
- flowly_code/config/schema.py +324 -0
- flowly_code/exec/__init__.py +39 -0
- flowly_code/exec/approvals.py +288 -0
- flowly_code/exec/executor.py +184 -0
- flowly_code/exec/safety.py +247 -0
- flowly_code/exec/types.py +88 -0
- flowly_code/gateway/__init__.py +5 -0
- flowly_code/gateway/server.py +103 -0
- flowly_code/heartbeat/__init__.py +5 -0
- flowly_code/heartbeat/service.py +130 -0
- flowly_code/multiagent/README.md +248 -0
- flowly_code/multiagent/__init__.py +1 -0
- flowly_code/multiagent/invoke.py +210 -0
- flowly_code/multiagent/orchestrator.py +156 -0
- flowly_code/multiagent/router.py +156 -0
- flowly_code/multiagent/setup.py +171 -0
- flowly_code/pairing/__init__.py +21 -0
- flowly_code/pairing/store.py +343 -0
- flowly_code/providers/__init__.py +6 -0
- flowly_code/providers/base.py +69 -0
- flowly_code/providers/litellm_provider.py +178 -0
- flowly_code/providers/transcription.py +64 -0
- flowly_code/session/__init__.py +5 -0
- flowly_code/session/manager.py +249 -0
- flowly_code/skills/README.md +24 -0
- flowly_code/skills/compact/SKILL.md +27 -0
- flowly_code/skills/github/SKILL.md +48 -0
- flowly_code/skills/skill-creator/SKILL.md +371 -0
- flowly_code/skills/summarize/SKILL.md +67 -0
- flowly_code/skills/tmux/SKILL.md +121 -0
- flowly_code/skills/tmux/scripts/find-sessions.sh +112 -0
- flowly_code/skills/tmux/scripts/wait-for-text.sh +83 -0
- flowly_code/skills/weather/SKILL.md +49 -0
- flowly_code/utils/__init__.py +5 -0
- flowly_code/utils/helpers.py +91 -0
- flowly_code-1.0.0.dist-info/METADATA +724 -0
- flowly_code-1.0.0.dist-info/RECORD +86 -0
- flowly_code-1.0.0.dist-info/WHEEL +4 -0
- flowly_code-1.0.0.dist-info/entry_points.txt +2 -0
- flowly_code-1.0.0.dist-info/licenses/LICENSE +191 -0
- flowly_code-1.0.0.dist-info/licenses/NOTICE +74 -0
|
@@ -0,0 +1,1349 @@
|
|
|
1
|
+
"""Agent loop: the core processing engine."""
|
|
2
|
+
|
|
3
|
+
import asyncio
|
|
4
|
+
import copy
|
|
5
|
+
import json
|
|
6
|
+
import re
|
|
7
|
+
from datetime import datetime
|
|
8
|
+
from pathlib import Path
|
|
9
|
+
from contextlib import AsyncExitStack
|
|
10
|
+
from typing import Any, Awaitable, Callable
|
|
11
|
+
|
|
12
|
+
from loguru import logger
|
|
13
|
+
|
|
14
|
+
from flowly_code.bus.events import InboundMessage, OutboundMessage
|
|
15
|
+
from flowly_code.bus.queue import MessageBus
|
|
16
|
+
from flowly_code.providers.base import LLMProvider
|
|
17
|
+
from flowly_code.agent.context import ContextBuilder
|
|
18
|
+
from flowly_code.agent.tools.registry import ToolRegistry
|
|
19
|
+
from flowly_code.agent.tools.filesystem import ReadFileTool, WriteFileTool, EditFileTool, ListDirTool
|
|
20
|
+
from flowly_code.agent.tools.web import WebSearchTool, WebFetchTool
|
|
21
|
+
from flowly_code.agent.tools.message import MessageTool
|
|
22
|
+
from flowly_code.agent.tools.screenshot import ScreenshotTool
|
|
23
|
+
from flowly_code.agent.tools.spawn import SpawnTool
|
|
24
|
+
from flowly_code.agent.tools.trello import TrelloTool
|
|
25
|
+
from flowly_code.agent.tools.docker import DockerTool
|
|
26
|
+
from flowly_code.agent.tools.system import SystemTool
|
|
27
|
+
from flowly_code.agent.subagent import SubagentManager
|
|
28
|
+
from flowly_code.session.manager import SessionManager
|
|
29
|
+
from flowly_code.compaction.service import CompactionService
|
|
30
|
+
from flowly_code.compaction.types import CompactionConfig, MemoryFlushConfig
|
|
31
|
+
from flowly_code.compaction.estimator import estimate_messages_tokens
|
|
32
|
+
from flowly_code.exec.types import ExecConfig
|
|
33
|
+
from flowly_code.config.schema import TrelloConfig, XConfig, DispatchConfig
|
|
34
|
+
|
|
35
|
+
|
|
36
|
+
class AgentLoop:
    """
    The agent loop is the core processing engine.

    It:
    1. Receives messages from the bus
    2. Builds context with history, memory, skills
    3. Calls the LLM
    4. Executes tool calls
    5. Sends responses back

    One instance drives one persona; subagents are delegated through
    SubagentManager rather than nesting loops.
    """
|
|
47
|
+
|
|
48
|
+
def __init__(
    self,
    bus: MessageBus,
    provider: LLMProvider,
    workspace: Path,
    model: str | None = None,
    action_temperature: float = 0.1,
    action_tool_retries: int = 2,
    max_iterations: int = 20,
    brave_api_key: str | None = None,
    context_messages: int = 100,
    compaction_config: CompactionConfig | None = None,
    exec_config: ExecConfig | None = None,
    trello_config: TrelloConfig | None = None,
    x_config: XConfig | None = None,
    dispatch_config: DispatchConfig | None = None,
    tools_config=None,
    mcp_servers: dict | None = None,
    persona: str = "default",
    activity_bus: "ActivityBus | None" = None,
):
    """Wire up the loop with its bus, LLM provider, and all collaborators.

    Falls back to the provider's default model when `model` is None.
    Tool registration happens at the end via `_register_default_tools()`,
    so every attribute the tools read must already be set by then.
    """
    self.bus = bus
    self.provider = provider
    self.workspace = workspace
    self.model = model or provider.get_default_model()
    self.action_temperature = action_temperature
    # Clamp: a negative retry budget makes no sense.
    self.action_tool_retries = max(0, action_tool_retries)
    self.max_iterations = max_iterations
    self.brave_api_key = brave_api_key
    self.context_messages = context_messages
    self.dispatch_config = dispatch_config
    self.tools_config = tools_config

    # Activity streaming (real-time monitoring)
    self.activity_bus = activity_bus

    # MCP (Model Context Protocol) servers — connected lazily in _connect_mcp().
    self._mcp_servers = mcp_servers or {}
    self._mcp_stack: AsyncExitStack | None = None
    self._mcp_connected = False

    self.context = ContextBuilder(workspace, persona=persona)
    self.sessions = SessionManager(workspace)
    self.tools = ToolRegistry()
    # Subagents share the same model/bus so delegated work is observable.
    self.subagents = SubagentManager(
        provider=provider,
        workspace=workspace,
        bus=bus,
        model=self.model,
        brave_api_key=brave_api_key,
        activity_bus=activity_bus,
    )

    # Compaction service
    self.compaction = CompactionService(
        provider=provider,
        model=self.model,
        config=compaction_config,
    )

    # Exec config
    self.exec_config = exec_config or ExecConfig()

    # Trello config
    self.trello_config = trello_config

    # X config
    self.x_config = x_config

    self._running = False
    self._register_default_tools()
|
|
121
|
+
|
|
122
|
+
def _emit_activity(self, event_type: str, **kwargs: Any) -> None:
|
|
123
|
+
"""Emit an activity event if bus is available and has subscribers."""
|
|
124
|
+
if not self.activity_bus or not self.activity_bus.has_subscribers:
|
|
125
|
+
return
|
|
126
|
+
try:
|
|
127
|
+
from flowly_code.activity.events import ActivityEvent
|
|
128
|
+
kwargs.setdefault("agent_name", self.context.persona)
|
|
129
|
+
self.activity_bus.emit(ActivityEvent(type=event_type, **kwargs))
|
|
130
|
+
except Exception:
|
|
131
|
+
pass # Never let activity tracking break the agent
|
|
132
|
+
|
|
133
|
+
def _fetch_project_paths(self) -> list[Path]:
|
|
134
|
+
"""Fetch Dispatch project directories synchronously (best-effort)."""
|
|
135
|
+
if not self.dispatch_config or not self.dispatch_config.enabled:
|
|
136
|
+
return []
|
|
137
|
+
try:
|
|
138
|
+
import httpx
|
|
139
|
+
port = self.dispatch_config.backend_port
|
|
140
|
+
resp = httpx.get(f"http://127.0.0.1:{port}/api/projects", timeout=5.0)
|
|
141
|
+
resp.raise_for_status()
|
|
142
|
+
projects = resp.json().get("data", [])
|
|
143
|
+
paths = []
|
|
144
|
+
for p in projects:
|
|
145
|
+
d = p.get("default_agent_working_dir", "")
|
|
146
|
+
if d:
|
|
147
|
+
paths.append(Path(d))
|
|
148
|
+
return paths
|
|
149
|
+
except Exception:
|
|
150
|
+
return []
|
|
151
|
+
|
|
152
|
+
def _register_default_tools(self) -> None:
    """Register the default set of tools.

    Order: filesystem → shell → web → message → screenshot → spawn →
    optional integrations (Trello, X, Dispatch) → Docker → system.
    Optional integrations register only when their config carries the
    required credentials / enable flag.
    """
    # Determine filesystem access mode from tools_config (default: full).
    fs_access = "full"
    fs_allowed: list[Path] | None = None
    if self.tools_config and hasattr(self.tools_config, 'filesystem'):
        fs_access = self.tools_config.filesystem.access
        if fs_access == "projects":
            # Restrict file tools to Dispatch project directories.
            fs_allowed = self._fetch_project_paths()
            logger.info(f"Filesystem access: projects mode ({len(fs_allowed)} dirs)")
        elif fs_access != "full":
            logger.info(f"Filesystem access: {fs_access} mode")

    # File tools — all four share the same sandboxing parameters.
    fs_kwargs = dict(workspace=self.workspace, access_mode=fs_access, allowed_paths=fs_allowed)
    for fs_tool_cls in (ReadFileTool, WriteFileTool, EditFileTool, ListDirTool):
        self.tools.register(fs_tool_cls(**fs_kwargs))

    # Shell tool (secure, policy-driven via exec_config)
    from flowly_code.agent.tools.shell import SecureExecTool
    self.tools.register(SecureExecTool(
        config=self.exec_config,
        working_dir=str(self.workspace),
    ))

    # Web tools
    self.tools.register(WebSearchTool(api_key=self.brave_api_key))
    self.tools.register(WebFetchTool())

    # Message tool — sends outbound messages through the bus
    self.tools.register(MessageTool(send_callback=self.bus.publish_outbound))

    # Screenshot tool
    self.tools.register(ScreenshotTool())

    # Spawn tool (for subagents)
    self.tools.register(SpawnTool(manager=self.subagents))

    # Trello tool — requires both API key and token
    if self.trello_config and self.trello_config.api_key and self.trello_config.token:
        self.tools.register(TrelloTool(
            api_key=self.trello_config.api_key,
            token=self.trello_config.token,
        ))

    # X (Twitter) tool — bearer token or full OAuth credential set
    if self.x_config and (self.x_config.bearer_token or self.x_config.api_key):
        from flowly_code.agent.tools.x import XTool
        self.tools.register(XTool(
            bearer_token=self.x_config.bearer_token,
            api_key=self.x_config.api_key,
            api_secret=self.x_config.api_secret,
            access_token=self.x_config.access_token,
            access_token_secret=self.x_config.access_token_secret,
        ))

    # Docker tool (always available, will error if Docker not installed)
    self.tools.register(DockerTool())

    # System monitoring tool
    self.tools.register(SystemTool())

    # Dispatch App tools (if configured). All share the same constructor
    # signature, so register them uniformly instead of 15 copy-pasted lines.
    if self.dispatch_config and self.dispatch_config.enabled:
        from flowly_code.agent.tools.dispatch import (
            DispatchListProjectsTool,
            DispatchGetProjectTool,
            DispatchListTasksTool,
            DispatchCreateTaskTool,
            DispatchUpdateTaskTool,
            DispatchDeleteTaskTool,
            DispatchGetTaskTool,
            DispatchRalphStatusTool,
            DispatchStartRalphTool,
            DispatchListTaskAttemptsTool,
            DispatchStartRalphSessionTool,
            DispatchStopRalphSessionTool,
            DispatchKanbanSummaryTool,
            DispatchGetRalphSessionTool,
            DispatchGetRalphPrdTool,
        )
        port = self.dispatch_config.backend_port
        dispatch_tool_classes = (
            DispatchListProjectsTool,
            DispatchGetProjectTool,
            DispatchListTasksTool,
            DispatchCreateTaskTool,
            DispatchUpdateTaskTool,
            DispatchDeleteTaskTool,
            DispatchGetTaskTool,
            DispatchRalphStatusTool,
            DispatchStartRalphTool,
            DispatchListTaskAttemptsTool,
            DispatchStartRalphSessionTool,
            DispatchStopRalphSessionTool,
            DispatchKanbanSummaryTool,
            DispatchGetRalphSessionTool,
            DispatchGetRalphPrdTool,
        )
        for dispatch_cls in dispatch_tool_classes:
            self.tools.register(dispatch_cls(port=port))
|
|
254
|
+
|
|
255
|
+
async def _connect_mcp(self) -> None:
|
|
256
|
+
"""Connect to configured MCP servers (one-time, lazy)."""
|
|
257
|
+
if self._mcp_connected or not self._mcp_servers:
|
|
258
|
+
return
|
|
259
|
+
self._mcp_connected = True
|
|
260
|
+
from flowly_code.agent.tools.mcp import connect_mcp_servers
|
|
261
|
+
|
|
262
|
+
self._mcp_stack = AsyncExitStack()
|
|
263
|
+
await self._mcp_stack.__aenter__()
|
|
264
|
+
await connect_mcp_servers(self._mcp_servers, self.tools, self._mcp_stack)
|
|
265
|
+
|
|
266
|
+
async def close_mcp(self) -> None:
    """Tear down MCP connections and drop the exit stack reference."""
    stack = self._mcp_stack
    if not stack:
        return
    await stack.aclose()
    self._mcp_stack = None
|
|
271
|
+
|
|
272
|
+
@staticmethod
|
|
273
|
+
def _tool_hint(tool_calls: list) -> str:
|
|
274
|
+
"""Format tool calls as concise hint, e.g. 'web_search("query")'."""
|
|
275
|
+
def _fmt(tc):
|
|
276
|
+
val = next(iter(tc.arguments.values()), None) if tc.arguments else None
|
|
277
|
+
if not isinstance(val, str):
|
|
278
|
+
return tc.name
|
|
279
|
+
return f'{tc.name}("{val[:40]}…")' if len(val) > 40 else f'{tc.name}("{val}")'
|
|
280
|
+
return ", ".join(_fmt(tc) for tc in tool_calls)
|
|
281
|
+
|
|
282
|
+
async def run(self) -> None:
    """Run the agent loop, processing messages from the bus.

    Polls the inbound queue with a 1-second timeout so `stop()` (which
    flips `_running`) takes effect within about a second.
    """
    self._running = True
    await self._connect_mcp()
    logger.info("Agent loop started")

    while self._running:
        try:
            # Wait for next message
            first_msg = await asyncio.wait_for(
                self.bus.consume_inbound(),
                timeout=1.0
            )
            # Drain any burst of queued messages into one ordered batch.
            batch, dropped = self._coalesce_inbound_batch(first_msg)
            if dropped:
                logger.warning(f"Inbound coalescing dropped {dropped} stale message(s)")

            # Process coalesced batch
            for msg in batch:
                try:
                    response = await self._process_message(msg)
                    if response:
                        await self.bus.publish_outbound(response)
                except Exception as e:
                    # Per-message errors are reported back to the user so
                    # one bad message doesn't kill the whole batch.
                    logger.error(f"Error processing message: {e}")
                    # Send error response
                    await self.bus.publish_outbound(OutboundMessage(
                        channel=msg.channel,
                        chat_id=msg.chat_id,
                        content=f"Sorry, I encountered an error: {str(e)}"
                    ))
        except asyncio.TimeoutError:
            # Idle tick — loop back and re-check _running.
            continue
        # NOTE(review): exceptions raised outside the inner try (e.g. from
        # _coalesce_inbound_batch or publish_outbound of the error reply)
        # are not caught here and would terminate the loop — confirm this
        # is intended.
|
|
315
|
+
|
|
316
|
+
def stop(self) -> None:
    """Stop the agent loop and schedule MCP cleanup.

    `stop()` is synchronous, so MCP teardown is fire-and-forget: when an
    event loop is running we schedule `close_mcp()` on it; otherwise the
    stack is left for garbage collection.
    """
    self._running = False
    logger.info("Agent loop stopping")
    # Schedule MCP cleanup (fire-and-forget since stop() is sync)
    if self._mcp_stack:
        try:
            # get_running_loop() replaces the deprecated
            # get_event_loop()+is_running() dance: it only ever returns a
            # loop that is actually running, and raises RuntimeError
            # otherwise — which we already handled.
            loop = asyncio.get_running_loop()
        except RuntimeError:
            return
        loop.create_task(self.close_mcp())
|
|
328
|
+
|
|
329
|
+
def _extract_action_intent_text(self, content: str) -> str:
|
|
330
|
+
"""Extract the user utterance for intent detection."""
|
|
331
|
+
return content.lower()
|
|
332
|
+
|
|
333
|
+
def _is_action_turn(self, channel: str, content: str) -> bool:
|
|
334
|
+
"""Detect whether this turn is an action request that should execute tools strictly."""
|
|
335
|
+
intent_text = self._extract_action_intent_text(content)
|
|
336
|
+
action_patterns = (
|
|
337
|
+
# Retry
|
|
338
|
+
r"\btry\s+again\b",
|
|
339
|
+
r"\bretry\b",
|
|
340
|
+
r"\btekrar\s+dene\b",
|
|
341
|
+
r"\btekrar\s+b[iı]\s+dene\b",
|
|
342
|
+
r"\btekrar\s+bir\s+dene\b",
|
|
343
|
+
r"\btekrar\s+dener\s+m[ıi]s[ıi]n\b",
|
|
344
|
+
r"\btekrar\b.*\bden\w+\b",
|
|
345
|
+
r"\byeniden\s+dene\b",
|
|
346
|
+
r"\bbir\s+daha\s+dene\b",
|
|
347
|
+
# Send / share
|
|
348
|
+
r"\bsend\b",
|
|
349
|
+
r"\bshare\b",
|
|
350
|
+
r"\bg[öo]nder\b",
|
|
351
|
+
r"\bpayla[şs]\b",
|
|
352
|
+
# Screenshot
|
|
353
|
+
r"\bscreenshot\b",
|
|
354
|
+
r"\bss\b",
|
|
355
|
+
r"\bekran\s+g[öo]r[üu]nt[üu]s[üu]\b",
|
|
356
|
+
# Generic
|
|
357
|
+
r"\brun\s+tool\b",
|
|
358
|
+
r"\bexecute\b",
|
|
359
|
+
)
|
|
360
|
+
return any(re.search(pattern, intent_text) for pattern in action_patterns)
|
|
361
|
+
|
|
362
|
+
def _is_retry_action_followup(self, content: str) -> bool:
|
|
363
|
+
"""Detect short follow-up prompts that usually mean 'retry previous action'."""
|
|
364
|
+
intent_text = self._extract_action_intent_text(content)
|
|
365
|
+
retry_patterns = (
|
|
366
|
+
r"\btry\s+again\b",
|
|
367
|
+
r"\bretry\b",
|
|
368
|
+
r"\bdo\s+it\s+again\b",
|
|
369
|
+
r"\bone\s+more\s+time\b",
|
|
370
|
+
r"\btekrar\s+dene\b",
|
|
371
|
+
r"\btekrar\s+b[iı]\s+dene\b",
|
|
372
|
+
r"\btekrar\s+bir\s+dene\b",
|
|
373
|
+
r"\btekrar\s+dener\s+m[ıi]s[ıi]n\b",
|
|
374
|
+
r"\btekrar\b.*\bden\w+\b",
|
|
375
|
+
r"\byeniden\s+dene\b",
|
|
376
|
+
r"\bbir\s+daha\s+dene\b",
|
|
377
|
+
)
|
|
378
|
+
return any(re.search(pattern, intent_text) for pattern in retry_patterns)
|
|
379
|
+
|
|
380
|
+
def _is_cancel_action_followup(self, content: str) -> bool:
|
|
381
|
+
"""Detect explicit cancellation for pending actions."""
|
|
382
|
+
intent_text = self._extract_action_intent_text(content)
|
|
383
|
+
cancel_patterns = (
|
|
384
|
+
r"\bcancel\b",
|
|
385
|
+
r"\bstop\b",
|
|
386
|
+
r"\bforget\s+it\b",
|
|
387
|
+
r"\bnever\s*mind\b",
|
|
388
|
+
r"\babort\b",
|
|
389
|
+
r"\bvazge[cç]\b",
|
|
390
|
+
r"\biptal\b",
|
|
391
|
+
r"\bbo[sş]ver\b",
|
|
392
|
+
)
|
|
393
|
+
return any(re.search(pattern, intent_text) for pattern in cancel_patterns)
|
|
394
|
+
|
|
395
|
+
def _consume_pending_action_lock(self, session: Any, content: str) -> bool:
|
|
396
|
+
"""
|
|
397
|
+
Consume a pending-action lock set by a previous failed action turn.
|
|
398
|
+
|
|
399
|
+
If active, force this turn into action mode unless user explicitly cancels.
|
|
400
|
+
"""
|
|
401
|
+
pending = session.metadata.get("pending_action_lock")
|
|
402
|
+
if not isinstance(pending, dict):
|
|
403
|
+
return False
|
|
404
|
+
if not pending.get("active"):
|
|
405
|
+
return False
|
|
406
|
+
|
|
407
|
+
remaining = int(pending.get("remaining_turns", 0) or 0)
|
|
408
|
+
if remaining <= 0:
|
|
409
|
+
session.metadata.pop("pending_action_lock", None)
|
|
410
|
+
return False
|
|
411
|
+
|
|
412
|
+
if self._is_cancel_action_followup(content):
|
|
413
|
+
session.metadata.pop("pending_action_lock", None)
|
|
414
|
+
return False
|
|
415
|
+
|
|
416
|
+
pending["remaining_turns"] = remaining - 1
|
|
417
|
+
pending["last_consumed_at"] = datetime.now().isoformat()
|
|
418
|
+
session.metadata["pending_action_lock"] = pending
|
|
419
|
+
return True
|
|
420
|
+
|
|
421
|
+
def _set_pending_action_lock(self, session: Any, request_text: str) -> None:
|
|
422
|
+
"""Arm pending-action lock so next follow-up is forced into action mode."""
|
|
423
|
+
session.metadata["pending_action_lock"] = {
|
|
424
|
+
"active": True,
|
|
425
|
+
"remaining_turns": 2,
|
|
426
|
+
"request": request_text[:300],
|
|
427
|
+
"set_at": datetime.now().isoformat(),
|
|
428
|
+
}
|
|
429
|
+
|
|
430
|
+
def _clear_pending_action_lock(self, session: Any) -> None:
|
|
431
|
+
"""Clear pending-action lock after successful action execution."""
|
|
432
|
+
session.metadata.pop("pending_action_lock", None)
|
|
433
|
+
|
|
434
|
+
def _should_promote_retry_to_action(
|
|
435
|
+
self,
|
|
436
|
+
content: str,
|
|
437
|
+
history: list[dict[str, Any]],
|
|
438
|
+
) -> bool:
|
|
439
|
+
"""Promote retry follow-ups to action turns when recent context indicates pending action."""
|
|
440
|
+
if not self._is_retry_action_followup(content):
|
|
441
|
+
return False
|
|
442
|
+
|
|
443
|
+
# Strong default: retry follow-ups are treated as action intents.
|
|
444
|
+
if history:
|
|
445
|
+
return True
|
|
446
|
+
|
|
447
|
+
recent_messages = history[-6:]
|
|
448
|
+
recent_text = " ".join(
|
|
449
|
+
str(msg.get("content", "")).lower()
|
|
450
|
+
for msg in recent_messages
|
|
451
|
+
if isinstance(msg, dict)
|
|
452
|
+
)
|
|
453
|
+
retry_context_markers = (
|
|
454
|
+
"tool call could not be verified",
|
|
455
|
+
"tool calls failed",
|
|
456
|
+
"no action was taken",
|
|
457
|
+
)
|
|
458
|
+
if any(marker in recent_text for marker in retry_context_markers):
|
|
459
|
+
return True
|
|
460
|
+
|
|
461
|
+
# If recent user messages were action-like, treat retry as action.
|
|
462
|
+
for msg in reversed(recent_messages):
|
|
463
|
+
if not isinstance(msg, dict):
|
|
464
|
+
continue
|
|
465
|
+
if msg.get("role") != "user":
|
|
466
|
+
continue
|
|
467
|
+
text = str(msg.get("content", ""))
|
|
468
|
+
if text and self._is_action_turn("", text):
|
|
469
|
+
return True
|
|
470
|
+
return False
|
|
471
|
+
|
|
472
|
+
def _contains_unverified_completion_claim(self, text: str) -> bool:
|
|
473
|
+
"""Detect response phrases that claim completion without tool evidence."""
|
|
474
|
+
lowered = (text or "").lower()
|
|
475
|
+
claim_patterns = (
|
|
476
|
+
r"\byapt[ıi]m\b",
|
|
477
|
+
r"\bg[öo]nderdim\b",
|
|
478
|
+
r"\bald[ıi]m\b",
|
|
479
|
+
r"\ba[cç]t[ıi]m\b",
|
|
480
|
+
r"\bkapatt[ıi]m\b",
|
|
481
|
+
r"\btamamlad[ıi]m\b",
|
|
482
|
+
r"\bi did\b",
|
|
483
|
+
r"\bi sent\b",
|
|
484
|
+
r"\bi took\b",
|
|
485
|
+
r"\bi opened\b",
|
|
486
|
+
r"\bi closed\b",
|
|
487
|
+
r"\bdone\b",
|
|
488
|
+
r"\bcompleted\b",
|
|
489
|
+
r"\bfinished\b",
|
|
490
|
+
)
|
|
491
|
+
return any(re.search(pattern, lowered) for pattern in claim_patterns)
|
|
492
|
+
|
|
493
|
+
# Hardcoded fallback messages that should be replaced by model-generated summaries.
# NOTE: these literals must match, byte-for-byte, the fallback strings produced
# elsewhere in the loop — _is_hardcoded_fallback tests membership with exact
# string equality.
_HARDCODED_FALLBACKS = frozenset({
    "Tool calls failed, no action was taken.",
    "Tool call could not be verified, no action was taken.",
    "No safe tool could be executed for the live call.",
    "Action executed.",
    "Action completed but no response could be generated.",
    "No tool was executed, no action was taken.",
})
|
|
502
|
+
|
|
503
|
+
def _is_hardcoded_fallback(self, content: str) -> bool:
|
|
504
|
+
"""Check if final_content is a hardcoded fallback rather than model output."""
|
|
505
|
+
if content in self._HARDCODED_FALLBACKS:
|
|
506
|
+
return True
|
|
507
|
+
if content.startswith("Actions completed (") and "tools executed" in content:
|
|
508
|
+
return True
|
|
509
|
+
if content.startswith("✓ Action completed"):
|
|
510
|
+
return True
|
|
511
|
+
if content.startswith("Action completed.\n"):
|
|
512
|
+
return True
|
|
513
|
+
return False
|
|
514
|
+
|
|
515
|
+
async def _request_summary_turn(
|
|
516
|
+
self, messages: list[dict], tool_results: list[dict]
|
|
517
|
+
) -> str | None:
|
|
518
|
+
"""Ask the model to summarize tool results in natural language.
|
|
519
|
+
|
|
520
|
+
When tool calls complete but the loop exits with a hardcoded fallback,
|
|
521
|
+
this gives the model a chance to explain what happened to the user.
|
|
522
|
+
"""
|
|
523
|
+
summary_prompt = (
|
|
524
|
+
"The tool calls above have completed. "
|
|
525
|
+
"Summarize what happened to the user in a natural, concise way. "
|
|
526
|
+
"If there were errors, explain what went wrong clearly."
|
|
527
|
+
)
|
|
528
|
+
messages_copy = list(messages)
|
|
529
|
+
messages_copy.append({"role": "user", "content": summary_prompt})
|
|
530
|
+
|
|
531
|
+
try:
|
|
532
|
+
response = await self.provider.chat(
|
|
533
|
+
messages=messages_copy,
|
|
534
|
+
tools=[],
|
|
535
|
+
model=self.model,
|
|
536
|
+
temperature=0.7,
|
|
537
|
+
)
|
|
538
|
+
if response.content and response.content.strip():
|
|
539
|
+
return response.content.strip()
|
|
540
|
+
except Exception as e:
|
|
541
|
+
logger.warning(f"Summary turn failed, keeping fallback: {e}")
|
|
542
|
+
return None
|
|
543
|
+
|
|
544
|
+
def _is_strict_live_call_action_intent(self, content: str) -> bool:
|
|
545
|
+
"""
|
|
546
|
+
Detect high-confidence action intents in an active call turn.
|
|
547
|
+
|
|
548
|
+
This avoids forcing tools for regular chat utterances.
|
|
549
|
+
"""
|
|
550
|
+
intent_text = self._extract_action_intent_text(content)
|
|
551
|
+
strict_patterns = (
|
|
552
|
+
r"\bg[öo]nder\b",
|
|
553
|
+
r"\bsend\b",
|
|
554
|
+
r"\bekran\s+g[öo]r[üu]nt[üu]s[üu]\b",
|
|
555
|
+
r"\bscreenshot\b",
|
|
556
|
+
)
|
|
557
|
+
return any(re.search(pattern, intent_text) for pattern in strict_patterns)
|
|
558
|
+
|
|
559
|
+
def _is_live_call_turn(self, content: str) -> bool:
|
|
560
|
+
"""Detect active call orchestration prompts (disabled - voice removed)."""
|
|
561
|
+
return False
|
|
562
|
+
|
|
563
|
+
def _apply_turn_tool_policy(
|
|
564
|
+
self,
|
|
565
|
+
tool_defs: list[dict[str, Any]],
|
|
566
|
+
live_call_turn: bool,
|
|
567
|
+
) -> tuple[list[dict[str, Any]], list[str]]:
|
|
568
|
+
"""Apply per-turn tool constraints for safety and predictability."""
|
|
569
|
+
# Voice/call handling removed for Dispatch integration
|
|
570
|
+
return tool_defs, []
|
|
571
|
+
|
|
572
|
+
def _is_live_call_tool_allowed(self, tool_name: str, tool_args: dict[str, Any]) -> bool:
|
|
573
|
+
"""Final runtime guard for live-call tool execution (disabled)."""
|
|
574
|
+
return True
|
|
575
|
+
|
|
576
|
+
def _coalesce_inbound_batch(self, first_msg: InboundMessage) -> tuple[list[InboundMessage], int]:
|
|
577
|
+
"""
|
|
578
|
+
Collect bursty inbound traffic without dropping user messages.
|
|
579
|
+
|
|
580
|
+
Queue-All policy: preserve full ordering and keep every message.
|
|
581
|
+
"""
|
|
582
|
+
batch = [first_msg]
|
|
583
|
+
|
|
584
|
+
while True:
|
|
585
|
+
try:
|
|
586
|
+
batch.append(self.bus.inbound.get_nowait())
|
|
587
|
+
except asyncio.QueueEmpty:
|
|
588
|
+
break
|
|
589
|
+
|
|
590
|
+
return batch, 0
|
|
591
|
+
|
|
592
|
+
async def _run_llm_tool_loop(
    self,
    messages: list[dict[str, Any]],
    action_turn: bool,
    live_call_turn: bool = False,
    turn_content: str = "",
    on_progress: Callable[[str], Awaitable[None]] | None = None,
) -> tuple[str, list[dict[str, Any]], list[str]]:
    """
    Run iterative LLM + tool execution loop until final response.

    Each iteration sends the conversation to the provider, executes any
    tool calls it returns, and appends the results back into ``messages``.
    Action turns (``action_turn=True``) force tool usage and retry with
    corrective instructions up to ``self.action_tool_retries`` times when
    no tool call succeeds.

    Returns:
        (final_content, accumulated_tool_results, executed_tool_names)
    """
    iteration = 0
    final_content: str | None = None
    accumulated_tool_results: list[dict[str, Any]] = []
    executed_tool_names: list[str] = []
    blocked_tools: list[str] = []
    tools_were_used = False
    successful_tools_were_used = False
    no_tool_retry_count = 0
    forced_tool_retry = False
    # Tools are enforced for action turns, except during a live call where
    # only high-confidence action intents force tool use.
    strict_live_call_action = live_call_turn and self._is_strict_live_call_action_intent(turn_content)
    enforce_action_tools = action_turn and (not live_call_turn or strict_live_call_action)

    selected_model = self.model
    selected_temperature = self.action_temperature if action_turn else 0.7
    max_turn_iterations = self.max_iterations
    # Conversational live-call turns get a tight iteration budget.
    if live_call_turn and not enforce_action_tools:
        max_turn_iterations = min(max_turn_iterations, 3)

    while iteration < max_turn_iterations:
        iteration += 1
        self._emit_activity("iteration_start", iteration=iteration)

        tool_defs, policy_blocked_tools = self._apply_turn_tool_policy(
            self.tools.get_definitions(),
            live_call_turn=live_call_turn,
        )
        if policy_blocked_tools:
            blocked_tools.extend(policy_blocked_tools)
        # "required" forces the model to emit a tool call until one succeeds.
        tool_choice = (
            "required"
            if ((enforce_action_tools or forced_tool_retry) and not successful_tools_were_used)
            else "auto"
        )
        logger.info(
            "LLM request telemetry: "
            f"model={selected_model}, tool_choice={tool_choice}, tool_count={len(tool_defs)}, "
            f"action_turn={action_turn}, live_call_turn={live_call_turn}, "
            f"blocked_tools={sorted(set(blocked_tools))}, "
            f"iteration={iteration}/{max_turn_iterations}"
        )

        self._emit_activity("llm_start", iteration=iteration)
        response = await self.provider.chat(
            messages=messages,
            tools=tool_defs,
            model=selected_model,
            temperature=selected_temperature,
            tool_choice=tool_choice,
        )
        self._emit_activity("llm_end", iteration=iteration)

        # Some providers reject tool_choice="required"; retry once with "auto".
        # NOTE(review): provider errors are detected via an "Error" content
        # prefix — assumes the provider wrapper encodes failures this way.
        if response.content and response.content.startswith("Error") and tool_choice == "required":
            logger.warning(f"tool_choice=required failed, retrying with auto: {response.content[:120]}")
            response = await self.provider.chat(
                messages=messages,
                tools=tool_defs,
                model=selected_model,
                temperature=selected_temperature,
                tool_choice="auto",
            )

        # Hard failure after the fallback call: abort the turn with a
        # user-facing explanation rather than looping further.
        if response.content and response.content.startswith("Error calling LLM:"):
            lowered_error = response.content.lower()
            schema_rejected = (
                "input_schema does not support oneof" in lowered_error
                or "input_schema does not support allof" in lowered_error
                or "input_schema does not support anyof" in lowered_error
            )
            if schema_rejected:
                logger.error("Provider rejected tool schema; aborting turn without additional retries.")
                final_content = (
                    "Tool schema was rejected by the model provider. "
                    "No action was taken."
                )
            else:
                logger.error("LLM call failed after fallback; aborting turn without additional retries.")
                final_content = (
                    "Could not get a valid response from the model provider. "
                    "No action was taken."
                )
            break

        logger.info(
            "LLM response telemetry: "
            f"has_tool_calls={response.has_tool_calls}, content_len={len(response.content or '')}, "
            f"action_turn={action_turn}, live_call_turn={live_call_turn}, iteration={iteration}"
        )

        if response.has_tool_calls:
            # Emit progress hint to caller
            if on_progress:
                hint = self._tool_hint(response.tool_calls)
                await on_progress(hint)

            # Re-serialize tool calls into OpenAI-style dicts for history.
            tool_call_dicts = [
                {
                    "id": tc.id,
                    "type": "function",
                    "function": {
                        "name": tc.name,
                        "arguments": json.dumps(tc.arguments),
                    },
                }
                for tc in response.tool_calls
            ]

            # Drop assistant text that prematurely claims completion
            # (English and Turkish phrases) before the tools actually run.
            assistant_content = None
            if response.content:
                content_lower = response.content.lower()
                hallucination_phrases = [
                    "i did", "i sent", "i took", "i opened", "i closed",
                    "done", "completed", "finished",
                    "yaptım", "gönderdim", "aldım", "açtım", "kapattım", "tamamlandı",
                ]
                if not any(phrase in content_lower for phrase in hallucination_phrases):
                    assistant_content = response.content

            messages = self.context.add_assistant_message(
                messages, assistant_content, tool_call_dicts
            )

            turn_tools: list[str] = []
            # NOTE(review): terminal_action_executed is never set True in this
            # version (voice_call/cron terminal tools were removed); the
            # branches that read it are retained for future terminal tools.
            terminal_action_executed = False
            turn_success_count = 0
            for tool_call in response.tool_calls:
                turn_tools.append(tool_call.name)
                executed_tool_names.append(tool_call.name)
                args_str = json.dumps(tool_call.arguments)
                logger.info(f"Executing tool: {tool_call.name}({args_str[:160]}...)")

                # Live-call security policy may veto individual tool calls;
                # blocked calls still get a tool-result message so the
                # transcript stays well-formed.
                if live_call_turn and not self._is_live_call_tool_allowed(
                    tool_call.name,
                    tool_call.arguments,
                ):
                    blocked_tools.append(tool_call.name)
                    result = (
                        f"Error: Tool '{tool_call.name}' was blocked by the "
                        "live-call security policy."
                    )
                    logger.error(
                        f"Live call blocked risky tool: {tool_call.name} args={args_str[:160]}"
                    )
                    accumulated_tool_results.append({
                        "tool": tool_call.name,
                        "success": False,
                        "result": result,
                    })
                    messages = self.context.add_tool_result(
                        messages, tool_call.id, tool_call.name, result
                    )
                    continue

                self._emit_activity(
                    "tool_start",
                    iteration=iteration,
                    tool_name=tool_call.name,
                    tool_args_preview=args_str[:100],
                )
                try:
                    result = await self.tools.execute(tool_call.name, tool_call.arguments)
                    # Tool failures are signalled by an "Error" prefix on the
                    # result string; results are truncated to 500 chars.
                    accumulated_tool_results.append({
                        "tool": tool_call.name,
                        "success": not result.startswith("Error"),
                        "result": result[:500] if len(result) > 500 else result,
                    })
                except Exception as e:
                    result = f"Error executing {tool_call.name}: {str(e)}"
                    logger.error(result)
                    accumulated_tool_results.append({
                        "tool": tool_call.name,
                        "success": False,
                        "result": result,
                    })
                else:
                    # No-exception path: classify and log the outcome.
                    if not result.startswith("Error"):
                        turn_success_count += 1
                        logger.info(
                            f"Tool success: {tool_call.name} result={result[:180]}"
                        )
                    else:
                        logger.warning(
                            f"Tool failed: {tool_call.name} result={result[:220]}"
                        )
                self._emit_activity(
                    "tool_end",
                    iteration=iteration,
                    tool_name=tool_call.name,
                    success=not result.startswith("Error"),
                )

                messages = self.context.add_tool_result(
                    messages, tool_call.id, tool_call.name, result
                )

                # In strict action turns, stop as soon as a terminal action succeeds.
                # (voice_call and cron tools removed for Dispatch integration)

                if terminal_action_executed:
                    logger.info(
                        "Action turn terminal tool executed; skipping remaining tool calls in this batch."
                    )
                    break

            logger.info(f"Tool execution telemetry: executed_tools={turn_tools}")
            tools_were_used = True
            if turn_success_count > 0:
                successful_tools_were_used = True
                forced_tool_retry = False

            # Terminal tool ran: summarize the last successful result and stop.
            if terminal_action_executed:
                successful = [t for t in accumulated_tool_results if t.get("success")]
                if successful:
                    last_ok = successful[-1]
                    final_content = (
                        "Action completed.\n"
                        f"{last_ok['tool']}: {last_ok['result']}"
                    )
                else:
                    final_content = "Action executed."
                break

            # Conversational live-call turns finish after one tool batch.
            if live_call_turn and not enforce_action_tools:
                successful = [t for t in accumulated_tool_results if t.get("success")]
                if successful:
                    last_ok = successful[-1]
                    final_content = (
                        response.content.strip()
                        if response.content and response.content.strip()
                        else f"Action completed: {last_ok['tool']}"
                    )
                else:
                    final_content = "No safe tool could be executed for the live call."
                break

            # Enforced action turn with only failed tool calls: nudge the
            # model to retry, up to the configured retry budget.
            if enforce_action_tools and turn_success_count == 0:
                if no_tool_retry_count < self.action_tool_retries:
                    no_tool_retry_count += 1
                    logger.warning(
                        "Action turn tool calls all failed; retrying with corrective instruction "
                        f"({no_tool_retry_count}/{self.action_tool_retries})"
                    )
                    messages.append({
                        "role": "user",
                        "content": (
                            "The previous tool call failed. "
                            "Retry the relevant tool with correct parameters. "
                            "If it fails, give a clear error — do not call unrelated tools."
                        ),
                    })
                    continue
                final_content = "Tool calls failed, no action was taken."
                break

            continue

        # Provider/model may hallucinate completion without emitting tool calls.
        # OpenClaw-style guard: force a corrective tool-only retry before responding.
        if (
            not successful_tools_were_used
            and response.content
            and self._contains_unverified_completion_claim(response.content)
            and no_tool_retry_count < self.action_tool_retries
        ):
            no_tool_retry_count += 1
            forced_tool_retry = True
            self._emit_activity("hallucination_retry", iteration=iteration)
            logger.warning(
                "Completion claim without tool call; retrying with forced tool instruction "
                f"({no_tool_retry_count}/{self.action_tool_retries})"
            )
            messages.append({
                "role": "user",
                "content": (
                    "The previous response claims the action was done but no tool was called. "
                    "You must call the appropriate tool now. "
                    "Do not claim completion without executing a tool."
                ),
            })
            continue

        # Action turn ended with no (successful) tool call at all: retry,
        # then give up with an explicit non-action message.
        if enforce_action_tools and not successful_tools_were_used:
            if no_tool_retry_count < self.action_tool_retries:
                no_tool_retry_count += 1
                logger.warning(
                    "Action turn returned no tool call; retrying with corrective instruction "
                    f"({no_tool_retry_count}/{self.action_tool_retries})"
                )
                messages.append({
                    "role": "user",
                    "content": (
                        "This is an action request. Call the appropriate tool now. "
                        "Do not claim completion without executing a tool."
                    ),
                })
                continue

            final_content = "Tool call could not be verified, no action was taken."
            break

        # The forced retry still yielded no successful tool: refuse to
        # pass on the model's unverified claim.
        if forced_tool_retry and not successful_tools_were_used:
            final_content = "Tool call could not be verified, no action was taken."
            break

        final_content = response.content
        break

    # --- Post-loop normalization of final_content ---------------------

    # Enforced action turn without success must never report success.
    if enforce_action_tools and not successful_tools_were_used:
        if not final_content or not final_content.startswith("Tool"):
            final_content = "Tool calls failed, no action was taken."

    # Iteration budget exhausted without a final answer: synthesize a
    # summary from the tool results (last 5 shown).
    if final_content is None:
        if accumulated_tool_results:
            summary = f"Actions completed ({len(accumulated_tool_results)} tools executed):\n"
            for tr in accumulated_tool_results[-5:]:
                status = "✓" if tr["success"] else "✗"
                summary += f" {status} {tr['tool']}\n"
            final_content = summary
        else:
            final_content = "Action completed but no response could be generated."

    # Never return an empty/whitespace-only reply.
    if not final_content or not final_content.strip():
        if enforce_action_tools and not successful_tools_were_used:
            final_content = "Tool call could not be verified, no action was taken."
        elif accumulated_tool_results:
            final_content = "✓ Action completed."
        else:
            final_content = "Action completed but no response could be generated."

    # Suppress completion claims when no tool at all was executed.
    if (
        final_content
        and not executed_tool_names
        and (action_turn or self._is_retry_action_followup(turn_content))
        and self._contains_unverified_completion_claim(final_content)
    ):
        logger.warning("Suppressed unverified completion claim because no tool was executed.")
        final_content = "No tool was executed, no action was taken."

    logger.info(
        "LLM final telemetry: "
        f"final_content_length={len(final_content)}, executed_tools={executed_tool_names}, "
        f"action_turn={action_turn}, live_call_turn={live_call_turn}, "
        f"blocked_tools={sorted(set(blocked_tools))}"
    )

    if enforce_action_tools and not executed_tool_names:
        logger.error("Action turn alarm: executed_tools=0")

    # If the loop produced a hardcoded fallback and tool results exist,
    # ask the model to summarize what happened in natural language.
    if final_content and self._is_hardcoded_fallback(final_content) and accumulated_tool_results:
        logger.info("Requesting model summary turn to replace hardcoded fallback")
        summary = await self._request_summary_turn(messages, accumulated_tool_results)
        if summary:
            final_content = summary

    self._emit_activity("iteration_end", iteration=iteration)
    return final_content, accumulated_tool_results, executed_tool_names
|
|
963
|
+
|
|
964
|
+
async def _run_memory_flush(
    self,
    session: Any,
    channel: str,
    chat_id: str,
) -> None:
    """
    Run a pre-compaction memory flush turn.

    This gives the agent a chance to save important information
    to disk before context gets compacted.

    The whole turn is best-effort: any failure is logged and swallowed
    so a flush problem never blocks normal message processing.

    Args:
        session: Conversation session whose history is flushed and which
            records the flush interaction afterwards.
        channel: Outbound channel used if the agent has something to say.
        chat_id: Destination chat for the optional outbound note.
    """
    user_prompt, system_prompt = self.compaction.get_memory_flush_prompt()

    # Build messages with flush prompt
    messages = self.context.build_messages(
        history=session.get_history(max_messages=self.context_messages),
        current_message=user_prompt,
    )

    # Add system prompt for flush context
    # (assumes messages[0] is the system message built by context — TODO confirm)
    messages[0]["content"] += f"\n\n{system_prompt}"

    # Run a single turn with tools available
    try:
        response = await self.provider.chat(
            messages=messages,
            tools=self.tools.get_definitions(),
            model=self.model
        )

        # Execute any tool calls (agent might want to write to memory)
        # Results are intentionally discarded: only the side effects matter.
        if response.has_tool_calls:
            for tool_call in response.tool_calls:
                logger.debug(f"Memory flush tool: {tool_call.name}")
                await self.tools.execute(tool_call.name, tool_call.arguments)

        # Check if response should be silent
        content = response.content or ""
        if not self.compaction.is_silent_reply(content):
            # Agent wants to communicate something
            stripped = self.compaction.strip_silent_token(content)
            if stripped:
                logger.info(f"Memory flush response: {stripped[:100]}...")
                # Optionally send to user
                await self.bus.publish_outbound(OutboundMessage(
                    channel=channel,
                    chat_id=chat_id,
                    content=f"📝 {stripped}"
                ))

        # Save flush interaction to session
        session.add_message("user", f"[System: Memory Flush] {user_prompt}")
        session.add_message("assistant", content)
        self.sessions.save(session)

    except Exception as e:
        # Best-effort: a failed flush is logged, never raised.
        logger.warning(f"Memory flush failed: {e}")
|
|
1022
|
+
|
|
1023
|
+
async def _process_message(self, msg: InboundMessage) -> OutboundMessage | None:
    """
    Process a single inbound message.

    Pipeline: system-message dispatch → /new-//clear handling → session
    lookup → tool context update → persona-change marker → memory flush /
    compaction checks → LLM tool loop → pending-action-lock bookkeeping →
    session save → outbound reply.

    Args:
        msg: The inbound message to process.

    Returns:
        The response message, or None if no response needed.
    """
    # Handle system messages (subagent announces)
    # The chat_id contains the original "channel:chat_id" to route back to
    if msg.channel == "system":
        return await self._process_system_message(msg)

    logger.info(f"Processing message from {msg.channel}:{msg.sender_id}")

    # Handle /new and /clear commands
    is_command = msg.metadata.get("is_command", False)
    command = msg.metadata.get("command", "")
    if is_command and command in ("new", "clear"):
        session = self.sessions.get_or_create(msg.session_key)
        session.clear()
        # Re-stamp the current persona so the fresh session starts aligned.
        session.metadata["persona"] = self.context.persona
        self.sessions.save(session)
        logger.info(f"Session {msg.session_key} cleared via /{command}")
        return None  # Telegram handler already sent confirmation

    # Get or create session
    session = self.sessions.get_or_create(msg.session_key)

    # Update tool contexts
    message_tool = self.tools.get("message")
    if isinstance(message_tool, MessageTool):
        message_tool.set_context(msg.channel, msg.chat_id)

    spawn_tool = self.tools.get("spawn")
    if isinstance(spawn_tool, SpawnTool):
        spawn_tool.set_context(msg.channel, msg.chat_id)

    # Detect persona change and inject transition marker
    current_persona = self.context.persona
    session_persona = session.metadata.get("persona")
    if session_persona and session_persona != current_persona and session.messages:
        logger.info(f"Persona changed: {session_persona} → {current_persona}")
        session.add_message(
            "system",
            f"[PERSONA CHANGE] The assistant's persona has been changed from "
            f"'{session_persona}' to '{current_persona}'. From this point forward, "
            f"respond strictly as the new persona. Ignore the style/tone of previous "
            f"messages in this conversation."
        )
        session.metadata["persona"] = current_persona

    # Get history and check for compaction
    history = session.get_history(max_messages=self.context_messages)

    # Check if memory flush is needed before potential compaction
    total_tokens = estimate_messages_tokens(history)
    if self.compaction.should_memory_flush(total_tokens):
        logger.info("Running pre-compaction memory flush")
        await self._run_memory_flush(session, msg.channel, msg.chat_id)
        self.compaction.mark_memory_flush_done()
        # Reload history after flush
        history = session.get_history(max_messages=self.context_messages)
        total_tokens = estimate_messages_tokens(history)

    # Check if compaction is needed
    if self.compaction.should_compact(total_tokens):
        logger.info(f"Compacting context: {total_tokens} tokens exceeds threshold")
        result = await self.compaction.compact(history)
        logger.info(
            f"Compaction complete: {result.tokens_before} -> {result.tokens_after} tokens, "
            f"removed {result.messages_removed} messages"
        )
        # Replace history with summary
        history = [{"role": "system", "content": f"[Previous conversation summary]\n\n{result.summary}"}]
        # Update session with compacted history
        session.metadata["last_compaction_summary"] = result.summary

    # Build initial messages
    messages = self.context.build_messages(
        history=history,
        current_message=msg.content,
        media=msg.media if msg.media else None,
    )

    # Classify the turn; two promotion paths can upgrade it to an action
    # turn: retry-followup detection and a previously armed pending lock.
    action_turn = self._is_action_turn(msg.channel, msg.content)
    if not action_turn and self._should_promote_retry_to_action(msg.content, history):
        action_turn = True
    if not action_turn and self._consume_pending_action_lock(session, msg.content):
        action_turn = True
        logger.info("Pending action lock promoted this turn to action_turn=True")
    live_call_turn = self._is_live_call_turn(msg.content)
    final_content, tool_results, _executed_tools = await self._run_llm_tool_loop(
        messages=messages,
        action_turn=action_turn,
        live_call_turn=live_call_turn,
        turn_content=msg.content,
    )

    # Arm/clear the pending action lock depending on whether any tool
    # actually succeeded this action turn.
    if action_turn:
        successful_tools = [r for r in tool_results if r.get("success")]
        if successful_tools:
            self._clear_pending_action_lock(session)
        else:
            self._set_pending_action_lock(session, msg.content)
            logger.warning("Action turn ended without successful tool execution; pending lock armed.")

    # Save to session
    session.add_message("user", msg.content)
    session.add_message("assistant", final_content)
    self.sessions.save(session)

    return OutboundMessage(
        channel=msg.channel,
        chat_id=msg.chat_id,
        content=final_content
    )
|
|
1142
|
+
|
|
1143
|
+
async def _process_system_message(self, msg: InboundMessage) -> OutboundMessage | None:
    """
    Process a system message (e.g., subagent announce).

    The chat_id field contains "original_channel:original_chat_id" to route
    the response back to the correct destination.

    Unlike :meth:`_process_message`, progress hints are emitted while the
    tool loop runs — either through an ``on_progress`` callback smuggled in
    via ``msg.metadata`` or by publishing to the outbound bus.
    """
    logger.info(f"Processing system message from {msg.sender_id}")

    # Parse origin from chat_id (format: "channel:chat_id")
    if ":" in msg.chat_id:
        parts = msg.chat_id.split(":", 1)
        origin_channel = parts[0]
        origin_chat_id = parts[1]
    else:
        # Fallback
        origin_channel = "cli"
        origin_chat_id = msg.chat_id

    # Use the origin session for context
    session_key = f"{origin_channel}:{origin_chat_id}"
    session = self.sessions.get_or_create(session_key)

    # Update tool contexts
    message_tool = self.tools.get("message")
    if isinstance(message_tool, MessageTool):
        message_tool.set_context(origin_channel, origin_chat_id)

    spawn_tool = self.tools.get("spawn")
    if isinstance(spawn_tool, SpawnTool):
        spawn_tool.set_context(origin_channel, origin_chat_id)

    # Build messages with the announce content
    messages = self.context.build_messages(
        history=session.get_history(max_messages=self.context_messages),
        current_message=msg.content
    )

    # Same action-turn promotion chain as _process_message.
    action_turn = self._is_action_turn(origin_channel, msg.content)
    if not action_turn and self._should_promote_retry_to_action(
        msg.content,
        session.get_history(max_messages=self.context_messages),
    ):
        action_turn = True
    if not action_turn and self._consume_pending_action_lock(session, msg.content):
        action_turn = True
        logger.info("Pending action lock promoted system turn to action_turn=True")
    live_call_turn = self._is_live_call_turn(msg.content)
    # Progress callback: prefer custom callback from metadata, fallback to bus
    # NOTE: pop() also removes the callable so it is not persisted anywhere.
    custom_progress = (msg.metadata or {}).pop("on_progress", None)

    async def _bus_progress(hint: str) -> None:
        # Default progress sink: echo the hint to the originating bus
        # channel, flagged so channels can render it as a progress line.
        await self.bus.publish_outbound(OutboundMessage(
            channel=msg.channel, chat_id=msg.chat_id,
            content=f"↳ {hint}",
            metadata={"progress": True},
        ))

    progress_fn = custom_progress if callable(custom_progress) else _bus_progress

    final_content, tool_results, _executed_tools = await self._run_llm_tool_loop(
        messages=messages,
        action_turn=action_turn,
        live_call_turn=live_call_turn,
        turn_content=msg.content,
        on_progress=progress_fn,
    )

    # Arm/clear the pending action lock based on tool success this turn.
    if action_turn:
        successful_tools = [r for r in tool_results if r.get("success")]
        if successful_tools:
            self._clear_pending_action_lock(session)
        else:
            self._set_pending_action_lock(session, msg.content)

    # Save to session (mark as system message in history)
    session.add_message("user", f"[System: {msg.sender_id}] {msg.content}")
    session.add_message("assistant", final_content)
    self.sessions.save(session)

    return OutboundMessage(
        channel=origin_channel,
        chat_id=origin_chat_id,
        content=final_content
    )
|
|
1228
|
+
|
|
1229
|
+
async def process_direct(
    self,
    content: str,
    session_key: str = "cli:direct",
    on_progress: Callable[[str], Awaitable[None]] | None = None,
) -> str:
    """Handle one message outside the channel bus (CLI or voice entry point).

    Args:
        content: The message text to process.
        session_key: Session identifier in ``"channel:chat_id"`` form; a
            bare key is treated as a CLI chat id.
        on_progress: Optional async callback invoked with progress hints.

    Returns:
        The agent's reply text, or an empty string when processing
        produced no outbound message.
    """
    # Split the session key into routing parts; partition() keeps the
    # same semantics as split(":", 1) when a colon is present.
    channel, sep, chat_id = session_key.partition(":")
    if not sep:
        channel, chat_id = "cli", session_key

    await self._connect_mcp()

    metadata = {"on_progress": on_progress} if on_progress else {}
    inbound = InboundMessage(
        channel=channel,
        sender_id="user",
        chat_id=chat_id,
        content=content,
        metadata=metadata,
    )

    reply = await self._process_message(inbound)
    return reply.content if reply else ""
|
|
1263
|
+
|
|
1264
|
+
async def compact_session(
|
|
1265
|
+
self,
|
|
1266
|
+
session_key: str,
|
|
1267
|
+
custom_instructions: str | None = None,
|
|
1268
|
+
) -> dict[str, Any]:
|
|
1269
|
+
"""
|
|
1270
|
+
Manually compact a session's history.
|
|
1271
|
+
|
|
1272
|
+
Args:
|
|
1273
|
+
session_key: Session identifier.
|
|
1274
|
+
custom_instructions: Optional instructions for summarization.
|
|
1275
|
+
|
|
1276
|
+
Returns:
|
|
1277
|
+
Dict with compaction results.
|
|
1278
|
+
"""
|
|
1279
|
+
session = self.sessions.get_or_create(session_key)
|
|
1280
|
+
history = session.get_history(max_messages=self.context_messages)
|
|
1281
|
+
|
|
1282
|
+
if not history:
|
|
1283
|
+
return {
|
|
1284
|
+
"success": False,
|
|
1285
|
+
"message": "No history to compact.",
|
|
1286
|
+
"tokens_before": 0,
|
|
1287
|
+
"tokens_after": 0,
|
|
1288
|
+
}
|
|
1289
|
+
|
|
1290
|
+
tokens_before = estimate_messages_tokens(history)
|
|
1291
|
+
|
|
1292
|
+
# Check if already compacted (first message is a compaction summary)
|
|
1293
|
+
is_already_compacted = (
|
|
1294
|
+
len(history) == 1
|
|
1295
|
+
and history[0].get("role") == "system"
|
|
1296
|
+
and "[Compacted conversation summary]" in history[0].get("content", "")
|
|
1297
|
+
)
|
|
1298
|
+
|
|
1299
|
+
if is_already_compacted:
|
|
1300
|
+
return {
|
|
1301
|
+
"success": False,
|
|
1302
|
+
"message": "Already compacted. Send more messages first.",
|
|
1303
|
+
"tokens_before": tokens_before,
|
|
1304
|
+
"tokens_after": tokens_before,
|
|
1305
|
+
}
|
|
1306
|
+
|
|
1307
|
+
# Check if too few messages to compact (need at least 3 messages)
|
|
1308
|
+
# Filter out system messages for this count
|
|
1309
|
+
user_assistant_messages = [m for m in history if m.get("role") in ("user", "assistant")]
|
|
1310
|
+
if len(user_assistant_messages) < 3:
|
|
1311
|
+
return {
|
|
1312
|
+
"success": False,
|
|
1313
|
+
"message": f"Not enough messages to compact ({len(user_assistant_messages)} messages). Need at least 3.",
|
|
1314
|
+
"tokens_before": tokens_before,
|
|
1315
|
+
"tokens_after": tokens_before,
|
|
1316
|
+
}
|
|
1317
|
+
|
|
1318
|
+
# Check if token count is too low to bother compacting (< 1000 tokens)
|
|
1319
|
+
if tokens_before < 1000:
|
|
1320
|
+
return {
|
|
1321
|
+
"success": False,
|
|
1322
|
+
"message": f"History too small to compact ({tokens_before} tokens). Need at least 1000.",
|
|
1323
|
+
"tokens_before": tokens_before,
|
|
1324
|
+
"tokens_after": tokens_before,
|
|
1325
|
+
}
|
|
1326
|
+
|
|
1327
|
+
# Run compaction
|
|
1328
|
+
result = await self.compaction.compact(
|
|
1329
|
+
history,
|
|
1330
|
+
custom_instructions=custom_instructions,
|
|
1331
|
+
)
|
|
1332
|
+
|
|
1333
|
+
# Clear session and add summary as first message
|
|
1334
|
+
session.clear()
|
|
1335
|
+
session.add_message(
|
|
1336
|
+
"system",
|
|
1337
|
+
f"[Compacted conversation summary]\n\n{result.summary}"
|
|
1338
|
+
)
|
|
1339
|
+
session.metadata["last_compaction_summary"] = result.summary
|
|
1340
|
+
session.metadata["compaction_count"] = session.metadata.get("compaction_count", 0) + 1
|
|
1341
|
+
self.sessions.save(session)
|
|
1342
|
+
|
|
1343
|
+
return {
|
|
1344
|
+
"success": True,
|
|
1345
|
+
"message": f"Compacted {result.messages_removed} messages",
|
|
1346
|
+
"tokens_before": result.tokens_before,
|
|
1347
|
+
"tokens_after": result.tokens_after,
|
|
1348
|
+
"summary_preview": result.summary[:200] + "..." if len(result.summary) > 200 else result.summary,
|
|
1349
|
+
}
|