massgen 0.1.4__py3-none-any.whl → 0.1.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of massgen has been flagged as possibly problematic.

Files changed (84)
  1. massgen/__init__.py +1 -1
  2. massgen/backend/base_with_custom_tool_and_mcp.py +453 -23
  3. massgen/backend/capabilities.py +39 -0
  4. massgen/backend/chat_completions.py +111 -197
  5. massgen/backend/claude.py +210 -181
  6. massgen/backend/gemini.py +1015 -1559
  7. massgen/backend/grok.py +3 -2
  8. massgen/backend/response.py +160 -220
  9. massgen/chat_agent.py +340 -20
  10. massgen/cli.py +399 -25
  11. massgen/config_builder.py +20 -54
  12. massgen/config_validator.py +931 -0
  13. massgen/configs/README.md +95 -10
  14. massgen/configs/memory/gpt5mini_gemini_baseline_research_to_implementation.yaml +94 -0
  15. massgen/configs/memory/gpt5mini_gemini_context_window_management.yaml +187 -0
  16. massgen/configs/memory/gpt5mini_gemini_research_to_implementation.yaml +127 -0
  17. massgen/configs/memory/gpt5mini_high_reasoning_gemini.yaml +107 -0
  18. massgen/configs/memory/single_agent_compression_test.yaml +64 -0
  19. massgen/configs/tools/custom_tools/claude_code_custom_tool_with_mcp_example.yaml +1 -0
  20. massgen/configs/tools/custom_tools/claude_custom_tool_example_no_path.yaml +1 -1
  21. massgen/configs/tools/custom_tools/claude_custom_tool_with_mcp_example.yaml +1 -0
  22. massgen/configs/tools/custom_tools/computer_use_browser_example.yaml +1 -1
  23. massgen/configs/tools/custom_tools/computer_use_docker_example.yaml +1 -1
  24. massgen/configs/tools/custom_tools/gemini_custom_tool_with_mcp_example.yaml +1 -0
  25. massgen/configs/tools/custom_tools/gpt5_nano_custom_tool_with_mcp_example.yaml +1 -0
  26. massgen/configs/tools/custom_tools/gpt_oss_custom_tool_with_mcp_example.yaml +1 -0
  27. massgen/configs/tools/custom_tools/grok3_mini_custom_tool_with_mcp_example.yaml +1 -0
  28. massgen/configs/tools/custom_tools/interop/ag2_and_langgraph_lesson_planner.yaml +65 -0
  29. massgen/configs/tools/custom_tools/interop/ag2_and_openai_assistant_lesson_planner.yaml +65 -0
  30. massgen/configs/tools/custom_tools/interop/ag2_lesson_planner_example.yaml +48 -0
  31. massgen/configs/tools/custom_tools/interop/agentscope_lesson_planner_example.yaml +48 -0
  32. massgen/configs/tools/custom_tools/interop/langgraph_lesson_planner_example.yaml +49 -0
  33. massgen/configs/tools/custom_tools/interop/openai_assistant_lesson_planner_example.yaml +50 -0
  34. massgen/configs/tools/custom_tools/interop/smolagent_lesson_planner_example.yaml +49 -0
  35. massgen/configs/tools/custom_tools/qwen_api_custom_tool_with_mcp_example.yaml +1 -0
  36. massgen/configs/tools/custom_tools/two_models_with_tools_example.yaml +44 -0
  37. massgen/formatter/_gemini_formatter.py +61 -15
  38. massgen/memory/README.md +277 -0
  39. massgen/memory/__init__.py +26 -0
  40. massgen/memory/_base.py +193 -0
  41. massgen/memory/_compression.py +237 -0
  42. massgen/memory/_context_monitor.py +211 -0
  43. massgen/memory/_conversation.py +255 -0
  44. massgen/memory/_fact_extraction_prompts.py +333 -0
  45. massgen/memory/_mem0_adapters.py +257 -0
  46. massgen/memory/_persistent.py +687 -0
  47. massgen/memory/docker-compose.qdrant.yml +36 -0
  48. massgen/memory/docs/DESIGN.md +388 -0
  49. massgen/memory/docs/QUICKSTART.md +409 -0
  50. massgen/memory/docs/SUMMARY.md +319 -0
  51. massgen/memory/docs/agent_use_memory.md +408 -0
  52. massgen/memory/docs/orchestrator_use_memory.md +586 -0
  53. massgen/memory/examples.py +237 -0
  54. massgen/orchestrator.py +207 -7
  55. massgen/tests/memory/test_agent_compression.py +174 -0
  56. massgen/tests/memory/test_context_window_management.py +286 -0
  57. massgen/tests/memory/test_force_compression.py +154 -0
  58. massgen/tests/memory/test_simple_compression.py +147 -0
  59. massgen/tests/test_ag2_lesson_planner.py +223 -0
  60. massgen/tests/test_agent_memory.py +534 -0
  61. massgen/tests/test_config_validator.py +1156 -0
  62. massgen/tests/test_conversation_memory.py +382 -0
  63. massgen/tests/test_langgraph_lesson_planner.py +223 -0
  64. massgen/tests/test_orchestrator_memory.py +620 -0
  65. massgen/tests/test_persistent_memory.py +435 -0
  66. massgen/token_manager/token_manager.py +6 -0
  67. massgen/tool/__init__.py +2 -9
  68. massgen/tool/_decorators.py +52 -0
  69. massgen/tool/_extraframework_agents/ag2_lesson_planner_tool.py +251 -0
  70. massgen/tool/_extraframework_agents/agentscope_lesson_planner_tool.py +303 -0
  71. massgen/tool/_extraframework_agents/langgraph_lesson_planner_tool.py +275 -0
  72. massgen/tool/_extraframework_agents/openai_assistant_lesson_planner_tool.py +247 -0
  73. massgen/tool/_extraframework_agents/smolagent_lesson_planner_tool.py +180 -0
  74. massgen/tool/_manager.py +102 -16
  75. massgen/tool/_registered_tool.py +3 -0
  76. massgen/tool/_result.py +3 -0
  77. {massgen-0.1.4.dist-info → massgen-0.1.6.dist-info}/METADATA +138 -77
  78. {massgen-0.1.4.dist-info → massgen-0.1.6.dist-info}/RECORD +82 -37
  79. massgen/backend/gemini_mcp_manager.py +0 -545
  80. massgen/backend/gemini_trackers.py +0 -344
  81. {massgen-0.1.4.dist-info → massgen-0.1.6.dist-info}/WHEEL +0 -0
  82. {massgen-0.1.4.dist-info → massgen-0.1.6.dist-info}/entry_points.txt +0 -0
  83. {massgen-0.1.4.dist-info → massgen-0.1.6.dist-info}/licenses/LICENSE +0 -0
  84. {massgen-0.1.4.dist-info → massgen-0.1.6.dist-info}/top_level.txt +0 -0
massgen/backend/gemini.py CHANGED
@@ -19,10 +19,10 @@ TECHNICAL SOLUTION:
  - Maintains compatibility with existing MassGen workflow
  """

+ import asyncio
  import json
  import logging
  import os
- import time
  from typing import Any, AsyncGenerator, Dict, List, Optional

  from ..api_params_handler._gemini_api_params_handler import GeminiAPIParamsHandler
@@ -35,10 +35,12 @@ from ..logger_config import (
      logger,
  )
  from .base import FilesystemSupport, StreamChunk
- from .base_with_custom_tool_and_mcp import CustomToolAndMCPBackend
- from .gemini_mcp_manager import GeminiMCPManager
- from .gemini_trackers import MCPCallTracker, MCPResponseExtractor, MCPResponseTracker
- from .gemini_utils import CoordinationResponse
+ from .base_with_custom_tool_and_mcp import (
+     CustomToolAndMCPBackend,
+     CustomToolChunk,
+     ToolExecutionConfig,
+ )
+ from .gemini_utils import CoordinationResponse, PostEvaluationResponse


  # Suppress Gemini SDK logger warning about non-text parts in response
@@ -53,51 +55,31 @@ class NoFunctionCallWarning(logging.Filter):

  logging.getLogger("google_genai.types").addFilter(NoFunctionCallWarning())

- try:
-     from pydantic import BaseModel, Field
- except ImportError:
-     BaseModel = None
-     Field = None
-
  # MCP integration imports
  try:
      from ..mcp_tools import (
-         MCPClient,
-         MCPConfigurationError,
-         MCPConfigValidator,
          MCPConnectionError,
          MCPError,
          MCPServerError,
          MCPTimeoutError,
-         MCPValidationError,
      )
  except ImportError:  # MCP not installed or import failed within mcp_tools
-     MCPClient = None  # type: ignore[assignment]
      MCPError = ImportError  # type: ignore[assignment]
      MCPConnectionError = ImportError  # type: ignore[assignment]
-     MCPConfigValidator = None  # type: ignore[assignment]
-     MCPConfigurationError = ImportError  # type: ignore[assignment]
-     MCPValidationError = ImportError  # type: ignore[assignment]
      MCPTimeoutError = ImportError  # type: ignore[assignment]
      MCPServerError = ImportError  # type: ignore[assignment]

  # Import MCP backend utilities
  try:
      from ..mcp_tools.backend_utils import (
-         MCPCircuitBreakerManager,
-         MCPConfigHelper,
          MCPErrorHandler,
-         MCPExecutionManager,
          MCPMessageManager,
-         MCPSetupManager,
+         MCPResourceManager,
      )
  except ImportError:
      MCPErrorHandler = None  # type: ignore[assignment]
-     MCPSetupManager = None  # type: ignore[assignment]
      MCPMessageManager = None  # type: ignore[assignment]
-     MCPCircuitBreakerManager = None  # type: ignore[assignment]
-     MCPExecutionManager = None  # type: ignore[assignment]
-     MCPConfigHelper = None  # type: ignore[assignment]
+     MCPResourceManager = None  # type: ignore[assignment]


  def format_tool_response_as_json(response_text: str) -> str:
@@ -145,11 +127,8 @@ class GeminiBackend(CustomToolAndMCPBackend):
          self._mcp_tool_successes = 0
          self._mcp_connection_retries = 0

-         # MCP Response Extractor for capturing tool interactions (Gemini-specific)
-         self.mcp_extractor = MCPResponseExtractor()
-
-         # Initialize Gemini MCP manager after all attributes are ready
-         self.mcp_manager = GeminiMCPManager(self)
+         # Active tool result capture during manual tool execution
+         self._active_tool_result_store: Optional[Dict[str, str]] = None

      def _setup_permission_hooks(self):
          """Override base class - Gemini uses session-based permissions, not function hooks."""
@@ -166,10 +145,10 @@ class GeminiBackend(CustomToolAndMCPBackend):

      async def _setup_mcp_tools(self) -> None:
          """
-         Override parent class - Gemini uses GeminiMCPManager for MCP setup.
+         Override parent class - Use base class MCP setup for manual execution pattern.
          This method is called by the parent class's __aenter__() context manager.
          """
-         await self.mcp_manager.setup_mcp_tools(agent_id=self.agent_id)
+         await super()._setup_mcp_tools()

      def supports_upload_files(self) -> bool:
          """
@@ -178,13 +157,46 @@
          """
          return False

+     def _create_client(self, **kwargs):
+         pass
+
+     async def _stream_with_custom_and_mcp_tools(
+         self,
+         current_messages: List[Dict[str, Any]],
+         tools: List[Dict[str, Any]],
+         client,
+         **kwargs,
+     ) -> AsyncGenerator[StreamChunk, None]:
+         yield StreamChunk(type="error", error="Not implemented")
+
      async def stream_with_tools(self, messages: List[Dict[str, Any]], tools: List[Dict[str, Any]], **kwargs) -> AsyncGenerator[StreamChunk, None]:
-         """Stream response using Gemini API with structured output for coordination and MCP tool support."""
+         """Stream response using Gemini API with manual MCP execution pattern.
+
+         Tool Execution Behavior:
+         - Custom tools: Always executed (not blocked by planning mode or circuit breaker)
+         - MCP tools: Blocked by planning mode during coordination, blocked by circuit breaker when servers fail
+         - Provider tools (vote/new_answer): Emitted as StreamChunks but not executed (handled by orchestrator)
+         """
          # Use instance agent_id (from __init__) or get from kwargs if not set
          agent_id = self.agent_id or kwargs.get("agent_id", None)
          client = None
          stream = None

+         # Build execution context for tools (generic, not tool-specific)
+         # This is required for custom tool execution
+         from .base_with_custom_tool_and_mcp import ExecutionContext
+
+         self._execution_context = ExecutionContext(
+             messages=messages,
+             agent_system_message=kwargs.get("system_message", None),
+             agent_id=self.agent_id,
+             backend_name="gemini",
+             current_stage=self.coordination_stage,
+         )
+
+         # Track whether MCP tools were actually used in this turn
+         mcp_used = False
+
          log_backend_activity(
              "gemini",
              "Starting stream_with_tools",
@@ -192,7 +204,7 @@ class GeminiBackend(CustomToolAndMCPBackend):
              agent_id=agent_id,
          )

-         # Only trim when MCP tools will be used
+         # Trim message history for MCP if needed
          if self.mcp_servers and MCPMessageManager is not None and hasattr(self, "_max_mcp_message_history") and self._max_mcp_message_history > 0:
              original_count = len(messages)
              messages = MCPMessageManager.trim_message_history(messages, self._max_mcp_message_history)
@@ -210,29 +222,26 @@ class GeminiBackend(CustomToolAndMCPBackend):

          try:
              from google import genai
+             from google.genai import types

-             # Setup MCP with status streaming via manager if not already initialized
+             # Setup MCP using base class if not already initialized
              if not self._mcp_initialized and self.mcp_servers:
-                 async for chunk in self.mcp_manager.setup_mcp_with_status_stream(agent_id):
-                     yield chunk
-             elif not self._mcp_initialized:
-                 # Setup MCP without streaming for backward compatibility
-                 await self.mcp_manager.setup_mcp_tools(agent_id)
+                 await self._setup_mcp_tools()
+                 if self._mcp_initialized:
+                     yield StreamChunk(
+                         type="mcp_status",
+                         status="mcp_initialized",
+                         content="✅ [MCP] Tools initialized",
+                         source="mcp_tools",
+                     )

-             # Merge constructor config with stream kwargs (stream kwargs take priority)
+             # Merge constructor config with stream kwargs
              all_params = {**self.config, **kwargs}

-             # Extract framework-specific parameters
-             all_params.get("enable_web_search", False)
-             enable_code_execution = all_params.get("enable_code_execution", False)
-
-             # Always use SDK MCP sessions when mcp_servers are configured
-             using_sdk_mcp = bool(self.mcp_servers)
-
-             # Custom tool handling - add custom tools if any
+             # Detect custom tools
              using_custom_tools = bool(self.custom_tool_manager and len(self._custom_tool_names) > 0)

-             # Analyze tool types
+             # Detect coordination mode
              is_coordination = self.formatter.has_coordination_tools(tools)
              is_post_evaluation = self.formatter.has_post_evaluation_tools(tools)

@@ -258,1355 +267,502 @@ class GeminiBackend(CustomToolAndMCPBackend):
                  # For post-evaluation, modify prompt to use structured output
                  full_content = self.formatter.build_post_evaluation_prompt(full_content)

-             # Use google-genai package
+             # Create Gemini client
              client = genai.Client(api_key=self.api_key)

-             # Setup builtin tools via API params handler (SDK Tool objects)
+             # Setup builtin tools via API params handler
              builtin_tools = self.api_params_handler.get_provider_tools(all_params)
-             # Build config via API params handler (maps params, excludes backend-managed ones)
+
+             # Build config via API params handler
              config = await self.api_params_handler.build_api_params(messages, tools, all_params)
-             # Extract model name (not included in config)
+
+             # Extract model name
              model_name = all_params.get("model")

-             # Setup tools configuration (builtins only when not using sessions)
-             all_tools = []
-
-             # Branch 1: SDK auto-calling via MCP sessions (reuse existing MCPClient sessions)
-             if using_sdk_mcp and self.mcp_servers:
-                 if not self._mcp_client or not getattr(self._mcp_client, "is_connected", lambda: False)():
-                     mcp_connected, status_chunks = await self.mcp_manager.setup_mcp_sessions_with_retry(agent_id, max_retries=5)
-                     async for chunk in status_chunks:
-                         yield chunk
-                     if not mcp_connected:
-                         using_sdk_mcp = False
-                         self._mcp_client = None
-
-             if not using_sdk_mcp and not using_custom_tools:
-                 all_tools.extend(builtin_tools)
-             if all_tools:
-                 config["tools"] = all_tools
-
-             # For coordination requests, use JSON response format (may conflict with tools/sessions)
-             if is_coordination:
-                 # Only request JSON schema when no tools are present
-                 if (not using_sdk_mcp) and (not using_custom_tools) and (not all_tools):
-                     config["response_mime_type"] = "application/json"
-                     config["response_schema"] = CoordinationResponse.model_json_schema()
-                 else:
-                     # Tools or sessions are present; fallback to text parsing
-                     pass
-             elif is_post_evaluation:
-                 # For post-evaluation, use JSON response format for structured decisions
-                 from .gemini_utils import PostEvaluationResponse
+             # ====================================================================
+             # Tool Registration Phase: Convert and register tools for manual execution
+             # ====================================================================
+             tools_to_apply = []

-                 if (not using_sdk_mcp) and (not using_custom_tools) and (not all_tools):
-                     config["response_mime_type"] = "application/json"
-                     config["response_schema"] = PostEvaluationResponse.model_json_schema()
-                 else:
-                     # Tools or sessions are present; fallback to text parsing
-                     pass
-             # Log messages being sent after builtin_tools is defined
-             log_backend_agent_message(
-                 agent_id or "default",
-                 "SEND",
-                 {
-                     "content": full_content,
-                     "builtin_tools": len(builtin_tools) if builtin_tools else 0,
-                 },
-                 backend_name="gemini",
-             )
-
-             # Use streaming for real-time response
-             full_content_text = ""
-             final_response = None
-             # Buffer the last response chunk that contains candidate metadata so we can
-             # inspect builtin tool usage (grounding/code execution) after streaming
-             last_response_with_candidates = None
-             if (using_sdk_mcp and self.mcp_servers) or using_custom_tools:
-                 # Process MCP and/or custom tools
+             # Add custom tools if available
+             if using_custom_tools:
                  try:
-                     # ====================================================================
-                     # Preparation phase: Initialize MCP and custom tools
-                     # ====================================================================
-                     mcp_sessions = []
-                     mcp_error = None
-                     custom_tools_functions = []
-                     custom_tools_error = None
-
-                     # Try to initialize MCP sessions
-                     if using_sdk_mcp and self.mcp_servers:
-                         try:
-                             if not self._mcp_client:
-                                 raise RuntimeError("MCP client not initialized")
-                             mcp_sessions = self.mcp_manager.get_active_mcp_sessions(
-                                 convert_to_permission_sessions=bool(self.filesystem_manager),
-                             )
-                             if not mcp_sessions:
-                                 # If no MCP sessions, record error but don't interrupt (may still have custom tools)
-                                 mcp_error = RuntimeError("No active MCP sessions available")
-                                 logger.warning(f"[Gemini] MCP sessions unavailable: {mcp_error}")
-                         except Exception as e:
-                             mcp_error = e
-                             logger.warning(f"[Gemini] Failed to initialize MCP sessions: {e}")
-
-                     # Try to initialize custom tools
-                     if using_custom_tools:
-                         try:
-                             # Get custom tools schemas (in OpenAI format)
-                             custom_tools_schemas = self._get_custom_tools_schemas()
-                             if custom_tools_schemas:
-                                 # Convert to Gemini SDK format using formatter
-                                 # formatter handles: OpenAI format -> Gemini dict -> FunctionDeclaration objects
-                                 custom_tools_functions = self.formatter.format_custom_tools(
-                                     custom_tools_schemas,
-                                     return_sdk_objects=True,
-                                 )
-
-                                 if custom_tools_functions:
-                                     logger.debug(
-                                         f"[Gemini] Loaded {len(custom_tools_functions)} custom tools " f"as FunctionDeclarations",
-                                     )
-                                 else:
-                                     custom_tools_error = RuntimeError("Custom tools conversion failed")
-                                     logger.warning(f"[Gemini] Custom tools unavailable: {custom_tools_error}")
-                             else:
-                                 custom_tools_error = RuntimeError("No custom tools available")
-                                 logger.warning(f"[Gemini] Custom tools unavailable: {custom_tools_error}")
-                         except Exception as e:
-                             custom_tools_error = e
-                             logger.warning(f"[Gemini] Failed to initialize custom tools: {e}")
-
-                     # Check if at least one tool system is available
-                     has_mcp = bool(mcp_sessions and not mcp_error)
-                     has_custom_tools = bool(custom_tools_functions and not custom_tools_error)
-
-                     if not has_mcp and not has_custom_tools:
-                         # Both failed, raise error to enter fallback
-                         raise RuntimeError(
-                             f"Both MCP and custom tools unavailable. " f"MCP error: {mcp_error}. Custom tools error: {custom_tools_error}",
+                     # Get custom tools schemas (in OpenAI format)
+                     custom_tools_schemas = self._get_custom_tools_schemas()
+                     if custom_tools_schemas:
+                         # Convert to Gemini SDK format using formatter
+                         custom_tools_functions = self.formatter.format_custom_tools(
+                             custom_tools_schemas,
+                             return_sdk_objects=True,
                          )

-                     # ====================================================================
-                     # Configuration phase: Build session_config
-                     # ====================================================================
-                     session_config = dict(config)
-
-                     # Collect all available tool information
-                     available_mcp_tools = []
-                     if has_mcp and self._mcp_client:
-                         available_mcp_tools = list(self._mcp_client.tools.keys())
-
-                     available_custom_tool_names = list(self._custom_tool_names) if has_custom_tools else []
-
-                     # Apply tools to config
-                     tools_to_apply = []
-                     sessions_applied = False
-                     custom_tools_applied = False
-
-                     # Add MCP sessions (if available and not blocked by planning mode)
-                     if has_mcp:
-                         if not self.mcp_manager.should_block_mcp_tools_in_planning_mode(
-                             self.is_planning_mode_enabled(),
-                             available_mcp_tools,
-                         ):
-                             logger.debug(
-                                 f"[Gemini] Passing {len(mcp_sessions)} MCP sessions to SDK: " f"{[type(s).__name__ for s in mcp_sessions]}",
-                             )
-                             tools_to_apply.extend(mcp_sessions)
-                             sessions_applied = True
-
-                         if self.is_planning_mode_enabled():
-                             blocked_tools = self.get_planning_mode_blocked_tools()
-
-                             if not blocked_tools:
-                                 # Empty set means block ALL MCP tools (backward compatible)
-                                 logger.info("[Gemini] Planning mode enabled - blocking ALL MCP tools during coordination")
-                                 # Don't set tools at all - this prevents any MCP tool execution
-                                 log_backend_activity(
-                                     "gemini",
-                                     "All MCP tools blocked in planning mode",
-                                     {
-                                         "blocked_tools": len(available_mcp_tools),
-                                         "session_count": len(mcp_sessions),
-                                     },
-                                     agent_id=agent_id,
-                                 )
-                             else:
-                                 # Selective blocking - allow non-blocked tools to be called
-                                 # The execution layer (_execute_mcp_function_with_retry) will enforce blocking
-                                 # but we still register all tools so non-blocked ones can be used
-                                 logger.info(f"[Gemini] Planning mode enabled - allowing non-blocked MCP tools, blocking {len(blocked_tools)} specific tools")
-
-                                 # Pass all sessions - the backend's is_mcp_tool_blocked() will handle selective blocking
-                                 session_config["tools"] = mcp_sessions
-
-                                 log_backend_activity(
-                                     "gemini",
-                                     "Selective MCP tools blocked in planning mode",
-                                     {
-                                         "total_tools": len(available_mcp_tools),
-                                         "blocked_tools": len(blocked_tools),
-                                         "allowed_tools": len(available_mcp_tools) - len(blocked_tools),
-                                     },
-                                     agent_id=agent_id,
-                                 )
-
-                     # Add custom tools (if available)
-                     if has_custom_tools:
-                         # Wrap FunctionDeclarations in a Tool object for Gemini SDK
-                         try:
-                             from google.genai import types
-
-                             # Create a Tool object containing all custom function declarations
+                         if custom_tools_functions:
+                             # Wrap FunctionDeclarations in a Tool object for Gemini SDK
                              custom_tool = types.Tool(function_declarations=custom_tools_functions)
-
-                             logger.debug(
-                                 f"[Gemini] Wrapped {len(custom_tools_functions)} custom tools " f"in Tool object for SDK",
-                             )
                              tools_to_apply.append(custom_tool)
-                             custom_tools_applied = True
-                         except Exception as e:
-                             logger.error(f"[Gemini] Failed to wrap custom tools in Tool object: {e}")
-                             custom_tools_error = e
-
-                     # Apply tool configuration
-                     if tools_to_apply:
-                         session_config["tools"] = tools_to_apply

-                         # Disable automatic function calling for custom tools
-                         # MassGen uses declarative mode: SDK should return function call requests
-                         # instead of automatically executing them
-                         if has_custom_tools:
-                             from google.genai import types
+                             logger.debug(f"[Gemini] Registered {len(custom_tools_functions)} custom tools for manual execution")

-                             session_config["automatic_function_calling"] = types.AutomaticFunctionCallingConfig(
-                                 disable=True,
+                             yield StreamChunk(
+                                 type="custom_tool_status",
+                                 status="custom_tools_registered",
+                                 content=f"🔧 [Custom Tools] Registered {len(custom_tools_functions)} tools",
+                                 source="custom_tools",
                              )
-                             logger.debug("[Gemini] Disabled automatic function calling for custom tools")
-
-                     # ====================================================================
-                     # Logging and status output
-                     # ====================================================================
-                     if sessions_applied:
-                         # Track MCP tool usage attempt
-                         self._mcp_tool_calls_count += 1
-
-                         log_backend_activity(
-                             "gemini",
-                             "MCP tool call initiated",
-                             {
-                                 "call_number": self._mcp_tool_calls_count,
-                                 "session_count": len(mcp_sessions),
-                                 "available_tools": available_mcp_tools[:],
-                                 "total_tools": len(available_mcp_tools),
-                             },
-                             agent_id=agent_id,
-                         )
+                 except Exception as e:
+                     logger.warning(f"[Gemini] Failed to register custom tools: {e}")

-                         log_tool_call(
-                             agent_id,
-                             "mcp_session_tools",
-                             {
-                                 "session_count": len(mcp_sessions),
-                                 "call_number": self._mcp_tool_calls_count,
-                                 "available_tools": available_mcp_tools,
-                             },
-                             backend_name="gemini",
-                         )
+             # Add MCP tools if available (unless blocked by planning mode)
+             if self._mcp_initialized and self._mcp_functions:
+                 # Check planning mode
+                 if self.is_planning_mode_enabled():
+                     blocked_tools = self.get_planning_mode_blocked_tools()

-                         tools_info = f" ({len(available_mcp_tools)} tools available)" if available_mcp_tools else ""
+                     if not blocked_tools:
+                         # Empty set means block ALL MCP tools (backward compatible)
+                         logger.info("[Gemini] Planning mode enabled - blocking ALL MCP tools during coordination")
                          yield StreamChunk(
                              type="mcp_status",
-                             status="mcp_tools_initiated",
-                             content=f"MCP tool call initiated (call #{self._mcp_tool_calls_count}){tools_info}: {', '.join(available_mcp_tools[:5])}{'...' if len(available_mcp_tools) > 5 else ''}",
-                             source="mcp_tools",
+                             status="planning_mode_blocked",
+                             content="🚫 [MCP] Planning mode active - all MCP tools blocked during coordination",
+                             source="planning_mode",
                          )

-                     if custom_tools_applied:
-                         # Track custom tool usage attempt
-                         log_backend_activity(
-                             "gemini",
-                             "Custom tools initiated",
-                             {
-                                 "tool_count": len(custom_tools_functions),
-                                 "available_tools": available_custom_tool_names,
-                             },
-                             agent_id=agent_id,
-                         )
+                     else:
+                         # Selective blocking - register all MCP tools, execution layer will block specific ones
+                         logger.info(f"[Gemini] Planning mode enabled - registering all MCP tools, will block {len(blocked_tools)} at execution")
+                         try:
+                             # Convert MCP tools using formatter
+                             mcp_tools_functions = self.formatter.format_mcp_tools(self._mcp_functions, return_sdk_objects=True)

-                         tools_preview = ", ".join(available_custom_tool_names[:5])
-                         tools_suffix = "..." if len(available_custom_tool_names) > 5 else ""
-                         yield StreamChunk(
-                             type="custom_tool_status",
-                             status="custom_tools_initiated",
-                             content=f"Custom tools initiated ({len(custom_tools_functions)} tools available): {tools_preview}{tools_suffix}",
-                             source="custom_tools",
-                         )
+                             if mcp_tools_functions:
+                                 # Wrap in Tool object
+                                 mcp_tool = types.Tool(function_declarations=mcp_tools_functions)
+                                 tools_to_apply.append(mcp_tool)

-                     # ====================================================================
-                     # Streaming phase
-                     # ====================================================================
-                     # Use async streaming call with sessions/tools
-                     stream = await client.aio.models.generate_content_stream(
-                         model=model_name,
-                         contents=full_content,
-                         config=session_config,
-                     )
+                                 # Mark MCP as used since tools are registered (even with selective blocking)
+                                 mcp_used = True

-                     # Initialize trackers for both MCP and custom tools
-                     mcp_tracker = MCPCallTracker()
-                     mcp_response_tracker = MCPResponseTracker()
-                     custom_tracker = MCPCallTracker()  # Reuse MCPCallTracker for custom tools
-                     custom_response_tracker = MCPResponseTracker()  # Reuse for custom tools
+                                 logger.debug(f"[Gemini] Registered {len(mcp_tools_functions)} MCP tools for selective blocking")

-                     mcp_tools_used = []  # Keep for backward compatibility
-                     custom_tools_used = []  # Track custom tool usage
+                                 yield StreamChunk(
+                                     type="mcp_status",
+                                     status="mcp_tools_registered",
+                                     content=f"🔧 [MCP] Registered {len(mcp_tools_functions)} tools (selective blocking enabled)",
+                                     source="mcp_tools",
+                                 )
+                         except Exception as e:
+                             logger.warning(f"[Gemini] Failed to register MCP tools: {e}")
+                 else:
+                     # No planning mode - register all MCP tools
+                     try:
+                         # Convert MCP tools using formatter
+                         mcp_tools_functions = self.formatter.format_mcp_tools(self._mcp_functions, return_sdk_objects=True)
+
+                         if mcp_tools_functions:
+                             # Wrap in Tool object
+                             mcp_tool = types.Tool(function_declarations=mcp_tools_functions)
+                             tools_to_apply.append(mcp_tool)
+
+                             # Mark MCP as used since tools are registered
+                             mcp_used = True
+
+                             logger.debug(f"[Gemini] Registered {len(mcp_tools_functions)} MCP tools for manual execution")
+
+                             yield StreamChunk(
+                                 type="mcp_status",
+                                 status="mcp_tools_registered",
+                                 content=f"🔧 [MCP] Registered {len(mcp_tools_functions)} tools",
+                                 source="mcp_tools",
+                             )
+                     except Exception as e:
+                         logger.warning(f"[Gemini] Failed to register MCP tools: {e}")
+
+             # Apply tools to config
+             if tools_to_apply:
+                 config["tools"] = tools_to_apply
+                 # Disable automatic function calling for manual execution
+                 config["automatic_function_calling"] = types.AutomaticFunctionCallingConfig(disable=True)
+                 logger.debug("[Gemini] Disabled automatic function calling for manual execution")
+             else:
+                 # No custom/MCP tools, add builtin tools if any
+                 if builtin_tools:
+                     config["tools"] = builtin_tools

-                     # Iterate over the asynchronous stream to get chunks as they arrive
-                     async for chunk in stream:
-                         # ============================================
-                         # 1. Process function calls/responses
-                         # ============================================
+             # For coordination/post-evaluation requests, use JSON response format when no tools present
+             if not tools_to_apply and not builtin_tools:
+                 if is_coordination:
+                     config["response_mime_type"] = "application/json"
+                     config["response_schema"] = CoordinationResponse.model_json_schema()
+                 elif is_post_evaluation:
+                     config["response_mime_type"] = "application/json"
+                     config["response_schema"] = PostEvaluationResponse.model_json_schema()

-                         # First check for function calls in the current chunk's candidates
-                         # (this is where custom tool calls appear, not in automatic_function_calling_history)
-                         if hasattr(chunk, "candidates") and chunk.candidates:
-                             for candidate in chunk.candidates:
-                                 if hasattr(candidate, "content") and candidate.content:
-                                     if hasattr(candidate.content, "parts") and candidate.content.parts:
-                                         for part in candidate.content.parts:
-                                             # Check for function_call part
-                                             if hasattr(part, "function_call") and part.function_call:
-                                                 # Extract call data
-                                                 call_data = self.mcp_extractor.extract_function_call(part.function_call)
-
-                                                 if call_data:
-                                                     tool_name = call_data["name"]
-                                                     tool_args = call_data["arguments"]
-
-                                                     # DEBUG: Log tool matching
-                                                     logger.info(f"🔍 [DEBUG] Function call detected: tool_name='{tool_name}'")
-                                                     logger.info(f"🔍 [DEBUG] Available MCP tools: {available_mcp_tools}")
-                                                     logger.info(f"🔍 [DEBUG] Available custom tools: {list(self._custom_tool_names) if has_custom_tools else []}")
-
-                                                     # Determine if it's MCP tool or custom tool
-                                                     # MCP tools may come from SDK without prefix, so we need to check both:
-                                                     # 1. Direct match (tool_name in list)
-                                                     # 2. Prefixed match (mcp__server__tool_name in list)
-                                                     is_mcp_tool = False
-                                                     if has_mcp:
-                                                         # Direct match
-                                                         if tool_name in available_mcp_tools:
-                                                             is_mcp_tool = True
-                                                         else:
-                                                             # Try matching with MCP prefix format: mcp__<server>__<tool>
-                                                             # Check if any available MCP tool ends with the current tool_name
-                                                             for mcp_tool in available_mcp_tools:
-                                                                 # Format: mcp__server__toolname
-                                                                 if mcp_tool.startswith("mcp__") and mcp_tool.endswith(f"__{tool_name}"):
-                                                                     is_mcp_tool = True
-                                                                     logger.info(f"🔍 [DEBUG] Matched MCP tool: {tool_name} -> {mcp_tool}")
-                                                                     break
-
-                                                     is_custom_tool = has_custom_tools and tool_name in self._custom_tool_names
-
-                                                     logger.info(f"🔍 [DEBUG] Tool matching result: is_mcp_tool={is_mcp_tool}, is_custom_tool={is_custom_tool}")
-
-                                                     if is_custom_tool:
-                                                         # Process custom tool call
-                                                         if custom_tracker.is_new_call(tool_name, tool_args):
-                                                             call_record = custom_tracker.add_call(tool_name, tool_args)
-
-                                                             custom_tools_used.append(
-                                                                 {
-                                                                     "name": tool_name,
-                                                                     "arguments": tool_args,
-                                                                     "timestamp": call_record["timestamp"],
-                                                                 },
-                                                             )
-
-                                                             timestamp_str = time.strftime(
-                                                                 "%H:%M:%S",
-                                                                 time.localtime(call_record["timestamp"]),
-                                                             )
-
-                                                             yield StreamChunk(
-                                                                 type="custom_tool_status",
-                                                                 status="custom_tool_called",
-                                                                 content=f"🔧 Custom Tool Called: {tool_name} at {timestamp_str} with args: {json.dumps(tool_args, indent=2)}",
-                                                                 source="custom_tools",
-                                                             )
-
-                                                             log_tool_call(
-                                                                 agent_id,
-                                                                 tool_name,
-                                                                 tool_args,
-                                                                 backend_name="gemini",
-                                                             )
-                                                     elif is_mcp_tool:
-                                                         # Process MCP tool call
-                                                         if mcp_tracker.is_new_call(tool_name, tool_args):
-                                                             call_record = mcp_tracker.add_call(tool_name, tool_args)
-
-                                                             mcp_tools_used.append(
-                                                                 {
-                                                                     "name": tool_name,
-                                                                     "arguments": tool_args,
-                                                                     "timestamp": call_record["timestamp"],
-                                                                 },
-                                                             )
-
-                                                             timestamp_str = time.strftime(
-                                                                 "%H:%M:%S",
-                                                                 time.localtime(call_record["timestamp"]),
-                                                             )
-
-                                                             yield StreamChunk(
-                                                                 type="mcp_status",
-                                                                 status="mcp_tool_called",
-                                                                 content=f"🔧 MCP Tool Called: {tool_name} at {timestamp_str} with args: {json.dumps(tool_args, indent=2)}",
-                                                                 source="mcp_tools",
-                                                             )
-
-                                                             log_tool_call(
-                                                                 agent_id,
-                                                                 tool_name,
-                                                                 tool_args,
-                                                                 backend_name="gemini",
-                                                             )
-
-                         # Then check automatic_function_calling_history (for MCP tools that were auto-executed)
-                         if hasattr(chunk, "automatic_function_calling_history") and chunk.automatic_function_calling_history:
-                             for history_item in chunk.automatic_function_calling_history:
-                                 if hasattr(history_item, "parts") and history_item.parts is not None:
-                                     for part in history_item.parts:
-                                         # Check for function_call part
-                                         if hasattr(part, "function_call") and part.function_call:
-                                             # Use MCPResponseExtractor to extract call data
-                                             call_data = self.mcp_extractor.extract_function_call(part.function_call)
-
-                                             if call_data:
-                                                 tool_name = call_data["name"]
-                                                 tool_args = call_data["arguments"]
-
-                                                 # DEBUG: Log tool matching (from automatic_function_calling_history)
-                                                 logger.info(f"🔍 [DEBUG-AUTO] Function call in history: tool_name='{tool_name}'")
-                                                 logger.info(f"🔍 [DEBUG-AUTO] Available MCP tools: {available_mcp_tools}")
-                                                 logger.info(f"🔍 [DEBUG-AUTO] Available custom tools: {list(self._custom_tool_names) if has_custom_tools else []}")
-
-                                                 # Determine if it's MCP tool or custom tool
-                                                 # MCP tools may come from SDK without prefix, so we need to check both
-                                                 is_mcp_tool = False
-                                                 if has_mcp:
-                                                     if tool_name in available_mcp_tools:
-                                                         is_mcp_tool = True
-                                                     else:
-                                                         # Try matching with MCP prefix format
-                                                         for mcp_tool in available_mcp_tools:
-                                                             if mcp_tool.startswith("mcp__") and mcp_tool.endswith(f"__{tool_name}"):
-                                                                 is_mcp_tool = True
-                                                                 logger.info(f"🔍 [DEBUG-AUTO] Matched MCP tool: {tool_name} -> {mcp_tool}")
-                                                                 break
-
-                                                 is_custom_tool = has_custom_tools and tool_name in self._custom_tool_names
-
-                                                 logger.info(f"🔍 [DEBUG-AUTO] Tool matching result: is_mcp_tool={is_mcp_tool}, is_custom_tool={is_custom_tool}")
-
-                                                 if is_mcp_tool:
-                                                     # Process MCP tool call
-                                                     if mcp_tracker.is_new_call(tool_name, tool_args):
-                                                         call_record = mcp_tracker.add_call(tool_name, tool_args)
-
-                                                         mcp_tools_used.append(
-                                                             {
-                                                                 "name": tool_name,
-                                                                 "arguments": tool_args,
-                                                                 "timestamp": call_record["timestamp"],
-                                                             },
-                                                         )
-
-                                                         timestamp_str = time.strftime(
-                                                             "%H:%M:%S",
-                                                             time.localtime(call_record["timestamp"]),
-                                                         )
-
-                                                         yield StreamChunk(
-                                                             type="mcp_status",
-                                                             status="mcp_tool_called",
-                                                             content=f"🔧 MCP Tool Called: {tool_name} at {timestamp_str} with args: {json.dumps(tool_args, indent=2)}",
-                                                             source="mcp_tools",
-                                                         )
-
-                                                         log_tool_call(
-                                                             agent_id,
-                                                             tool_name,
-                                                             tool_args,
-                                                             backend_name="gemini",
-                                                         )
-
-                                                 elif is_custom_tool:
-                                                     # Process custom tool call
-                                                     if custom_tracker.is_new_call(tool_name, tool_args):
-                                                         call_record = custom_tracker.add_call(tool_name, tool_args)
-
-                                                         custom_tools_used.append(
-                                                             {
-                                                                 "name": tool_name,
-                                                                 "arguments": tool_args,
-                                                                 "timestamp": call_record["timestamp"],
-                                                             },
-                                                         )
-
-                                                         timestamp_str = time.strftime(
-                                                             "%H:%M:%S",
-                                                             time.localtime(call_record["timestamp"]),
-                                                         )
-
-                                                         yield StreamChunk(
-                                                             type="custom_tool_status",
-                                                             status="custom_tool_called",
-                                                             content=f"🔧 Custom Tool Called: {tool_name} at {timestamp_str} with args: {json.dumps(tool_args, indent=2)}",
-                                                             source="custom_tools",
-                                                         )
-
-                                                         log_tool_call(
-                                                             agent_id,
-                                                             tool_name,
-                                                             tool_args,
-                                                             backend_name="gemini",
-                                                         )
-
-                                         # Check for function_response part
-                                         elif hasattr(part, "function_response") and part.function_response:
-                                             response_data = self.mcp_extractor.extract_function_response(part.function_response)
-
-                                             if response_data:
-                                                 tool_name = response_data["name"]
-                                                 tool_response = response_data["response"]
-
-                                                 # Determine if it's MCP tool or custom tool
-                                                 # MCP tools may come from SDK without prefix
-                                                 is_mcp_tool = False
-                                                 if has_mcp:
-                                                     if tool_name in available_mcp_tools:
-                                                         is_mcp_tool = True
-                                                     else:
-                                                         # Try matching with MCP prefix format
-                                                         for mcp_tool in available_mcp_tools:
-                                                             if mcp_tool.startswith("mcp__") and mcp_tool.endswith(f"__{tool_name}"):
-                                                                 is_mcp_tool = True
-                                                                 break
-
-                                                 is_custom_tool = has_custom_tools and tool_name in self._custom_tool_names
-
-                                                 if is_mcp_tool:
-                                                     # Process MCP tool response
-                                                     if mcp_response_tracker.is_new_response(tool_name, tool_response):
-                                                         response_record = mcp_response_tracker.add_response(tool_name, tool_response)
-
-                                                         # Extract text content from CallToolResult
-                                                         response_text = None
-                                                         if isinstance(tool_response, dict) and "result" in tool_response:
-                                                             result = tool_response["result"]
-                                                             if hasattr(result, "content") and result.content:
-                                                                 first_content = result.content[0]
-                                                                 if hasattr(first_content, "text"):
-                                                                     response_text = first_content.text
-
-                                                         if response_text is None:
-                                                             response_text = str(tool_response)
-
-                                                         timestamp_str = time.strftime(
-                                                             "%H:%M:%S",
-                                                             time.localtime(response_record["timestamp"]),
-                                                         )
-
-                                                         # Format response as JSON if possible
-                                                         formatted_response = format_tool_response_as_json(response_text)
-
-                                                         yield StreamChunk(
-                                                             type="mcp_status",
-                                                             status="mcp_tool_response",
-                                                             content=f"✅ MCP Tool Response from {tool_name} at {timestamp_str}: {formatted_response}",
-                                                             source="mcp_tools",
-                                                         )
-
-                                                         log_backend_activity(
-                                                             "gemini",
-                                                             "MCP tool response received",
-                                                             {
-                                                                 "tool_name": tool_name,
-                                                                 "response_preview": str(tool_response)[:],
-                                                             },
-                                                             agent_id=agent_id,
-                                                         )
-
-                                                 elif is_custom_tool:
-                                                     # Process custom tool response
-                                                     if custom_response_tracker.is_new_response(tool_name, tool_response):
-                                                         response_record = custom_response_tracker.add_response(tool_name, tool_response)
-
-                                                         # Extract text from response
-                                                         response_text = str(tool_response)
-
-                                                         timestamp_str = time.strftime(
-                                                             "%H:%M:%S",
-                                                             time.localtime(response_record["timestamp"]),
-                                                         )
-
-                                                         # Format response as JSON if possible
-                                                         formatted_response = format_tool_response_as_json(response_text)
-
-                                                         yield StreamChunk(
-                                                             type="custom_tool_status",
-                                                             status="custom_tool_response",
-                                                             content=f"✅ Custom Tool Response from {tool_name} at {timestamp_str}: {formatted_response}",
-                                                             source="custom_tools",
-                                                         )
-
-                                                         log_backend_activity(
-                                                             "gemini",
-                                                             "Custom tool response received",
-                                                             {
-                                                                 "tool_name": tool_name,
-                                                                 "response_preview": str(tool_response),
-                                                             },
-                                                             agent_id=agent_id,
-                                                         )
-
-                         # ============================================
-                         # 2. Process text content
-                         # ============================================
-                         if hasattr(chunk, "text") and chunk.text:
-                             chunk_text = chunk.text
-                             full_content_text += chunk_text
-                             log_backend_agent_message(
-                                 agent_id,
-                                 "RECV",
-                                 {"content": chunk_text},
-                                 backend_name="gemini",
-                             )
-                             log_stream_chunk("backend.gemini", "content", chunk_text, agent_id)
-                             yield StreamChunk(type="content", content=chunk_text)
+             # Log messages being sent
+             log_backend_agent_message(
+                 agent_id or "default",
+                 "SEND",
+                 {
+                     "content": full_content,
+                     "custom_tools": len(tools_to_apply) if tools_to_apply else 0,
+                 },
+                 backend_name="gemini",
+             )

-                         # ============================================
-                         # 3. Buffer last chunk with candidates
-                         # ============================================
-                         if hasattr(chunk, "candidates") and chunk.candidates:
-                             last_response_with_candidates = chunk
-
-                     # Reset stream tracking
-                     if hasattr(self, "_mcp_stream_started"):
-                         delattr(self, "_mcp_stream_started")
-
-                     # ====================================================================
-                     # Tool execution loop: Execute tools until model stops calling them
-                     # ====================================================================
-                     # Note: When automatic_function_calling is disabled, BOTH custom and MCP tools
-                     # need to be manually executed. The model may make multiple rounds of tool calls
-                     # (e.g., call custom tool first, then MCP tool after seeing the result).
-
-                     executed_tool_calls = set()  # Track which tools we've already executed
-                     max_tool_rounds = 10  # Prevent infinite loops
-                     tool_round = 0
-
-                     while tool_round < max_tool_rounds:
-                         # Find new tool calls that haven't been executed yet
-                         new_custom_tools = []
-                         new_mcp_tools = []
-
-                         for tool_call in custom_tools_used:
-                             call_signature = f"custom_{tool_call['name']}_{json.dumps(tool_call['arguments'], sort_keys=True)}"
-                             if call_signature not in executed_tool_calls:
-                                 new_custom_tools.append(tool_call)
-                                 executed_tool_calls.add(call_signature)
-
-                         for tool_call in mcp_tools_used:
-                             call_signature = f"mcp_{tool_call['name']}_{json.dumps(tool_call['arguments'], sort_keys=True)}"
-                             if call_signature not in executed_tool_calls:
-                                 new_mcp_tools.append(tool_call)
-                                 executed_tool_calls.add(call_signature)
-
-                         # If no new tools to execute, break the loop
-                         if not new_custom_tools and not new_mcp_tools:
-                             break
+             # ====================================================================
+             # Streaming Phase: Stream with simple function call detection
+             # ====================================================================
+             stream = await client.aio.models.generate_content_stream(
+                 model=model_name,
+                 contents=full_content,
+                 config=config,
+             )

-                         tool_round += 1
-                         logger.debug(f"[Gemini] Tool execution round {tool_round}: {len(new_custom_tools)} custom, {len(new_mcp_tools)} MCP")
+             # Simple list accumulation for function calls (no trackers)
+             captured_function_calls = []
+             full_content_text = ""
+             last_response_with_candidates = None

-                         # Execute tools and collect results for this round
-                         tool_responses = []
+             # Stream chunks and capture function calls
+             async for chunk in stream:
+                 # Detect function calls in candidates
+                 if hasattr(chunk, "candidates") and chunk.candidates:
+                     for candidate in chunk.candidates:
+                         if hasattr(candidate, "content") and candidate.content:
+                             if hasattr(candidate.content, "parts") and candidate.content.parts:
+                                 for part in candidate.content.parts:
+                                     # Check for function_call part
+                                     if hasattr(part, "function_call") and part.function_call:
+                                         # Extract call data
+                                         tool_name = part.function_call.name
+                                         tool_args = dict(part.function_call.args) if part.function_call.args else {}
+
+                                         # Create call record
+                                         call_id = f"call_{len(captured_function_calls)}"
+                                         captured_function_calls.append(
+                                             {
+                                                 "call_id": call_id,
+                                                 "name": tool_name,
+                                                 "arguments": json.dumps(tool_args),
+                                             },
+                                         )
+
+                                         logger.info(f"[Gemini] Function call detected: {tool_name}")
+
+                 # Process text content
+                 if hasattr(chunk, "text") and chunk.text:
+                     chunk_text = chunk.text
+                     full_content_text += chunk_text
+                     log_backend_agent_message(
+                         agent_id,
+                         "RECV",
+                         {"content": chunk_text},
+                         backend_name="gemini",
+                     )
+                     log_stream_chunk("backend.gemini", "content", chunk_text, agent_id)
+                     yield StreamChunk(type="content", content=chunk_text)

-                         # Execute custom tools
-                         for tool_call in new_custom_tools:
-                             tool_name = tool_call["name"]
-                             tool_args = tool_call["arguments"]
+                 # Buffer last chunk with candidates
+                 if hasattr(chunk, "candidates") and chunk.candidates:
+                     last_response_with_candidates = chunk

-                             try:
-                                 # Execute the custom tool
-                                 result_str = await self._execute_custom_tool(
-                                     {
-                                         "name": tool_name,
-                                         "arguments": json.dumps(tool_args) if isinstance(tool_args, dict) else tool_args,
-                                     },
-                                 )
+             # ====================================================================
+             # Structured Coordination Output Parsing
+             # ====================================================================
+             # Check for structured coordination output when no function calls captured
+             if is_coordination and not captured_function_calls and full_content_text:
+                 # Try to parse structured response from text content
+                 parsed = self.formatter.extract_structured_response(full_content_text)

-                                 # Format result as JSON if possible
-                                 formatted_result = format_tool_response_as_json(result_str)
+                 if parsed and isinstance(parsed, dict):
+                     # Convert structured response to tool calls
+                     tool_calls = self.formatter.convert_structured_to_tool_calls(parsed)

-                                 # Yield execution status
-                                 yield StreamChunk(
-                                     type="custom_tool_status",
-                                     status="custom_tool_executed",
-                                     content=f"✅ Custom Tool Executed: {tool_name} -> {formatted_result}",
-                                     source="custom_tools",
-                                 )
+                     if tool_calls:
+                         # Categorize the tool calls
+                         mcp_calls, custom_calls, provider_calls = self._categorize_tool_calls(tool_calls)
+
+                         # Handle provider (workflow) calls - these are coordination actions
+                         # We yield StreamChunk entries but do NOT execute them
+                         if provider_calls:
+                             # Convert provider calls to tool_calls format for orchestrator
+                             workflow_tool_calls = []
+                             for call in provider_calls:
+                                 tool_name = call.get("name", "")
+                                 tool_args_str = call.get("arguments", "{}")
+
+                                 # Parse arguments if they're a string
+                                 if isinstance(tool_args_str, str):
+                                     try:
+                                         tool_args = json.loads(tool_args_str)
+                                     except json.JSONDecodeError:
+                                         tool_args = {}
+                                 else:
+                                     tool_args = tool_args_str

-                                 # Build function response in Gemini format
-                                 tool_responses.append(
-                                     {
-                                         "name": tool_name,
-                                         "response": {"result": result_str},
-                                     },
+                                 # Log the coordination action
+                                 logger.info(f"[Gemini] Structured coordination action: {tool_name}")
+                                 log_tool_call(
+                                     agent_id,
+                                     tool_name,
+                                     tool_args,
+                                     None,
+                                     backend_name="gemini",
                                  )

-                             except Exception as e:
-                                 error_msg = f"Error executing custom tool {tool_name}: {str(e)}"
-                                 logger.error(error_msg)
-                                 yield StreamChunk(
-                                     type="custom_tool_status",
-                                     status="custom_tool_error",
-                                     content=f"❌ {error_msg}",
-                                     source="custom_tools",
-                                 )
-                                 # Add error response
-                                 tool_responses.append(
+                                 # Build tool call in standard format
+                                 workflow_tool_calls.append(
                                      {
-                                         "name": tool_name,
-                                         "response": {"error": str(e)},
+                                         "id": call.get("call_id", f"call_{len(workflow_tool_calls)}"),
+                                         "type": "function",
+                                         "function": {
+                                             "name": tool_name,
+                                             "arguments": tool_args,
+                                         },
                                      },
                                  )

-                         # Execute MCP tools manually (since automatic_function_calling is disabled)
-                         for tool_call in new_mcp_tools:
-                             tool_name = tool_call["name"]
-                             tool_args = tool_call["arguments"]
-
-                             try:
-                                 # Execute the MCP tool via MCP client
-                                 if not self._mcp_client:
-                                     raise RuntimeError("MCP client not initialized")
-
-                                 # Convert tool name to prefixed format if needed
-                                 # MCP client expects: mcp__server__toolname
-                                 # Gemini SDK returns: toolname (without prefix)
-                                 prefixed_tool_name = tool_name
-                                 if not tool_name.startswith("mcp__"):
-                                     # Find the matching prefixed tool name
-                                     for mcp_tool in available_mcp_tools:
-                                         if mcp_tool.startswith("mcp__") and mcp_tool.endswith(f"__{tool_name}"):
-                                             prefixed_tool_name = mcp_tool
-                                             logger.info(f"🔧 [DEBUG] Converting tool name for execution: {tool_name} -> {prefixed_tool_name}")
-                                             break
-
-                                 mcp_result = await self._mcp_client.call_tool(prefixed_tool_name, tool_args)
-
-                                 # Extract text from CallToolResult object
-                                 result_str = None
-                                 if mcp_result:
-                                     if hasattr(mcp_result, "content") and mcp_result.content:
-                                         first_content = mcp_result.content[0]
-                                         if hasattr(first_content, "text"):
-                                             result_str = first_content.text
-
-                                 if result_str is None:
-                                     result_str = str(mcp_result) if mcp_result else "None"
-
-                                 # Format result as JSON if possible
-                                 formatted_result = format_tool_response_as_json(result_str)
-                                 result_preview = formatted_result
-
-                                 # Yield execution status
+                             # Emit tool_calls chunk for orchestrator to process
+                             if workflow_tool_calls:
+                                 log_stream_chunk("backend.gemini", "tool_calls", workflow_tool_calls, agent_id)
                                  yield StreamChunk(
-                                     type="mcp_status",
-                                     status="mcp_tool_executed",
-                                     content=f"✅ MCP Tool Executed: {tool_name} -> {result_preview}{'...' if len(formatted_result) > 200 else ''}",
-                                     source="mcp_tools",
+                                     type="tool_calls",
+                                     tool_calls=workflow_tool_calls,
+                                     source="gemini",
                                  )

-                                 # Build function response in Gemini format
-                                 tool_responses.append(
-                                     {
-                                         "name": tool_name,
-                                         "response": {"result": mcp_result},
-                                     },
-                                 )
-
-                             except Exception as e:
-                                 error_msg = f"Error executing MCP tool {tool_name}: {str(e)}"
-                                 logger.error(error_msg)
+                             # Do not execute workflow tools - just return after yielding
+                             # The orchestrator will handle these coordination actions
+                             if provider_calls:
+                                 # Emit completion status if MCP was actually used
+                                 if mcp_used:
                                      yield StreamChunk(
                                          type="mcp_status",
-                                         status="mcp_tool_error",
-                                         content=f"❌ {error_msg}",
+                                         status="mcp_session_complete",
+                                         content="✅ [MCP] Session completed",
                                          source="mcp_tools",
                                      )
-                                 # Add error response
-                                 tool_responses.append(
-                                     {
-                                         "name": tool_name,
-                                         "response": {"error": str(e)},
-                                     },
-                                 )

-                         # Make continuation call with tool results from this round
-                         if tool_responses:
+                                 yield StreamChunk(type="done")
+                                 return
+
+             # ====================================================================
+             # Tool Execution Phase: Execute captured function calls using base class
+             # ====================================================================
+             if captured_function_calls:
+                 # Categorize function calls using base class helper
+                 mcp_calls, custom_calls, provider_calls = self._categorize_tool_calls(captured_function_calls)
+
+                 # ====================================================================
+                 # Handle provider (workflow) calls - emit as StreamChunks but do NOT execute
+                 # ====================================================================
+                 if provider_calls:
+                     # Convert provider calls to tool_calls format for orchestrator
+                     workflow_tool_calls = []
+                     for call in provider_calls:
+                         tool_name = call.get("name", "")
+                         tool_args_str = call.get("arguments", "{}")
+
+                         # Parse arguments if they're a string
+                         if isinstance(tool_args_str, str):
                              try:
-                                 from google.genai import types
-
-                                 # Build conversation history for continuation
-                                 # Track all function calls from this round
-                                 round_function_calls = new_custom_tools + new_mcp_tools
-
-                                 # Build conversation history
-                                 conversation_history = []
-
-                                 # Add original user content
-                                 conversation_history.append(
-                                     types.Content(
-                                         parts=[types.Part(text=full_content)],
-                                         role="user",
-                                     ),
-                                 )
-
-                                 # Add model's function call response (tools from THIS round)
-                                 model_parts = []
-                                 for tool_call in round_function_calls:
-                                     model_parts.append(
-                                         types.Part.from_function_call(
-                                             name=tool_call["name"],
-                                             args=tool_call["arguments"],
-                                         ),
-                                     )
-
-                                 conversation_history.append(
-                                     types.Content(
-                                         parts=model_parts,
-                                         role="model",
-                                     ),
-                                 )
-
-                                 # Add function response (as user message with function_response parts)
-                                 response_parts = []
-                                 for resp in tool_responses:
-                                     response_parts.append(
-                                         types.Part.from_function_response(
-                                             name=resp["name"],
-                                             response=resp["response"],
-                                         ),
-                                     )
-
-                                 conversation_history.append(
-                                     types.Content(
-                                         parts=response_parts,
-                                         role="user",
-                                     ),
-                                 )
-
-                                 # Make continuation call
-                                 yield StreamChunk(
-                                     type="custom_tool_status",
-                                     status="continuation_call",
-                                     content=f"🔄 Making continuation call with {len(tool_responses)} tool results...",
-                                     source="custom_tools",
-                                 )
-
-                                 # Use same session_config as before
-                                 continuation_stream = await client.aio.models.generate_content_stream(
-                                     model=model_name,
-                                     contents=conversation_history,
-                                     config=session_config,
-                                 )
+                                 tool_args = json.loads(tool_args_str)
+                             except json.JSONDecodeError:
+                                 tool_args = {}
+                         else:
+                             tool_args = tool_args_str

-                                 # Process continuation stream (same processing as main stream)
-                                 async for chunk in continuation_stream:
-                                     # ============================================
-                                     # Process function calls/responses in continuation
-                                     # ============================================
-                                     # Check for function calls in current chunk's candidates
-                                     if hasattr(chunk, "candidates") and chunk.candidates:
-                                         for candidate in chunk.candidates:
-                                             if hasattr(candidate, "content") and candidate.content:
-                                                 if hasattr(candidate.content, "parts") and candidate.content.parts:
-                                                     for part in candidate.content.parts:
-                                                         # Check for function_call part
-                                                         if hasattr(part, "function_call") and part.function_call:
-                                                             call_data = self.mcp_extractor.extract_function_call(part.function_call)
-
-                                                             if call_data:
-                                                                 tool_name = call_data["name"]
-                                                                 tool_args = call_data["arguments"]
-
-                                                                 # Determine if it's MCP tool or custom tool
-                                                                 # MCP tools may come from SDK without prefix
-                                                                 is_mcp_tool = False
-                                                                 if has_mcp:
-                                                                     if tool_name in available_mcp_tools:
-                                                                         is_mcp_tool = True
-                                                                     else:
-                                                                         # Try matching with MCP prefix format
-                                                                         for mcp_tool in available_mcp_tools:
-                                                                             if mcp_tool.startswith("mcp__") and mcp_tool.endswith(f"__{tool_name}"):
-                                                                                 is_mcp_tool = True
-                                                                                 break
-
-                                                                 is_custom_tool = has_custom_tools and tool_name in self._custom_tool_names
-
-                                                                 if is_custom_tool:
-                                                                     # Process custom tool call
-                                                                     if custom_tracker.is_new_call(tool_name, tool_args):
-                                                                         call_record = custom_tracker.add_call(tool_name, tool_args)
-
-                                                                         custom_tools_used.append(
-                                                                             {
-                                                                                 "name": tool_name,
-                                                                                 "arguments": tool_args,
-                                                                                 "timestamp": call_record["timestamp"],
-                                                                             },
-                                                                         )
-
-                                                                         timestamp_str = time.strftime(
-                                                                             "%H:%M:%S",
-                                                                             time.localtime(call_record["timestamp"]),
-                                                                         )
-
-                                                                         yield StreamChunk(
-                                                                             type="custom_tool_status",
-                                                                             status="custom_tool_called",
-                                                                             content=f"🔧 Custom Tool Called: {tool_name} at {timestamp_str} with args: {json.dumps(tool_args, indent=2)}",
-                                                                             source="custom_tools",
-                                                                         )
-
-                                                                         log_tool_call(
-                                                                             agent_id,
-                                                                             tool_name,
-                                                                             tool_args,
-                                                                             backend_name="gemini",
-                                                                         )
-                                                                 elif is_mcp_tool:
-                                                                     # Process MCP tool call
-                                                                     if mcp_tracker.is_new_call(tool_name, tool_args):
-                                                                         call_record = mcp_tracker.add_call(tool_name, tool_args)
-
-                                                                         mcp_tools_used.append(
-                                                                             {
-                                                                                 "name": tool_name,
-                                                                                 "arguments": tool_args,
-                                                                                 "timestamp": call_record["timestamp"],
-                                                                             },
-                                                                         )
-
-                                                                         timestamp_str = time.strftime(
-                                                                             "%H:%M:%S",
-                                                                             time.localtime(call_record["timestamp"]),
-                                                                         )
-
-                                                                         yield StreamChunk(
-                                                                             type="mcp_status",
-                                                                             status="mcp_tool_called",
-                                                                             content=f"🔧 MCP Tool Called: {tool_name} at {timestamp_str} with args: {json.dumps(tool_args, indent=2)}",
-                                                                             source="mcp_tools",
-                                                                         )
-
-                                                                         log_tool_call(
-                                                                             agent_id,
-                                                                             tool_name,
-                                                                             tool_args,
-                                                                             backend_name="gemini",
-                                                                         )
-
-                                     # Check automatic_function_calling_history (for auto-executed MCP tools)
-                                     if hasattr(chunk, "automatic_function_calling_history") and chunk.automatic_function_calling_history:
-                                         for history_item in chunk.automatic_function_calling_history:
-                                             if hasattr(history_item, "parts") and history_item.parts is not None:
1232
- for part in history_item.parts:
1233
- # Check for function_call part
1234
- if hasattr(part, "function_call") and part.function_call:
1235
- call_data = self.mcp_extractor.extract_function_call(part.function_call)
1236
-
1237
- if call_data:
1238
- tool_name = call_data["name"]
1239
- tool_args = call_data["arguments"]
1240
-
1241
- # Determine if it's MCP tool or custom tool
1242
- # MCP tools may come from SDK without prefix
1243
- is_mcp_tool = False
1244
- if has_mcp:
1245
- if tool_name in available_mcp_tools:
1246
- is_mcp_tool = True
1247
- else:
1248
- # Try matching with MCP prefix format
1249
- for mcp_tool in available_mcp_tools:
1250
- if mcp_tool.startswith("mcp__") and mcp_tool.endswith(f"__{tool_name}"):
1251
- is_mcp_tool = True
1252
- break
1253
-
1254
- is_custom_tool = has_custom_tools and tool_name in self._custom_tool_names
1255
-
1256
- if is_mcp_tool:
1257
- # Process MCP tool call
1258
- if mcp_tracker.is_new_call(tool_name, tool_args):
1259
- call_record = mcp_tracker.add_call(tool_name, tool_args)
1260
-
1261
- mcp_tools_used.append(
1262
- {
1263
- "name": tool_name,
1264
- "arguments": tool_args,
1265
- "timestamp": call_record["timestamp"],
1266
- },
1267
- )
1268
-
1269
- timestamp_str = time.strftime(
1270
- "%H:%M:%S",
1271
- time.localtime(call_record["timestamp"]),
1272
- )
1273
-
1274
- yield StreamChunk(
1275
- type="mcp_status",
1276
- status="mcp_tool_called",
1277
- content=f"🔧 MCP Tool Called: {tool_name} at {timestamp_str} with args: {json.dumps(tool_args, indent=2)}",
1278
- source="mcp_tools",
1279
- )
1280
-
1281
- log_tool_call(
1282
- agent_id,
1283
- tool_name,
1284
- tool_args,
1285
- backend_name="gemini",
1286
- )
1287
-
1288
- elif is_custom_tool:
1289
- # Process custom tool call
1290
- if custom_tracker.is_new_call(tool_name, tool_args):
1291
- call_record = custom_tracker.add_call(tool_name, tool_args)
1292
-
1293
- custom_tools_used.append(
1294
- {
1295
- "name": tool_name,
1296
- "arguments": tool_args,
1297
- "timestamp": call_record["timestamp"],
1298
- },
1299
- )
1300
-
1301
- timestamp_str = time.strftime(
1302
- "%H:%M:%S",
1303
- time.localtime(call_record["timestamp"]),
1304
- )
1305
-
1306
- yield StreamChunk(
1307
- type="custom_tool_status",
1308
- status="custom_tool_called",
1309
- content=f"🔧 Custom Tool Called: {tool_name} at {timestamp_str} with args: {json.dumps(tool_args, indent=2)}",
1310
- source="custom_tools",
1311
- )
1312
-
1313
- log_tool_call(
1314
- agent_id,
1315
- tool_name,
1316
- tool_args,
1317
- backend_name="gemini",
1318
- )
1319
-
1320
- # Check for function_response part
1321
- elif hasattr(part, "function_response") and part.function_response:
1322
- response_data = self.mcp_extractor.extract_function_response(part.function_response)
1323
-
1324
- if response_data:
1325
- tool_name = response_data["name"]
1326
- tool_response = response_data["response"]
1327
-
1328
- # Determine if it's MCP tool or custom tool
1329
- # MCP tools may come from SDK without prefix
1330
- is_mcp_tool = False
1331
- if has_mcp:
1332
- if tool_name in available_mcp_tools:
1333
- is_mcp_tool = True
1334
- else:
1335
- # Try matching with MCP prefix format
1336
- for mcp_tool in available_mcp_tools:
1337
- if mcp_tool.startswith("mcp__") and mcp_tool.endswith(f"__{tool_name}"):
1338
- is_mcp_tool = True
1339
- break
1340
-
1341
- is_custom_tool = has_custom_tools and tool_name in self._custom_tool_names
1342
-
1343
- if is_mcp_tool:
1344
- # Process MCP tool response
1345
- if mcp_response_tracker.is_new_response(tool_name, tool_response):
1346
- response_record = mcp_response_tracker.add_response(tool_name, tool_response)
1347
-
1348
- # Extract text content from CallToolResult
1349
- response_text = None
1350
- if isinstance(tool_response, dict) and "result" in tool_response:
1351
- result = tool_response["result"]
1352
- if hasattr(result, "content") and result.content:
1353
- first_content = result.content[0]
1354
- if hasattr(first_content, "text"):
1355
- response_text = first_content.text
1356
-
1357
- if response_text is None:
1358
- response_text = str(tool_response)
1359
-
1360
- timestamp_str = time.strftime(
1361
- "%H:%M:%S",
1362
- time.localtime(response_record["timestamp"]),
1363
- )
1364
-
1365
- # Format response as JSON if possible
1366
- formatted_response = format_tool_response_as_json(response_text)
1367
-
1368
- yield StreamChunk(
1369
- type="mcp_status",
1370
- status="mcp_tool_response",
1371
- content=f"✅ MCP Tool Response from {tool_name} at {timestamp_str}: {formatted_response}",
1372
- source="mcp_tools",
1373
- )
1374
-
1375
- log_backend_activity(
1376
- "gemini",
1377
- "MCP tool response received",
1378
- {
1379
- "tool_name": tool_name,
1380
- "response_preview": str(tool_response)[:],
1381
- },
1382
- agent_id=agent_id,
1383
- )
1384
-
1385
- elif is_custom_tool:
1386
- # Process custom tool response
1387
- if custom_response_tracker.is_new_response(tool_name, tool_response):
1388
- response_record = custom_response_tracker.add_response(tool_name, tool_response)
1389
-
1390
- # Extract text from response
1391
- response_text = str(tool_response)
1392
-
1393
- timestamp_str = time.strftime(
1394
- "%H:%M:%S",
1395
- time.localtime(response_record["timestamp"]),
1396
- )
1397
-
1398
- # Format response as JSON if possible
1399
- formatted_response = format_tool_response_as_json(response_text)
1400
-
1401
- yield StreamChunk(
1402
- type="custom_tool_status",
1403
- status="custom_tool_response",
1404
- content=f"✅ Custom Tool Response from {tool_name} at {timestamp_str}: {formatted_response}",
1405
- source="custom_tools",
1406
- )
1407
-
1408
- log_backend_activity(
1409
- "gemini",
1410
- "Custom tool response received",
1411
- {
1412
- "tool_name": tool_name,
1413
- "response_preview": str(tool_response),
1414
- },
1415
- agent_id=agent_id,
1416
- )
1417
-
1418
- # ============================================
1419
- # Process text content
1420
- # ============================================
1421
- if hasattr(chunk, "text") and chunk.text:
1422
- chunk_text = chunk.text
1423
- full_content_text += chunk_text
1424
- log_stream_chunk("backend.gemini", "continuation_content", chunk_text, agent_id)
1425
- yield StreamChunk(type="content", content=chunk_text)
1426
-
1427
- # ============================================
1428
- # Buffer last chunk
1429
- # ============================================
1430
- if hasattr(chunk, "candidates") and chunk.candidates:
1431
- last_response_with_candidates = chunk
1432
-
1433
- except Exception as e:
1434
- error_msg = f"Error in continuation call: {str(e)}"
1435
- logger.error(error_msg)
1436
- yield StreamChunk(
1437
- type="custom_tool_status",
1438
- status="continuation_error",
1439
- content=f"❌ {error_msg}",
1440
- source="custom_tools",
1441
- )
575
+ # Log the coordination action
576
+ logger.info(f"[Gemini] Function call coordination action: {tool_name}")
577
+ log_tool_call(
578
+ agent_id,
579
+ tool_name,
580
+ tool_args,
581
+ None,
582
+ backend_name="gemini",
583
+ )
1442
584
 
1443
- # ====================================================================
1444
- # Completion phase: Output summary
1445
- # ====================================================================
585
+ # Build tool call in standard format
586
+ workflow_tool_calls.append(
587
+ {
588
+ "id": call.get("call_id", f"call_{len(workflow_tool_calls)}"),
589
+ "type": "function",
590
+ "function": {
591
+ "name": tool_name,
592
+ "arguments": tool_args,
593
+ },
594
+ },
595
+ )
1446
596
 
1447
- # Add MCP usage indicator with detailed summary
1448
- if has_mcp:
1449
- mcp_summary = mcp_tracker.get_summary()
1450
- if not mcp_summary or mcp_summary == "No MCP tools called":
1451
- mcp_summary = "MCP session completed (no tools explicitly called)"
1452
- else:
1453
- mcp_summary = f"MCP session complete - {mcp_summary}"
597
+ # Emit tool_calls chunk for orchestrator to process
598
+ if workflow_tool_calls:
599
+ log_stream_chunk("backend.gemini", "tool_calls", workflow_tool_calls, agent_id)
600
+ yield StreamChunk(
601
+ type="tool_calls",
602
+ tool_calls=workflow_tool_calls,
603
+ source="gemini",
604
+ )
1454
605
 
1455
- log_stream_chunk("backend.gemini", "mcp_indicator", mcp_summary, agent_id)
606
+ if mcp_used:
1456
607
  yield StreamChunk(
1457
608
  type="mcp_status",
1458
609
  status="mcp_session_complete",
1459
- content=mcp_summary,
610
+ content="✅ [MCP] Session completed",
1460
611
  source="mcp_tools",
1461
612
  )
1462
613
 
1463
- # Add custom tool usage indicator with detailed summary
1464
- if has_custom_tools:
1465
- custom_summary = custom_tracker.get_summary()
1466
- if not custom_summary or custom_summary == "No MCP tools called":
1467
- custom_summary = "Custom tools session completed (no tools explicitly called)"
1468
- else:
1469
- # Replace "MCP tool" with "Custom tool"
1470
- custom_summary = custom_summary.replace("MCP tool", "Custom tool")
1471
- custom_summary = f"Custom tools session complete - {custom_summary}"
614
+ yield StreamChunk(type="done")
615
+ return
616
+
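The provider-call branch above never executes these calls itself; it only repackages each captured Gemini function call into the OpenAI-style tool_calls payload the orchestrator consumes. A minimal sketch of that conversion, assuming the call dicts carry the name/arguments/call_id keys used in this diff (the "vote" action is a hypothetical example):

    import json
    from typing import Any, Dict, List

    def to_workflow_tool_calls(provider_calls: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
        """Repackage captured provider calls for the orchestrator."""
        workflow_tool_calls: List[Dict[str, Any]] = []
        for call in provider_calls:
            raw_args = call.get("arguments", "{}")
            if isinstance(raw_args, str):
                try:
                    args = json.loads(raw_args)  # arguments may arrive JSON-encoded
                except json.JSONDecodeError:
                    args = {}
            else:
                args = raw_args
            workflow_tool_calls.append(
                {
                    "id": call.get("call_id", f"call_{len(workflow_tool_calls)}"),
                    "type": "function",
                    "function": {"name": call.get("name", ""), "arguments": args},
                },
            )
        return workflow_tool_calls

    # Hypothetical coordination action captured from the model:
    print(to_workflow_tool_calls([{"name": "vote", "arguments": '{"agent_id": "agent_1"}'}]))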
+ # Initialize for execution
+ updated_messages = messages.copy()
+ processed_call_ids = set()
+
+ # Configuration for custom tool execution
+ CUSTOM_TOOL_CONFIG = ToolExecutionConfig(
+ tool_type="custom",
+ chunk_type="custom_tool_status",
+ emoji_prefix="🔧 [Custom Tool]",
+ success_emoji="✅ [Custom Tool]",
+ error_emoji="❌ [Custom Tool Error]",
+ source_prefix="custom_",
+ status_called="custom_tool_called",
+ status_response="custom_tool_response",
+ status_error="custom_tool_error",
+ execution_callback=self._execute_custom_tool,
+ )

- log_stream_chunk("backend.gemini", "custom_tools_indicator", custom_summary, agent_id)
- yield StreamChunk(
- type="custom_tool_status",
- status="custom_tools_session_complete",
- content=custom_summary,
- source="custom_tools",
- )
+ # Configuration for MCP tool execution
+ MCP_TOOL_CONFIG = ToolExecutionConfig(
+ tool_type="mcp",
+ chunk_type="mcp_status",
+ emoji_prefix="🔧 [MCP Tool]",
+ success_emoji="✅ [MCP Tool]",
+ error_emoji="❌ [MCP Tool Error]",
+ source_prefix="mcp_",
+ status_called="mcp_tool_called",
+ status_response="mcp_tool_response",
+ status_error="mcp_tool_error",
+ execution_callback=self._execute_mcp_function_with_retry,
+ )
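Both configs above feed the same base-class executor; only the labels, status strings, and the execution callback differ. A rough sketch of the idea (the real ToolExecutionConfig is defined in the shared backend base class, so the field names here simply mirror the two literals in this diff and the callback shape is simplified):

    from dataclasses import dataclass
    from typing import Any, Awaitable, Callable, Dict

    @dataclass
    class ToolExecutionConfigSketch:
        tool_type: str                                   # "custom" or "mcp"
        chunk_type: str                                  # StreamChunk type to emit
        status_called: str
        status_response: str
        status_error: str
        execution_callback: Callable[[Dict[str, Any]], Awaitable[Any]]

    async def run_tool(call: Dict[str, Any], cfg: ToolExecutionConfigSketch) -> str:
        # One generic loop serves both tool families; only the config differs.
        try:
            result = await cfg.execution_callback(call)
            return f"[{cfg.tool_type}] {call.get('name')}: {result}"
        except Exception as exc:
            return f"[{cfg.tool_type} error] {call.get('name')}: {exc}"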

- except (
- MCPConnectionError,
- MCPTimeoutError,
- MCPServerError,
- MCPError,
- Exception,
- ) as e:
- log_stream_chunk("backend.gemini", "tools_error", str(e), agent_id)
-
- # ====================================================================
- # Error handling: Distinguish MCP and custom tools errors
- # ====================================================================
-
- # Determine error type
- is_mcp_error = isinstance(e, (MCPConnectionError, MCPTimeoutError, MCPServerError, MCPError))
- is_custom_tool_error = not is_mcp_error and using_custom_tools
-
- # Emit user-friendly error message
- if is_mcp_error:
- async for chunk in self.mcp_manager.handle_mcp_error_and_fallback(e):
+ # Capture tool execution results for continuation loop
+ tool_results: Dict[str, str] = {}
+ self._active_tool_result_store = tool_results
+
+ try:
+ # Execute custom tools
+ for call in custom_calls:
+ async for chunk in self._execute_tool_with_logging(
+ call,
+ CUSTOM_TOOL_CONFIG,
+ updated_messages,
+ processed_call_ids,
+ ):
  yield chunk
- elif is_custom_tool_error:
- yield StreamChunk(
- type="custom_tool_status",
- status="custom_tools_error",
- content=f"⚠️ [Custom Tools] Error: {str(e)}; falling back to non-custom-tool mode",
- source="custom_tools",
- )
- else:
+
+ # Check circuit breaker before MCP tool execution
+ if mcp_calls and not await self._check_circuit_breaker_before_execution():
+ logger.warning("[Gemini] All MCP servers blocked by circuit breaker")
  yield StreamChunk(
  type="mcp_status",
- status="tools_error",
- content=f"⚠️ [Tools] Error: {str(e)}; falling back",
- source="tools",
+ status="mcp_blocked",
+ content="⚠️ [MCP] All servers blocked by circuit breaker",
+ source="circuit_breaker",
  )
+ # Clear mcp_calls to skip execution
+ mcp_calls = []
+
+ # Execute MCP tools
+ for call in mcp_calls:
+ # Mark MCP as used when at least one MCP call is about to be executed
+ mcp_used = True
+
+ async for chunk in self._execute_tool_with_logging(
+ call,
+ MCP_TOOL_CONFIG,
+ updated_messages,
+ processed_call_ids,
+ ):
+ yield chunk
+ finally:
+ self._active_tool_result_store = None

- # Fallback configuration
- manual_config = dict(config)
+ executed_calls = custom_calls + mcp_calls

- # Decide fallback configuration based on error type
- if is_mcp_error and using_custom_tools:
- # MCP error but custom tools available: exclude MCP, keep custom tools
- try:
- custom_tools_schemas = self._get_custom_tools_schemas()
- if custom_tools_schemas:
- # Convert to Gemini format using formatter
- custom_tools_functions = self.formatter.format_custom_tools(
- custom_tools_schemas,
- return_sdk_objects=True,
- )
- # Wrap FunctionDeclarations in a Tool object for Gemini SDK
- from google.genai import types
+ # Build initial conversation history using SDK Content objects
+ conversation_history: List[types.Content] = [
+ types.Content(parts=[types.Part(text=full_content)], role="user"),
+ ]

- custom_tool = types.Tool(function_declarations=custom_tools_functions)
- manual_config["tools"] = [custom_tool]
- logger.info("[Gemini] Fallback: using custom tools only (MCP failed)")
- else:
- # Custom tools also unavailable, use builtin tools
- if all_tools:
- manual_config["tools"] = all_tools
- logger.info("[Gemini] Fallback: using builtin tools only (both MCP and custom tools failed)")
- except Exception:
- if all_tools:
- manual_config["tools"] = all_tools
- logger.info("[Gemini] Fallback: using builtin tools only (custom tools also failed)")
-
- elif is_custom_tool_error and using_sdk_mcp:
- # Custom tools error but MCP available: exclude custom tools, keep MCP
- try:
- if self._mcp_client:
- mcp_sessions = self.mcp_manager.get_active_mcp_sessions(
- convert_to_permission_sessions=bool(self.filesystem_manager),
- )
- if mcp_sessions:
- manual_config["tools"] = mcp_sessions
- logger.info("[Gemini] Fallback: using MCP only (custom tools failed)")
- else:
- if all_tools:
- manual_config["tools"] = all_tools
- logger.info("[Gemini] Fallback: using builtin tools only (both custom tools and MCP failed)")
- except Exception:
- if all_tools:
- manual_config["tools"] = all_tools
- logger.info("[Gemini] Fallback: using builtin tools only (MCP also failed)")
+ if executed_calls:
+ model_parts = []
+ for call in executed_calls:
+ args_payload: Any = call.get("arguments", {})
+ if isinstance(args_payload, str):
+ try:
+ args_payload = json.loads(args_payload)
+ except json.JSONDecodeError:
+ args_payload = {}
+ if not isinstance(args_payload, dict):
+ args_payload = {}
+ model_parts.append(
+ types.Part.from_function_call(
+ name=call.get("name", ""),
+ args=args_payload,
+ ),
+ )
+ if model_parts:
+ conversation_history.append(types.Content(parts=model_parts, role="model"))
+
+ response_parts = []
+ for call in executed_calls:
+ call_id = call.get("call_id")
+ result_text = tool_results.get(call_id or "", "No result")
+ response_parts.append(
+ types.Part.from_function_response(
+ name=call.get("name", ""),
+ response={"result": result_text},
+ ),
+ )
+ if response_parts:
+ conversation_history.append(types.Content(parts=response_parts, role="user"))
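This history layout is the Gemini function-calling contract: the user turn, then a model turn that replays the function calls, then a user turn carrying the matching function responses. A minimal, self-contained illustration with the google-genai SDK types used above (tool name and values are hypothetical; assumes the google-genai package is installed):

    from google.genai import types

    history = [
        types.Content(role="user", parts=[types.Part(text="What is 2 + 2?")]),
        # Model turn: replay the function call the model made.
        types.Content(
            role="model",
            parts=[types.Part.from_function_call(name="add", args={"a": 2, "b": 2})],
        ),
        # User turn: return the tool output as a function response.
        types.Content(
            role="user",
            parts=[types.Part.from_function_response(name="add", response={"result": "4"})],
        ),
    ]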

- else:
- # Both failed or cannot determine: use builtin tools
- if all_tools:
- manual_config["tools"] = all_tools
- logger.info("[Gemini] Fallback: using builtin tools only (all advanced tools failed)")
+ last_continuation_chunk = None

- # Create new stream for fallback
- stream = await client.aio.models.generate_content_stream(
+ while True:
+ continuation_stream = await client.aio.models.generate_content_stream(
  model=model_name,
- contents=full_content,
- config=manual_config,
+ contents=conversation_history,
+ config=config,
  )
+ stream = continuation_stream

- async for chunk in stream:
- # Process text content
- if hasattr(chunk, "text") and chunk.text:
- chunk_text = chunk.text
- full_content_text += chunk_text
- log_stream_chunk(
- "backend.gemini",
- "fallback_content",
- chunk_text,
- agent_id,
- )
- yield StreamChunk(type="content", content=chunk_text)
- # Buffer last chunk with candidates for fallback path
+ new_function_calls = []
+ continuation_text = ""
+
+ async for chunk in continuation_stream:
  if hasattr(chunk, "candidates") and chunk.candidates:
- last_response_with_candidates = chunk
- else:
- # Non-MCP streaming path: execute when MCP is disabled
- try:
- # Use the standard config (with builtin tools if configured)
- stream = await client.aio.models.generate_content_stream(
- model=model_name,
- contents=full_content,
- config=config,
- )
+ last_continuation_chunk = chunk
+ for candidate in chunk.candidates:
+ if hasattr(candidate, "content") and candidate.content:
+ if hasattr(candidate.content, "parts") and candidate.content.parts:
+ for part in candidate.content.parts:
+ if hasattr(part, "function_call") and part.function_call:
+ tool_name = part.function_call.name
+ tool_args = dict(part.function_call.args) if part.function_call.args else {}
+ call_id = f"call_{len(new_function_calls)}"
+ new_function_calls.append(
+ {
+ "call_id": call_id,
+ "name": tool_name,
+ "arguments": json.dumps(tool_args),
+ },
+ )

- # Process streaming chunks
- async for chunk in stream:
- # Process text content
  if hasattr(chunk, "text") and chunk.text:
  chunk_text = chunk.text
- full_content_text += chunk_text
+ continuation_text += chunk_text
  log_backend_agent_message(
  agent_id,
  "RECV",
@@ -1615,86 +771,316 @@ class GeminiBackend(CustomToolAndMCPBackend):
  )
  log_stream_chunk("backend.gemini", "content", chunk_text, agent_id)
  yield StreamChunk(type="content", content=chunk_text)
- # Buffer last chunk with candidates for non-MCP path
- if hasattr(chunk, "candidates") and chunk.candidates:
- last_response_with_candidates = chunk

- except Exception as e:
- error_msg = f"Non-MCP streaming error: {e}"
- log_stream_chunk(
- "backend.gemini",
- "non_mcp_stream_error",
- {"error_type": type(e).__name__, "error_message": str(e)},
- agent_id,
- )
- yield StreamChunk(type="error", error=error_msg)
+ if continuation_text:
+ conversation_history.append(
+ types.Content(parts=[types.Part(text=continuation_text)], role="model"),
+ )
+ full_content_text += continuation_text
+
+ if last_continuation_chunk:
+ last_response_with_candidates = last_continuation_chunk
+
+ if not new_function_calls:
+ # ====================================================================
+ # Continuation Structured Coordination Output Parsing
+ # ====================================================================
+ # Check for structured coordination output when no function calls in continuation
+ if is_coordination and full_content_text:
+ # Try to parse structured response from accumulated text content
+ parsed = self.formatter.extract_structured_response(full_content_text)
+
+ if parsed and isinstance(parsed, dict):
+ # Convert structured response to tool calls
+ tool_calls = self.formatter.convert_structured_to_tool_calls(parsed)
+
+ if tool_calls:
+ # Categorize the tool calls
+ mcp_calls, custom_calls, provider_calls = self._categorize_tool_calls(tool_calls)
+
+ if provider_calls:
+ # Convert provider calls to tool_calls format for orchestrator
+ workflow_tool_calls = []
+ for call in provider_calls:
+ tool_name = call.get("name", "")
+ tool_args_str = call.get("arguments", "{}")
+
+ # Parse arguments if they're a string
+ if isinstance(tool_args_str, str):
+ try:
+ tool_args = json.loads(tool_args_str)
+ except json.JSONDecodeError:
+ tool_args = {}
+ else:
+ tool_args = tool_args_str
+
+ # Log the coordination action
+ logger.info(f"[Gemini] Continuation structured coordination action: {tool_name}")
+ log_tool_call(
+ agent_id,
+ tool_name,
+ tool_args,
+ None,
+ backend_name="gemini",
+ )
+
+ # Build tool call in standard format
+ workflow_tool_calls.append(
+ {
+ "id": call.get("call_id", f"call_{len(workflow_tool_calls)}"),
+ "type": "function",
+ "function": {
+ "name": tool_name,
+ "arguments": tool_args,
+ },
+ },
+ )
+
+ # Emit tool_calls chunk for orchestrator to process
+ if workflow_tool_calls:
+ log_stream_chunk("backend.gemini", "tool_calls", workflow_tool_calls, agent_id)
+ yield StreamChunk(
+ type="tool_calls",
+ tool_calls=workflow_tool_calls,
+ source="gemini",
+ )
+
+ if mcp_used:
+ yield StreamChunk(
+ type="mcp_status",
+ status="mcp_session_complete",
+ content="✅ [MCP] Session completed",
+ source="mcp_tools",
+ )
+
+ yield StreamChunk(type="done")
+ return
+
+ # No structured output found, break continuation loop
+ break
+
+ next_mcp_calls, next_custom_calls, provider_calls = self._categorize_tool_calls(new_function_calls)
+
+ # Handle provider calls emitted during continuation
+ if provider_calls:
+ workflow_tool_calls = []
+ for call in provider_calls:
+ tool_name = call.get("name", "")
+ tool_args_str = call.get("arguments", "{}")
+
+ if isinstance(tool_args_str, str):
+ try:
+ tool_args = json.loads(tool_args_str)
+ except json.JSONDecodeError:
+ tool_args = {}
+ else:
+ tool_args = tool_args_str
+
+ logger.info(f"[Gemini] Continuation coordination action: {tool_name}")
+ log_tool_call(
+ agent_id,
+ tool_name,
+ tool_args,
+ None,
+ backend_name="gemini",
+ )
+
+ workflow_tool_calls.append(
+ {
+ "id": call.get("call_id", f"call_{len(workflow_tool_calls)}"),
+ "type": "function",
+ "function": {
+ "name": tool_name,
+ "arguments": tool_args,
+ },
+ },
+ )
+
+ if workflow_tool_calls:
+ log_stream_chunk("backend.gemini", "tool_calls", workflow_tool_calls, agent_id)
+ yield StreamChunk(
+ type="tool_calls",
+ tool_calls=workflow_tool_calls,
+ source="gemini",
+ )
+
+ if mcp_used:
+ yield StreamChunk(
+ type="mcp_status",
+ status="mcp_session_complete",
+ content="✅ [MCP] Session completed",
+ source="mcp_tools",
+ )
+
+ yield StreamChunk(type="done")
+ return
+
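When a continuation round produces no function calls, the code above falls back to mining the accumulated text for a structured JSON coordination action. A stand-in sketch of that extraction step (the real logic lives in formatter.extract_structured_response; the payload and regex here are illustrative only):

    import json
    import re

    def extract_structured_response(text: str):
        """Pull the first JSON object out of possibly markdown-wrapped text."""
        match = re.search(r"\{.*\}", text, re.DOTALL)
        if not match:
            return None
        try:
            return json.loads(match.group(0))
        except json.JSONDecodeError:
            return None

    # Hypothetical coordination payload embedded in prose:
    text = 'Decision:\n```json\n{"action_type": "vote", "agent_id": "agent_2"}\n```'
    print(extract_structured_response(text))  # {'action_type': 'vote', 'agent_id': 'agent_2'}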
+ new_tool_results: Dict[str, str] = {}
+ self._active_tool_result_store = new_tool_results
+
+ try:
+ for call in next_custom_calls:
+ async for chunk in self._execute_tool_with_logging(
+ call,
+ CUSTOM_TOOL_CONFIG,
+ updated_messages,
+ processed_call_ids,
+ ):
+ yield chunk
+
+ if next_mcp_calls and not await self._check_circuit_breaker_before_execution():
+ logger.warning("[Gemini] All MCP servers blocked by circuit breaker during continuation")
+ yield StreamChunk(
+ type="mcp_status",
+ status="mcp_blocked",
+ content="⚠️ [MCP] All servers blocked by circuit breaker",
+ source="circuit_breaker",
+ )
+ next_mcp_calls = []
+
+ for call in next_mcp_calls:
+ mcp_used = True
+
+ async for chunk in self._execute_tool_with_logging(
+ call,
+ MCP_TOOL_CONFIG,
+ updated_messages,
+ processed_call_ids,
+ ):
+ yield chunk
+ finally:
+ self._active_tool_result_store = None
+
+ if new_tool_results:
+ tool_results.update(new_tool_results)
+
+ executed_calls = next_custom_calls + next_mcp_calls
+
+ if executed_calls:
+ model_parts = []
+ for call in executed_calls:
+ args_payload: Any = call.get("arguments", {})
+ if isinstance(args_payload, str):
+ try:
+ args_payload = json.loads(args_payload)
+ except json.JSONDecodeError:
+ args_payload = {}
+ if not isinstance(args_payload, dict):
+ args_payload = {}
+ model_parts.append(
+ types.Part.from_function_call(
+ name=call.get("name", ""),
+ args=args_payload,
+ ),
+ )
+ if model_parts:
+ conversation_history.append(types.Content(parts=model_parts, role="model"))
+
+ response_parts = []
+ for call in executed_calls:
+ call_id = call.get("call_id")
+ result_text = new_tool_results.get(call_id or "", "No result")
+ response_parts.append(
+ types.Part.from_function_response(
+ name=call.get("name", ""),
+ response={"result": result_text},
+ ),
+ )
+ if response_parts:
+ conversation_history.append(types.Content(parts=response_parts, role="user"))

- content = full_content_text
+ # ====================================================================
+ # Completion Phase: Process structured tool calls and builtin indicators
+ # ====================================================================
+ final_response = last_response_with_candidates

- # Process tool calls - coordination and post-evaluation tool calls (MCP manual mode removed)
  tool_calls_detected: List[Dict[str, Any]] = []

- # Process coordination tools OR post-evaluation tools if present
- if (is_coordination or is_post_evaluation) and content.strip() and not tool_calls_detected:
- # For structured output mode, the entire content is JSON
+ if (is_coordination or is_post_evaluation) and full_content_text.strip():
+ content = full_content_text
  structured_response = None
- # Try multiple parsing strategies
+
  try:
- # Strategy 1: Parse entire content as JSON (works for both modes)
  structured_response = json.loads(content.strip())
  except json.JSONDecodeError:
- # Strategy 2: Extract JSON from mixed text content (handles markdown-wrapped JSON)
  structured_response = self.formatter.extract_structured_response(content)

- if structured_response and isinstance(structured_response, dict) and "action_type" in structured_response:
- # Convert to tool calls
- tool_calls = self.formatter.convert_structured_to_tool_calls(structured_response)
- if tool_calls:
- tool_calls_detected = tool_calls
- # Log conversion to tool calls (summary)
- log_stream_chunk("backend.gemini", "tool_calls", tool_calls, agent_id)
+ if structured_response and isinstance(structured_response, dict) and structured_response.get("action_type"):
+ raw_tool_calls = self.formatter.convert_structured_to_tool_calls(structured_response)

- # Log each tool call for analytics/debugging
+ if raw_tool_calls:
  tool_type = "post_evaluation" if is_post_evaluation else "coordination"
- try:
- for tool_call in tool_calls:
+ workflow_tool_calls: List[Dict[str, Any]] = []
+
+ for call in raw_tool_calls:
+ tool_name = call.get("name", "")
+ tool_args_str = call.get("arguments", "{}")
+
+ if isinstance(tool_args_str, str):
+ try:
+ tool_args = json.loads(tool_args_str)
+ except json.JSONDecodeError:
+ tool_args = {}
+ else:
+ tool_args = tool_args_str
+
+ try:
  log_tool_call(
  agent_id,
- tool_call.get("function", {}).get("name", f"unknown_{tool_type}_tool"),
- tool_call.get("function", {}).get("arguments", {}),
+ tool_name or f"unknown_{tool_type}_tool",
+ tool_args,
  result=f"{tool_type}_tool_called",
  backend_name="gemini",
  )
- except Exception:
- # Ensure logging does not interrupt flow
- pass
+ except Exception:
+ pass
+
+ workflow_tool_calls.append(
+ {
+ "id": call.get("call_id", f"call_{len(workflow_tool_calls)}"),
+ "type": "function",
+ "function": {
+ "name": tool_name,
+ "arguments": tool_args,
+ },
+ },
+ )

- # Assign buffered final response (if available) so builtin tool indicators can be emitted
- if last_response_with_candidates is not None:
- final_response = last_response_with_candidates
+ if workflow_tool_calls:
+ tool_calls_detected = workflow_tool_calls
+ log_stream_chunk("backend.gemini", "tool_calls", workflow_tool_calls, agent_id)
+
+ if tool_calls_detected:
+ yield StreamChunk(type="tool_calls", tool_calls=tool_calls_detected, source="gemini")
+
+ if mcp_used:
+ yield StreamChunk(
+ type="mcp_status",
+ status="mcp_session_complete",
+ content="✅ [MCP] Session completed",
+ source="mcp_tools",
+ )
+
+ yield StreamChunk(type="done")
+ return

- # Process builtin tool results if any tools were used
  if builtin_tools and final_response and hasattr(final_response, "candidates") and final_response.candidates:
- # Check for grounding or code execution results
  candidate = final_response.candidates[0]

- # Check for web search results - only show if actually used
  if hasattr(candidate, "grounding_metadata") and candidate.grounding_metadata:
- # Check if web search was actually used by looking for queries or chunks
  search_actually_used = False
- search_queries = []
+ search_queries: List[str] = []

- # Look for web search queries
  if hasattr(candidate.grounding_metadata, "web_search_queries") and candidate.grounding_metadata.web_search_queries:
  try:
  for query in candidate.grounding_metadata.web_search_queries:
- if query and query.strip():
- search_queries.append(query.strip())
+ if query and isinstance(query, str) and query.strip():
+ trimmed_query = query.strip()
+ search_queries.append(trimmed_query)
  search_actually_used = True
  except (TypeError, AttributeError):
  pass

- # Look for grounding chunks (indicates actual search results)
  if hasattr(candidate.grounding_metadata, "grounding_chunks") and candidate.grounding_metadata.grounding_chunks:
  try:
  if len(candidate.grounding_metadata.grounding_chunks) > 0:
@@ -1702,9 +1088,7 @@ class GeminiBackend(CustomToolAndMCPBackend):
  except (TypeError, AttributeError):
  pass

- # Only show indicators if search was actually used
  if search_actually_used:
- # Enhanced web search logging
  log_stream_chunk(
  "backend.gemini",
  "web_search_result",
@@ -1716,17 +1100,17 @@ class GeminiBackend(CustomToolAndMCPBackend):
  "google_search_retrieval",
  {
  "queries": search_queries,
- "chunks_found": len(candidate.grounding_metadata.grounding_chunks) if hasattr(candidate.grounding_metadata, "grounding_chunks") else 0,
+ "chunks_found": len(getattr(candidate.grounding_metadata, "grounding_chunks", []) or []),
  },
  result="search_completed",
  backend_name="gemini",
  )
+
  yield StreamChunk(
  type="content",
  content="🔍 [Builtin Tool: Web Search] Results integrated\n",
  )

- # Show search queries
  for query in search_queries:
  log_stream_chunk(
  "backend.gemini",
@@ -1738,240 +1122,308 @@ class GeminiBackend(CustomToolAndMCPBackend):

  self.search_count += 1
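The guard above deliberately requires evidence of real search activity (non-empty queries or grounding chunks) before emitting an indicator, since grounding_metadata can be present but empty. The same check, condensed into a sketch that duck-types the SDK's candidate objects:

    def web_search_was_used(candidate) -> bool:
        """True only when grounding metadata shows actual search activity."""
        meta = getattr(candidate, "grounding_metadata", None)
        if meta is None:
            return False
        queries = getattr(meta, "web_search_queries", None) or []
        chunks = getattr(meta, "grounding_chunks", None) or []
        has_queries = any(isinstance(q, str) and q.strip() for q in queries)
        return has_queries or len(chunks) > 0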

- # Check for code execution in the response parts
+ enable_code_execution = bool(
+ all_params.get("enable_code_execution") or all_params.get("code_execution"),
+ )
+
  if enable_code_execution and hasattr(candidate, "content") and hasattr(candidate.content, "parts"):
- # Look for executable_code and code_execution_result parts
- code_parts = []
+ code_parts: List[str] = []
+
  for part in candidate.content.parts:
  if hasattr(part, "executable_code") and part.executable_code:
  code_content = getattr(part.executable_code, "code", str(part.executable_code))
  code_parts.append(f"Code: {code_content}")
  elif hasattr(part, "code_execution_result") and part.code_execution_result:
- result_content = getattr(
- part.code_execution_result,
- "output",
- str(part.code_execution_result),
- )
+ result_content = getattr(part.code_execution_result, "output", str(part.code_execution_result))
  code_parts.append(f"Result: {result_content}")

  if code_parts:
- # Code execution was actually used
  log_stream_chunk(
  "backend.gemini",
  "code_execution",
  "Code executed",
  agent_id,
  )
-
- # Log code execution as a tool call event
- try:
- log_tool_call(
- agent_id,
- "code_execution",
- {"code_parts_count": len(code_parts)},
- result="code_executed",
- backend_name="gemini",
- )
- except Exception:
- pass
+ log_tool_call(
+ agent_id,
+ "code_execution",
+ {"details": code_parts},
+ result="code_execution_completed",
+ backend_name="gemini",
+ )

  yield StreamChunk(
  type="content",
- content="💻 [Builtin Tool: Code Execution] Code executed\n",
+ content="🧮 [Builtin Tool: Code Execution] Results integrated\n",
  )
- # Also show the actual code and result
- for part in code_parts:
- if part.startswith("Code: "):
- code_content = part[6:] # Remove "Code: " prefix
- log_stream_chunk(
- "backend.gemini",
- "code_execution_result",
- {
- "code_parts": len(code_parts),
- "execution_successful": True,
- "snippet": code_content,
- },
- agent_id,
- )
- yield StreamChunk(
- type="content",
- content=f"💻 [Code Executed]\n```python\n{code_content}\n```\n",
- )
- elif part.startswith("Result: "):
- result_content = part[8:] # Remove "Result: " prefix
- log_stream_chunk(
- "backend.gemini",
- "code_execution_result",
- {
- "code_parts": len(code_parts),
- "execution_successful": True,
- "result": result_content,
- },
- agent_id,
- )
- yield StreamChunk(
- type="content",
- content=f"📊 [Result] {result_content}\n",
- )
+
+ for entry in code_parts:
+ yield StreamChunk(type="content", content=f"🧮 {entry}\n")

  self.code_execution_count += 1

- # Yield coordination tool calls if detected
- if tool_calls_detected:
- # Enhanced tool calls summary logging
- log_stream_chunk(
- "backend.gemini",
- "tool_calls_yielded",
- {
- "tool_count": len(tool_calls_detected),
- "tool_names": [tc.get("function", {}).get("name") for tc in tool_calls_detected],
- },
- agent_id,
+ elif final_response and hasattr(final_response, "candidates"):
+ for candidate in final_response.candidates:
+ if hasattr(candidate, "grounding_metadata"):
+ self.search_count += 1
+ logger.debug(f"[Gemini] Grounding (web search) used, count: {self.search_count}")
+
+ if hasattr(candidate, "content") and candidate.content:
+ if hasattr(candidate.content, "parts"):
+ for part in candidate.content.parts:
+ if hasattr(part, "executable_code") or hasattr(part, "code_execution_result"):
+ self.code_execution_count += 1
+ logger.debug(f"[Gemini] Code execution used, count: {self.code_execution_count}")
+ break
+
+ # Emit completion status
+ if mcp_used:
+ yield StreamChunk(
+ type="mcp_status",
+ status="mcp_session_complete",
+ content="✅ [MCP] Session completed",
+ source="mcp_tools",
  )
- yield StreamChunk(type="tool_calls", tool_calls=tool_calls_detected)

- # Build complete message
- complete_message = {"role": "assistant", "content": content.strip()}
- if tool_calls_detected:
- complete_message["tool_calls"] = tool_calls_detected
-
- # Enhanced complete message logging with metadata
- log_stream_chunk(
- "backend.gemini",
- "complete_message",
- {
- "content_length": len(content.strip()),
- "has_tool_calls": bool(tool_calls_detected),
- },
- agent_id,
- )
- yield StreamChunk(type="complete_message", complete_message=complete_message)
- log_stream_chunk("backend.gemini", "done", None, agent_id)
  yield StreamChunk(type="done")

  except Exception as e:
- error_msg = f"Gemini API error: {e}"
- # Enhanced error logging with structured details
- log_stream_chunk(
- "backend.gemini",
- "stream_error",
- {"error_type": type(e).__name__, "error_message": str(e)},
- agent_id,
- )
- yield StreamChunk(type="error", error=error_msg)
+ logger.error(f"[Gemini] Error in stream_with_tools: {e}")
+ raise
+
  finally:
- # Cleanup resources
- await self.mcp_manager.cleanup_genai_resources(stream, client)
- # Ensure context manager exit for MCP cleanup
- try:
- await self.__aexit__(None, None, None)
- except Exception as e:
- log_backend_activity(
- "gemini",
- "MCP cleanup failed",
- {"error": str(e)},
- agent_id=self.agent_id,
- )
+ await self._cleanup_genai_resources(stream, client)

- def get_provider_name(self) -> str:
- """Get the provider name."""
- return "Gemini"
+ async def _try_close_resource(
+ self,
+ resource: Any,
+ method_names: tuple,
+ resource_label: str,
+ ) -> bool:
+ """Try to close a resource using one of the provided method names.

- def get_filesystem_support(self) -> FilesystemSupport:
- """Gemini supports filesystem through MCP servers."""
- return FilesystemSupport.MCP
+ Args:
+ resource: Object to close
+ method_names: Method names to try (e.g., ("aclose", "close"))
+ resource_label: Label for error logging

- def get_supported_builtin_tools(self) -> List[str]:
- """Get list of builtin tools supported by Gemini."""
- return ["google_search_retrieval", "code_execution"]
+ Returns:
+ True if closed successfully, False otherwise
+ """
+ if resource is None:
+ return False

- def get_mcp_results(self) -> Dict[str, Any]:
+ for method_name in method_names:
+ close_method = getattr(resource, method_name, None)
+ if close_method is not None:
+ try:
+ result = close_method()
+ if hasattr(result, "__await__"):
+ await result
+ return True
+ except Exception as e:
+ log_backend_activity(
+ "gemini",
+ f"{resource_label} cleanup failed",
+ {"error": str(e), "method": method_name},
+ agent_id=self.agent_id,
+ )
+ return False
+ return False
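_try_close_resource is deliberately duck-typed: it probes each candidate method name, calls the first one present, and awaits the result only when it is awaitable, so one helper serves both sync and async resources. A self-contained demonstration of the same pattern:

    import asyncio

    async def try_close(resource, method_names=("aclose", "close")) -> bool:
        """Close a resource via the first available method, sync or async."""
        for name in method_names:
            method = getattr(resource, name, None)
            if method is None:
                continue
            result = method()
            if hasattr(result, "__await__"):  # awaitable: finish it
                await result
            return True
        return False

    class SyncThing:
        def close(self):
            print("sync close")

    class AsyncThing:
        async def aclose(self):
            print("async aclose")

    async def main():
        await try_close(SyncThing())   # prints "sync close"
        await try_close(AsyncThing())  # prints "async aclose"

    asyncio.run(main())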
+
+ async def _cleanup_genai_resources(self, stream, client) -> None:
+ """Cleanup google-genai resources to avoid unclosed aiohttp sessions.
+
+ Cleanup order is critical: stream → session → transport → client.
+ Each resource is cleaned independently with error isolation.
  """
- Get all captured MCP tool calls and responses.
+ # 1. Close stream
+ await self._try_close_resource(stream, ("aclose", "close"), "Stream")
+
+ # 2. Close internal aiohttp session (requires special handling)
+ if client is not None:
+ base_client = getattr(client, "_api_client", None)
+ if base_client is not None:
+ session = getattr(base_client, "_aiohttp_session", None)
+ if session is not None and not getattr(session, "closed", True):
+ try:
+ await session.close()
+ log_backend_activity(
+ "gemini",
+ "Closed google-genai aiohttp session",
+ {},
+ agent_id=self.agent_id,
+ )
+ base_client._aiohttp_session = None
+ # Yield control to allow connector cleanup
+ await asyncio.sleep(0)
+ except Exception as e:
+ log_backend_activity(
+ "gemini",
+ "Failed to close google-genai aiohttp session",
+ {"error": str(e)},
+ agent_id=self.agent_id,
+ )

- Returns:
- Dict containing:
- - calls: List of all MCP tool calls
- - responses: List of all MCP tool responses
- - pairs: List of matched call-response pairs
- - summary: Statistical summary of interactions
+ # 3. Close internal async transport
+ if client is not None:
+ aio_obj = getattr(client, "aio", None)
+ await self._try_close_resource(aio_obj, ("close", "stop"), "Client AIO")
+
+ # 4. Close client
+ await self._try_close_resource(client, ("aclose", "close"), "Client")
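One subtle line above is the await asyncio.sleep(0) after closing the session: closing an aiohttp ClientSession only schedules the connector's transports for shutdown, and yielding one loop iteration lets that finish before the loop is torn down. A minimal reproduction of the pattern (assumes aiohttp is installed; the zero-sleep is a commonly recommended workaround for "Unclosed connector" warnings, not an API requirement):

    import asyncio
    import aiohttp

    async def use_and_close() -> None:
        session = aiohttp.ClientSession()
        try:
            pass  # ... issue requests with the session ...
        finally:
            await session.close()
            # Give the event loop one iteration so the connector's
            # transports can complete their shutdown.
            await asyncio.sleep(0)

    asyncio.run(use_and_close())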
+
+ def _append_tool_result_message(
+ self,
+ updated_messages: List[Dict[str, Any]],
+ call: Dict[str, Any],
+ result: Any,
+ tool_type: str,
+ ) -> None:
+ """Append tool result to messages in Gemini conversation format.
+
+ Gemini uses a different message format than OpenAI/Response API.
+ We need to append messages in a format that Gemini SDK can understand
+ when making recursive calls.
+
+ Args:
+ updated_messages: Message list to append to
+ call: Tool call dictionary with call_id, name, arguments
+ result: Tool execution result
+ tool_type: "custom" or "mcp"
  """
- return {
- "calls": self.mcp_extractor.mcp_calls,
- "responses": self.mcp_extractor.mcp_responses,
- "pairs": self.mcp_extractor.call_response_pairs,
- "summary": self.mcp_extractor.get_summary(),
+ tool_result_msg = {
+ "role": "tool",
+ "name": call.get("name", ""),
+ "content": str(result),
  }
+ updated_messages.append(tool_result_msg)

- def get_mcp_paired_results(self) -> List[Dict[str, Any]]:
- """
- Get only the paired MCP tool calls and responses.
+ tool_results_store = getattr(self, "_active_tool_result_store", None)
+ call_id = call.get("call_id")
+ if isinstance(tool_results_store, dict) and call_id:
+ tool_results_store[call_id] = str(result)

- Returns:
- List of dictionaries containing matched call-response pairs
- """
- return self.mcp_extractor.call_response_pairs
+ def _append_tool_error_message(
+ self,
+ updated_messages: List[Dict[str, Any]],
+ call: Dict[str, Any],
+ error_msg: str,
+ tool_type: str,
+ ) -> None:
+ """Append tool error to messages in Gemini conversation format.

- def get_mcp_summary(self) -> Dict[str, Any]:
+ Args:
+ updated_messages: Message list to append to
+ call: Tool call dictionary with call_id, name, arguments
+ error_msg: Error message string
+ tool_type: "custom" or "mcp"
  """
- Get a summary of MCP tool interactions.
+ # Append error as function result
+ error_result_msg = {
+ "role": "tool",
+ "name": call.get("name", ""),
+ "content": f"Error: {error_msg}",
+ }
+ updated_messages.append(error_result_msg)

- Returns:
- Dictionary with statistics about MCP tool usage
+ tool_results_store = getattr(self, "_active_tool_result_store", None)
+ call_id = call.get("call_id")
+ if isinstance(tool_results_store, dict) and call_id:
+ tool_results_store[call_id] = f"Error: {error_msg}"
+
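Both _append_tool_result_message and _append_tool_error_message mirror their payload into _active_tool_result_store, the per-round dict the continuation loop later reads results from by call_id. A stripped-down sketch of that round-trip (the class here is illustrative only):

    from typing import Dict, Optional

    class StoreSketch:
        # Illustrative: in the diff the store is a plain dict the streaming
        # code installs before a tool round and clears afterwards.
        def __init__(self) -> None:
            self._active_tool_result_store: Optional[Dict[str, str]] = None

        def record(self, call: dict, result: str) -> None:
            store = getattr(self, "_active_tool_result_store", None)
            call_id = call.get("call_id")
            if isinstance(store, dict) and call_id:
                store[call_id] = result

    backend = StoreSketch()
    tool_results: Dict[str, str] = {}
    backend._active_tool_result_store = tool_results      # round begins
    backend.record({"call_id": "call_0", "name": "add"}, "4")
    backend._active_tool_result_store = None              # round ends
    print(tool_results)  # {'call_0': '4'}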
+ async def _execute_custom_tool(self, call: Dict[str, Any]) -> AsyncGenerator[CustomToolChunk, None]:
+ """Execute custom tool with streaming support - async generator for base class.
+
+ This method is called by _execute_tool_with_logging and yields CustomToolChunk
+ objects for intermediate streaming output. The base class detects the async
+ generator and streams intermediate results to users in real-time.
+
+ Args:
+ call: Tool call dictionary with name and arguments
+
+ Yields:
+ CustomToolChunk objects with streaming data
+
+ Note:
+ - Intermediate chunks (completed=False) are streamed to users in real-time
+ - Final chunk (completed=True) contains the accumulated result for message history
+ - The base class automatically handles extracting and displaying intermediate chunks
  """
- return self.mcp_extractor.get_summary()
+ async for chunk in self.stream_custom_tool_execution(call):
+ yield chunk
+
+ def get_provider_name(self) -> str:
+ """Get the provider name."""
+ return "Gemini"
+
+ def get_filesystem_support(self) -> FilesystemSupport:
+ """Gemini supports filesystem through MCP servers."""
+ return FilesystemSupport.MCP

- def clear_mcp_results(self):
- """Clear all stored MCP interaction data."""
- self.mcp_extractor.clear()
+ def get_supported_builtin_tools(self) -> List[str]:
+ """Get list of builtin tools supported by Gemini."""
+ return ["google_search_retrieval", "code_execution"]

  def reset_tool_usage(self):
  """Reset tool usage tracking."""
  self.search_count = 0
  self.code_execution_count = 0
- # Reset MCP monitoring metrics
- self._mcp_tool_calls_count = 0
- self._mcp_tool_failures = 0
- self._mcp_tool_successes = 0
- self._mcp_connection_retries = 0
- # Clear MCP extractor data
- self.mcp_extractor.clear()
+ # Reset MCP monitoring metrics when available
+ for attr in (
+ "_mcp_tool_calls_count",
+ "_mcp_tool_failures",
+ "_mcp_tool_successes",
+ "_mcp_connection_retries",
+ ):
+ if hasattr(self, attr):
+ setattr(self, attr, 0)
  super().reset_token_usage()

  async def cleanup_mcp(self):
  """Cleanup MCP connections - override parent class to use Gemini-specific cleanup."""
- if self._mcp_client:
+ if MCPResourceManager:
  try:
- await self._mcp_client.disconnect()
- log_backend_activity("gemini", "MCP client disconnected", {}, agent_id=self.agent_id)
- except (
- MCPConnectionError,
- MCPTimeoutError,
- MCPServerError,
- MCPError,
- Exception,
- ) as e:
+ await super().cleanup_mcp()
+ return
+ except Exception as error:
+ log_backend_activity(
+ "gemini",
+ "MCP cleanup via resource manager failed",
+ {"error": str(error)},
+ agent_id=self.agent_id,
+ )
+ # Fall back to manual cleanup below
+
+ if not self._mcp_client:
+ return
+
+ try:
+ await self._mcp_client.disconnect()
+ log_backend_activity("gemini", "MCP client disconnected", {}, agent_id=self.agent_id)
+ except (
+ MCPConnectionError,
+ MCPTimeoutError,
+ MCPServerError,
+ MCPError,
+ Exception,
+ ) as e:
+ if MCPErrorHandler:
  MCPErrorHandler.get_error_details(e, "disconnect", log=True)
- finally:
- self._mcp_client = None
- self._mcp_initialized = False
- # Also clear parent class attributes if they exist (for compatibility)
- if hasattr(self, "_mcp_functions"):
- self._mcp_functions.clear()
- if hasattr(self, "_mcp_function_names"):
- self._mcp_function_names.clear()
+ else:
+ logger.exception("[Gemini] MCP disconnect error during cleanup")
+ finally:
+ self._mcp_client = None
+ self._mcp_initialized = False
+ if hasattr(self, "_mcp_functions"):
+ self._mcp_functions.clear()
+ if hasattr(self, "_mcp_function_names"):
+ self._mcp_function_names.clear()

  async def __aenter__(self) -> "GeminiBackend":
  """Async context manager entry."""
- try:
- await self.mcp_manager.setup_mcp_tools(agent_id=self.agent_id)
- except Exception as e:
- log_backend_activity(
- "gemini",
- "MCP setup failed during context entry",
- {"error": str(e)},
- agent_id=self.agent_id,
- )
+ # Call parent class __aenter__ which handles MCP setup
+ await super().__aenter__()
  return self

  async def __aexit__(
@@ -1984,11 +1436,15 @@ class GeminiBackend(CustomToolAndMCPBackend):
  # Parameters are required by context manager protocol but not used
  _ = (exc_type, exc_val, exc_tb)
  try:
- await self.cleanup_mcp()
- except Exception as e:
- log_backend_activity(
- "gemini",
- "Backend cleanup error",
- {"error": str(e)},
- agent_id=self.agent_id,
- )
+ await super().__aexit__(exc_type, exc_val, exc_tb)
+ finally:
+ if not MCPResourceManager:
+ try:
+ await self.cleanup_mcp()
+ except Exception as e:
+ log_backend_activity(
+ "gemini",
+ "Backend cleanup error",
+ {"error": str(e)},
+ agent_id=self.agent_id,
+ )