PyPI - massgen - Versions diffs - 0.0.3__py3-none-any.whl → 0.1.0__py3-none-any.whl - Mend

massgen 0.0.3-py3-none-any.whl → 0.1.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of massgen might be problematic. Click here for more details.

Files changed (268) hide show

massgen/__init__.py +142 -8
massgen/adapters/__init__.py +29 -0
massgen/adapters/ag2_adapter.py +483 -0
massgen/adapters/base.py +183 -0
massgen/adapters/tests/__init__.py +0 -0
massgen/adapters/tests/test_ag2_adapter.py +439 -0
massgen/adapters/tests/test_agent_adapter.py +128 -0
massgen/adapters/utils/__init__.py +2 -0
massgen/adapters/utils/ag2_utils.py +236 -0
massgen/adapters/utils/tests/__init__.py +0 -0
massgen/adapters/utils/tests/test_ag2_utils.py +138 -0
massgen/agent_config.py +329 -55
massgen/api_params_handler/__init__.py +10 -0
massgen/api_params_handler/_api_params_handler_base.py +99 -0
massgen/api_params_handler/_chat_completions_api_params_handler.py +176 -0
massgen/api_params_handler/_claude_api_params_handler.py +113 -0
massgen/api_params_handler/_response_api_params_handler.py +130 -0
massgen/backend/__init__.py +39 -4
massgen/backend/azure_openai.py +385 -0
massgen/backend/base.py +341 -69
massgen/backend/base_with_mcp.py +1102 -0
massgen/backend/capabilities.py +386 -0
massgen/backend/chat_completions.py +577 -130
massgen/backend/claude.py +1033 -537
massgen/backend/claude_code.py +1203 -0
massgen/backend/cli_base.py +209 -0
massgen/backend/docs/BACKEND_ARCHITECTURE.md +126 -0
massgen/backend/{CLAUDE_API_RESEARCH.md → docs/CLAUDE_API_RESEARCH.md} +18 -18
massgen/backend/{GEMINI_API_DOCUMENTATION.md → docs/GEMINI_API_DOCUMENTATION.md} +9 -9
massgen/backend/docs/Gemini MCP Integration Analysis.md +1050 -0
massgen/backend/docs/MCP_IMPLEMENTATION_CLAUDE_BACKEND.md +177 -0
massgen/backend/docs/MCP_INTEGRATION_RESPONSE_BACKEND.md +352 -0
massgen/backend/docs/OPENAI_GPT5_MODELS.md +211 -0
massgen/backend/{OPENAI_RESPONSES_API_FORMAT.md → docs/OPENAI_RESPONSE_API_TOOL_CALLS.md} +3 -3
massgen/backend/docs/OPENAI_response_streaming.md +20654 -0
massgen/backend/docs/inference_backend.md +257 -0
massgen/backend/docs/permissions_and_context_files.md +1085 -0
massgen/backend/external.py +126 -0
massgen/backend/gemini.py +1850 -241
massgen/backend/grok.py +40 -156
massgen/backend/inference.py +156 -0
massgen/backend/lmstudio.py +171 -0
massgen/backend/response.py +1095 -322
massgen/chat_agent.py +131 -113
massgen/cli.py +1560 -275
massgen/config_builder.py +2396 -0
massgen/configs/BACKEND_CONFIGURATION.md +458 -0
massgen/configs/README.md +559 -216
massgen/configs/ag2/ag2_case_study.yaml +27 -0
massgen/configs/ag2/ag2_coder.yaml +34 -0
massgen/configs/ag2/ag2_coder_case_study.yaml +36 -0
massgen/configs/ag2/ag2_gemini.yaml +27 -0
massgen/configs/ag2/ag2_groupchat.yaml +108 -0
massgen/configs/ag2/ag2_groupchat_gpt.yaml +118 -0
massgen/configs/ag2/ag2_single_agent.yaml +21 -0
massgen/configs/basic/multi/fast_timeout_example.yaml +37 -0
massgen/configs/basic/multi/gemini_4o_claude.yaml +31 -0
massgen/configs/basic/multi/gemini_gpt5nano_claude.yaml +36 -0
massgen/configs/{gemini_4o_claude.yaml → basic/multi/geminicode_4o_claude.yaml} +3 -3
massgen/configs/basic/multi/geminicode_gpt5nano_claude.yaml +36 -0
massgen/configs/basic/multi/glm_gemini_claude.yaml +25 -0
massgen/configs/basic/multi/gpt4o_audio_generation.yaml +30 -0
massgen/configs/basic/multi/gpt4o_image_generation.yaml +31 -0
massgen/configs/basic/multi/gpt5nano_glm_qwen.yaml +26 -0
massgen/configs/basic/multi/gpt5nano_image_understanding.yaml +26 -0
massgen/configs/{three_agents_default.yaml → basic/multi/three_agents_default.yaml} +8 -4
massgen/configs/basic/multi/three_agents_opensource.yaml +27 -0
massgen/configs/basic/multi/three_agents_vllm.yaml +20 -0
massgen/configs/basic/multi/two_agents_gemini.yaml +19 -0
massgen/configs/{two_agents.yaml → basic/multi/two_agents_gpt5.yaml} +14 -6
massgen/configs/basic/multi/two_agents_opensource_lmstudio.yaml +31 -0
massgen/configs/basic/multi/two_qwen_vllm_sglang.yaml +28 -0
massgen/configs/{single_agent.yaml → basic/single/single_agent.yaml} +1 -1
massgen/configs/{single_flash2.5.yaml → basic/single/single_flash2.5.yaml} +1 -2
massgen/configs/basic/single/single_gemini2.5pro.yaml +16 -0
massgen/configs/basic/single/single_gpt4o_audio_generation.yaml +22 -0
massgen/configs/basic/single/single_gpt4o_image_generation.yaml +22 -0
massgen/configs/basic/single/single_gpt4o_video_generation.yaml +24 -0
massgen/configs/basic/single/single_gpt5nano.yaml +20 -0
massgen/configs/basic/single/single_gpt5nano_file_search.yaml +18 -0
massgen/configs/basic/single/single_gpt5nano_image_understanding.yaml +17 -0
massgen/configs/basic/single/single_gptoss120b.yaml +15 -0
massgen/configs/basic/single/single_openrouter_audio_understanding.yaml +15 -0
massgen/configs/basic/single/single_qwen_video_understanding.yaml +15 -0
massgen/configs/debug/code_execution/command_filtering_blacklist.yaml +29 -0
massgen/configs/debug/code_execution/command_filtering_whitelist.yaml +28 -0
massgen/configs/debug/code_execution/docker_verification.yaml +29 -0
massgen/configs/debug/skip_coordination_test.yaml +27 -0
massgen/configs/debug/test_sdk_migration.yaml +17 -0
massgen/configs/docs/DISCORD_MCP_SETUP.md +208 -0
massgen/configs/docs/TWITTER_MCP_ENESCINAR_SETUP.md +82 -0
massgen/configs/providers/azure/azure_openai_multi.yaml +21 -0
massgen/configs/providers/azure/azure_openai_single.yaml +19 -0
massgen/configs/providers/claude/claude.yaml +14 -0
massgen/configs/providers/gemini/gemini_gpt5nano.yaml +28 -0
massgen/configs/providers/local/lmstudio.yaml +11 -0
massgen/configs/providers/openai/gpt5.yaml +46 -0
massgen/configs/providers/openai/gpt5_nano.yaml +46 -0
massgen/configs/providers/others/grok_single_agent.yaml +19 -0
massgen/configs/providers/others/zai_coding_team.yaml +108 -0
massgen/configs/providers/others/zai_glm45.yaml +12 -0
massgen/configs/{creative_team.yaml → teams/creative/creative_team.yaml} +16 -6
massgen/configs/{travel_planning.yaml → teams/creative/travel_planning.yaml} +16 -6
massgen/configs/{news_analysis.yaml → teams/research/news_analysis.yaml} +16 -6
massgen/configs/{research_team.yaml → teams/research/research_team.yaml} +15 -7
massgen/configs/{technical_analysis.yaml → teams/research/technical_analysis.yaml} +16 -6
massgen/configs/tools/code-execution/basic_command_execution.yaml +25 -0
massgen/configs/tools/code-execution/code_execution_use_case_simple.yaml +41 -0
massgen/configs/tools/code-execution/docker_claude_code.yaml +32 -0
massgen/configs/tools/code-execution/docker_multi_agent.yaml +32 -0
massgen/configs/tools/code-execution/docker_simple.yaml +29 -0
massgen/configs/tools/code-execution/docker_with_resource_limits.yaml +32 -0
massgen/configs/tools/code-execution/multi_agent_playwright_automation.yaml +57 -0
massgen/configs/tools/filesystem/cc_gpt5_gemini_filesystem.yaml +34 -0
massgen/configs/tools/filesystem/claude_code_context_sharing.yaml +68 -0
massgen/configs/tools/filesystem/claude_code_flash2.5.yaml +43 -0
massgen/configs/tools/filesystem/claude_code_flash2.5_gptoss.yaml +49 -0
massgen/configs/tools/filesystem/claude_code_gpt5nano.yaml +31 -0
massgen/configs/tools/filesystem/claude_code_single.yaml +40 -0
massgen/configs/tools/filesystem/fs_permissions_test.yaml +87 -0
massgen/configs/tools/filesystem/gemini_gemini_workspace_cleanup.yaml +54 -0
massgen/configs/tools/filesystem/gemini_gpt5_filesystem_casestudy.yaml +30 -0
massgen/configs/tools/filesystem/gemini_gpt5nano_file_context_path.yaml +43 -0
massgen/configs/tools/filesystem/gemini_gpt5nano_protected_paths.yaml +45 -0
massgen/configs/tools/filesystem/gpt5mini_cc_fs_context_path.yaml +31 -0
massgen/configs/tools/filesystem/grok4_gpt5_gemini_filesystem.yaml +32 -0
massgen/configs/tools/filesystem/multiturn/grok4_gpt5_claude_code_filesystem_multiturn.yaml +58 -0
massgen/configs/tools/filesystem/multiturn/grok4_gpt5_gemini_filesystem_multiturn.yaml +58 -0
massgen/configs/tools/filesystem/multiturn/two_claude_code_filesystem_multiturn.yaml +47 -0
massgen/configs/tools/filesystem/multiturn/two_gemini_flash_filesystem_multiturn.yaml +48 -0
massgen/configs/tools/mcp/claude_code_discord_mcp_example.yaml +27 -0
massgen/configs/tools/mcp/claude_code_simple_mcp.yaml +35 -0
massgen/configs/tools/mcp/claude_code_twitter_mcp_example.yaml +32 -0
massgen/configs/tools/mcp/claude_mcp_example.yaml +24 -0
massgen/configs/tools/mcp/claude_mcp_test.yaml +27 -0
massgen/configs/tools/mcp/five_agents_travel_mcp_test.yaml +157 -0
massgen/configs/tools/mcp/five_agents_weather_mcp_test.yaml +103 -0
massgen/configs/tools/mcp/gemini_mcp_example.yaml +24 -0
massgen/configs/tools/mcp/gemini_mcp_filesystem_test.yaml +23 -0
massgen/configs/tools/mcp/gemini_mcp_filesystem_test_sharing.yaml +23 -0
massgen/configs/tools/mcp/gemini_mcp_filesystem_test_single_agent.yaml +17 -0
massgen/configs/tools/mcp/gemini_mcp_filesystem_test_with_claude_code.yaml +24 -0
massgen/configs/tools/mcp/gemini_mcp_test.yaml +27 -0
massgen/configs/tools/mcp/gemini_notion_mcp.yaml +52 -0
massgen/configs/tools/mcp/gpt5_nano_mcp_example.yaml +24 -0
massgen/configs/tools/mcp/gpt5_nano_mcp_test.yaml +27 -0
massgen/configs/tools/mcp/gpt5mini_claude_code_discord_mcp_example.yaml +38 -0
massgen/configs/tools/mcp/gpt_oss_mcp_example.yaml +25 -0
massgen/configs/tools/mcp/gpt_oss_mcp_test.yaml +28 -0
massgen/configs/tools/mcp/grok3_mini_mcp_example.yaml +24 -0
massgen/configs/tools/mcp/grok3_mini_mcp_test.yaml +27 -0
massgen/configs/tools/mcp/multimcp_gemini.yaml +111 -0
massgen/configs/tools/mcp/qwen_api_mcp_example.yaml +25 -0
massgen/configs/tools/mcp/qwen_api_mcp_test.yaml +28 -0
massgen/configs/tools/mcp/qwen_local_mcp_example.yaml +24 -0
massgen/configs/tools/mcp/qwen_local_mcp_test.yaml +27 -0
massgen/configs/tools/planning/five_agents_discord_mcp_planning_mode.yaml +140 -0
massgen/configs/tools/planning/five_agents_filesystem_mcp_planning_mode.yaml +151 -0
massgen/configs/tools/planning/five_agents_notion_mcp_planning_mode.yaml +151 -0
massgen/configs/tools/planning/five_agents_twitter_mcp_planning_mode.yaml +155 -0
massgen/configs/tools/planning/gpt5_mini_case_study_mcp_planning_mode.yaml +73 -0
massgen/configs/tools/web-search/claude_streamable_http_test.yaml +43 -0
massgen/configs/tools/web-search/gemini_streamable_http_test.yaml +43 -0
massgen/configs/tools/web-search/gpt5_mini_streamable_http_test.yaml +43 -0
massgen/configs/tools/web-search/gpt_oss_streamable_http_test.yaml +44 -0
massgen/configs/tools/web-search/grok3_mini_streamable_http_test.yaml +43 -0
massgen/configs/tools/web-search/qwen_api_streamable_http_test.yaml +44 -0
massgen/configs/tools/web-search/qwen_local_streamable_http_test.yaml +43 -0
massgen/coordination_tracker.py +708 -0
massgen/docker/README.md +462 -0
massgen/filesystem_manager/__init__.py +21 -0
massgen/filesystem_manager/_base.py +9 -0
massgen/filesystem_manager/_code_execution_server.py +545 -0
massgen/filesystem_manager/_docker_manager.py +477 -0
massgen/filesystem_manager/_file_operation_tracker.py +248 -0
massgen/filesystem_manager/_filesystem_manager.py +813 -0
massgen/filesystem_manager/_path_permission_manager.py +1261 -0
massgen/filesystem_manager/_workspace_tools_server.py +1815 -0
massgen/formatter/__init__.py +10 -0
massgen/formatter/_chat_completions_formatter.py +284 -0
massgen/formatter/_claude_formatter.py +235 -0
massgen/formatter/_formatter_base.py +156 -0
massgen/formatter/_response_formatter.py +263 -0
massgen/frontend/__init__.py +1 -2
massgen/frontend/coordination_ui.py +471 -286
massgen/frontend/displays/base_display.py +56 -11
massgen/frontend/displays/create_coordination_table.py +1956 -0
massgen/frontend/displays/rich_terminal_display.py +1259 -619
massgen/frontend/displays/simple_display.py +9 -4
massgen/frontend/displays/terminal_display.py +27 -68
massgen/logger_config.py +681 -0
massgen/mcp_tools/README.md +232 -0
massgen/mcp_tools/__init__.py +105 -0
massgen/mcp_tools/backend_utils.py +1035 -0
massgen/mcp_tools/circuit_breaker.py +195 -0
massgen/mcp_tools/client.py +894 -0
massgen/mcp_tools/config_validator.py +138 -0
massgen/mcp_tools/docs/circuit_breaker.md +646 -0
massgen/mcp_tools/docs/client.md +950 -0
massgen/mcp_tools/docs/config_validator.md +478 -0
massgen/mcp_tools/docs/exceptions.md +1165 -0
massgen/mcp_tools/docs/security.md +854 -0
massgen/mcp_tools/exceptions.py +338 -0
massgen/mcp_tools/hooks.py +212 -0
massgen/mcp_tools/security.py +780 -0
massgen/message_templates.py +342 -64
massgen/orchestrator.py +1515 -241
massgen/stream_chunk/__init__.py +35 -0
massgen/stream_chunk/base.py +92 -0
massgen/stream_chunk/multimodal.py +237 -0
massgen/stream_chunk/text.py +162 -0
massgen/tests/mcp_test_server.py +150 -0
massgen/tests/multi_turn_conversation_design.md +0 -8
massgen/tests/test_azure_openai_backend.py +156 -0
massgen/tests/test_backend_capabilities.py +262 -0
massgen/tests/test_backend_event_loop_all.py +179 -0
massgen/tests/test_chat_completions_refactor.py +142 -0
massgen/tests/test_claude_backend.py +15 -28
massgen/tests/test_claude_code.py +268 -0
massgen/tests/test_claude_code_context_sharing.py +233 -0
massgen/tests/test_claude_code_orchestrator.py +175 -0
massgen/tests/test_cli_backends.py +180 -0
massgen/tests/test_code_execution.py +679 -0
massgen/tests/test_external_agent_backend.py +134 -0
massgen/tests/test_final_presentation_fallback.py +237 -0
massgen/tests/test_gemini_planning_mode.py +351 -0
massgen/tests/test_grok_backend.py +7 -10
massgen/tests/test_http_mcp_server.py +42 -0
massgen/tests/test_integration_simple.py +198 -0
massgen/tests/test_mcp_blocking.py +125 -0
massgen/tests/test_message_context_building.py +29 -47
massgen/tests/test_orchestrator_final_presentation.py +48 -0
massgen/tests/test_path_permission_manager.py +2087 -0
massgen/tests/test_rich_terminal_display.py +14 -13
massgen/tests/test_timeout.py +133 -0
massgen/tests/test_v3_3agents.py +11 -12
massgen/tests/test_v3_simple.py +8 -13
massgen/tests/test_v3_three_agents.py +11 -18
massgen/tests/test_v3_two_agents.py +8 -13
massgen/token_manager/__init__.py +7 -0
massgen/token_manager/token_manager.py +400 -0
massgen/utils.py +52 -16
massgen/v1/agent.py +45 -91
massgen/v1/agents.py +18 -53
massgen/v1/backends/gemini.py +50 -153
massgen/v1/backends/grok.py +21 -54
massgen/v1/backends/oai.py +39 -111
massgen/v1/cli.py +36 -93
massgen/v1/config.py +8 -12
massgen/v1/logging.py +43 -127
massgen/v1/main.py +18 -32
massgen/v1/orchestrator.py +68 -209
massgen/v1/streaming_display.py +62 -163
massgen/v1/tools.py +8 -12
massgen/v1/types.py +9 -23
massgen/v1/utils.py +5 -23
massgen-0.1.0.dist-info/METADATA +1245 -0
massgen-0.1.0.dist-info/RECORD +273 -0
massgen-0.1.0.dist-info/entry_points.txt +2 -0
massgen/frontend/logging/__init__.py +0 -9
massgen/frontend/logging/realtime_logger.py +0 -197
massgen-0.0.3.dist-info/METADATA +0 -568
massgen-0.0.3.dist-info/RECORD +0 -76
massgen-0.0.3.dist-info/entry_points.txt +0 -2
massgen/backend/{Function calling openai responses.md → docs/Function calling openai responses.md} +0 -0
{massgen-0.0.3.dist-info → massgen-0.1.0.dist-info}/WHEEL +0 -0
{massgen-0.0.3.dist-info → massgen-0.1.0.dist-info}/licenses/LICENSE +0 -0
{massgen-0.0.3.dist-info → massgen-0.1.0.dist-info}/top_level.txt +0 -0

massgen/backend/claude.py CHANGED Viewed

@@ -1,5 +1,4 @@
-from __future__ import annotations
+# -*- coding: utf-8 -*-
 """
 Claude backend implementation using Anthropic's Messages API.
 Production-ready implementation with full multi-tool support.
@@ -20,14 +19,28 @@ Multi-Tool Capabilities:
 - Parallel and sequential tool execution supported
 - Perfect integration with MassGen StreamChunk pattern
 """
+from __future__ import annotations
-import os
+import base64
+import binascii
 import json
-from typing import Dict, List, Any, AsyncGenerator, Optional
-from .base import LLMBackend, StreamChunk
+import mimetypes
+import os
+from pathlib import Path
+from typing import Any, AsyncGenerator, Callable, Dict, List, Optional, Tuple
+import anthropic
+import httpx
+from ..api_params_handler import ClaudeAPIParamsHandler
+from ..formatter import ClaudeFormatter
+from ..logger_config import log_backend_agent_message, log_stream_chunk, logger
+from ..mcp_tools.backend_utils import MCPErrorHandler
+from .base import FilesystemSupport, StreamChunk
+from .base_with_mcp import MCPBackend, UploadFileError
-class ClaudeBackend(LLMBackend):
+class ClaudeBackend(MCPBackend):
     """Claude backend using Anthropic's Messages API with full multi-tool support."""
     def __init__(self, api_key: Optional[str] = None, **kwargs):
@@ -35,556 +48,1071 @@ class ClaudeBackend(LLMBackend):
         self.api_key = api_key or os.getenv("ANTHROPIC_API_KEY")
         self.search_count = 0  # Track web search usage for pricing
         self.code_session_hours = 0.0  # Track code execution usage
+        self.formatter = ClaudeFormatter()
+        self.api_params_handler = ClaudeAPIParamsHandler(self)
+        self._uploaded_file_ids: List[str] = []
+    def supports_upload_files(self) -> bool:
+        """Claude Vision supports inline images; Files API handles PDFs and text docs."""
-    def convert_tools_to_claude_format(
-        self, tools: List[Dict[str, Any]]
+        return True
+    async def stream_with_tools(
+        self,
+        messages: List[Dict[str, Any]],
+        tools: List[Dict[str, Any]],
+        **kwargs,
+    ) -> AsyncGenerator[StreamChunk, None]:
+        """Override to ensure Files API cleanup happens after streaming completes."""
+        try:
+            async for chunk in super().stream_with_tools(messages, tools, **kwargs):
+                yield chunk
+        finally:
+            await self._cleanup_files_api_resources(**kwargs)
+    async def _process_upload_files(
+        self,
+        messages: List[Dict[str, Any]],
+        all_params: Dict[str, Any],
     ) -> List[Dict[str, Any]]:
-        """Convert tools to Claude's expected format.
+        """Convert upload_files entries into Claude-compatible multimodal content."""
-        Input formats supported:
-        - Response API format: {"type": "function", "name": ..., "description": ..., "parameters": ...}
-        - Chat Completions format: {"type": "function", "function": {"name": ..., "description": ..., "parameters": ...}}
+        processed_messages = await super()._process_upload_files(messages, all_params)
+        if not processed_messages:
+            return processed_messages
-        Claude format: {"type": "function", "name": ..., "description": ..., "input_schema": ...}
-        """
-        if not tools:
-            return tools
-        converted_tools = []
-        for tool in tools:
-            if tool.get("type") == "function":
-                if "function" in tool:
-                    # Chat Completions format -> Claude custom tool
-                    func = tool["function"]
-                    converted_tools.append(
-                        {
-                            "type": "custom",
-                            "name": func["name"],
-                            "description": func["description"],
-                            "input_schema": func.get("parameters", {}),
-                        }
+        allowed_mime_types = {
+            "image/jpeg",
+            "image/png",
+            "image/gif",
+            "image/webp",
+        }
+        max_image_size_bytes = 5 * 1024 * 1024
+        for message in processed_messages:
+            content = message.get("content")
+            if not isinstance(content, list):
+                continue
+            converted_items: List[Dict[str, Any]] = []
+            for item in content:
+                if not isinstance(item, dict):
+                    converted_items.append(item)
+                    continue
+                item_type = item.get("type")
+                if item_type == "file_pending_upload":
+                    converted_items.append(item)
+                    continue
+                if item_type != "image":
+                    converted_items.append(item)
+                    continue
+                if "source" in item and isinstance(item["source"], dict):
+                    converted_items.append(item)
+                    continue
+                # Handle base64-encoded images
+                if "base64" in item:
+                    mime_type = (item.get("mime_type") or "").lower()
+                    if mime_type not in allowed_mime_types:
+                        raise UploadFileError(
+                            f"Unsupported Claude image MIME type: {mime_type or 'unknown'}",
+                        )
+                    try:
+                        decoded = base64.b64decode(item["base64"], validate=True)
+                    except binascii.Error as exc:
+                        raise UploadFileError("Invalid base64 image data") from exc
+                    if len(decoded) > max_image_size_bytes:
+                        raise UploadFileError(
+                            "Claude Vision image exceeds 5MB size limit",
+                        )
+                    converted_item = {key: value for key, value in item.items() if key not in {"base64", "mime_type"}}
+                    converted_item["type"] = "image"
+                    converted_item["source"] = {
+                        "type": "base64",
+                        "media_type": mime_type,
+                        "data": item["base64"],
+                    }
+                    logger.debug(
+                        "Converted base64 image for Claude Vision: %s",
+                        converted_item.get("source_path", "inline"),
                     )
-                elif "name" in tool and "description" in tool:
-                    # Response API format -> Claude custom tool
-                    converted_tools.append(
-                        {
-                            "type": "custom",
-                            "name": tool["name"],
-                            "description": tool["description"],
-                            "input_schema": tool.get("parameters", {}),
-                        }
+                    converted_items.append(converted_item)
+                    continue
+                # Handle URL-referenced images
+                if "url" in item:
+                    converted_item = {key: value for key, value in item.items() if key != "url"}
+                    converted_item["type"] = "image"
+                    converted_item["source"] = {
+                        "type": "url",
+                        "url": item["url"],
+                    }
+                    logger.debug(
+                        "Converted URL image for Claude Vision: %s",
+                        item["url"],
                     )
-                else:
-                    # Unknown format - keep as-is
-                    converted_tools.append(tool)
-            else:
-                # Non-function tool (builtin tools) - keep as-is
-                converted_tools.append(tool)
+                    converted_items.append(converted_item)
+                    continue
-        return converted_tools
+                # Handle Files API references
+                if "file_id" in item:
+                    converted_item = {key: value for key, value in item.items() if key != "file_id"}
+                    converted_item["type"] = "image"
+                    converted_item["source"] = {
+                        "type": "file",
+                        "file_id": item["file_id"],
+                    }
+                    logger.debug(
+                        "Attached Claude file_id reference for image: %s",
+                        item["file_id"],
+                    )
+                    converted_items.append(converted_item)
+                    continue
-    def convert_messages_to_claude_format(
-        self, messages: List[Dict[str, Any]]
-    ) -> tuple:
-        """Convert messages to Claude's expected format.
+                converted_items.append(item)
-        Handle different tool message formats and extract system message:
-        - Chat Completions tool message: {"role": "tool", "tool_call_id": "...", "content": "..."}
-        - Response API tool message: {"type": "function_call_output", "call_id": "...", "output": "..."}
-        - System messages: Extract and return separately for top-level system parameter
+            message["content"] = converted_items
-        Returns:
-            tuple: (converted_messages, system_message)
+        return processed_messages
+    async def _upload_files_via_files_api(
+        self,
+        messages: List[Dict[str, Any]],
+        client,
+        agent_id: Optional[str] = None,
+    ) -> List[Dict[str, Any]]:
+        """Upload files via Claude Files API and replace pending markers with document blocks.
+        Claude Files API only supports PDF and TXT files. Unsupported files are gracefully
+        skipped and replaced with informative text notes to maintain workflow continuity.
         """
-        converted_messages = []
-        system_message = ""
-        for message in messages:
-            if message.get("role") == "system":
-                # Extract system message for top-level parameter
-                system_message = message.get("content", "")
-            elif message.get("role") == "tool":
-                # Chat Completions tool message -> Claude tool result
-                converted_messages.append(
-                    {
-                        "role": "user",
-                        "content": [
-                            {
-                                "type": "tool_result",
-                                "tool_use_id": message.get("tool_call_id"),
-                                "content": message.get("content", ""),
-                            }
-                        ],
-                    }
-                )
-            elif message.get("type") == "function_call_output":
-                # Response API tool message -> Claude tool result
-                converted_messages.append(
-                    {
-                        "role": "user",
-                        "content": [
-                            {
-                                "type": "tool_result",
-                                "tool_use_id": message.get("call_id"),
-                                "content": message.get("output", ""),
-                            }
-                        ],
-                    }
-                )
-            elif message.get("role") == "assistant" and "tool_calls" in message:
-                # Assistant message with tool calls - convert to Claude format
-                content = []
+        # Claude Files API only supports PDF and TXT files
+        CLAUDE_FILES_API_SUPPORTED_EXTENSIONS = {".pdf", ".txt"}
+        CLAUDE_FILES_API_SUPPORTED_MIME_TYPES = {
+            "application/pdf",
+            "text/plain",
+            "text/txt",
+        }
-                # Add text content if present
-                if message.get("content"):
-                    content.append({"type": "text", "text": message["content"]})
+        # Find all file_pending_upload markers
+        file_locations: List[Tuple[int, int]] = []
+        for msg_idx, message in enumerate(messages):
+            content = message.get("content")
+            if not isinstance(content, list):
+                continue
+            for item_idx, item in enumerate(content):
+                if isinstance(item, dict) and item.get("type") == "file_pending_upload":
+                    file_locations.append((msg_idx, item_idx))
-                # Convert tool calls to Claude tool use format
-                for tool_call in message["tool_calls"]:
-                    tool_name = self.extract_tool_name(tool_call)
-                    tool_args = self.extract_tool_arguments(tool_call)
-                    tool_id = self.extract_tool_call_id(tool_call)
+        if not file_locations:
+            return messages
-                    content.append(
-                        {
-                            "type": "tool_use",
-                            "id": tool_id,
-                            "name": tool_name,
-                            "input": tool_args,
-                        }
+        httpx_client = None
+        try:
+            httpx_client = httpx.AsyncClient()
+            # Track uploaded file IDs, skipped files, failed uploads, and their corresponding locations
+            uploaded_files: List[Tuple[int, int, str]] = []  # (msg_idx, item_idx, file_id)
+            skipped_files: List[Tuple[int, int, str, str]] = []  # (msg_idx, item_idx, filename, reason)
+            failed_uploads: List[Tuple[int, int, str, str]] = []  # (msg_idx, item_idx, filename, reason)
+            for msg_idx, item_idx in file_locations:
+                marker = messages[msg_idx]["content"][item_idx]
+                source = marker.get("source")
+                file_path = marker.get("path")
+                url = marker.get("url")
+                mime_type = marker.get("mime_type", "application/octet-stream")
+                filename_hint = marker.get("filename") or marker.get("name")
+                # Validate file extension and MIME type for Claude Files API
+                file_ext = None
+                filename = None
+                if source == "local" and file_path:
+                    file_ext = Path(file_path).suffix.lower()
+                    filename = Path(file_path).name
+                    # Re-validate MIME type using mimetypes module for accuracy
+                    guessed_mime, _ = mimetypes.guess_type(file_path)
+                    if guessed_mime:
+                        mime_type = guessed_mime
+                elif source == "url" and url:
+                    # Extract extension from URL (strip query parameters and fragments)
+                    url_path = url.split("?")[0].split("#")[0]
+                    file_ext = Path(url_path).suffix.lower()
+                    filename = Path(url_path).name or url
+                    if not filename_hint:
+                        filename_hint = filename
+                    # Re-validate MIME type using mimetypes module
+                    guessed_mime, _ = mimetypes.guess_type(url_path)
+                    if guessed_mime:
+                        mime_type = guessed_mime
+                # Check if file type is supported (both extension and MIME type)
+                is_supported = False
+                skip_reason = None
+                if file_ext and file_ext.lower() in CLAUDE_FILES_API_SUPPORTED_EXTENSIONS:
+                    # Extension is supported, now check MIME type
+                    if mime_type and mime_type.lower() in CLAUDE_FILES_API_SUPPORTED_MIME_TYPES:
+                        is_supported = True
+                    else:
+                        skip_reason = f"MIME type '{mime_type}' not supported (extension {file_ext} is valid)"
+                else:
+                    skip_reason = f"File extension '{file_ext or 'unknown'}' not supported"
+                # If file is not supported, skip it gracefully and log warning
+                if not is_supported:
+                    logger.warning(
+                        f"[Agent {agent_id or 'default'}] Skipping unsupported file for Claude Files API: "
+                        f"{filename or file_path or url} - {skip_reason}. "
+                        f"Only PDF and TXT files are supported.",
                     )
+                    skipped_files.append((msg_idx, item_idx, filename or file_path or url or "unknown", skip_reason))
+                    continue
-                converted_messages.append({"role": "assistant", "content": content})
-            elif message.get("role") in ["user", "assistant"]:
-                # Keep user and assistant messages, skip system
-                converted_message = dict(message)
-                if isinstance(converted_message.get("content"), str):
-                    # Claude expects content to be text for simple messages
-                    pass  # String content is fine
-                converted_messages.append(converted_message)
+                try:
+                    if source == "local" and file_path:
+                        # Upload local file
+                        path_obj = Path(file_path)
+                        filename = path_obj.name
+                        with open(file_path, "rb") as f:
+                            file_bytes = f.read()
+                        uploaded_file = await client.beta.files.upload(
+                            file=(filename, file_bytes, mime_type),
+                        )
+                        file_id = getattr(uploaded_file, "id", None)
+                        if file_id:
+                            self._uploaded_file_ids.append(file_id)
+                            uploaded_files.append((msg_idx, item_idx, file_id))
+                            logger.info(
+                                f"[Agent {agent_id or 'default'}] Uploaded local file via Files API: {filename} -> {file_id}",
+                            )
+                        else:
+                            failure_reason = "Claude Files API response missing file_id"
+                            failed_uploads.append(
+                                (
+                                    msg_idx,
+                                    item_idx,
+                                    filename or filename_hint or file_path or "unknown",
+                                    failure_reason,
+                                ),
+                            )
+                            logger.warning(
+                                f"[Agent {agent_id or 'default'}] Failed to upload file via Files API: {failure_reason}",
+                            )
-        return converted_messages, system_message
+                    elif source == "url" and url:
+                        # Download and upload URL file
+                        response = await httpx_client.get(url, timeout=30.0)
+                        response.raise_for_status()
+                        # Enforce Claude Files API 500 MB size limit
+                        max_size_bytes = 500 * 1024 * 1024  # 500 MB
+                        content_length = response.headers.get("Content-Length")
+                        if content_length:
+                            file_size = int(content_length)
+                            if file_size > max_size_bytes:
+                                raise UploadFileError(
+                                    f"File size {file_size / (1024 * 1024):.2f} MB exceeds Claude Files API limit of 500 MB",
+                                )
-    async def stream_with_tools(
-        self, messages: List[Dict[str, Any]], tools: List[Dict[str, Any]], **kwargs
-    ) -> AsyncGenerator[StreamChunk, None]:
-        """Stream response using Claude's Messages API with full multi-tool support."""
-        try:
-            import anthropic
-            # Initialize client
-            client = anthropic.AsyncAnthropic(api_key=self.api_key)
-            # Extract parameters
-            model = kwargs.get(
-                "model", "claude-3-5-haiku-latest"
-            )  # Use model that supports code execution
-            max_tokens = kwargs.get("max_tokens", 8192)
-            temperature = kwargs.get("temperature", None)
-            enable_web_search = kwargs.get("enable_web_search", False)
-            enable_code_execution = kwargs.get("enable_code_execution", False)
-            # Convert messages to Claude format and extract system message
-            converted_messages, system_message = self.convert_messages_to_claude_format(
-                messages
-            )
+                        file_bytes = response.content
-            # Combine all tool types (Claude's key advantage!)
-            combined_tools = []
+                        # Cap bytes read if Content-Length was missing
+                        if len(file_bytes) > max_size_bytes:
+                            raise UploadFileError(
+                                f"Downloaded file size {len(file_bytes) / (1024 * 1024):.2f} MB exceeds Claude Files API limit of 500 MB",
+                            )
-            # Add server-side tools if enabled (use correct Claude format)
-            if enable_web_search:
-                combined_tools.append(
-                    {"type": "web_search_20250305", "name": "web_search"}
-                )
+                        filename = url.split("/")[-1] or "document"
+                        uploaded_file = await client.beta.files.upload(
+                            file=(filename, file_bytes, mime_type),
+                        )
+                        file_id = getattr(uploaded_file, "id", None)
+                        if file_id:
+                            self._uploaded_file_ids.append(file_id)
+                            uploaded_files.append((msg_idx, item_idx, file_id))
+                            logger.info(
+                                f"[Agent {agent_id or 'default'}] Uploaded URL file via Files API: {url} -> {file_id}",
+                            )
+                        else:
+                            failure_reason = "Claude Files API response missing file_id"
+                            failed_uploads.append(
+                                (
+                                    msg_idx,
+                                    item_idx,
+                                    filename or filename_hint or url or "unknown",
+                                    failure_reason,
+                                ),
+                            )
+                            logger.warning(
+                                f"[Agent {agent_id or 'default'}] Failed to upload file via Files API: {failure_reason}",
+                            )
-            if enable_code_execution:
-                combined_tools.append(
-                    {"type": "code_execution_20250522", "name": "code_execution"}
-                )
+                except Exception as upload_error:
+                    logger.warning(
+                        f"[Agent {agent_id or 'default'}] Failed to upload file via Files API: {upload_error}",
+                    )
+                    failure_context = filename or filename_hint or file_path or url or "unknown"
+                    failed_uploads.append((msg_idx, item_idx, failure_context, str(upload_error)))
+                    continue
-            # Add user-defined tools
-            if tools:
-                converted_tools = self.convert_tools_to_claude_format(tools)
-                combined_tools.extend(converted_tools)
-            # Build API parameters
-            api_params = {
-                "model": model,
-                "messages": converted_messages,
-                "max_tokens": max_tokens,
-                "stream": True,
-            }
+        except Exception as e:
+            logger.warning(f"[Agent {agent_id or 'default'}] Files API upload error: {e}")
+            raise UploadFileError(f"Files API upload failed: {e}") from e
+        finally:
+            if httpx_client:
+                await httpx_client.aclose()
+        # Clone messages and replace markers with document blocks or text notes
+        updated_messages = [msg.copy() for msg in messages]
+        # Replace successfully uploaded files with document blocks
+        for msg_idx, item_idx, file_id in reversed(uploaded_files):
+            content = updated_messages[msg_idx]["content"]
+            if isinstance(content, list):
+                # Create document block
+                document_block = {
+                    "type": "document",
+                    "source": {
+                        "type": "file",
+                        "file_id": file_id,
+                    },
+                }
+                # Replace marker with document block
+                new_content = content[:item_idx] + [document_block] + content[item_idx + 1 :]
+                updated_messages[msg_idx]["content"] = new_content
+        # Replace skipped files with informative text notes
+        for msg_idx, item_idx, filename, reason in reversed(skipped_files):
+            content = updated_messages[msg_idx]["content"]
+            if isinstance(content, list):
+                # Create text note explaining the limitation
+                text_note = {
+                    "type": "text",
+                    "text": (f"\n[Note: File '{filename}' was not uploaded to Claude Files API. " f"Reason: {reason}. " f"Claude Files API only supports PDF and TXT files.]\n"),
+                }
+                # Replace marker with text note
+                new_content = content[:item_idx] + [text_note] + content[item_idx + 1 :]
+                updated_messages[msg_idx]["content"] = new_content
+        # Replace failed uploads with informative text notes
+        for msg_idx, item_idx, filename, reason in reversed(failed_uploads):
+            content = updated_messages[msg_idx]["content"]
+            if isinstance(content, list):
+                text_note = {
+                    "type": "text",
+                    "text": (f"\n[Note: File '{filename}' failed to upload to Claude Files API. " f"Reason: {reason}.]\n"),
+                }
+                new_content = content[:item_idx] + [text_note] + content[item_idx + 1 :]
+                updated_messages[msg_idx]["content"] = new_content
-            if system_message:
-                api_params["system"] = system_message
+        # Final sweep to ensure all file_pending_upload markers were replaced
+        self._ensure_no_pending_upload_markers(updated_messages)
-            if temperature is not None:
-                api_params["temperature"] = temperature
+        return updated_messages
-            if combined_tools:
-                api_params["tools"] = combined_tools
+    async def _cleanup_files_api_resources(self, **kwargs) -> None:  # kwargs go to _create_client; "agent_id" is only used in log prefixes
+        """Clean up uploaded files via Files API."""
+        if not self._uploaded_file_ids:  # nothing tracked: return before creating a client
+            return
-            # Set up beta features and create stream
-            if enable_code_execution:
-                # Code execution requires beta client and beta headers
-                api_params["betas"] = ["code-execution-2025-05-22"]
-                stream = await client.beta.messages.create(**api_params)
-            else:
-                # Regular client for non-code-execution requests
-                stream = await client.messages.create(**api_params)
+        agent_id = kwargs.get("agent_id")
+        logger.info(
+            f"[Agent {agent_id or 'default'}] Cleaning up {len(self._uploaded_file_ids)} Files API resources...",
+        )
-            content = ""
-            current_tool_uses = {}
+        client = None  # stays None if _create_client raises, so the finally block can guard on it
+        try:
+            client = self._create_client(**kwargs)
-            async for event in stream:
+            for file_id in self._uploaded_file_ids:
                 try:
-                    if event.type == "message_start":
-                        # Message started
+                    await client.beta.files.delete(file_id)
+                    logger.debug(f"[Agent {agent_id or 'default'}] Deleted Files API file: {file_id}")
+                except Exception as delete_error:  # per-file failure is logged, not raised
+                    logger.warning(
+                        f"[Agent {agent_id or 'default'}] Failed to delete Files API file {file_id}: {delete_error}",
+                    )
+                    continue  # best effort: keep deleting the remaining ids
+            self._uploaded_file_ids.clear()  # NOTE(review): also forgets ids whose delete failed above, so they are never retried
+            logger.info(f"[Agent {agent_id or 'default'}] Files API cleanup completed")
+        except Exception as e:  # logged and swallowed: cleanup errors do not reach the caller
+            logger.warning(f"[Agent {agent_id or 'default'}] Files API cleanup error: {e}")
+        finally:
+            if client and hasattr(client, "aclose"):  # close only when a client exists and exposes aclose()
+                await client.aclose()
+    def _ensure_no_pending_upload_markers(self, messages: List[Dict[str, Any]]) -> None:  # validation only: returns None or raises
+        """Raise UploadFileError if any file_pending_upload markers remain."""
+        if not messages:  # None or empty list: nothing to scan
+            return
+        for msg_idx, message in enumerate(messages):
+            content = message.get("content")
+            if not isinstance(content, list):  # only list-form content is scanned for markers
+                continue
+            for item_idx, item in enumerate(content):
+                if isinstance(item, dict) and item.get("type") == "file_pending_upload":
+                    identifier = item.get("filename") or item.get("name") or item.get("path") or item.get("url") or "unknown"  # first non-empty key; used only in the error text
+                    raise UploadFileError(  # raised on the first marker found; any later markers are not reported
+                        "Claude Files API upload left unresolved file_pending_upload marker " f"(message {msg_idx}, item {item_idx}, source {identifier}).",
+                    )
+    async def _stream_without_mcp_tools(
+        self,
+        messages: List[Dict[str, Any]],
+        tools: List[Dict[str, Any]],
+        client,
+        **kwargs,
+    ) -> AsyncGenerator[StreamChunk, None]:
+        """Override to integrate Files API uploads into non-MCP streaming."""
+        agent_id = kwargs.get("agent_id", None)
+        all_params = {**self.config, **kwargs}  # per-call kwargs override entries from self.config
+        processed_messages = await self._process_upload_files(messages, all_params)
+        # Upload via the Files API only when the "_has_file_search_files" flag is truthy in all_params
+        if all_params.get("_has_file_search_files"):
+            logger.info("Processing Files API uploads...")
+            processed_messages = await self._upload_files_via_files_api(processed_messages, client, agent_id)
+            all_params["_has_files_api_files"] = True  # set the new flag; the old one is dropped on the next line
+            all_params.pop("_has_file_search_files", None)
+        self._ensure_no_pending_upload_markers(processed_messages)  # runs whether or not an upload happened
+        api_params = await self.api_params_handler.build_api_params(processed_messages, tools, all_params)
+        # Filter MCP tools out of the built params before calling the API
+        if "tools" in api_params:
+            non_mcp_tools = []
+            for tool in api_params.get("tools", []):
+                # Two shapes are treated as MCP: a "function" tool whose name is in self._mcp_function_names, or type "mcp"
+                if tool.get("type") == "function":
+                    name = tool.get("function", {}).get("name") if "function" in tool else tool.get("name")  # nested name if "function" key exists, else top-level
+                    if name and name in self._mcp_function_names:
                         continue
+                elif tool.get("type") == "mcp":
+                    continue
+                non_mcp_tools.append(tool)
+            if non_mcp_tools:
+                api_params["tools"] = non_mcp_tools
+            else:
+                api_params.pop("tools", None)  # nothing left: remove the key rather than keep an empty list
+        # Create the stream; the presence of a "betas" key selects the beta messages endpoint
+        if "betas" in api_params:
+            stream = await client.beta.messages.create(**api_params)
+        else:
+            stream = await client.messages.create(**api_params)
+        # Re-yield every chunk produced by _process_stream unchanged
+        async for chunk in self._process_stream(stream, all_params, agent_id):
+            yield chunk
+    async def _stream_with_mcp_tools(
+        self,
+        current_messages: List[Dict[str, Any]],
+        tools: List[Dict[str, Any]],
+        client,
+        **kwargs,
+    ) -> AsyncGenerator[StreamChunk, None]:
+        """Recursively stream responses, executing MCP function calls when detected."""
+        # Build API params for this iteration
+        all_params = {**self.config, **kwargs}
+        # Check if we need to upload files via Files API
+        if all_params.get("_has_file_search_files"):
+            logger.info("Processing Files API uploads in MCP mode...")
+            agent_id = kwargs.get("agent_id")
+            current_messages = await self._upload_files_via_files_api(current_messages, client, agent_id)
+            all_params["_has_files_api_files"] = True
+            all_params.pop("_has_file_search_files", None)
+        self._ensure_no_pending_upload_markers(current_messages)
-                    elif event.type == "content_block_start":
-                        # Content block started (text, tool use, or tool result)
-                        if hasattr(event, "content_block"):
-                            if event.content_block.type == "tool_use":
-                                # Regular tool use started (user-defined tools)
-                                tool_id = event.content_block.id
-                                tool_name = event.content_block.name
-                                current_tool_uses[tool_id] = {
-                                    "id": tool_id,
-                                    "name": tool_name,
-                                    "input": "",  # Will accumulate JSON fragments
-                                    "index": getattr(event, "index", None),
-                                }
-                            elif event.content_block.type == "server_tool_use":
-                                # Server-side tool use (code execution, web search) - show status immediately
-                                tool_id = event.content_block.id
-                                tool_name = event.content_block.name
-                                current_tool_uses[tool_id] = {
-                                    "id": tool_id,
-                                    "name": tool_name,
-                                    "input": "",  # Will accumulate JSON fragments
-                                    "index": getattr(event, "index", None),
-                                    "server_side": True,
-                                }
-                                # Show tool execution starting
+        api_params = await self.api_params_handler.build_api_params(current_messages, tools, all_params)
+        agent_id = kwargs.get("agent_id", None)
+        # Create stream (handle code execution beta)
+        if "betas" in api_params:
+            stream = await client.beta.messages.create(**api_params)
+        else:
+            stream = await client.messages.create(**api_params)
+        content = ""
+        current_tool_uses: Dict[str, Dict[str, Any]] = {}
+        mcp_tool_calls: List[Dict[str, Any]] = []
+        response_completed = False
+        async for event in stream:
+            try:
+                if event.type == "message_start":
+                    continue
+                elif event.type == "content_block_start":
+                    if hasattr(event, "content_block"):
+                        if event.content_block.type == "tool_use":
+                            tool_id = event.content_block.id
+                            tool_name = event.content_block.name
+                            current_tool_uses[tool_id] = {
+                                "id": tool_id,
+                                "name": tool_name,
+                                "input": "",
+                                "index": getattr(event, "index", None),
+                            }
+                        elif event.content_block.type == "server_tool_use":
+                            tool_id = event.content_block.id
+                            tool_name = event.content_block.name
+                            current_tool_uses[tool_id] = {
+                                "id": tool_id,
+                                "name": tool_name,
+                                "input": "",
+                                "index": getattr(event, "index", None),
+                                "server_side": True,
+                            }
+                            if tool_name == "code_execution":
+                                yield StreamChunk(
+                                    type="content",
+                                    content="\n💻 [Code Execution] Starting...\n",
+                                )
+                            elif tool_name == "web_search":
+                                yield StreamChunk(
+                                    type="content",
+                                    content="\n🔍 [Web Search] Starting search...\n",
+                                )
+                        elif event.content_block.type == "code_execution_tool_result":
+                            result_block = event.content_block
+                            result_parts = []
+                            if hasattr(result_block, "stdout") and result_block.stdout:
+                                result_parts.append(f"Output: {result_block.stdout.strip()}")
+                            if hasattr(result_block, "stderr") and result_block.stderr:
+                                result_parts.append(f"Error: {result_block.stderr.strip()}")
+                            if hasattr(result_block, "return_code") and result_block.return_code != 0:
+                                result_parts.append(f"Exit code: {result_block.return_code}")
+                            if result_parts:
+                                result_text = f"\n💻 [Code Execution Result]\n{chr(10).join(result_parts)}\n"
+                                yield StreamChunk(type="content", content=result_text)
+                elif event.type == "content_block_delta":
+                    if hasattr(event, "delta"):
+                        if event.delta.type == "text_delta":
+                            text_chunk = event.delta.text
+                            content += text_chunk
+                            log_backend_agent_message(
+                                agent_id or "default",
+                                "RECV",
+                                {"content": text_chunk},
+                                backend_name="claude",
+                            )
+                            log_stream_chunk("backend.claude", "content", text_chunk, agent_id)
+                            yield StreamChunk(type="content", content=text_chunk)
+                        elif event.delta.type == "input_json_delta":
+                            if hasattr(event, "index"):
+                                for tool_id, tool_data in current_tool_uses.items():
+                                    if tool_data.get("index") == event.index:
+                                        partial_json = getattr(event.delta, "partial_json", "")
+                                        tool_data["input"] += partial_json
+                                        break
+                elif event.type == "content_block_stop":
+                    if hasattr(event, "index"):
+                        for tool_id, tool_data in current_tool_uses.items():
+                            if tool_data.get("index") == event.index and tool_data.get("server_side"):
+                                tool_name = tool_data.get("name", "")
+                                tool_input = tool_data.get("input", "")
+                                try:
+                                    parsed_input = json.loads(tool_input) if tool_input else {}
+                                except json.JSONDecodeError:
+                                    parsed_input = {"raw_input": tool_input}
                                 if tool_name == "code_execution":
+                                    code = parsed_input.get("code", "")
+                                    if code:
+                                        yield StreamChunk(type="content", content=f"💻 [Code] {code}\n")
                                     yield StreamChunk(
                                         type="content",
-                                        content=f"\n💻 [Code Execution] Starting...\n",
+                                        content="✅ [Code Execution] Completed\n",
                                     )
                                 elif tool_name == "web_search":
+                                    query = parsed_input.get("query", "")
+                                    if query:
+                                        yield StreamChunk(
+                                            type="content",
+                                            content=f"🔍 [Query] '{query}'\n",
+                                        )
                                     yield StreamChunk(
                                         type="content",
-                                        content=f"\n🔍 [Web Search] Starting search...\n",
-                                    )
-                            elif (
-                                event.content_block.type == "code_execution_tool_result"
-                            ):
-                                # Code execution result - format properly
-                                result_block = event.content_block
-                                # Format execution result nicely
-                                result_parts = []
-                                if (
-                                    hasattr(result_block, "stdout")
-                                    and result_block.stdout
-                                ):
-                                    result_parts.append(
-                                        f"Output: {result_block.stdout.strip()}"
-                                    )
-                                if (
-                                    hasattr(result_block, "stderr")
-                                    and result_block.stderr
-                                ):
-                                    result_parts.append(
-                                        f"Error: {result_block.stderr.strip()}"
-                                    )
-                                if (
-                                    hasattr(result_block, "return_code")
-                                    and result_block.return_code != 0
-                                ):
-                                    result_parts.append(
-                                        f"Exit code: {result_block.return_code}"
+                                        content="✅ [Web Search] Completed\n",
                                     )
+                                tool_data["processed"] = True
+                                break
+                elif event.type == "message_delta":
+                    pass
+                elif event.type == "message_stop":
+                    # Identify MCP and non-MCP tool calls among current_tool_uses
+                    non_mcp_tool_calls = []
+                    if current_tool_uses:
+                        for tool_use in current_tool_uses.values():
+                            tool_name = tool_use.get("name", "")
+                            is_server_side = tool_use.get("server_side", False)
+                            if is_server_side:
+                                continue
+                            # Parse accumulated JSON input for tool
+                            tool_input = tool_use.get("input", "")
+                            try:
+                                parsed_input = json.loads(tool_input) if tool_input else {}
+                            except json.JSONDecodeError:
+                                parsed_input = {"raw_input": tool_input}
+                            if self.is_mcp_tool_call(tool_name):
+                                mcp_tool_calls.append(
+                                    {
+                                        "id": tool_use["id"],
+                                        "type": "function",
+                                        "function": {
+                                            "name": tool_name,
+                                            "arguments": parsed_input,
+                                        },
+                                    },
+                                )
+                            else:
+                                non_mcp_tool_calls.append(
+                                    {
+                                        "id": tool_use["id"],
+                                        "type": "function",
+                                        "function": {
+                                            "name": tool_name,
+                                            "arguments": parsed_input,
+                                        },
+                                    },
+                                )
+                    # Emit non-MCP tool calls for the caller to execute
+                    if non_mcp_tool_calls:
+                        log_stream_chunk("backend.claude", "tool_calls", non_mcp_tool_calls, agent_id)
+                        yield StreamChunk(type="tool_calls", tool_calls=non_mcp_tool_calls)
+                    response_completed = True
+                    break
+            except Exception as event_error:
+                error_msg = f"Event processing error: {event_error}"
+                log_stream_chunk("backend.claude", "error", error_msg, agent_id)
+                yield StreamChunk(type="error", error=error_msg)
+                continue
+        # If we captured MCP tool calls, execute them and recurse
+        if response_completed and mcp_tool_calls:
+            # Circuit breaker pre-execution check using base class method
+            if not await self._check_circuit_breaker_before_execution():
+                yield StreamChunk(
+                    type="mcp_status",
+                    status="mcp_blocked",
+                    content="⚠️ [MCP] All servers blocked by circuit breaker",
+                    source="circuit_breaker",
+                )
+                yield StreamChunk(type="done")
+                return
-                                if result_parts:
-                                    result_text = f"\n💻 [Code Execution Result]\n{chr(10).join(result_parts)}\n"
-                                    yield StreamChunk(
-                                        type="content", content=result_text
-                                    )
+            updated_messages = current_messages.copy()
-                    elif event.type == "content_block_delta":
-                        # Content streaming
-                        if hasattr(event, "delta"):
-                            if event.delta.type == "text_delta":
-                                # Text content
-                                text_chunk = event.delta.text
-                                content += text_chunk
-                                yield StreamChunk(type="content", content=text_chunk)
-                            elif event.delta.type == "input_json_delta":
-                                # Tool input streaming - accumulate JSON fragments
-                                if hasattr(event, "index"):
-                                    # Find tool by index
-                                    for tool_id, tool_data in current_tool_uses.items():
-                                        if tool_data.get("index") == event.index:
-                                            # Accumulate partial JSON
-                                            partial_json = getattr(
-                                                event.delta, "partial_json", ""
-                                            )
-                                            tool_data["input"] += partial_json
-                                            break
-                    elif event.type == "content_block_stop":
-                        # Content block completed - check if it was a server-side tool
-                        if hasattr(event, "index"):
-                            # Find the tool that just completed
-                            for tool_id, tool_data in current_tool_uses.items():
-                                if tool_data.get(
-                                    "index"
-                                ) == event.index and tool_data.get("server_side"):
-                                    tool_name = tool_data.get("name", "")
-                                    # Parse the accumulated input to show what was executed
-                                    tool_input = tool_data.get("input", "")
-                                    try:
-                                        if tool_input:
-                                            parsed_input = json.loads(tool_input)
-                                        else:
-                                            parsed_input = {}
-                                    except json.JSONDecodeError:
-                                        parsed_input = {"raw_input": tool_input}
-                                    if tool_name == "code_execution":
-                                        code = parsed_input.get("code", "")
-                                        if code:
-                                            yield StreamChunk(
-                                                type="content",
-                                                content=f"💻 [Code] {code}\n",
-                                            )
-                                        yield StreamChunk(
-                                            type="content",
-                                            content=f"✅ [Code Execution] Completed\n",
-                                        )
+            # Build assistant message with tool_use blocks for all MCP tool calls
+            assistant_content = []
+            if content:  # Add text content if any
+                assistant_content.append({"type": "text", "text": content})
-                                        # Yield builtin tool result immediately
-                                        builtin_result = {
-                                            "id": tool_id,
-                                            "tool_type": "code_execution",
-                                            "status": "completed",
-                                            "code": code,
-                                            "input": parsed_input,
-                                        }
-                                        yield StreamChunk(
-                                            type="builtin_tool_results",
-                                            builtin_tool_results=[builtin_result],
-                                        )
+            for tool_call in mcp_tool_calls:
+                tool_name = tool_call["function"]["name"]
+                tool_args = tool_call["function"]["arguments"]
+                tool_id = tool_call["id"]
-                                    elif tool_name == "web_search":
-                                        query = parsed_input.get("query", "")
-                                        if query:
-                                            yield StreamChunk(
-                                                type="content",
-                                                content=f"🔍 [Query] '{query}'\n",
-                                            )
-                                        yield StreamChunk(
-                                            type="content",
-                                            content=f"✅ [Web Search] Completed\n",
-                                        )
+                assistant_content.append(
+                    {
+                        "type": "tool_use",
+                        "id": tool_id,
+                        "name": tool_name,
+                        "input": tool_args,
+                    },
+                )
-                                        # Yield builtin tool result immediately
-                                        builtin_result = {
-                                            "id": tool_id,
-                                            "tool_type": "web_search",
-                                            "status": "completed",
-                                            "query": query,
-                                            "input": parsed_input,
-                                        }
-                                        yield StreamChunk(
-                                            type="builtin_tool_results",
-                                            builtin_tool_results=[builtin_result],
-                                        )
+            # Append the assistant message with tool uses
+            updated_messages.append({"role": "assistant", "content": assistant_content})
-                                    # Mark this tool as processed so we don't duplicate it later
-                                    tool_data["processed"] = True
-                                    break
+            # Now execute the MCP tool calls and append results
+            for tool_call in mcp_tool_calls:
+                function_name = tool_call["function"]["name"]
-                    elif event.type == "message_delta":
-                        # Message metadata updates (usage, etc.)
-                        if hasattr(event, "usage"):
-                            # Track token usage
-                            pass
+                # Yield MCP tool call status
+                yield StreamChunk(
+                    type="mcp_status",
+                    status="mcp_tool_called",
+                    content=f"🔧 [MCP Tool] Calling {function_name}...",
+                    source=f"mcp_{function_name}",
+                )
-                    elif event.type == "message_stop":
-                        # Message completed - build final response
+                try:
+                    # Execute MCP function
+                    args_json = json.dumps(tool_call["function"]["arguments"]) if isinstance(tool_call["function"].get("arguments"), (dict, list)) else tool_call["function"].get("arguments", "{}")
+                    result_list = await self._execute_mcp_function_with_retry(function_name, args_json)
+                    if not result_list or (isinstance(result_list[0], str) and result_list[0].startswith("Error:")):
+                        logger.warning(f"MCP function {function_name} failed after retries: {result_list[0] if result_list else 'unknown error'}")
+                        continue
+                    result_str = result_list[0]
+                    result_obj = result_list[1] if len(result_list) > 1 else None
+                except Exception as e:
+                    logger.error(f"Unexpected error in MCP function execution: {e}")
+                    continue
-                        # Handle any completed tool uses
-                        if current_tool_uses:
-                            # Separate server-side tools from user-defined tools
-                            builtin_tool_results = []
-                            user_tool_calls = []
+                # Build tool result message: { "role":"user", "content":[{ "type":"tool_result", "tool_use_id": tool_call["id"], "content": result_str }] }
+                tool_result_msg = {
+                    "role": "user",
+                    "content": [
+                        {
+                            "type": "tool_result",
+                            "tool_use_id": tool_call["id"],
+                            "content": result_str,
+                        },
+                    ],
+                }
-                            for tool_use in current_tool_uses.values():
-                                tool_name = tool_use.get("name", "")
-                                is_server_side = tool_use.get("server_side", False)
+                # Append to updated_messages
+                updated_messages.append(tool_result_msg)
-                                # Parse accumulated JSON input
-                                tool_input = tool_use.get("input", "")
-                                try:
-                                    if tool_input:
-                                        parsed_input = json.loads(tool_input)
-                                    else:
-                                        parsed_input = {}
-                                except json.JSONDecodeError:
-                                    parsed_input = {"raw_input": tool_input}
+                yield StreamChunk(
+                    type="mcp_status",
+                    status="function_call",
+                    content=f"Arguments for Calling {function_name}: {json.dumps(tool_call['function'].get('arguments', {}))}",
+                    source=f"mcp_{function_name}",
+                )
-                                if is_server_side or tool_name in [
-                                    "web_search",
-                                    "code_execution",
-                                ]:
-                                    # Convert server-side tools to builtin_tool_results
-                                    builtin_result = {
-                                        "id": tool_use["id"],
-                                        "tool_type": tool_name,
-                                        "status": "completed",
-                                        "input": parsed_input,
-                                    }
-                                    # Add tool-specific data
-                                    if tool_name == "code_execution":
-                                        builtin_result["code"] = parsed_input.get(
-                                            "code", ""
-                                        )
-                                        # Note: actual execution results come via content_block events
-                                    elif tool_name == "web_search":
-                                        builtin_result["query"] = parsed_input.get(
-                                            "query", ""
-                                        )
-                                        # Note: search results come via content_block events
-                                    builtin_tool_results.append(builtin_result)
-                                else:
-                                    # User-defined tools that need external execution
-                                    user_tool_calls.append(
-                                        {
-                                            "id": tool_use["id"],
-                                            "type": "function",
-                                            "function": {
-                                                "name": tool_name,
-                                                "arguments": parsed_input,
-                                            },
-                                        }
-                                    )
+                # If result_obj might be structured, try to display summary
+                result_display = None
+                try:
+                    if hasattr(result_obj, "content") and result_obj.content:
+                        part = result_obj.content[0]
+                        if hasattr(part, "text"):
+                            result_display = str(part.text)
+                except Exception:
+                    result_display = None
+                if result_display:
+                    yield StreamChunk(
+                        type="mcp_status",
+                        status="function_call_output",
+                        content=f"Results for Calling {function_name}: {result_display}",
+                        source=f"mcp_{function_name}",
+                    )
+                else:
+                    yield StreamChunk(
+                        type="mcp_status",
+                        status="function_call_output",
+                        content=f"Results for Calling {function_name}: {result_str}",
+                        source=f"mcp_{function_name}",
+                    )
-                            # Only yield builtin tool results that weren't already processed during content_block_stop
-                            unprocessed_builtin_results = []
-                            for result in builtin_tool_results:
-                                tool_id = result.get("id")
-                                # Check if this tool was already processed during streaming
-                                tool_data = current_tool_uses.get(tool_id, {})
-                                if not tool_data.get("processed"):
-                                    unprocessed_builtin_results.append(result)
+                logger.info(f"Executed MCP function {function_name} (stdio/streamable-http)")
+                yield StreamChunk(
+                    type="mcp_status",
+                    status="mcp_tool_response",
+                    content=f"✅ [MCP Tool] {function_name} completed",
+                    source=f"mcp_{function_name}",
+                )
+            # Trim updated_messages using base class method
+            updated_messages = self._trim_message_history(updated_messages)
-                            if unprocessed_builtin_results:
+            # After processing all MCP calls, recurse into _stream_with_mcp_tools with the updated message history
+            async for chunk in self._stream_with_mcp_tools(updated_messages, tools, client, **kwargs):
+                yield chunk
+            return
+        else:
+            # No MCP function calls; finalize this turn
+            # Ensure termination with a done chunk when no further tool calls
+            complete_message = {
+                "role": "assistant",
+                "content": content.strip(),
+            }
+            log_stream_chunk("backend.claude", "complete_message", complete_message, agent_id)
+            yield StreamChunk(type="complete_message", complete_message=complete_message)
+            yield StreamChunk(
+                type="mcp_status",
+                status="mcp_session_complete",
+                content="✅ [MCP] Session completed",
+                source="mcp_session",
+            )
+            yield StreamChunk(type="done")
+            return
+    async def _process_stream(
+        self,
+        stream,
+        all_params: Dict[str, Any],
+        agent_id: Optional[str],
+    ) -> AsyncGenerator[StreamChunk, None]:
+        """Process stream events and yield StreamChunks.
+
+        Iterates the events of ``stream`` and dispatches on ``chunk.type``:
+        text deltas are yielded as ``content`` chunks, tool-use blocks are
+        registered and their JSON input is accumulated fragment by fragment,
+        and on ``message_stop`` the collected non-server-side tool calls, the
+        complete assistant message and a final ``done`` chunk are yielded.
+
+        Args:
+            stream: Async iterable of streaming events; each event is
+                inspected through its ``type`` attribute.
+            all_params: Request parameters. Only ``enable_web_search`` and
+                ``enable_code_execution`` are read here, for usage tracking.
+            agent_id: Identifier handed to the logging helpers; ``"default"``
+                is substituted for ``log_backend_agent_message`` when falsy.
+
+        Yields:
+            StreamChunk: ``content``, ``tool_calls``, ``complete_message``,
+            ``done`` or ``error`` chunks.
+        """
+        # Text gathered from text_delta events; becomes the final message content.
+        content_local = ""
+        # Tool-use blocks seen so far, keyed by tool id. "input" holds the raw
+        # JSON text, which is only parsed once the block or message ends.
+        current_tool_uses_local: Dict[str, Dict[str, Any]] = {}
+        async for chunk in stream:
+            try:
+                if chunk.type == "message_start":
+                    # Nothing to emit for the start-of-message event.
+                    continue
+                elif chunk.type == "content_block_start":
+                    if hasattr(chunk, "content_block"):
+                        if chunk.content_block.type == "tool_use":
+                            # Client-side tool call: remember its block index so
+                            # later input_json_delta fragments can be attached.
+                            tool_id = chunk.content_block.id
+                            tool_name = chunk.content_block.name
+                            current_tool_uses_local[tool_id] = {
+                                "id": tool_id,
+                                "name": tool_name,
+                                "input": "",
+                                "index": getattr(chunk, "index", None),
+                            }
+                        elif chunk.content_block.type == "server_tool_use":
+                            # Server-side tool: tracked the same way, but flagged so
+                            # it is excluded from the tool calls built at message_stop.
+                            tool_id = chunk.content_block.id
+                            tool_name = chunk.content_block.name
+                            current_tool_uses_local[tool_id] = {
+                                "id": tool_id,
+                                "name": tool_name,
+                                "input": "",
+                                "index": getattr(chunk, "index", None),
+                                "server_side": True,
+                            }
+                            if tool_name == "code_execution":
                                 yield StreamChunk(
-                                    type="builtin_tool_results",
-                                    builtin_tool_results=unprocessed_builtin_results,
+                                    type="content",
+                                    content="\n💻 [Code Execution] Starting...\n",
                                 )
-                            # Yield user tool calls if any
-                            if user_tool_calls:
+                            elif tool_name == "web_search":
                                 yield StreamChunk(
-                                    type="tool_calls", tool_calls=user_tool_calls
+                                    type="content",
+                                    content="\n🔍 [Web Search] Starting search...\n",
                                 )
-                            # Build complete message with only user tool calls (builtin tools are handled separately)
-                            complete_message = {
-                                "role": "assistant",
-                                "content": content.strip(),
-                            }
-                            if user_tool_calls:
-                                complete_message["tool_calls"] = user_tool_calls
-                            yield StreamChunk(
-                                type="complete_message",
-                                complete_message=complete_message,
+                        elif chunk.content_block.type == "code_execution_tool_result":
+                            # Surface stdout, stderr and a non-zero exit code as text;
+                            # nothing is yielded when none of them is present.
+                            result_block = chunk.content_block
+                            result_parts = []
+                            if hasattr(result_block, "stdout") and result_block.stdout:
+                                result_parts.append(f"Output: {result_block.stdout.strip()}")
+                            if hasattr(result_block, "stderr") and result_block.stderr:
+                                result_parts.append(f"Error: {result_block.stderr.strip()}")
+                            if hasattr(result_block, "return_code") and result_block.return_code != 0:
+                                result_parts.append(f"Exit code: {result_block.return_code}")
+                            if result_parts:
+                                # chr(10) is the newline character.
+                                result_text = f"\n💻 [Code Execution Result]\n{chr(10).join(result_parts)}\n"
+                                yield StreamChunk(
+                                    type="content",
+                                    content=result_text,
+                                )
+                elif chunk.type == "content_block_delta":
+                    if hasattr(chunk, "delta"):
+                        if chunk.delta.type == "text_delta":
+                            # Plain text: accumulate, log, and forward immediately.
+                            text_chunk = chunk.delta.text
+                            content_local += text_chunk
+                            log_backend_agent_message(
+                                agent_id or "default",
+                                "RECV",
+                                {"content": text_chunk},
+                                backend_name="claude",
                             )
-                        else:
-                            # Regular text response
-                            complete_message = {
-                                "role": "assistant",
-                                "content": content.strip(),
-                            }
-                            yield StreamChunk(
-                                type="complete_message",
-                                complete_message=complete_message,
+                            log_stream_chunk(
+                                "backend.claude",
+                                "content",
+                                text_chunk,
+                                agent_id,
+                            )
+                            yield StreamChunk(type="content", content=text_chunk)
+                        elif chunk.delta.type == "input_json_delta":
+                            # Partial tool input: append the fragment to the first
+                            # tracked tool whose block index matches this event.
+                            if hasattr(chunk, "index"):
+                                for (
+                                    tool_id,
+                                    tool_data,
+                                ) in current_tool_uses_local.items():
+                                    if tool_data.get("index") == chunk.index:
+                                        partial_json = getattr(
+                                            chunk.delta,
+                                            "partial_json",
+                                            "",
+                                        )
+                                        tool_data["input"] += partial_json
+                                        break
+                elif chunk.type == "content_block_stop":
+                    # A block finished: for server-side tools, report what was run.
+                    if hasattr(chunk, "index"):
+                        for (
+                            tool_id,
+                            tool_data,
+                        ) in current_tool_uses_local.items():
+                            if tool_data.get("index") == chunk.index and tool_data.get("server_side"):
+                                tool_name = tool_data.get("name", "")
+                                tool_input = tool_data.get("input", "")
+                                try:
+                                    parsed_input = json.loads(tool_input) if tool_input else {}
+                                except json.JSONDecodeError:
+                                    # Keep unparseable input available under "raw_input".
+                                    parsed_input = {"raw_input": tool_input}
+                                if tool_name == "code_execution":
+                                    code = parsed_input.get("code", "")
+                                    if code:
+                                        yield StreamChunk(
+                                            type="content",
+                                            content=f"💻 [Code] {code}\n",
+                                        )
+                                    yield StreamChunk(
+                                        type="content",
+                                        content="✅ [Code Execution] Completed\n",
+                                    )
+                                elif tool_name == "web_search":
+                                    query = parsed_input.get("query", "")
+                                    if query:
+                                        yield StreamChunk(
+                                            type="content",
+                                            content=f"🔍 [Query] '{query}'\n",
+                                        )
+                                    yield StreamChunk(
+                                        type="content",
+                                        content="✅ [Web Search] Completed\n",
+                                    )
+                                # Mark the tool as handled (the flag is not read again in this method).
+                                tool_data["processed"] = True
+                                break
+                elif chunk.type == "message_delta":
+                    # message_delta events are ignored here.
+                    pass
+                elif chunk.type == "message_stop":
+                    # Build final response and yield tool_calls for user-defined non-MCP tools
+                    user_tool_calls = []
+                    for tool_use in current_tool_uses_local.values():
+                        tool_name = tool_use.get("name", "")
+                        is_server_side = tool_use.get("server_side", False)
+                        # Server-side tools and the two builtin tool names are not
+                        # handed back to the caller as tool calls.
+                        if not is_server_side and tool_name not in ["web_search", "code_execution"]:
+                            tool_input = tool_use.get("input", "")
+                            try:
+                                parsed_input = json.loads(tool_input) if tool_input else {}
+                            except json.JSONDecodeError:
+                                parsed_input = {"raw_input": tool_input}
+                            user_tool_calls.append(
+                                {
+                                    "id": tool_use["id"],
+                                    "type": "function",
+                                    "function": {
+                                        "name": tool_name,
+                                        "arguments": parsed_input,
+                                    },
+                                },
                             )
-                        # Track usage for pricing
-                        if enable_web_search:
-                            self.search_count += 1  # Approximate search usage
-                        if enable_code_execution:
-                            self.code_session_hours += 0.083  # 5 min minimum session
-                        yield StreamChunk(type="done")
-                        return
-                except Exception as event_error:
+                    if user_tool_calls:
+                        log_stream_chunk(
+                            "backend.claude",
+                            "tool_calls",
+                            user_tool_calls,
+                            agent_id,
+                        )
+                        yield StreamChunk(
+                            type="tool_calls",
+                            tool_calls=user_tool_calls,
+                        )
+                    # The complete message carries the stripped text plus, when
+                    # present, the same tool calls that were just yielded.
+                    complete_message = {
+                        "role": "assistant",
+                        "content": content_local.strip(),
+                    }
+                    if user_tool_calls:
+                        complete_message["tool_calls"] = user_tool_calls
+                    log_stream_chunk(
+                        "backend.claude",
+                        "complete_message",
+                        complete_message,
+                        agent_id,
+                    )
                     yield StreamChunk(
-                        type="error", error=f"Event processing error: {event_error}"
+                        type="complete_message",
+                        complete_message=complete_message,
                     )
-                    continue
-        except Exception as e:
-            yield StreamChunk(type="error", error=f"Claude API error: {e}")
-    def get_provider_name(self) -> str:
-        """Get the provider name."""
-        return "Claude"
+                    # Track usage for pricing
+                    if all_params.get("enable_web_search", False):
+                        self.search_count += 1
+                    if all_params.get("enable_code_execution", False):
+                        # 0.083 hours is roughly five minutes.
+                        self.code_session_hours += 0.083
+                    log_stream_chunk("backend.claude", "done", None, agent_id)
+                    yield StreamChunk(type="done")
+                    return
+            except Exception as event_error:
+                # Report the failing event as an error chunk and keep consuming the stream.
+                error_msg = f"Event processing error: {event_error}"
+                log_stream_chunk("backend.claude", "error", error_msg, agent_id)
+                yield StreamChunk(type="error", error=error_msg)
+                continue
+    async def _handle_mcp_error_and_fallback(
+        self,
+        error: Exception,
+        api_params: Dict[str, Any],
+        provider_tools: List[Dict[str, Any]],
+        stream_func: Callable[[Dict[str, Any]], AsyncGenerator[StreamChunk, None]],
+    ) -> AsyncGenerator[StreamChunk, None]:
+        """Handle MCP errors with user-friendly messaging and fallback to non-MCP tools.
+
+        Records the failure, yields a warning ``content`` chunk, then streams
+        the request again through ``stream_func`` with every tool whose name
+        is a key of ``self._mcp_functions`` removed.
+
+        Args:
+            error: The exception raised by the MCP path.
+            api_params: Parameters of the failed request. Neither this dict
+                nor its ``"tools"`` list is modified.
+            provider_tools: Tools appended to the fallback tool list.
+            stream_func: Called with the fallback parameters; its chunks are
+                forwarded unchanged.
+
+        Yields:
+            StreamChunk: The warning chunk followed by the fallback stream.
+        """
-    def get_supported_builtin_tools(self) -> List[str]:
-        """Get list of builtin tools supported by Claude."""
-        return ["web_search", "code_execution"]
+        async with self._stats_lock:
+            self._mcp_tool_failures += 1
+            call_index_snapshot = self._mcp_tool_calls_count
-    def extract_tool_name(self, tool_call: Dict[str, Any]) -> str:
-        """Extract tool name from tool call (handles multiple formats)."""
-        # Chat Completions format
-        if "function" in tool_call:
-            return tool_call.get("function", {}).get("name", "unknown")
-        # Claude native format
-        elif "name" in tool_call:
-            return tool_call.get("name", "unknown")
-        # Fallback
-        return "unknown"
-    def extract_tool_arguments(self, tool_call: Dict[str, Any]) -> Dict[str, Any]:
-        """Extract tool arguments from tool call (handles multiple formats)."""
-        # Chat Completions format
-        if "function" in tool_call:
-            args = tool_call.get("function", {}).get("arguments", {})
-        # Claude native format
-        elif "input" in tool_call:
-            args = tool_call.get("input", {})
+        if MCPErrorHandler:
+            log_type, user_message, _ = MCPErrorHandler.get_error_details(error)  # type: ignore[assignment]
         else:
-            args = {}
+            log_type, user_message = "mcp_error", "[MCP] Error occurred"
-        # Ensure JSON parsing if needed
-        if isinstance(args, str):
-            try:
-                return json.loads(args)
-            except:
-                return {}
-        return args
-    def extract_tool_call_id(self, tool_call: Dict[str, Any]) -> str:
-        """Extract tool call ID from tool call."""
-        return tool_call.get("id") or tool_call.get("call_id") or ""
-    def create_tool_result_message(
-        self, tool_call: Dict[str, Any], result_content: str
-    ) -> Dict[str, Any]:
+        logger.warning(f"MCP tool call #{call_index_snapshot} failed - {log_type}: {error}")
+        yield StreamChunk(
+            type="content",
+            content=f"\n⚠️  {user_message} ({error}); continuing without MCP tools\n",
+        )
+        # Build non-MCP configuration and stream fallback.
+        # dict() is only a shallow copy, so the "tools" list is always rebuilt
+        # instead of being extended in place; otherwise provider tools could be
+        # appended to the caller's own list when there are no MCP functions.
+        fallback_params = dict(api_params)
+        existing_tools = fallback_params.get("tools")
+        if existing_tools is not None or provider_tools:
+            mcp_names = set(self._mcp_functions) if self._mcp_functions else set()
+            # Remove any MCP tools from the tools list
+            fallback_tools = [tool for tool in (existing_tools or []) if tool.get("name") not in mcp_names]
+            # Add back provider tools if they were present
+            if provider_tools:
+                fallback_tools.extend(provider_tools)
+            fallback_params["tools"] = fallback_tools
+        async for chunk in stream_func(fallback_params):
+            yield chunk
+    async def _execute_mcp_function_with_retry(
+        self,
+        function_name: str,
+        arguments_json: str,
+        max_retries: int = 3,
+    ) -> List[str | Any]:
+        """Run an MCP function via the parent class and return the result as a list.
+
+        The parent implementation is awaited with the same arguments and its
+        two-item result is unpacked into a text part and a result object.
+
+        Returns:
+            ``[text]`` when the text starts with ``"Error:"``, otherwise
+            ``[text, result_object]``.
+        """
+        outcome = await super()._execute_mcp_function_with_retry(
+            function_name,
+            arguments_json,
+            max_retries,
+        )
+        text, payload = outcome
+        # Failures carry only the error text; successes also carry the result object.
+        failed = text.startswith("Error:")
+        return [text] if failed else [text, payload]
+    def create_tool_result_message(self, tool_call: Dict[str, Any], result_content: str) -> Dict[str, Any]:
         """Create tool result message in Claude's expected format."""
         tool_call_id = self.extract_tool_call_id(tool_call)
         return {
@@ -594,7 +1122,7 @@ class ClaudeBackend(LLMBackend):
                     "type": "tool_result",
                     "tool_use_id": tool_call_id,
                     "content": result_content,
-                }
+                },
             ],
         }
@@ -607,55 +1135,23 @@ class ClaudeBackend(LLMBackend):
                     return item.get("content", "")
         return ""
-    def estimate_tokens(self, text: str) -> int:
-        """Estimate token count for text (Claude uses ~4 chars per token)."""
-        return len(text) // 4
-    def calculate_cost(
-        self, input_tokens: int, output_tokens: int, model: str
-    ) -> float:
-        """Calculate cost for Claude token usage (2025 pricing)."""
-        model_lower = model.lower()
-        if "claude-4" in model_lower:
-            if "opus" in model_lower:
-                # Claude 4 Opus
-                input_cost = (input_tokens / 1_000_000) * 15.0
-                output_cost = (output_tokens / 1_000_000) * 75.0
-            else:
-                # Claude 4 Sonnet
-                input_cost = (input_tokens / 1_000_000) * 3.0
-                output_cost = (output_tokens / 1_000_000) * 15.0
-        elif "claude-3.7" in model_lower or "claude-3-7" in model_lower:
-            # Claude 3.7 Sonnet
-            input_cost = (input_tokens / 1_000_000) * 3.0
-            output_cost = (output_tokens / 1_000_000) * 15.0
-        elif "claude-3.5" in model_lower or "claude-3-5" in model_lower:
-            if "haiku" in model_lower:
-                # Claude 3.5 Haiku
-                input_cost = (input_tokens / 1_000_000) * 1.0
-                output_cost = (output_tokens / 1_000_000) * 5.0
-            else:
-                # Claude 3.5 Sonnet (legacy)
-                input_cost = (input_tokens / 1_000_000) * 3.0
-                output_cost = (output_tokens / 1_000_000) * 15.0
-        else:
-            # Default fallback (assume Claude 4 Sonnet pricing)
-            input_cost = (input_tokens / 1_000_000) * 3.0
-            output_cost = (output_tokens / 1_000_000) * 15.0
-        # Add tool usage costs
-        tool_costs = 0.0
-        if self.search_count > 0:
-            tool_costs += (self.search_count / 1000) * 10.0  # $10 per 1,000 searches
-        if self.code_session_hours > 0:
-            tool_costs += self.code_session_hours * 0.05  # $0.05 per session-hour
-        return input_cost + output_cost + tool_costs
     def reset_tool_usage(self):
         """Reset tool usage tracking."""
         self.search_count = 0
         self.code_session_hours = 0.0
         super().reset_token_usage()
+    def _create_client(self, **kwargs):
+        return anthropic.AsyncAnthropic(api_key=self.api_key)
+    def get_provider_name(self) -> str:
+        """Get the provider name."""
+        return "Claude"
+    def get_supported_builtin_tools(self) -> List[str]:
+        """Get list of builtin tools supported by Claude."""
+        return ["web_search", "code_execution"]
+    def get_filesystem_support(self) -> FilesystemSupport:
+        """Claude supports filesystem through MCP servers."""
+        return FilesystemSupport.MCP

massgen 0.0.3__py3-none-any.whl → 0.1.0__py3-none-any.whl

Potentially problematic release.

massgen 0.0.3py3-none-any.whl → 0.1.0py3-none-any.whl