massgen 0.0.3__py3-none-any.whl → 0.1.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of massgen might be problematic.
- massgen/__init__.py +142 -8
- massgen/adapters/__init__.py +29 -0
- massgen/adapters/ag2_adapter.py +483 -0
- massgen/adapters/base.py +183 -0
- massgen/adapters/tests/__init__.py +0 -0
- massgen/adapters/tests/test_ag2_adapter.py +439 -0
- massgen/adapters/tests/test_agent_adapter.py +128 -0
- massgen/adapters/utils/__init__.py +2 -0
- massgen/adapters/utils/ag2_utils.py +236 -0
- massgen/adapters/utils/tests/__init__.py +0 -0
- massgen/adapters/utils/tests/test_ag2_utils.py +138 -0
- massgen/agent_config.py +329 -55
- massgen/api_params_handler/__init__.py +10 -0
- massgen/api_params_handler/_api_params_handler_base.py +99 -0
- massgen/api_params_handler/_chat_completions_api_params_handler.py +176 -0
- massgen/api_params_handler/_claude_api_params_handler.py +113 -0
- massgen/api_params_handler/_response_api_params_handler.py +130 -0
- massgen/backend/__init__.py +39 -4
- massgen/backend/azure_openai.py +385 -0
- massgen/backend/base.py +341 -69
- massgen/backend/base_with_mcp.py +1102 -0
- massgen/backend/capabilities.py +386 -0
- massgen/backend/chat_completions.py +577 -130
- massgen/backend/claude.py +1033 -537
- massgen/backend/claude_code.py +1203 -0
- massgen/backend/cli_base.py +209 -0
- massgen/backend/docs/BACKEND_ARCHITECTURE.md +126 -0
- massgen/backend/{CLAUDE_API_RESEARCH.md → docs/CLAUDE_API_RESEARCH.md} +18 -18
- massgen/backend/{GEMINI_API_DOCUMENTATION.md → docs/GEMINI_API_DOCUMENTATION.md} +9 -9
- massgen/backend/docs/Gemini MCP Integration Analysis.md +1050 -0
- massgen/backend/docs/MCP_IMPLEMENTATION_CLAUDE_BACKEND.md +177 -0
- massgen/backend/docs/MCP_INTEGRATION_RESPONSE_BACKEND.md +352 -0
- massgen/backend/docs/OPENAI_GPT5_MODELS.md +211 -0
- massgen/backend/{OPENAI_RESPONSES_API_FORMAT.md → docs/OPENAI_RESPONSE_API_TOOL_CALLS.md} +3 -3
- massgen/backend/docs/OPENAI_response_streaming.md +20654 -0
- massgen/backend/docs/inference_backend.md +257 -0
- massgen/backend/docs/permissions_and_context_files.md +1085 -0
- massgen/backend/external.py +126 -0
- massgen/backend/gemini.py +1850 -241
- massgen/backend/grok.py +40 -156
- massgen/backend/inference.py +156 -0
- massgen/backend/lmstudio.py +171 -0
- massgen/backend/response.py +1095 -322
- massgen/chat_agent.py +131 -113
- massgen/cli.py +1560 -275
- massgen/config_builder.py +2396 -0
- massgen/configs/BACKEND_CONFIGURATION.md +458 -0
- massgen/configs/README.md +559 -216
- massgen/configs/ag2/ag2_case_study.yaml +27 -0
- massgen/configs/ag2/ag2_coder.yaml +34 -0
- massgen/configs/ag2/ag2_coder_case_study.yaml +36 -0
- massgen/configs/ag2/ag2_gemini.yaml +27 -0
- massgen/configs/ag2/ag2_groupchat.yaml +108 -0
- massgen/configs/ag2/ag2_groupchat_gpt.yaml +118 -0
- massgen/configs/ag2/ag2_single_agent.yaml +21 -0
- massgen/configs/basic/multi/fast_timeout_example.yaml +37 -0
- massgen/configs/basic/multi/gemini_4o_claude.yaml +31 -0
- massgen/configs/basic/multi/gemini_gpt5nano_claude.yaml +36 -0
- massgen/configs/{gemini_4o_claude.yaml → basic/multi/geminicode_4o_claude.yaml} +3 -3
- massgen/configs/basic/multi/geminicode_gpt5nano_claude.yaml +36 -0
- massgen/configs/basic/multi/glm_gemini_claude.yaml +25 -0
- massgen/configs/basic/multi/gpt4o_audio_generation.yaml +30 -0
- massgen/configs/basic/multi/gpt4o_image_generation.yaml +31 -0
- massgen/configs/basic/multi/gpt5nano_glm_qwen.yaml +26 -0
- massgen/configs/basic/multi/gpt5nano_image_understanding.yaml +26 -0
- massgen/configs/{three_agents_default.yaml → basic/multi/three_agents_default.yaml} +8 -4
- massgen/configs/basic/multi/three_agents_opensource.yaml +27 -0
- massgen/configs/basic/multi/three_agents_vllm.yaml +20 -0
- massgen/configs/basic/multi/two_agents_gemini.yaml +19 -0
- massgen/configs/{two_agents.yaml → basic/multi/two_agents_gpt5.yaml} +14 -6
- massgen/configs/basic/multi/two_agents_opensource_lmstudio.yaml +31 -0
- massgen/configs/basic/multi/two_qwen_vllm_sglang.yaml +28 -0
- massgen/configs/{single_agent.yaml → basic/single/single_agent.yaml} +1 -1
- massgen/configs/{single_flash2.5.yaml → basic/single/single_flash2.5.yaml} +1 -2
- massgen/configs/basic/single/single_gemini2.5pro.yaml +16 -0
- massgen/configs/basic/single/single_gpt4o_audio_generation.yaml +22 -0
- massgen/configs/basic/single/single_gpt4o_image_generation.yaml +22 -0
- massgen/configs/basic/single/single_gpt4o_video_generation.yaml +24 -0
- massgen/configs/basic/single/single_gpt5nano.yaml +20 -0
- massgen/configs/basic/single/single_gpt5nano_file_search.yaml +18 -0
- massgen/configs/basic/single/single_gpt5nano_image_understanding.yaml +17 -0
- massgen/configs/basic/single/single_gptoss120b.yaml +15 -0
- massgen/configs/basic/single/single_openrouter_audio_understanding.yaml +15 -0
- massgen/configs/basic/single/single_qwen_video_understanding.yaml +15 -0
- massgen/configs/debug/code_execution/command_filtering_blacklist.yaml +29 -0
- massgen/configs/debug/code_execution/command_filtering_whitelist.yaml +28 -0
- massgen/configs/debug/code_execution/docker_verification.yaml +29 -0
- massgen/configs/debug/skip_coordination_test.yaml +27 -0
- massgen/configs/debug/test_sdk_migration.yaml +17 -0
- massgen/configs/docs/DISCORD_MCP_SETUP.md +208 -0
- massgen/configs/docs/TWITTER_MCP_ENESCINAR_SETUP.md +82 -0
- massgen/configs/providers/azure/azure_openai_multi.yaml +21 -0
- massgen/configs/providers/azure/azure_openai_single.yaml +19 -0
- massgen/configs/providers/claude/claude.yaml +14 -0
- massgen/configs/providers/gemini/gemini_gpt5nano.yaml +28 -0
- massgen/configs/providers/local/lmstudio.yaml +11 -0
- massgen/configs/providers/openai/gpt5.yaml +46 -0
- massgen/configs/providers/openai/gpt5_nano.yaml +46 -0
- massgen/configs/providers/others/grok_single_agent.yaml +19 -0
- massgen/configs/providers/others/zai_coding_team.yaml +108 -0
- massgen/configs/providers/others/zai_glm45.yaml +12 -0
- massgen/configs/{creative_team.yaml → teams/creative/creative_team.yaml} +16 -6
- massgen/configs/{travel_planning.yaml → teams/creative/travel_planning.yaml} +16 -6
- massgen/configs/{news_analysis.yaml → teams/research/news_analysis.yaml} +16 -6
- massgen/configs/{research_team.yaml → teams/research/research_team.yaml} +15 -7
- massgen/configs/{technical_analysis.yaml → teams/research/technical_analysis.yaml} +16 -6
- massgen/configs/tools/code-execution/basic_command_execution.yaml +25 -0
- massgen/configs/tools/code-execution/code_execution_use_case_simple.yaml +41 -0
- massgen/configs/tools/code-execution/docker_claude_code.yaml +32 -0
- massgen/configs/tools/code-execution/docker_multi_agent.yaml +32 -0
- massgen/configs/tools/code-execution/docker_simple.yaml +29 -0
- massgen/configs/tools/code-execution/docker_with_resource_limits.yaml +32 -0
- massgen/configs/tools/code-execution/multi_agent_playwright_automation.yaml +57 -0
- massgen/configs/tools/filesystem/cc_gpt5_gemini_filesystem.yaml +34 -0
- massgen/configs/tools/filesystem/claude_code_context_sharing.yaml +68 -0
- massgen/configs/tools/filesystem/claude_code_flash2.5.yaml +43 -0
- massgen/configs/tools/filesystem/claude_code_flash2.5_gptoss.yaml +49 -0
- massgen/configs/tools/filesystem/claude_code_gpt5nano.yaml +31 -0
- massgen/configs/tools/filesystem/claude_code_single.yaml +40 -0
- massgen/configs/tools/filesystem/fs_permissions_test.yaml +87 -0
- massgen/configs/tools/filesystem/gemini_gemini_workspace_cleanup.yaml +54 -0
- massgen/configs/tools/filesystem/gemini_gpt5_filesystem_casestudy.yaml +30 -0
- massgen/configs/tools/filesystem/gemini_gpt5nano_file_context_path.yaml +43 -0
- massgen/configs/tools/filesystem/gemini_gpt5nano_protected_paths.yaml +45 -0
- massgen/configs/tools/filesystem/gpt5mini_cc_fs_context_path.yaml +31 -0
- massgen/configs/tools/filesystem/grok4_gpt5_gemini_filesystem.yaml +32 -0
- massgen/configs/tools/filesystem/multiturn/grok4_gpt5_claude_code_filesystem_multiturn.yaml +58 -0
- massgen/configs/tools/filesystem/multiturn/grok4_gpt5_gemini_filesystem_multiturn.yaml +58 -0
- massgen/configs/tools/filesystem/multiturn/two_claude_code_filesystem_multiturn.yaml +47 -0
- massgen/configs/tools/filesystem/multiturn/two_gemini_flash_filesystem_multiturn.yaml +48 -0
- massgen/configs/tools/mcp/claude_code_discord_mcp_example.yaml +27 -0
- massgen/configs/tools/mcp/claude_code_simple_mcp.yaml +35 -0
- massgen/configs/tools/mcp/claude_code_twitter_mcp_example.yaml +32 -0
- massgen/configs/tools/mcp/claude_mcp_example.yaml +24 -0
- massgen/configs/tools/mcp/claude_mcp_test.yaml +27 -0
- massgen/configs/tools/mcp/five_agents_travel_mcp_test.yaml +157 -0
- massgen/configs/tools/mcp/five_agents_weather_mcp_test.yaml +103 -0
- massgen/configs/tools/mcp/gemini_mcp_example.yaml +24 -0
- massgen/configs/tools/mcp/gemini_mcp_filesystem_test.yaml +23 -0
- massgen/configs/tools/mcp/gemini_mcp_filesystem_test_sharing.yaml +23 -0
- massgen/configs/tools/mcp/gemini_mcp_filesystem_test_single_agent.yaml +17 -0
- massgen/configs/tools/mcp/gemini_mcp_filesystem_test_with_claude_code.yaml +24 -0
- massgen/configs/tools/mcp/gemini_mcp_test.yaml +27 -0
- massgen/configs/tools/mcp/gemini_notion_mcp.yaml +52 -0
- massgen/configs/tools/mcp/gpt5_nano_mcp_example.yaml +24 -0
- massgen/configs/tools/mcp/gpt5_nano_mcp_test.yaml +27 -0
- massgen/configs/tools/mcp/gpt5mini_claude_code_discord_mcp_example.yaml +38 -0
- massgen/configs/tools/mcp/gpt_oss_mcp_example.yaml +25 -0
- massgen/configs/tools/mcp/gpt_oss_mcp_test.yaml +28 -0
- massgen/configs/tools/mcp/grok3_mini_mcp_example.yaml +24 -0
- massgen/configs/tools/mcp/grok3_mini_mcp_test.yaml +27 -0
- massgen/configs/tools/mcp/multimcp_gemini.yaml +111 -0
- massgen/configs/tools/mcp/qwen_api_mcp_example.yaml +25 -0
- massgen/configs/tools/mcp/qwen_api_mcp_test.yaml +28 -0
- massgen/configs/tools/mcp/qwen_local_mcp_example.yaml +24 -0
- massgen/configs/tools/mcp/qwen_local_mcp_test.yaml +27 -0
- massgen/configs/tools/planning/five_agents_discord_mcp_planning_mode.yaml +140 -0
- massgen/configs/tools/planning/five_agents_filesystem_mcp_planning_mode.yaml +151 -0
- massgen/configs/tools/planning/five_agents_notion_mcp_planning_mode.yaml +151 -0
- massgen/configs/tools/planning/five_agents_twitter_mcp_planning_mode.yaml +155 -0
- massgen/configs/tools/planning/gpt5_mini_case_study_mcp_planning_mode.yaml +73 -0
- massgen/configs/tools/web-search/claude_streamable_http_test.yaml +43 -0
- massgen/configs/tools/web-search/gemini_streamable_http_test.yaml +43 -0
- massgen/configs/tools/web-search/gpt5_mini_streamable_http_test.yaml +43 -0
- massgen/configs/tools/web-search/gpt_oss_streamable_http_test.yaml +44 -0
- massgen/configs/tools/web-search/grok3_mini_streamable_http_test.yaml +43 -0
- massgen/configs/tools/web-search/qwen_api_streamable_http_test.yaml +44 -0
- massgen/configs/tools/web-search/qwen_local_streamable_http_test.yaml +43 -0
- massgen/coordination_tracker.py +708 -0
- massgen/docker/README.md +462 -0
- massgen/filesystem_manager/__init__.py +21 -0
- massgen/filesystem_manager/_base.py +9 -0
- massgen/filesystem_manager/_code_execution_server.py +545 -0
- massgen/filesystem_manager/_docker_manager.py +477 -0
- massgen/filesystem_manager/_file_operation_tracker.py +248 -0
- massgen/filesystem_manager/_filesystem_manager.py +813 -0
- massgen/filesystem_manager/_path_permission_manager.py +1261 -0
- massgen/filesystem_manager/_workspace_tools_server.py +1815 -0
- massgen/formatter/__init__.py +10 -0
- massgen/formatter/_chat_completions_formatter.py +284 -0
- massgen/formatter/_claude_formatter.py +235 -0
- massgen/formatter/_formatter_base.py +156 -0
- massgen/formatter/_response_formatter.py +263 -0
- massgen/frontend/__init__.py +1 -2
- massgen/frontend/coordination_ui.py +471 -286
- massgen/frontend/displays/base_display.py +56 -11
- massgen/frontend/displays/create_coordination_table.py +1956 -0
- massgen/frontend/displays/rich_terminal_display.py +1259 -619
- massgen/frontend/displays/simple_display.py +9 -4
- massgen/frontend/displays/terminal_display.py +27 -68
- massgen/logger_config.py +681 -0
- massgen/mcp_tools/README.md +232 -0
- massgen/mcp_tools/__init__.py +105 -0
- massgen/mcp_tools/backend_utils.py +1035 -0
- massgen/mcp_tools/circuit_breaker.py +195 -0
- massgen/mcp_tools/client.py +894 -0
- massgen/mcp_tools/config_validator.py +138 -0
- massgen/mcp_tools/docs/circuit_breaker.md +646 -0
- massgen/mcp_tools/docs/client.md +950 -0
- massgen/mcp_tools/docs/config_validator.md +478 -0
- massgen/mcp_tools/docs/exceptions.md +1165 -0
- massgen/mcp_tools/docs/security.md +854 -0
- massgen/mcp_tools/exceptions.py +338 -0
- massgen/mcp_tools/hooks.py +212 -0
- massgen/mcp_tools/security.py +780 -0
- massgen/message_templates.py +342 -64
- massgen/orchestrator.py +1515 -241
- massgen/stream_chunk/__init__.py +35 -0
- massgen/stream_chunk/base.py +92 -0
- massgen/stream_chunk/multimodal.py +237 -0
- massgen/stream_chunk/text.py +162 -0
- massgen/tests/mcp_test_server.py +150 -0
- massgen/tests/multi_turn_conversation_design.md +0 -8
- massgen/tests/test_azure_openai_backend.py +156 -0
- massgen/tests/test_backend_capabilities.py +262 -0
- massgen/tests/test_backend_event_loop_all.py +179 -0
- massgen/tests/test_chat_completions_refactor.py +142 -0
- massgen/tests/test_claude_backend.py +15 -28
- massgen/tests/test_claude_code.py +268 -0
- massgen/tests/test_claude_code_context_sharing.py +233 -0
- massgen/tests/test_claude_code_orchestrator.py +175 -0
- massgen/tests/test_cli_backends.py +180 -0
- massgen/tests/test_code_execution.py +679 -0
- massgen/tests/test_external_agent_backend.py +134 -0
- massgen/tests/test_final_presentation_fallback.py +237 -0
- massgen/tests/test_gemini_planning_mode.py +351 -0
- massgen/tests/test_grok_backend.py +7 -10
- massgen/tests/test_http_mcp_server.py +42 -0
- massgen/tests/test_integration_simple.py +198 -0
- massgen/tests/test_mcp_blocking.py +125 -0
- massgen/tests/test_message_context_building.py +29 -47
- massgen/tests/test_orchestrator_final_presentation.py +48 -0
- massgen/tests/test_path_permission_manager.py +2087 -0
- massgen/tests/test_rich_terminal_display.py +14 -13
- massgen/tests/test_timeout.py +133 -0
- massgen/tests/test_v3_3agents.py +11 -12
- massgen/tests/test_v3_simple.py +8 -13
- massgen/tests/test_v3_three_agents.py +11 -18
- massgen/tests/test_v3_two_agents.py +8 -13
- massgen/token_manager/__init__.py +7 -0
- massgen/token_manager/token_manager.py +400 -0
- massgen/utils.py +52 -16
- massgen/v1/agent.py +45 -91
- massgen/v1/agents.py +18 -53
- massgen/v1/backends/gemini.py +50 -153
- massgen/v1/backends/grok.py +21 -54
- massgen/v1/backends/oai.py +39 -111
- massgen/v1/cli.py +36 -93
- massgen/v1/config.py +8 -12
- massgen/v1/logging.py +43 -127
- massgen/v1/main.py +18 -32
- massgen/v1/orchestrator.py +68 -209
- massgen/v1/streaming_display.py +62 -163
- massgen/v1/tools.py +8 -12
- massgen/v1/types.py +9 -23
- massgen/v1/utils.py +5 -23
- massgen-0.1.0.dist-info/METADATA +1245 -0
- massgen-0.1.0.dist-info/RECORD +273 -0
- massgen-0.1.0.dist-info/entry_points.txt +2 -0
- massgen/frontend/logging/__init__.py +0 -9
- massgen/frontend/logging/realtime_logger.py +0 -197
- massgen-0.0.3.dist-info/METADATA +0 -568
- massgen-0.0.3.dist-info/RECORD +0 -76
- massgen-0.0.3.dist-info/entry_points.txt +0 -2
- /massgen/backend/{Function calling openai responses.md → docs/Function calling openai responses.md} +0 -0
- {massgen-0.0.3.dist-info → massgen-0.1.0.dist-info}/WHEEL +0 -0
- {massgen-0.0.3.dist-info → massgen-0.1.0.dist-info}/licenses/LICENSE +0 -0
- {massgen-0.0.3.dist-info → massgen-0.1.0.dist-info}/top_level.txt +0 -0
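
The headline change in this release is the rewritten Response API backend (massgen/backend/response.py, diffed below), which now derives from an MCP-aware base class, builds requests through a dedicated params handler and formatter, and adds File Search uploads with automatic cleanup. As rough orientation before reading the diff, here is a minimal, hypothetical consumption sketch of the new streaming interface; the constructor default, message shape, and chunk attributes are assumptions inferred only from the signatures visible in the diff, not a documented API.

import asyncio

from massgen.backend.response import ResponseBackend


async def main() -> None:
    # Assumption: api_key=None falls back to the OPENAI_API_KEY environment variable (per __init__ in the diff).
    backend = ResponseBackend(api_key=None)
    messages = [{"role": "user", "content": "Summarize the attached report."}]
    tools = []  # plain (non-MCP) function tools, if any

    # stream_with_tools is an async generator; File Search resources are cleaned up when it finishes.
    async for chunk in backend.stream_with_tools(messages, tools, agent_id="agent-1"):
        text = getattr(chunk, "content", None)  # text chunks carry a content field
        if text:
            print(text, end="", flush=True)


asyncio.run(main())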
massgen/backend/response.py
CHANGED
|
@@ -1,341 +1,1132 @@
|
|
|
1
|
-
|
|
2
|
-
|
|
1
|
+
# -*- coding: utf-8 -*-
|
|
3
2
|
"""
|
|
4
|
-
Response API backend implementation.
|
|
3
|
+
Response API backend implementation with multimodal support.
|
|
5
4
|
Standalone implementation optimized for the standard Response API format (originated by OpenAI).
|
|
5
|
+
Supports image input (URL and base64) and image generation via tools.
|
|
6
6
|
"""
|
|
7
|
+
from __future__ import annotations
|
|
7
8
|
|
|
9
|
+
import asyncio
|
|
8
10
|
import os
|
|
9
|
-
from
|
|
10
|
-
from
|
|
11
|
+
from datetime import datetime, timezone
|
|
12
|
+
from io import BytesIO
|
|
13
|
+
from pathlib import Path
|
|
14
|
+
from typing import Any, AsyncGenerator, Dict, List, Optional, Tuple, Union
|
|
15
|
+
from urllib.parse import urlparse
|
|
11
16
|
|
|
17
|
+
import httpx
|
|
18
|
+
import openai
|
|
19
|
+
from openai import AsyncOpenAI
|
|
12
20
|
|
|
13
|
-
|
|
14
|
-
|
|
21
|
+
from ..api_params_handler import ResponseAPIParamsHandler
|
|
22
|
+
from ..formatter import ResponseFormatter
|
|
23
|
+
from ..logger_config import log_backend_agent_message, log_stream_chunk, logger
|
|
24
|
+
from ..stream_chunk import ChunkType, TextStreamChunk
|
|
25
|
+
from .base import FilesystemSupport, StreamChunk
|
|
26
|
+
from .base_with_mcp import MCPBackend, UploadFileError
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
class ResponseBackend(MCPBackend):
|
|
30
|
+
"""Backend using the standard Response API format with multimodal support."""
|
|
15
31
|
|
|
16
32
|
def __init__(self, api_key: Optional[str] = None, **kwargs):
|
|
17
33
|
super().__init__(api_key, **kwargs)
|
|
18
34
|
self.api_key = api_key or os.getenv("OPENAI_API_KEY")
|
|
35
|
+
self.formatter = ResponseFormatter()
|
|
36
|
+
self.api_params_handler = ResponseAPIParamsHandler(self)
|
|
37
|
+
|
|
38
|
+
# Queue for pending image saves
|
|
39
|
+
self._pending_image_saves = []
|
|
19
40
|
|
|
20
|
-
|
|
21
|
-
self
|
|
22
|
-
|
|
23
|
-
"""Convert tools from Chat Completions format to Response API format if needed.
|
|
41
|
+
# File Search tracking for cleanup
|
|
42
|
+
self._vector_store_ids: List[str] = []
|
|
43
|
+
self._uploaded_file_ids: List[str] = []
|
|
24
44
|
|
|
25
|
-
|
|
26
|
-
|
|
45
|
+
def supports_upload_files(self) -> bool:
|
|
46
|
+
return True
|
|
47
|
+
|
|
48
|
+
async def stream_with_tools(
|
|
49
|
+
self,
|
|
50
|
+
messages: List[Dict[str, Any]],
|
|
51
|
+
tools: List[Dict[str, Any]],
|
|
52
|
+
**kwargs,
|
|
53
|
+
) -> AsyncGenerator[StreamChunk, None]:
|
|
54
|
+
"""Stream response using OpenAI Response API with unified MCP/non-MCP processing.
|
|
55
|
+
|
|
56
|
+
Wraps parent implementation to ensure File Search cleanup happens after streaming completes.
|
|
27
57
|
"""
|
|
28
|
-
|
|
29
|
-
|
|
58
|
+
try:
|
|
59
|
+
async for chunk in super().stream_with_tools(messages, tools, **kwargs):
|
|
60
|
+
yield chunk
|
|
61
|
+
finally:
|
|
62
|
+
# Cleanup File Search resources after stream completes
|
|
63
|
+
await self._cleanup_file_search_if_needed(**kwargs)
|
|
30
64
|
|
|
31
|
-
|
|
32
|
-
|
|
33
|
-
|
|
34
|
-
|
|
35
|
-
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
|
|
41
|
-
|
|
65
|
+
async def _cleanup_file_search_if_needed(self, **kwargs) -> None:
|
|
66
|
+
"""Cleanup File Search resources if needed."""
|
|
67
|
+
if not (self._vector_store_ids or self._uploaded_file_ids):
|
|
68
|
+
return
|
|
69
|
+
|
|
70
|
+
agent_id = kwargs.get("agent_id")
|
|
71
|
+
logger.info("Cleaning up File Search resources...")
|
|
72
|
+
|
|
73
|
+
client = None
|
|
74
|
+
try:
|
|
75
|
+
# Create a client for cleanup
|
|
76
|
+
client = self._create_client(**kwargs)
|
|
77
|
+
await self._cleanup_file_search_resources(client, agent_id)
|
|
78
|
+
except Exception as cleanup_error:
|
|
79
|
+
logger.error(
|
|
80
|
+
f"Error during File Search cleanup: {cleanup_error}",
|
|
81
|
+
extra={"agent_id": agent_id},
|
|
82
|
+
)
|
|
83
|
+
finally:
|
|
84
|
+
# Close the client if it has an aclose method
|
|
85
|
+
if client and hasattr(client, "aclose"):
|
|
86
|
+
try:
|
|
87
|
+
await client.aclose()
|
|
88
|
+
except Exception:
|
|
89
|
+
pass
|
|
90
|
+
|
|
91
|
+
async def _stream_without_mcp_tools(
|
|
92
|
+
self,
|
|
93
|
+
messages: List[Dict[str, Any]],
|
|
94
|
+
tools: List[Dict[str, Any]],
|
|
95
|
+
client,
|
|
96
|
+
**kwargs,
|
|
97
|
+
) -> AsyncGenerator[StreamChunk, None]:
|
|
98
|
+
agent_id = kwargs.get("agent_id")
|
|
99
|
+
all_params = {**self.config, **kwargs}
|
|
100
|
+
|
|
101
|
+
processed_messages = await self._process_upload_files(messages, all_params)
|
|
102
|
+
|
|
103
|
+
if all_params.get("_has_file_search_files"):
|
|
104
|
+
logger.info("Processing File Search uploads...")
|
|
105
|
+
processed_messages, vector_store_id = await self._upload_files_and_create_vector_store(
|
|
106
|
+
processed_messages,
|
|
107
|
+
client,
|
|
108
|
+
agent_id,
|
|
109
|
+
)
|
|
110
|
+
if vector_store_id:
|
|
111
|
+
existing_ids = list(all_params.get("_file_search_vector_store_ids", []))
|
|
112
|
+
existing_ids.append(vector_store_id)
|
|
113
|
+
all_params["_file_search_vector_store_ids"] = existing_ids
|
|
114
|
+
logger.info(f"File Search enabled with vector store: {vector_store_id}")
|
|
115
|
+
all_params.pop("_has_file_search_files", None)
|
|
116
|
+
|
|
117
|
+
api_params = await self.api_params_handler.build_api_params(processed_messages, tools, all_params)
|
|
118
|
+
|
|
119
|
+
if "tools" in api_params:
|
|
120
|
+
non_mcp_tools = []
|
|
121
|
+
for tool in api_params.get("tools", []):
|
|
122
|
+
if tool.get("type") == "function":
|
|
123
|
+
name = tool.get("function", {}).get("name") if "function" in tool else tool.get("name")
|
|
124
|
+
if name and name in self._mcp_function_names:
|
|
125
|
+
continue
|
|
126
|
+
elif tool.get("type") == "mcp":
|
|
127
|
+
continue
|
|
128
|
+
non_mcp_tools.append(tool)
|
|
129
|
+
api_params["tools"] = non_mcp_tools
|
|
130
|
+
|
|
131
|
+
stream = await client.responses.create(**api_params)
|
|
132
|
+
|
|
133
|
+
async for chunk in self._process_stream(stream, all_params, agent_id):
|
|
134
|
+
yield chunk
|
|
135
|
+
|
|
136
|
+
async def _stream_with_mcp_tools(
|
|
137
|
+
self,
|
|
138
|
+
current_messages: List[Dict[str, Any]],
|
|
139
|
+
tools: List[Dict[str, Any]],
|
|
140
|
+
client,
|
|
141
|
+
**kwargs,
|
|
142
|
+
) -> AsyncGenerator[StreamChunk, None]:
|
|
143
|
+
"""Recursively stream MCP responses, executing function calls as needed."""
|
|
144
|
+
agent_id = kwargs.get("agent_id")
|
|
145
|
+
|
|
146
|
+
# Build API params for this iteration
|
|
147
|
+
all_params = {**self.config, **kwargs}
|
|
148
|
+
|
|
149
|
+
if all_params.get("_has_file_search_files"):
|
|
150
|
+
logger.info("Processing File Search uploads...")
|
|
151
|
+
current_messages, vector_store_id = await self._upload_files_and_create_vector_store(
|
|
152
|
+
current_messages,
|
|
153
|
+
client,
|
|
154
|
+
agent_id,
|
|
155
|
+
)
|
|
156
|
+
if vector_store_id:
|
|
157
|
+
existing_ids = list(all_params.get("_file_search_vector_store_ids", []))
|
|
158
|
+
existing_ids.append(vector_store_id)
|
|
159
|
+
all_params["_file_search_vector_store_ids"] = existing_ids
|
|
160
|
+
logger.info(f"File Search enabled with vector store: {vector_store_id}")
|
|
161
|
+
all_params.pop("_has_file_search_files", None)
|
|
162
|
+
|
|
163
|
+
api_params = await self.api_params_handler.build_api_params(current_messages, tools, all_params)
|
|
164
|
+
|
|
165
|
+
# Start streaming
|
|
166
|
+
stream = await client.responses.create(**api_params)
|
|
167
|
+
|
|
168
|
+
# Track function calls in this iteration
|
|
169
|
+
captured_function_calls = []
|
|
170
|
+
current_function_call = None
|
|
171
|
+
response_completed = False
|
|
172
|
+
|
|
173
|
+
async for chunk in stream:
|
|
174
|
+
if hasattr(chunk, "type"):
|
|
175
|
+
# Detect function call start
|
|
176
|
+
if chunk.type == "response.output_item.added" and hasattr(chunk, "item") and chunk.item and getattr(chunk.item, "type", None) == "function_call":
|
|
177
|
+
current_function_call = {
|
|
178
|
+
"call_id": getattr(chunk.item, "call_id", ""),
|
|
179
|
+
"name": getattr(chunk.item, "name", ""),
|
|
180
|
+
"arguments": "",
|
|
42
181
|
}
|
|
182
|
+
logger.info(f"Function call detected: {current_function_call['name']}")
|
|
183
|
+
|
|
184
|
+
# Accumulate function arguments
|
|
185
|
+
elif chunk.type == "response.function_call_arguments.delta" and current_function_call is not None:
|
|
186
|
+
delta = getattr(chunk, "delta", "")
|
|
187
|
+
current_function_call["arguments"] += delta
|
|
188
|
+
|
|
189
|
+
# Function call completed
|
|
190
|
+
elif chunk.type == "response.output_item.done" and current_function_call is not None:
|
|
191
|
+
captured_function_calls.append(current_function_call)
|
|
192
|
+
current_function_call = None
|
|
193
|
+
|
|
194
|
+
# Handle regular content and other events
|
|
195
|
+
elif chunk.type == "response.output_text.delta":
|
|
196
|
+
delta = getattr(chunk, "delta", "")
|
|
197
|
+
yield TextStreamChunk(
|
|
198
|
+
type=ChunkType.CONTENT,
|
|
199
|
+
content=delta,
|
|
200
|
+
source="response_api",
|
|
201
|
+
)
|
|
202
|
+
|
|
203
|
+
# Handle other streaming events (reasoning, provider tools, etc.)
|
|
204
|
+
else:
|
|
205
|
+
result = self._process_stream_chunk(chunk, agent_id)
|
|
206
|
+
yield result
|
|
207
|
+
|
|
208
|
+
# Response completed
|
|
209
|
+
if chunk.type == "response.completed":
|
|
210
|
+
response_completed = True
|
|
211
|
+
if captured_function_calls:
|
|
212
|
+
# Execute captured function calls and recurse
|
|
213
|
+
break # Exit chunk loop to execute functions
|
|
214
|
+
else:
|
|
215
|
+
# No function calls, we're done (base case)
|
|
216
|
+
yield TextStreamChunk(type=ChunkType.DONE, source="response_api")
|
|
217
|
+
return
|
|
218
|
+
|
|
219
|
+
# Execute any captured function calls
|
|
220
|
+
if captured_function_calls and response_completed:
|
|
221
|
+
# Check if any of the function calls are NOT MCP functions
|
|
222
|
+
non_mcp_functions = [call for call in captured_function_calls if call["name"] not in self._mcp_functions]
|
|
223
|
+
|
|
224
|
+
if non_mcp_functions:
|
|
225
|
+
logger.info(f"Non-MCP function calls detected: {[call['name'] for call in non_mcp_functions]}. Ending MCP processing.")
|
|
226
|
+
yield TextStreamChunk(type=ChunkType.DONE, source="response_api")
|
|
227
|
+
return
|
|
228
|
+
|
|
229
|
+
# Check circuit breaker status before executing MCP functions
|
|
230
|
+
if not await super()._check_circuit_breaker_before_execution():
|
|
231
|
+
logger.warning("All MCP servers blocked by circuit breaker")
|
|
232
|
+
yield TextStreamChunk(
|
|
233
|
+
type=ChunkType.MCP_STATUS,
|
|
234
|
+
status="mcp_blocked",
|
|
235
|
+
content="⚠️ [MCP] All servers blocked by circuit breaker",
|
|
236
|
+
source="circuit_breaker",
|
|
43
237
|
)
|
|
44
|
-
|
|
45
|
-
|
|
46
|
-
converted_tools.append(tool)
|
|
238
|
+
yield TextStreamChunk(type=ChunkType.DONE, source="response_api")
|
|
239
|
+
return
|
|
47
240
|
|
|
48
|
-
|
|
241
|
+
# Execute only MCP function calls
|
|
242
|
+
mcp_functions_executed = False
|
|
243
|
+
updated_messages = current_messages.copy()
|
|
49
244
|
|
|
50
|
-
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
|
|
245
|
+
# Check if planning mode is enabled - block MCP tool execution during planning
|
|
246
|
+
if self.is_planning_mode_enabled():
|
|
247
|
+
logger.info("[MCP] Planning mode enabled - blocking all MCP tool execution")
|
|
248
|
+
yield StreamChunk(
|
|
249
|
+
type="mcp_status",
|
|
250
|
+
status="planning_mode_blocked",
|
|
251
|
+
content="🚫 [MCP] Planning mode active - MCP tools blocked during coordination",
|
|
252
|
+
source="planning_mode",
|
|
253
|
+
)
|
|
254
|
+
# Skip all MCP tool execution but still continue with workflow
|
|
255
|
+
yield StreamChunk(type="done")
|
|
256
|
+
return
|
|
54
257
|
|
|
55
|
-
|
|
56
|
-
|
|
258
|
+
# Ensure every captured function call gets a result to prevent hanging
|
|
259
|
+
processed_call_ids = set()
|
|
57
260
|
|
|
58
|
-
|
|
59
|
-
|
|
60
|
-
|
|
261
|
+
for call in captured_function_calls:
|
|
262
|
+
function_name = call["name"]
|
|
263
|
+
if function_name in self._mcp_functions:
|
|
264
|
+
# Yield MCP tool call status
|
|
265
|
+
yield TextStreamChunk(
|
|
266
|
+
type=ChunkType.MCP_STATUS,
|
|
267
|
+
status="mcp_tool_called",
|
|
268
|
+
content=f"🔧 [MCP Tool] Calling {function_name}...",
|
|
269
|
+
source=f"mcp_{function_name}",
|
|
270
|
+
)
|
|
61
271
|
|
|
62
|
-
|
|
63
|
-
|
|
64
|
-
|
|
65
|
-
|
|
66
|
-
|
|
272
|
+
try:
|
|
273
|
+
# Execute MCP function with retry and exponential backoff
|
|
274
|
+
result, result_obj = await super()._execute_mcp_function_with_retry(
|
|
275
|
+
function_name,
|
|
276
|
+
call["arguments"],
|
|
277
|
+
)
|
|
278
|
+
|
|
279
|
+
# Check if function failed after all retries
|
|
280
|
+
if isinstance(result, str) and result.startswith("Error:"):
|
|
281
|
+
# Log failure but still create tool response
|
|
282
|
+
logger.warning(f"MCP function {function_name} failed after retries: {result}")
|
|
283
|
+
|
|
284
|
+
# Add error result to messages
|
|
285
|
+
function_call_msg = {
|
|
286
|
+
"type": "function_call",
|
|
287
|
+
"call_id": call["call_id"],
|
|
288
|
+
"name": function_name,
|
|
289
|
+
"arguments": call["arguments"],
|
|
290
|
+
}
|
|
291
|
+
updated_messages.append(function_call_msg)
|
|
292
|
+
|
|
293
|
+
error_output_msg = {
|
|
294
|
+
"type": "function_call_output",
|
|
295
|
+
"call_id": call["call_id"],
|
|
296
|
+
"output": result,
|
|
297
|
+
}
|
|
298
|
+
updated_messages.append(error_output_msg)
|
|
299
|
+
|
|
300
|
+
processed_call_ids.add(call["call_id"])
|
|
301
|
+
mcp_functions_executed = True
|
|
302
|
+
continue
|
|
303
|
+
|
|
304
|
+
except Exception as e:
|
|
305
|
+
# Only catch unexpected non-MCP system errors
|
|
306
|
+
logger.error(f"Unexpected error in MCP function execution: {e}")
|
|
307
|
+
error_msg = f"Error executing {function_name}: {str(e)}"
|
|
308
|
+
|
|
309
|
+
# Add error result to messages
|
|
310
|
+
function_call_msg = {
|
|
311
|
+
"type": "function_call",
|
|
312
|
+
"call_id": call["call_id"],
|
|
313
|
+
"name": function_name,
|
|
314
|
+
"arguments": call["arguments"],
|
|
315
|
+
}
|
|
316
|
+
updated_messages.append(function_call_msg)
|
|
317
|
+
|
|
318
|
+
error_output_msg = {
|
|
319
|
+
"type": "function_call_output",
|
|
320
|
+
"call_id": call["call_id"],
|
|
321
|
+
"output": error_msg,
|
|
322
|
+
}
|
|
323
|
+
updated_messages.append(error_output_msg)
|
|
324
|
+
|
|
325
|
+
processed_call_ids.add(call["call_id"])
|
|
326
|
+
mcp_functions_executed = True
|
|
327
|
+
continue
|
|
328
|
+
|
|
329
|
+
# Add function call to messages and yield status chunk
|
|
330
|
+
function_call_msg = {
|
|
331
|
+
"type": "function_call",
|
|
332
|
+
"call_id": call["call_id"],
|
|
333
|
+
"name": function_name,
|
|
334
|
+
"arguments": call["arguments"],
|
|
335
|
+
}
|
|
336
|
+
updated_messages.append(function_call_msg)
|
|
337
|
+
yield TextStreamChunk(
|
|
338
|
+
type=ChunkType.MCP_STATUS,
|
|
339
|
+
status="function_call",
|
|
340
|
+
content=f"Arguments for Calling {function_name}: {call['arguments']}",
|
|
341
|
+
source=f"mcp_{function_name}",
|
|
342
|
+
)
|
|
343
|
+
|
|
344
|
+
# Add function output to messages and yield status chunk
|
|
345
|
+
function_output_msg = {
|
|
67
346
|
"type": "function_call_output",
|
|
68
|
-
"call_id":
|
|
69
|
-
"output":
|
|
347
|
+
"call_id": call["call_id"],
|
|
348
|
+
"output": str(result),
|
|
70
349
|
}
|
|
71
|
-
|
|
72
|
-
|
|
73
|
-
|
|
74
|
-
|
|
75
|
-
|
|
76
|
-
|
|
77
|
-
|
|
78
|
-
|
|
79
|
-
|
|
80
|
-
|
|
81
|
-
|
|
350
|
+
updated_messages.append(function_output_msg)
|
|
351
|
+
yield TextStreamChunk(
|
|
352
|
+
type=ChunkType.MCP_STATUS,
|
|
353
|
+
status="function_call_output",
|
|
354
|
+
content=f"Results for Calling {function_name}: {str(result_obj.content[0].text)}",
|
|
355
|
+
source=f"mcp_{function_name}",
|
|
356
|
+
)
|
|
357
|
+
|
|
358
|
+
logger.info(f"Executed MCP function {function_name} (stdio/streamable-http)")
|
|
359
|
+
processed_call_ids.add(call["call_id"])
|
|
360
|
+
|
|
361
|
+
# Yield MCP tool response status
|
|
362
|
+
yield TextStreamChunk(
|
|
363
|
+
type=ChunkType.MCP_STATUS,
|
|
364
|
+
status="mcp_tool_response",
|
|
365
|
+
content=f"✅ [MCP Tool] {function_name} completed",
|
|
366
|
+
source=f"mcp_{function_name}",
|
|
367
|
+
)
|
|
368
|
+
|
|
369
|
+
mcp_functions_executed = True
|
|
370
|
+
|
|
371
|
+
# Ensure all captured function calls have results to prevent hanging
|
|
372
|
+
for call in captured_function_calls:
|
|
373
|
+
if call["call_id"] not in processed_call_ids:
|
|
374
|
+
logger.warning(f"Tool call {call['call_id']} for function {call['name']} was not processed - adding error result")
|
|
375
|
+
|
|
376
|
+
# Add missing function call and error result to messages
|
|
377
|
+
function_call_msg = {
|
|
378
|
+
"type": "function_call",
|
|
379
|
+
"call_id": call["call_id"],
|
|
380
|
+
"name": call["name"],
|
|
381
|
+
"arguments": call["arguments"],
|
|
382
|
+
}
|
|
383
|
+
updated_messages.append(function_call_msg)
|
|
384
|
+
|
|
385
|
+
error_output_msg = {
|
|
386
|
+
"type": "function_call_output",
|
|
387
|
+
"call_id": call["call_id"],
|
|
388
|
+
"output": f"Error: Tool call {call['call_id']} for function {call['name']} was not processed. This may indicate a validation or execution error.",
|
|
389
|
+
}
|
|
390
|
+
updated_messages.append(error_output_msg)
|
|
391
|
+
mcp_functions_executed = True
|
|
392
|
+
|
|
393
|
+
# Trim history after function executions to bound memory usage
|
|
394
|
+
if mcp_functions_executed:
|
|
395
|
+
updated_messages = super()._trim_message_history(updated_messages)
|
|
396
|
+
|
|
397
|
+
# Recursive call with updated messages
|
|
398
|
+
async for chunk in self._stream_with_mcp_tools(updated_messages, tools, client, **kwargs):
|
|
399
|
+
yield chunk
|
|
82
400
|
else:
|
|
83
|
-
#
|
|
84
|
-
converted_messages.append(message)
|
|
401
|
+
# No MCP functions were executed, we're done
|
|
85
402
|
|
|
86
|
-
|
|
403
|
+
yield TextStreamChunk(type=ChunkType.DONE, source="response_api")
|
|
404
|
+
return
|
|
405
|
+
|
|
406
|
+
elif response_completed:
|
|
407
|
+
# Response completed with no function calls - we're done (base case)
|
|
408
|
+
|
|
409
|
+
yield TextStreamChunk(
|
|
410
|
+
type=ChunkType.MCP_STATUS,
|
|
411
|
+
status="mcp_session_complete",
|
|
412
|
+
content="✅ [MCP] Session completed",
|
|
413
|
+
source="mcp_session",
|
|
414
|
+
)
|
|
415
|
+
yield TextStreamChunk(type=ChunkType.DONE, source="response_api")
|
|
416
|
+
return
|
|
417
|
+
|
|
418
|
+
async def _upload_files_and_create_vector_store(
|
|
419
|
+
self,
|
|
420
|
+
messages: List[Dict[str, Any]],
|
|
421
|
+
client: AsyncOpenAI,
|
|
422
|
+
agent_id: Optional[str] = None,
|
|
423
|
+
) -> Tuple[List[Dict[str, Any]], Optional[str]]:
|
|
424
|
+
"""Upload file_pending_upload items and create a vector store."""
|
|
87
425
|
|
|
88
|
-
async def stream_with_tools(
|
|
89
|
-
self, messages: List[Dict[str, Any]], tools: List[Dict[str, Any]], **kwargs
|
|
90
|
-
) -> AsyncGenerator[StreamChunk, None]:
|
|
91
|
-
"""Stream response using OpenAI Response API."""
|
|
92
426
|
try:
|
|
93
|
-
|
|
427
|
+
pending_files: List[Dict[str, Any]] = []
|
|
428
|
+
file_locations: List[Tuple[int, int]] = []
|
|
429
|
+
|
|
430
|
+
for message_index, message in enumerate(messages):
|
|
431
|
+
content = message.get("content")
|
|
432
|
+
if not isinstance(content, list):
|
|
433
|
+
continue
|
|
434
|
+
|
|
435
|
+
for item_index, item in enumerate(content):
|
|
436
|
+
if isinstance(item, dict) and item.get("type") == "file_pending_upload":
|
|
437
|
+
pending_files.append(item)
|
|
438
|
+
file_locations.append((message_index, item_index))
|
|
439
|
+
|
|
440
|
+
if not pending_files:
|
|
441
|
+
return messages, None
|
|
442
|
+
|
|
443
|
+
uploaded_file_ids: List[str] = []
|
|
444
|
+
|
|
445
|
+
http_client: Optional[httpx.AsyncClient] = None
|
|
446
|
+
|
|
447
|
+
try:
|
|
448
|
+
for pending in pending_files:
|
|
449
|
+
source = pending.get("source")
|
|
450
|
+
|
|
451
|
+
if source == "local":
|
|
452
|
+
path_str = pending.get("path")
|
|
453
|
+
if not path_str:
|
|
454
|
+
logger.warning("Missing local path for file_pending_upload entry")
|
|
455
|
+
continue
|
|
456
|
+
|
|
457
|
+
file_path = Path(path_str)
|
|
458
|
+
if not file_path.exists():
|
|
459
|
+
raise UploadFileError(f"File not found for upload: {file_path}")
|
|
460
|
+
|
|
461
|
+
try:
|
|
462
|
+
with file_path.open("rb") as file_handle:
|
|
463
|
+
uploaded_file = await client.files.create(
|
|
464
|
+
purpose="assistants",
|
|
465
|
+
file=file_handle,
|
|
466
|
+
)
|
|
467
|
+
except Exception as exc:
|
|
468
|
+
raise UploadFileError(f"Failed to upload file {file_path}: {exc}") from exc
|
|
469
|
+
|
|
470
|
+
elif source == "url":
|
|
471
|
+
file_url = pending.get("url")
|
|
472
|
+
if not file_url:
|
|
473
|
+
logger.warning("Missing URL for file_pending_upload entry")
|
|
474
|
+
continue
|
|
94
475
|
|
|
95
|
-
|
|
476
|
+
parsed = urlparse(file_url)
|
|
477
|
+
if parsed.scheme not in {"http", "https"}:
|
|
478
|
+
raise UploadFileError(f"Unsupported URL scheme for file upload: {file_url}")
|
|
96
479
|
|
|
97
|
-
|
|
98
|
-
|
|
99
|
-
enable_web_search = kwargs.get("enable_web_search", False)
|
|
100
|
-
enable_code_interpreter = kwargs.get("enable_code_interpreter", False)
|
|
480
|
+
if http_client is None:
|
|
481
|
+
http_client = httpx.AsyncClient()
|
|
101
482
|
|
|
102
|
-
|
|
103
|
-
|
|
483
|
+
try:
|
|
484
|
+
response = await http_client.get(file_url, timeout=30.0)
|
|
485
|
+
response.raise_for_status()
|
|
486
|
+
except httpx.HTTPError as exc:
|
|
487
|
+
raise UploadFileError(f"Failed to download file from URL {file_url}: {exc}") from exc
|
|
104
488
|
|
|
105
|
-
|
|
106
|
-
|
|
489
|
+
filename = Path(parsed.path).name or "remote_file"
|
|
490
|
+
file_bytes = BytesIO(response.content)
|
|
107
491
|
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
|
|
492
|
+
try:
|
|
493
|
+
uploaded_file = await client.files.create(
|
|
494
|
+
purpose="assistants",
|
|
495
|
+
file=(filename, file_bytes),
|
|
496
|
+
)
|
|
497
|
+
except Exception as exc:
|
|
498
|
+
raise UploadFileError(f"Failed to upload file from URL {file_url}: {exc}") from exc
|
|
499
|
+
|
|
500
|
+
else:
|
|
501
|
+
raise UploadFileError(f"Unknown file_pending_upload source: {source}")
|
|
502
|
+
|
|
503
|
+
file_id = getattr(uploaded_file, "id", None)
|
|
504
|
+
if not file_id:
|
|
505
|
+
raise UploadFileError("Uploaded file response missing ID")
|
|
112
506
|
|
|
113
|
-
|
|
114
|
-
|
|
115
|
-
|
|
116
|
-
api_params["tools"] = converted_tools
|
|
507
|
+
uploaded_file_ids.append(file_id)
|
|
508
|
+
self._uploaded_file_ids.append(file_id)
|
|
509
|
+
logger.info(f"Uploaded file for File Search (file_id={file_id})")
|
|
117
510
|
|
|
118
|
-
|
|
119
|
-
|
|
120
|
-
|
|
121
|
-
|
|
511
|
+
finally:
|
|
512
|
+
if http_client is not None:
|
|
513
|
+
await http_client.aclose()
|
|
514
|
+
|
|
515
|
+
timestamp = datetime.now(timezone.utc).strftime("%Y%m%d_%H%M%S")
|
|
516
|
+
vector_store_name = f"massgen_file_search_{agent_id or 'default'}_{timestamp}"
|
|
517
|
+
|
|
518
|
+
try:
|
|
519
|
+
vector_store = await client.vector_stores.create(name=vector_store_name)
|
|
520
|
+
except Exception as exc:
|
|
521
|
+
raise UploadFileError(f"Failed to create vector store: {exc}") from exc
|
|
122
522
|
|
|
123
|
-
|
|
124
|
-
|
|
125
|
-
|
|
523
|
+
vector_store_id = getattr(vector_store, "id", None)
|
|
524
|
+
if not vector_store_id:
|
|
525
|
+
raise UploadFileError("Vector store response missing ID")
|
|
526
|
+
|
|
527
|
+
self._vector_store_ids.append(vector_store_id)
|
|
528
|
+
logger.info(
|
|
529
|
+
"Created vector store for File Search",
|
|
530
|
+
extra={
|
|
531
|
+
"vector_store_id": vector_store_id,
|
|
532
|
+
"file_count": len(uploaded_file_ids),
|
|
533
|
+
},
|
|
534
|
+
)
|
|
535
|
+
|
|
536
|
+
for file_id in uploaded_file_ids:
|
|
537
|
+
try:
|
|
538
|
+
vs_file = await client.vector_stores.files.create_and_poll(
|
|
539
|
+
vector_store_id=vector_store_id,
|
|
540
|
+
file_id=file_id,
|
|
541
|
+
)
|
|
542
|
+
logger.info(
|
|
543
|
+
"File indexed and attached to vector store",
|
|
544
|
+
extra={
|
|
545
|
+
"vector_store_id": vector_store_id,
|
|
546
|
+
"file_id": file_id,
|
|
547
|
+
"status": getattr(vs_file, "status", None),
|
|
548
|
+
},
|
|
549
|
+
)
|
|
550
|
+
except Exception as exc:
|
|
551
|
+
raise UploadFileError(
|
|
552
|
+
f"Failed to attach and index file {file_id} to vector store {vector_store_id}: {exc}",
|
|
553
|
+
) from exc
|
|
554
|
+
|
|
555
|
+
if uploaded_file_ids:
|
|
556
|
+
logger.info(
|
|
557
|
+
"All files indexed for File Search; waiting 2s for vector store to stabilize",
|
|
558
|
+
extra={
|
|
559
|
+
"vector_store_id": vector_store_id,
|
|
560
|
+
"file_count": len(uploaded_file_ids),
|
|
561
|
+
},
|
|
126
562
|
)
|
|
563
|
+
await asyncio.sleep(2)
|
|
127
564
|
|
|
128
|
-
|
|
129
|
-
|
|
130
|
-
|
|
131
|
-
|
|
132
|
-
|
|
133
|
-
|
|
134
|
-
|
|
135
|
-
|
|
136
|
-
|
|
137
|
-
|
|
138
|
-
|
|
139
|
-
|
|
140
|
-
|
|
141
|
-
|
|
142
|
-
|
|
143
|
-
|
|
144
|
-
yield StreamChunk(type="content", content=chunk.delta)
|
|
145
|
-
elif chunk.type == "response.web_search_call.in_progress":
|
|
146
|
-
yield StreamChunk(
|
|
147
|
-
type="content",
|
|
148
|
-
content=f"\n🔍 [Provider Tool: Web Search] Starting search...",
|
|
149
|
-
)
|
|
150
|
-
elif chunk.type == "response.web_search_call.searching":
|
|
151
|
-
yield StreamChunk(
|
|
152
|
-
type="content",
|
|
153
|
-
content=f"🔍 [Provider Tool: Web Search] Searching...",
|
|
154
|
-
)
|
|
155
|
-
elif chunk.type == "response.web_search_call.completed":
|
|
156
|
-
yield StreamChunk(
|
|
157
|
-
type="content",
|
|
158
|
-
content=f"✅ [Provider Tool: Web Search] Search completed",
|
|
565
|
+
updated_messages = []
|
|
566
|
+
for message in messages:
|
|
567
|
+
cloned = dict(message)
|
|
568
|
+
if isinstance(message.get("content"), list):
|
|
569
|
+
cloned["content"] = [dict(item) if isinstance(item, dict) else item for item in message["content"]]
|
|
570
|
+
updated_messages.append(cloned)
|
|
571
|
+
for message_index, item_index in reversed(file_locations):
|
|
572
|
+
content_list = updated_messages[message_index].get("content")
|
|
573
|
+
if isinstance(content_list, list):
|
|
574
|
+
content_list.pop(item_index)
|
|
575
|
+
if not content_list:
|
|
576
|
+
content_list.append(
|
|
577
|
+
{
|
|
578
|
+
"type": "text",
|
|
579
|
+
"text": "[Files uploaded for search integration]",
|
|
580
|
+
},
|
|
159
581
|
)
|
|
160
|
-
elif chunk.type == "response.code_interpreter_call.in_progress":
|
|
161
|
-
yield StreamChunk(
|
|
162
|
-
type="content",
|
|
163
|
-
content=f"\n💻 [Provider Tool: Code Interpreter] Starting execution...",
|
|
164
|
-
)
|
|
165
|
-
elif chunk.type == "response.code_interpreter_call.executing":
|
|
166
|
-
yield StreamChunk(
|
|
167
|
-
type="content",
|
|
168
|
-
content=f"💻 [Provider Tool: Code Interpreter] Executing...",
|
|
169
|
-
)
|
|
170
|
-
elif chunk.type == "response.code_interpreter_call.completed":
|
|
171
|
-
yield StreamChunk(
|
|
172
|
-
type="content",
|
|
173
|
-
content=f"✅ [Provider Tool: Code Interpreter] Execution completed",
|
|
174
|
-
)
|
|
175
|
-
elif chunk.type == "response.output_item.done":
|
|
176
|
-
# Get search query or executed code details - show them right after completion
|
|
177
|
-
if hasattr(chunk, "item") and chunk.item:
|
|
178
|
-
if (
|
|
179
|
-
hasattr(chunk.item, "type")
|
|
180
|
-
and chunk.item.type == "web_search_call"
|
|
181
|
-
):
|
|
182
|
-
if hasattr(chunk.item, "action") and hasattr(
|
|
183
|
-
chunk.item.action, "query"
|
|
184
|
-
):
|
|
185
|
-
search_query = chunk.item.action.query
|
|
186
|
-
if search_query:
|
|
187
|
-
yield StreamChunk(
|
|
188
|
-
type="content",
|
|
189
|
-
content=f"🔍 [Search Query] '{search_query}'",
|
|
190
|
-
)
|
|
191
|
-
elif (
|
|
192
|
-
hasattr(chunk.item, "type")
|
|
193
|
-
and chunk.item.type == "code_interpreter_call"
|
|
194
|
-
):
|
|
195
|
-
if hasattr(chunk.item, "code") and chunk.item.code:
|
|
196
|
-
# Format code as a proper code block - don't assume language
|
|
197
|
-
yield StreamChunk(
|
|
198
|
-
type="content",
|
|
199
|
-
content=f"💻 [Code Executed]\n```\n{chunk.item.code}\n```\n",
|
|
200
|
-
)
|
|
201
|
-
|
|
202
|
-
# Also show the execution output if available
|
|
203
|
-
if (
|
|
204
|
-
hasattr(chunk.item, "outputs")
|
|
205
|
-
and chunk.item.outputs
|
|
206
|
-
):
|
|
207
|
-
for output in chunk.item.outputs:
|
|
208
|
-
output_text = None
|
|
209
|
-
if hasattr(output, "text") and output.text:
|
|
210
|
-
output_text = output.text
|
|
211
|
-
elif (
|
|
212
|
-
hasattr(output, "content")
|
|
213
|
-
and output.content
|
|
214
|
-
):
|
|
215
|
-
output_text = output.content
|
|
216
|
-
elif hasattr(output, "data") and output.data:
|
|
217
|
-
output_text = str(output.data)
|
|
218
|
-
elif isinstance(output, str):
|
|
219
|
-
output_text = output
|
|
220
|
-
elif isinstance(output, dict):
|
|
221
|
-
# Handle dict format outputs
|
|
222
|
-
if "text" in output:
|
|
223
|
-
output_text = output["text"]
|
|
224
|
-
elif "content" in output:
|
|
225
|
-
output_text = output["content"]
|
|
226
|
-
elif "data" in output:
|
|
227
|
-
output_text = str(output["data"])
|
|
228
|
-
|
|
229
|
-
if output_text and output_text.strip():
|
|
230
|
-
yield StreamChunk(
|
|
231
|
-
type="content",
|
|
232
|
-
content=f"📊 [Result] {output_text.strip()}\n",
|
|
233
|
-
)
|
|
234
|
-
elif chunk.type == "response.completed":
|
|
235
|
-
# Extract and yield tool calls from the complete response
|
|
236
|
-
if hasattr(chunk, "response"):
|
|
237
|
-
response_dict = self._convert_to_dict(chunk.response)
|
|
238
|
-
|
|
239
|
-
# Extract builtin tool results from output array
|
|
240
|
-
builtin_tool_results = []
|
|
241
|
-
if (
|
|
242
|
-
isinstance(response_dict, dict)
|
|
243
|
-
and "output" in response_dict
|
|
244
|
-
):
|
|
245
|
-
for item in response_dict["output"]:
|
|
246
|
-
if item.get("type") == "code_interpreter_call":
|
|
247
|
-
# Code execution result
|
|
248
|
-
builtin_tool_results.append(
|
|
249
|
-
{
|
|
250
|
-
"id": item.get("id", ""),
|
|
251
|
-
"tool_type": "code_interpreter",
|
|
252
|
-
"status": item.get("status"),
|
|
253
|
-
"code": item.get("code", ""),
|
|
254
|
-
"outputs": item.get("outputs"),
|
|
255
|
-
"container_id": item.get(
|
|
256
|
-
"container_id"
|
|
257
|
-
),
|
|
258
|
-
}
|
|
259
|
-
)
|
|
260
|
-
elif item.get("type") == "web_search_call":
|
|
261
|
-
# Web search result
|
|
262
|
-
builtin_tool_results.append(
|
|
263
|
-
{
|
|
264
|
-
"id": item.get("id", ""),
|
|
265
|
-
"tool_type": "web_search",
|
|
266
|
-
"status": item.get("status"),
|
|
267
|
-
"query": item.get("query", ""),
|
|
268
|
-
"results": item.get("results"),
|
|
269
|
-
}
|
|
270
|
-
)
|
|
271
|
-
|
|
272
|
-
# Yield builtin tool results if any were found
|
|
273
|
-
if builtin_tool_results:
|
|
274
|
-
yield StreamChunk(
|
|
275
|
-
type="builtin_tool_results",
|
|
276
|
-
builtin_tool_results=builtin_tool_results,
|
|
277
|
-
)
|
|
278
582
|
|
|
279
|
-
|
|
280
|
-
|
|
281
|
-
|
|
583
|
+
return updated_messages, vector_store_id
|
|
584
|
+
|
|
585
|
+
except Exception as error:
|
|
586
|
+
logger.warning(f"File Search upload failed: {error}. Continuing without file search.")
|
|
587
|
+
return messages, None
|
|
588
|
+
|
|
589
|
+
async def _cleanup_file_search_resources(
|
|
590
|
+
self,
|
|
591
|
+
client: AsyncOpenAI,
|
|
592
|
+
agent_id: Optional[str] = None,
|
|
593
|
+
) -> None:
|
|
594
|
+
"""Clean up File Search vector stores and uploaded files."""
|
|
595
|
+
|
|
596
|
+
for vector_store_id in list(self._vector_store_ids):
|
|
597
|
+
try:
|
|
598
|
+
await client.vector_stores.delete(vector_store_id)
|
|
599
|
+
logger.info(
|
|
600
|
+
"Deleted File Search vector store",
|
|
601
|
+
extra={
|
|
602
|
+
"vector_store_id": vector_store_id,
|
|
603
|
+
"agent_id": agent_id,
|
|
604
|
+
},
|
|
605
|
+
)
|
|
606
|
+
except Exception as exc:
|
|
607
|
+
logger.warning(
|
|
608
|
+
f"Failed to delete vector store {vector_store_id}: {exc}",
|
|
609
|
+
extra={"agent_id": agent_id},
|
|
610
|
+
)
|
|
611
|
+
|
|
612
|
+
for file_id in list(self._uploaded_file_ids):
|
|
613
|
+
try:
|
|
614
|
+
await client.files.delete(file_id)
|
|
615
|
+
logger.debug(
|
|
616
|
+
"Deleted File Search uploaded file",
|
|
617
|
+
extra={
|
|
618
|
+
"file_id": file_id,
|
|
619
|
+
"agent_id": agent_id,
|
|
620
|
+
},
|
|
621
|
+
)
|
|
622
|
+
except Exception as exc:
|
|
623
|
+
logger.warning(
|
|
624
|
+
f"Failed to delete file {file_id}: {exc}",
|
|
625
|
+
extra={"agent_id": agent_id},
|
|
626
|
+
)
|
|
627
|
+
|
|
628
|
+
self._vector_store_ids.clear()
|
|
629
|
+
self._uploaded_file_ids.clear()
|
|
630
|
+
|
|
631
|
+
# def _save_image_sync(
|
|
632
|
+
# self,
|
|
633
|
+
# image_data: str,
|
|
634
|
+
# prompt: str = None,
|
|
635
|
+
# image_format: str = "png",
|
|
636
|
+
# ) -> Optional[str]:
|
|
637
|
+
# """
|
|
638
|
+
# Save generated image directly to filesystem (synchronous version).
|
|
639
|
+
|
|
640
|
+
# Args:
|
|
641
|
+
# image_data: Base64 encoded image data
|
|
642
|
+
# prompt: Generation prompt (used for naming)
|
|
643
|
+
# image_format: Image format (default png)
|
|
644
|
+
|
|
645
|
+
# Returns:
|
|
646
|
+
# Saved file path, or None if failed
|
|
647
|
+
# """
|
|
648
|
+
# try:
|
|
649
|
+
# # Use agent's filesystem workspace if available, otherwise use current working directory
|
|
650
|
+
# if self.filesystem_manager:
|
|
651
|
+
# workspace_path = self.filesystem_manager.get_current_workspace()
|
|
652
|
+
# else:
|
|
653
|
+
# workspace_path = Path.cwd()
|
|
654
|
+
|
|
655
|
+
# # Create generated_images subdirectory path
|
|
656
|
+
# images_dir = workspace_path
|
|
657
|
+
|
|
658
|
+
# # Create directory if it doesn't exist
|
|
659
|
+
# images_dir.mkdir(parents=True, exist_ok=True)
|
|
660
|
+
|
|
661
|
+
# # Generate filename
|
|
662
|
+
# timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
|
|
663
|
+
# if prompt:
|
|
664
|
+
# # Clean prompt for filename
|
|
665
|
+
# clean_prompt = "".join(c for c in prompt[:30] if c.isalnum() or c in (" ", "-", "_")).strip()
|
|
666
|
+
# clean_prompt = clean_prompt.replace(" ", "_")
|
|
667
|
+
# filename = f"{timestamp}_{clean_prompt}.{image_format}"
|
|
668
|
+
# else:
|
|
669
|
+
# filename = f"{timestamp}_generated.{image_format}"
|
|
670
|
+
|
|
671
|
+
# file_path = images_dir / filename
|
|
672
|
+
|
|
673
|
+
# # Decode base64 and write to file
|
|
674
|
+
# image_bytes = base64.b64decode(image_data)
|
|
675
|
+
# file_path.write_bytes(image_bytes)
|
|
676
|
+
|
|
677
|
+
# logger.info(f"Image saved to: {file_path}")
|
|
678
|
+
# return str(file_path)
|
|
679
|
+
|
|
680
|
+
# except Exception as e:
|
|
681
|
+
# logger.error(f"Error saving image: {e}")
|
|
682
|
+
# return None
|
|
683
|
+
|
|
684
|
+
def _convert_mcp_tools_to_openai_format(self) -> List[Dict[str, Any]]:
|
|
685
|
+
"""Convert MCP tools (stdio + streamable-http) to OpenAI function declarations."""
|
|
686
|
+
if not self._mcp_functions:
|
|
687
|
+
return []
|
|
688
|
+
|
|
689
|
+
converted_tools = []
|
|
690
|
+
for function in self._mcp_functions.values():
|
|
691
|
+
converted_tools.append(function.to_openai_format())
|
|
692
|
+
|
|
693
|
+
logger.debug(
|
|
694
|
+
f"Converted {len(converted_tools)} MCP tools (stdio + streamable-http) to OpenAI format",
|
|
695
|
+
)
|
|
696
|
+
return converted_tools
|
|
697
|
+
|
|
698
|
+
async def _process_stream(self, stream, all_params, agent_id=None):
|
|
699
|
+
async for chunk in stream:
|
|
700
|
+
processed = self._process_stream_chunk(chunk, agent_id)
|
|
701
|
+
if processed.type == "complete_response":
|
|
702
|
+
# Yield the complete response first
|
|
703
|
+
yield processed
|
|
704
|
+
# Then signal completion with done chunk
|
|
705
|
+
log_stream_chunk("backend.response", "done", None, agent_id)
|
|
706
|
+
yield TextStreamChunk(type=ChunkType.DONE, source="response_api")
|
|
707
|
+
else:
|
|
708
|
+
yield processed
|
|
709
|
+
|
|
710
|
+
def _process_stream_chunk(self, chunk, agent_id) -> Union[TextStreamChunk, StreamChunk]:
|
|
711
|
+
"""
|
|
712
|
+
Process individual stream chunks and convert to appropriate chunk format.
|
|
713
|
+
|
|
714
|
+
Returns TextStreamChunk for text/reasoning/tool content,
|
|
715
|
+
or legacy StreamChunk for backward compatibility.
|
|
716
|
+
"""
|
|
717
|
+
|
|
718
|
+
if not hasattr(chunk, "type"):
|
|
719
|
+
# Return legacy StreamChunk for backward compatibility
|
|
720
|
+
return StreamChunk(type="content", content="")
|
|
721
|
+
chunk_type = chunk.type
|
|
722
|
+
|
|
723
|
+
# Handle different chunk types
|
|
724
|
+
if chunk_type == "response.output_text.delta" and hasattr(chunk, "delta"):
|
|
725
|
+
log_backend_agent_message(
|
|
726
|
+
agent_id or "default",
|
|
727
|
+
"RECV",
|
|
728
|
+
{"content": chunk.delta},
|
|
729
|
+
backend_name=self.get_provider_name(),
|
|
730
|
+
)
|
|
731
|
+
log_stream_chunk("backend.response", "content", chunk.delta, agent_id)
|
|
732
|
+
return TextStreamChunk(
|
|
733
|
+
type=ChunkType.CONTENT,
|
|
734
|
+
content=chunk.delta,
|
|
735
|
+
source="response_api",
|
|
736
|
+
)
|
|
737
|
+
|
|
738
|
+
elif chunk_type == "response.reasoning_text.delta" and hasattr(chunk, "delta"):
|
|
739
|
+
log_stream_chunk("backend.response", "reasoning", chunk.delta, agent_id)
|
|
740
|
+
return TextStreamChunk(
|
|
741
|
+
type=ChunkType.REASONING,
|
|
742
|
+
content=f"🧠 [Reasoning] {chunk.delta}",
|
|
743
|
+
reasoning_delta=chunk.delta,
|
|
744
|
+
item_id=getattr(chunk, "item_id", None),
|
|
745
|
+
content_index=getattr(chunk, "content_index", None),
|
|
746
|
+
source="response_api",
|
|
747
|
+
)
|
|
748
|
+
|
|
749
|
+
elif chunk_type == "response.reasoning_text.done":
|
|
750
|
+
reasoning_text = getattr(chunk, "text", "")
|
|
751
|
+
log_stream_chunk("backend.response", "reasoning_done", reasoning_text, agent_id)
|
|
752
|
+
return TextStreamChunk(
|
|
753
|
+
type=ChunkType.REASONING_DONE,
|
|
754
|
+
content="\n🧠 [Reasoning Complete]\n",
|
|
755
|
+
reasoning_text=reasoning_text,
|
|
756
|
+
item_id=getattr(chunk, "item_id", None),
|
|
757
|
+
content_index=getattr(chunk, "content_index", None),
|
|
758
|
+
source="response_api",
|
|
759
|
+
)
|
|
760
|
+
|
|
761
|
+
elif chunk_type == "response.reasoning_summary_text.delta" and hasattr(chunk, "delta"):
|
|
762
|
+
log_stream_chunk("backend.response", "reasoning_summary", chunk.delta, agent_id)
|
|
763
|
+
return TextStreamChunk(
|
|
764
|
+
type=ChunkType.REASONING_SUMMARY,
|
|
765
|
+
content=chunk.delta,
|
|
766
|
+
reasoning_summary_delta=chunk.delta,
|
|
767
|
+
item_id=getattr(chunk, "item_id", None),
|
|
768
|
+
summary_index=getattr(chunk, "summary_index", None),
|
|
769
|
+
source="response_api",
|
|
770
|
+
)
|
|
771
|
+
|
|
772
|
+
elif chunk_type == "response.reasoning_summary_text.done":
|
|
773
|
+
summary_text = getattr(chunk, "text", "")
|
|
774
|
+
log_stream_chunk("backend.response", "reasoning_summary_done", summary_text, agent_id)
|
|
775
|
+
return TextStreamChunk(
|
|
776
|
+
type=ChunkType.REASONING_SUMMARY_DONE,
|
|
777
|
+
content="\n📋 [Reasoning Summary Complete]\n",
|
|
778
|
+
reasoning_summary_text=summary_text,
|
|
779
|
+
item_id=getattr(chunk, "item_id", None),
|
|
780
|
+
summary_index=getattr(chunk, "summary_index", None),
|
|
781
|
+
source="response_api",
|
|
782
|
+
)
|
|
783
|
+
|
|
784
|
+
      784 +         # Provider tool events
      785 +         elif chunk_type == "response.file_search_call.in_progress":
      786 +             item_id = getattr(chunk, "item_id", None)
      787 +             output_index = getattr(chunk, "output_index", None)
      788 +             log_stream_chunk("backend.response", "file_search", "Starting file search", agent_id)
      789 +             return TextStreamChunk(
      790 +                 type=ChunkType.CONTENT,
      791 +                 content="\n📁 [File Search] Starting search...",
      792 +                 item_id=item_id,
      793 +                 content_index=output_index,
      794 +                 source="response_api",
      795 +             )
      796 +         elif chunk_type == "response.file_search_call.searching":
      797 +             item_id = getattr(chunk, "item_id", None)
      798 +             output_index = getattr(chunk, "output_index", None)
      799 +             queries = getattr(chunk, "queries", None)
      800 +             query_text = ""
      801 +             if queries:
      802 +                 try:
      803 +                     if isinstance(queries, (list, tuple)):
      804 +                         query_text = ", ".join(str(q) for q in queries if q)
      805 +                     else:
      806 +                         query_text = str(queries)
      807 +                 except Exception:
      808 +                     query_text = ""
      809 +             message = "\n📁 [File Search] Searching..."
      810 +             if query_text:
      811 +                 message += f" Query: {query_text}"
      812 +             log_stream_chunk(
      813 +                 "backend.response",
      814 +                 "file_search",
      815 +                 f"Searching files{f' for {query_text}' if query_text else ''}",
      816 +                 agent_id,
      817 +             )
      818 +             return TextStreamChunk(
      819 +                 type=ChunkType.CONTENT,
      820 +                 content=message,
      821 +                 item_id=item_id,
      822 +                 content_index=output_index,
      823 +                 source="response_api",
      824 +             )
      825 +         elif chunk_type == "response.file_search_call.completed":
      826 +             item_id = getattr(chunk, "item_id", None)
      827 +             output_index = getattr(chunk, "output_index", None)
      828 +             results = getattr(chunk, "results", None)
      829 +             if results is None:
      830 +                 results = getattr(chunk, "search_results", None)
      831 +             queries = getattr(chunk, "queries", None)
      832 +             query_text = ""
      833 +             if queries:
      834 +                 try:
      835 +                     if isinstance(queries, (list, tuple)):
      836 +                         query_text = ", ".join(str(q) for q in queries if q)
      837 +                     else:
      838 +                         query_text = str(queries)
      839 +                 except Exception:
      840 +                     query_text = ""
      841 +             if results is not None:
      842 +                 try:
      843 +                     result_count = len(results)
      844 +                 except Exception:
      845 +                     result_count = None
      846 +             else:
      847 +                 result_count = None
      848 +             message_parts = ["\n✅ [File Search] Completed"]
      849 +             if query_text:
      850 +                 message_parts.append(f"Query: {query_text}")
      851 +             if result_count is not None:
      852 +                 message_parts.append(f"Results: {result_count}")
      853 +             message = " ".join(message_parts)
      854 +             log_stream_chunk(
      855 +                 "backend.response",
      856 +                 "file_search",
      857 +                 f"Completed file search{f' for {query_text}' if query_text else ''}{f' with {result_count} results' if result_count is not None else ''}",
      858 +                 agent_id,
      859 +             )
      860 +             return TextStreamChunk(
      861 +                 type=ChunkType.CONTENT,
      862 +                 content=message,
      863 +                 item_id=item_id,
      864 +                 content_index=output_index,
      865 +                 source="response_api",
      866 +             )
      867 +
      868 +         elif chunk_type == "response.web_search_call.in_progress":
      869 +             log_stream_chunk("backend.response", "web_search", "Starting search", agent_id)
      870 +             return TextStreamChunk(
      871 +                 type=ChunkType.CONTENT,
      872 +                 content="\n🔍 [Provider Tool: Web Search] Starting search...",
      873 +                 source="response_api",
      874 +             )
      875 +         elif chunk_type == "response.web_search_call.searching":
      876 +             log_stream_chunk("backend.response", "web_search", "Searching", agent_id)
      877 +             return TextStreamChunk(
      878 +                 type=ChunkType.CONTENT,
      879 +                 content="\n🔍 [Provider Tool: Web Search] Searching...",
      880 +                 source="response_api",
      881 +             )
      882 +         elif chunk_type == "response.web_search_call.completed":
      883 +             log_stream_chunk("backend.response", "web_search", "Search completed", agent_id)
      884 +             return TextStreamChunk(
      885 +                 type=ChunkType.CONTENT,
      886 +                 content="\n✅ [Provider Tool: Web Search] Search completed",
      887 +                 source="response_api",
      888 +             )
      889 +
      890 +         elif chunk_type == "response.code_interpreter_call.in_progress":
      891 +             log_stream_chunk("backend.response", "code_interpreter", "Starting execution", agent_id)
      892 +             return TextStreamChunk(
      893 +                 type=ChunkType.CONTENT,
      894 +                 content="\n💻 [Provider Tool: Code Interpreter] Starting execution...",
      895 +                 source="response_api",
      896 +             )
      897 +         elif chunk_type == "response.code_interpreter_call.executing":
      898 +             log_stream_chunk("backend.response", "code_interpreter", "Executing", agent_id)
      899 +             return TextStreamChunk(
      900 +                 type=ChunkType.CONTENT,
      901 +                 content="\n💻 [Provider Tool: Code Interpreter] Executing...",
      902 +                 source="response_api",
      903 +             )
      904 +         elif chunk_type == "response.code_interpreter_call.completed":
      905 +             log_stream_chunk("backend.response", "code_interpreter", "Execution completed", agent_id)
      906 +             return TextStreamChunk(
      907 +                 type=ChunkType.CONTENT,
      908 +                 content="\n✅ [Provider Tool: Code Interpreter] Execution completed",
      909 +                 source="response_api",
      910 +             )
      911 +
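Each provider tool above gets three near-identical status branches keyed on event names of the form `response.<tool>_call.<phase>`. Purely as an illustration of that naming convention (not code from the package), the tool and phase can be recovered generically:

```python
# Sketch only: demonstrates the "response.<tool>_call.<phase>" event naming
# used by the branches above. The helper name is hypothetical.
def split_tool_event(chunk_type: str):
    # "response.web_search_call.searching" -> ("web_search", "searching")
    if chunk_type.startswith("response.") and "_call." in chunk_type:
        tool, phase = chunk_type[len("response."):].split("_call.", 1)
        return tool, phase
    return None, None

assert split_tool_event("response.code_interpreter_call.completed") == ("code_interpreter", "completed")
assert split_tool_event("response.file_search_call.in_progress") == ("file_search", "in_progress")
```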
      912 +         # Image Generation events
      913 +         elif chunk_type == "response.image_generation_call.in_progress":
      914 +             log_stream_chunk("backend.response", "image_generation", "Starting image generation", agent_id)
      915 +             return TextStreamChunk(
      916 +                 type=ChunkType.CONTENT,
      917 +                 content="\n🎨 [Provider Tool: Image Generation] Starting generation...",
      918 +                 source="response_api",
      919 +             )
      920 +         elif chunk_type == "response.image_generation_call.generating":
      921 +             log_stream_chunk("backend.response", "image_generation", "Generating image", agent_id)
      922 +             return TextStreamChunk(
      923 +                 type=ChunkType.CONTENT,
      924 +                 content="\n🎨 [Provider Tool: Image Generation] Generating image...",
      925 +                 source="response_api",
      926 +             )
      927 +         elif chunk_type == "response.image_generation_call.completed":
      928 +             log_stream_chunk("backend.response", "image_generation", "Image generation completed", agent_id)
      929 +             return TextStreamChunk(
      930 +                 type=ChunkType.CONTENT,
      931 +                 content="\n✅ [Provider Tool: Image Generation] Image generated successfully",
      932 +                 source="response_api",
      933 +             )
      934 +         elif chunk_type == "image_generation.completed":
      935 +             # Handle the final image generation result
      936 +             if hasattr(chunk, "b64_json"):
      937 +                 log_stream_chunk("backend.response", "image_generation", "Image data received", agent_id)
      938 +                 # The image is complete, return a status message
      939 +                 return TextStreamChunk(
      940 +                     type=ChunkType.CONTENT,
      941 +                     content="\n✅ [Image Generation] Image successfully created",
      942 +                     source="response_api",
      943 +                 )
      944 +         elif chunk.type == "response.output_item.done":
      945 +             # Get search query or executed code details - show them right after completion
      946 +             if hasattr(chunk, "item") and chunk.item:
      947 +                 if hasattr(chunk.item, "type") and chunk.item.type == "web_search_call":
      948 +                     if hasattr(chunk.item, "action") and ("query" in chunk.item.action):
      949 +                         search_query = chunk.item.action["query"]
      950 +                         if search_query:
      951 +                             log_stream_chunk("backend.response", "search_query", search_query, agent_id)
      952 +                             return TextStreamChunk(
      953 +                                 type=ChunkType.CONTENT,
      954 +                                 content=f"\n🔍 [Search Query] '{search_query}'\n",
      955 +                                 source="response_api",
 282  956                               )
 283       -
 284       -
 285       -
 286       -
 287       -
 288       -
 289       -
 290       -
 291       -
      957 +                 elif hasattr(chunk.item, "type") and chunk.item.type == "code_interpreter_call":
      958 +                     if hasattr(chunk.item, "code") and chunk.item.code:
      959 +                         # Format code as a proper code block - don't assume language
      960 +                         log_stream_chunk("backend.response", "code_executed", chunk.item.code, agent_id)
      961 +                         return TextStreamChunk(
      962 +                             type=ChunkType.CONTENT,
      963 +                             content=f"💻 [Code Executed]\n```\n{chunk.item.code}\n```\n",
      964 +                             source="response_api",
      965 +                         )
      966 +
      967 +                     # Also show the execution output if available
      968 +                     if hasattr(chunk.item, "outputs") and chunk.item.outputs:
      969 +                         for output in chunk.item.outputs:
      970 +                             output_text = None
      971 +                             if hasattr(output, "text") and output.text:
      972 +                                 output_text = output.text
      973 +                             elif hasattr(output, "content") and output.content:
      974 +                                 output_text = output.content
      975 +                             elif hasattr(output, "data") and output.data:
      976 +                                 output_text = str(output.data)
      977 +                             elif isinstance(output, str):
      978 +                                 output_text = output
      979 +                             elif isinstance(output, dict):
      980 +                                 # Handle dict format outputs
      981 +                                 if "text" in output:
      982 +                                     output_text = output["text"]
      983 +                                 elif "content" in output:
      984 +                                     output_text = output["content"]
      985 +                                 elif "data" in output:
      986 +                                     output_text = str(output["data"])
      987 +
      988 +                             if output_text and output_text.strip():
      989 +                                 log_stream_chunk("backend.response", "code_result", output_text.strip(), agent_id)
      990 +                                 return TextStreamChunk(
      991 +                                     type=ChunkType.CONTENT,
      992 +                                     content=f"📊 [Result] {output_text.strip()}\n",
      993 +                                     source="response_api",
      994 +                                 )
      995 +                 elif hasattr(chunk.item, "type") and chunk.item.type == "image_generation_call":
      996 +                     # Image generation completed - show details
      997 +                     if hasattr(chunk.item, "action") and chunk.item.action:
      998 +                         prompt = chunk.item.action.get("prompt", "")
      999 +                         size = chunk.item.action.get("size", "1024x1024")
     1000 +                         if prompt:
     1001 +                             log_stream_chunk("backend.response", "image_prompt", prompt, agent_id)
     1002 +                             return TextStreamChunk(
     1003 +                                 type=ChunkType.CONTENT,
     1004 +                                 content=f"\n🎨 [Image Generated] Prompt: '{prompt}' (Size: {size})\n",
     1005 +                                 source="response_api",
 292 1006                               )
     1007 +         # MCP events
     1008 +         elif chunk_type == "response.mcp_list_tools.started":
     1009 +             return TextStreamChunk(
     1010 +                 type=ChunkType.MCP_STATUS,
     1011 +                 content="\n🔧 [MCP] Listing available tools...",
     1012 +                 source="response_api",
     1013 +             )
     1014 +         elif chunk_type == "response.mcp_list_tools.completed":
     1015 +             return TextStreamChunk(
     1016 +                 type=ChunkType.MCP_STATUS,
     1017 +                 content="\n✅ [MCP] Tool listing completed",
     1018 +                 source="response_api",
     1019 +             )
     1020 +         elif chunk_type == "response.mcp_list_tools.failed":
     1021 +             return TextStreamChunk(
     1022 +                 type=ChunkType.MCP_STATUS,
     1023 +                 content="\n❌ [MCP] Tool listing failed",
     1024 +                 source="response_api",
     1025 +             )
 293 1026
 294       -
 295       -
     1027 +         elif chunk_type == "response.mcp_call.started":
     1028 +             tool_name = getattr(chunk, "tool_name", "unknown")
     1029 +             return TextStreamChunk(
     1030 +                 type=ChunkType.MCP_STATUS,
     1031 +                 content=f"\n🔧 [MCP] Calling tool '{tool_name}'...",
     1032 +                 source="response_api",
     1033 +             )
     1034 +         elif chunk_type == "response.mcp_call.in_progress":
     1035 +             return TextStreamChunk(
     1036 +                 type=ChunkType.MCP_STATUS,
     1037 +                 content="\n⏳ [MCP] Tool execution in progress...",
     1038 +                 source="response_api",
     1039 +             )
     1040 +         elif chunk_type == "response.mcp_call.completed":
     1041 +             tool_name = getattr(chunk, "tool_name", "unknown")
     1042 +             return TextStreamChunk(
     1043 +                 type=ChunkType.MCP_STATUS,
     1044 +                 content=f"\n✅ [MCP] Tool '{tool_name}' completed",
     1045 +                 source="response_api",
     1046 +             )
     1047 +         elif chunk_type == "response.mcp_call.failed":
     1048 +             tool_name = getattr(chunk, "tool_name", "unknown")
     1049 +             error_msg = getattr(chunk, "error", "unknown error")
     1050 +             return TextStreamChunk(
     1051 +                 type=ChunkType.MCP_STATUS,
     1052 +                 content=f"\n❌ [MCP] Tool '{tool_name}' failed: {error_msg}",
     1053 +                 source="response_api",
     1054 +             )
 296 1055
 297       -
 298       - yield
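The MCP branches above differ mainly in the status string (plus, for call start/completion/failure, fields read off the event). As a sketch of an alternative formulation only, the fixed-message cases could be table-driven; the event names and messages are copied from the diff, while the helper itself is hypothetical and not the code shipped in massgen:

```python
from typing import Optional

# Fixed-message MCP lifecycle events and their user-facing status lines,
# copied from the branches above.
MCP_STATUS_MESSAGES = {
    "response.mcp_list_tools.started": "\n🔧 [MCP] Listing available tools...",
    "response.mcp_list_tools.completed": "\n✅ [MCP] Tool listing completed",
    "response.mcp_list_tools.failed": "\n❌ [MCP] Tool listing failed",
    "response.mcp_call.in_progress": "\n⏳ [MCP] Tool execution in progress...",
}

def mcp_status_message(chunk_type: str) -> Optional[str]:
    """Look up the fixed status line for an MCP lifecycle event, if any."""
    return MCP_STATUS_MESSAGES.get(chunk_type)

print(mcp_status_message("response.mcp_list_tools.completed"))
```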
     1056 +         elif chunk.type == "response.completed":
     1057 +             # Extract and yield tool calls from the complete response
     1058 +             if hasattr(chunk, "response"):
     1059 +                 response_dict = self._convert_to_dict(chunk.response)
 299 1060
 300       -
 301       -
 302       -
     1061 +                 # Handle builtin tool results from output array with simple content format
     1062 +                 if isinstance(response_dict, dict) and "output" in response_dict:
     1063 +                     for item in response_dict["output"]:
     1064 +                         if item.get("type") == "code_interpreter_call":
     1065 +                             # Code execution result
     1066 +                             status = item.get("status", "unknown")
     1067 +                             code = item.get("code", "")
     1068 +                             outputs = item.get("outputs")
     1069 +                             content = f"\n🔧 Code Interpreter [{status.title()}]"
     1070 +                             if code:
     1071 +                                 content += f": {code}"
     1072 +                             if outputs:
     1073 +                                 content += f" → {outputs}"
 303 1074
 304       -
 305       -
 306       -
     1075 +                             log_stream_chunk("backend.response", "code_interpreter_result", content, agent_id)
     1076 +                             return TextStreamChunk(
     1077 +                                 type=ChunkType.CONTENT,
     1078 +                                 content=content,
     1079 +                                 source="response_api",
     1080 +                             )
     1081 +                         elif item.get("type") == "web_search_call":
     1082 +                             # Web search result
     1083 +                             status = item.get("status", "unknown")
     1084 +                             # Query is in action.query, not directly in item
     1085 +                             query = item.get("action", {}).get("query", "")
     1086 +                             results = item.get("results")
 307 1087
 308       -
 309       -
 310       -
 311       -
 312       -
 313       -
 314       -
 315       -
 316       -
 317       -
 318       -
 319       -
 320       -
 321       -
 322       -
 323       -
 324       -
 325       - import json
     1088 +                             # Only show web search completion if query is present
     1089 +                             if query:
     1090 +                                 content = f"\n🔧 Web Search [{status.title()}]: {query}"
     1091 +                                 if results:
     1092 +                                     content += f" → Found {len(results)} results"
     1093 +                                 log_stream_chunk("backend.response", "web_search_result", content, agent_id)
     1094 +                                 return TextStreamChunk(
     1095 +                                     type=ChunkType.CONTENT,
     1096 +                                     content=content,
     1097 +                                     source="response_api",
     1098 +                                 )
     1099 +                         elif item.get("type") == "image_generation_call":
     1100 +                             # Image generation result in completed response
     1101 +                             status = item.get("status", "unknown")
     1102 +                             action = item.get("action", {})
     1103 +                             prompt = action.get("prompt", "")
     1104 +                             size = action.get("size", "1024x1024")
 326 1105
 327       -
 328       -
 329       -
 330       -
     1106 +                             if prompt:
     1107 +                                 content = f"\n🔧 Image Generation [{status.title()}]: {prompt} (Size: {size})"
     1108 +                                 log_stream_chunk("backend.response", "image_generation_result", content, agent_id)
     1109 +                                 return TextStreamChunk(
     1110 +                                     type=ChunkType.CONTENT,
     1111 +                                     content=content,
     1112 +                                     source="response_api",
     1113 +                                 )
     1114 +                 # Yield the complete response for internal use
     1115 +                 log_stream_chunk("backend.response", "complete_response", "Response completed", agent_id)
     1116 +                 return TextStreamChunk(
     1117 +                     type=ChunkType.COMPLETE_RESPONSE,
     1118 +                     response=response_dict,
     1119 +                     source="response_api",
     1120 +                 )
 331 1121
 332       -
 333       -
 334       -
 335       -         return tool_call.get("call_id") or tool_call.get("id") or ""
     1122 +         # Default chunk - this should not happen for valid responses
     1123 +         # Return legacy StreamChunk for backward compatibility
     1124 +         return StreamChunk(type="content", content="")
 336 1125
 337 1126       def create_tool_result_message(
 338       -         self,
     1127 +         self,
     1128 +         tool_call: Dict[str, Any],
     1129 +         result_content: str,
 339 1130       ) -> Dict[str, Any]:
 340 1131           """Create tool result message for OpenAI Responses API format."""
 341 1132           tool_call_id = self.extract_tool_call_id(tool_call)
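The hunks around `create_tool_result_message` imply a tool-result message that carries the originating call id plus an `output` string: `extract_tool_call_id` (visible above) prefers `call_id` over `id`, and `extract_tool_result_message_content` (below) reads the `output` key. A plausible shape, shown only as an assumption consistent with those accessors:

```python
# Hypothetical example; the exact message "type" field is an assumption.
tool_call = {"type": "function_call", "call_id": "call_abc123", "name": "get_weather"}
tool_result_message = {
    "type": "function_call_output",        # assumed Responses API output message type
    "call_id": tool_call["call_id"],       # matches extract_tool_call_id() preference
    "output": "22°C and sunny",            # read back by extract_tool_result_message_content()
}
assert tool_result_message.get("output", "") == "22°C and sunny"
```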
@@ -350,6 +1141,9 @@ class ResponseBackend(LLMBackend):
 350 1141           """Extract content from OpenAI Responses API tool result message."""
 351 1142           return tool_result_message.get("output", "")
 352 1143
     1144 +     def _create_client(self, **kwargs) -> AsyncOpenAI:
     1145 +         return openai.AsyncOpenAI(api_key=self.api_key)
     1146 +
 353 1147       def _convert_to_dict(self, obj) -> Dict[str, Any]:
 354 1148           """Convert any object to dictionary with multiple fallback methods."""
 355 1149           try:
@@ -359,39 +1153,18 @@ class ResponseBackend(LLMBackend):
 359 1153                   return obj.dict()
 360 1154               else:
 361 1155                   return dict(obj)
 362       -         except:
     1156 +         except Exception:
 363 1157               # Final fallback: extract key attributes manually
 364       -             return {
 365       -
 366       -
 367       -
 368       -
 369       -
 370       - def
 371       - """
 372       - return
 373       -
 374       - def
 375       -
 376       -
 377       -         """Calculate cost for OpenAI token usage (2024-2025 pricing)."""
 378       -         model_lower = model.lower()
 379       -
 380       -         if "gpt-4" in model_lower:
 381       -             if "4o-mini" in model_lower:
 382       -                 input_cost = input_tokens * 0.00015 / 1000
 383       -                 output_cost = output_tokens * 0.0006 / 1000
 384       -             elif "4o" in model_lower:
 385       -                 input_cost = input_tokens * 0.005 / 1000
 386       -                 output_cost = output_tokens * 0.020 / 1000
 387       -             else:
 388       -                 input_cost = input_tokens * 0.03 / 1000
 389       -                 output_cost = output_tokens * 0.06 / 1000
 390       -         elif "gpt-3.5" in model_lower:
 391       -             input_cost = input_tokens * 0.0005 / 1000
 392       -             output_cost = output_tokens * 0.0015 / 1000
 393       -         else:
 394       -             input_cost = input_tokens * 0.0005 / 1000
 395       -             output_cost = output_tokens * 0.0015 / 1000
 396       -
 397       -         return input_cost + output_cost
     1158 +             return {key: getattr(obj, key, None) for key in dir(obj) if not key.startswith("_") and not callable(getattr(obj, key, None))}
     1159 +
     1160 +     def get_provider_name(self) -> str:
     1161 +         """Get the provider name."""
     1162 +         return "OpenAI"
     1163 +
     1164 +     def get_filesystem_support(self) -> FilesystemSupport:
     1165 +         """OpenAI supports filesystem through MCP servers."""
     1166 +         return FilesystemSupport.MCP
     1167 +
     1168 +     def get_supported_builtin_tools(self) -> List[str]:
     1169 +         """Get list of builtin tools supported by OpenAI."""
     1170 +         return ["web_search", "code_interpreter"]
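The new final fallback in `_convert_to_dict` (line 1158) replaces the removed hand-built dictionary and inline cost table with a scan over public, non-callable attributes. A small standalone illustration of how that comprehension behaves; the `Event` class is invented for the example:

```python
# Standalone illustration of the attribute-scan fallback added at line 1158.
class Event:                      # made-up object standing in for an SDK stream chunk
    type = "response.completed"
    def __init__(self):
        self.item_id = "item_1"
    def render(self):             # callable attributes are filtered out
        return self.type

obj = Event()
as_dict = {key: getattr(obj, key, None) for key in dir(obj) if not key.startswith("_") and not callable(getattr(obj, key, None))}
print(as_dict)                    # {'item_id': 'item_1', 'type': 'response.completed'}
```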