PyPI - massgen - Versions diffs - 0.0.3__py3-none-any.whl → 0.1.0__py3-none-any.whl - Mend

massgen 0.0.3-py3-none-any.whl → 0.1.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of massgen might be problematic. Click here for more details.

Files changed (268)

massgen/__init__.py +142 -8
massgen/adapters/__init__.py +29 -0
massgen/adapters/ag2_adapter.py +483 -0
massgen/adapters/base.py +183 -0
massgen/adapters/tests/__init__.py +0 -0
massgen/adapters/tests/test_ag2_adapter.py +439 -0
massgen/adapters/tests/test_agent_adapter.py +128 -0
massgen/adapters/utils/__init__.py +2 -0
massgen/adapters/utils/ag2_utils.py +236 -0
massgen/adapters/utils/tests/__init__.py +0 -0
massgen/adapters/utils/tests/test_ag2_utils.py +138 -0
massgen/agent_config.py +329 -55
massgen/api_params_handler/__init__.py +10 -0
massgen/api_params_handler/_api_params_handler_base.py +99 -0
massgen/api_params_handler/_chat_completions_api_params_handler.py +176 -0
massgen/api_params_handler/_claude_api_params_handler.py +113 -0
massgen/api_params_handler/_response_api_params_handler.py +130 -0
massgen/backend/__init__.py +39 -4
massgen/backend/azure_openai.py +385 -0
massgen/backend/base.py +341 -69
massgen/backend/base_with_mcp.py +1102 -0
massgen/backend/capabilities.py +386 -0
massgen/backend/chat_completions.py +577 -130
massgen/backend/claude.py +1033 -537
massgen/backend/claude_code.py +1203 -0
massgen/backend/cli_base.py +209 -0
massgen/backend/docs/BACKEND_ARCHITECTURE.md +126 -0
massgen/backend/{CLAUDE_API_RESEARCH.md → docs/CLAUDE_API_RESEARCH.md} +18 -18
massgen/backend/{GEMINI_API_DOCUMENTATION.md → docs/GEMINI_API_DOCUMENTATION.md} +9 -9
massgen/backend/docs/Gemini MCP Integration Analysis.md +1050 -0
massgen/backend/docs/MCP_IMPLEMENTATION_CLAUDE_BACKEND.md +177 -0
massgen/backend/docs/MCP_INTEGRATION_RESPONSE_BACKEND.md +352 -0
massgen/backend/docs/OPENAI_GPT5_MODELS.md +211 -0
massgen/backend/{OPENAI_RESPONSES_API_FORMAT.md → docs/OPENAI_RESPONSE_API_TOOL_CALLS.md} +3 -3
massgen/backend/docs/OPENAI_response_streaming.md +20654 -0
massgen/backend/docs/inference_backend.md +257 -0
massgen/backend/docs/permissions_and_context_files.md +1085 -0
massgen/backend/external.py +126 -0
massgen/backend/gemini.py +1850 -241
massgen/backend/grok.py +40 -156
massgen/backend/inference.py +156 -0
massgen/backend/lmstudio.py +171 -0
massgen/backend/response.py +1095 -322
massgen/chat_agent.py +131 -113
massgen/cli.py +1560 -275
massgen/config_builder.py +2396 -0
massgen/configs/BACKEND_CONFIGURATION.md +458 -0
massgen/configs/README.md +559 -216
massgen/configs/ag2/ag2_case_study.yaml +27 -0
massgen/configs/ag2/ag2_coder.yaml +34 -0
massgen/configs/ag2/ag2_coder_case_study.yaml +36 -0
massgen/configs/ag2/ag2_gemini.yaml +27 -0
massgen/configs/ag2/ag2_groupchat.yaml +108 -0
massgen/configs/ag2/ag2_groupchat_gpt.yaml +118 -0
massgen/configs/ag2/ag2_single_agent.yaml +21 -0
massgen/configs/basic/multi/fast_timeout_example.yaml +37 -0
massgen/configs/basic/multi/gemini_4o_claude.yaml +31 -0
massgen/configs/basic/multi/gemini_gpt5nano_claude.yaml +36 -0
massgen/configs/{gemini_4o_claude.yaml → basic/multi/geminicode_4o_claude.yaml} +3 -3
massgen/configs/basic/multi/geminicode_gpt5nano_claude.yaml +36 -0
massgen/configs/basic/multi/glm_gemini_claude.yaml +25 -0
massgen/configs/basic/multi/gpt4o_audio_generation.yaml +30 -0
massgen/configs/basic/multi/gpt4o_image_generation.yaml +31 -0
massgen/configs/basic/multi/gpt5nano_glm_qwen.yaml +26 -0
massgen/configs/basic/multi/gpt5nano_image_understanding.yaml +26 -0
massgen/configs/{three_agents_default.yaml → basic/multi/three_agents_default.yaml} +8 -4
massgen/configs/basic/multi/three_agents_opensource.yaml +27 -0
massgen/configs/basic/multi/three_agents_vllm.yaml +20 -0
massgen/configs/basic/multi/two_agents_gemini.yaml +19 -0
massgen/configs/{two_agents.yaml → basic/multi/two_agents_gpt5.yaml} +14 -6
massgen/configs/basic/multi/two_agents_opensource_lmstudio.yaml +31 -0
massgen/configs/basic/multi/two_qwen_vllm_sglang.yaml +28 -0
massgen/configs/{single_agent.yaml → basic/single/single_agent.yaml} +1 -1
massgen/configs/{single_flash2.5.yaml → basic/single/single_flash2.5.yaml} +1 -2
massgen/configs/basic/single/single_gemini2.5pro.yaml +16 -0
massgen/configs/basic/single/single_gpt4o_audio_generation.yaml +22 -0
massgen/configs/basic/single/single_gpt4o_image_generation.yaml +22 -0
massgen/configs/basic/single/single_gpt4o_video_generation.yaml +24 -0
massgen/configs/basic/single/single_gpt5nano.yaml +20 -0
massgen/configs/basic/single/single_gpt5nano_file_search.yaml +18 -0
massgen/configs/basic/single/single_gpt5nano_image_understanding.yaml +17 -0
massgen/configs/basic/single/single_gptoss120b.yaml +15 -0
massgen/configs/basic/single/single_openrouter_audio_understanding.yaml +15 -0
massgen/configs/basic/single/single_qwen_video_understanding.yaml +15 -0
massgen/configs/debug/code_execution/command_filtering_blacklist.yaml +29 -0
massgen/configs/debug/code_execution/command_filtering_whitelist.yaml +28 -0
massgen/configs/debug/code_execution/docker_verification.yaml +29 -0
massgen/configs/debug/skip_coordination_test.yaml +27 -0
massgen/configs/debug/test_sdk_migration.yaml +17 -0
massgen/configs/docs/DISCORD_MCP_SETUP.md +208 -0
massgen/configs/docs/TWITTER_MCP_ENESCINAR_SETUP.md +82 -0
massgen/configs/providers/azure/azure_openai_multi.yaml +21 -0
massgen/configs/providers/azure/azure_openai_single.yaml +19 -0
massgen/configs/providers/claude/claude.yaml +14 -0
massgen/configs/providers/gemini/gemini_gpt5nano.yaml +28 -0
massgen/configs/providers/local/lmstudio.yaml +11 -0
massgen/configs/providers/openai/gpt5.yaml +46 -0
massgen/configs/providers/openai/gpt5_nano.yaml +46 -0
massgen/configs/providers/others/grok_single_agent.yaml +19 -0
massgen/configs/providers/others/zai_coding_team.yaml +108 -0
massgen/configs/providers/others/zai_glm45.yaml +12 -0
massgen/configs/{creative_team.yaml → teams/creative/creative_team.yaml} +16 -6
massgen/configs/{travel_planning.yaml → teams/creative/travel_planning.yaml} +16 -6
massgen/configs/{news_analysis.yaml → teams/research/news_analysis.yaml} +16 -6
massgen/configs/{research_team.yaml → teams/research/research_team.yaml} +15 -7
massgen/configs/{technical_analysis.yaml → teams/research/technical_analysis.yaml} +16 -6
massgen/configs/tools/code-execution/basic_command_execution.yaml +25 -0
massgen/configs/tools/code-execution/code_execution_use_case_simple.yaml +41 -0
massgen/configs/tools/code-execution/docker_claude_code.yaml +32 -0
massgen/configs/tools/code-execution/docker_multi_agent.yaml +32 -0
massgen/configs/tools/code-execution/docker_simple.yaml +29 -0
massgen/configs/tools/code-execution/docker_with_resource_limits.yaml +32 -0
massgen/configs/tools/code-execution/multi_agent_playwright_automation.yaml +57 -0
massgen/configs/tools/filesystem/cc_gpt5_gemini_filesystem.yaml +34 -0
massgen/configs/tools/filesystem/claude_code_context_sharing.yaml +68 -0
massgen/configs/tools/filesystem/claude_code_flash2.5.yaml +43 -0
massgen/configs/tools/filesystem/claude_code_flash2.5_gptoss.yaml +49 -0
massgen/configs/tools/filesystem/claude_code_gpt5nano.yaml +31 -0
massgen/configs/tools/filesystem/claude_code_single.yaml +40 -0
massgen/configs/tools/filesystem/fs_permissions_test.yaml +87 -0
massgen/configs/tools/filesystem/gemini_gemini_workspace_cleanup.yaml +54 -0
massgen/configs/tools/filesystem/gemini_gpt5_filesystem_casestudy.yaml +30 -0
massgen/configs/tools/filesystem/gemini_gpt5nano_file_context_path.yaml +43 -0
massgen/configs/tools/filesystem/gemini_gpt5nano_protected_paths.yaml +45 -0
massgen/configs/tools/filesystem/gpt5mini_cc_fs_context_path.yaml +31 -0
massgen/configs/tools/filesystem/grok4_gpt5_gemini_filesystem.yaml +32 -0
massgen/configs/tools/filesystem/multiturn/grok4_gpt5_claude_code_filesystem_multiturn.yaml +58 -0
massgen/configs/tools/filesystem/multiturn/grok4_gpt5_gemini_filesystem_multiturn.yaml +58 -0
massgen/configs/tools/filesystem/multiturn/two_claude_code_filesystem_multiturn.yaml +47 -0
massgen/configs/tools/filesystem/multiturn/two_gemini_flash_filesystem_multiturn.yaml +48 -0
massgen/configs/tools/mcp/claude_code_discord_mcp_example.yaml +27 -0
massgen/configs/tools/mcp/claude_code_simple_mcp.yaml +35 -0
massgen/configs/tools/mcp/claude_code_twitter_mcp_example.yaml +32 -0
massgen/configs/tools/mcp/claude_mcp_example.yaml +24 -0
massgen/configs/tools/mcp/claude_mcp_test.yaml +27 -0
massgen/configs/tools/mcp/five_agents_travel_mcp_test.yaml +157 -0
massgen/configs/tools/mcp/five_agents_weather_mcp_test.yaml +103 -0
massgen/configs/tools/mcp/gemini_mcp_example.yaml +24 -0
massgen/configs/tools/mcp/gemini_mcp_filesystem_test.yaml +23 -0
massgen/configs/tools/mcp/gemini_mcp_filesystem_test_sharing.yaml +23 -0
massgen/configs/tools/mcp/gemini_mcp_filesystem_test_single_agent.yaml +17 -0
massgen/configs/tools/mcp/gemini_mcp_filesystem_test_with_claude_code.yaml +24 -0
massgen/configs/tools/mcp/gemini_mcp_test.yaml +27 -0
massgen/configs/tools/mcp/gemini_notion_mcp.yaml +52 -0
massgen/configs/tools/mcp/gpt5_nano_mcp_example.yaml +24 -0
massgen/configs/tools/mcp/gpt5_nano_mcp_test.yaml +27 -0
massgen/configs/tools/mcp/gpt5mini_claude_code_discord_mcp_example.yaml +38 -0
massgen/configs/tools/mcp/gpt_oss_mcp_example.yaml +25 -0
massgen/configs/tools/mcp/gpt_oss_mcp_test.yaml +28 -0
massgen/configs/tools/mcp/grok3_mini_mcp_example.yaml +24 -0
massgen/configs/tools/mcp/grok3_mini_mcp_test.yaml +27 -0
massgen/configs/tools/mcp/multimcp_gemini.yaml +111 -0
massgen/configs/tools/mcp/qwen_api_mcp_example.yaml +25 -0
massgen/configs/tools/mcp/qwen_api_mcp_test.yaml +28 -0
massgen/configs/tools/mcp/qwen_local_mcp_example.yaml +24 -0
massgen/configs/tools/mcp/qwen_local_mcp_test.yaml +27 -0
massgen/configs/tools/planning/five_agents_discord_mcp_planning_mode.yaml +140 -0
massgen/configs/tools/planning/five_agents_filesystem_mcp_planning_mode.yaml +151 -0
massgen/configs/tools/planning/five_agents_notion_mcp_planning_mode.yaml +151 -0
massgen/configs/tools/planning/five_agents_twitter_mcp_planning_mode.yaml +155 -0
massgen/configs/tools/planning/gpt5_mini_case_study_mcp_planning_mode.yaml +73 -0
massgen/configs/tools/web-search/claude_streamable_http_test.yaml +43 -0
massgen/configs/tools/web-search/gemini_streamable_http_test.yaml +43 -0
massgen/configs/tools/web-search/gpt5_mini_streamable_http_test.yaml +43 -0
massgen/configs/tools/web-search/gpt_oss_streamable_http_test.yaml +44 -0
massgen/configs/tools/web-search/grok3_mini_streamable_http_test.yaml +43 -0
massgen/configs/tools/web-search/qwen_api_streamable_http_test.yaml +44 -0
massgen/configs/tools/web-search/qwen_local_streamable_http_test.yaml +43 -0
massgen/coordination_tracker.py +708 -0
massgen/docker/README.md +462 -0
massgen/filesystem_manager/__init__.py +21 -0
massgen/filesystem_manager/_base.py +9 -0
massgen/filesystem_manager/_code_execution_server.py +545 -0
massgen/filesystem_manager/_docker_manager.py +477 -0
massgen/filesystem_manager/_file_operation_tracker.py +248 -0
massgen/filesystem_manager/_filesystem_manager.py +813 -0
massgen/filesystem_manager/_path_permission_manager.py +1261 -0
massgen/filesystem_manager/_workspace_tools_server.py +1815 -0
massgen/formatter/__init__.py +10 -0
massgen/formatter/_chat_completions_formatter.py +284 -0
massgen/formatter/_claude_formatter.py +235 -0
massgen/formatter/_formatter_base.py +156 -0
massgen/formatter/_response_formatter.py +263 -0
massgen/frontend/__init__.py +1 -2
massgen/frontend/coordination_ui.py +471 -286
massgen/frontend/displays/base_display.py +56 -11
massgen/frontend/displays/create_coordination_table.py +1956 -0
massgen/frontend/displays/rich_terminal_display.py +1259 -619
massgen/frontend/displays/simple_display.py +9 -4
massgen/frontend/displays/terminal_display.py +27 -68
massgen/logger_config.py +681 -0
massgen/mcp_tools/README.md +232 -0
massgen/mcp_tools/__init__.py +105 -0
massgen/mcp_tools/backend_utils.py +1035 -0
massgen/mcp_tools/circuit_breaker.py +195 -0
massgen/mcp_tools/client.py +894 -0
massgen/mcp_tools/config_validator.py +138 -0
massgen/mcp_tools/docs/circuit_breaker.md +646 -0
massgen/mcp_tools/docs/client.md +950 -0
massgen/mcp_tools/docs/config_validator.md +478 -0
massgen/mcp_tools/docs/exceptions.md +1165 -0
massgen/mcp_tools/docs/security.md +854 -0
massgen/mcp_tools/exceptions.py +338 -0
massgen/mcp_tools/hooks.py +212 -0
massgen/mcp_tools/security.py +780 -0
massgen/message_templates.py +342 -64
massgen/orchestrator.py +1515 -241
massgen/stream_chunk/__init__.py +35 -0
massgen/stream_chunk/base.py +92 -0
massgen/stream_chunk/multimodal.py +237 -0
massgen/stream_chunk/text.py +162 -0
massgen/tests/mcp_test_server.py +150 -0
massgen/tests/multi_turn_conversation_design.md +0 -8
massgen/tests/test_azure_openai_backend.py +156 -0
massgen/tests/test_backend_capabilities.py +262 -0
massgen/tests/test_backend_event_loop_all.py +179 -0
massgen/tests/test_chat_completions_refactor.py +142 -0
massgen/tests/test_claude_backend.py +15 -28
massgen/tests/test_claude_code.py +268 -0
massgen/tests/test_claude_code_context_sharing.py +233 -0
massgen/tests/test_claude_code_orchestrator.py +175 -0
massgen/tests/test_cli_backends.py +180 -0
massgen/tests/test_code_execution.py +679 -0
massgen/tests/test_external_agent_backend.py +134 -0
massgen/tests/test_final_presentation_fallback.py +237 -0
massgen/tests/test_gemini_planning_mode.py +351 -0
massgen/tests/test_grok_backend.py +7 -10
massgen/tests/test_http_mcp_server.py +42 -0
massgen/tests/test_integration_simple.py +198 -0
massgen/tests/test_mcp_blocking.py +125 -0
massgen/tests/test_message_context_building.py +29 -47
massgen/tests/test_orchestrator_final_presentation.py +48 -0
massgen/tests/test_path_permission_manager.py +2087 -0
massgen/tests/test_rich_terminal_display.py +14 -13
massgen/tests/test_timeout.py +133 -0
massgen/tests/test_v3_3agents.py +11 -12
massgen/tests/test_v3_simple.py +8 -13
massgen/tests/test_v3_three_agents.py +11 -18
massgen/tests/test_v3_two_agents.py +8 -13
massgen/token_manager/__init__.py +7 -0
massgen/token_manager/token_manager.py +400 -0
massgen/utils.py +52 -16
massgen/v1/agent.py +45 -91
massgen/v1/agents.py +18 -53
massgen/v1/backends/gemini.py +50 -153
massgen/v1/backends/grok.py +21 -54
massgen/v1/backends/oai.py +39 -111
massgen/v1/cli.py +36 -93
massgen/v1/config.py +8 -12
massgen/v1/logging.py +43 -127
massgen/v1/main.py +18 -32
massgen/v1/orchestrator.py +68 -209
massgen/v1/streaming_display.py +62 -163
massgen/v1/tools.py +8 -12
massgen/v1/types.py +9 -23
massgen/v1/utils.py +5 -23
massgen-0.1.0.dist-info/METADATA +1245 -0
massgen-0.1.0.dist-info/RECORD +273 -0
massgen-0.1.0.dist-info/entry_points.txt +2 -0
massgen/frontend/logging/__init__.py +0 -9
massgen/frontend/logging/realtime_logger.py +0 -197
massgen-0.0.3.dist-info/METADATA +0 -568
massgen-0.0.3.dist-info/RECORD +0 -76
massgen-0.0.3.dist-info/entry_points.txt +0 -2
massgen/backend/{Function calling openai responses.md → docs/Function calling openai responses.md} +0 -0
{massgen-0.0.3.dist-info → massgen-0.1.0.dist-info}/WHEEL +0 -0
{massgen-0.0.3.dist-info → massgen-0.1.0.dist-info}/licenses/LICENSE +0 -0
{massgen-0.0.3.dist-info → massgen-0.1.0.dist-info}/top_level.txt +0 -0

massgen/tests/test_azure_openai_backend.py ADDED

@@ -0,0 +1,156 @@
+# -*- coding: utf-8 -*-
+"""
+Test Azure OpenAI backend functionality.
+"""
+import os
+import sys
+from unittest.mock import AsyncMock, MagicMock, patch
+import pytest
+# Add the parent directory to sys.path to allow relative imports
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), ".."))
+from backend.azure_openai import AzureOpenAIBackend  # noqa: E402
+class TestAzureOpenAIBackend:
+    """Test Azure OpenAI backend functionality."""
+    def test_init_with_env_vars(self):
+        """Test initialization with environment variables."""
+        with patch.dict(
+            os.environ,
+            {
+                "AZURE_OPENAI_API_KEY": "test-key",
+                "AZURE_OPENAI_ENDPOINT": "https://test.openai.azure.com/",
+                "AZURE_OPENAI_API_VERSION": "2024-02-15-preview",
+            },
+        ):
+            backend = AzureOpenAIBackend()
+            assert backend.api_key == "test-key"
+            assert backend.azure_endpoint == "https://test.openai.azure.com"
+            assert backend.api_version == "2024-02-15-preview"
+    def test_init_with_kwargs(self):
+        """Test initialization with keyword arguments."""
+        backend = AzureOpenAIBackend(
+            api_key="custom-key",
+            base_url="https://custom.openai.azure.com/",
+            api_version="2024-01-01",
+        )
+        assert backend.api_key == "custom-key"
+        assert backend.azure_endpoint == "https://custom.openai.azure.com"
+        assert backend.api_version == "2024-01-01"
+    def test_init_missing_api_key(self):
+        """Test initialization fails without API key."""
+        with patch.dict(os.environ, {}, clear=True):
+            with pytest.raises(ValueError, match="Azure OpenAI endpoint URL is required"):
+                AzureOpenAIBackend()
+    def test_init_missing_endpoint(self):
+        """Test initialization fails without endpoint."""
+        with patch.dict(os.environ, {"AZURE_OPENAI_API_KEY": "test-key"}, clear=True):
+            with pytest.raises(ValueError, match="Azure OpenAI endpoint URL is required"):
+                AzureOpenAIBackend()
+    def test_init_missing_api_key_with_endpoint(self):
+        """Test initialization fails without API key when endpoint is provided."""
+        with patch.dict(os.environ, {}, clear=True):
+            with pytest.raises(ValueError, match="Azure OpenAI API key is required"):
+                AzureOpenAIBackend(base_url="https://test.openai.azure.com/")
+    def test_base_url_normalization(self):
+        """Test base URL is properly normalized."""
+        backend = AzureOpenAIBackend(api_key="test-key", base_url="https://test.openai.azure.com")
+        assert backend.azure_endpoint == "https://test.openai.azure.com"
+        backend2 = AzureOpenAIBackend(api_key="test-key", base_url="https://test2.openai.azure.com/")
+        assert backend2.azure_endpoint == "https://test2.openai.azure.com"
+    def test_get_provider_name(self):
+        """Test provider name is correct."""
+        backend = AzureOpenAIBackend(api_key="test-key", base_url="https://test.openai.azure.com/")
+        assert backend.get_provider_name() == "Azure OpenAI"
+    def test_estimate_tokens(self):
+        """Test token estimation."""
+        backend = AzureOpenAIBackend(api_key="test-key", base_url="https://test.openai.azure.com/")
+        text = "This is a test message with several words."
+        estimated = backend.estimate_tokens(text)
+        assert estimated > 0
+        assert isinstance(estimated, (int, float))
+    def test_calculate_cost(self):
+        """Test cost calculation."""
+        backend = AzureOpenAIBackend(api_key="test-key", base_url="https://test.openai.azure.com/")
+        # Test GPT-4 cost calculation
+        cost = backend.calculate_cost(1000, 500, "gpt-4o")
+        assert cost > 0
+        assert isinstance(cost, float)
+        # Test GPT-3.5 cost calculation
+        cost2 = backend.calculate_cost(1000, 500, "gpt-3.5-turbo")
+        assert cost2 > 0
+        assert cost2 < cost  # GPT-3.5 should be cheaper than GPT-4
+    @pytest.mark.asyncio
+    async def test_stream_with_tools_missing_model(self):
+        """Test stream_with_tools fails without model parameter."""
+        backend = AzureOpenAIBackend(api_key="test-key", base_url="https://test.openai.azure.com/")
+        messages = [{"role": "user", "content": "Hello"}]
+        tools = []
+        # The validation happens at the beginning of the method, before any API calls
+        # So we don't need to mock the client for this test
+        try:
+            async for chunk in backend.stream_with_tools(messages, tools):
+                # If we get here, the validation didn't work as expected
+                # Check if it's an error chunk
+                if chunk.type == "error" and "deployment name" in chunk.error:
+                    # This is the expected behavior - validation error is yielded as a chunk
+                    return
+                else:
+                    # Unexpected - validation should have failed
+                    pytest.fail(f"Expected validation error, but got chunk: {chunk}")
+        except ValueError as e:
+            # This is the expected behavior - validation error is raised
+            if "deployment name" in str(e):
+                return
+            else:
+                pytest.fail(f"Unexpected ValueError: {e}")
+        except Exception as e:
+            pytest.fail(f"Unexpected exception: {e}")
+    @pytest.mark.asyncio
+    async def test_stream_with_tools_with_model(self):
+        """Test stream_with_tools works with model parameter."""
+        backend = AzureOpenAIBackend(api_key="test-key", base_url="https://test.openai.azure.com/")
+        messages = [{"role": "user", "content": "Hello"}]
+        tools = []
+        # Mock the client and create a mock stream response
+        mock_chunk = MagicMock()
+        mock_chunk.choices = [MagicMock()]
+        mock_chunk.choices[0].delta = MagicMock()
+        mock_chunk.choices[0].delta.content = "Hello"
+        mock_chunk.choices[0].finish_reason = "stop"
+        mock_stream = [mock_chunk]
+        with patch.object(backend, "client") as mock_client:
+            mock_client.chat.completions.create = AsyncMock(return_value=mock_stream)
+            # Test that it doesn't raise an error with model parameter
+            try:
+                async for chunk in backend.stream_with_tools(messages, tools, model="gpt-4"):
+                    # Just consume the stream
+                    pass
+            except Exception as e:
+                # If there's an error, it should not be about missing model
+                assert "deployment name" not in str(e)

massgen/tests/test_backend_capabilities.py ADDED

@@ -0,0 +1,262 @@
+# -*- coding: utf-8 -*-
+"""
+Tests for backend capabilities registry.
+These tests ensure the capabilities registry is consistent and valid.
+Run with: uv run pytest massgen/tests/test_backend_capabilities.py -v
+"""
+import pytest
+from massgen.backend.capabilities import (
+    BACKEND_CAPABILITIES,
+    get_all_backend_types,
+    get_backends_with_capability,
+    get_capabilities,
+    has_capability,
+    validate_backend_config,
+)
+class TestBackendCapabilitiesRegistry:
+    """Test the capabilities registry structure and validity."""
+    def test_all_backends_have_required_fields(self):
+        """Ensure all backend entries have required fields."""
+        for backend_type, caps in BACKEND_CAPABILITIES.items():
+            assert caps.backend_type == backend_type, f"{backend_type}: backend_type mismatch"
+            assert caps.provider_name, f"{backend_type}: provider_name is empty"
+            assert caps.supported_capabilities is not None, f"{backend_type}: supported_capabilities is None"
+            assert caps.builtin_tools is not None, f"{backend_type}: builtin_tools is None"
+            assert caps.filesystem_support in ["none", "native", "mcp"], f"{backend_type}: invalid filesystem_support"
+            assert caps.models, f"{backend_type}: models list is empty"
+            assert caps.default_model, f"{backend_type}: default_model is empty"
+    def test_default_model_in_models_list(self):
+        """Ensure default model exists in models list."""
+        for backend_type, caps in BACKEND_CAPABILITIES.items():
+            assert caps.default_model in caps.models, f"{backend_type}: default_model '{caps.default_model}' not in models list"
+    def test_filesystem_support_values(self):
+        """Ensure filesystem_support has valid values."""
+        valid_values = {"none", "native", "mcp"}
+        for backend_type, caps in BACKEND_CAPABILITIES.items():
+            assert caps.filesystem_support in valid_values, f"{backend_type}: filesystem_support '{caps.filesystem_support}' " f"not in {valid_values}"
+    def test_no_empty_backend_types(self):
+        """Ensure no backend has an empty backend_type."""
+        for backend_type, caps in BACKEND_CAPABILITIES.items():
+            assert backend_type, "Found backend with empty backend_type"
+            assert caps.backend_type, f"Backend {backend_type} has empty backend_type field"
+    def test_capability_strings_are_valid(self):
+        """Ensure capability strings follow conventions."""
+        valid_capabilities = {
+            "web_search",
+            "code_execution",
+            "bash",
+            "multimodal",  # Legacy - being phased out
+            "vision",  # Legacy - use image_understanding
+            "mcp",
+            "filesystem_native",
+            "filesystem_mcp",
+            "reasoning",
+            "image_generation",
+            "image_understanding",
+            "audio_generation",
+            "audio_understanding",
+            "video_generation",
+            "video_understanding",
+        }
+        for backend_type, caps in BACKEND_CAPABILITIES.items():
+            for cap in caps.supported_capabilities:
+                assert cap in valid_capabilities, f"{backend_type}: unknown capability '{cap}'. " f"Valid capabilities: {valid_capabilities}"
+class TestCapabilityQueries:
+    """Test capability query functions."""
+    def test_get_capabilities_existing_backend(self):
+        """Test getting capabilities for existing backends."""
+        caps = get_capabilities("openai")
+        assert caps is not None
+        assert caps.backend_type == "openai"
+        assert caps.provider_name == "OpenAI"
+    def test_get_capabilities_nonexistent_backend(self):
+        """Test getting capabilities for non-existent backend."""
+        caps = get_capabilities("nonexistent_backend")
+        assert caps is None
+    def test_has_capability_true(self):
+        """Test checking for existing capability."""
+        # OpenAI has web_search
+        assert has_capability("openai", "web_search") is True
+    def test_has_capability_false(self):
+        """Test checking for non-existent capability."""
+        # LM Studio doesn't have web_search
+        assert has_capability("lmstudio", "web_search") is False
+    def test_has_capability_nonexistent_backend(self):
+        """Test checking capability on non-existent backend."""
+        assert has_capability("nonexistent", "web_search") is False
+    def test_get_all_backend_types(self):
+        """Test getting all backend types."""
+        backend_types = get_all_backend_types()
+        assert len(backend_types) > 0
+        assert "openai" in backend_types
+        assert "claude" in backend_types
+        assert "gemini" in backend_types
+    def test_get_backends_with_capability(self):
+        """Test getting backends by capability."""
+        web_search_backends = get_backends_with_capability("web_search")
+        assert "openai" in web_search_backends
+        assert "gemini" in web_search_backends
+        assert "grok" in web_search_backends
+        # Backends without web search should not be included
+        assert "claude_code" not in web_search_backends
+class TestBackendValidation:
+    """Test backend configuration validation."""
+    def test_validate_valid_openai_config(self):
+        """Test validating a valid OpenAI config."""
+        config = {
+            "type": "openai",
+            "model": "gpt-4o",
+            "enable_web_search": True,
+            "enable_code_interpreter": True,
+        }
+        errors = validate_backend_config("openai", config)
+        assert len(errors) == 0
+    def test_validate_invalid_capability(self):
+        """Test validation catches unsupported capability."""
+        # Claude Code doesn't support web_search
+        config = {
+            "type": "claude_code",
+            "enable_web_search": True,
+        }
+        errors = validate_backend_config("claude_code", config)
+        assert len(errors) > 0
+        assert any("web_search" in error for error in errors)
+    def test_validate_invalid_backend_type(self):
+        """Test validation catches unknown backend."""
+        config = {"type": "nonexistent"}
+        errors = validate_backend_config("nonexistent", config)
+        assert len(errors) > 0
+        assert any("Unknown backend" in error for error in errors)
+    def test_validate_code_execution_variants(self):
+        """Test validation handles different code execution config keys."""
+        # OpenAI uses enable_code_interpreter
+        config_openai = {"type": "openai", "enable_code_interpreter": True}
+        errors = validate_backend_config("openai", config_openai)
+        assert len(errors) == 0
+        # Claude uses enable_code_execution
+        config_claude = {"type": "claude", "enable_code_execution": True}
+        errors = validate_backend_config("claude", config_claude)
+        assert len(errors) == 0
+    def test_validate_mcp_servers(self):
+        """Test validation of MCP server configuration."""
+        # Valid MCP config for backend that supports it
+        config = {
+            "type": "openai",
+            "mcp_servers": [
+                {
+                    "name": "weather",
+                    "command": "npx",
+                    "args": ["-y", "@fak111/weather-mcp"],
+                },
+            ],
+        }
+        errors = validate_backend_config("openai", config)
+        assert len(errors) == 0
+class TestSpecificBackends:
+    """Test specific backend configurations."""
+    def test_openai_capabilities(self):
+        """Test OpenAI backend capabilities."""
+        caps = get_capabilities("openai")
+        assert "web_search" in caps.supported_capabilities
+        assert "code_execution" in caps.supported_capabilities
+        assert "mcp" in caps.supported_capabilities
+        assert "reasoning" in caps.supported_capabilities
+        assert "image_generation" in caps.supported_capabilities
+        assert "image_understanding" in caps.supported_capabilities
+        assert "audio_generation" in caps.supported_capabilities
+        assert "video_generation" in caps.supported_capabilities
+        assert caps.filesystem_support == "mcp"
+        assert caps.env_var == "OPENAI_API_KEY"
+    def test_claude_capabilities(self):
+        """Test Claude backend capabilities."""
+        caps = get_capabilities("claude")
+        assert "web_search" in caps.supported_capabilities
+        assert "code_execution" in caps.supported_capabilities
+        assert "mcp" in caps.supported_capabilities
+        assert caps.filesystem_support == "mcp"
+        assert caps.env_var == "ANTHROPIC_API_KEY"
+    def test_claude_code_capabilities(self):
+        """Test Claude Code backend capabilities."""
+        caps = get_capabilities("claude_code")
+        assert "bash" in caps.supported_capabilities
+        assert "mcp" in caps.supported_capabilities
+        assert caps.filesystem_support == "native"
+        assert caps.env_var == "ANTHROPIC_API_KEY"
+        assert len(caps.builtin_tools) > 0
+    def test_gemini_capabilities(self):
+        """Test Gemini backend capabilities."""
+        caps = get_capabilities("gemini")
+        assert "web_search" in caps.supported_capabilities
+        assert "code_execution" in caps.supported_capabilities
+        assert "mcp" in caps.supported_capabilities
+        assert "image_understanding" in caps.supported_capabilities
+        assert caps.filesystem_support == "mcp"
+        assert caps.env_var == "GEMINI_API_KEY"
+    def test_local_backends_no_api_key(self):
+        """Test local backends don't require API keys."""
+        local_backends = ["lmstudio", "inference", "chatcompletion"]
+        for backend_type in local_backends:
+            caps = get_capabilities(backend_type)
+            # These backends may or may not require API keys depending on provider
+            # Just verify they're in the registry
+            assert caps is not None
+class TestConsistency:
+    """Test consistency between related fields."""
+    def test_filesystem_native_implies_capability(self):
+        """Backends with native filesystem should have filesystem capability."""
+        for backend_type, caps in BACKEND_CAPABILITIES.items():
+            if caps.filesystem_support == "native":
+                # Should have filesystem_native in capabilities
+                assert "filesystem_native" in caps.supported_capabilities or len(caps.builtin_tools) > 0, f"{backend_type}: native filesystem but no capability/tools"  # Or have filesystem tools
+    def test_mcp_capability_consistency(self):
+        """All backends should support MCP except where explicitly excluded."""
+        # Most backends support MCP
+        mcp_backends = get_backends_with_capability("mcp")
+        assert len(mcp_backends) > 0
+        assert "openai" in mcp_backends
+        assert "claude" in mcp_backends
+        assert "gemini" in mcp_backends
+if __name__ == "__main__":
+    pytest.main([__file__, "-v"])

massgen/tests/test_backend_event_loop_all.py ADDED

@@ -0,0 +1,179 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""
+Event loop/resource cleanup tests for multiple backends without changing code.
+These tests mock SDK async clients and assert aclose() is awaited by backends.
+Backends covered:
+- ResponseBackend (OpenAI Responses API)
+- GrokBackend (xAI via OpenAI-compatible client)
+- ClaudeBackend (Anthropic Messages API)
+NOTE: Some tests may currently FAIL, revealing missing cleanup in backends.
+"""
+import asyncio
+from types import SimpleNamespace
+from typing import Any, List
+import pytest
+from massgen.backend import ClaudeBackend, GrokBackend, ResponseBackend
+# ---- Common fakes ----
+class _FakeStreamSingleStop:
+    """Async iterator that produces exactly one item and is exhausted afterwards.
+    The item comes from ``item_factory``, so each test can shape the chunk its backend expects.
+    """
+    def __init__(self, item_factory):
+        self._item_factory = item_factory
+        self._yielded = False
+    def __aiter__(self):
+        # The object is its own iterator.
+        return self
+    async def __anext__(self):
+        already_done, self._yielded = self._yielded, True
+        if already_done:
+            raise StopAsyncIteration
+        # Yield control to the event loop once before handing out the item.
+        await asyncio.sleep(0)
+        return self._item_factory()
+class _FakeAsyncClientBase:
+    """Stand-in for an SDK async client that records whether it has been closed.
+    Constructor arguments are kept on ``args``/``kwargs``; ``_closed`` becomes True once
+    either ``aclose()`` or ``close()`` has been awaited.
+    """
+    def __init__(self, *args: Any, **kwargs: Any):
+        self.args = args
+        self.kwargs = kwargs
+        self._closed = False
+    async def aclose(self) -> None:
+        """Mark the client closed after yielding to the event loop once."""
+        await asyncio.sleep(0)
+        self._closed = True
+    async def close(self) -> None:
+        """Same as ``aclose()``; the real AsyncOpenAI/AsyncAnthropic clients name this method ``close``."""
+        # Delegating keeps a single place where the closed flag is set, so a backend
+        # that closes the client through either name is observed the same way.
+        await self.aclose()
+# ---- ResponseBackend test ----
+class _FakeResponses:
+    """Fake of the client's ``responses`` attribute used by the ResponseBackend test."""
+    async def create(self, **kwargs: Any):
+        """Ignore the request arguments and return a stream holding one ``response.completed`` chunk."""
+        # The chunk is built lazily, at the moment the stream is advanced.
+        return _FakeStreamSingleStop(lambda: SimpleNamespace(type="response.completed", response={"output": []}))
+class _FakeOpenAIClient(_FakeAsyncClientBase):
+    """Fake OpenAI client whose ``responses`` attribute is a ``_FakeResponses``."""
+    def __init__(self, *args: Any, **kwargs: Any):
+        super().__init__(*args, **kwargs)
+        responses_api = _FakeResponses()
+        self.responses = responses_api
+@pytest.mark.asyncio
+async def test_response_backend_stream_closes_client(monkeypatch):
+    """ResponseBackend should close the one client it creates while streaming."""
+    import sys
+    clients: List[_FakeOpenAIClient] = []
+    def _make_client(*args: Any, **kwargs: Any) -> _FakeOpenAIClient:
+        # Record every client that gets constructed so it can be inspected afterwards.
+        clients.append(_FakeOpenAIClient(*args, **kwargs))
+        return clients[-1]
+    # Register a stub ``openai`` module so an import performed inside the backend
+    # picks up the recording factory as AsyncOpenAI.
+    fake_openai = SimpleNamespace(AsyncOpenAI=_make_client)
+    monkeypatch.setitem(sys.modules, "openai", fake_openai)
+    backend = ResponseBackend()
+    conversation = [{"role": "user", "content": "hi"}]
+    # Exhaust the stream; the yielded chunks themselves are not examined.
+    async for _chunk in backend.stream_with_tools(conversation, tools=[], model="gpt-4o-mini"):
+        pass
+    assert len(clients) == 1
+    # The client must have been closed, to avoid event-loop errors.
+    only_client = clients[0]
+    assert only_client._closed is True
+# ---- GrokBackend test ----
+class _FakeChatCompletions:
+    """Fake of ``client.chat.completions`` used by the GrokBackend test."""
+    async def create(self, **kwargs: Any):
+        """Ignore the request arguments and return a stream holding one finishing chunk."""
+        # Chunk shape: a single choice with no delta and finish_reason "stop", and no usage.
+        return _FakeStreamSingleStop(
+            lambda: SimpleNamespace(choices=[SimpleNamespace(delta=None, finish_reason="stop")], usage=None)
+        )
+class _FakeOpenAIClientForGrok(_FakeAsyncClientBase):
+    """Fake OpenAI-compatible client exposing ``chat.completions`` for the Grok test."""
+    def __init__(self, *args: Any, **kwargs: Any):
+        super().__init__(*args, **kwargs)
+        completions = _FakeChatCompletions()
+        self.chat = SimpleNamespace(completions=completions)
+@pytest.mark.asyncio
+async def test_grok_backend_stream_closes_client(monkeypatch):
+    """GrokBackend should close the one client it creates while streaming."""
+    import sys
+    clients: List[_FakeOpenAIClientForGrok] = []
+    def _make_client(*args: Any, **kwargs: Any) -> _FakeOpenAIClientForGrok:
+        # Record every client that gets constructed so it can be inspected afterwards.
+        clients.append(_FakeOpenAIClientForGrok(*args, **kwargs))
+        return clients[-1]
+    # Register a stub ``openai`` module so an import performed inside the backend
+    # picks up the recording factory as AsyncOpenAI.
+    fake_openai = SimpleNamespace(AsyncOpenAI=_make_client)
+    monkeypatch.setitem(sys.modules, "openai", fake_openai)
+    backend = GrokBackend()
+    conversation = [{"role": "user", "content": "hi"}]
+    # Exhaust the stream; the yielded chunks themselves are not examined.
+    async for _chunk in backend.stream_with_tools(conversation, tools=[], model="grok-2-mini"):
+        pass
+    assert len(clients) == 1
+    # The client must have been closed, to avoid event-loop errors.
+    only_client = clients[0]
+    assert only_client._closed is True
+# ---- ClaudeBackend test ----
+class _FakeClaudeMessages:
+    """Fake of the Anthropic client's ``messages`` attribute used by the ClaudeBackend test."""
+    async def create(self, **kwargs: Any):
+        """Ignore the request arguments and return a stream holding one ``message_stop`` event."""
+        # The event is built lazily, at the moment the stream is advanced.
+        return _FakeStreamSingleStop(lambda: SimpleNamespace(type="message_stop"))
+class _FakeAnthropicClient(_FakeAsyncClientBase):
+    """Fake Anthropic client exposing both ``messages`` and ``beta.messages``."""
+    def __init__(self, *args: Any, **kwargs: Any):
+        super().__init__(*args, **kwargs)
+        # Both access paths are provided, each with its own fake, to cover either branch.
+        self.messages = _FakeClaudeMessages()
+        beta_messages = _FakeClaudeMessages()
+        self.beta = SimpleNamespace(messages=beta_messages)
+@pytest.mark.asyncio
+async def test_claude_backend_stream_closes_client(monkeypatch):
+    """ClaudeBackend should close the one client it creates while streaming."""
+    import sys
+    clients: List[_FakeAnthropicClient] = []
+    def _make_client(*args: Any, **kwargs: Any) -> _FakeAnthropicClient:
+        # Record every client that gets constructed so it can be inspected afterwards.
+        clients.append(_FakeAnthropicClient(*args, **kwargs))
+        return clients[-1]
+    # Register a stub ``anthropic`` module so an import performed inside the backend
+    # picks up the recording factory as AsyncAnthropic.
+    fake_anthropic = SimpleNamespace(AsyncAnthropic=_make_client)
+    monkeypatch.setitem(sys.modules, "anthropic", fake_anthropic)
+    backend = ClaudeBackend()
+    conversation = [{"role": "user", "content": "hi"}]
+    # Exhaust the stream; the yielded events themselves are not examined.
+    async for _event in backend.stream_with_tools(conversation, tools=[], model="claude-3.7-sonnet"):
+        pass
+    assert len(clients) == 1
+    # The client must have been closed, to avoid event-loop errors.
+    only_client = clients[0]
+    assert only_client._closed is True

massgen 0.0.3__py3-none-any.whl → 0.1.0__py3-none-any.whl

Potentially problematic release.

massgen 0.0.3py3-none-any.whl → 0.1.0py3-none-any.whl