massgen 0.0.3-py3-none-any.whl → 0.1.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.



Files changed (268)
  1. massgen/__init__.py +142 -8
  2. massgen/adapters/__init__.py +29 -0
  3. massgen/adapters/ag2_adapter.py +483 -0
  4. massgen/adapters/base.py +183 -0
  5. massgen/adapters/tests/__init__.py +0 -0
  6. massgen/adapters/tests/test_ag2_adapter.py +439 -0
  7. massgen/adapters/tests/test_agent_adapter.py +128 -0
  8. massgen/adapters/utils/__init__.py +2 -0
  9. massgen/adapters/utils/ag2_utils.py +236 -0
  10. massgen/adapters/utils/tests/__init__.py +0 -0
  11. massgen/adapters/utils/tests/test_ag2_utils.py +138 -0
  12. massgen/agent_config.py +329 -55
  13. massgen/api_params_handler/__init__.py +10 -0
  14. massgen/api_params_handler/_api_params_handler_base.py +99 -0
  15. massgen/api_params_handler/_chat_completions_api_params_handler.py +176 -0
  16. massgen/api_params_handler/_claude_api_params_handler.py +113 -0
  17. massgen/api_params_handler/_response_api_params_handler.py +130 -0
  18. massgen/backend/__init__.py +39 -4
  19. massgen/backend/azure_openai.py +385 -0
  20. massgen/backend/base.py +341 -69
  21. massgen/backend/base_with_mcp.py +1102 -0
  22. massgen/backend/capabilities.py +386 -0
  23. massgen/backend/chat_completions.py +577 -130
  24. massgen/backend/claude.py +1033 -537
  25. massgen/backend/claude_code.py +1203 -0
  26. massgen/backend/cli_base.py +209 -0
  27. massgen/backend/docs/BACKEND_ARCHITECTURE.md +126 -0
  28. massgen/backend/{CLAUDE_API_RESEARCH.md → docs/CLAUDE_API_RESEARCH.md} +18 -18
  29. massgen/backend/{GEMINI_API_DOCUMENTATION.md → docs/GEMINI_API_DOCUMENTATION.md} +9 -9
  30. massgen/backend/docs/Gemini MCP Integration Analysis.md +1050 -0
  31. massgen/backend/docs/MCP_IMPLEMENTATION_CLAUDE_BACKEND.md +177 -0
  32. massgen/backend/docs/MCP_INTEGRATION_RESPONSE_BACKEND.md +352 -0
  33. massgen/backend/docs/OPENAI_GPT5_MODELS.md +211 -0
  34. massgen/backend/{OPENAI_RESPONSES_API_FORMAT.md → docs/OPENAI_RESPONSE_API_TOOL_CALLS.md} +3 -3
  35. massgen/backend/docs/OPENAI_response_streaming.md +20654 -0
  36. massgen/backend/docs/inference_backend.md +257 -0
  37. massgen/backend/docs/permissions_and_context_files.md +1085 -0
  38. massgen/backend/external.py +126 -0
  39. massgen/backend/gemini.py +1850 -241
  40. massgen/backend/grok.py +40 -156
  41. massgen/backend/inference.py +156 -0
  42. massgen/backend/lmstudio.py +171 -0
  43. massgen/backend/response.py +1095 -322
  44. massgen/chat_agent.py +131 -113
  45. massgen/cli.py +1560 -275
  46. massgen/config_builder.py +2396 -0
  47. massgen/configs/BACKEND_CONFIGURATION.md +458 -0
  48. massgen/configs/README.md +559 -216
  49. massgen/configs/ag2/ag2_case_study.yaml +27 -0
  50. massgen/configs/ag2/ag2_coder.yaml +34 -0
  51. massgen/configs/ag2/ag2_coder_case_study.yaml +36 -0
  52. massgen/configs/ag2/ag2_gemini.yaml +27 -0
  53. massgen/configs/ag2/ag2_groupchat.yaml +108 -0
  54. massgen/configs/ag2/ag2_groupchat_gpt.yaml +118 -0
  55. massgen/configs/ag2/ag2_single_agent.yaml +21 -0
  56. massgen/configs/basic/multi/fast_timeout_example.yaml +37 -0
  57. massgen/configs/basic/multi/gemini_4o_claude.yaml +31 -0
  58. massgen/configs/basic/multi/gemini_gpt5nano_claude.yaml +36 -0
  59. massgen/configs/{gemini_4o_claude.yaml → basic/multi/geminicode_4o_claude.yaml} +3 -3
  60. massgen/configs/basic/multi/geminicode_gpt5nano_claude.yaml +36 -0
  61. massgen/configs/basic/multi/glm_gemini_claude.yaml +25 -0
  62. massgen/configs/basic/multi/gpt4o_audio_generation.yaml +30 -0
  63. massgen/configs/basic/multi/gpt4o_image_generation.yaml +31 -0
  64. massgen/configs/basic/multi/gpt5nano_glm_qwen.yaml +26 -0
  65. massgen/configs/basic/multi/gpt5nano_image_understanding.yaml +26 -0
  66. massgen/configs/{three_agents_default.yaml → basic/multi/three_agents_default.yaml} +8 -4
  67. massgen/configs/basic/multi/three_agents_opensource.yaml +27 -0
  68. massgen/configs/basic/multi/three_agents_vllm.yaml +20 -0
  69. massgen/configs/basic/multi/two_agents_gemini.yaml +19 -0
  70. massgen/configs/{two_agents.yaml → basic/multi/two_agents_gpt5.yaml} +14 -6
  71. massgen/configs/basic/multi/two_agents_opensource_lmstudio.yaml +31 -0
  72. massgen/configs/basic/multi/two_qwen_vllm_sglang.yaml +28 -0
  73. massgen/configs/{single_agent.yaml → basic/single/single_agent.yaml} +1 -1
  74. massgen/configs/{single_flash2.5.yaml → basic/single/single_flash2.5.yaml} +1 -2
  75. massgen/configs/basic/single/single_gemini2.5pro.yaml +16 -0
  76. massgen/configs/basic/single/single_gpt4o_audio_generation.yaml +22 -0
  77. massgen/configs/basic/single/single_gpt4o_image_generation.yaml +22 -0
  78. massgen/configs/basic/single/single_gpt4o_video_generation.yaml +24 -0
  79. massgen/configs/basic/single/single_gpt5nano.yaml +20 -0
  80. massgen/configs/basic/single/single_gpt5nano_file_search.yaml +18 -0
  81. massgen/configs/basic/single/single_gpt5nano_image_understanding.yaml +17 -0
  82. massgen/configs/basic/single/single_gptoss120b.yaml +15 -0
  83. massgen/configs/basic/single/single_openrouter_audio_understanding.yaml +15 -0
  84. massgen/configs/basic/single/single_qwen_video_understanding.yaml +15 -0
  85. massgen/configs/debug/code_execution/command_filtering_blacklist.yaml +29 -0
  86. massgen/configs/debug/code_execution/command_filtering_whitelist.yaml +28 -0
  87. massgen/configs/debug/code_execution/docker_verification.yaml +29 -0
  88. massgen/configs/debug/skip_coordination_test.yaml +27 -0
  89. massgen/configs/debug/test_sdk_migration.yaml +17 -0
  90. massgen/configs/docs/DISCORD_MCP_SETUP.md +208 -0
  91. massgen/configs/docs/TWITTER_MCP_ENESCINAR_SETUP.md +82 -0
  92. massgen/configs/providers/azure/azure_openai_multi.yaml +21 -0
  93. massgen/configs/providers/azure/azure_openai_single.yaml +19 -0
  94. massgen/configs/providers/claude/claude.yaml +14 -0
  95. massgen/configs/providers/gemini/gemini_gpt5nano.yaml +28 -0
  96. massgen/configs/providers/local/lmstudio.yaml +11 -0
  97. massgen/configs/providers/openai/gpt5.yaml +46 -0
  98. massgen/configs/providers/openai/gpt5_nano.yaml +46 -0
  99. massgen/configs/providers/others/grok_single_agent.yaml +19 -0
  100. massgen/configs/providers/others/zai_coding_team.yaml +108 -0
  101. massgen/configs/providers/others/zai_glm45.yaml +12 -0
  102. massgen/configs/{creative_team.yaml → teams/creative/creative_team.yaml} +16 -6
  103. massgen/configs/{travel_planning.yaml → teams/creative/travel_planning.yaml} +16 -6
  104. massgen/configs/{news_analysis.yaml → teams/research/news_analysis.yaml} +16 -6
  105. massgen/configs/{research_team.yaml → teams/research/research_team.yaml} +15 -7
  106. massgen/configs/{technical_analysis.yaml → teams/research/technical_analysis.yaml} +16 -6
  107. massgen/configs/tools/code-execution/basic_command_execution.yaml +25 -0
  108. massgen/configs/tools/code-execution/code_execution_use_case_simple.yaml +41 -0
  109. massgen/configs/tools/code-execution/docker_claude_code.yaml +32 -0
  110. massgen/configs/tools/code-execution/docker_multi_agent.yaml +32 -0
  111. massgen/configs/tools/code-execution/docker_simple.yaml +29 -0
  112. massgen/configs/tools/code-execution/docker_with_resource_limits.yaml +32 -0
  113. massgen/configs/tools/code-execution/multi_agent_playwright_automation.yaml +57 -0
  114. massgen/configs/tools/filesystem/cc_gpt5_gemini_filesystem.yaml +34 -0
  115. massgen/configs/tools/filesystem/claude_code_context_sharing.yaml +68 -0
  116. massgen/configs/tools/filesystem/claude_code_flash2.5.yaml +43 -0
  117. massgen/configs/tools/filesystem/claude_code_flash2.5_gptoss.yaml +49 -0
  118. massgen/configs/tools/filesystem/claude_code_gpt5nano.yaml +31 -0
  119. massgen/configs/tools/filesystem/claude_code_single.yaml +40 -0
  120. massgen/configs/tools/filesystem/fs_permissions_test.yaml +87 -0
  121. massgen/configs/tools/filesystem/gemini_gemini_workspace_cleanup.yaml +54 -0
  122. massgen/configs/tools/filesystem/gemini_gpt5_filesystem_casestudy.yaml +30 -0
  123. massgen/configs/tools/filesystem/gemini_gpt5nano_file_context_path.yaml +43 -0
  124. massgen/configs/tools/filesystem/gemini_gpt5nano_protected_paths.yaml +45 -0
  125. massgen/configs/tools/filesystem/gpt5mini_cc_fs_context_path.yaml +31 -0
  126. massgen/configs/tools/filesystem/grok4_gpt5_gemini_filesystem.yaml +32 -0
  127. massgen/configs/tools/filesystem/multiturn/grok4_gpt5_claude_code_filesystem_multiturn.yaml +58 -0
  128. massgen/configs/tools/filesystem/multiturn/grok4_gpt5_gemini_filesystem_multiturn.yaml +58 -0
  129. massgen/configs/tools/filesystem/multiturn/two_claude_code_filesystem_multiturn.yaml +47 -0
  130. massgen/configs/tools/filesystem/multiturn/two_gemini_flash_filesystem_multiturn.yaml +48 -0
  131. massgen/configs/tools/mcp/claude_code_discord_mcp_example.yaml +27 -0
  132. massgen/configs/tools/mcp/claude_code_simple_mcp.yaml +35 -0
  133. massgen/configs/tools/mcp/claude_code_twitter_mcp_example.yaml +32 -0
  134. massgen/configs/tools/mcp/claude_mcp_example.yaml +24 -0
  135. massgen/configs/tools/mcp/claude_mcp_test.yaml +27 -0
  136. massgen/configs/tools/mcp/five_agents_travel_mcp_test.yaml +157 -0
  137. massgen/configs/tools/mcp/five_agents_weather_mcp_test.yaml +103 -0
  138. massgen/configs/tools/mcp/gemini_mcp_example.yaml +24 -0
  139. massgen/configs/tools/mcp/gemini_mcp_filesystem_test.yaml +23 -0
  140. massgen/configs/tools/mcp/gemini_mcp_filesystem_test_sharing.yaml +23 -0
  141. massgen/configs/tools/mcp/gemini_mcp_filesystem_test_single_agent.yaml +17 -0
  142. massgen/configs/tools/mcp/gemini_mcp_filesystem_test_with_claude_code.yaml +24 -0
  143. massgen/configs/tools/mcp/gemini_mcp_test.yaml +27 -0
  144. massgen/configs/tools/mcp/gemini_notion_mcp.yaml +52 -0
  145. massgen/configs/tools/mcp/gpt5_nano_mcp_example.yaml +24 -0
  146. massgen/configs/tools/mcp/gpt5_nano_mcp_test.yaml +27 -0
  147. massgen/configs/tools/mcp/gpt5mini_claude_code_discord_mcp_example.yaml +38 -0
  148. massgen/configs/tools/mcp/gpt_oss_mcp_example.yaml +25 -0
  149. massgen/configs/tools/mcp/gpt_oss_mcp_test.yaml +28 -0
  150. massgen/configs/tools/mcp/grok3_mini_mcp_example.yaml +24 -0
  151. massgen/configs/tools/mcp/grok3_mini_mcp_test.yaml +27 -0
  152. massgen/configs/tools/mcp/multimcp_gemini.yaml +111 -0
  153. massgen/configs/tools/mcp/qwen_api_mcp_example.yaml +25 -0
  154. massgen/configs/tools/mcp/qwen_api_mcp_test.yaml +28 -0
  155. massgen/configs/tools/mcp/qwen_local_mcp_example.yaml +24 -0
  156. massgen/configs/tools/mcp/qwen_local_mcp_test.yaml +27 -0
  157. massgen/configs/tools/planning/five_agents_discord_mcp_planning_mode.yaml +140 -0
  158. massgen/configs/tools/planning/five_agents_filesystem_mcp_planning_mode.yaml +151 -0
  159. massgen/configs/tools/planning/five_agents_notion_mcp_planning_mode.yaml +151 -0
  160. massgen/configs/tools/planning/five_agents_twitter_mcp_planning_mode.yaml +155 -0
  161. massgen/configs/tools/planning/gpt5_mini_case_study_mcp_planning_mode.yaml +73 -0
  162. massgen/configs/tools/web-search/claude_streamable_http_test.yaml +43 -0
  163. massgen/configs/tools/web-search/gemini_streamable_http_test.yaml +43 -0
  164. massgen/configs/tools/web-search/gpt5_mini_streamable_http_test.yaml +43 -0
  165. massgen/configs/tools/web-search/gpt_oss_streamable_http_test.yaml +44 -0
  166. massgen/configs/tools/web-search/grok3_mini_streamable_http_test.yaml +43 -0
  167. massgen/configs/tools/web-search/qwen_api_streamable_http_test.yaml +44 -0
  168. massgen/configs/tools/web-search/qwen_local_streamable_http_test.yaml +43 -0
  169. massgen/coordination_tracker.py +708 -0
  170. massgen/docker/README.md +462 -0
  171. massgen/filesystem_manager/__init__.py +21 -0
  172. massgen/filesystem_manager/_base.py +9 -0
  173. massgen/filesystem_manager/_code_execution_server.py +545 -0
  174. massgen/filesystem_manager/_docker_manager.py +477 -0
  175. massgen/filesystem_manager/_file_operation_tracker.py +248 -0
  176. massgen/filesystem_manager/_filesystem_manager.py +813 -0
  177. massgen/filesystem_manager/_path_permission_manager.py +1261 -0
  178. massgen/filesystem_manager/_workspace_tools_server.py +1815 -0
  179. massgen/formatter/__init__.py +10 -0
  180. massgen/formatter/_chat_completions_formatter.py +284 -0
  181. massgen/formatter/_claude_formatter.py +235 -0
  182. massgen/formatter/_formatter_base.py +156 -0
  183. massgen/formatter/_response_formatter.py +263 -0
  184. massgen/frontend/__init__.py +1 -2
  185. massgen/frontend/coordination_ui.py +471 -286
  186. massgen/frontend/displays/base_display.py +56 -11
  187. massgen/frontend/displays/create_coordination_table.py +1956 -0
  188. massgen/frontend/displays/rich_terminal_display.py +1259 -619
  189. massgen/frontend/displays/simple_display.py +9 -4
  190. massgen/frontend/displays/terminal_display.py +27 -68
  191. massgen/logger_config.py +681 -0
  192. massgen/mcp_tools/README.md +232 -0
  193. massgen/mcp_tools/__init__.py +105 -0
  194. massgen/mcp_tools/backend_utils.py +1035 -0
  195. massgen/mcp_tools/circuit_breaker.py +195 -0
  196. massgen/mcp_tools/client.py +894 -0
  197. massgen/mcp_tools/config_validator.py +138 -0
  198. massgen/mcp_tools/docs/circuit_breaker.md +646 -0
  199. massgen/mcp_tools/docs/client.md +950 -0
  200. massgen/mcp_tools/docs/config_validator.md +478 -0
  201. massgen/mcp_tools/docs/exceptions.md +1165 -0
  202. massgen/mcp_tools/docs/security.md +854 -0
  203. massgen/mcp_tools/exceptions.py +338 -0
  204. massgen/mcp_tools/hooks.py +212 -0
  205. massgen/mcp_tools/security.py +780 -0
  206. massgen/message_templates.py +342 -64
  207. massgen/orchestrator.py +1515 -241
  208. massgen/stream_chunk/__init__.py +35 -0
  209. massgen/stream_chunk/base.py +92 -0
  210. massgen/stream_chunk/multimodal.py +237 -0
  211. massgen/stream_chunk/text.py +162 -0
  212. massgen/tests/mcp_test_server.py +150 -0
  213. massgen/tests/multi_turn_conversation_design.md +0 -8
  214. massgen/tests/test_azure_openai_backend.py +156 -0
  215. massgen/tests/test_backend_capabilities.py +262 -0
  216. massgen/tests/test_backend_event_loop_all.py +179 -0
  217. massgen/tests/test_chat_completions_refactor.py +142 -0
  218. massgen/tests/test_claude_backend.py +15 -28
  219. massgen/tests/test_claude_code.py +268 -0
  220. massgen/tests/test_claude_code_context_sharing.py +233 -0
  221. massgen/tests/test_claude_code_orchestrator.py +175 -0
  222. massgen/tests/test_cli_backends.py +180 -0
  223. massgen/tests/test_code_execution.py +679 -0
  224. massgen/tests/test_external_agent_backend.py +134 -0
  225. massgen/tests/test_final_presentation_fallback.py +237 -0
  226. massgen/tests/test_gemini_planning_mode.py +351 -0
  227. massgen/tests/test_grok_backend.py +7 -10
  228. massgen/tests/test_http_mcp_server.py +42 -0
  229. massgen/tests/test_integration_simple.py +198 -0
  230. massgen/tests/test_mcp_blocking.py +125 -0
  231. massgen/tests/test_message_context_building.py +29 -47
  232. massgen/tests/test_orchestrator_final_presentation.py +48 -0
  233. massgen/tests/test_path_permission_manager.py +2087 -0
  234. massgen/tests/test_rich_terminal_display.py +14 -13
  235. massgen/tests/test_timeout.py +133 -0
  236. massgen/tests/test_v3_3agents.py +11 -12
  237. massgen/tests/test_v3_simple.py +8 -13
  238. massgen/tests/test_v3_three_agents.py +11 -18
  239. massgen/tests/test_v3_two_agents.py +8 -13
  240. massgen/token_manager/__init__.py +7 -0
  241. massgen/token_manager/token_manager.py +400 -0
  242. massgen/utils.py +52 -16
  243. massgen/v1/agent.py +45 -91
  244. massgen/v1/agents.py +18 -53
  245. massgen/v1/backends/gemini.py +50 -153
  246. massgen/v1/backends/grok.py +21 -54
  247. massgen/v1/backends/oai.py +39 -111
  248. massgen/v1/cli.py +36 -93
  249. massgen/v1/config.py +8 -12
  250. massgen/v1/logging.py +43 -127
  251. massgen/v1/main.py +18 -32
  252. massgen/v1/orchestrator.py +68 -209
  253. massgen/v1/streaming_display.py +62 -163
  254. massgen/v1/tools.py +8 -12
  255. massgen/v1/types.py +9 -23
  256. massgen/v1/utils.py +5 -23
  257. massgen-0.1.0.dist-info/METADATA +1245 -0
  258. massgen-0.1.0.dist-info/RECORD +273 -0
  259. massgen-0.1.0.dist-info/entry_points.txt +2 -0
  260. massgen/frontend/logging/__init__.py +0 -9
  261. massgen/frontend/logging/realtime_logger.py +0 -197
  262. massgen-0.0.3.dist-info/METADATA +0 -568
  263. massgen-0.0.3.dist-info/RECORD +0 -76
  264. massgen-0.0.3.dist-info/entry_points.txt +0 -2
  265. massgen/backend/{Function calling openai responses.md → docs/Function calling openai responses.md} +0 -0
  266. {massgen-0.0.3.dist-info → massgen-0.1.0.dist-info}/WHEEL +0 -0
  267. {massgen-0.0.3.dist-info → massgen-0.1.0.dist-info}/licenses/LICENSE +0 -0
  268. {massgen-0.0.3.dist-info → massgen-0.1.0.dist-info}/top_level.txt +0 -0
massgen/backend/cli_base.py
@@ -0,0 +1,209 @@
+ # -*- coding: utf-8 -*-
+ """
+ CLI Backend Base Class - Abstract interface for CLI-based LLM backends.
+
+ This module provides the base class for backends that interact with LLM providers
+ through command-line interfaces (like Claude Code CLI, Gemini CLI, etc.).
+ """
+
+ import asyncio
+ import subprocess
+ import tempfile
+ from abc import abstractmethod
+ from pathlib import Path
+ from typing import Any, AsyncGenerator, Dict, List, Optional
+
+ from .base import LLMBackend, StreamChunk, TokenUsage
+
+
+ class CLIBackend(LLMBackend):
+     """Abstract base class for CLI-based LLM backends."""
+
+     def __init__(self, cli_command: str, api_key: Optional[str] = None, **kwargs):
+         super().__init__(api_key, **kwargs)
+         self.cli_command = cli_command
+         self.working_dir = kwargs.get("working_dir", Path.cwd())
+         self.timeout = kwargs.get("timeout", 300)  # 5 minutes default
+
+     @abstractmethod
+     def _build_command(self, messages: List[Dict[str, Any]], tools: List[Dict[str, Any]], **kwargs) -> List[str]:
+         """Build the CLI command to execute.
+
+         Args:
+             messages: Conversation messages
+             tools: Available tools
+             **kwargs: Additional parameters
+
+         Returns:
+             List of command arguments for subprocess
+         """
+
+     @abstractmethod
+     def _parse_output(self, output: str) -> Dict[str, Any]:
+         """Parse CLI output into structured format.
+
+         Args:
+             output: Raw CLI output
+
+         Returns:
+             Parsed response data
+         """
+
+     async def _execute_cli_command(self, command: List[str]) -> str:
+         """Execute CLI command asynchronously.
+
+         Args:
+             command: Command arguments
+
+         Returns:
+             Command output
+
+         Raises:
+             subprocess.CalledProcessError: If command fails
+             asyncio.TimeoutError: If command times out
+         """
+         process = await asyncio.create_subprocess_exec(
+             *command,
+             stdout=asyncio.subprocess.PIPE,
+             stderr=asyncio.subprocess.PIPE,
+             cwd=self.working_dir,
+         )
+
+         try:
+             stdout, stderr = await asyncio.wait_for(process.communicate(), timeout=self.timeout)
+
+             if process.returncode != 0:
+                 error_msg = stderr.decode("utf-8") if stderr else "Unknown error"
+                 raise subprocess.CalledProcessError(process.returncode, command, error_msg)
+
+             return stdout.decode("utf-8")
+
+         except asyncio.TimeoutError as exc:
+             process.kill()
+             await process.wait()
+             raise asyncio.TimeoutError(f"CLI command timed out after {self.timeout} seconds") from exc
+
+     def _create_temp_file(self, content: str, suffix: str = ".txt") -> Path:
+         """Create a temporary file with content.
+
+         Args:
+             content: File content
+             suffix: File suffix
+
+         Returns:
+             Path to temporary file
+         """
+         with tempfile.NamedTemporaryFile(mode="w", suffix=suffix, delete=False) as temp_file:
+             temp_file.write(content)
+         return Path(temp_file.name)
+
+     def _format_messages_for_cli(self, messages: List[Dict[str, Any]]) -> str:
+         """Format messages for CLI input.
+
+         Args:
+             messages: Conversation messages
+
+         Returns:
+             Formatted string for CLI
+         """
+         formatted_parts = []
+
+         for msg in messages:
+             role = msg.get("role", "user")
+             content = msg.get("content", "")
+
+             if role == "system":
+                 formatted_parts.append(f"System: {content}")
+             elif role == "user":
+                 formatted_parts.append(f"User: {content}")
+             elif role == "assistant":
+                 formatted_parts.append(f"Assistant: {content}")
+
+         return "\n\n".join(formatted_parts)
+
+     async def stream_with_tools(self, messages: List[Dict[str, Any]], tools: List[Dict[str, Any]], **kwargs) -> AsyncGenerator[StreamChunk, None]:
+         """Stream response with tools support."""
+         try:
+             # Build CLI command
+             command = self._build_command(messages, tools, **kwargs)
+
+             # Execute command
+             output = await self._execute_cli_command(command)
+
+             # Parse output
+             parsed_response = self._parse_output(output)
+
+             # Convert to stream chunks
+             async for chunk in self._convert_to_stream_chunks(parsed_response):
+                 yield chunk
+
+         except Exception as e:
+             yield StreamChunk(
+                 type="error",
+                 error=f"CLI backend error: {str(e)}",
+                 source=self.__class__.__name__,
+             )
+
+     async def _convert_to_stream_chunks(self, response: Dict[str, Any]) -> AsyncGenerator[StreamChunk, None]:
+         """Convert parsed response to stream chunks.
+
+         Args:
+             response: Parsed response data
+
+         Yields:
+             StreamChunk objects
+         """
+         # Yield content
+         if "content" in response and response["content"]:
+             yield StreamChunk(
+                 type="content",
+                 content=response["content"],
+                 source=self.__class__.__name__,
+             )
+
+         # Yield tool calls if present
+         if "tool_calls" in response and response["tool_calls"]:
+             yield StreamChunk(
+                 type="tool_calls",
+                 tool_calls=response["tool_calls"],
+                 source=self.__class__.__name__,
+             )
+
+         # Yield complete message
+         yield StreamChunk(
+             type="complete_message",
+             complete_message=response,
+             source=self.__class__.__name__,
+         )
+
+         # Yield done
+         yield StreamChunk(type="done", source=self.__class__.__name__)
+
+     def get_token_usage(self) -> TokenUsage:
+         """Get token usage statistics."""
+         # CLI backends typically don't provide detailed token usage
+         # This could be estimated or left as zero
+         return self.token_usage
+
+     def get_cost_per_token(self) -> Dict[str, float]:
+         """Get cost per token for this provider."""
+         # Override in specific implementations
+         return {"input": 0.0, "output": 0.0}
+
+     def get_model_name(self) -> str:
+         """Get the model name being used."""
+         return self.config.get("model", "unknown")
+
+     def get_provider_info(self) -> Dict[str, Any]:
+         """Get provider information."""
+         return {
+             "provider": self.__class__.__name__,
+             "cli_command": self.cli_command,
+             "model": self.get_model_name(),
+             "supports_tools": True,
+             "supports_streaming": True,
+         }
+
+     def get_provider_name(self) -> str:
+         """Get the name of this provider."""
+         return self.__class__.__name__
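A concrete backend only has to supply the two abstract hooks above. The sketch below is hypothetical — the `fake-llm` CLI, its flags, and the JSON it prints are invented for illustration, and a minimal `LLMBackend` stub stands in for `massgen.backend.base` so the snippet is self-contained:

```python
import json
from typing import Any, Dict, List


class LLMBackend:
    """Stub standing in for massgen.backend.base.LLMBackend so the sketch runs standalone."""

    def __init__(self, api_key=None, **kwargs):
        self.config = kwargs


class FakeCLIBackend(LLMBackend):
    """Hypothetical subclass wrapping an imaginary `fake-llm` CLI that prints one JSON object."""

    def _build_command(self, messages: List[Dict[str, Any]], tools: List[Dict[str, Any]], **kwargs) -> List[str]:
        # Flatten the conversation into a single prompt string, mirroring _format_messages_for_cli.
        prompt = "\n\n".join(f"{m['role'].capitalize()}: {m['content']}" for m in messages)
        return ["fake-llm", "--model", self.config.get("model", "unknown"), "--prompt", prompt]

    def _parse_output(self, output: str) -> Dict[str, Any]:
        # Map the CLI's JSON onto the dict shape _convert_to_stream_chunks expects.
        data = json.loads(output)
        return {"content": data.get("text", ""), "tool_calls": data.get("tool_calls", [])}


# Exercising both hooks without spawning a process:
backend = FakeCLIBackend(model="demo")
cmd = backend._build_command([{"role": "user", "content": "hi"}], tools=[])
parsed = backend._parse_output('{"text": "hello", "tool_calls": []}')
```

A real subclass would import `LLMBackend` from `massgen.backend.base` and let the inherited `stream_with_tools` drive these two hooks.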
massgen/backend/docs/BACKEND_ARCHITECTURE.md
@@ -0,0 +1,126 @@
+ # Backend Architecture: Stateful vs Stateless
+
+ ## Overview
+
+ The MassGen backend system supports two distinct architectural patterns for AI model backends: stateless and stateful. Understanding these patterns is crucial for proper agent implementation and state management.
+
+ ## Backend Types
+
+ ### Stateless Backends
+
+ **Examples:** `ChatCompletionBackend`, OpenAI GPT models, Gemini
+
+ **Characteristics:**
+ - No conversation state maintained between requests
+ - Each request is independent and self-contained
+ - Complete context must be provided with every request
+ - No memory of previous interactions
+ - Simpler to scale horizontally
+
+ **Implementation Pattern:**
+ ```python
+ # Each request includes full conversation history
+ # NOTE: Documentation uses .generate() for clarity; actual code uses .stream_with_tools()
+ response = backend.generate(
+     messages=[
+         {"role": "user", "content": "Previous context..."},
+         {"role": "assistant", "content": "Previous response..."},
+         {"role": "user", "content": "Current request..."}
+     ]
+ )
+ ```
+
+ ### Stateful Backends
+
+ **Examples:** `Claude Code CLI`, interactive CLI sessions
+
+ **Characteristics:**
+ - Maintains conversation context across interactions
+ - State persists between requests
+ - Can reference previous interactions without resending context
+ - Requires explicit state management (reset, clear, etc.)
+ - More complex but efficient for long conversations
+
+ **Implementation Pattern:**
+ ```python
+ # Only the current request is needed; context is maintained internally
+ # NOTE: Documentation uses .generate() for clarity; actual code uses .stream_with_tools()
+ response = backend.generate(message="Current request...")
+ ```
+
+ ## Current Agent Implementation Issue
+
+ The current agent implementation assumes all backends are **stateless**, which creates inefficiencies and potential issues:
+
+ ### Problems with Current Approach:
+ 1. **Redundant Context**: Sends complete conversation history to stateful backends
+ 2. **Inefficient Resource Usage**: Wastes bandwidth and processing power
+ 3. **State Confusion**: May conflict with the backend's internal state management
+ 4. **Reset Handling**: Doesn't properly clear stateful backend state on reset
+
+ ## Recommended Solution
+
+ ### 1. Backend Detection
+ Add capability detection to identify backend type:
+
+ ```python
+ class Backend:
+     @property
+     def is_stateful(self) -> bool:
+         """Returns True if backend maintains conversation state"""
+         return False  # Default to stateless
+ ```
+
+ ### 2. Conditional Context Management
+ Adjust message sending based on backend type:
+
+ ```python
+ # NOTE: Documentation uses .generate() for clarity; actual code uses .stream_with_tools()
+ def send_message(self, message: str):
+     if self.backend.is_stateful:
+         # Send only the current message
+         response = self.backend.generate(message)
+     else:
+         # Send the full conversation history
+         response = self.backend.generate(self.get_full_context())
+ ```
+
+ ### 3. Reset Handling
+ Handle resets differently for each backend type:
+
+ ```python
+ # NOTE: Methods shown are conceptual examples, not the current implementation
+ def reset_conversation(self):
+     if self.backend.is_stateful:
+         # Clear the backend's internal state
+         self.backend.reset()
+     else:
+         # Clear the local conversation history
+         self.conversation_history.clear()
+ ```
+
+ ## Implementation Files
+
+ - `base.py` - Base backend interface with `LLMBackend` abstract class
+ - `chat_completions.py` - Stateless ChatCompletion backends (OpenAI-compatible)
+ - `claude_code.py` - **Stateful** Claude Code backend with streaming support
+ - `cli_base.py` - Base CLI backend functionality
+
+ ## Benefits of Proper Implementation
+
+ 1. **Performance**: Reduced context transmission for stateful backends
+ 2. **Reliability**: Proper state management prevents confusion
+ 3. **Scalability**: Optimized resource usage
+ 4. **Consistency**: Uniform behavior across backend types
+ 5. **Maintainability**: Clear separation of concerns
+
+ ## Next Steps
+
+ 1. Add `is_stateful` property to backend interface
+ 2. Update agent logic to detect and handle backend types
+ 3. Implement proper reset mechanisms for both types
+ 4. Add tests for both stateful and stateless scenarios
+ 5. Update documentation for backend developers
+
+ TODO: Clean up the design - StreamChunk has grown complex with many optional fields for different reasoning types and provider-specific features
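The conditional-context pattern sketched in this document can be exercised end-to-end with stub backends. The snippet below is purely illustrative — `StatelessStub`, `StatefulStub`, and `Agent.send` are invented names, not the shipped agent code:

```python
from typing import List


class StatelessStub:
    """Stateless: sees only whatever context the agent resends each call."""
    is_stateful = False

    def generate(self, payload):
        return f"got {len(payload)} messages"


class StatefulStub:
    """Stateful: tracks conversation state itself across calls."""
    is_stateful = True

    def __init__(self):
        self._turns = 0

    def generate(self, payload):
        self._turns += 1
        return f"turn {self._turns}"


class Agent:
    def __init__(self, backend):
        self.backend = backend
        self.history: List[dict] = []

    def send(self, text: str):
        self.history.append({"role": "user", "content": text})
        if self.backend.is_stateful:
            return self.backend.generate(text)        # current message only
        return self.backend.generate(self.history)    # full history every time


a = Agent(StatelessStub())
a.send("one")
out_stateless = a.send("two")   # history now holds 2 messages

b = Agent(StatefulStub())
b.send("one")
out_stateful = b.send("two")    # backend counted 2 turns internally
```

The point of the dispatch is visible in the outputs: the stateless path's payload grows with every turn, while the stateful path transmits a constant-size message.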
@@ -2,14 +2,14 @@
2
2
 
3
3
  ## API Status & Availability (2025)
4
4
 
5
- ✅ **Production Ready**: Claude API is stable and production-ready
6
- ✅ **Active Development**: Regular updates with new features in 2025
7
- ✅ **Strong SDK Support**: Official Python SDK with async/sync support
5
+ ✅ **Production Ready**: Claude API is stable and production-ready
6
+ ✅ **Active Development**: Regular updates with new features in 2025
7
+ ✅ **Strong SDK Support**: Official Python SDK with async/sync support
8
8
 
9
9
  ## Models Available (2025)
10
10
 
11
11
  - **Claude 4 Opus**: Most capable, hybrid with extended thinking mode
12
- - **Claude 4 Sonnet**: Balanced performance, also available to free users
12
+ - **Claude 4 Sonnet**: Balanced performance, also available to free users
13
13
  - **Claude 3.7 Sonnet**: Previous generation, still supported
14
14
  - **Claude 3.5 Haiku**: Fastest, cost-effective option
15
15
 
@@ -17,7 +17,7 @@
17
17
 
18
18
  ### ✅ Excellent Multi-Tool Support
19
19
  **Key Advantage**: Claude can combine ALL tool types in a single request:
20
- - ✅ **Server-side tools** (web search, code execution)
20
+ - ✅ **Server-side tools** (web search, code execution)
21
21
  - ✅ **User-defined functions** (custom tools)
22
22
  - ✅ **File processing** via Files API
23
23
  - ✅ **No restrictions** on combining different tool types
@@ -114,7 +114,7 @@ response = await beta_client.beta.messages.create(
 
  ## Advanced Features (2025)
 
- ### New Beta Features
+ ### New Beta Features
  - **Code execution**: Python sandbox with server-side execution
  - Header: `"anthropic-beta": "code-execution-2025-05-22"`
  - Tool type: `code_execution_20250522`
@@ -144,7 +144,7 @@ response = await beta_client.beta.messages.create(
 
  **Production Readiness:**
  - ✅ Stable API with predictable pricing
- - ✅ No session limits or experimental restrictions
+ - ✅ No session limits or experimental restrictions
  - ✅ Strong error handling and rate limits
 
  ## Implementation Recommendation
@@ -165,7 +165,7 @@ response = await beta_client.beta.messages.create(
 
  ### Suggested Implementation Order:
  1. ✅ OpenAI Backend (completed)
- 2. ✅ Grok Backend (completed)
+ 2. ✅ Grok Backend (completed)
  3. 🎯 **Claude Backend** (recommended next)
  4. ⏳ Gemini Backend (when API supports multi-tools)
 
@@ -175,27 +175,27 @@ response = await beta_client.beta.messages.create(
  class ClaudeBackend(LLMBackend):
      def __init__(self, api_key: Optional[str] = None):
          self.client = anthropic.AsyncAnthropic(api_key=api_key)
-
+
      async def stream_with_tools(self, messages, tools, **kwargs):
          # Can freely combine all tool types
          combined_tools = []
-
-         # Add server-side tools
+
+         # Add server-side tools
          if kwargs.get("enable_web_search"):
              combined_tools.append({"type": "web_search_20250305"})
-
+
          if kwargs.get("enable_code_execution"):
              combined_tools.append({"type": "code_execution_20250522"})
-
+
          # Add user-defined tools
          if tools:
              combined_tools.extend(tools)
-
+
          # Single API call with all tools - USE BETA CLIENT FOR CODE EXECUTION
          headers = {}
          if kwargs.get("enable_code_execution"):
              headers["anthropic-beta"] = "code-execution-2025-05-22"
-
+
          stream = await self.client.beta.messages.create(
              model="claude-3-5-sonnet-20241022",
              messages=messages,
@@ -203,7 +203,7 @@ class ClaudeBackend(LLMBackend):
              headers=headers,
              stream=True
          )
-
+
          async for event in stream:
              yield StreamChunk(...)
  ```
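The tool-combination logic in the hunk above is easy to lift out as a pure helper. Below is a standalone sketch (the function name `combine_claude_tools` is hypothetical, not part of massgen's actual API) that reproduces the combining rules from the backend sketch so they can be checked without an API call:

```python
from typing import List, Optional, Tuple


def combine_claude_tools(
    user_tools: Optional[List[dict]] = None,
    enable_web_search: bool = False,
    enable_code_execution: bool = False,
) -> Tuple[List[dict], dict]:
    """Build the combined tool list and beta headers, mirroring the
    backend sketch above: server-side tools first, then user tools."""
    combined_tools: List[dict] = []
    headers: dict = {}
    if enable_web_search:
        combined_tools.append({"type": "web_search_20250305"})
    if enable_code_execution:
        combined_tools.append({"type": "code_execution_20250522"})
        # Code execution requires the beta header documented above.
        headers["anthropic-beta"] = "code-execution-2025-05-22"
    if user_tools:
        combined_tools.extend(user_tools)
    return combined_tools, headers


tools, headers = combine_claude_tools(
    user_tools=[{"name": "get_weather"}],
    enable_web_search=True,
    enable_code_execution=True,
)
print(tools)
print(headers)
```

Keeping this assembly step separate from the API call makes the "no restrictions on combining tool types" property directly unit-testable.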
@@ -219,13 +219,13 @@ class ClaudeBackend(LLMBackend):
  ### ✅ Tool Execution Pattern
  Claude's code execution is **server-side** - Claude executes the code and streams results back:
  1. Send request with `code_execution_20250522` tool
- 2. Claude generates code and executes it server-side
+ 2. Claude generates code and executes it server-side
  3. Claude streams back execution results automatically
  4. No client-side tool execution needed for code execution tools
 
  ### ✅ Streaming Event Types to Handle
  - `content_block_start`: Tool use begins
- - `content_block_delta`: Tool input streaming
+ - `content_block_delta`: Tool input streaming
  - `input_json_delta`: Tool arguments as JSON fragments
  - Tool execution results are streamed as additional content blocks
 
@@ -12,7 +12,7 @@ The Gemini API provides access to Google's latest generative AI models with mult
  ## Models Available
 
  1. **Gemini 2.5 Pro**: Most powerful thinking model with features for complex reasoning
- 2. **Gemini 2.5 Flash**: Newest multimodal model with next generation features
+ 2. **Gemini 2.5 Flash**: Newest multimodal model with next generation features
  3. **Gemini 2.5 Flash-Lite**: Lighter version
 
  **Note**: Starting April 29, 2025, Gemini 1.5 Pro and Gemini 1.5 Flash models are not available in projects with no prior usage.
@@ -41,7 +41,7 @@ print(response.text)
  ### Synchronous Streaming
  ```python
  for chunk in client.models.generate_content_stream(
-     model='gemini-2.0-flash',
+     model='gemini-2.0-flash',
      contents='Tell me a story in 300 words.'
  ):
      print(chunk.text)
@@ -51,7 +51,7 @@ for chunk in client.models.generate_content_stream(
  ### Asynchronous Streaming
  ```python
  async for chunk in await client.aio.models.generate_content_stream(
-     model='gemini-2.0-flash',
+     model='gemini-2.0-flash',
      contents="Write a cute story about cats."
  ):
      if chunk.text:
@@ -87,7 +87,7 @@ async def async_demo():
  - Allows models to interact with external tools and APIs
  - Three primary use cases:
    1. Augment Knowledge
-   2. Extend Capabilities
+   2. Extend Capabilities
    3. Take Actions
 
  ### Function Call Workflow
@@ -218,7 +218,7 @@ response = client.models.generate_content(
 
  **Response Format:**
  - `text`: Model's explanatory text
- - `executableCode`: Generated Python code
+ - `executableCode`: Generated Python code
  - `codeExecutionResult`: Execution output
  - Access via `response.candidates[0].content.parts`
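Walking those response parts can be sketched as a small splitter. This standalone example uses plain dicts in place of the SDK's part objects (the field names follow the list above; the mock part shapes are assumptions, not the SDK's exact types):

```python
def split_code_execution_parts(parts):
    """Separate a Gemini code-execution response into explanatory text,
    generated code, and execution output, per the response format above."""
    texts, code, results = [], [], []
    for part in parts:
        if "text" in part:
            texts.append(part["text"])
        elif "executableCode" in part:
            code.append(part["executableCode"]["code"])
        elif "codeExecutionResult" in part:
            results.append(part["codeExecutionResult"]["output"])
    return texts, code, results


# Mocked stand-in for response.candidates[0].content.parts
mock_parts = [
    {"text": "I'll sum the first 10 primes."},
    {"executableCode": {"code": "print(sum([2,3,5,7,11,13,17,19,23,29]))"}},
    {"codeExecutionResult": {"output": "129\n"}},
]
print(split_code_execution_parts(mock_parts))
```

A response can interleave several text/code/result parts, so iterating the whole parts list (rather than reading only the first part) is the safe pattern.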
 
@@ -243,7 +243,7 @@ grounding_tool = types.Tool(google_search=types.GoogleSearch())
  config = types.GenerateContentConfig(tools=[grounding_tool])
 
  response = client.models.generate_content(
-     model="gemini-2.5-flash",
+     model="gemini-2.5-flash",
      contents="Latest AI developments in 2025",
      config=config
  )
@@ -345,11 +345,11 @@ client.models.generate_content(...)
  - `function_declarations` only (user-defined tools)
 
  **❌ NOT Supported:**
- - `code_execution` + `function_declarations`
+ - `code_execution` + `function_declarations`
  - `grounding` + `function_declarations`
  - All three tool types together
 
- ### Live API (Preview/Experimental)
+ ### Live API (Preview/Experimental)
  **✅ Multi-Tool Support:**
  - Can combine `google_search` + `code_execution` + `function_declarations`
  - Full flexibility but comes with major limitations
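The standard-API restriction above can be captured in a small validity check before dispatching a request. This is a hypothetical helper for illustration (it encodes only the rule documented here: server-side tools cannot be mixed with user-defined `function_declarations` outside the Live API):

```python
# Server-side tool names as used in this document
SERVER_TOOLS = {"google_search", "code_execution", "grounding"}


def is_valid_standard_api_combo(tool_types):
    """Return True if a set of Gemini tool types is allowed by the
    standard generate_content API per the restrictions listed above."""
    tool_types = set(tool_types)
    has_server = bool(tool_types & SERVER_TOOLS)
    has_functions = "function_declarations" in tool_types
    # Documented restriction: server-side tools cannot be combined
    # with function_declarations in the standard API.
    return not (has_server and has_functions)


print(is_valid_standard_api_combo({"function_declarations"}))
print(is_valid_standard_api_combo({"code_execution", "function_declarations"}))
```

Failing fast on an unsupported combination gives a clearer error than letting the API reject the request.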
@@ -399,7 +399,7 @@ client.models.generate_content(...)
  **Usage Examples:**
  ```python
  # CLI usage
- python -m massgen.cli --backend gemini --model gemini-2.5-flash "Your question"
+ uv run python -m massgen.cli --backend gemini --model gemini-2.5-flash "Your question"
 
  # Configuration
  AgentConfig.create_gemini_config(