PyPI - massgen - Versions diffs - 0.0.3__py3-none-any.whl - Mend

massgen 0.0.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of massgen might be problematic. Click here for more details.

Files changed (76) hide show

massgen/__init__.py +94 -0
massgen/agent_config.py +507 -0
massgen/backend/CLAUDE_API_RESEARCH.md +266 -0
massgen/backend/Function calling openai responses.md +1161 -0
massgen/backend/GEMINI_API_DOCUMENTATION.md +410 -0
massgen/backend/OPENAI_RESPONSES_API_FORMAT.md +65 -0
massgen/backend/__init__.py +25 -0
massgen/backend/base.py +180 -0
massgen/backend/chat_completions.py +228 -0
massgen/backend/claude.py +661 -0
massgen/backend/gemini.py +652 -0
massgen/backend/grok.py +187 -0
massgen/backend/response.py +397 -0
massgen/chat_agent.py +440 -0
massgen/cli.py +686 -0
massgen/configs/README.md +293 -0
massgen/configs/creative_team.yaml +53 -0
massgen/configs/gemini_4o_claude.yaml +31 -0
massgen/configs/news_analysis.yaml +51 -0
massgen/configs/research_team.yaml +51 -0
massgen/configs/single_agent.yaml +18 -0
massgen/configs/single_flash2.5.yaml +44 -0
massgen/configs/technical_analysis.yaml +51 -0
massgen/configs/three_agents_default.yaml +31 -0
massgen/configs/travel_planning.yaml +51 -0
massgen/configs/two_agents.yaml +39 -0
massgen/frontend/__init__.py +20 -0
massgen/frontend/coordination_ui.py +945 -0
massgen/frontend/displays/__init__.py +24 -0
massgen/frontend/displays/base_display.py +83 -0
massgen/frontend/displays/rich_terminal_display.py +3497 -0
massgen/frontend/displays/simple_display.py +93 -0
massgen/frontend/displays/terminal_display.py +381 -0
massgen/frontend/logging/__init__.py +9 -0
massgen/frontend/logging/realtime_logger.py +197 -0
massgen/message_templates.py +431 -0
massgen/orchestrator.py +1222 -0
massgen/tests/__init__.py +10 -0
massgen/tests/multi_turn_conversation_design.md +214 -0
massgen/tests/multiturn_llm_input_analysis.md +189 -0
massgen/tests/test_case_studies.md +113 -0
massgen/tests/test_claude_backend.py +310 -0
massgen/tests/test_grok_backend.py +160 -0
massgen/tests/test_message_context_building.py +293 -0
massgen/tests/test_rich_terminal_display.py +378 -0
massgen/tests/test_v3_3agents.py +117 -0
massgen/tests/test_v3_simple.py +216 -0
massgen/tests/test_v3_three_agents.py +272 -0
massgen/tests/test_v3_two_agents.py +176 -0
massgen/utils.py +79 -0
massgen/v1/README.md +330 -0
massgen/v1/__init__.py +91 -0
massgen/v1/agent.py +605 -0
massgen/v1/agents.py +330 -0
massgen/v1/backends/gemini.py +584 -0
massgen/v1/backends/grok.py +410 -0
massgen/v1/backends/oai.py +571 -0
massgen/v1/cli.py +351 -0
massgen/v1/config.py +169 -0
massgen/v1/examples/fast-4o-mini-config.yaml +44 -0
massgen/v1/examples/fast_config.yaml +44 -0
massgen/v1/examples/production.yaml +70 -0
massgen/v1/examples/single_agent.yaml +39 -0
massgen/v1/logging.py +974 -0
massgen/v1/main.py +368 -0
massgen/v1/orchestrator.py +1138 -0
massgen/v1/streaming_display.py +1190 -0
massgen/v1/tools.py +160 -0
massgen/v1/types.py +245 -0
massgen/v1/utils.py +199 -0
massgen-0.0.3.dist-info/METADATA +568 -0
massgen-0.0.3.dist-info/RECORD +76 -0
massgen-0.0.3.dist-info/WHEEL +5 -0
massgen-0.0.3.dist-info/entry_points.txt +2 -0
massgen-0.0.3.dist-info/licenses/LICENSE +204 -0
massgen-0.0.3.dist-info/top_level.txt +1 -0

massgen/v1/orchestrator.py ADDED Viewed

@@ -0,0 +1,1138 @@
+import logging
+import threading
+import time
+import json
+from collections import Counter
+from datetime import datetime
+from typing import Any, Optional, Dict, List
+from concurrent.futures import ThreadPoolExecutor
+from .types import SystemState, AgentState, TaskInput, VoteRecord
+from .logging import get_log_manager
+# Set up logging
+logger = logging.getLogger(__name__)
+class MassOrchestrator:
+    """
+    Central orchestrator for managing multiple agents in the MassGen framework, and logging for all events.
+    Simplified workflow:
+    1. Agents work on task (status: "working")
+    2. When agents vote, they become "voted"
+    3. When all votable agents have voted:
+       - Check consensus
+       - If consensus reached: select representative to present final answer
+       - If no consensus: restart all agents for debate
+    4. Representative presents final answer and system completes
+    """
+    def __init__(
+        self,
+        max_duration: int = 600,
+        consensus_threshold: float = 0.0,
+        max_debate_rounds: int = 1,
+        status_check_interval: float = 2.0,
+        thread_pool_timeout: int = 5,
+        streaming_orchestrator=None,
+    ):
+        """
+        Initialize the orchestrator.
+        Args:
+            max_duration: Maximum duration for the entire task in seconds
+            consensus_threshold: Fraction of agents that must agree for consensus (1.0 = unanimous)
+            max_debate_rounds: Maximum number of debate rounds before fallback
+            status_check_interval: Interval for checking agent status (seconds)
+            thread_pool_timeout: Timeout for shutting down thread pool executor (seconds)
+            streaming_orchestrator: Optional streaming orchestrator for real-time display
+        """
+        self.agents: Dict[int, Any] = {}  # agent_id -> MassAgent instance
+        self.agent_states: Dict[int, AgentState] = {}  # agent_id -> AgentState instance
+        self.votes: List[VoteRecord] = []
+        self.system_state = SystemState()
+        self.max_duration = max_duration
+        self.consensus_threshold = consensus_threshold
+        self.max_debate_rounds = max_debate_rounds
+        self.status_check_interval = status_check_interval
+        self.thread_pool_timeout = thread_pool_timeout
+        self.streaming_orchestrator = streaming_orchestrator
+        # Simplified coordination
+        self._lock = threading.RLock()
+        self._stop_event = threading.Event()
+        # Communication and logging
+        self.communication_log: List[Dict[str, Any]] = []
+        self.final_response: Optional[str] = None
+        # Initialize log manager
+        self.log_manager = get_log_manager()
+    def register_agent(self, agent):
+        """
+        Register an agent with the orchestrator.
+        Args:
+            agent: MassAgent instance to register
+        """
+        with self._lock:
+            self.agents[agent.agent_id] = agent
+            self.agent_states[agent.agent_id] = agent.state
+            agent.orchestrator = self
+    def _log_event(self, event_type: str, data: Dict[str, Any]):
+        """Log an orchestrator event."""
+        self.communication_log.append(
+            {"timestamp": time.time(), "event_type": event_type, "data": data}
+        )
+    def update_agent_answer(self, agent_id: int, answer: str):
+        """
+        Update an agent's running answer.
+        Args:
+            agent_id: ID of the agent updating their answer
+            answer: New answer content
+        """
+        with self._lock:
+            if agent_id not in self.agent_states:
+                raise ValueError(f"Agent {agent_id} not registered")
+            old_answer_length = len(self.agent_states[agent_id].curr_answer)
+            self.agent_states[agent_id].add_update(answer)
+            preview = answer[:100] + "..." if len(answer) > 100 else answer
+            print(
+                f"📝 Agent {agent_id} answer updated ({old_answer_length} → {len(answer)} chars)"
+            )
+            print(f"   🔍 {preview}")
+            # Log to the comprehensive logging system
+            if self.log_manager:
+                self.log_manager.log_agent_answer_update(
+                    agent_id=agent_id,
+                    answer=answer,
+                    phase=self.system_state.phase,
+                    orchestrator=self,
+                )
+            self._log_event(
+                "answer_updated",
+                {"agent_id": agent_id, "answer": answer, "timestamp": time.time()},
+            )
+    def _get_current_vote_counts(self) -> Counter:
+        """
+        Get current vote counts based on agent states' vote_target.
+        Returns Counter of agent_id -> vote_count for ALL agents (0 if no votes).
+        """
+        current_votes = []
+        for agent_id, state in self.agent_states.items():
+            if state.status == "voted" and state.curr_vote is not None:
+                current_votes.append(state.curr_vote.target_id)
+        # Create counter from actual votes
+        vote_counts = Counter(current_votes)
+        # Ensure all agents are represented (0 if no votes)
+        for agent_id in self.agent_states.keys():
+            if agent_id not in vote_counts:
+                vote_counts[agent_id] = 0
+        return vote_counts
+    def _get_current_voted_agents_count(self) -> int:
+        """
+        Get count of agents who currently have status "voted".
+        """
+        return len([s for s in self.agent_states.values() if s.status == "voted"])
+    def _get_voting_status(self) -> Dict[str, Any]:
+        """Get current voting status and distribution."""
+        vote_counts = self._get_current_vote_counts()
+        total_agents = len(self.agents)
+        failed_agents = len(
+            [s for s in self.agent_states.values() if s.status == "failed"]
+        )
+        votable_agents = total_agents - failed_agents
+        voted_agents = self._get_current_voted_agents_count()
+        return {
+            "vote_distribution": dict(vote_counts),
+            "total_agents": total_agents,
+            "failed_agents": failed_agents,
+            "votable_agents": votable_agents,
+            "voted_agents": voted_agents,
+            "votes_needed_for_consensus": max(
+                1, int(votable_agents * self.consensus_threshold)
+            ),
+            "leading_agent": vote_counts.most_common(1)[0] if vote_counts else None,
+        }
+    def get_system_status(self) -> Dict[str, Any]:
+        """Get comprehensive system status information."""
+        return {
+            "phase": self.system_state.phase,
+            "consensus_reached": self.system_state.consensus_reached,
+            "agents": {
+                agent_id: {
+                    "status": state.status,
+                    "update_times": len(state.updated_answers),
+                    "chat_round": state.chat_round,
+                    "vote_target": (
+                        state.curr_vote.target_id if state.curr_vote else None
+                    ),
+                    "execution_time": state.execution_time,
+                }
+                for agent_id, state in self.agent_states.items()
+            },
+            "voting_status": self._get_voting_status(),
+            "runtime": (
+                (time.time() - self.system_state.start_time)
+                if self.system_state.start_time
+                else 0
+            ),
+        }
+    def cast_vote(self, voter_id: int, target_id: int, reason: str = ""):
+        """
+        Record a vote from one agent for another agent's solution.
+        Args:
+            voter_id: ID of the agent casting the vote
+            target_id: ID of the agent being voted for
+            reason: The reason for the vote (optional)
+        """
+        with self._lock:
+            logger.info(f"🗳️ VOTING: Agent {voter_id} casting vote")
+            print(
+                f"🗳️  VOTE: Agent {voter_id} → Agent {target_id} ({self.system_state.phase})"
+            )
+            if reason:
+                print(f"   📝 Voting reason: {len(reason)} chars")
+            if voter_id not in self.agent_states:
+                logger.error(f"   ❌ Invalid voter: Agent {voter_id} not registered")
+                raise ValueError(f"Voter agent {voter_id} not registered")
+            if target_id not in self.agent_states:
+                logger.error(f"   ❌ Invalid target: Agent {target_id} not registered")
+                raise ValueError(f"Target agent {target_id} not registered")
+            # Check current vote status
+            previous_vote = self.agent_states[voter_id].curr_vote
+            # Log vote change type
+            if previous_vote:
+                logger.info(
+                    f"   🔄 Agent {voter_id} changed vote from Agent {previous_vote.target_id} to Agent {target_id}"
+                )
+            else:
+                logger.info(f"   ✨ Agent {voter_id} new vote for Agent {target_id}")
+            # Add vote record to permanent history (only for actual changes)
+            vote = VoteRecord(
+                voter_id=voter_id,
+                target_id=target_id,
+                reason=reason,
+                timestamp=time.time(),
+            )
+            # record the vote in the system's vote history
+            self.votes.append(vote)
+            # Update agent state
+            old_status = self.agent_states[voter_id].status
+            self.agent_states[voter_id].status = "voted"
+            self.agent_states[voter_id].curr_vote = vote
+            self.agent_states[voter_id].cast_votes.append(vote)
+            self.agent_states[voter_id].execution_end_time = time.time()
+            # Update streaming display
+            if self.streaming_orchestrator:
+                self.streaming_orchestrator.update_agent_status(voter_id, "voted")
+                self.streaming_orchestrator.update_agent_vote_target(
+                    voter_id, target_id
+                )
+                # Update agent update count
+                update_count = len(self.agent_states[voter_id].updated_answers)
+                self.streaming_orchestrator.update_agent_update_count(
+                    voter_id, update_count
+                )
+                # Update vote cast counts for all agents
+                for agent_id, agent_state in self.agent_states.items():
+                    vote_cast_count = len(agent_state.cast_votes)
+                    self.streaming_orchestrator.update_agent_votes_cast(
+                        agent_id, vote_cast_count
+                    )
+                vote_counts = self._get_current_vote_counts()
+                self.streaming_orchestrator.update_vote_distribution(dict(vote_counts))
+                vote_msg = f"👍 Agent {voter_id} voted for Agent {target_id}"
+                self.streaming_orchestrator.add_system_message(vote_msg)
+            # Log to the comprehensive logging system
+            if self.log_manager:
+                self.log_manager.log_voting_event(
+                    voter_id=voter_id,
+                    target_id=target_id,
+                    phase=self.system_state.phase,
+                    reason=reason,
+                    orchestrator=self,
+                )
+                self.log_manager.log_agent_status_change(
+                    agent_id=voter_id,
+                    old_status=old_status,
+                    new_status="voted",
+                    phase=self.system_state.phase,
+                )
+            # Show current vote distribution
+            vote_counts = self._get_current_vote_counts()
+            voted_agents_count = self._get_current_voted_agents_count()
+            logger.info(f"   📊 Vote distribution: {dict(vote_counts)}")
+            logger.info(
+                f"   📈 Voting progress: {voted_agents_count}/{len(self.agent_states)} agents voted"
+            )
+            # Calculate consensus requirements
+            total_agents = len(self.agent_states)
+            votes_needed = max(1, int(total_agents * self.consensus_threshold))
+            if vote_counts:
+                leading_agent, leading_votes = vote_counts.most_common(1)[0]
+                logger.info(
+                    f"   🏆 Leading: Agent {leading_agent} with {leading_votes} votes (need {votes_needed} for consensus)"
+                )
+            # Log event for internal tracking
+            self._log_event(
+                "vote_cast",
+                {
+                    "voter_id": voter_id,
+                    "target_id": target_id,
+                    "timestamp": vote.timestamp,
+                    "vote_distribution": dict(vote_counts),
+                    "total_votes": voted_agents_count,
+                },
+            )
+    def notify_answer_update(self, agent_id: int, answer: str):
+        """
+        Called when an agent updates their answer.
+        This should restart all voted agents who haven't seen this update yet.
+        """
+        logger.info(f"📢 Agent {agent_id} updated answer")
+        # Update the answer in agent state
+        self.update_agent_answer(agent_id, answer)
+        # Update streaming display
+        if self.streaming_orchestrator:
+            answer_msg = f"📝 Agent {agent_id} updated answer ({len(answer)} chars)"
+            self.streaming_orchestrator.add_system_message(answer_msg)
+            # Update agent update count
+            update_count = len(self.agent_states[agent_id].updated_answers)
+            self.streaming_orchestrator.update_agent_update_count(
+                agent_id, update_count
+            )
+        # CRITICAL FIX: Restart voted agents when any agent shares new updates
+        with self._lock:
+            restarted_agents = []
+            current_time = time.time()
+            for other_agent_id, state in self.agent_states.items():
+                if other_agent_id != agent_id and state.status == "voted":
+                    # Restart the voted agent
+                    state.status = "working"
+                    # This vote should be cleared as answers have been updated
+                    state.curr_vote = None
+                    state.execution_start_time = time.time()
+                    restarted_agents.append(other_agent_id)
+                    logger.info(
+                        f"🔄 Agent {other_agent_id} restarted due to update from Agent {agent_id}"
+                    )
+                    # Update streaming display
+                    if self.streaming_orchestrator:
+                        self.streaming_orchestrator.update_agent_status(
+                            other_agent_id, "working"
+                        )
+                        self.streaming_orchestrator.update_agent_vote_target(
+                            other_agent_id, None
+                        )  # Clear vote target in display
+                        # Update agent update count for restarted agent
+                        update_count = len(
+                            self.agent_states[other_agent_id].updated_answers
+                        )
+                        self.streaming_orchestrator.update_agent_update_count(
+                            other_agent_id, update_count
+                        )
+                        restart_msg = (
+                            f"🔄 Agent {other_agent_id} restarted due to new update"
+                        )
+                        self.streaming_orchestrator.add_system_message(restart_msg)
+                    # Log agent restart
+                    if self.log_manager:
+                        self.log_manager.log_agent_restart(
+                            agent_id=other_agent_id,
+                            reason=f"new_update_from_agent_{agent_id}",
+                            phase=self.system_state.phase,
+                        )
+            if restarted_agents:
+                # Note: We don't remove historical votes as self.votes is a permanent record
+                # The current vote distribution will automatically reflect the change via agent.vote_target = None
+                logger.info(f"🔄 Restarted agents: {restarted_agents}")
+                # Update vote distribution in streaming display
+                if self.streaming_orchestrator:
+                    vote_counts = self._get_current_vote_counts()
+                    self.streaming_orchestrator.update_vote_distribution(
+                        dict(vote_counts)
+                    )
+                    # Update vote cast counts for all agents to ensure accuracy
+                    for agent_id, agent_state in self.agent_states.items():
+                        vote_cast_count = len(agent_state.cast_votes)
+                        self.streaming_orchestrator.update_agent_votes_cast(
+                            agent_id, vote_cast_count
+                        )
+            return restarted_agents
+    def _check_consensus(self) -> bool:
+        """
+        Check if consensus has been reached based on current votes.
+        Improved to handle edge cases and ensure proper consensus calculation.
+        """
+        with self._lock:
+            total_agents = len(self.agents)
+            failed_agents_count = len(
+                [s for s in self.agent_states.values() if s.status == "failed"]
+            )
+            votable_agents_count = total_agents - failed_agents_count
+            # Edge case: no votable agents
+            if votable_agents_count == 0:
+                logger.warning("⚠️ No votable agents available for consensus")
+                return False
+            # Edge case: only one votable agent
+            if votable_agents_count == 1:
+                working_agents = [
+                    aid
+                    for aid, state in self.agent_states.items()
+                    if state.status == "working"
+                ]
+                if not working_agents:  # The single agent has voted
+                    # Find the single votable agent
+                    votable_agent = [
+                        aid
+                        for aid, state in self.agent_states.items()
+                        if state.status != "failed"
+                    ][0]
+                    logger.info(f"🎯 Single agent consensus: Agent {votable_agent}")
+                    self._reach_consensus(votable_agent)
+                    return True
+                return False
+            vote_counts = self._get_current_vote_counts()
+            votes_needed = max(1, int(votable_agents_count * self.consensus_threshold))
+            if vote_counts and vote_counts.most_common(1)[0][1] >= votes_needed:
+                winning_agent_id = vote_counts.most_common(1)[0][0]
+                winning_votes = vote_counts.most_common(1)[0][1]
+                # Ensure the winning agent is still votable (not failed)
+                if self.agent_states[winning_agent_id].status == "failed":
+                    logger.warning(
+                        f"⚠️ Winning agent {winning_agent_id} has failed - recalculating"
+                    )
+                    return False
+                logger.info(
+                    f"✅ Consensus reached: Agent {winning_agent_id} with {winning_votes}/{votable_agents_count} votes"
+                )
+                self._reach_consensus(winning_agent_id)
+                return True
+            return False
+    def mark_agent_failed(self, agent_id: int, reason: str = ""):
+        """
+        Mark an agent as failed.
+        Args:
+            agent_id: ID of the agent to mark as failed
+            reason: Optional reason for the failure
+        """
+        with self._lock:
+            logger.info(f"💥 AGENT FAILURE: Agent {agent_id} marked as failed")
+            print(f"      💥 MARK_FAILED: Agent {agent_id}")
+            print(f"      📊 Current phase: {self.system_state.phase}")
+            if agent_id not in self.agent_states:
+                logger.error(f"   ❌ Invalid agent: Agent {agent_id} not registered")
+                raise ValueError(f"Agent {agent_id} not registered")
+            # Update agent state
+            old_status = self.agent_states[agent_id].status
+            self.agent_states[agent_id].status = "failed"
+            self.agent_states[agent_id].execution_end_time = time.time()
+            # Update streaming display
+            if self.streaming_orchestrator:
+                self.streaming_orchestrator.update_agent_status(agent_id, "failed")
+                failure_msg = (
+                    f"💥 Agent {agent_id} failed: {reason}"
+                    if reason
+                    else f"💥 Agent {agent_id} failed"
+                )
+                self.streaming_orchestrator.add_system_message(failure_msg)
+            # Log to the comprehensive logging system
+            if self.log_manager:
+                self.log_manager.log_agent_status_change(
+                    agent_id=agent_id,
+                    old_status=old_status,
+                    new_status="failed",
+                    phase=self.system_state.phase,
+                )
+            # Log the failure event
+            self._log_event(
+                "agent_failed",
+                {
+                    "agent_id": agent_id,
+                    "reason": reason,
+                    "timestamp": time.time(),
+                    "old_status": old_status,
+                },
+            )
+            # Show current agent status distribution
+            status_counts = Counter(
+                state.status for state in self.agent_states.values()
+            )
+            logger.info(f"   📊 Status distribution: {dict(status_counts)}")
+            logger.info(
+                f"   📈 Failed agents: {status_counts.get('failed', 0)}/{len(self.agent_states)} total"
+            )
+    def _reach_consensus(self, winning_agent_id: int):
+        """Mark consensus as reached and finalize the system."""
+        old_phase = self.system_state.phase
+        self.system_state.consensus_reached = True
+        self.system_state.representative_agent_id = winning_agent_id
+        self.system_state.phase = "consensus"
+        # Update streaming orchestrator if available
+        if self.streaming_orchestrator:
+            vote_distribution = dict(self._get_current_vote_counts())
+            self.streaming_orchestrator.update_consensus_status(
+                winning_agent_id, vote_distribution
+            )
+            self.streaming_orchestrator.update_phase(old_phase, "consensus")
+        # Log to the comprehensive logging system
+        if self.log_manager:
+            vote_distribution = dict(self._get_current_vote_counts())
+            self.log_manager.log_consensus_reached(
+                winning_agent_id=winning_agent_id,
+                vote_distribution=vote_distribution,
+                is_fallback=False,
+                phase=self.system_state.phase,
+            )
+            self.log_manager.log_phase_transition(
+                old_phase=old_phase,
+                new_phase="consensus",
+                additional_data={
+                    "consensus_reached": True,
+                    "winning_agent_id": winning_agent_id,
+                    "is_fallback": False,
+                },
+            )
+        self._log_event(
+            "consensus_reached",
+            {
+                "winning_agent_id": winning_agent_id,
+                "fallback_to_majority": False,
+                "final_vote_distribution": dict(self._get_current_vote_counts()),
+            },
+        )
+    def export_detailed_session_log(self) -> Dict[str, Any]:
+        """
+        Export complete detailed session information for comprehensive analysis.
+        Includes all outputs, metrics, and evaluation results.
+        """
+        session_log = {
+            "session_metadata": {
+                "session_id": (
+                    f"mass_session_{int(self.system_state.start_time)}"
+                    if self.system_state.start_time
+                    else None
+                ),
+                "start_time": self.system_state.start_time,
+                "end_time": self.system_state.end_time,
+                "total_duration": (
+                    (self.system_state.end_time - self.system_state.start_time)
+                    if self.system_state.start_time and self.system_state.end_time
+                    else None
+                ),
+                "timestamp": datetime.now().isoformat(),
+                "system_version": "MassGen v1.0",
+            },
+            "task_information": {
+                "question": (
+                    self.system_state.task.question if self.system_state.task else None
+                ),
+                "task_id": (
+                    self.system_state.task.task_id if self.system_state.task else None
+                ),
+                "context": (
+                    self.system_state.task.context if self.system_state.task else None
+                ),
+            },
+            "system_configuration": {
+                "max_duration": self.max_duration,
+                "consensus_threshold": self.consensus_threshold,
+                "max_debate_rounds": self.max_debate_rounds,
+                "agents": [agent.model for agent in self.agents.values()],
+            },
+            "agent_details": {
+                agent_id: {
+                    "status": state.status,
+                    "updates_count": len(state.updated_answers),
+                    "chat_length": len(state.chat_history),
+                    "chat_round": state.chat_round,
+                    "vote_target": (
+                        state.curr_vote.target_id if state.curr_vote else None
+                    ),
+                    "execution_time": state.execution_time,
+                    "execution_start_time": state.execution_start_time,
+                    "execution_end_time": state.execution_end_time,
+                    "updated_answers": [
+                        {
+                            "timestamp": update.timestamp,
+                            "status": update.status,
+                            "answer_length": len(update.answer),
+                        }
+                        for update in state.updated_answers
+                    ],
+                }
+                for agent_id, state in self.agent_states.items()
+            },
+            "voting_analysis": {
+                "vote_records": [
+                    {
+                        "voter_id": vote.voter_id,
+                        "target_id": vote.target_id,
+                        "timestamp": vote.timestamp,
+                        "reason_length": len(vote.reason) if vote.reason else 0,
+                    }
+                    for vote in self.votes
+                ],
+                "vote_timeline": [
+                    {
+                        "timestamp": vote.timestamp,
+                        "event": f"Agent {vote.voter_id} → Agent {vote.target_id}",
+                    }
+                    for vote in self.votes
+                ],
+            },
+            "communication_log": self.communication_log,
+            "system_events": [
+                {
+                    "timestamp": entry["timestamp"],
+                    "event_type": entry["event_type"],
+                    "data_summary": {
+                        k: (len(v) if isinstance(v, (str, list, dict)) else v)
+                        for k, v in entry["data"].items()
+                    },
+                }
+                for entry in self.communication_log
+            ],
+        }
+        return session_log
+    def start_task(self, task: TaskInput):
+        """
+        Initialize the system for a new task and run the main workflow.
+        Args:
+            task: TaskInput containing the problem to solve
+        Returns:
+            response: Dict[str, Any] containing the final answer to the task's question, and relevant information
+        """
+        with self._lock:
+            logger.info("🎯 ORCHESTRATOR: Starting new task")
+            logger.info(f"   Task ID: {task.task_id}")
+            logger.info(f"   Question preview: {task.question}")
+            logger.info(f"   Registered agents: {list(self.agents.keys())}")
+            logger.info(f"   Max duration: {self.max_duration}")
+            logger.info(f"   Consensus threshold: {self.consensus_threshold}")
+            self.system_state.task = task
+            self.system_state.start_time = time.time()
+            self.system_state.phase = "collaboration"
+            self.final_response = None
+            # Reset all agent states
+            for agent_id, agent in self.agents.items():
+                agent.state = AgentState(agent_id=agent_id)
+                self.agent_states[agent_id] = agent.state
+                # Initialize the saved chat
+                agent.state.chat_history = []
+                # Initialize streaming display for each agent
+                if self.streaming_orchestrator:
+                    self.streaming_orchestrator.set_agent_model(agent_id, agent.model)
+                    self.streaming_orchestrator.update_agent_status(agent_id, "working")
+                    # Initialize agent update count
+                    self.streaming_orchestrator.update_agent_update_count(agent_id, 0)
+            # Clear previous session data
+            self.votes.clear()
+            self.communication_log.clear()
+            # Initialize streaming display system message
+            if self.streaming_orchestrator:
+                self.streaming_orchestrator.update_phase("unknown", "collaboration")
+                # Initialize debate rounds to 0
+                self.streaming_orchestrator.update_debate_rounds(0)
+                init_msg = f"🚀 Starting MassGen task with {len(self.agents)} agents"
+                self.streaming_orchestrator.add_system_message(init_msg)
+            self._log_event(
+                "task_started", {"task_id": task.task_id, "question": task.question}
+            )
+            logger.info("✅ Task initialization completed successfully")
+        # Run the workflow
+        return self._run_mass_workflow(task)
+    def _run_mass_workflow(self, task: TaskInput) -> Dict[str, Any]:
+        """
+        Run the MassGen workflow with dynamic agent restart support:
+        1. All agents work in parallel
+        2. Agents restart when others share updates (if they had voted)
+        3. When all have voted, check consensus
+        4. If no consensus, restart all for debate
+        5. If consensus, representative presents final answer
+        """
+        logger.info("🚀 Starting MassGen workflow")
+        debate_rounds = 0
+        start_time = time.time()
+        while not self._stop_event.is_set():
+            # Check timeout
+            if time.time() - start_time > self.max_duration:
+                logger.warning("⏰ Maximum duration reached - forcing consensus")
+                self._force_consensus_by_timeout()
+                # Representative will present final answer
+                self._present_final_answer(task)
+                break
+            # Run all agents with dynamic restart support
+            # Restart all agents if they have been updated
+            logger.info(f"📢 Starting collaboration round {debate_rounds + 1}")
+            self._run_all_agents_with_dynamic_restart(task)
+            # Check if all votable agents have voted
+            if self._all_agents_voted():
+                logger.info("🗳️ All agents have voted - checking consensus")
+                if self._check_consensus():
+                    logger.info("🎉 Consensus reached!")
+                    # Representative will present final answer
+                    self._present_final_answer(task)
+                    break
+                else:
+                    # No consensus - start debate round
+                    debate_rounds += 1
+                    # Update streaming display with new debate round count
+                    if self.streaming_orchestrator:
+                        self.streaming_orchestrator.update_debate_rounds(debate_rounds)
+                    if debate_rounds > self.max_debate_rounds:
+                        logger.warning(
+                            f"⚠️ Maximum debate rounds ({self.max_debate_rounds}) reached"
+                        )
+                        self._force_consensus_by_timeout()
+                        # Representative will present final answer
+                        self._present_final_answer(task)
+                        break
+                    logger.info(
+                        f"🗣️ No consensus - starting debate round {debate_rounds}"
+                    )
+                    # Add debate instruction to the chat history and will be restarted in the next round
+                    self._restart_all_agents_for_debate()
+            else:
+                # Still waiting for some agents to vote
+                time.sleep(self.status_check_interval)
+        return self._finalize_session()
+    def _run_all_agents_with_dynamic_restart(self, task: TaskInput):
+        """
+        Run all agents in parallel with support for dynamic restarts.
+        This approach handles agents restarting mid-execution.
+        """
+        active_futures = {}
+        executor = ThreadPoolExecutor(max_workers=len(self.agents))
+        try:
+            # Start all working agents
+            for agent_id in self.agents.keys():
+                if self.agent_states[agent_id].status not in ["failed"]:
+                    self._start_agent_if_working(
+                        agent_id, task, executor, active_futures
+                    )
+            # Monitor agents and handle restarts
+            while active_futures and not self._all_agents_voted():
+                completed_futures = []
+                # Check for completed agents
+                for agent_id, future in list(active_futures.items()):
+                    if future.done():
+                        completed_futures.append(agent_id)
+                        try:
+                            future.result()  # Get result and handle exceptions
+                        except Exception as e:
+                            logger.error(f"❌ Agent {agent_id} failed: {e}")
+                            self.mark_agent_failed(agent_id, str(e))
+                # Remove completed futures
+                for agent_id in completed_futures:
+                    del active_futures[agent_id]
+                # Check for agents that need to restart (status changed back to "working")
+                for agent_id in self.agents.keys():
+                    if (
+                        agent_id not in active_futures
+                        and self.agent_states[agent_id].status == "working"
+                    ):
+                        self._start_agent_if_working(
+                            agent_id, task, executor, active_futures
+                        )
+                time.sleep(0.1)  # Small delay to prevent busy waiting
+        finally:
+            # Cancel any remaining futures
+            for future in active_futures.values():
+                future.cancel()
+            executor.shutdown(wait=True)
+    def _start_agent_if_working(
+        self,
+        agent_id: int,
+        task: TaskInput,
+        executor: ThreadPoolExecutor,
+        active_futures: Dict,
+    ):
+        """Start an agent if it's in working status and not already running."""
+        if (
+            self.agent_states[agent_id].status == "working"
+            and agent_id not in active_futures
+        ):
+            self.agent_states[agent_id].execution_start_time = time.time()
+            future = executor.submit(self._run_single_agent, agent_id, task)
+            active_futures[agent_id] = future
+            logger.info(f"🤖 Agent {agent_id} started/restarted")
+    def _run_single_agent(self, agent_id: int, task: TaskInput):
+        """Run a single agent's work_on_task method."""
+        agent = self.agents[agent_id]
+        try:
+            logger.info(f"🤖 Agent {agent_id} starting work")
+            # Run agent's work_on_task with current conversation state
+            updated_messages = agent.work_on_task(task)
+            # Update conversation state
+            self.agent_states[agent_id].chat_history.append(updated_messages)
+            self.agent_states[agent_id].chat_round = agent.state.chat_round
+            # Update streaming display with chat round
+            if self.streaming_orchestrator:
+                self.streaming_orchestrator.update_agent_chat_round(
+                    agent_id, agent.state.chat_round
+                )
+                # Update agent update count
+                update_count = len(self.agent_states[agent_id].updated_answers)
+                self.streaming_orchestrator.update_agent_update_count(
+                    agent_id, update_count
+                )
+            logger.info(
+                f"✅ Agent {agent_id} completed work with status: {self.agent_states[agent_id].status}"
+            )
+        except Exception as e:
+            logger.error(f"❌ Agent {agent_id} failed: {e}")
+            self.mark_agent_failed(agent_id, str(e))
+    def _all_agents_voted(self) -> bool:
+        """Check if all votable agents have voted."""
+        votable_agents = [
+            aid
+            for aid, state in self.agent_states.items()
+            if state.status not in ["failed"]
+        ]
+        voted_agents = [
+            aid for aid, state in self.agent_states.items() if state.status == "voted"
+        ]
+        return len(voted_agents) == len(votable_agents) and len(votable_agents) > 0
+    def _restart_all_agents_for_debate(self):
+        """
+        Restart all agents for debate by resetting their status
+        We don't clear vote target when restarting for debate as answers are not updated
+        """
+        logger.info("🔄 Restarting all agents for debate")
+        with self._lock:
+            # Update streaming display
+            if self.streaming_orchestrator:
+                self.streaming_orchestrator.reset_consensus()
+                self.streaming_orchestrator.update_phase(
+                    self.system_state.phase, "collaboration"
+                )
+                self.streaming_orchestrator.add_system_message(
+                    "🗣️ Starting debate phase - no consensus reached"
+                )
+            # Log debate start
+            if self.log_manager:
+                self.log_manager.log_debate_started(phase="collaboration")
+                self.log_manager.log_phase_transition(
+                    old_phase=self.system_state.phase,
+                    new_phase="collaboration",
+                    additional_data={
+                        "reason": "no_consensus_reached",
+                        "debate_round": True,
+                    },
+                )
+            # Reset agent statuses and add debate instruction to conversation
+            # Note: We don't clear self.votes as it's a historical record
+            for agent_id, state in self.agent_states.items():
+                if state.status not in ["failed"]:
+                    old_status = state.status
+                    state.status = "working"
+                    # We don't clear vote target when restarting for debate
+                    # state.curr_vote = None
+                    # Update streaming display for each agent
+                    if self.streaming_orchestrator:
+                        self.streaming_orchestrator.update_agent_status(
+                            agent_id, "working"
+                        )
+                    # Log agent restart
+                    if self.log_manager:
+                        self.log_manager.log_agent_restart(
+                            agent_id=agent_id,
+                            reason="debate_phase_restart",
+                            phase="collaboration",
+                        )
+            # Update system phase
+            self.system_state.phase = "collaboration"
+    def _present_final_answer(self, task: TaskInput):
+        """
+        Run the final presentation by the representative agent.
+        """
+        representative_id = self.system_state.representative_agent_id
+        if not representative_id:
+            logger.error("No representative agent selected")
+            return
+        logger.info(f"🎯 Agent {representative_id} presenting final answer")
+        try:
+            representative_agent = self.agents[representative_id]
+            # if self.final_response:
+            #     logger.info(f"✅ Final response already exists")
+            #     return
+            # if representative_agent.state.curr_answer:
+            #     self.final_response = representative_agent.state.curr_answer
+            # else:
+            # Run one more inference to generate the final answer
+            _, user_input = representative_agent._get_task_input(task)
+            messages = [
+                {
+                    "role": "system",
+                    "content": """
+You are given a task and multiple agents' answers and their votes.
+Please incorporate these information and provide a final BEST answer to the original message.
+""",
+                },
+                {
+                    "role": "user",
+                    "content": user_input
+                    + """
+Please provide the final BEST answer to the original message by incorporating these information.
+The final answer must be self-contained, complete, well-sourced, compelling, and ready to serve as the definitive final response.
+""",
+                },
+            ]
+            result = representative_agent.process_message(messages)
+            self.final_response = result.text
+            # Mark
+            self.system_state.phase = "completed"
+            self.system_state.end_time = time.time()
+            logger.info(f"✅ Final presentation completed by Agent {representative_id}")
+        except Exception as e:
+            logger.error(f"❌ Final presentation failed: {e}")
+            self.final_response = f"Error in final presentation: {str(e)}"
+    def _force_consensus_by_timeout(self):
+        """
+        Force consensus selection when maximum duration is reached.
+        """
+        logger.warning("⏰ Forcing consensus due to timeout")
+        with self._lock:
+            # Find agent with most votes, or earliest voter in case of tie
+            vote_counts = self._get_current_vote_counts()
+            if vote_counts:
+                # Select agent with most votes
+                winning_agent_id = vote_counts.most_common(1)[0][0]
+                logger.info(
+                    f"   Selected Agent {winning_agent_id} with {vote_counts[winning_agent_id]} votes"
+                )
+            else:
+                # No votes - select first working agent
+                working_agents = [
+                    aid
+                    for aid, state in self.agent_states.items()
+                    if state.status == "working"
+                ]
+                winning_agent_id = (
+                    working_agents[0] if working_agents else list(self.agents.keys())[0]
+                )
+                logger.info(
+                    f"   No votes - selected Agent {winning_agent_id} as fallback"
+                )
+            self._reach_consensus(winning_agent_id)
+    def _finalize_session(self) -> Dict[str, Any]:
+        """
+        Finalize the session and return comprehensive results.
+        """
+        logger.info("🏁 Finalizing session")
+        with self._lock:
+            if not self.system_state.end_time:
+                self.system_state.end_time = time.time()
+            session_duration = (
+                self.system_state.end_time - self.system_state.start_time
+                if self.system_state.start_time
+                else 0
+            )
+            # Save final agent states to files
+            if self.log_manager:
+                self.log_manager.save_agent_states(self)
+                self.log_manager.log_task_completion(
+                    {
+                        "final_answer": self.final_response,
+                        "consensus_reached": self.system_state.consensus_reached,
+                        "representative_agent_id": self.system_state.representative_agent_id,
+                        "session_duration": session_duration,
+                    }
+                )
+            # Prepare clean, user-facing result
+            result = {
+                "answer": self.final_response or "No final answer generated",
+                "consensus_reached": self.system_state.consensus_reached,
+                "representative_agent_id": self.system_state.representative_agent_id,
+                "session_duration": session_duration,
+                "summary": {
+                    "total_agents": len(self.agents),
+                    "failed_agents": len(
+                        [s for s in self.agent_states.values() if s.status == "failed"]
+                    ),
+                    "total_votes": len(self.votes),
+                    "final_vote_distribution": dict(self._get_current_vote_counts()),
+                },
+                "system_logs": self.export_detailed_session_log(),
+            }
+            # Save result to result.json in the session directory
+            if self.log_manager and not self.log_manager.non_blocking:
+                try:
+                    result_file = self.log_manager.session_dir / "result.json"
+                    with open(result_file, "w", encoding="utf-8") as f:
+                        json.dump(result, f, indent=2, ensure_ascii=False, default=str)
+                    logger.info(f"💾 Result saved to {result_file}")
+                except Exception as e:
+                    logger.warning(f"⚠️ Failed to save result.json: {e}")
+            logger.info(f"✅ Session completed in {session_duration:.2f} seconds")
+            logger.info(f"   Consensus: {result['consensus_reached']}")
+            logger.info(f"   Representative: Agent {result['representative_agent_id']}")
+            return result
+    def cleanup(self):
+        """
+        Clean up resources and stop all agents.
+        """
+        logger.info("🧹 Cleaning up orchestrator resources")
+        self._stop_event.set()
+        # Save final agent states before cleanup
+        if self.log_manager and self.agent_states:
+            try:
+                self.log_manager.save_agent_states(self)
+                logger.info("✅ Final agent states saved")
+            except Exception as e:
+                logger.warning(f"⚠️ Error saving final agent states: {e}")
+        # Clean up logging manager
+        if self.log_manager:
+            try:
+                self.log_manager.cleanup()
+                logger.info("✅ Log manager cleaned up")
+            except Exception as e:
+                logger.warning(f"⚠️ Error cleaning up log manager: {e}")
+        # Clean up streaming orchestrator if it exists
+        if self.streaming_orchestrator:
+            try:
+                self.streaming_orchestrator.cleanup()
+                logger.info("✅ Streaming orchestrator cleaned up")
+            except Exception as e:
+                logger.warning(f"⚠️ Error cleaning up streaming orchestrator: {e}")
+        # No longer using _agent_threads since we use ThreadPoolExecutor in workflow methods
+        # The executor is properly shut down in _run_all_agents_with_dynamic_restart
+        logger.info("✅ Orchestrator cleanup completed")