massgen 0.1.3__py3-none-any.whl → 0.1.5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- massgen/__init__.py +1 -1
- massgen/api_params_handler/_chat_completions_api_params_handler.py +4 -0
- massgen/api_params_handler/_claude_api_params_handler.py +4 -0
- massgen/api_params_handler/_gemini_api_params_handler.py +4 -0
- massgen/api_params_handler/_response_api_params_handler.py +4 -0
- massgen/backend/base_with_custom_tool_and_mcp.py +25 -5
- massgen/backend/docs/permissions_and_context_files.md +2 -2
- massgen/backend/response.py +2 -0
- massgen/chat_agent.py +340 -20
- massgen/cli.py +326 -19
- massgen/configs/README.md +92 -41
- massgen/configs/memory/gpt5mini_gemini_baseline_research_to_implementation.yaml +94 -0
- massgen/configs/memory/gpt5mini_gemini_context_window_management.yaml +187 -0
- massgen/configs/memory/gpt5mini_gemini_research_to_implementation.yaml +127 -0
- massgen/configs/memory/gpt5mini_high_reasoning_gemini.yaml +107 -0
- massgen/configs/memory/single_agent_compression_test.yaml +64 -0
- massgen/configs/tools/custom_tools/crawl4ai_example.yaml +55 -0
- massgen/configs/tools/custom_tools/multimodal_tools/text_to_file_generation_multi.yaml +61 -0
- massgen/configs/tools/custom_tools/multimodal_tools/text_to_file_generation_single.yaml +29 -0
- massgen/configs/tools/custom_tools/multimodal_tools/text_to_image_generation_multi.yaml +51 -0
- massgen/configs/tools/custom_tools/multimodal_tools/text_to_image_generation_single.yaml +33 -0
- massgen/configs/tools/custom_tools/multimodal_tools/text_to_speech_generation_multi.yaml +55 -0
- massgen/configs/tools/custom_tools/multimodal_tools/text_to_speech_generation_single.yaml +33 -0
- massgen/configs/tools/custom_tools/multimodal_tools/text_to_video_generation_multi.yaml +47 -0
- massgen/configs/tools/custom_tools/multimodal_tools/text_to_video_generation_single.yaml +29 -0
- massgen/configs/tools/custom_tools/multimodal_tools/understand_audio.yaml +1 -1
- massgen/configs/tools/custom_tools/multimodal_tools/understand_file.yaml +1 -1
- massgen/configs/tools/custom_tools/multimodal_tools/understand_image.yaml +1 -1
- massgen/configs/tools/custom_tools/multimodal_tools/understand_video.yaml +1 -1
- massgen/configs/tools/custom_tools/multimodal_tools/youtube_video_analysis.yaml +1 -1
- massgen/filesystem_manager/_filesystem_manager.py +1 -0
- massgen/filesystem_manager/_path_permission_manager.py +148 -0
- massgen/memory/README.md +277 -0
- massgen/memory/__init__.py +26 -0
- massgen/memory/_base.py +193 -0
- massgen/memory/_compression.py +237 -0
- massgen/memory/_context_monitor.py +211 -0
- massgen/memory/_conversation.py +255 -0
- massgen/memory/_fact_extraction_prompts.py +333 -0
- massgen/memory/_mem0_adapters.py +257 -0
- massgen/memory/_persistent.py +687 -0
- massgen/memory/docker-compose.qdrant.yml +36 -0
- massgen/memory/docs/DESIGN.md +388 -0
- massgen/memory/docs/QUICKSTART.md +409 -0
- massgen/memory/docs/SUMMARY.md +319 -0
- massgen/memory/docs/agent_use_memory.md +408 -0
- massgen/memory/docs/orchestrator_use_memory.md +586 -0
- massgen/memory/examples.py +237 -0
- massgen/message_templates.py +160 -12
- massgen/orchestrator.py +223 -7
- massgen/tests/memory/test_agent_compression.py +174 -0
- massgen/{configs/tools → tests}/memory/test_context_window_management.py +30 -30
- massgen/tests/memory/test_force_compression.py +154 -0
- massgen/tests/memory/test_simple_compression.py +147 -0
- massgen/tests/test_agent_memory.py +534 -0
- massgen/tests/test_binary_file_blocking.py +274 -0
- massgen/tests/test_case_studies.md +12 -12
- massgen/tests/test_conversation_memory.py +382 -0
- massgen/tests/test_multimodal_size_limits.py +407 -0
- massgen/tests/test_orchestrator_memory.py +620 -0
- massgen/tests/test_persistent_memory.py +435 -0
- massgen/token_manager/token_manager.py +6 -0
- massgen/tool/_manager.py +7 -2
- massgen/tool/_multimodal_tools/image_to_image_generation.py +293 -0
- massgen/tool/_multimodal_tools/text_to_file_generation.py +455 -0
- massgen/tool/_multimodal_tools/text_to_image_generation.py +222 -0
- massgen/tool/_multimodal_tools/text_to_speech_continue_generation.py +226 -0
- massgen/tool/_multimodal_tools/text_to_speech_transcription_generation.py +217 -0
- massgen/tool/_multimodal_tools/text_to_video_generation.py +223 -0
- massgen/tool/_multimodal_tools/understand_audio.py +19 -1
- massgen/tool/_multimodal_tools/understand_file.py +6 -1
- massgen/tool/_multimodal_tools/understand_image.py +112 -8
- massgen/tool/_multimodal_tools/understand_video.py +32 -5
- massgen/tool/_web_tools/crawl4ai_tool.py +718 -0
- massgen/tool/docs/multimodal_tools.md +589 -0
- massgen/tools/__init__.py +8 -0
- massgen/tools/_planning_mcp_server.py +520 -0
- massgen/tools/planning_dataclasses.py +434 -0
- {massgen-0.1.3.dist-info → massgen-0.1.5.dist-info}/METADATA +142 -82
- {massgen-0.1.3.dist-info → massgen-0.1.5.dist-info}/RECORD +84 -41
- massgen/configs/tools/custom_tools/crawl4ai_mcp_example.yaml +0 -67
- massgen/configs/tools/custom_tools/crawl4ai_multi_agent_example.yaml +0 -68
- massgen/configs/tools/memory/README.md +0 -199
- massgen/configs/tools/memory/gpt5mini_gemini_context_window_management.yaml +0 -131
- massgen/configs/tools/memory/gpt5mini_gemini_no_persistent_memory.yaml +0 -133
- massgen/configs/tools/multimodal/gpt5mini_gpt5nano_documentation_evolution.yaml +0 -97
- {massgen-0.1.3.dist-info → massgen-0.1.5.dist-info}/WHEEL +0 -0
- {massgen-0.1.3.dist-info → massgen-0.1.5.dist-info}/entry_points.txt +0 -0
- {massgen-0.1.3.dist-info → massgen-0.1.5.dist-info}/licenses/LICENSE +0 -0
- {massgen-0.1.3.dist-info → massgen-0.1.5.dist-info}/top_level.txt +0 -0
massgen/__init__.py
CHANGED

massgen/api_params_handler/_chat_completions_api_params_handler.py
CHANGED

```diff
@@ -24,6 +24,10 @@ class ChatCompletionsAPIParamsHandler(APIParamsHandlerBase):
                 "allowed_tools",
                 "exclude_tools",
                 "custom_tools",  # Custom tools configuration (processed separately)
+                "enable_file_generation",  # Internal flag for file generation (used in system messages only)
+                "enable_image_generation",  # Internal flag for image generation (used in system messages only)
+                "enable_audio_generation",  # Internal flag for audio generation (used in system messages only)
+                "enable_video_generation",  # Internal flag for video generation (used in system messages only)
             },
         )
```
massgen/api_params_handler/_claude_api_params_handler.py
CHANGED

```diff
@@ -24,6 +24,10 @@ class ClaudeAPIParamsHandler(APIParamsHandlerBase):
                 "exclude_tools",
                 "custom_tools",  # Custom tools configuration (processed separately)
                 "_has_files_api_files",
+                "enable_file_generation",  # Internal flag for file generation (used in system messages only)
+                "enable_image_generation",  # Internal flag for image generation (used in system messages only)
+                "enable_audio_generation",  # Internal flag for audio generation (used in system messages only)
+                "enable_video_generation",  # Internal flag for video generation (used in system messages only)
             },
         )
```
massgen/api_params_handler/_gemini_api_params_handler.py
CHANGED

```diff
@@ -19,6 +19,10 @@ class GeminiAPIParamsHandler(APIParamsHandlerBase):
             "allowed_tools",
             "exclude_tools",
             "custom_tools",
+            "enable_file_generation",  # Internal flag for file generation (used in system messages only)
+            "enable_image_generation",  # Internal flag for image generation (used in system messages only)
+            "enable_audio_generation",  # Internal flag for audio generation (used in system messages only)
+            "enable_video_generation",  # Internal flag for video generation (used in system messages only)
         }
         return set(base) | extra
```
massgen/api_params_handler/_response_api_params_handler.py
CHANGED

```diff
@@ -24,6 +24,10 @@ class ResponseAPIParamsHandler(APIParamsHandlerBase):
                 "exclude_tools",
                 "custom_tools",  # Custom tools configuration (processed separately)
                 "_has_file_search_files",  # Internal flag for file search tracking
+                "enable_file_generation",  # Internal flag for file generation (used in system messages only)
+                "enable_image_generation",  # Internal flag for image generation (used in system messages only)
+                "enable_audio_generation",  # Internal flag for audio generation (used in system messages only)
+                "enable_video_generation",  # Internal flag for video generation (used in system messages only)
             },
         )
```
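Taken together, the four handler changes extend each backend's excluded-keys set, so the new `enable_*_generation` flags shape system-message construction but are stripped before any provider API call. A minimal sketch of that filtering pattern, assuming a standalone helper (`build_api_params` is illustrative, not the package's actual API):

```python
from typing import Any, Dict, Set

# Illustrative only: mirrors the excluded-keys pattern shared by the four handlers.
EXCLUDED_KEYS: Set[str] = {
    "allowed_tools",
    "exclude_tools",
    "custom_tools",
    "enable_file_generation",
    "enable_image_generation",
    "enable_audio_generation",
    "enable_video_generation",
}

def build_api_params(all_params: Dict[str, Any]) -> Dict[str, Any]:
    """Drop MassGen-internal keys before the payload goes to the provider."""
    return {k: v for k, v in all_params.items() if k not in EXCLUDED_KEYS}

# The flag influences the system message elsewhere, but is stripped here.
params = build_api_params({"model": "gpt-5-mini", "enable_image_generation": True})
assert "enable_image_generation" not in params
```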
massgen/backend/base_with_custom_tool_and_mcp.py
CHANGED

```diff
@@ -284,9 +284,19 @@ class CustomToolAndMCPBackend(LLMBackend):

         # Register each function with its corresponding values
         for i, func in enumerate(functions):
+            # Inject agent_cwd into preset_args if filesystem_manager is available
+            final_preset_args = preset_args_list[i].copy() if preset_args_list[i] else {}
+            if self.filesystem_manager and self.filesystem_manager.cwd:
+                final_preset_args["agent_cwd"] = self.filesystem_manager.cwd
+                logger.info(f"Injecting agent_cwd for {func}: {self.filesystem_manager.cwd}")
+            elif self.filesystem_manager:
+                logger.warning(f"filesystem_manager exists but cwd is None for {func}")
+            else:
+                logger.warning(f"No filesystem_manager available for {func}")
+
             # Load the function first if custom name is needed
             if names[i] and names[i] != func:
-                #
+                # Load function to apply custom name
                 if path:
                     loaded_func = self.custom_tool_manager._load_function_from_path(path, func)
                 else:
@@ -296,7 +306,6 @@ class CustomToolAndMCPBackend(LLMBackend):
                     logger.error(f"Could not load function '{func}' from path: {path}")
                     continue

-                # Apply custom name by modifying __name__ attribute
                 loaded_func.__name__ = names[i]

                 # Register with loaded function (no path needed)
@@ -304,7 +313,7 @@ class CustomToolAndMCPBackend(LLMBackend):
                     path=None,
                     func=loaded_func,
                     category=category,
-                    preset_args=
+                    preset_args=final_preset_args,
                     description=descriptions[i],
                 )
             else:
@@ -313,7 +322,7 @@ class CustomToolAndMCPBackend(LLMBackend):
                     path=path,
                     func=func,
                     category=category,
-                    preset_args=
+                    preset_args=final_preset_args,
                     description=descriptions[i],
                 )

@@ -404,9 +413,19 @@ class CustomToolAndMCPBackend(LLMBackend):
         """
         import json

+        # Parse arguments
+        arguments = json.loads(call["arguments"]) if isinstance(call["arguments"], str) else call["arguments"]
+
+        # Ensure agent_cwd is always injected if filesystem_manager is available
+        # This provides a fallback in case preset_args didn't work during registration
+        if self.filesystem_manager and self.filesystem_manager.cwd:
+            if "agent_cwd" not in arguments or arguments.get("agent_cwd") is None:
+                arguments["agent_cwd"] = self.filesystem_manager.cwd
+                logger.info(f"Dynamically injected agent_cwd at execution time: {self.filesystem_manager.cwd}")
+
         tool_request = {
             "name": call["name"],
-            "input":
+            "input": arguments,
         }

         result_text = ""
@@ -1120,6 +1139,7 @@ class CustomToolAndMCPBackend(LLMBackend):
         **kwargs,
     ) -> AsyncGenerator[StreamChunk, None]:
         """Simple passthrough streaming without MCP processing."""
+
         agent_id = kwargs.get("agent_id", None)
         all_params = {**self.config, **kwargs}
         processed_messages = await self._process_upload_files(messages, all_params)
```
massgen/backend/docs/permissions_and_context_files.md
CHANGED

```diff
@@ -1067,8 +1067,8 @@ Files delivered:
 - **Multi-Turn Design**: `docs/dev_notes/multi_turn_filesystem_design.md` - Detailed architecture for session persistence and turn-based workflows
 - **MCP Integration**: `docs/dev_notes/gemini_filesystem_mcp_design.md` - How filesystem access works through Model Context Protocol
 - **Context Sharing**: `docs/dev_notes/v0.0.14-context.md` - Original context sharing design
-- **User Context Paths**: `docs/case_studies/user-context-path-support-with-copy-mcp.md` - Case study on adding user-specified paths
-- **Claude Code Workspace**: `docs/case_studies/claude-code-workspace-management.md` - Native filesystem integration patterns
+- **User Context Paths**: `docs/source/examples/case_studies/user-context-path-support-with-copy-mcp.md` - Case study on adding user-specified paths
+- **Claude Code Workspace**: `docs/source/examples/case_studies/claude-code-workspace-management.md` - Native filesystem integration patterns

 ## Conclusion

```
massgen/backend/response.py
CHANGED

```diff
@@ -57,6 +57,7 @@ class ResponseBackend(CustomToolAndMCPBackend):

         Wraps parent implementation to ensure File Search cleanup happens after streaming completes.
         """
+
         try:
             async for chunk in super().stream_with_tools(messages, tools, **kwargs):
                 yield chunk
@@ -145,6 +146,7 @@ class ResponseBackend(CustomToolAndMCPBackend):
         **kwargs,
     ) -> AsyncGenerator[StreamChunk, None]:
         """Recursively stream MCP responses, executing function calls as needed."""
+
         agent_id = kwargs.get("agent_id")

         # Build API params for this iteration
```
massgen/chat_agent.py
CHANGED

```diff
@@ -14,6 +14,8 @@ from abc import ABC, abstractmethod
 from typing import Any, AsyncGenerator, Dict, List, Optional

 from .backend.base import LLMBackend, StreamChunk
+from .logger_config import logger
+from .memory import ConversationMemory, PersistentMemoryBase
 from .stream_chunk import ChunkType
 from .utils import CoordinationStage

@@ -26,10 +28,19 @@ class ChatAgent(ABC):
     providing a unified way to interact with any type of agent system.
     """

-    def __init__(
+    def __init__(
+        self,
+        session_id: Optional[str] = None,
+        conversation_memory: Optional[ConversationMemory] = None,
+        persistent_memory: Optional[PersistentMemoryBase] = None,
+    ):
         self.session_id = session_id or f"chat_session_{uuid.uuid4().hex[:8]}"
         self.conversation_history: List[Dict[str, Any]] = []

+        # Memory components
+        self.conversation_memory = conversation_memory
+        self.persistent_memory = persistent_memory
+
     @abstractmethod
     async def chat(
         self,
@@ -132,6 +143,9 @@ class SingleAgent(ChatAgent):
         agent_id: Optional[str] = None,
         system_message: Optional[str] = None,
         session_id: Optional[str] = None,
+        conversation_memory: Optional[ConversationMemory] = None,
+        persistent_memory: Optional[PersistentMemoryBase] = None,
+        context_monitor: Optional[Any] = None,
     ):
         """
         Initialize single agent.
```
```diff
@@ -141,11 +155,43 @@ class SingleAgent(ChatAgent):
             agent_id: Optional agent identifier
             system_message: Optional system message for the agent
             session_id: Optional session identifier
+            conversation_memory: Optional conversation memory instance
+            persistent_memory: Optional persistent memory instance
+            context_monitor: Optional context window monitor for tracking token usage
         """
-        super().__init__(session_id)
+        super().__init__(session_id, conversation_memory, persistent_memory)
         self.backend = backend
         self.agent_id = agent_id or f"agent_{uuid.uuid4().hex[:8]}"
         self.system_message = system_message
+        self.context_monitor = context_monitor
+        self._turn_number = 0
+
+        # Track orchestrator turn number (for turn-aware memory)
+        self._orchestrator_turn = None
+
+        # Track if compression has occurred (for smart retrieval)
+        self._compression_has_occurred = False
+
+        # Retrieval configuration (defaults, can be overridden from config)
+        self._retrieval_limit = 5  # Number of memory facts to retrieve from mem0
+        self._retrieval_exclude_recent = True  # Don't retrieve before compression (avoid duplicates)
+
+        # Track previous winning agents for shared memory retrieval
+        # Format: [{"agent_id": "agent_b", "turn": 1}, {"agent_id": "agent_a", "turn": 2}]
+        self._previous_winners = []
+
+        # Create context compressor if monitor and conversation_memory exist
+        self.context_compressor = None
+        if self.context_monitor and self.conversation_memory:
+            from .memory._compression import ContextCompressor
+            from .token_manager.token_manager import TokenCostCalculator
+
+            self.context_compressor = ContextCompressor(
+                token_calculator=TokenCostCalculator(),
+                conversation_memory=self.conversation_memory,
+                persistent_memory=self.persistent_memory,
+            )
+            logger.info(f"🗜️ Context compressor created for {self.agent_id}")

         # Add system message to history if provided
         if self.system_message:
```
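The constructor now composes three optional pieces: a `ConversationMemory` for short-term history, a `PersistentMemoryBase` for long-term facts, and a context monitor that, only when paired with conversation memory, activates a `ContextCompressor`. A hedged wiring sketch (the backend and monitor objects are placeholders, and the no-argument `ConversationMemory()` construction is an assumption; only the keyword names come from the signature above):

```python
from massgen.chat_agent import SingleAgent
from massgen.memory import ConversationMemory

agent = SingleAgent(
    backend=my_backend,                        # any LLMBackend implementation (placeholder)
    agent_id="agent_a",
    system_message="You are a careful research assistant.",
    conversation_memory=ConversationMemory(),  # short-term, clearable on reset
    persistent_memory=None,                    # long-term store (e.g. mem0-backed) is optional
    context_monitor=my_context_monitor,        # with conversation_memory, enables compression
)
```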
```diff
@@ -174,6 +220,11 @@ class SingleAgent(ChatAgent):
         assistant_response = ""
         tool_calls = []
         complete_message = None
+        messages_to_record = []
+
+        # Accumulate all chunks for complete memory recording
+        reasoning_chunks = []  # Accumulate reasoning content
+        reasoning_summaries = []  # Accumulate reasoning summaries

         try:
             async for chunk in backend_stream:
@@ -185,6 +236,16 @@ class SingleAgent(ChatAgent):
                     chunk_tool_calls = getattr(chunk, "tool_calls", []) or []
                     tool_calls.extend(chunk_tool_calls)
                     yield chunk
+                elif chunk_type == "reasoning":
+                    # Accumulate reasoning chunks for memory
+                    if hasattr(chunk, "content") and chunk.content:
+                        reasoning_chunks.append(chunk.content)
+                    yield chunk
+                elif chunk_type == "reasoning_summary":
+                    # Accumulate reasoning summaries
+                    if hasattr(chunk, "content") and chunk.content:
+                        reasoning_summaries.append(chunk.content)
+                    yield chunk
                 elif chunk_type == "complete_message":
                     # Backend provided the complete message structure
                     complete_message = chunk.complete_message
```
```diff
@@ -207,24 +268,161 @@ class SingleAgent(ChatAgent):
                     yield StreamChunk(type="tool_calls", tool_calls=response_tool_calls)
                     # Complete response is for internal use - don't yield it
                 elif chunk_type == "done":
-                    #
+                    # Debug: Log what we have before assembling
+                    logger.debug(
+                        f"🔍 [done] complete_message type: {type(complete_message)}, has_output: {isinstance(complete_message, dict) and 'output' in complete_message if complete_message else False}",
+                    )
+                    logger.debug(f"🔍 [done] assistant_response length: {len(assistant_response)}, reasoning: {len(reasoning_chunks)}, summaries: {len(reasoning_summaries)}")
+
+                    # Assemble complete memory from all accumulated chunks
+                    messages_to_record = []
+
+                    # 1. Add reasoning if present (full context for memory)
+                    if reasoning_chunks:
+                        combined_reasoning = "\n".join(reasoning_chunks)
+                        messages_to_record.append(
+                            {
+                                "role": "assistant",
+                                "content": f"[Reasoning]\n{combined_reasoning}",
+                            },
+                        )
+
+                    # 2. Add reasoning summaries if present
+                    if reasoning_summaries:
+                        combined_summary = "\n".join(reasoning_summaries)
+                        messages_to_record.append(
+                            {
+                                "role": "assistant",
+                                "content": f"[Reasoning Summary]\n{combined_summary}",
+                            },
+                        )
+
+                    # 3. Add final text response (MCP tools not included - they're implementation details)
                     if complete_message:
                         # For Responses API: complete_message is the response object with 'output' array
-                        # Each item in output should be added to conversation history individually
                         if isinstance(complete_message, dict) and "output" in complete_message:
+                            # Store raw output for orchestrator (needs full format)
                             self.conversation_history.extend(complete_message["output"])
+
+                            # Debug: Log what's in the output array
+                            logger.debug(f"🔍 [done] complete_message['output'] has {len(complete_message['output'])} items")
+                            for i, item in enumerate(complete_message["output"][:3]):  # Show first 3
+                                item_type = item.get("type") if isinstance(item, dict) else type(item).__name__
+                                logger.debug(f"  [{i}] type={item_type}")
+
+                            # Extract text from output items
+                            for output_item in complete_message["output"]:
+                                if not isinstance(output_item, dict):
+                                    continue
+
+                                output_type = output_item.get("type")
+
+                                # Skip function_call (workflow tools - not conversation content)
+                                if output_type == "function_call":
+                                    continue
+
+                                # Extract text content from various formats
+                                if output_type == "output_text":
+                                    # Responses API format
+                                    text_content = output_item.get("text", "")
+                                elif output_type == "message":
+                                    # Standard message format
+                                    text_content = output_item.get("content", "")
+                                elif output_type == "reasoning":
+                                    # Reasoning chunks are already captured above, skip duplicate
+                                    continue
+                                else:
+                                    # Unknown type - try to get content/text
+                                    text_content = output_item.get("content") or output_item.get("text", "")
+                                    logger.debug(f"  ⚠️ Unknown output type '{output_type}', extracted: {bool(text_content)}")
+
+                                if text_content:
+                                    logger.debug(f"  ✅ Extracted text ({len(text_content)} chars) from type={output_type}")
+                                    messages_to_record.append(
+                                        {
+                                            "role": "assistant",
+                                            "content": text_content,
+                                        },
+                                    )
+                                else:
+                                    logger.debug(f"  ⚠️ No text content found in type={output_type}")
                         else:
                             # Fallback if it's already in message format
                             self.conversation_history.append(complete_message)
-
-
+                            if isinstance(complete_message, dict) and complete_message.get("content"):
+                                messages_to_record.append(complete_message)
+                    elif assistant_response.strip():
+                        # Fallback for legacy backends - use accumulated text
                         message_data = {
                             "role": "assistant",
                             "content": assistant_response.strip(),
                         }
-                        if tool_calls:
-                            message_data["tool_calls"] = tool_calls
                         self.conversation_history.append(message_data)
+                        messages_to_record.append(message_data)
+
+                    # Record to memories
+                    logger.debug(f"📋 [done chunk] messages_to_record has {len(messages_to_record)} message(s)")
+
+                    if messages_to_record:
+                        logger.debug(f"✅ Will record {len(messages_to_record)} message(s) to memory")
+                        # Add to conversation memory (use formatted messages, not raw output)
+                        if self.conversation_memory:
+                            try:
+                                await self.conversation_memory.add(messages_to_record)
+                                logger.debug(f"📝 Added {len(messages_to_record)} message(s) to conversation memory")
+                            except Exception as e:
+                                # Log but don't fail if memory add fails
+                                logger.warning(f"⚠️ Failed to add response to conversation memory: {e}")
+                        # Record to persistent memory with turn metadata
+                        if self.persistent_memory:
+                            try:
+                                # Include turn number in metadata for temporal filtering
+                                logger.debug(f"📝 Recording {len(messages_to_record)} messages to persistent memory (turn {self._orchestrator_turn})")
+                                await self.persistent_memory.record(
+                                    messages_to_record,
+                                    metadata={"turn": self._orchestrator_turn} if self._orchestrator_turn else None,
+                                )
+                                logger.debug("✅ Successfully recorded to persistent memory")
+                            except NotImplementedError:
+                                # Memory backend doesn't support record
+                                logger.warning("⚠️ Persistent memory doesn't support record()")
+                            except Exception as e:
+                                # Log but don't fail if memory record fails
+                                logger.warning(f"⚠️ Failed to record to persistent memory: {e}")
+                    else:
+                        logger.warning("⚠️ [done chunk] messages_to_record is EMPTY - nothing to record!")
+
+                    # Log context usage after response (if monitor enabled)
+                    if self.context_monitor:
+                        # Use conversation history for accurate token count
+                        current_history = self.conversation_history if not self.conversation_memory else await self.conversation_memory.get_messages()
+                        usage_info = self.context_monitor.log_context_usage(current_history, turn_number=self._turn_number)
+
+                        # Compress if needed
+                        if self.context_compressor and usage_info.get("should_compress"):
+                            logger.info(
+                                f"🔄 Attempting compression for {self.agent_id} " f"({usage_info['current_tokens']:,} → {usage_info['target_tokens']:,} tokens)",
+                            )
+                            compression_stats = await self.context_compressor.compress_if_needed(
+                                messages=current_history,
+                                current_tokens=usage_info["current_tokens"],
+                                target_tokens=usage_info["target_tokens"],
+                                should_compress=True,
+                            )
+
+                            # Update conversation_history if compression occurred
+                            if compression_stats and self.conversation_memory:
+                                # Reload from conversation memory (it was updated by compressor)
+                                self.conversation_history = await self.conversation_memory.get_messages()
+                                # Mark that compression has occurred
+                                self._compression_has_occurred = True
+                                logger.info(
+                                    f"✅ Conversation history updated after compression: " f"{len(self.conversation_history)} messages",
+                                )
+                        elif usage_info.get("should_compress") and not self.context_compressor:
+                            logger.warning(
+                                f"⚠️ Should compress but compressor not available " f"(monitor={self.context_monitor is not None}, " f"conv_mem={self.conversation_memory is not None})",
+                            )
                     yield chunk
                 else:
                     yield chunk
```
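The call sites in this hunk pin down the memory interfaces the agent depends on: conversation memory exposes `add`, `get_messages`, and `clear`, while persistent memory exposes `record` (which may raise `NotImplementedError`) and, per the retrieval hunk further down, `retrieve`. A sketch of those surfaces as async protocols, with signatures inferred from the call sites rather than taken from `massgen/memory/_base.py`:

```python
from typing import Any, Dict, List, Optional, Protocol

class ConversationMemoryLike(Protocol):
    """Short-term memory: methods inferred from self.conversation_memory call sites."""
    async def add(self, messages: List[Dict[str, Any]]) -> None: ...
    async def get_messages(self) -> List[Dict[str, Any]]: ...
    async def clear(self) -> None: ...

class PersistentMemoryLike(Protocol):
    """Long-term memory: methods inferred from self.persistent_memory call sites."""
    async def record(
        self,
        messages: List[Dict[str, Any]],
        metadata: Optional[Dict[str, Any]] = None,  # e.g. {"turn": 2}
    ) -> None: ...
    async def retrieve(
        self,
        messages: List[Dict[str, Any]],
        limit: int = 5,
        previous_winners: Optional[List[Dict[str, Any]]] = None,
    ) -> str: ...  # newline-separated memory facts, per the retrieval logging
```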
```diff
@@ -242,12 +440,28 @@ class SingleAgent(ChatAgent):
         reset_chat: bool = False,
         clear_history: bool = False,
         current_stage: CoordinationStage = None,
+        orchestrator_turn: Optional[int] = None,
+        previous_winners: Optional[List[Dict[str, Any]]] = None,
     ) -> AsyncGenerator[StreamChunk, None]:
-
-
-
-
-
+        """
+        Process messages through single backend with tool support.
+
+        Args:
+            orchestrator_turn: Current orchestrator turn number (for turn-aware memory)
+            previous_winners: List of previous winning agents with turns
+                Format: [{"agent_id": "agent_b", "turn": 1}, ...]
+        """
+        # Update orchestrator turn if provided
+        if orchestrator_turn is not None:
+            logger.debug(f"🔍 [chat] Setting orchestrator_turn={orchestrator_turn} for {self.agent_id}")
+            self._orchestrator_turn = orchestrator_turn
+
+        # Update previous winners if provided
+        if previous_winners is not None:
+            logger.debug(f"🔍 [chat] Setting previous_winners={previous_winners} for {self.agent_id}")
+            self._previous_winners = previous_winners
+        else:
+            logger.debug(f"🔍 [chat] No previous_winners provided to {self.agent_id} (current: {self._previous_winners})")
         if clear_history:
             # Clear history but keep system message if it exists
             system_messages = [msg for msg in self.conversation_history if msg.get("role") == "system"]
```
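From the caller's side, the two new keyword arguments let the orchestrator tag each `chat()` call with its turn number and the lineage of winning agents. A hypothetical driver snippet (the message content is invented; the keyword names come from the signature above):

```python
async def drive_one_turn(agent) -> None:
    # Hypothetical orchestrator-side call using the new keyword arguments.
    async for chunk in agent.chat(
        messages=[{"role": "user", "content": "Continue the implementation plan."}],
        orchestrator_turn=2,
        previous_winners=[{"agent_id": "agent_b", "turn": 1}],
    ):
        if getattr(chunk, "type", None) == "content":
            print(chunk.content, end="")
```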
```diff
@@ -255,28 +469,121 @@ class SingleAgent(ChatAgent):
             # Clear backend history while maintaining session
             if self.backend.is_stateful():
                 await self.backend.clear_history()
+            # Clear conversation memory if available
+            if self.conversation_memory:
+                await self.conversation_memory.clear()

         if reset_chat:
+            # Skip pre-restart recording - messages are already recorded via done chunks
+            # Pre-restart would duplicate content and include orchestrator system prompts (noise)
+            # The conversation_memory contains:
+            # 1. User messages - will be in new conversation after reset
+            # 2. Agent responses - already recorded to persistent_memory via done chunks
+            # 3. System messages - orchestrator prompts, don't want in long-term memory
+            logger.debug(f"🔄 Resetting chat for {self.agent_id} (skipping pre-restart recording - already captured via done chunks)")
+
             # Reset conversation history to the provided messages
             self.conversation_history = messages.copy()
             # Reset backend state completely
             if self.backend.is_stateful():
                 await self.backend.reset_state()
+            # Reset conversation memory
+            if self.conversation_memory:
+                await self.conversation_memory.clear()
+                await self.conversation_memory.add(messages)
             backend_messages = self.conversation_history.copy()
         else:
             # Regular conversation - append new messages to agent's history
             self.conversation_history.extend(messages)
-            #
-            if self.
-
-
-
-
+            # Add to conversation memory
+            if self.conversation_memory:
+                try:
+                    await self.conversation_memory.add(messages)
+                except Exception as e:
+                    # Log but don't fail if memory add fails
+                    logger.warning(f"Failed to add messages to conversation memory: {e}")
+            backend_messages = self.conversation_history.copy()
+
+        # Retrieve relevant persistent memories if available
+        # ALWAYS retrieve on reset_chat (to restore recent context after restart)
+        # Otherwise, only retrieve if compression has occurred (to avoid duplicating recent context)
+        memory_context = ""
+        should_retrieve = self.persistent_memory and (reset_chat or self._compression_has_occurred or not self._retrieval_exclude_recent)  # Always retrieve on reset to restore context
+
+        if should_retrieve:
+            try:
+                # Log retrieval reason and scope
+                if reset_chat:
+                    logger.info(
+                        f"🔄 Retrieving memories after reset for {self.agent_id} " f"(restoring recent context + {len(self._previous_winners) if self._previous_winners else 0} winner(s))...",
+                    )
+                elif self._previous_winners:
+                    logger.info(
+                        f"🔍 Retrieving memories for {self.agent_id} + {len(self._previous_winners)} previous winner(s) " f"(limit={self._retrieval_limit}/agent)...",
+                    )
+                    logger.debug(f"  Previous winners: {self._previous_winners}")
+                else:
+                    logger.info(
+                        f"🔍 Retrieving memories for {self.agent_id} " f"(limit={self._retrieval_limit}, compressed={self._compression_has_occurred})...",
+                    )

+                memory_context = await self.persistent_memory.retrieve(
+                    messages,
+                    limit=self._retrieval_limit,
+                    previous_winners=self._previous_winners if self._previous_winners else None,
+                )
+
+                if memory_context:
+                    memory_lines = memory_context.strip().split("\n")
+                    logger.info(
+                        f"💭 Retrieved {len(memory_lines)} memory fact(s) from mem0",
+                    )
+                    # Show preview at INFO level (truncate to first 300 chars for readability)
+                    preview = memory_context[:300] + "..." if len(memory_context) > 300 else memory_context
+                    logger.info(f"  📝 Preview:\n{preview}")
+                else:
+                    logger.info("  ℹ️ No relevant memories found")
+            except NotImplementedError:
+                logger.debug("  Persistent memory doesn't support retrieval")
+            except Exception as e:
+                logger.warning(f"⚠️ Failed to retrieve from persistent memory: {e}")
+        elif self.persistent_memory and self._retrieval_exclude_recent:
+            logger.debug(
+                f"⏭️ Skipping retrieval for {self.agent_id} " f"(no compression yet, all context in conversation_memory)",
+            )
+
+        # Handle stateful vs stateless backends differently
+        if self.backend.is_stateful():
+            # Stateful: only send new messages, backend maintains context
+            backend_messages = messages.copy()
+            # Inject memory context before user messages if available
+            if memory_context:
+                memory_msg = {
+                    "role": "system",
+                    "content": f"Relevant memories:\n{memory_context}",
+                }
+                backend_messages.insert(0, memory_msg)
+        else:
+            # Stateless: send full conversation history
+            backend_messages = self.conversation_history.copy()
+            # Inject memory context after system message but before conversation
+            if memory_context:
+                memory_msg = {
+                    "role": "system",
+                    "content": f"Relevant memories:\n{memory_context}",
+                }
+                # Insert after existing system messages
+                system_count = sum(1 for msg in backend_messages if msg.get("role") == "system")
+                backend_messages.insert(system_count, memory_msg)

         if current_stage:
             self.backend.set_stage(current_stage)

+        # Log context usage before processing (if monitor enabled)
+        self._turn_number += 1
+        if self.context_monitor:
+            self.context_monitor.log_context_usage(backend_messages, turn_number=self._turn_number)
+
         # Create backend stream and process it
         backend_stream = self.backend.stream_with_tools(
             messages=backend_messages,
```
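The injection logic differs only in where the synthetic system message lands: stateful backends get it at index 0 of the delta messages, while stateless backends get it after any existing system messages, so it sits between the agent's system prompt and the conversation. A standalone restatement of the stateless placement rule, with an invented example conversation:

```python
from typing import Any, Dict, List

def inject_memory_context(history: List[Dict[str, Any]], memory_context: str) -> List[Dict[str, Any]]:
    """Insert a 'Relevant memories' system message after existing system messages."""
    out = history.copy()
    memory_msg = {"role": "system", "content": f"Relevant memories:\n{memory_context}"}
    system_count = sum(1 for msg in out if msg.get("role") == "system")
    out.insert(system_count, memory_msg)
    return out

# The memory block ends up between the system prompt and the user turn:
msgs = inject_memory_context(
    [{"role": "system", "content": "You are agent_a."},
     {"role": "user", "content": "What did we decide last turn?"}],
    "- The team chose Qdrant for vector storage",
)
assert msgs[1]["role"] == "system" and "Relevant memories" in msgs[1]["content"]
```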
```diff
@@ -311,6 +618,10 @@ class SingleAgent(ChatAgent):
         if self.backend.is_stateful():
             await self.backend.reset_state()

+        # Clear conversation memory (not persistent memory)
+        if self.conversation_memory:
+            await self.conversation_memory.clear()
+
         # Re-add system message if it exists
         if self.system_message:
             self.conversation_history.append({"role": "system", "content": self.system_message})
```
```diff
@@ -356,6 +667,9 @@ class ConfigurableAgent(SingleAgent):
         config,  # AgentConfig - avoid circular import
         backend: LLMBackend,
         session_id: Optional[str] = None,
+        conversation_memory: Optional[ConversationMemory] = None,
+        persistent_memory: Optional[PersistentMemoryBase] = None,
+        context_monitor: Optional[Any] = None,
     ):
         """
         Initialize configurable agent.
@@ -364,6 +678,9 @@ class ConfigurableAgent(SingleAgent):
             config: AgentConfig with all settings
             backend: LLM backend
             session_id: Optional session identifier
+            conversation_memory: Optional conversation memory instance
+            persistent_memory: Optional persistent memory instance
+            context_monitor: Optional context window monitor for tracking token usage
         """
         # Extract system message without triggering deprecation warning
         system_message = None
@@ -375,6 +692,9 @@ class ConfigurableAgent(SingleAgent):
             agent_id=config.agent_id,
            system_message=system_message,
             session_id=session_id,
+            conversation_memory=conversation_memory,
+            persistent_memory=persistent_memory,
+            context_monitor=context_monitor,
         )
         self.config = config
```