PyPI - code-puppy - Versions diffs - 0.0.169__py3-none-any.whl → 0.0.366__py3-none-any.whl - Mend

code-puppy 0.0.169 (py3-none-any.whl) → 0.0.366 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (243)

code_puppy/__init__.py +7 -1
code_puppy/agents/__init__.py +8 -8
code_puppy/agents/agent_c_reviewer.py +155 -0
code_puppy/agents/agent_code_puppy.py +9 -2
code_puppy/agents/agent_code_reviewer.py +90 -0
code_puppy/agents/agent_cpp_reviewer.py +132 -0
code_puppy/agents/agent_creator_agent.py +48 -9
code_puppy/agents/agent_golang_reviewer.py +151 -0
code_puppy/agents/agent_javascript_reviewer.py +160 -0
code_puppy/agents/agent_manager.py +146 -199
code_puppy/agents/agent_pack_leader.py +383 -0
code_puppy/agents/agent_planning.py +163 -0
code_puppy/agents/agent_python_programmer.py +165 -0
code_puppy/agents/agent_python_reviewer.py +90 -0
code_puppy/agents/agent_qa_expert.py +163 -0
code_puppy/agents/agent_qa_kitten.py +208 -0
code_puppy/agents/agent_security_auditor.py +181 -0
code_puppy/agents/agent_terminal_qa.py +323 -0
code_puppy/agents/agent_typescript_reviewer.py +166 -0
code_puppy/agents/base_agent.py +1713 -1
code_puppy/agents/event_stream_handler.py +350 -0
code_puppy/agents/json_agent.py +12 -1
code_puppy/agents/pack/__init__.py +34 -0
code_puppy/agents/pack/bloodhound.py +304 -0
code_puppy/agents/pack/husky.py +321 -0
code_puppy/agents/pack/retriever.py +393 -0
code_puppy/agents/pack/shepherd.py +348 -0
code_puppy/agents/pack/terrier.py +287 -0
code_puppy/agents/pack/watchdog.py +367 -0
code_puppy/agents/prompt_reviewer.py +145 -0
code_puppy/agents/subagent_stream_handler.py +276 -0
code_puppy/api/__init__.py +13 -0
code_puppy/api/app.py +169 -0
code_puppy/api/main.py +21 -0
code_puppy/api/pty_manager.py +446 -0
code_puppy/api/routers/__init__.py +12 -0
code_puppy/api/routers/agents.py +36 -0
code_puppy/api/routers/commands.py +217 -0
code_puppy/api/routers/config.py +74 -0
code_puppy/api/routers/sessions.py +232 -0
code_puppy/api/templates/terminal.html +361 -0
code_puppy/api/websocket.py +154 -0
code_puppy/callbacks.py +174 -4
code_puppy/chatgpt_codex_client.py +283 -0
code_puppy/claude_cache_client.py +586 -0
code_puppy/cli_runner.py +916 -0
code_puppy/command_line/add_model_menu.py +1079 -0
code_puppy/command_line/agent_menu.py +395 -0
code_puppy/command_line/attachments.py +395 -0
code_puppy/command_line/autosave_menu.py +605 -0
code_puppy/command_line/clipboard.py +527 -0
code_puppy/command_line/colors_menu.py +520 -0
code_puppy/command_line/command_handler.py +233 -627
code_puppy/command_line/command_registry.py +150 -0
code_puppy/command_line/config_commands.py +715 -0
code_puppy/command_line/core_commands.py +792 -0
code_puppy/command_line/diff_menu.py +863 -0
code_puppy/command_line/load_context_completion.py +15 -22
code_puppy/command_line/mcp/base.py +1 -4
code_puppy/command_line/mcp/catalog_server_installer.py +175 -0
code_puppy/command_line/mcp/custom_server_form.py +688 -0
code_puppy/command_line/mcp/custom_server_installer.py +195 -0
code_puppy/command_line/mcp/edit_command.py +148 -0
code_puppy/command_line/mcp/handler.py +9 -4
code_puppy/command_line/mcp/help_command.py +6 -5
code_puppy/command_line/mcp/install_command.py +16 -27
code_puppy/command_line/mcp/install_menu.py +685 -0
code_puppy/command_line/mcp/list_command.py +3 -3
code_puppy/command_line/mcp/logs_command.py +174 -65
code_puppy/command_line/mcp/remove_command.py +2 -2
code_puppy/command_line/mcp/restart_command.py +12 -4
code_puppy/command_line/mcp/search_command.py +17 -11
code_puppy/command_line/mcp/start_all_command.py +22 -13
code_puppy/command_line/mcp/start_command.py +50 -31
code_puppy/command_line/mcp/status_command.py +6 -7
code_puppy/command_line/mcp/stop_all_command.py +11 -8
code_puppy/command_line/mcp/stop_command.py +11 -10
code_puppy/command_line/mcp/test_command.py +2 -2
code_puppy/command_line/mcp/utils.py +1 -1
code_puppy/command_line/mcp/wizard_utils.py +22 -18
code_puppy/command_line/mcp_completion.py +174 -0
code_puppy/command_line/model_picker_completion.py +89 -30
code_puppy/command_line/model_settings_menu.py +884 -0
code_puppy/command_line/motd.py +14 -8
code_puppy/command_line/onboarding_slides.py +179 -0
code_puppy/command_line/onboarding_wizard.py +340 -0
code_puppy/command_line/pin_command_completion.py +329 -0
code_puppy/command_line/prompt_toolkit_completion.py +626 -75
code_puppy/command_line/session_commands.py +296 -0
code_puppy/command_line/utils.py +54 -0
code_puppy/config.py +1181 -51
code_puppy/error_logging.py +118 -0
code_puppy/gemini_code_assist.py +385 -0
code_puppy/gemini_model.py +602 -0
code_puppy/http_utils.py +220 -104
code_puppy/keymap.py +128 -0
code_puppy/main.py +5 -594
code_puppy/{mcp → mcp_}/__init__.py +17 -0
code_puppy/{mcp → mcp_}/async_lifecycle.py +35 -4
code_puppy/{mcp → mcp_}/blocking_startup.py +70 -43
code_puppy/{mcp → mcp_}/captured_stdio_server.py +2 -2
code_puppy/{mcp → mcp_}/config_wizard.py +5 -5
code_puppy/{mcp → mcp_}/dashboard.py +15 -6
code_puppy/{mcp → mcp_}/examples/retry_example.py +4 -1
code_puppy/{mcp → mcp_}/managed_server.py +66 -39
code_puppy/{mcp → mcp_}/manager.py +146 -52
code_puppy/mcp_/mcp_logs.py +224 -0
code_puppy/{mcp → mcp_}/registry.py +6 -6
code_puppy/{mcp → mcp_}/server_registry_catalog.py +25 -8
code_puppy/messaging/__init__.py +199 -2
code_puppy/messaging/bus.py +610 -0
code_puppy/messaging/commands.py +167 -0
code_puppy/messaging/markdown_patches.py +57 -0
code_puppy/messaging/message_queue.py +17 -48
code_puppy/messaging/messages.py +500 -0
code_puppy/messaging/queue_console.py +1 -24
code_puppy/messaging/renderers.py +43 -146
code_puppy/messaging/rich_renderer.py +1027 -0
code_puppy/messaging/spinner/__init__.py +33 -5
code_puppy/messaging/spinner/console_spinner.py +92 -52
code_puppy/messaging/spinner/spinner_base.py +29 -0
code_puppy/messaging/subagent_console.py +461 -0
code_puppy/model_factory.py +686 -80
code_puppy/model_utils.py +167 -0
code_puppy/models.json +86 -104
code_puppy/models_dev_api.json +1 -0
code_puppy/models_dev_parser.py +592 -0
code_puppy/plugins/__init__.py +164 -10
code_puppy/plugins/antigravity_oauth/__init__.py +10 -0
code_puppy/plugins/antigravity_oauth/accounts.py +406 -0
code_puppy/plugins/antigravity_oauth/antigravity_model.py +704 -0
code_puppy/plugins/antigravity_oauth/config.py +42 -0
code_puppy/plugins/antigravity_oauth/constants.py +136 -0
code_puppy/plugins/antigravity_oauth/oauth.py +478 -0
code_puppy/plugins/antigravity_oauth/register_callbacks.py +406 -0
code_puppy/plugins/antigravity_oauth/storage.py +271 -0
code_puppy/plugins/antigravity_oauth/test_plugin.py +319 -0
code_puppy/plugins/antigravity_oauth/token.py +167 -0
code_puppy/plugins/antigravity_oauth/transport.py +767 -0
code_puppy/plugins/antigravity_oauth/utils.py +169 -0
code_puppy/plugins/chatgpt_oauth/__init__.py +8 -0
code_puppy/plugins/chatgpt_oauth/config.py +52 -0
code_puppy/plugins/chatgpt_oauth/oauth_flow.py +328 -0
code_puppy/plugins/chatgpt_oauth/register_callbacks.py +94 -0
code_puppy/plugins/chatgpt_oauth/test_plugin.py +293 -0
code_puppy/plugins/chatgpt_oauth/utils.py +489 -0
code_puppy/plugins/claude_code_oauth/README.md +167 -0
code_puppy/plugins/claude_code_oauth/SETUP.md +93 -0
code_puppy/plugins/claude_code_oauth/__init__.py +6 -0
code_puppy/plugins/claude_code_oauth/config.py +50 -0
code_puppy/plugins/claude_code_oauth/register_callbacks.py +308 -0
code_puppy/plugins/claude_code_oauth/test_plugin.py +283 -0
code_puppy/plugins/claude_code_oauth/utils.py +518 -0
code_puppy/plugins/customizable_commands/__init__.py +0 -0
code_puppy/plugins/customizable_commands/register_callbacks.py +169 -0
code_puppy/plugins/example_custom_command/README.md +280 -0
code_puppy/plugins/example_custom_command/register_callbacks.py +51 -0
code_puppy/plugins/file_permission_handler/__init__.py +4 -0
code_puppy/plugins/file_permission_handler/register_callbacks.py +523 -0
code_puppy/plugins/frontend_emitter/__init__.py +25 -0
code_puppy/plugins/frontend_emitter/emitter.py +121 -0
code_puppy/plugins/frontend_emitter/register_callbacks.py +261 -0
code_puppy/plugins/oauth_puppy_html.py +228 -0
code_puppy/plugins/shell_safety/__init__.py +6 -0
code_puppy/plugins/shell_safety/agent_shell_safety.py +69 -0
code_puppy/plugins/shell_safety/command_cache.py +156 -0
code_puppy/plugins/shell_safety/register_callbacks.py +202 -0
code_puppy/prompts/antigravity_system_prompt.md +1 -0
code_puppy/prompts/codex_system_prompt.md +310 -0
code_puppy/pydantic_patches.py +131 -0
code_puppy/reopenable_async_client.py +8 -8
code_puppy/round_robin_model.py +10 -15
code_puppy/session_storage.py +294 -0
code_puppy/status_display.py +21 -4
code_puppy/summarization_agent.py +52 -14
code_puppy/terminal_utils.py +418 -0
code_puppy/tools/__init__.py +139 -6
code_puppy/tools/agent_tools.py +548 -49
code_puppy/tools/browser/__init__.py +37 -0
code_puppy/tools/browser/browser_control.py +289 -0
code_puppy/tools/browser/browser_interactions.py +545 -0
code_puppy/tools/browser/browser_locators.py +640 -0
code_puppy/tools/browser/browser_manager.py +316 -0
code_puppy/tools/browser/browser_navigation.py +251 -0
code_puppy/tools/browser/browser_screenshot.py +179 -0
code_puppy/tools/browser/browser_scripts.py +462 -0
code_puppy/tools/browser/browser_workflows.py +221 -0
code_puppy/tools/browser/chromium_terminal_manager.py +259 -0
code_puppy/tools/browser/terminal_command_tools.py +521 -0
code_puppy/tools/browser/terminal_screenshot_tools.py +556 -0
code_puppy/tools/browser/terminal_tools.py +525 -0
code_puppy/tools/command_runner.py +941 -153
code_puppy/tools/common.py +1146 -6
code_puppy/tools/display.py +84 -0
code_puppy/tools/file_modifications.py +288 -89
code_puppy/tools/file_operations.py +352 -266
code_puppy/tools/subagent_context.py +158 -0
code_puppy/uvx_detection.py +242 -0
code_puppy/version_checker.py +30 -11
code_puppy-0.0.366.data/data/code_puppy/models.json +110 -0
code_puppy-0.0.366.data/data/code_puppy/models_dev_api.json +1 -0
{code_puppy-0.0.169.dist-info → code_puppy-0.0.366.dist-info}/METADATA +184 -67
code_puppy-0.0.366.dist-info/RECORD +217 -0
{code_puppy-0.0.169.dist-info → code_puppy-0.0.366.dist-info}/WHEEL +1 -1
{code_puppy-0.0.169.dist-info → code_puppy-0.0.366.dist-info}/entry_points.txt +1 -0
code_puppy/agent.py +0 -231
code_puppy/agents/agent_orchestrator.json +0 -26
code_puppy/agents/runtime_manager.py +0 -272
code_puppy/command_line/mcp/add_command.py +0 -183
code_puppy/command_line/meta_command_handler.py +0 -153
code_puppy/message_history_processor.py +0 -490
code_puppy/messaging/spinner/textual_spinner.py +0 -101
code_puppy/state_management.py +0 -200
code_puppy/tui/__init__.py +0 -10
code_puppy/tui/app.py +0 -986
code_puppy/tui/components/__init__.py +0 -21
code_puppy/tui/components/chat_view.py +0 -550
code_puppy/tui/components/command_history_modal.py +0 -218
code_puppy/tui/components/copy_button.py +0 -139
code_puppy/tui/components/custom_widgets.py +0 -63
code_puppy/tui/components/human_input_modal.py +0 -175
code_puppy/tui/components/input_area.py +0 -167
code_puppy/tui/components/sidebar.py +0 -309
code_puppy/tui/components/status_bar.py +0 -182
code_puppy/tui/messages.py +0 -27
code_puppy/tui/models/__init__.py +0 -8
code_puppy/tui/models/chat_message.py +0 -25
code_puppy/tui/models/command_history.py +0 -89
code_puppy/tui/models/enums.py +0 -24
code_puppy/tui/screens/__init__.py +0 -15
code_puppy/tui/screens/help.py +0 -130
code_puppy/tui/screens/mcp_install_wizard.py +0 -803
code_puppy/tui/screens/settings.py +0 -290
code_puppy/tui/screens/tools.py +0 -74
code_puppy-0.0.169.data/data/code_puppy/models.json +0 -128
code_puppy-0.0.169.dist-info/RECORD +0 -112
/code_puppy/{mcp → mcp_}/circuit_breaker.py +0 -0
/code_puppy/{mcp → mcp_}/error_isolation.py +0 -0
/code_puppy/{mcp → mcp_}/health_monitor.py +0 -0
/code_puppy/{mcp → mcp_}/retry_manager.py +0 -0
/code_puppy/{mcp → mcp_}/status_tracker.py +0 -0
/code_puppy/{mcp → mcp_}/system_tools.py +0 -0
{code_puppy-0.0.169.dist-info → code_puppy-0.0.366.dist-info}/licenses/LICENSE +0 -0

code_puppy/tools/agent_tools.py (changed)

@@ -1,22 +1,209 @@
 # agent_tools.py
-from typing import List
+import asyncio
+import hashlib
+import itertools
+import json
+import pickle
+import re
+import traceback
+from datetime import datetime
+from functools import partial
+from pathlib import Path
+from typing import List, Set
+from dbos import DBOS, SetWorkflowID
 from pydantic import BaseModel
-from pydantic_ai import RunContext
+# Import Agent from pydantic_ai to create temporary agents for invocation
+from pydantic_ai import Agent, RunContext, UsageLimits
+from pydantic_ai.messages import ModelMessage
+from code_puppy.config import (
+    DATA_DIR,
+    get_message_limit,
+    get_use_dbos,
+    get_value,
+)
 from code_puppy.messaging import (
-    emit_info,
-    emit_divider,
-    emit_system_message,
+    SubAgentInvocationMessage,
+    SubAgentResponseMessage,
     emit_error,
+    emit_info,
+    emit_success,
+    get_message_bus,
+    get_session_context,
+    set_session_context,
 )
 from code_puppy.tools.common import generate_group_id
-from code_puppy.agents.agent_manager import get_available_agents, load_agent_config
+from code_puppy.tools.subagent_context import subagent_context
-# Import Agent from pydantic_ai to create temporary agents for invocation
-from pydantic_ai import Agent
-from code_puppy.model_factory import ModelFactory
-from code_puppy.config import get_model_name
+# Set to track active subagent invocation tasks
+_active_subagent_tasks: Set[asyncio.Task] = set()
+# Atomic counter for DBOS workflow IDs - ensures uniqueness even in rapid back-to-back calls
+# itertools.count() is thread-safe for next() calls
+_dbos_workflow_counter = itertools.count()
+def _generate_dbos_workflow_id(base_id: str) -> str:
+    """Generate a unique DBOS workflow ID by appending an atomic counter.
+    DBOS requires workflow IDs to be unique across all executions.
+    This function ensures uniqueness by combining the base_id with
+    an atomically incrementing counter.
+    Args:
+        base_id: The base identifier (e.g., group_id from generate_group_id)
+    Returns:
+        A unique workflow ID in format: {base_id}-wf-{counter}
+    """
+    counter = next(_dbos_workflow_counter)
+    return f"{base_id}-wf-{counter}"
+def _generate_session_hash_suffix() -> str:
+    """Generate a short SHA1 hash suffix based on current timestamp for uniqueness.
+    Returns:
+        A 6-character hex string, e.g., "a3f2b1"
+    """
+    timestamp = str(datetime.now().timestamp())
+    return hashlib.sha1(timestamp.encode()).hexdigest()[:6]
+# Regex pattern for kebab-case session IDs
+SESSION_ID_PATTERN = re.compile(r"^[a-z0-9]+(-[a-z0-9]+)*$")
+SESSION_ID_MAX_LENGTH = 128
+def _validate_session_id(session_id: str) -> None:
+    """Validate that a session ID follows kebab-case naming conventions.
+    Args:
+        session_id: The session identifier to validate
+    Raises:
+        ValueError: If the session_id is invalid
+    Valid format:
+        - Lowercase letters (a-z)
+        - Numbers (0-9)
+        - Hyphens (-) to separate words
+        - No uppercase, no underscores, no special characters
+        - Length between 1 and 128 characters
+    Examples:
+        Valid: "my-session", "agent-session-1", "discussion-about-code"
+        Invalid: "MySession", "my_session", "my session", "my--session"
+    """
+    if not session_id:
+        raise ValueError("session_id cannot be empty")
+    if len(session_id) > SESSION_ID_MAX_LENGTH:
+        raise ValueError(
+            f"Invalid session_id '{session_id}': must be {SESSION_ID_MAX_LENGTH} characters or less"
+        )
+    if not SESSION_ID_PATTERN.match(session_id):
+        raise ValueError(
+            f"Invalid session_id '{session_id}': must be kebab-case "
+            "(lowercase letters, numbers, and hyphens only). "
+            "Examples: 'my-session', 'agent-session-1', 'discussion-about-code'"
+        )
+def _get_subagent_sessions_dir() -> Path:
+    """Get the directory for storing subagent session data.
+    Returns:
+        Path to XDG data directory/subagent_sessions/
+    """
+    sessions_dir = Path(DATA_DIR) / "subagent_sessions"
+    sessions_dir.mkdir(parents=True, exist_ok=True, mode=0o700)
+    return sessions_dir
+def _save_session_history(
+    session_id: str,
+    message_history: List[ModelMessage],
+    agent_name: str,
+    initial_prompt: str | None = None,
+) -> None:
+    """Save session history to filesystem.
+    Args:
+        session_id: The session identifier (must be kebab-case)
+        message_history: List of messages to save
+        agent_name: Name of the agent being invoked
+        initial_prompt: The first prompt that started this session (for .txt metadata)
+    Raises:
+        ValueError: If session_id is not valid kebab-case format
+    """
+    # Validate session_id format before saving
+    _validate_session_id(session_id)
+    sessions_dir = _get_subagent_sessions_dir()
+    # Save pickle file with message history
+    pkl_path = sessions_dir / f"{session_id}.pkl"
+    with open(pkl_path, "wb") as f:
+        pickle.dump(message_history, f)
+    # Save or update txt file with metadata
+    txt_path = sessions_dir / f"{session_id}.txt"
+    if not txt_path.exists() and initial_prompt:
+        # Only write initial metadata on first save
+        metadata = {
+            "session_id": session_id,
+            "agent_name": agent_name,
+            "initial_prompt": initial_prompt,
+            "created_at": datetime.now().isoformat(),
+            "message_count": len(message_history),
+        }
+        with open(txt_path, "w") as f:
+            json.dump(metadata, f, indent=2)
+    elif txt_path.exists():
+        # Update message count on subsequent saves
+        try:
+            with open(txt_path, "r") as f:
+                metadata = json.load(f)
+            metadata["message_count"] = len(message_history)
+            metadata["last_updated"] = datetime.now().isoformat()
+            with open(txt_path, "w") as f:
+                json.dump(metadata, f, indent=2)
+        except Exception:
+            pass  # If we can't update metadata, no big deal
+def _load_session_history(session_id: str) -> List[ModelMessage]:
+    """Load session history from filesystem.
+    Args:
+        session_id: The session identifier (must be kebab-case)
+    Returns:
+        List of ModelMessage objects, or empty list if session doesn't exist
+    Raises:
+        ValueError: If session_id is not valid kebab-case format
+    """
+    # Validate session_id format before loading
+    _validate_session_id(session_id)
+    sessions_dir = _get_subagent_sessions_dir()
+    pkl_path = sessions_dir / f"{session_id}.pkl"
+    if not pkl_path.exists():
+        return []
+    try:
+        with open(pkl_path, "rb") as f:
+            return pickle.load(f)
+    except Exception:
+        # If pickle is corrupted or incompatible, return empty history
+        return []
 class AgentInfo(BaseModel):
@@ -24,6 +211,7 @@ class AgentInfo(BaseModel):
     name: str
     display_name: str
+    description: str
 class ListAgentsOutput(BaseModel):
@@ -38,6 +226,7 @@ class AgentInvokeOutput(BaseModel):
     response: str | None
     agent_name: str
+    session_id: str | None = None
     error: str | None = None
@@ -58,36 +247,50 @@ def register_list_agents(agent):
         # Generate a group ID for this tool execution
         group_id = generate_group_id("list_agents")
+        from rich.text import Text
+        from code_puppy.config import get_banner_color
+        list_agents_color = get_banner_color("list_agents")
         emit_info(
-            "\n[bold white on blue] LIST AGENTS [/bold white on blue]",
+            Text.from_markup(
+                f"\n[bold white on {list_agents_color}] LIST AGENTS [/bold white on {list_agents_color}]"
+            ),
             message_group=group_id,
         )
-        emit_divider(message_group=group_id)
         try:
-            # Get available agents from the agent manager
+            from code_puppy.agents import get_agent_descriptions, get_available_agents
+            # Get available agents and their descriptions from the agent manager
             agents_dict = get_available_agents()
+            descriptions_dict = get_agent_descriptions()
             # Convert to list of AgentInfo objects
             agents = [
-                AgentInfo(name=name, display_name=display_name)
+                AgentInfo(
+                    name=name,
+                    display_name=display_name,
+                    description=descriptions_dict.get(name, "No description available"),
+                )
                 for name, display_name in agents_dict.items()
             ]
-            # Display the agents in the console
+            # Accumulate output into a single string and emit once
+            # Use Text.from_markup() to pass a Rich object that won't be escaped
+            lines = []
             for agent_item in agents:
-                emit_system_message(
-                    f"- [bold]{agent_item.name}[/bold]: {agent_item.display_name}",
-                    message_group=group_id,
+                lines.append(
+                    f"- [bold]{agent_item.name}[/bold]: {agent_item.display_name}\n"
+                    f"  [dim]{agent_item.description}[/dim]"
                 )
+            emit_info(Text.from_markup("\n".join(lines)), message_group=group_id)
-            emit_divider(message_group=group_id)
             return ListAgentsOutput(agents=agents)
         except Exception as e:
             error_msg = f"Error listing agents: {str(e)}"
             emit_error(error_msg, message_group=group_id)
-            emit_divider(message_group=group_id)
             return ListAgentsOutput(agents=[], error=error_msg)
     return list_agents
@@ -101,35 +304,162 @@ def register_invoke_agent(agent):
     """
     @agent.tool
-    def invoke_agent(
-        context: RunContext, agent_name: str, prompt: str
+    async def invoke_agent(
+        context: RunContext, agent_name: str, prompt: str, session_id: str | None = None
     ) -> AgentInvokeOutput:
         """Invoke a specific sub-agent with a given prompt.
         Args:
             agent_name: The name of the agent to invoke
             prompt: The prompt to send to the agent
+            session_id: Optional session ID for maintaining conversation memory across invocations.
+                       **Session ID Format:**
+                       - Must be kebab-case (lowercase letters, numbers, hyphens only)
+                       - Should be human-readable: e.g., "implement-oauth", "review-auth"
+                       - For NEW sessions, a SHA1 hash suffix is automatically appended for uniqueness
+                       - To CONTINUE a session, use the full session_id (with hash) from the previous invocation
+                       - If None (default), auto-generates like "agent-name-session-1"
+                       **When to use session_id:**
+                       - **NEW SESSION**: Provide a base name like "review-auth" - we'll append a unique hash
+                       - **CONTINUE SESSION**: Use the full session_id from output (e.g., "review-auth-a3f2b1")
+                       - **ONE-OFF TASKS**: Leave as None (auto-generate)
+                       **Most common pattern:** Leave session_id as None (auto-generate) unless you
+                       specifically need conversational memory.
         Returns:
-            AgentInvokeOutput: The agent's response to the prompt
+            AgentInvokeOutput: Contains:
+                - response (str | None): The agent's response to the prompt
+                - agent_name (str): Name of the invoked agent
+                - session_id (str | None): The full session ID (with hash suffix) - USE THIS to continue the conversation!
+                - error (str | None): Error message if invocation failed
+        Examples:
+            # COMMON CASE: One-off invocation, no memory needed (auto-generate session)
+            result = invoke_agent(
+                "qa-expert",
+                "Review this function: def add(a, b): return a + b"
+            )
+            # result.session_id will be something like "qa-expert-session-a3f2b1"
+            # MULTI-TURN: Start a NEW conversation with a base session ID
+            # A hash suffix is auto-appended: "review-add-function" -> "review-add-function-a3f2b1"
+            result1 = invoke_agent(
+                "qa-expert",
+                "Review this function: def add(a, b): return a + b",
+                session_id="review-add-function"
+            )
+            # result1.session_id contains the full ID like "review-add-function-a3f2b1"
+            # Continue the SAME conversation using session_id from the previous result
+            result2 = invoke_agent(
+                "qa-expert",
+                "Can you suggest edge cases for that function?",
+                session_id=result1.session_id  # Use the session_id from previous output!
+            )
+            # Multiple INDEPENDENT reviews (each gets unique hash suffix)
+            auth_review = invoke_agent(
+                "code-reviewer",
+                "Review my authentication code",
+                session_id="auth-review"  # -> "auth-review-<hash1>"
+            )
+            # auth_review.session_id contains the full ID to continue this review
+            payment_review = invoke_agent(
+                "code-reviewer",
+                "Review my payment processing code",
+                session_id="payment-review"  # -> "payment-review-<hash2>"
+            )
+            # payment_review.session_id contains a different full ID
         """
+        from code_puppy.agents.agent_manager import load_agent
+        # Validate user-provided session_id if given
+        if session_id is not None:
+            try:
+                _validate_session_id(session_id)
+            except ValueError as e:
+                # Return error immediately if session_id is invalid
+                group_id = generate_group_id("invoke_agent", agent_name)
+                emit_error(str(e), message_group=group_id)
+                return AgentInvokeOutput(
+                    response=None, agent_name=agent_name, error=str(e)
+                )
         # Generate a group ID for this tool execution
         group_id = generate_group_id("invoke_agent", agent_name)
-        emit_info(
-            f"\n[bold white on blue] INVOKE AGENT [/bold white on blue] {agent_name}",
-            message_group=group_id,
+        # Check if this is an existing session or a new one
+        # For user-provided session_id, check if it exists
+        # For None, we'll generate a new one below
+        if session_id is not None:
+            message_history = _load_session_history(session_id)
+            is_new_session = len(message_history) == 0
+        else:
+            message_history = []
+            is_new_session = True
+        # Generate or finalize session_id
+        if session_id is None:
+            # Auto-generate a session ID with hash suffix for uniqueness
+            # Example: "qa-expert-session-a3f2b1"
+            hash_suffix = _generate_session_hash_suffix()
+            session_id = f"{agent_name}-session-{hash_suffix}"
+        elif is_new_session:
+            # User provided a base name for a NEW session - append hash suffix
+            # Example: "review-auth" -> "review-auth-a3f2b1"
+            hash_suffix = _generate_session_hash_suffix()
+            session_id = f"{session_id}-{hash_suffix}"
+        # else: continuing existing session, use session_id as-is
+        # Lazy imports to avoid circular dependency
+        from code_puppy.agents.subagent_stream_handler import subagent_stream_handler
+        # Emit structured invocation message via MessageBus
+        bus = get_message_bus()
+        bus.emit(
+            SubAgentInvocationMessage(
+                agent_name=agent_name,
+                session_id=session_id,
+                prompt=prompt,
+                is_new_session=is_new_session,
+                message_count=len(message_history),
+            )
+        )
+        # Save current session context and set the new one for this sub-agent
+        previous_session_id = get_session_context()
+        set_session_context(session_id)
+        # Set terminal session for browser-based terminal tools
+        # This uses contextvars which properly propagate through async tasks
+        from code_puppy.tools.browser.terminal_tools import (
+            _terminal_session_var,
+            set_terminal_session,
+        )
+        terminal_session_token = set_terminal_session(f"terminal-{session_id}")
+        # Set browser session for browser tools (qa-kitten, etc.)
+        # This allows parallel agent invocations to each have their own browser
+        from code_puppy.tools.browser.browser_manager import (
+            set_browser_session,
         )
-        emit_divider(message_group=group_id)
-        emit_system_message(f"Prompt: {prompt}", message_group=group_id)
-        emit_divider(message_group=group_id)
+        browser_session_token = set_browser_session(f"browser-{session_id}")
         try:
+            # Lazy import to break circular dependency with messaging module
+            from code_puppy.model_factory import ModelFactory, make_model_settings
             # Load the specified agent config
-            agent_config = load_agent_config(agent_name)
+            agent_config = load_agent(agent_name)
             # Get the current model for creating a temporary agent
-            model_name = get_model_name()
+            model_name = agent_config.get_model_name()
             models_config = ModelFactory.load_config()
             # Only proceed if we have a valid model configuration
@@ -140,36 +470,205 @@ def register_invoke_agent(agent):
             # Create a temporary agent instance to avoid interfering with current agent state
             instructions = agent_config.get_system_prompt()
-            temp_agent = Agent(
-                model=model,
-                instructions=instructions,
-                output_type=str,
-                retries=3,
+            # Add AGENTS.md content to subagents
+            puppy_rules = agent_config.load_puppy_rules()
+            if puppy_rules:
+                instructions += f"\n\n{puppy_rules}"
+            # Apply prompt additions (like file permission handling) to temporary agents
+            from code_puppy import callbacks
+            from code_puppy.model_utils import prepare_prompt_for_model
+            prompt_additions = callbacks.on_load_prompt()
+            if len(prompt_additions):
+                instructions += "\n" + "\n".join(prompt_additions)
+            # Handle claude-code models: swap instructions, and prepend system prompt only on first message
+            prepared = prepare_prompt_for_model(
+                model_name,
+                instructions,
+                prompt,
+                prepend_system_to_user=is_new_session,  # Only prepend on first message
             )
+            instructions = prepared.instructions
+            prompt = prepared.user_prompt
+            subagent_name = f"temp-invoke-agent-{session_id}"
+            model_settings = make_model_settings(model_name)
+            # Get MCP servers for sub-agents (same as main agent)
+            from code_puppy.mcp_ import get_mcp_manager
+            mcp_servers = []
+            mcp_disabled = get_value("disable_mcp_servers")
+            if not (
+                mcp_disabled and str(mcp_disabled).lower() in ("1", "true", "yes", "on")
+            ):
+                manager = get_mcp_manager()
+                mcp_servers = manager.get_servers_for_agent()
+            if get_use_dbos():
+                from pydantic_ai.durable_exec.dbos import DBOSAgent
+                # For DBOS, create agent without MCP servers (to avoid serialization issues)
+                # and add them at runtime
+                temp_agent = Agent(
+                    model=model,
+                    instructions=instructions,
+                    output_type=str,
+                    retries=3,
+                    toolsets=[],  # MCP servers added separately for DBOS
+                    history_processors=[agent_config.message_history_accumulator],
+                    model_settings=model_settings,
+                )
+                # Register the tools that the agent needs
+                from code_puppy.tools import register_tools_for_agent
-            # Register the tools that the agent needs
-            from code_puppy.tools import register_tools_for_agent
+                agent_tools = agent_config.get_available_tools()
+                register_tools_for_agent(temp_agent, agent_tools)
-            agent_tools = agent_config.get_available_tools()
-            register_tools_for_agent(temp_agent, agent_tools)
+                # Wrap with DBOS - no streaming for sub-agents
+                dbos_agent = DBOSAgent(
+                    temp_agent,
+                    name=subagent_name,
+                )
+                temp_agent = dbos_agent
+                # Store MCP servers to add at runtime
+                subagent_mcp_servers = mcp_servers
+            else:
+                # Non-DBOS path - include MCP servers directly in the agent
+                temp_agent = Agent(
+                    model=model,
+                    instructions=instructions,
+                    output_type=str,
+                    retries=3,
+                    toolsets=mcp_servers,
+                    history_processors=[agent_config.message_history_accumulator],
+                    model_settings=model_settings,
+                )
-            # Run the temporary agent with the provided prompt
-            result = temp_agent.run_sync(prompt)
+                # Register the tools that the agent needs
+                from code_puppy.tools import register_tools_for_agent
+                agent_tools = agent_config.get_available_tools()
+                register_tools_for_agent(temp_agent, agent_tools)
+                subagent_mcp_servers = None
+            # Run the temporary agent with the provided prompt as an asyncio task
+            # Pass the message_history from the session to continue the conversation
+            workflow_id = None  # Track for potential cancellation
+            # Always use subagent_stream_handler to silence output and update console manager
+            # This ensures all sub-agent output goes through the aggregated dashboard
+            stream_handler = partial(subagent_stream_handler, session_id=session_id)
+            # Wrap the agent run in subagent context for tracking
+            with subagent_context(agent_name):
+                if get_use_dbos():
+                    # Generate a unique workflow ID for DBOS - ensures no collisions in back-to-back calls
+                    workflow_id = _generate_dbos_workflow_id(group_id)
+                    # Add MCP servers to the DBOS agent's toolsets
+                    # (temp_agent is discarded after this invocation, so no need to restore)
+                    if subagent_mcp_servers:
+                        temp_agent._toolsets = (
+                            temp_agent._toolsets + subagent_mcp_servers
+                        )
+                    with SetWorkflowID(workflow_id):
+                        task = asyncio.create_task(
+                            temp_agent.run(
+                                prompt,
+                                message_history=message_history,
+                                usage_limits=UsageLimits(
+                                    request_limit=get_message_limit()
+                                ),
+                                event_stream_handler=stream_handler,
+                            )
+                        )
+                        _active_subagent_tasks.add(task)
+                else:
+                    task = asyncio.create_task(
+                        temp_agent.run(
+                            prompt,
+                            message_history=message_history,
+                            usage_limits=UsageLimits(request_limit=get_message_limit()),
+                            event_stream_handler=stream_handler,
+                        )
+                    )
+                    _active_subagent_tasks.add(task)
+                try:
+                    result = await task
+                finally:
+                    _active_subagent_tasks.discard(task)
+                    if task.cancelled():
+                        if get_use_dbos() and workflow_id:
+                            DBOS.cancel_workflow(workflow_id)
             # Extract the response from the result
             response = result.output
-            emit_system_message(f"Response: {response}", message_group=group_id)
-            emit_divider(message_group=group_id)
+            # Update the session history with the new messages from this interaction
+            # The result contains all_messages which includes the full conversation
+            updated_history = result.all_messages()
-            return AgentInvokeOutput(response=response, agent_name=agent_name)
+            # Save to filesystem (include initial prompt only for new sessions)
+            _save_session_history(
+                session_id=session_id,
+                message_history=updated_history,
+                agent_name=agent_name,
+                initial_prompt=prompt if is_new_session else None,
+            )
+            # Emit structured response message via MessageBus
+            bus.emit(
+                SubAgentResponseMessage(
+                    agent_name=agent_name,
+                    session_id=session_id,
+                    response=response,
+                    message_count=len(updated_history),
+                )
+            )
+            # Emit clean completion summary
+            emit_success(
+                f"✓ {agent_name} completed successfully", message_group=group_id
+            )
+            return AgentInvokeOutput(
+                response=response, agent_name=agent_name, session_id=session_id
+            )
         except Exception as e:
-            error_msg = f"Error invoking agent '{agent_name}': {str(e)}"
+            # Emit clean failure summary
+            emit_error(f"✗ {agent_name} failed: {str(e)}", message_group=group_id)
+            # Full traceback for debugging
+            error_msg = f"Error invoking agent '{agent_name}': {traceback.format_exc()}"
             emit_error(error_msg, message_group=group_id)
-            emit_divider(message_group=group_id)
             return AgentInvokeOutput(
-                response=None, agent_name=agent_name, error=error_msg
+                response=None,
+                agent_name=agent_name,
+                session_id=session_id,
+                error=error_msg,
             )
+        finally:
+            # Restore the previous session context
+            set_session_context(previous_session_id)
+            # Reset terminal session context
+            _terminal_session_var.reset(terminal_session_token)
+            # Reset browser session context
+            from code_puppy.tools.browser.browser_manager import (
+                _browser_session_var,
+            )
+            _browser_session_var.reset(browser_session_token)
     return invoke_agent

code-puppy 0.0.169__py3-none-any.whl → 0.0.366__py3-none-any.whl

code-puppy 0.0.169py3-none-any.whl → 0.0.366py3-none-any.whl