PyPI - emdash-core - Versions diffs - 0.1.33__py3-none-any.whl → 0.1.37__py3-none-any.whl - Mend

emdash-core 0.1.33__py3-none-any.whl → 0.1.37__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (20)

emdash_core/agent/agents.py +84 -23
emdash_core/agent/hooks.py +419 -0
emdash_core/agent/inprocess_subagent.py +44 -9
emdash_core/agent/prompts/main_agent.py +35 -0
emdash_core/agent/prompts/subagents.py +24 -8
emdash_core/agent/prompts/workflow.py +37 -23
emdash_core/agent/runner/agent_runner.py +12 -0
emdash_core/agent/runner/context.py +28 -9
emdash_core/agent/toolkits/__init__.py +117 -18
emdash_core/agent/toolkits/base.py +87 -2
emdash_core/agent/toolkits/explore.py +18 -0
emdash_core/agent/toolkits/plan.py +18 -0
emdash_core/agent/tools/task.py +11 -4
emdash_core/api/agent.py +154 -3
emdash_core/ingestion/repository.py +17 -198
emdash_core/models/agent.py +4 -0
{emdash_core-0.1.33.dist-info → emdash_core-0.1.37.dist-info}/METADATA +3 -1
{emdash_core-0.1.33.dist-info → emdash_core-0.1.37.dist-info}/RECORD +20 -19
{emdash_core-0.1.33.dist-info → emdash_core-0.1.37.dist-info}/WHEEL +0 -0
{emdash_core-0.1.33.dist-info → emdash_core-0.1.37.dist-info}/entry_points.txt +0 -0

emdash_core/agent/agents.py CHANGED

@@ -2,16 +2,74 @@
 Allows users to define custom agent configurations with
 specialized system prompts and tool selections.
+Example agent file:
+```markdown
+---
+description: GitHub integration agent
+model: claude-sonnet-4-20250514
+tools: [grep, glob, read_file]
+mcp_servers:
+  github:
+    command: github-mcp-server
+    args: []
+    env:
+      GITHUB_TOKEN: ${GITHUB_TOKEN}
+    enabled: true
+  filesystem:
+    command: npx
+    args: [-y, "@anthropic/mcp-server-filesystem", "/tmp"]
+    enabled: false  # Disabled - won't be started
+---
+# System Prompt
+You are a GitHub integration specialist...
+```
 """
 from dataclasses import dataclass, field
 from pathlib import Path
-from typing import Optional
+from typing import Any, Optional
 import re
+import yaml
 from ..utils.logger import log
+@dataclass
+class AgentMCPServerConfig:
+    """MCP server configuration for a custom agent.
+    Attributes:
+        name: Server name (key in mcp_servers dict)
+        command: Command to run the server
+        args: Arguments to pass to the command
+        env: Environment variables (supports ${VAR} syntax)
+        enabled: Whether this server is enabled (default: True)
+        timeout: Timeout in seconds for tool calls
+    """
+    name: str
+    command: str
+    args: list[str] = field(default_factory=list)
+    env: dict[str, str] = field(default_factory=dict)
+    enabled: bool = True
+    timeout: int = 30
+    @classmethod
+    def from_dict(cls, name: str, data: dict[str, Any]) -> "AgentMCPServerConfig":
+        """Create from dictionary parsed from YAML."""
+        return cls(
+            name=name,
+            command=data.get("command", ""),
+            args=data.get("args", []),
+            env=data.get("env", {}),
+            enabled=data.get("enabled", True),
+            timeout=data.get("timeout", 30),
+        )
 @dataclass
 class CustomAgent:
     """A custom agent configuration loaded from markdown.
@@ -19,16 +77,20 @@ class CustomAgent:
     Attributes:
         name: Agent name (from filename)
         description: Brief description
+        model: Model to use for this agent (optional, uses default if not set)
         system_prompt: Custom system prompt
         tools: List of tools to enable
+        mcp_servers: MCP server configurations for this agent
         examples: Example interactions
         file_path: Source file path
     """
     name: str
     description: str = ""
+    model: Optional[str] = None
     system_prompt: str = ""
     tools: list[str] = field(default_factory=list)
+    mcp_servers: list[AgentMCPServerConfig] = field(default_factory=list)
     examples: list[dict] = field(default_factory=list)
     file_path: Optional[Path] = None
@@ -121,46 +183,45 @@ def _parse_agent_file(file_path: Path) -> Optional[CustomAgent]:
     if system_prompt.startswith("# System Prompt"):
         system_prompt = system_prompt[len("# System Prompt") :].strip()
+    # Parse MCP servers from frontmatter
+    mcp_servers = []
+    mcp_servers_data = frontmatter.get("mcp_servers", {})
+    if isinstance(mcp_servers_data, dict):
+        for server_name, server_config in mcp_servers_data.items():
+            if isinstance(server_config, dict):
+                mcp_servers.append(
+                    AgentMCPServerConfig.from_dict(server_name, server_config)
+                )
     return CustomAgent(
         name=file_path.stem,
         description=frontmatter.get("description", ""),
+        model=frontmatter.get("model"),
         system_prompt=system_prompt,
         tools=frontmatter.get("tools", []),
+        mcp_servers=mcp_servers,
         examples=examples,
         file_path=file_path,
     )
 def _parse_frontmatter(frontmatter_str: str) -> dict:
-    """Parse YAML-like frontmatter.
+    """Parse YAML frontmatter.
-    Simple parser for key: value pairs.
+    Uses PyYAML for proper nested structure parsing.
     Args:
-        frontmatter_str: Frontmatter string
+        frontmatter_str: Frontmatter string (YAML format)
     Returns:
         Dict of parsed values
     """
-    result = {}
-    for line in frontmatter_str.strip().split("\n"):
-        if ":" not in line:
-            continue
-        key, value = line.split(":", 1)
-        key = key.strip()
-        value = value.strip()
-        # Parse list values
-        if value.startswith("[") and value.endswith("]"):
-            # Simple list parsing
-            items = value[1:-1].split(",")
-            result[key] = [item.strip().strip("'\"") for item in items if item.strip()]
-        else:
-            result[key] = value.strip("'\"")
-    return result
+    try:
+        result = yaml.safe_load(frontmatter_str)
+        return result if isinstance(result, dict) else {}
+    except yaml.YAMLError as e:
+        log.warning(f"Failed to parse frontmatter as YAML: {e}")
+        return {}
 def _parse_examples(examples_str: str) -> list[dict]:

emdash_core/agent/hooks.py ADDED

@@ -0,0 +1,419 @@
+"""Hook system for running commands on agent events.
+Hooks allow users to run shell commands when specific events occur
+during agent execution. Hooks are configured per-project in
+.emdash/hooks.json and run asynchronously (non-blocking).
+Example .emdash/hooks.json:
+{
+  "hooks": [
+    {
+      "id": "notify-done",
+      "event": "session_end",
+      "command": "notify-send 'Agent finished'",
+      "enabled": true
+    }
+  ]
+}
+"""
+from dataclasses import dataclass, field, asdict
+from enum import Enum
+from pathlib import Path
+from typing import Any
+import json
+import os
+import subprocess
+import threading
+from .events import AgentEvent, EventHandler, EventType
+from ..utils.logger import log
+class HookEventType(str, Enum):
+    """Event types that can trigger hooks.
+    This is a subset of EventType exposed for hook configuration.
+    """
+    TOOL_START = "tool_start"
+    TOOL_RESULT = "tool_result"
+    SESSION_START = "session_start"
+    SESSION_END = "session_end"
+    RESPONSE = "response"
+    ERROR = "error"
+    @classmethod
+    def from_event_type(cls, event_type: EventType) -> "HookEventType | None":
+        """Convert an EventType to HookEventType if mappable."""
+        mapping = {
+            EventType.TOOL_START: cls.TOOL_START,
+            EventType.TOOL_RESULT: cls.TOOL_RESULT,
+            EventType.SESSION_START: cls.SESSION_START,
+            EventType.SESSION_END: cls.SESSION_END,
+            EventType.RESPONSE: cls.RESPONSE,
+            EventType.ERROR: cls.ERROR,
+        }
+        return mapping.get(event_type)
+@dataclass
+class HookEventData:
+    """Data passed to hook commands via stdin as JSON.
+    Attributes:
+        event: The event type that triggered the hook
+        timestamp: ISO format timestamp of when the event occurred
+        session_id: The session ID (if available)
+        # Tool-specific fields (for tool_start, tool_result)
+        tool_name: Name of the tool being executed
+        tool_args: Arguments passed to the tool (tool_start only)
+        tool_result: Result summary from the tool (tool_result only)
+        tool_success: Whether the tool succeeded (tool_result only)
+        tool_error: Error message if tool failed (tool_result only)
+        # Response fields (for response event)
+        response_text: The response content
+        # Session fields
+        goal: The goal/query for the session (session_start only)
+        success: Whether the session completed successfully (session_end only)
+        # Error fields
+        error_message: Error message (error event only)
+        error_details: Additional error details (error event only)
+    """
+    event: str
+    timestamp: str
+    session_id: str | None = None
+    # Tool fields
+    tool_name: str | None = None
+    tool_args: dict[str, Any] | None = None
+    tool_result: str | None = None
+    tool_success: bool | None = None
+    tool_error: str | None = None
+    # Response fields
+    response_text: str | None = None
+    # Session fields
+    goal: str | None = None
+    success: bool | None = None
+    # Error fields
+    error_message: str | None = None
+    error_details: str | None = None
+    def to_json(self) -> str:
+        """Convert to JSON string, excluding None values."""
+        data = {k: v for k, v in asdict(self).items() if v is not None}
+        return json.dumps(data)
+    def to_env_vars(self) -> dict[str, str]:
+        """Convert to environment variables for quick access.
+        Returns a dict of EMDASH_* prefixed env vars.
+        """
+        env = {
+            "EMDASH_EVENT": self.event,
+            "EMDASH_TIMESTAMP": self.timestamp,
+        }
+        if self.session_id:
+            env["EMDASH_SESSION_ID"] = self.session_id
+        if self.tool_name:
+            env["EMDASH_TOOL_NAME"] = self.tool_name
+        if self.tool_success is not None:
+            env["EMDASH_TOOL_SUCCESS"] = str(self.tool_success).lower()
+        if self.goal:
+            env["EMDASH_GOAL"] = self.goal
+        if self.success is not None:
+            env["EMDASH_SUCCESS"] = str(self.success).lower()
+        if self.error_message:
+            env["EMDASH_ERROR"] = self.error_message
+        return env
+@dataclass
+class HookConfig:
+    """Configuration for a single hook.
+    Attributes:
+        id: Unique identifier for the hook
+        event: Event type that triggers this hook
+        command: Shell command to execute
+        enabled: Whether the hook is active
+    """
+    id: str
+    event: HookEventType
+    command: str
+    enabled: bool = True
+    def to_dict(self) -> dict[str, Any]:
+        """Convert to dictionary for JSON serialization."""
+        return {
+            "id": self.id,
+            "event": self.event.value,
+            "command": self.command,
+            "enabled": self.enabled,
+        }
+    @classmethod
+    def from_dict(cls, data: dict[str, Any]) -> "HookConfig":
+        """Create from dictionary."""
+        return cls(
+            id=data["id"],
+            event=HookEventType(data["event"]),
+            command=data["command"],
+            enabled=data.get("enabled", True),
+        )
+@dataclass
+class HooksFile:
+    """The .emdash/hooks.json file structure.
+    Attributes:
+        hooks: List of hook configurations
+    """
+    hooks: list[HookConfig] = field(default_factory=list)
+    def to_dict(self) -> dict[str, Any]:
+        """Convert to dictionary for JSON serialization."""
+        return {
+            "hooks": [h.to_dict() for h in self.hooks],
+        }
+    @classmethod
+    def from_dict(cls, data: dict[str, Any]) -> "HooksFile":
+        """Create from dictionary."""
+        hooks = [HookConfig.from_dict(h) for h in data.get("hooks", [])]
+        return cls(hooks=hooks)
+class HookManager:
+    """Manages hook loading, execution, and configuration.
+    Hooks are loaded from .emdash/hooks.json and executed asynchronously
+    when matching events occur.
+    """
+    def __init__(self, repo_root: Path | None = None):
+        """Initialize the hook manager.
+        Args:
+            repo_root: Root directory of the repository.
+                      Defaults to current working directory.
+        """
+        self._repo_root = repo_root or Path.cwd()
+        self._hooks_file = self._repo_root / ".emdash" / "hooks.json"
+        self._hooks: list[HookConfig] = []
+        self._session_id: str | None = None
+        self._load_hooks()
+    @property
+    def hooks_file_path(self) -> Path:
+        """Get the path to the hooks file."""
+        return self._hooks_file
+    def set_session_id(self, session_id: str | None) -> None:
+        """Set the current session ID for event data."""
+        self._session_id = session_id
+    def _load_hooks(self) -> None:
+        """Load hooks from .emdash/hooks.json."""
+        if not self._hooks_file.exists():
+            self._hooks = []
+            return
+        try:
+            data = json.loads(self._hooks_file.read_text())
+            hooks_file = HooksFile.from_dict(data)
+            self._hooks = hooks_file.hooks
+            log.debug(f"Loaded {len(self._hooks)} hooks from {self._hooks_file}")
+        except Exception as e:
+            log.warning(f"Failed to load hooks: {e}")
+            self._hooks = []
+    def reload(self) -> None:
+        """Reload hooks from disk."""
+        self._load_hooks()
+    def get_hooks(self) -> list[HookConfig]:
+        """Get all configured hooks."""
+        return self._hooks.copy()
+    def get_enabled_hooks(self, event: HookEventType) -> list[HookConfig]:
+        """Get enabled hooks for a specific event type."""
+        return [h for h in self._hooks if h.enabled and h.event == event]
+    def add_hook(self, hook: HookConfig) -> None:
+        """Add a new hook and save to disk."""
+        # Check for duplicate ID
+        if any(h.id == hook.id for h in self._hooks):
+            raise ValueError(f"Hook with id '{hook.id}' already exists")
+        self._hooks.append(hook)
+        self._save_hooks()
+    def remove_hook(self, hook_id: str) -> bool:
+        """Remove a hook by ID. Returns True if removed."""
+        for i, h in enumerate(self._hooks):
+            if h.id == hook_id:
+                self._hooks.pop(i)
+                self._save_hooks()
+                return True
+        return False
+    def toggle_hook(self, hook_id: str) -> bool | None:
+        """Toggle a hook's enabled state. Returns new state or None if not found."""
+        for h in self._hooks:
+            if h.id == hook_id:
+                h.enabled = not h.enabled
+                self._save_hooks()
+                return h.enabled
+        return None
+    def _save_hooks(self) -> None:
+        """Save hooks to .emdash/hooks.json."""
+        self._hooks_file.parent.mkdir(parents=True, exist_ok=True)
+        hooks_file = HooksFile(hooks=self._hooks)
+        self._hooks_file.write_text(
+            json.dumps(hooks_file.to_dict(), indent=2) + "\n"
+        )
+        log.debug(f"Saved {len(self._hooks)} hooks to {self._hooks_file}")
+    def _build_event_data(self, event: AgentEvent, hook_event: HookEventType) -> HookEventData:
+        """Build HookEventData from an AgentEvent."""
+        data = HookEventData(
+            event=hook_event.value,
+            timestamp=event.timestamp.isoformat(),
+            session_id=self._session_id,
+        )
+        # Populate event-specific fields
+        if hook_event == HookEventType.TOOL_START:
+            data.tool_name = event.data.get("name")
+            data.tool_args = event.data.get("args")
+        elif hook_event == HookEventType.TOOL_RESULT:
+            data.tool_name = event.data.get("name")
+            data.tool_success = event.data.get("success")
+            data.tool_result = event.data.get("summary")
+            if not data.tool_success:
+                data.tool_error = event.data.get("data", {}).get("error")
+        elif hook_event == HookEventType.SESSION_START:
+            data.goal = event.data.get("goal")
+        elif hook_event == HookEventType.SESSION_END:
+            data.success = event.data.get("success")
+        elif hook_event == HookEventType.RESPONSE:
+            data.response_text = event.data.get("content")
+        elif hook_event == HookEventType.ERROR:
+            data.error_message = event.data.get("message")
+            data.error_details = event.data.get("details")
+        return data
+    def _execute_hook_async(self, hook: HookConfig, event_data: HookEventData) -> None:
+        """Execute a hook command asynchronously (fire and forget)."""
+        def run():
+            try:
+                env = os.environ.copy()
+                env.update(event_data.to_env_vars())
+                process = subprocess.Popen(
+                    hook.command,
+                    shell=True,
+                    stdin=subprocess.PIPE,
+                    stdout=subprocess.PIPE,
+                    stderr=subprocess.PIPE,
+                    env=env,
+                    cwd=str(self._repo_root),
+                )
+                # Send JSON data to stdin
+                json_data = event_data.to_json()
+                assert process.stdin is not None
+                process.stdin.write(json_data.encode())
+                process.stdin.close()
+                # Don't wait for completion - fire and forget
+                # But log if there's an error
+                def log_completion():
+                    _, stderr = process.communicate(timeout=30)
+                    if process.returncode != 0:
+                        log.warning(
+                            f"Hook '{hook.id}' exited with code {process.returncode}: "
+                            f"{stderr.decode()[:200]}"
+                        )
+                # Run completion logging in another thread to not block
+                completion_thread = threading.Thread(target=log_completion, daemon=True)
+                completion_thread.start()
+            except Exception as e:
+                log.warning(f"Failed to execute hook '{hook.id}': {e}")
+        thread = threading.Thread(target=run, daemon=True)
+        thread.start()
+    def trigger(self, event: AgentEvent) -> None:
+        """Trigger hooks for an event.
+        Called by the event system when events occur.
+        """
+        hook_event = HookEventType.from_event_type(event.type)
+        if hook_event is None:
+            return
+        hooks = self.get_enabled_hooks(hook_event)
+        if not hooks:
+            return
+        event_data = self._build_event_data(event, hook_event)
+        for hook in hooks:
+            log.debug(f"Triggering hook '{hook.id}' for event '{hook_event.value}'")
+            self._execute_hook_async(hook, event_data)
+class HookHandler(EventHandler):
+    """Event handler that triggers hooks.
+    Add this handler to an AgentEventEmitter to enable hooks.
+    """
+    def __init__(self, manager: HookManager):
+        """Initialize with a hook manager.
+        Args:
+            manager: The HookManager to use for triggering hooks
+        """
+        self._manager = manager
+    def handle(self, event: AgentEvent) -> None:
+        """Handle an event by triggering matching hooks."""
+        self._manager.trigger(event)
+# Convenience functions
+_default_manager: HookManager | None = None
+def get_hook_manager(repo_root: Path | None = None) -> HookManager:
+    """Get or create the default hook manager."""
+    global _default_manager
+    if _default_manager is None:
+        _default_manager = HookManager(repo_root)
+    return _default_manager
+def reset_hook_manager() -> None:
+    """Reset the default hook manager (for testing)."""
+    global _default_manager
+    _default_manager = None

emdash_core/agent/inprocess_subagent.py CHANGED

@@ -16,6 +16,12 @@ from .toolkits import get_toolkit
 from .subagent_prompts import get_subagent_prompt
 from .providers import get_provider
 from .providers.factory import DEFAULT_MODEL
+from .context_manager import (
+    truncate_tool_output,
+    reduce_context_for_retry,
+    is_context_overflow_error,
+)
+from .runner.context import estimate_context_tokens
 from ..utils.logger import log
@@ -90,7 +96,7 @@ class InProcessSubAgent:
         self.provider = get_provider(model_name)
         # Get system prompt and inject thoroughness level
-        base_prompt = get_subagent_prompt(subagent_type)
+        base_prompt = get_subagent_prompt(subagent_type, repo_root=repo_root)
         self.system_prompt = self._inject_thoroughness(base_prompt)
         # Tracking
@@ -234,12 +240,39 @@ Now, your task:
                 log.debug(f"SubAgent {self.agent_id} turn {iterations}/{self.max_turns}")
-                # Call LLM
-                response = self.provider.chat(
-                    messages=messages,
-                    tools=self.toolkit.get_all_schemas(),
-                    system=self.system_prompt,
-                )
+                # Check context size and compact if needed
+                context_tokens = estimate_context_tokens(messages, self.system_prompt)
+                context_limit = self.provider.get_context_limit()
+                if context_tokens > context_limit * 0.8:
+                    log.info(
+                        f"SubAgent {self.agent_id} context at {context_tokens:,}/{context_limit:,} "
+                        f"({context_tokens/context_limit:.0%}), reducing..."
+                    )
+                    messages = reduce_context_for_retry(messages, keep_recent=6)
+                # Call LLM with retry on context overflow
+                response = None
+                max_retries = 2
+                for retry in range(max_retries + 1):
+                    try:
+                        response = self.provider.chat(
+                            messages=messages,
+                            tools=self.toolkit.get_all_schemas(),
+                            system=self.system_prompt,
+                        )
+                        break  # Success
+                    except Exception as e:
+                        if is_context_overflow_error(e) and retry < max_retries:
+                            log.warning(
+                                f"SubAgent {self.agent_id} context overflow on attempt {retry + 1}, reducing..."
+                            )
+                            messages = reduce_context_for_retry(messages, keep_recent=4 - retry)
+                        else:
+                            raise  # Re-raise if not overflow or out of retries
+                if response is None:
+                    raise RuntimeError("Failed to get response from LLM")
                 # Add assistant response
                 assistant_msg = self.provider.format_assistant_message(response)
@@ -283,10 +316,12 @@ Now, your task:
                         summary=summary,
                     )
-                    # Add tool result to messages
+                    # Add tool result to messages (truncated to avoid context overflow)
+                    tool_output = json.dumps(result.to_dict(), indent=2)
+                    tool_output = truncate_tool_output(tool_output, max_tokens=15000)
                     tool_result_msg = self.provider.format_tool_result(
                         tool_call.id,
-                        json.dumps(result.to_dict(), indent=2),
+                        tool_output,
                     )
                     if tool_result_msg:
                         messages.append(tool_result_msg)

emdash-core 0.1.33__py3-none-any.whl → 0.1.37__py3-none-any.whl

emdash-core 0.1.33__py3-none-any.whl → 0.1.37__py3-none-any.whl