npm - bone-agent - Versions diffs - 1.3.2 → 1.4.0 - Mend

bone-agent 1.3.2 → 1.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (87) hide show

package/README.md +19 -2
package/config.yaml.example +13 -2
package/package.json +3 -2
package/prompts/main/ask_questions.md +31 -0
package/prompts/main/batch_independent_calls.md +5 -0
package/prompts/main/casual_interactions.md +11 -0
package/prompts/main/code_references.md +8 -0
package/prompts/main/communication_style.md +12 -0
package/prompts/main/context_reliability.md +12 -0
package/prompts/main/conversational_tool_calling.md +15 -0
package/prompts/main/dream.md +50 -0
package/prompts/main/editing_pattern.md +13 -0
package/prompts/main/error_handling.md +6 -0
package/prompts/main/exploration_pattern.md +21 -0
package/prompts/main/intro.md +1 -0
package/prompts/main/obsidian.md +16 -0
package/prompts/main/obsidian_project.md +79 -0
package/prompts/main/professional_objectivity.md +3 -0
package/prompts/main/skills.md +3 -0
package/prompts/main/targeted_searching.md +10 -0
package/prompts/main/task_lists_pattern.md +8 -0
package/prompts/main/temp_folder.md +9 -0
package/prompts/main/think_before_acting.md +10 -0
package/prompts/main/tone_and_style.md +4 -0
package/prompts/main/tool_preferences.md +24 -0
package/prompts/main/trust_subagent_context.md +21 -0
package/prompts/main/when_to_use_sub_agent.md +7 -0
package/prompts/micro/ask_questions.md +1 -0
package/prompts/micro/batch_independent_calls.md +1 -0
package/prompts/micro/casual_interactions.md +1 -0
package/prompts/micro/code_references.md +1 -0
package/prompts/micro/communication_style.md +1 -0
package/prompts/micro/context_reliability.md +1 -0
package/prompts/micro/conversational_tool_calling.md +1 -0
package/prompts/micro/editing_pattern.md +1 -0
package/prompts/micro/error_handling.md +1 -0
package/prompts/micro/exploration_pattern.md +1 -0
package/prompts/micro/intro.md +1 -0
package/prompts/micro/obsidian.md +4 -0
package/prompts/micro/obsidian_project.md +5 -0
package/prompts/micro/professional_objectivity.md +1 -0
package/prompts/micro/skills.md +1 -0
package/prompts/micro/targeted_searching.md +1 -0
package/prompts/micro/task_lists_pattern.md +1 -0
package/prompts/micro/temp_folder.md +1 -0
package/prompts/micro/think_before_acting.md +5 -0
package/prompts/micro/tone_and_style.md +1 -0
package/prompts/micro/tool_preferences.md +1 -0
package/prompts/micro/trust_subagent_context.md +1 -0
package/prompts/micro/when_to_use_sub_agent.md +1 -0
package/src/core/agentic.py +134 -106
package/src/core/chat_manager.py +60 -12
package/src/core/config_manager.py +14 -1
package/src/core/cron.py +57 -6
package/src/core/memory.py +3 -90
package/src/core/metadata.py +75 -0
package/src/core/skills.py +463 -0
package/src/core/sub_agent.py +93 -43
package/src/core/tool_feedback.py +87 -76
package/src/llm/client.py +7 -2
package/src/llm/codex_provider.py +350 -0
package/src/llm/config.py +74 -4
package/src/llm/prompts.py +261 -502
package/src/llm/providers.py +28 -7
package/src/llm/token_tracker.py +32 -1
package/src/tools/__init__.py +24 -85
package/src/tools/create_file.py +1 -1
package/src/tools/directory.py +1 -1
package/src/tools/edit.py +13 -7
package/src/tools/file_reader.py +1 -1
package/src/tools/helpers/__init__.py +1 -7
package/src/tools/helpers/base.py +65 -16
package/src/tools/helpers/loader.py +2 -88
package/src/tools/helpers/path_resolver.py +70 -13
package/src/tools/helpers/plugin_manifest.py +99 -70
package/src/tools/review_sub_agent.py +2 -1
package/src/tools/rg_search.py +119 -35
package/src/tools/search_plugins.py +140 -72
package/src/tools/shell.py +3 -3
package/src/ui/commands.py +470 -33
package/src/ui/displays.py +27 -1
package/src/ui/main.py +1 -4
package/src/ui/tool_confirmation.py +16 -5
package/src/utils/editor.py +88 -39
package/src/utils/settings.py +25 -4
package/src/utils/user_message_logger.py +120 -0
package/src/utils/validation.py +10 -0

package/src/core/skills.py ADDED Viewed

@@ -0,0 +1,463 @@
+"""User skill storage and active session skill helpers."""
+from __future__ import annotations
+import logging
+import os
+import re
+import tempfile
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Callable, Generic, TypeVar
+import yaml
+logger = logging.getLogger(__name__)
+# Upper bound on the UTF-8 encoded size of a formatted skill file (32 KiB).
+MAX_SKILL_BYTES = 32 * 1024
+# Normalized skill names: 1-64 characters, lowercase letters/digits plus "_" and "-",
+# and the first character must be a letter or digit.
+SKILL_NAME_RE = re.compile(r"^[a-z0-9][a-z0-9_-]{0,63}$")
+# A single-line level-1 markdown heading; group 1 captures the heading text.
+_HEADING_RE = re.compile(r"^#\s+(.+?)\s*$")
+# A leading "---" delimited block at the very start of the text; group 1 captures
+# whatever sits between the two delimiter lines.
+_FRONTMATTER_RE = re.compile(r"^---\s*\n(.*?)\n---\s*\n", re.DOTALL)
+@dataclass
+class SkillSummary:
+    """Listing entry describing one stored skill file."""
+    # Validated, normalized skill name.
+    name: str
+    # Location of the skill's markdown file.
+    path: Path
+    # Short excerpt of the skill body shown in listings.
+    preview: str
+    # Modification timestamp of the file.
+    modified: float
+    # Description taken from the file's frontmatter; empty when absent.
+    description: str = ""
+    # Tags taken from the file's frontmatter; empty when absent.
+    tags: list[str] = field(default_factory=list)
+# Type of the payload carried by SearchCandidate and SearchMatch.
+T = TypeVar("T")
+@dataclass
+class SearchCandidate(Generic[T]):
+    """Searchable text bundled with the item it describes."""
+    # Object handed back to the caller when this candidate matches.
+    item: T
+    # Free text searched for the whole query and for each query term.
+    text: str
+    # Variant of the text intended for punctuation/whitespace-insensitive matching.
+    compact_text: str
+    # Primary identifier (for example a name) used for exact-match scoring; optional.
+    exact_text: str = ""
+@dataclass
+class SearchMatch(Generic[T]):
+    """A search result: the matched item together with its relevance score."""
+    # The payload of the candidate that matched.
+    item: T
+    # Relevance score; larger means more relevant.
+    score: float
+class SkillError(ValueError):
+    """Raised when a skill operation cannot be completed.
+    Subclasses ValueError, so callers catching ValueError also receive it.
+    """
+def get_skills_dir() -> Path:
+    """Resolve the directory that holds skill files.
+    A non-empty ``BONE_SKILLS_DIR`` environment variable takes precedence (user
+    home expanded, path resolved); otherwise ``~/.bone/skills`` is used.
+    """
+    configured = os.environ.get("BONE_SKILLS_DIR")
+    if not configured:
+        return Path.home() / ".bone" / "skills"
+    return Path(configured).expanduser().resolve()
+def ensure_skills_dir() -> Path:
+    """Make sure the skills directory exists and hand it back.
+    Missing parent directories are created; an existing directory is left as is.
+    """
+    skills_dir = get_skills_dir()
+    skills_dir.mkdir(exist_ok=True, parents=True)
+    return skills_dir
+def normalize_skill_name(raw: str) -> str:
+    """Turn user input into the canonical on-disk form of a skill name.
+    Surrounding whitespace is trimmed, letters are lowercased and inner spaces
+    become underscores. Falsy input yields an empty string.
+    """
+    if not raw:
+        return ""
+    trimmed = raw.strip()
+    return trimmed.lower().replace(" ", "_")
+def validate_skill_name(raw: str) -> str:
+    """Normalize *raw* and confirm it is an acceptable skill name.
+    Returns:
+        The normalized name.
+    Raises:
+        SkillError: if the normalized name does not match ``SKILL_NAME_RE`` or
+            looks like a path fragment.
+    """
+    candidate = normalize_skill_name(raw)
+    if SKILL_NAME_RE.fullmatch(candidate) is None:
+        raise SkillError(
+            "Invalid skill name. Use lowercase letters, numbers, underscores, "
+            "or hyphens; start with a letter or number."
+        )
+    # Second guard against path-shaped names (separators, leading dot, "..");
+    # presumably defense in depth on top of the pattern check above.
+    has_path_token = any(token in candidate for token in ("/", "\\", ".."))
+    if has_path_token or candidate.startswith("."):
+        raise SkillError("Invalid skill name.")
+    return candidate
+def get_skill_path(name: str) -> Path:
+    """Build the ``<skills dir>/<name>.md`` path for a skill.
+    The name is validated before the skills directory is touched, so an invalid
+    name raises SkillError without creating anything.
+    """
+    checked_name = validate_skill_name(name)
+    skills_root = ensure_skills_dir().resolve()
+    filename = f"{checked_name}.md"
+    return skills_root / filename
+def _check_size(content: str) -> None:
+    """Raise SkillError when *content* exceeds MAX_SKILL_BYTES once UTF-8 encoded."""
+    encoded_size = len(content.encode("utf-8"))
+    if encoded_size <= MAX_SKILL_BYTES:
+        return
+    raise SkillError(f"Skill is too large. Maximum size is {MAX_SKILL_BYTES} bytes.")
+def _parse_frontmatter(content: str) -> tuple[dict, str]:
+    """Split *content* into YAML frontmatter metadata and the remaining body.
+    Returns:
+        ``(metadata, body)``. When there is no frontmatter block, or the block is
+        not valid YAML, or it does not parse to a mapping, the result is
+        ``({}, content)`` with the text untouched so user-authored metadata is
+        never silently dropped.
+    """
+    found = _FRONTMATTER_RE.match(content)
+    if found is None:
+        return {}, content
+    try:
+        parsed = yaml.safe_load(found.group(1))
+    except yaml.YAMLError:
+        return {}, content
+    # An empty block parses to None; treat it as an empty mapping.
+    meta = parsed or {}
+    if isinstance(meta, dict):
+        return meta, content[found.end():]
+    return {}, content
+def _normalize_description(value: object) -> str:
+    """Coerce a frontmatter description to a trimmed string; falsy values become ""."""
+    return str(value or "").strip()
+def _normalize_tags(value: object) -> list[str]:
+    """Coerce a frontmatter ``tags`` value into a list of non-empty strings.
+    ``None`` gives an empty list; a list, tuple or set is taken element by
+    element; anything else (including a plain string) is treated as one tag.
+    Each entry is stringified and trimmed, and empty or falsy entries are dropped.
+    """
+    if value is None:
+        return []
+    raw_items = list(value) if isinstance(value, (list, tuple, set)) else [value]
+    trimmed = (str(item or "").strip() for item in raw_items)
+    return [tag for tag in trimmed if tag]
+def _render_frontmatter(description: str, tags: list[str]) -> str:
+    """Build the ``---`` delimited YAML header for a skill file.
+    Only truthy fields are emitted; when both are empty the result is "" so the
+    file gets no frontmatter at all.
+    """
+    fields = (("description", description), ("tags", tags))
+    meta = {key: val for key, val in fields if val}
+    if not meta:
+        return ""
+    rendered = yaml.dump(meta, default_flow_style=False).strip()
+    return f"---\n{rendered}\n---\n"
+def _needs_metadata(meta: dict) -> bool:
+    """Report whether *meta* lacks a truthy ``description`` or truthy ``tags``."""
+    return not (meta.get("description") and meta.get("tags"))
+def _strip_heading(name: str, content: str) -> str:
+    """Drop a leading ``# <name>`` heading from *content* when it names this skill.
+    The heading is removed only if it is the very first line and its text
+    normalizes to the same value as *name*. The result is always stripped of
+    surrounding whitespace; empty content yields "".
+    """
+    lines = content.splitlines()
+    if not lines:
+        return ""
+    first_line, remainder = lines[0], lines[1:]
+    heading = _HEADING_RE.match(first_line)
+    if heading is not None and normalize_skill_name(heading.group(1)) == normalize_skill_name(name):
+        return "\n".join(remainder).strip()
+    return content.strip()
+def format_skill_file(name: str, content: str, *, description: str = "", tags: list[str] | None = None) -> str:
+    """Assemble the on-disk text of a skill: optional frontmatter, title heading, body.
+    Raises:
+        SkillError: if the name is invalid, the body is empty once a matching
+            heading is removed, or the formatted text exceeds the size limit.
+    """
+    skill_name = validate_skill_name(name)
+    prompt = _strip_heading(skill_name, content)
+    if not prompt:
+        raise SkillError("Skill prompt cannot be empty.")
+    header = _render_frontmatter(description, tags or [])
+    document = "".join([header, f"# {skill_name}\n\n", prompt.strip(), "\n"])
+    _check_size(document)
+    return document
+def read_skill(name: str, strip_heading: bool = True) -> str:
+    """Load the prompt body of a stored skill.
+    Frontmatter is always removed. The title heading is removed as well unless
+    ``strip_heading`` is False.
+    Raises:
+        SkillError: if the name is invalid, the file is a symlink, or no such
+            skill file exists.
+    """
+    skill_path = get_skill_path(name)
+    if skill_path.is_symlink():
+        raise SkillError("Refusing to read a symlinked skill.")
+    if not skill_path.is_file():
+        raise SkillError(f"Skill '{validate_skill_name(name)}' not found.")
+    _meta, body = _parse_frontmatter(skill_path.read_text(encoding="utf-8"))
+    return _strip_heading(name, body) if strip_heading else body.strip()
+def write_skill(name: str, content: str, overwrite: bool = False) -> Path:
+    """Create or replace a skill file and return its path.
+    Description and tags are resolved independently, each from the first source
+    that provides a value:
+      1. YAML frontmatter embedded in ``content``;
+      2. frontmatter of the skill file already on disk (when replacing);
+      3. ``core.metadata.generate_metadata`` run on the prompt body.
+    Raises:
+        SkillError: if the name is invalid, the skill already exists and
+            ``overwrite`` is False, the body is empty, or the formatted file is
+            too large.
+    """
+    valid_name = validate_skill_name(name)
+    path = get_skill_path(valid_name)
+    if path.exists() and not overwrite:
+        raise SkillError(f"Skill '{valid_name}' already exists.")
+    # Parse any existing frontmatter from the content
+    body = content
+    description = ""
+    tags: list[str] = []
+    # Check if the raw content has frontmatter already
+    raw_meta, raw_body = _parse_frontmatter(content)
+    if raw_meta:
+        description = _normalize_description(raw_meta.get("description", ""))
+        tags = _normalize_tags(raw_meta.get("tags"))
+        # Only drop the frontmatter from the body when it parsed to real metadata.
+        body = raw_body
+    # If still missing metadata, try to preserve from existing file
+    if _needs_metadata({"description": description, "tags": tags}) and path.is_file():
+        existing_content = path.read_text(encoding="utf-8")
+        existing_meta, _ = _parse_frontmatter(existing_content)
+        # Values supplied with the new content win; the old file only fills gaps.
+        if not description and existing_meta.get("description"):
+            description = _normalize_description(existing_meta["description"])
+        if not tags and existing_meta.get("tags"):
+            tags = _normalize_tags(existing_meta.get("tags"))
+    # If still missing, auto-generate
+    if _needs_metadata({"description": description, "tags": tags}):
+        prompt_body = _strip_heading(valid_name, body)
+        # An empty body is not sent for generation; format_skill_file rejects it below.
+        if prompt_body:
+            # Imported at call time rather than at module import.
+            from core.metadata import generate_metadata
+            generated = generate_metadata(prompt_body, valid_name)
+            generated_description = _normalize_description(generated.get("description", ""))
+            generated_tags = _normalize_tags(generated.get("tags"))
+            if not description:
+                description = generated_description
+            if not tags:
+                tags = generated_tags
+    formatted = format_skill_file(valid_name, body, description=description, tags=tags)
+    _atomic_write(path, formatted)
+    return path
+def remove_skill(name: str) -> Path:
+    """Delete a stored skill file and return the path that was removed.
+    Raises:
+        SkillError: if the name is invalid, the path is a symlink, or no such
+            skill file exists.
+    """
+    path = get_skill_path(name)
+    # Inspect the link itself first, as read_skill does: is_file() follows
+    # symlinks, so a dangling link would otherwise be reported as "not found"
+    # even though an entry with that name exists.
+    if path.is_symlink():
+        raise SkillError("Refusing to remove a symlinked skill.")
+    if not path.is_file():
+        raise SkillError(f"Skill '{validate_skill_name(name)}' not found.")
+    path.unlink()
+    return path
+def list_skills(query: str | None = None, *, max_results: int | None = None) -> list[SkillSummary]:
+    """List stored skills, optionally filtered by a search query.
+    Args:
+        query: Text matched against each skill's name, description, preview and
+            tags. ``None`` or blank lists every skill, ordered by name.
+        max_results: Optional cap on the number of skills returned. ``None``
+            (the default) returns all of them.
+    Returns:
+        Skill summaries, most relevant first when a query is given.
+    """
+    import sys
+    # search_skill_matches defaults to 20 results, which would silently hide
+    # skills from a full listing; lift the cap unless the caller asks for one.
+    limit = sys.maxsize if max_results is None else max_results
+    return [match.item for match in search_skill_matches(query=query, max_results=limit)]
+def iter_skill_summaries() -> list[SkillSummary]:
+    """Return a summary for every valid skill file in the skills directory.
+    Files are visited in sorted path order. Symlinks, non-files, files whose stem
+    is not a valid skill name, and files that cannot be read (I/O error or
+    non-UTF-8 content) are skipped so one bad file does not break the listing.
+    """
+    base = ensure_skills_dir()
+    summaries: list[SkillSummary] = []
+    for path in sorted(base.glob("*.md")):
+        if not path.is_file() or path.is_symlink():
+            continue
+        try:
+            name = validate_skill_name(path.stem)
+            raw = path.read_text(encoding="utf-8")
+            # Stat inside the guard too: the file may vanish between glob and stat.
+            modified = path.stat().st_mtime
+        except SkillError:
+            continue
+        except (OSError, UnicodeDecodeError) as exc:
+            logger.warning("Skipping unreadable skill file %s: %s", path, exc)
+            continue
+        meta, body_text = _parse_frontmatter(raw)
+        heading_stripped = _strip_heading(name, body_text)
+        summaries.append(
+            SkillSummary(
+                name=name,
+                path=path,
+                preview=_preview(heading_stripped),
+                modified=modified,
+                description=_normalize_description(meta.get("description", "")),
+                tags=_normalize_tags(meta.get("tags")),
+            )
+        )
+    return summaries
+def search_candidates(
+    query: str,
+    candidates: list[SearchCandidate[T]],
+    *,
+    max_results: int = 5,
+    item_key: Callable[[T], str] | None = None,
+) -> list[SearchMatch[T]]:
+    """Rank *candidates* against *query* and return the best ``max_results``.
+    A blank query matches everything with score 0.0 (sorted by ``item_key`` when
+    one is given). Otherwise each candidate accumulates points for an exact or
+    substring hit on its ``exact_text``, a whole-query hit on its text, a hit on
+    the punctuation-free compact form, and per-term hits; candidates scoring
+    zero are dropped. Ties are broken by ``item_key``.
+    """
+    needle = (query or "").strip().lower()
+    if not needle:
+        unranked = [SearchMatch(item=entry.item, score=0.0) for entry in candidates]
+        if item_key is not None:
+            unranked.sort(key=lambda hit: item_key(hit.item))
+        return unranked[:max_results]
+    needle_compact = _compact_match_text(needle)
+    terms = needle.split()
+    def _score(entry: SearchCandidate[T]) -> float:
+        haystack = entry.text.lower()
+        compact = entry.compact_text or _compact_match_text(haystack)
+        exact = (entry.exact_text or "").lower()
+        total = 0.0
+        if exact:
+            if needle == exact:
+                total += 120.0
+            if needle in exact:
+                total += 60.0
+        if needle in haystack:
+            total += 40.0
+        if needle_compact and needle_compact in compact:
+            total += 25.0
+        for term in terms:
+            if exact and term in exact:
+                total += 15.0
+            if term in haystack:
+                total += 10.0
+        return total
+    ranked: list[SearchMatch[T]] = []
+    for entry in candidates:
+        points = _score(entry)
+        if points > 0:
+            ranked.append(SearchMatch(item=entry.item, score=points))
+    def _order(hit: SearchMatch[T]) -> tuple:
+        tie_break = item_key(hit.item) if item_key is not None else ""
+        return (-hit.score, tie_break)
+    ranked.sort(key=_order)
+    return ranked[:max_results]
+def search_skill_matches(query: str | None = None, max_results: int = 20) -> list[SearchMatch[SkillSummary]]:
+    """Score stored skills against *query* for discovery surfaces.
+    The searchable text combines name, description, preview and tags; the compact
+    form leaves the preview out; the skill name is the exact-match field and the
+    tie-breaker.
+    """
+    def _joined(*parts: str) -> str:
+        return " ".join(part for part in parts if part)
+    candidates = []
+    for skill in iter_skill_summaries():
+        tag_text = " ".join(skill.tags)
+        candidates.append(
+            SearchCandidate(
+                item=skill,
+                text=_joined(skill.name, skill.description, skill.preview, tag_text),
+                compact_text=_compact_match_text(_joined(skill.name, skill.description, tag_text)),
+                exact_text=skill.name,
+            )
+        )
+    return search_candidates(
+        query or "",
+        candidates,
+        max_results=max_results,
+        item_key=lambda skill: skill.name,
+    )
+def activate_skill(chat_manager, name: str, content: str | None = None, reload: bool = False) -> int:
+    """Mark a skill as active on *chat_manager* and refresh its prompt state.
+    Returns:
+        The token estimate for the rendered active-skills section of this skill.
+    Raises:
+        SkillError: if the name is invalid, the prompt text is empty, or the
+            skill is already active and ``reload`` is False.
+    NOTE(review): when ``content`` is supplied it is only checked for emptiness
+    in this function; it is not stored here, and the token estimate renders the
+    skill by name.
+    """
+    skill_name = validate_skill_name(name)
+    prompt_text = read_skill(skill_name) if content is None else content
+    if not prompt_text.strip():
+        raise SkillError("Skill prompt cannot be empty.")
+    active = getattr(chat_manager, "loaded_skills", None)
+    if active is None:
+        # First activation in this chat: create the tracking set on the manager.
+        active = set()
+        chat_manager.loaded_skills = active
+    if not reload and skill_name in active:
+        raise SkillError(f"Skill '{skill_name}' is already active in this chat.")
+    active.add(skill_name)
+    if hasattr(chat_manager, "update_system_prompt"):
+        chat_manager.update_system_prompt()
+    else:
+        chat_manager._update_context_tokens()
+    rendered = render_active_skills_section([skill_name])
+    return chat_manager.token_tracker.estimate_tokens(rendered)
+def get_active_skill_contents(skill_names: list[str] | set[str] | tuple[str, ...]) -> list[tuple[str, str]]:
+    """Load the bodies of the given skills as ``(name, body)`` pairs.
+    Names are validated and de-duplicated up front, then read in sorted order;
+    skills whose body is empty are left out. Any SkillError from validation or
+    reading propagates to the caller.
+    """
+    unique_names = sorted({validate_skill_name(entry) for entry in skill_names})
+    loaded = ((skill, read_skill(skill)) for skill in unique_names)
+    return [(skill, text) for skill, text in loaded if text]
+def render_active_skills_section(skill_names: list[str] | set[str] | tuple[str, ...]) -> str:
+    """Render active skills for inclusion in the system prompt.
+    Each skill is resolved on its own, so one that is invalid, missing or
+    unreadable is skipped (and logged) instead of removing every other active
+    skill from the prompt.
+    Returns:
+        The markdown section with skills ordered by name, or "" when no skill
+        could be loaded.
+    """
+    resolved: dict[str, str] = {}
+    for raw_name in skill_names:
+        try:
+            pairs = get_active_skill_contents([raw_name])
+        except (SkillError, OSError, UnicodeDecodeError) as exc:
+            logger.warning("Skipping active skill %r: %s", raw_name, exc)
+            continue
+        # Keyed by validated name, which also collapses duplicate entries.
+        resolved.update(pairs)
+    if not resolved:
+        return ""
+    sections = ["## Active skills", "Apply these active skill instructions in addition to the base prompt."]
+    sections.extend(f"### {name}\n{resolved[name]}" for name in sorted(resolved))
+    return "\n\n".join(sections)
+def _preview(content: str, max_chars: int = 90) -> str:
+    """Collapse whitespace in *content* and cap it at ``max_chars`` characters.
+    Text that is too long is cut to ``max_chars - 3`` characters, right-stripped,
+    and suffixed with "...".
+    """
+    collapsed = " ".join(content.split())
+    if len(collapsed) > max_chars:
+        return collapsed[: max_chars - 3].rstrip() + "..."
+    return collapsed
+def _compact_match_text(text: str) -> str:
+    """Lowercase *text* and keep only the characters a-z and 0-9; falsy input gives ""."""
+    lowered = (text or "").lower()
+    return "".join(re.findall(r"[a-z0-9]+", lowered))
+def _atomic_write(path: Path, content: str) -> None:
+    """Write *content* to *path* via a temporary file in the same directory.
+    The text is written to a hidden ``.<stem>.*.tmp`` sibling and then moved over
+    the target, so readers never see a half-written file. On any failure the
+    temporary file is removed (best effort) and the error is re-raised.
+    """
+    directory = path.parent
+    directory.mkdir(parents=True, exist_ok=True)
+    fd, tmp_name = tempfile.mkstemp(
+        dir=str(directory),
+        prefix=f".{path.stem}.",
+        suffix=".tmp",
+        text=True,
+    )
+    staged = Path(tmp_name)
+    try:
+        with os.fdopen(fd, "w", encoding="utf-8", newline="\n") as handle:
+            handle.write(content)
+        staged.replace(path)
+    except Exception:
+        # Clean up the staging file, but never mask the original error.
+        try:
+            staged.unlink()
+        except OSError:
+            pass
+        raise

package/src/core/sub_agent.py CHANGED Viewed

@@ -4,11 +4,12 @@ Uses existing AgenticOrchestrator with isolated message context
 and read-only tools to execute generic delegated tasks.
 """
-from pathlib import Path
-from core.chat_manager import ChatManager
-from llm.prompts import build_sub_agent_prompt
-from utils.settings import sub_agent_settings
+from pathlib import Path
+from core.chat_manager import ChatManager
+from exceptions import LLMError
+from llm.prompts import build_sub_agent_prompt
+from utils.settings import sub_agent_settings
 class HardLimitExceeded(Exception):
@@ -16,6 +17,11 @@ class HardLimitExceeded(Exception):
     pass
+class BilledLimitExceeded(Exception):
+    """Signals that a sub-agent reached its cumulative billed-token hard limit."""
 def _format_messages_dump(messages) -> str:
     """Format sub-agent message history as a markdown dump.
@@ -89,7 +95,7 @@ def _inject_system_prompt(chat_manager, sub_agent_type: str = "research"):
     chat_manager.messages = [{"role": "system", "content": base_prompt}]
-def _load_codebase_map(chat_manager):
+def _load_codebase_map(chat_manager):
     """Load agents.md codebase map into sub-agent context if available.
     Args:
@@ -98,19 +104,13 @@ def _load_codebase_map(chat_manager):
     agents_path = Path.cwd() / "agents.md"
     if agents_path.exists():
         map_content = agents_path.read_text(encoding="utf-8").strip()
-        user_msg = (
-            "Here is the codebase map for this project. "
-            "This provides an overview of the repository structure and file purposes. "
-            "Use this as a reference when exploring the codebase.\n\n"
-            f"## Codebase Map (auto-generated from agents.md)\n\n{map_content}"
-        )
-        assistant_msg = (
-            "I've received the codebase map. I'll use this as a reference when "
-            "exploring the repository, but I'll always verify current state by "
-            "reading files and searching the codebase before making changes."
-        )
-        chat_manager.messages.append({"role": "user", "content": user_msg})
-        chat_manager.messages.append({"role": "assistant", "content": assistant_msg})
+        user_msg = (
+            "Here is the codebase map for this project. "
+            "This provides an overview of the repository structure and file purposes. "
+            "Use this as a reference when exploring the codebase.\n\n"
+            f"## Codebase Map (auto-generated from agents.md)\n\n{map_content}"
+        )
+        chat_manager.messages.append({"role": "user", "content": user_msg})
 def _configure_isolation(chat_manager):
@@ -183,14 +183,11 @@ def run_sub_agent(
     # Create fresh ChatManager for sub-agent
     temp_chat_manager = _create_chat_manager(sub_agent_type=sub_agent_type)
-    # Inject initial context as a user/assistant exchange if provided
-    if initial_context:
-        temp_chat_manager.messages.append(
-            {"role": "user", "content": initial_context}
-        )
-        temp_chat_manager.messages.append(
-            {"role": "assistant", "content": "I've received the context. I'll analyze it and use the available tools to gather additional information as needed."}
-        )
+    # Inject initial context as a single user message if provided
+    if initial_context:
+        temp_chat_manager.messages.append(
+            {"role": "user", "content": initial_context}
+        )
     # Import here to avoid circular import with core.agentic
     from core.agentic import AgenticOrchestrator
@@ -216,27 +213,40 @@ def run_sub_agent(
     original_chat_completion = temp_chat_manager.client.chat_completion
     _soft_limit_warned = False
+    _billed_warning_sent = False
     def _chat_completion_with_token_hint(messages, **kwargs):
-        """Prepend a system-level token budget hint (and soft-limit warning once) to every LLM call."""
-        nonlocal _soft_limit_warned
+        """Prepend a system-level token budget hint and one-time warnings to every LLM call."""
+        nonlocal _soft_limit_warned, _billed_warning_sent
         tt = temp_chat_manager.token_tracker
-        hint = f"[Token budget: {tt.current_context_tokens:,} curr / {tt.conv_total_tokens:,} total]"
+        hint = f"[Token budget: {tt.current_context_tokens:,} curr / {tt.conv_total_tokens:,} total billed]"
+        warnings = []
         if not _soft_limit_warned and tt.current_context_tokens >= sub_agent_settings.soft_limit_tokens:
             _soft_limit_warned = True
-            hint = (
-                f"WARNING: You have exceeded the soft token limit "
+            warnings.append(
+                f"WARNING: You have exceeded the current-context soft token limit "
                 f"({tt.current_context_tokens:,} / {sub_agent_settings.soft_limit_tokens:,}). "
-                "STOP exploring and return your findings immediately. Do NOT call any more tools. "
-                + hint
+                "STOP exploring and return your findings immediately. Do NOT call any more tools."
             )
+        if not _billed_warning_sent and tt.conv_total_tokens >= sub_agent_settings.billed_warning_tokens:
+            _billed_warning_sent = True
+            warnings.append(
+                f"WARNING: You have exceeded the cumulative billed token warning limit "
+                f"({tt.conv_total_tokens:,} / {sub_agent_settings.billed_warning_tokens:,}). "
+                "This sub-agent may be running away. STOP exploring and return your findings immediately. "
+                "Do NOT call any more tools."
+            )
+        if warnings:
+            hint = "\n".join([*warnings, hint])
         token_msg = {"role": "system", "content": hint}
         return original_chat_completion([token_msg, *messages], **kwargs)
-    def _get_llm_response_with_hard_limit(allowed_tools=None):
-        """Wrapper to check hard token limit and update panel with live token counts."""
+    def _get_llm_response_with_hard_limit(allowed_tools=None, allow_active_plugins=False):
+        """Wrapper to check context and billed token limits and update panel state."""
         tt = temp_chat_manager.token_tracker
         # Check hard token limit before making LLM call
@@ -248,6 +258,19 @@ def run_sub_agent(
                 f"{tt.current_context_tokens:,} / {sub_agent_settings.hard_limit_tokens:,} tokens."
             )
+        # Check cumulative billed tokens to stop runaway sub-agents even when
+        # current context remains below the prompt-size hard limit.
+        #
+        # Note: the billed warning is injected by _chat_completion_with_token_hint
+        # on the next chat_completion call. This hard stop runs before each LLM
+        # response, so once we hit the billed hard limit the warning may never be
+        # delivered if no further chat_completion call is made.
+        if tt.conv_total_tokens >= sub_agent_settings.billed_hard_limit_tokens:
+            raise BilledLimitExceeded(
+                f"Sub-agent billed token limit exceeded: "
+                f"{tt.conv_total_tokens:,} / {sub_agent_settings.billed_hard_limit_tokens:,} tokens."
+            )
         # Update panel with live token counts
         # Order: conversation length (current context) first, total tokens billed second
         conv_length = tt.current_context_tokens
@@ -256,27 +279,45 @@ def run_sub_agent(
             panel_updater.token_info = f"{conv_length:,} curr | {total_billed:,} total"
             panel_updater.append("")  # Refresh panel title
-        return original_get_llm_response(allowed_tools=allowed_tools)
+        return original_get_llm_response(
+            allowed_tools=allowed_tools,
+            allow_active_plugins=allow_active_plugins,
+        )
     # Apply both patches once, before the orchestrator loop starts
     orchestrator._get_llm_response = _get_llm_response_with_hard_limit
     temp_chat_manager.client.chat_completion = _chat_completion_with_token_hint
     hard_limit_exceeded = False
+    billed_limit_exceeded = False
     try:
         # Run sub-agent task
         orchestrator.run(
             task_query,
             thinking_indicator=None,
-            allowed_tools=sub_agent_settings.allowed_tools
+            allowed_tools=sub_agent_settings.allowed_tools,
+            allow_active_plugins=sub_agent_settings.allow_active_plugins,
         )
     except HardLimitExceeded:
         hard_limit_exceeded = True
-    except Exception as e:
-        import traceback
-        error_details = f"{e}\n\nTraceback:\n{traceback.format_exc()}"
-        return {
+    except BilledLimitExceeded:
+        billed_limit_exceeded = True
+    except LLMError as e:
+        return {
+            "result": "",
+            "usage": {
+                "prompt_tokens": 0,
+                "completion_tokens": 0,
+                "total_tokens": 0
+            },
+            "model": temp_chat_manager.client.model,
+            "error": str(e)
+        }
+    except Exception as e:
+        import traceback
+        error_details = f"{e}\n\nTraceback:\n{traceback.format_exc()}"
+        return {
             "result": "",
             "usage": {
                 "prompt_tokens": 0,
@@ -306,7 +347,15 @@ def run_sub_agent(
             if msg.get("role") == "assistant" and msg.get("content"):
                 final_content = msg["content"].strip()
                 break
-        result = final_content
+        if billed_limit_exceeded:
+            prefix = (
+                "WARNING: Sub-agent billed token limit reached. "
+                "Returning current findings early to prevent runaway execution."
+            )
+            result = f"{prefix}\n\n{final_content}" if final_content else prefix
+        else:
+            result = final_content
     usage = {
         "prompt_tokens": delta_prompt,
@@ -323,4 +372,5 @@ def run_sub_agent(
         "model": temp_chat_manager.client.model,
         "error": None,
         "hard_limit_exceeded": hard_limit_exceeded,
+        "billed_limit_exceeded": billed_limit_exceeded,
     }