npm - bone-agent - Versions diffs - 1.3.3 → 1.4.0 - Mend

bone-agent 1.3.3 → 1.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (43) hide show

package/README.md +17 -0
package/config.yaml.example +5 -2
package/package.json +1 -1
package/prompts/main/communication_style.md +1 -1
package/prompts/main/dream.md +23 -9
package/prompts/main/skills.md +3 -0
package/prompts/micro/communication_style.md +1 -1
package/prompts/micro/skills.md +1 -0
package/src/core/agentic.py +138 -38
package/src/core/chat_manager.py +19 -6
package/src/core/config_manager.py +8 -1
package/src/core/cron.py +0 -4
package/src/core/metadata.py +75 -0
package/src/core/skills.py +463 -0
package/src/core/sub_agent.py +93 -43
package/src/core/tool_feedback.py +87 -76
package/src/llm/client.py +7 -2
package/src/llm/codex_provider.py +350 -0
package/src/llm/config.py +46 -2
package/src/llm/prompts.py +12 -7
package/src/llm/providers.py +3 -1
package/src/llm/token_tracker.py +15 -0
package/src/tools/__init__.py +24 -85
package/src/tools/create_file.py +1 -1
package/src/tools/directory.py +1 -1
package/src/tools/edit.py +5 -1
package/src/tools/file_reader.py +1 -1
package/src/tools/helpers/__init__.py +1 -7
package/src/tools/helpers/base.py +65 -16
package/src/tools/helpers/loader.py +2 -88
package/src/tools/helpers/path_resolver.py +54 -3
package/src/tools/helpers/plugin_manifest.py +99 -70
package/src/tools/review_sub_agent.py +2 -1
package/src/tools/rg_search.py +24 -7
package/src/tools/search_plugins.py +140 -72
package/src/tools/shell.py +3 -3
package/src/ui/commands.py +355 -33
package/src/ui/displays.py +26 -1
package/src/ui/main.py +0 -4
package/src/ui/tool_confirmation.py +16 -5
package/src/utils/editor.py +88 -39
package/src/utils/settings.py +6 -2
package/src/utils/validation.py +10 -0

package/src/llm/codex_provider.py ADDED Viewed

@@ -0,0 +1,350 @@
+"""Codex provider adapter.
+Codex is intentionally isolated from the normal provider handlers because it is
+not a Chat Completions-compatible API. It targets the ChatGPT Codex Responses
+backend and adapts that protocol back into vmCode's OpenAI-style internal shape.
+"""
+import copy
+import hashlib
+import json
+from typing import Any, Dict, Iterator, Optional
+import requests
+from exceptions import LLMResponseError
+class CodexResponsesHandler:
+    """Adapter for the ChatGPT Codex Responses backend.
+    Codex-specific behavior kept here:
+    - Uses `instructions` + `input` instead of Chat Completions `messages`.
+    - Always sends `stream: true`; the backend returns SSE even for logical
+      non-streaming agent calls.
+    - Stores `_responses_output` replay metadata so tool-call turns can be sent
+      back in Responses-native form while using `store: false`.
+    """
+    supports_sse_response_fallback = True
+    def build_headers(self, config: Dict[str, Any]) -> Dict[str, str]:
+        """Build request headers."""
+        headers = {"Content-Type": "application/json"}
+        if config.get("type") == "api" and config.get("api_key"):
+            headers["Authorization"] = f"Bearer {config['api_key']}"
+        if "headers_extra" in config:
+            headers.update(config["headers_extra"])
+        return headers
+    def build_payload(self, config: Dict[str, Any], messages: list,
+                      tools: Optional[list] = None, stream: bool = True) -> Dict[str, Any]:
+        """Build request payload for Codex backend Responses API."""
+        system_parts = [m["content"] for m in messages if m.get("role") == "system"]
+        instructions = "\n".join(system_parts) if system_parts else "You are a helpful assistant."
+        codex_input = []
+        for m in messages:
+            if m.get("role") == "system":
+                continue
+            role = m.get("role", "user")
+            content = m.get("content", "")
+            if role == "assistant" and m.get("_responses_output"):
+                codex_input.extend(m.get("_responses_output") or [])
+                continue
+            if role == "assistant" and m.get("tool_calls"):
+                if content:
+                    codex_input.append({
+                        "role": "assistant",
+                        "content": [{"type": "input_text", "text": content}]
+                    })
+                for tool_call in m.get("tool_calls", []):
+                    function = tool_call.get("function", {})
+                    codex_input.append({
+                        "type": "function_call",
+                        "call_id": tool_call.get("id"),
+                        "name": function.get("name", ""),
+                        "arguments": function.get("arguments", "{}"),
+                    })
+                continue
+            if role == "tool":
+                codex_input.append({
+                    "type": "function_call_output",
+                    "call_id": m.get("tool_call_id"),
+                    "output": content,
+                })
+                continue
+            content_type = "output_text" if role == "assistant" else "input_text"
+            codex_input.append({
+                "role": role,
+                "content": [{"type": content_type, "text": content}]
+            })
+        payload = {
+            **config.get("payload", {}),
+            "instructions": instructions,
+            "input": codex_input,
+            "store": False,
+            "stream": True,
+        }
+        if "model" not in payload:
+            model_name = config.get("api_model") or config.get("model")
+            if model_name:
+                payload["model"] = model_name
+        if tools:
+            payload["tools"] = [self._convert_tool_to_responses(tool) for tool in tools]
+        if "prompt_cache_key" not in payload:
+            model = payload.get("model") or "unknown-model"
+            payload["prompt_cache_key"] = self._build_prompt_cache_key(
+                model=model,
+                instructions=instructions,
+                tools=payload.get("tools"),
+            )
+        if "temperature" not in payload and config.get("allow_temperature", True):
+            payload["temperature"] = config.get("default_temperature", 0.1)
+        if "top_p" not in payload and config.get("allow_top_p", True):
+            payload["top_p"] = config.get("default_top_p", 0.9)
+        return payload
+    def _build_prompt_cache_key(
+        self,
+        *,
+        model: str,
+        instructions: str,
+        tools: Optional[list] = None,
+    ) -> str:
+        """Build a stable prompt-cache key for the reusable Codex prefix."""
+        cache_scope = {
+            "model": model,
+            "instructions": instructions,
+            "tools": tools or [],
+        }
+        canonical = json.dumps(
+            cache_scope,
+            sort_keys=True,
+            separators=(",", ":"),
+            ensure_ascii=True,
+        )
+        cache_hash = hashlib.sha256(canonical.encode("utf-8")).hexdigest()[:24]
+        return f"bone-agent:{cache_hash}"
+    def parse_response(self, response_json: Dict[str, Any]) -> Dict[str, Any]:
+        """Parse Responses API output into Chat Completions format."""
+        return self._normalize_response(response_json)
+    def parse_sse_response(self, response_text: str) -> Dict[str, Any]:
+        """Parse a full SSE response body into Chat Completions format."""
+        completed_response = None
+        output_items = []
+        for raw_line in response_text.splitlines():
+            line = raw_line.strip()
+            if not line.startswith("data: "):
+                continue
+            data_str = line[6:]
+            if data_str == "[DONE]":
+                break
+            try:
+                data = json.loads(data_str)
+            except json.JSONDecodeError as e:
+                raise LLMResponseError(
+                    "Failed to decode SSE response from Codex backend",
+                    details={"original_error": str(e)}
+                )
+            if data.get("type") == "response.output_item.done":
+                item = data.get("item")
+                if item:
+                    output_items.append(item)
+                continue
+            if data.get("type") == "response.completed":
+                completed_response = data.get("response")
+                break
+        if completed_response is None:
+            raise LLMResponseError(
+                "Codex backend returned streaming data without a completed response event"
+            )
+        if not completed_response.get("output") and output_items:
+            completed_response = dict(completed_response)
+            completed_response["output"] = output_items
+        return self._normalize_response(completed_response)
+    def parse_stream(self, response: requests.Response) -> Iterator[Dict[str, Any]]:
+        """Parse streaming Responses API."""
+        usage_data = None
+        for line in response.iter_lines():
+            if line:
+                line = line.decode('utf-8')
+                if line.startswith('data: '):
+                    data_str = line[6:]
+                    if data_str.strip() == '[DONE]':
+                        break
+                    try:
+                        data = json.loads(data_str)
+                        if 'error' in data:
+                            error_msg = data.get('error', {}).get('message', 'Unknown streaming error')
+                            raise LLMResponseError(
+                                f"Streaming error: {error_msg}",
+                                details={"error_data": data.get('error')}
+                            )
+                        event_type = data.get("type", "")
+                        if event_type == "response.completed":
+                            resp = data.get("response", {})
+                            if "usage" in resp:
+                                usage_data = self._normalize_usage(resp["usage"])
+                        if event_type == "response.output_text.delta":
+                            delta = data.get("delta", "")
+                            if delta:
+                                yield delta
+                    except json.JSONDecodeError as e:
+                        raise LLMResponseError(
+                            f"Failed to decode streaming response",
+                            details={"original_error": str(e)}
+                        )
+        if usage_data:
+            yield {'__usage__': usage_data}
+    def _convert_tool_to_responses(self, tool: Dict[str, Any]) -> Dict[str, Any]:
+        """Convert Chat Completions tool schema to Responses/Codex schema."""
+        if tool.get("type") == "function" and "function" in tool:
+            function = tool["function"]
+            return {
+                "type": "function",
+                "name": function.get("name", ""),
+                "description": function.get("description", ""),
+                "parameters": self._normalize_json_schema(function.get("parameters", {})),
+                "strict": False,
+            }
+        return tool
+    def _normalize_response(self, response_json: Dict[str, Any]) -> Dict[str, Any]:
+        """Normalize Responses output into Chat Completions message shape."""
+        raw_usage = response_json.get("usage", {})
+        usage = self._normalize_usage(raw_usage)
+        output_items = response_json.get("output", [])
+        content_parts = []
+        tool_calls = []
+        for item in output_items:
+            item_type = item.get("type")
+            if item_type == "function_call":
+                call_id = item.get("call_id") or item.get("id")
+                tool_calls.append({
+                    "id": call_id,
+                    "type": "function",
+                    "function": {
+                        "name": item.get("name", ""),
+                        "arguments": item.get("arguments", "{}"),
+                    }
+                })
+                continue
+            if item_type != "message":
+                continue
+            for c in item.get("content", []):
+                if c.get("type") in {"output_text", "text"}:
+                    text = c.get("text")
+                    if text is not None:
+                        content_parts.append(text)
+        message = {"role": "assistant"}
+        text_content = "\n".join(content_parts) if content_parts else ""
+        if tool_calls:
+            message["tool_calls"] = tool_calls
+            message["content"] = text_content or None
+        else:
+            message["content"] = text_content
+        replay_items = copy.deepcopy(output_items)
+        for item in replay_items:
+            item.pop("id", None)
+        message["_responses_output"] = replay_items
+        return {
+            "choices": [{
+                "message": message,
+                "finish_reason": "tool_calls" if tool_calls else "stop",
+            }],
+            "usage": usage,
+        }
+    def _normalize_usage(self, usage: Any) -> Dict[str, Any]:
+        """Normalize Codex Responses usage into vmCode's OpenAI-style usage shape."""
+        if not isinstance(usage, dict):
+            return {}
+        normalized = dict(usage)
+        input_tokens = normalized.get("input_tokens")
+        output_tokens = normalized.get("output_tokens")
+        if normalized.get("prompt_tokens") is None and input_tokens is not None:
+            normalized["prompt_tokens"] = input_tokens
+        if normalized.get("completion_tokens") is None and output_tokens is not None:
+            normalized["completion_tokens"] = output_tokens
+        if normalized.get("total_tokens") is None:
+            prompt_tokens = normalized.get("prompt_tokens")
+            completion_tokens = normalized.get("completion_tokens")
+            if prompt_tokens is not None and completion_tokens is not None:
+                normalized["total_tokens"] = prompt_tokens + completion_tokens
+        input_details = normalized.get("input_tokens_details")
+        if isinstance(input_details, dict) and input_details.get("cached_tokens") is not None:
+            cached_tokens = input_details["cached_tokens"]
+            if normalized.get("prompt_tokens_details") is None:
+                normalized["prompt_tokens_details"] = {"cached_tokens": cached_tokens}
+            elif isinstance(normalized["prompt_tokens_details"], dict):
+                normalized["prompt_tokens_details"].setdefault("cached_tokens", cached_tokens)
+            normalized.setdefault("cached_tokens", cached_tokens)
+        return normalized
+    def _normalize_json_schema(self, schema: Any) -> Any:
+        """Normalize JSON Schema for strict Responses function tools."""
+        if not isinstance(schema, dict):
+            return schema
+        normalized = dict(schema)
+        schema_type = normalized.get("type")
+        if schema_type == "object":
+            properties = normalized.get("properties", {})
+            normalized["properties"] = {
+                key: self._normalize_json_schema(value)
+                for key, value in properties.items()
+            }
+            normalized.setdefault("additionalProperties", False)
+        if schema_type == "array" and "items" in normalized:
+            normalized["items"] = self._normalize_json_schema(normalized["items"])
+        for key in ("anyOf", "oneOf", "allOf"):
+            if key in normalized and isinstance(normalized[key], list):
+                normalized[key] = [self._normalize_json_schema(item) for item in normalized[key]]
+        return normalized

package/src/llm/config.py CHANGED Viewed

@@ -32,6 +32,7 @@ ENV_API_KEYS = {
     'MINIMAX_PLAN_API_KEY': os.environ.get('MINIMAX_PLAN_API_KEY'),
     'MINIMAX_API_KEY': os.environ.get('MINIMAX_API_KEY'),
     'BONE_PROXY_API_KEY': os.environ.get('BONE_PROXY_API_KEY'),
+    'CODEX_PLAN_API_KEY': os.environ.get('CODEX_PLAN_API_KEY'),
 }
 # Detect platform for llama.cpp paths
@@ -73,6 +74,24 @@ def _load_config():
 _CONFIG = _load_config()
+def _get_codex_token() -> str:
+    """Read access token from Codex CLI's cached auth (~/.codex/auth.json).
+    Returns the access_token if available, empty string otherwise.
+    Codex CLI stores OAuth tokens here after `codex login`.
+    """
+    try:
+        auth_path = Path.home() / ".codex" / "auth.json"
+        if not auth_path.exists():
+            return ""
+        import json
+        data = json.loads(auth_path.read_text(encoding="utf-8"))
+        return data.get("tokens", {}).get("access_token", "")
+    except Exception:
+        return ""
 # Cache for provider registry (built once at module load)
 _provider_registry_cache = None
 _cached_provider = None
@@ -134,8 +153,8 @@ def _get_provider_registry():
             },
             "default_temperature": 0.1,
             "default_top_p": 0.9,
-            "allow_top_p": True,
-            "allow_temperature": True,
+            "allow_top_p": False,
+            "allow_temperature": False,
             "cost_in": 0.0,
             "cost_out": 0.0
         },
@@ -311,6 +330,22 @@ def _get_provider_registry():
             "allow_temperature": True,
             **_model_cost("KIMI_MODEL"),
         },
+        "codex": {
+            "type": "api",
+            "api_key": _CONFIG.get("CODEX_PLAN_API_KEY", "") or _get_codex_token(),
+            "model": _CONFIG.get("CODEX_PLAN_MODEL", "gpt-5.4-mini"),
+            "api_base": _CONFIG.get("CODEX_PLAN_API_BASE", "https://chatgpt.com/backend-api/codex"),
+            "endpoint": "/responses",
+            "error_prefix": "Codex",
+            "config_keys": {
+                "CODEX_PLAN_API_KEY": "",
+                "CODEX_PLAN_MODEL": "",
+                "CODEX_PLAN_API_BASE": "https://chatgpt.com/backend-api/codex",
+            },
+            "allow_temperature": False,
+            "allow_top_p": False,
+            **_model_cost("CODEX_PLAN_MODEL"),
+        },
         "bone": {
             "type": "api",
             "api_key": _CONFIG.get("BONE_PROXY_API_KEY", ""),
@@ -421,6 +456,14 @@ def get_providers():
     return list(PROVIDER_REGISTRY.keys())
+def get_provider_display_name(provider: str) -> str:
+    """Return the user-facing provider name for a provider key."""
+    display_names = {
+        "codex": "Codex",
+    }
+    return display_names.get(provider, provider.replace("_", " ").title())
 # ============================================================================
 # PROVIDER REGISTRY - Centralized provider configuration
 # ============================================================================
@@ -434,6 +477,7 @@ __all__ = [
     "CONFIG_PATH",
     "PROVIDER_REGISTRY",
     "get_providers",
+    "get_provider_display_name",
     "get_model_cost",
     "LLM_PROVIDER",
     "TOOLS_ENABLED",

package/src/llm/prompts.py CHANGED Viewed

@@ -262,18 +262,17 @@ def _build_vault_section(variant: str = "main") -> str | None:
 def _build_context_section() -> str:
-    """Build a dynamic section with current date, time, and location."""
+    """Build a dynamic section with current date and location."""
     from datetime import datetime
+    import os
     now = datetime.now()
     date_str = now.strftime("%A, %B %d, %Y")
-    time_str = now.strftime("%I:%M %p")
-    timezone = now.astimezone().tzinfo
     return (
         "## Current Context\n\n"
         f"**Date:** {date_str}\n"
-        f"**Time:** {time_str} ({timezone})\n"
+        f"**Working directory:** {os.getcwd()}\n"
     )
@@ -364,6 +363,7 @@ def _main_sections(variant: str) -> list[tuple[str, callable]]:
         ("communication_style", lambda: _static(variant, "communication_style.md")),
         ("trust_subagent_context", lambda: _static(variant, "trust_subagent_context.md")),
         ("context_reliability", lambda: _static(variant, "context_reliability.md")),
+        ("skills", lambda: _static(variant, "skills.md")),
         ("conversational_tool_calling", lambda: _static(variant, "conversational_tool_calling.md")),
         ("professional_objectivity", lambda: _static(variant, "professional_objectivity.md")),
         ("think_before_acting", lambda: _static(variant, "think_before_acting.md")),
@@ -405,12 +405,14 @@ def _sub_agent_sections(variant: str) -> list[tuple[str, callable]]:
         middle = [
             ("trust_subagent_context", lambda: _static(variant, "trust_subagent_context.md")),
             ("context_reliability", lambda: _static(variant, "context_reliability.md")),
+            ("skills", lambda: _static(variant, "skills.md")),
             ("exploration_pattern", lambda: _static(variant, "exploration_pattern.md")),
             ("targeted_searching", lambda: _static(variant, "targeted_searching.md")),
             ("tool_preferences", lambda: _static(variant, "tool_preferences.md")),
         ]
     else:
         middle = [
+            ("skills", lambda: _static(variant, "skills.md")),
             ("conversational_tool_calling", lambda: _static(variant, "conversational_tool_calling.md")),
             ("professional_objectivity", lambda: _static(variant, "professional_objectivity.md")),
             ("think_before_acting", lambda: _static(variant, "think_before_acting.md")),
@@ -426,7 +428,7 @@ def _sub_agent_sections(variant: str) -> list[tuple[str, callable]]:
     return base + middle
-def build_system_prompt(variant: str | None = None) -> str:
+def build_system_prompt(variant: str | None = None, active_skills_section: str = "") -> str:
     """Build system prompt for main agent.
     Loads section content from prompts/<variant>/. Order is defined by
@@ -435,6 +437,7 @@ def build_system_prompt(variant: str | None = None) -> str:
     Args:
         variant: Variant name (e.g. 'main', 'micro').
             If None, reads from settings.
+        active_skills_section: Optional rendered active-skills block to append.
     Returns:
         Complete system prompt string
@@ -446,7 +449,10 @@ def build_system_prompt(variant: str | None = None) -> str:
             f"Prompt variant '{variant}' not found: "
             f"{_PROMPTS_DIR / variant} does not exist"
         )
-    return _build_prompt(_main_sections(variant))
+    result = _build_prompt(_main_sections(variant))
+    if active_skills_section.strip():
+        result += "\n\n" + active_skills_section.strip()
+    return result
 def build_sub_agent_prompt(sub_agent_type: str = "research", soft_limit_tokens: int | None = None, hard_limit_tokens: int | None = None) -> str:
@@ -486,4 +492,3 @@ def build_sub_agent_prompt(sub_agent_type: str = "research", soft_limit_tokens:
     return "\n\n".join(result)

package/src/llm/providers.py CHANGED Viewed

@@ -8,6 +8,7 @@ from typing import Optional, Dict, Any, Iterator
 import requests
 from exceptions import LLMResponseError
+from .codex_provider import CodexResponsesHandler
 class OpenAIHandler:
@@ -417,6 +418,7 @@ HANDLER_REGISTRY = {
     "kimi": OpenAIHandler,
     "anthropic": AnthropicHandler,
     "local": OpenAIHandler,
+    "codex": CodexResponsesHandler,
 }
@@ -433,4 +435,4 @@ def get_handler(provider_name: str):
     return handler_class()
-__all__ = ['OpenAIHandler', 'AnthropicHandler', 'get_handler']
+__all__ = ['OpenAIHandler', 'AnthropicHandler', 'CodexResponsesHandler', 'get_handler']

package/src/llm/token_tracker.py CHANGED Viewed

@@ -56,6 +56,11 @@ class TokenTracker:
         self.conv_cache_read_tokens = 0        # Per-conversation cache read tokens
         self.conv_cache_creation_tokens = 0    # Per-conversation cache creation tokens
+        # Last usage payload diagnostics (useful for debugging provider reporting gaps)
+        self.last_usage_snapshot = None
+        self.last_usage_keys = []
+        self.last_cache_metrics_reported = None
         # Active prompt variant (loaded from prompts/ directory)
         self.current_variant = "main"
@@ -85,6 +90,16 @@ class TokenTracker:
         if "usage" in usage_data:
             usage_data = usage_with_cost(usage_data)
+        self.last_usage_snapshot = dict(usage_data)
+        self.last_usage_keys = sorted(usage_data.keys())
+        details = usage_data.get('prompt_tokens_details')
+        self.last_cache_metrics_reported = (
+            usage_data.get('cache_read_input_tokens') is not None
+            or usage_data.get('cache_creation_input_tokens') is not None
+            or usage_data.get('cached_tokens') is not None
+            or (isinstance(details, dict) and details.get('cached_tokens') is not None)
+        )
         # Update cumulative token counts (accumulated for billing, never reset by compaction)
         prompt_tokens = usage_data.get('prompt_tokens', 0)
         completion_tokens = usage_data.get('completion_tokens', 0)