PyPI - coding-agent-wrapper - Versions diffs - 0.1.0__py3-none-any.whl - Mend

coding-agent-wrapper 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31) hide show

caw/__init__.py +88 -0
caw/agent.py +578 -0
caw/auth/README.md +118 -0
caw/auth/__init__.py +23 -0
caw/auth/cli.py +68 -0
caw/auth/collector.py +324 -0
caw/auth/linker.py +174 -0
caw/auth/manifest.py +77 -0
caw/auth/providers.py +433 -0
caw/auth/status.py +241 -0
caw/cli.py +50 -0
caw/display.py +223 -0
caw/faststats.py +298 -0
caw/mcp.py +602 -0
caw/models.py +385 -0
caw/pricing.json +15 -0
caw/pricing.py +33 -0
caw/provider.py +135 -0
caw/providers/__init__.py +0 -0
caw/providers/claude_code.py +648 -0
caw/providers/codex.py +564 -0
caw/py.typed +0 -0
caw/storage.py +184 -0
caw/toolkit.py +198 -0
caw/viewer/__init__.py +149 -0
caw/viewer/static/index.html +847 -0
coding_agent_wrapper-0.1.0.dist-info/METADATA +213 -0
coding_agent_wrapper-0.1.0.dist-info/RECORD +31 -0
coding_agent_wrapper-0.1.0.dist-info/WHEEL +4 -0
coding_agent_wrapper-0.1.0.dist-info/entry_points.txt +2 -0
coding_agent_wrapper-0.1.0.dist-info/licenses/LICENSE +202 -0

caw/models.py ADDED Viewed

@@ -0,0 +1,385 @@
+"""Core data models for the coding agent wrapper."""
+from __future__ import annotations
+import enum
+from dataclasses import dataclass, field
+from typing import Any, Union
+class ModelTier(enum.Enum):
+    """Abstract model selection tiers.
+    Each provider maps these to concrete model identifiers::
+        agent = Agent(model=ModelTier.STRONGEST)  # provider picks its best model
+        agent = Agent(model=ModelTier.FAST)        # provider picks its fast model
+        agent = Agent(model="claude-opus-4-6")     # explicit model string still works
+    """
+    STRONGEST = "strongest"
+    FAST = "fast"
+class ToolGroup(enum.Flag):
+    """Abstract tool permission groups.
+    Combine with ``|`` (union) and ``-`` (subtract) to build permission sets::
+        ToolGroup.READER | ToolGroup.EXEC          # read + execute only
+        ToolGroup.ALL - ToolGroup.WRITER            # everything except writes
+        ToolGroup.ALL - ToolGroup.INTERACTION       # default for automated pipelines
+    """
+    READER = enum.auto()
+    WRITER = enum.auto()
+    EXEC = enum.auto()
+    WEB = enum.auto()
+    PARALLEL = enum.auto()
+    INTERACTION = enum.auto()
+    ALL = READER | WRITER | EXEC | WEB | PARALLEL | INTERACTION
+    NO_INTERACTION = READER | WRITER | EXEC | WEB | PARALLEL
+    def __sub__(self, other):
+        if not isinstance(other, ToolGroup):
+            return NotImplemented
+        return self & ~other
+@dataclass
+class MCPServer:
+    """Configuration for an MCP server.
+    For stdio transport, set ``command``/``args``/``env``.
+    For HTTP transport, set ``url`` (command/args/env are ignored).
+    """
+    name: str
+    command: str = ""
+    args: list[str] = field(default_factory=list)
+    env: dict[str, str] = field(default_factory=dict)
+    url: str = ""
+@dataclass
+class AgentSpec:
+    """Configuration for a subagent."""
+    name: str = ""
+    description: str = ""
+    system_prompt: str = ""
+    model: str = ""
+    reasoning: str = ""
+    tools: ToolGroup | None = None
+    tool_servers: list[Any] = field(default_factory=list)
+    mcp_servers: list[MCPServer] = field(default_factory=list)
+    subagents: list["AgentSpec"] = field(default_factory=list)
+    metadata: dict[str, Any] = field(default_factory=dict)
+@dataclass
+class MCPTool:
+    """Descriptor for a tool provided by an MCP server."""
+    name: str
+    description: str = ""
+    server: str = ""
+    input_schema: dict[str, Any] = field(default_factory=dict)
+@dataclass
+class TextBlock:
+    """A block of text output from the agent."""
+    text: str
+@dataclass
+class ThinkingBlock:
+    """A block of thinking/reasoning output from the agent."""
+    text: str
+@dataclass
+class ToolUse:
+    """A tool invocation paired with its result."""
+    id: str
+    name: str
+    arguments: dict[str, Any] = field(default_factory=dict)
+    output: str = ""
+    is_error: bool = False
+    subagent_trajectory: Trajectory | None = None
+ContentBlock = Union[TextBlock, ThinkingBlock, ToolUse]
+@dataclass
+class UsageStats:
+    """Token usage and cost statistics."""
+    input_tokens: int = 0
+    output_tokens: int = 0
+    cache_read_tokens: int = 0
+    cache_write_tokens: int = 0
+    cost_usd: float = 0.0
+    @property
+    def total_tokens(self) -> int:
+        """Total tokens consumed (input + output)."""
+        return self.input_tokens + self.output_tokens
+    def __add__(self, other: UsageStats) -> UsageStats:
+        return UsageStats(
+            input_tokens=self.input_tokens + other.input_tokens,
+            output_tokens=self.output_tokens + other.output_tokens,
+            cache_read_tokens=self.cache_read_tokens + other.cache_read_tokens,
+            cache_write_tokens=self.cache_write_tokens + other.cache_write_tokens,
+            cost_usd=self.cost_usd + other.cost_usd,
+        )
+    def to_dict(self) -> dict[str, Any]:
+        return {
+            "input_tokens": self.input_tokens,
+            "output_tokens": self.output_tokens,
+            "cache_read_tokens": self.cache_read_tokens,
+            "cache_write_tokens": self.cache_write_tokens,
+            "cost_usd": self.cost_usd,
+        }
+    @classmethod
+    def from_dict(cls, d: dict[str, Any]) -> UsageStats:
+        return cls(
+            input_tokens=d.get("input_tokens", 0),
+            output_tokens=d.get("output_tokens", 0),
+            cache_read_tokens=d.get("cache_read_tokens", 0),
+            cache_write_tokens=d.get("cache_write_tokens", 0),
+            cost_usd=d.get("cost_usd", 0.0),
+        )
+@dataclass
+class Turn:
+    """A single turn: user sends a message, agent responds."""
+    input: str
+    output: list[ContentBlock] = field(default_factory=list)
+    usage: UsageStats = field(default_factory=UsageStats)
+    duration_ms: int = 0
+    @property
+    def result(self) -> str:
+        """Last text block's content."""
+        for block in reversed(self.output):
+            if isinstance(block, TextBlock) and block.text:
+                return block.text
+        return ""
+    @property
+    def tool_calls(self) -> list[ToolUse]:
+        """All tool calls made during this turn."""
+        return [b for b in self.output if isinstance(b, ToolUse)]
+    def to_dict(self) -> dict[str, Any]:
+        return {
+            "input": self.input,
+            "output": [_block_to_dict(b) for b in self.output],
+            "usage": self.usage.to_dict(),
+            "duration_ms": self.duration_ms,
+        }
+    @classmethod
+    def from_dict(cls, d: dict[str, Any]) -> Turn:
+        return cls(
+            input=d.get("input", ""),
+            output=[_block_from_dict(b) for b in d.get("output", [])],
+            usage=UsageStats.from_dict(d.get("usage", {})),
+            duration_ms=d.get("duration_ms", 0),
+        )
+@dataclass
+class Trajectory:
+    """Complete record of a session.
+    ``usage`` tracks this agent's own token usage. Use ``total_usage`` to get
+    the accumulated usage including all nested subagent trajectories.
+    """
+    agent: str
+    model: str = ""
+    session_id: str = ""
+    created_at: str = ""
+    completed_at: str = ""
+    usage_limited: bool = False
+    system_prompt: str = ""
+    reasoning: str = ""
+    mcp_servers: list[MCPServer] = field(default_factory=list)
+    turns: list[Turn] = field(default_factory=list)
+    usage: UsageStats = field(default_factory=UsageStats)
+    duration_ms: int = 0
+    metadata: dict[str, Any] = field(default_factory=dict)
+    @property
+    def num_turns(self) -> int:
+        return len(self.turns)
+    @property
+    def result(self) -> str:
+        """The final result from the last turn."""
+        if self.turns:
+            return self.turns[-1].result
+        return ""
+    @property
+    def total_tool_calls(self) -> int:
+        return sum(len(t.tool_calls) for t in self.turns)
+    @property
+    def total_usage(self) -> UsageStats:
+        """Accumulated usage: own + all nested subagent trajectories (recursive)."""
+        total = self.usage
+        for turn in self.turns:
+            for block in turn.output:
+                if isinstance(block, ToolUse) and block.subagent_trajectory:
+                    total = total + block.subagent_trajectory.total_usage
+        return total
+    @property
+    def subagent_trajectories(self) -> list[Trajectory]:
+        """All subagent trajectories across all turns."""
+        trajs: list[Trajectory] = []
+        for turn in self.turns:
+            for block in turn.output:
+                if isinstance(block, ToolUse) and block.subagent_trajectory:
+                    trajs.append(block.subagent_trajectory)
+        return trajs
+    @property
+    def is_usage_limited(self) -> bool:
+        """Whether the session ended due to a usage limit.
+        Set by ``Session.end()`` using the provider's ``detect_usage_limit``.
+        """
+        return self.usage_limited
+    @property
+    def is_complete(self) -> bool:
+        """Whether the session completed normally.
+        A trajectory is complete when it has been finalized (``completed_at``
+        is set by ``Session.end()``) and was not usage-limited.  Mid-session
+        snapshots written by ``append_turn`` have an empty ``completed_at``
+        and are therefore not considered complete.
+        """
+        return bool(self.completed_at) and not self.is_usage_limited
+    def to_dict(self) -> dict[str, Any]:
+        return {
+            "agent": self.agent,
+            "model": self.model,
+            "session_id": self.session_id,
+            "created_at": self.created_at,
+            "completed_at": self.completed_at,
+            "usage_limited": self.usage_limited,
+            "system_prompt": self.system_prompt,
+            "reasoning": self.reasoning,
+            "mcp_servers": [
+                {"name": s.name, "command": s.command, "args": s.args, "env": s.env, "url": s.url}
+                for s in self.mcp_servers
+            ],
+            "turns": [t.to_dict() for t in self.turns],
+            "usage": self.usage.to_dict(),
+            "total_usage": self.total_usage.to_dict(),
+            "duration_ms": self.duration_ms,
+            "metadata": self.metadata,
+        }
+    @classmethod
+    def from_dict(cls, d: dict[str, Any]) -> Trajectory:
+        return cls(
+            agent=d.get("agent", ""),
+            model=d.get("model", ""),
+            session_id=d.get("session_id", ""),
+            created_at=d.get("created_at", ""),
+            completed_at=d.get("completed_at", ""),
+            usage_limited=d.get("usage_limited", False),
+            system_prompt=d.get("system_prompt", ""),
+            reasoning=d.get("reasoning", ""),
+            mcp_servers=[
+                MCPServer(
+                    name=s.get("name", ""),
+                    command=s.get("command", ""),
+                    args=s.get("args", []),
+                    env=s.get("env", {}),
+                    url=s.get("url", ""),
+                )
+                for s in d.get("mcp_servers", [])
+            ],
+            turns=[Turn.from_dict(t) for t in d.get("turns", [])],
+            usage=UsageStats.from_dict(d.get("usage", {})),
+            duration_ms=d.get("duration_ms", 0),
+            metadata=d.get("metadata", {}),
+        )
+# -- Interactive result type, then serialization helpers for content blocks --
+@dataclass
+class InteractiveResult:
+    """Result from an interactive agent session."""
+    exit_code: int
+    output: str = ""  # raw terminal output (may include ANSI escape sequences)
+    @property
+    def session_id(self) -> str | None:
+        """Extract the session ID from Claude Code's exit output, if present."""
+        import re
+        m = re.search(r"--resume\s+(\S+)", self.output)
+        return m.group(1) if m else None
+def _block_to_dict(block: ContentBlock) -> dict[str, Any]:
+    if isinstance(block, TextBlock):
+        return {"type": "text", "text": block.text}
+    elif isinstance(block, ThinkingBlock):
+        return {"type": "thinking", "text": block.text}
+    else:  # ToolUse
+        d: dict[str, Any] = {
+            "type": "tool_use",
+            "id": block.id,
+            "name": block.name,
+            "arguments": block.arguments,
+            "output": block.output,
+        }
+        if block.is_error:
+            d["is_error"] = True
+        if block.subagent_trajectory:
+            d["subagent_trajectory"] = block.subagent_trajectory.to_dict()
+        return d
+def _block_from_dict(d: dict[str, Any]) -> ContentBlock:
+    btype = d.get("type", "")
+    if btype == "text":
+        return TextBlock(text=d.get("text", ""))
+    elif btype == "thinking":
+        return ThinkingBlock(text=d.get("text", ""))
+    else:  # tool_use
+        sub_traj = None
+        if d.get("subagent_trajectory"):
+            sub_traj = Trajectory.from_dict(d["subagent_trajectory"])
+        return ToolUse(
+            id=d.get("id", ""),
+            name=d.get("name", ""),
+            arguments=d.get("arguments", {}),
+            output=d.get("output", ""),
+            is_error=d.get("is_error", False),
+            subagent_trajectory=sub_traj,
+        )

caw/pricing.json ADDED Viewed

@@ -0,0 +1,15 @@
+{
+  "_comment": "Pricing in USD per 1 million tokens, keyed by agent then model",
+  "codex": {
+    "gpt-5.2-codex": {
+      "input": 1.75,
+      "cached_input": 0.175,
+      "output": 14.0
+    },
+    "gpt-5.3-codex": {
+      "input": 1.75,
+      "cached_input": 0.175,
+      "output": 14.0
+    }
+  }
+}

caw/pricing.py ADDED Viewed

@@ -0,0 +1,33 @@
+"""Token-based cost computation from pricing config."""
+from __future__ import annotations
+import json
+from pathlib import Path
+from typing import Any
+from caw.models import UsageStats
+_pricing_cache: dict[str, Any] | None = None
+def _load_pricing() -> dict[str, Any]:
+    global _pricing_cache
+    if _pricing_cache is None:
+        path = Path(__file__).parent / "pricing.json"
+        if path.exists():
+            _pricing_cache = json.loads(path.read_text())
+        else:
+            _pricing_cache = {}
+    return _pricing_cache
+def compute_cost(agent: str, model: str, usage: UsageStats) -> float:
+    """Compute cost in USD from token counts and pricing config."""
+    pricing = _load_pricing().get(agent, {}).get(model, {})
+    cost = (
+        usage.input_tokens * pricing.get("input", 0.0)
+        + usage.cache_read_tokens * pricing.get("cached_input", 0.0)
+        + usage.output_tokens * pricing.get("output", 0.0)
+    ) / 1_000_000
+    return cost

caw/provider.py ADDED Viewed

@@ -0,0 +1,135 @@
+"""Abstract base classes for provider implementations."""
+from __future__ import annotations
+from abc import ABC, abstractmethod
+from collections.abc import Callable
+from typing import Any
+from caw.models import InteractiveResult, MCPServer, ModelTier, ToolGroup, Trajectory, Turn
+class ProviderSession(ABC):
+    """ABC that each provider implements to manage a live session."""
+    @abstractmethod
+    def send(self, message: str) -> Turn:
+        """Send a message and return the agent's response turn."""
+        ...
+    @abstractmethod
+    def end(self) -> Trajectory:
+        """Finalize the session and return the complete trajectory."""
+        ...
+    @property
+    @abstractmethod
+    def trajectory(self) -> Trajectory:
+        """The accumulated trajectory so far."""
+        ...
+    def detect_usage_limit(self, turn: Turn) -> int | None:
+        """Check whether *turn* indicates the provider's usage limit was hit.
+        Returns the number of minutes to wait before retrying, or ``None``
+        if no limit was detected.  Override in provider subclasses to
+        implement provider-specific detection logic.
+        """
+        return None
+    @property
+    def session_id(self) -> str | None:
+        """Provider-assigned session ID (if any)."""
+        return None
+    @property
+    def last_raw_output(self) -> str | None:
+        """Raw CLI stdout from the most recent send() call (if available)."""
+        return None
+    def set_step_callback(self, callback: Callable[[list], None] | None) -> None:
+        """Set callback invoked after each step within send()."""
+        pass  # default no-op; concrete providers override
+class Provider(ABC):
+    """ABC that each coding agent backend implements."""
+    @property
+    @abstractmethod
+    def name(self) -> str:
+        """Provider identifier (e.g. 'claude_code', 'codex')."""
+        ...
+    def resolve_model(self, tier: ModelTier) -> str:
+        """Translate a :class:`ModelTier` into a concrete model identifier.
+        Each provider must override this to map abstract tiers (e.g.
+        ``ModelTier.STRONGEST``) to the actual model string it supports.
+        """
+        raise NotImplementedError(
+            f"{self.name} provider does not implement resolve_model(); "
+            f"pass an explicit model string instead of ModelTier.{tier.name}"
+        )
+    def resolve_tool_restrictions(self, tools: ToolGroup) -> dict[str, Any]:
+        """Translate ToolGroup into provider-specific session kwargs.
+        Receives a concrete ToolGroup value (never None — the Agent layer
+        applies the default before calling this).
+        """
+        return {}
+    def check_limit(self, model: str | None = None) -> int | None:
+        """Probe whether the provider's usage limit is currently active.
+        Sends a minimal test prompt and checks if the response indicates a
+        usage-limit.  Returns the estimated number of minutes to wait before
+        the limit resets, or ``None`` if no limit is detected.
+        This incurs a small token cost for the probe request.
+        """
+        from caw.display import get_global_display, set_global_display
+        old_display = get_global_display()
+        set_global_display(None)
+        try:
+            session = self.start_session(
+                mcp_servers=[],
+                model=model,
+                system_prompt="Reply with the single word 'ok'.",
+                **self._limit_probe_kwargs(),
+            )
+            try:
+                turn = session.send("hi")
+                return session.detect_usage_limit(turn)
+            finally:
+                session.end()
+        finally:
+            set_global_display(old_display)
+    def _limit_probe_kwargs(self) -> dict[str, Any]:
+        """Extra session kwargs for the limit-check probe.
+        Override in subclasses to disable tools and minimise side-effects.
+        """
+        return {}
+    def start_interactive(
+        self, initial_prompt: str, mcp_servers: list[MCPServer], capture_bytes: int = 0, **kwargs: Any
+    ) -> InteractiveResult:
+        """Launch the provider binary interactively with an initial prompt.
+        Hands control to the user's terminal — stdin/stdout/stderr are
+        inherited so the user interacts with the agent directly.
+        A copy of stdout is captured via a pty.
+        Returns an :class:`InteractiveResult` with the exit code and
+        captured output.
+        """
+        raise NotImplementedError(f"{self.name} provider does not support interactive mode.")
+    @abstractmethod
+    def start_session(self, mcp_servers: list[MCPServer], **kwargs: Any) -> ProviderSession:
+        """Create and return a new provider session."""
+        ...

caw/providers/__init__.py ADDED Viewed

File without changes