zwarm 3.2.1-py3-none-any.whl → 3.6.0-py3-none-any.whl

This diff shows the changes between two publicly released versions of the package, as published to a supported public registry. It is provided for informational purposes only.
zwarm/core/registry.py ADDED
@@ -0,0 +1,333 @@
+ """
+ Model Registry - Centralized LLM model definitions for zwarm.
+
+ This registry defines all supported models with:
+ - Canonical names and aliases
+ - Adapter mapping (which CLI handles the model)
+ - Pricing information
+
+ Add new models here and they'll automatically appear in:
+ - `zwarm interactive` help and `models` command
+ - Cost estimation
+ - Adapter auto-detection from model name
+ """
+
+ from __future__ import annotations
+
+ from dataclasses import dataclass, field
+ from typing import Any
+
+
+ @dataclass
+ class ModelInfo:
+     """Complete information about an LLM model."""
+
+     # Identity
+     canonical: str  # Full model name (e.g., "gpt-5.1-codex-mini")
+     adapter: str  # "codex" or "claude"
+     aliases: list[str] = field(default_factory=list)  # Short names
+
+     # Pricing ($ per million tokens)
+     input_per_million: float = 0.0
+     output_per_million: float = 0.0
+     cached_input_per_million: float | None = None
+
+     # Metadata
+     description: str = ""
+     is_default: bool = False  # Default model for this adapter
+
+     def estimate_cost(
+         self,
+         input_tokens: int,
+         output_tokens: int,
+         cached_tokens: int = 0,
+     ) -> float:
+         """Estimate cost in dollars."""
+         input_cost = (input_tokens / 1_000_000) * self.input_per_million
+         output_cost = (output_tokens / 1_000_000) * self.output_per_million
+
+         # Cached input is billed separately at the discounted rate;
+         # input_tokens is treated here as the non-cached portion.
+         cached_cost = 0.0
+         if cached_tokens and self.cached_input_per_million:
+             cached_cost = (cached_tokens / 1_000_000) * self.cached_input_per_million
+
+         return input_cost + output_cost + cached_cost
+
+
+ # =============================================================================
+ # Model Registry - ADD NEW MODELS HERE
+ # =============================================================================
+
+ MODELS: list[ModelInfo] = [
+     # -------------------------------------------------------------------------
+     # OpenAI Codex Models (via `codex` CLI)
+     # -------------------------------------------------------------------------
+     ModelInfo(
+         canonical="gpt-5.1-codex-mini",
+         adapter="codex",
+         aliases=["codex-mini", "mini"],
+         input_per_million=0.25,
+         output_per_million=2.00,
+         cached_input_per_million=0.025,
+         description="Fast, cost-effective coding model",
+         is_default=True,
+     ),
+     ModelInfo(
+         canonical="gpt-5.1-codex",
+         adapter="codex",
+         aliases=["codex", "codex-full"],
+         input_per_million=1.25,
+         output_per_million=10.00,
+         cached_input_per_million=0.125,
+         description="Full Codex model with extended reasoning",
+     ),
+     ModelInfo(
+         canonical="gpt-5.1-codex-max",
+         adapter="codex",
+         aliases=["codex-max", "max"],
+         input_per_million=1.25,
+         output_per_million=10.00,
+         cached_input_per_million=0.125,
+         description="Maximum context Codex model",
+     ),
+     # -------------------------------------------------------------------------
+     # Anthropic Claude Models (via `claude` CLI)
+     # -------------------------------------------------------------------------
+     ModelInfo(
+         canonical="sonnet",
+         adapter="claude",
+         aliases=["claude-sonnet", "claude-4-sonnet"],
+         input_per_million=3.00,
+         output_per_million=15.00,
+         description="Balanced Claude model for most tasks",
+         is_default=True,
+     ),
+     ModelInfo(
+         canonical="opus",
+         adapter="claude",
+         aliases=["claude-opus", "claude-4-opus"],
+         input_per_million=15.00,
+         output_per_million=75.00,
+         description="Most capable Claude model",
+     ),
+     ModelInfo(
+         canonical="haiku",
+         adapter="claude",
+         aliases=["claude-haiku", "claude-4-haiku"],
+         input_per_million=0.25,
+         output_per_million=1.25,
+         description="Fast, lightweight Claude model",
+     ),
+ ]
+
+
+ # =============================================================================
+ # Registry Lookups
+ # =============================================================================
+
+
+ def _build_lookup_tables() -> tuple[dict[str, ModelInfo], dict[str, ModelInfo]]:
+     """Build lookup tables for fast model resolution."""
+     by_canonical: dict[str, ModelInfo] = {}
+     by_alias: dict[str, ModelInfo] = {}
+
+     for model in MODELS:
+         by_canonical[model.canonical.lower()] = model
+         by_alias[model.canonical.lower()] = model
+         for alias in model.aliases:
+             by_alias[alias.lower()] = model
+
+     return by_canonical, by_alias
+
+
+ _BY_CANONICAL, _BY_ALIAS = _build_lookup_tables()
+
+
+ def resolve_model(name: str) -> ModelInfo | None:
+     """
+     Resolve a model name or alias to its ModelInfo.
+
+     Args:
+         name: Model name, alias, or partial match
+
+     Returns:
+         ModelInfo or None if not found
+     """
+     name_lower = name.lower()
+
+     # Exact match on alias or canonical
+     if name_lower in _BY_ALIAS:
+         return _BY_ALIAS[name_lower]
+
+     # Prefix match (e.g., "gpt-5.1-codex-mini-2026-01" -> "gpt-5.1-codex-mini").
+     # Longest canonicals first, so "gpt-5.1-codex-max-..." resolves to
+     # "gpt-5.1-codex-max" rather than to the shorter prefix "gpt-5.1-codex".
+     for canonical in sorted(_BY_CANONICAL, key=len, reverse=True):
+         if name_lower.startswith(canonical):
+             return _BY_CANONICAL[canonical]
+
+     return None
+
+
+ def get_adapter_for_model(name: str) -> str | None:
+     """
+     Get the adapter name for a model.
+
+     Args:
+         name: Model name or alias
+
+     Returns:
+         Adapter name ("codex" or "claude") or None if unknown
+     """
+     model = resolve_model(name)
+     return model.adapter if model else None
+
+
+ def get_default_model(adapter: str) -> str | None:
+     """
+     Get the default model for an adapter.
+
+     Args:
+         adapter: Adapter name ("codex" or "claude")
+
+     Returns:
+         Default model canonical name or None
+     """
+     for model in MODELS:
+         if model.adapter == adapter and model.is_default:
+             return model.canonical
+     return None
+
+
+ def list_models(adapter: str | None = None) -> list[ModelInfo]:
+     """
+     List available models.
+
+     Args:
+         adapter: Filter by adapter, or None for all
+
+     Returns:
+         List of ModelInfo objects
+     """
+     if adapter:
+         return [m for m in MODELS if m.adapter == adapter]
+     return MODELS.copy()
+
+
+ def list_adapters() -> list[str]:
+     """Get list of unique adapter names."""
+     return sorted({m.adapter for m in MODELS})
+
+
+ def get_models_help_text() -> str:
+     """
+     Generate help text showing all available models.
+
+     Returns formatted string for display in help messages.
+     """
+     lines = ["", "Available models:"]
+
+     for adapter in list_adapters():
+         lines.append(f"\n {adapter.upper()}:")
+         for model in list_models(adapter):
+             default_marker = " *" if model.is_default else ""
+             aliases = ", ".join(model.aliases) if model.aliases else ""
+             alias_str = f" ({aliases})" if aliases else ""
+
+             lines.append(f" {model.canonical}{alias_str}{default_marker}")
+
+     lines.append("\n * = default for adapter")
+     return "\n".join(lines)
+
+
+ def get_models_table_data() -> list[dict[str, Any]]:
+     """
+     Get model data formatted for table display.
+
+     Returns list of dicts with keys: adapter, model, aliases, default, input_price, output_price, description
+     """
+     data = []
+     for model in MODELS:
+         data.append({
+             "adapter": model.adapter,
+             "model": model.canonical,
+             "aliases": ", ".join(model.aliases),
+             "default": model.is_default,
+             "input_price": model.input_per_million,
+             "output_price": model.output_per_million,
+             "description": model.description,
+         })
+     return data
+
+
+ # =============================================================================
+ # Cost Estimation
+ # =============================================================================
+
+
+ def estimate_cost(
+     model: str,
+     input_tokens: int,
+     output_tokens: int,
+     cached_tokens: int = 0,
+ ) -> float | None:
+     """
+     Estimate cost for a model run.
+
+     Args:
+         model: Model name or alias
+         input_tokens: Number of input tokens
+         output_tokens: Number of output tokens
+         cached_tokens: Number of cached input tokens
+
+     Returns:
+         Cost in USD, or None if model unknown
+     """
+     model_info = resolve_model(model)
+     if model_info is None:
+         return None
+
+     return model_info.estimate_cost(input_tokens, output_tokens, cached_tokens)
+
+
+ def format_cost(cost: float | None) -> str:
+     """Format cost as a human-readable string."""
+     if cost is None:
+         return "?"
+     if cost < 0.01:
+         return f"${cost:.4f}"
+     elif cost < 1.00:
+         return f"${cost:.3f}"
+     else:
+         return f"${cost:.2f}"
+
+
+ def estimate_session_cost(
+     model: str,
+     token_usage: dict[str, Any],
+ ) -> dict[str, Any]:
+     """
+     Estimate cost for a session given its token usage.
+
+     Args:
+         model: Model used
+         token_usage: Dict with input_tokens, output_tokens, etc.
+
+     Returns:
+         Dict with cost info: {cost, cost_formatted, pricing_known, ...}
+     """
+     input_tokens = token_usage.get("input_tokens", 0)
+     output_tokens = token_usage.get("output_tokens", 0)
+     cached_tokens = token_usage.get("cached_tokens", 0)
+
+     cost = estimate_cost(model, input_tokens, output_tokens, cached_tokens)
+
+     return {
+         "cost": cost,
+         "cost_formatted": format_cost(cost),
+         "pricing_known": cost is not None,
+         "model": model,
+         "input_tokens": input_tokens,
+         "output_tokens": output_tokens,
+     }
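
The registry is self-contained, so the API added above can be exercised directly. A minimal sketch of how the pieces compose (the token counts are invented for illustration; every name comes from the file above):

    from zwarm.core.registry import (
        estimate_cost,
        format_cost,
        get_adapter_for_model,
        get_default_model,
        resolve_model,
    )

    # Aliases and dated snapshots resolve to the same canonical entry.
    assert resolve_model("mini").canonical == "gpt-5.1-codex-mini"
    assert resolve_model("gpt-5.1-codex-mini-2026-01").canonical == "gpt-5.1-codex-mini"

    # Adapter routing and per-adapter defaults.
    assert get_adapter_for_model("claude-opus") == "claude"
    assert get_default_model("codex") == "gpt-5.1-codex-mini"

    # Unknown models yield None, which format_cost renders as "?".
    cost = estimate_cost("mini", input_tokens=120_000, output_tokens=8_000)
    print(format_cost(cost))  # $0.046
    print(format_cost(estimate_cost("not-a-model", 1, 1)))  # ?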
zwarm/core/test_config.py CHANGED
@@ -20,7 +20,6 @@ def test_default_config():
      assert config.executor.adapter == "codex_mcp"
      assert config.executor.sandbox == "workspace-write"
      assert config.orchestrator.lm == "gpt-5-mini"
-     assert config.orchestrator.sync_first is True
      assert config.state_dir == ".zwarm"


@@ -68,8 +67,8 @@ def test_apply_overrides():
      assert result["executor"]["adapter"] == "claude_code"

      # Override with boolean
-     result = apply_overrides(config, ["orchestrator.sync_first=false"])
-     assert result["orchestrator"]["sync_first"] is False
+     result = apply_overrides(config, ["executor.web_search=true"])
+     assert result["executor"]["web_search"] is True

      # Create new nested path
      result = apply_overrides(config, ["weave.project=my-project"])
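
The updated test still pins down the three behaviors the override syntax relies on: dotted paths address nested keys, `true`/`false` strings coerce to booleans, and missing intermediate tables are created on demand. A hypothetical re-implementation of just those semantics, for illustration only (zwarm's real `apply_overrides` may differ in detail):

    import copy
    from typing import Any

    def apply_overrides_sketch(config: dict[str, Any], overrides: list[str]) -> dict[str, Any]:
        """Illustrative only: dotted-path overrides with bool coercion."""
        result = copy.deepcopy(config)
        for item in overrides:
            path, _, raw = item.partition("=")
            value: Any = {"true": True, "false": False}.get(raw.lower(), raw)
            node = result
            *parents, leaf = path.split(".")
            for key in parents:
                node = node.setdefault(key, {})  # create missing nested tables
            node[leaf] = value
        return result

    assert apply_overrides_sketch({}, ["executor.web_search=true"]) == {"executor": {"web_search": True}}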
zwarm/orchestrator.py CHANGED
@@ -23,7 +23,6 @@ from wbal.helper import TOOL_CALL_TYPE, format_openai_tool_response
  from wbal.lm import LM as wbalLMGeneric
  from wbal.lm import GPT5LargeVerbose

- from zwarm.adapters import ExecutorAdapter, get_adapter
  from zwarm.core.compact import compact_messages, should_compact
  from zwarm.core.config import ZwarmConfig, load_config
  from zwarm.core.environment import OrchestratorEnv
@@ -72,7 +71,6 @@ class Orchestrator(YamlAgent):
      # State management
      _state: StateManager = PrivateAttr()
      _sessions: dict[str, ConversationSession] = PrivateAttr(default_factory=dict)
-     _adapters: dict[str, ExecutorAdapter] = PrivateAttr(default_factory=dict)
      _watcher_manager: WatcherManager | None = PrivateAttr(default=None)
      _resumed: bool = PrivateAttr(default=False)
      _total_tokens: int = PrivateAttr(default=0)  # Cumulative orchestrator tokens
@@ -83,9 +81,11 @@
              "total_tokens": 0,
          }
      )
+     # Callback for step progress (used by CLI to print tool calls)
+     _step_callback: Callable[[int, list[tuple[dict[str, Any], Any]]], None] | None = PrivateAttr(default=None)

      def model_post_init(self, __context: Any) -> None:
-         """Initialize state and adapters after model creation."""
+         """Initialize state after model creation."""
          super().model_post_init(__context)

          # Initialize state manager with instance isolation
@@ -151,40 +151,9 @@
          """Access state manager."""
          return self._state

-     def _get_adapter(self, name: str) -> ExecutorAdapter:
-         """Get or create an adapter by name using the adapter registry."""
-         if name not in self._adapters:
-             # Get model from config (adapters have their own defaults if None)
-             model = self.config.executor.model
-
-             # Use isolated codex config if available
-             config_path = self.working_dir / self.config.state_dir / "codex.toml"
-             if not config_path.exists():
-                 config_path = None  # Fallback to adapter defaults
-
-             self._adapters[name] = get_adapter(
-                 name, model=model, config_path=config_path
-             )
-         return self._adapters[name]
-
      def get_executor_usage(self) -> dict[str, int]:
-         """Get aggregated token usage across all executors."""
-         total = {
-             "input_tokens": 0,
-             "output_tokens": 0,
-             "total_tokens": 0,
-         }
-         for adapter in self._adapters.values():
-             if hasattr(adapter, "total_usage"):
-                 usage = adapter.total_usage
-                 for key in total:
-                     total[key] += usage.get(key, 0)
-         return total
-
-     @property
-     def executor_usage(self) -> dict[str, int]:
-         """Aggregated executor token usage (for Weave tracking)."""
-         return self.get_executor_usage()
+         """Get aggregated token usage from executor sessions."""
+         return self._executor_usage

      def save_state(self) -> None:
          """Save orchestrator state for resume."""
@@ -587,7 +556,11 @@ Review what was accomplished in the previous session and delegate new tasks as n
              }
          # NUDGE and CONTINUE just continue

-         self.step()
+         tool_results = self.step()
+
+         # Call step callback if registered (for CLI progress display)
+         if self._step_callback:
+             self._step_callback(self._step_count, tool_results)

          if self.stopCondition:
              break
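
The new `_step_callback` hook receives the current step count plus the `(tool_call, result)` pairs returned by `step()`. A sketch of how a caller might wire it up; since the attribute is a `PrivateAttr`, this mirrors what the in-tree CLI presumably does rather than a public API, and the `"name"` key on the tool-call dict is an assumption:

    from typing import Any

    def print_progress(step: int, tool_results: list[tuple[dict[str, Any], Any]]) -> None:
        for call, _result in tool_results:
            # "name" is assumed here; the actual tool-call schema comes from wbal.
            print(f"[step {step}] tool call: {call.get('name', '<unknown>')}")

    orch._step_callback = print_progress  # orch: an Orchestrator instance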
@@ -599,8 +572,7 @@

      async def cleanup(self) -> None:
          """Clean up resources."""
-         for adapter in self._adapters.values():
-             await adapter.cleanup()
+         pass  # Session cleanup handled by CodexSessionManager


  def build_orchestrator(
@@ -631,15 +603,17 @@
      """
      from uuid import uuid4

-     # Load configuration
+     # Resolve working directory first (needed for config loading)
+     working_dir = working_dir or Path.cwd()
+
+     # Load configuration from working_dir (not cwd!)
+     # This ensures config.toml and .env are loaded from the project being worked on
      config = load_config(
          config_path=config_path,
          overrides=overrides,
+         working_dir=working_dir,
      )

-     # Resolve working directory
-     working_dir = working_dir or Path.cwd()
-
      # Generate instance ID if not provided (enables isolation by default for new runs)
      # For resume, instance_id should be provided explicitly
      if instance_id is None and not resume:
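
The reordering matters: `working_dir` is now resolved before `load_config` runs, so a `config.toml` and `.env` in the target project take precedence over files in the caller's cwd. A sketch of the call this enables (only the `working_dir` keyword appears in the hunk above; the other parameters keep their defaults):

    from pathlib import Path
    from zwarm.orchestrator import build_orchestrator

    # Config is read from the target project, not from wherever the CLI happens to run.
    orch = build_orchestrator(working_dir=Path("/path/to/project"))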
zwarm/sessions/__init__.py CHANGED
@@ -1,26 +1,65 @@
  """
- Codex Session Manager.
+ Session Manager - Background process management for executor agents.

- A standalone session manager for running Codex agents in the background.
- Similar to Sculptor/Claude parallel tools but for Codex.
+ Supports multiple executor adapters:
+ - Codex (CodexSessionManager) - OpenAI's Codex CLI
+ - Claude (ClaudeSessionManager) - Anthropic's Claude Code CLI

  Features:
- - Start codex exec tasks in background processes
+ - Start executor tasks in background processes
  - Monitor status and view message history
  - Inject follow-up messages (continue conversations)
  - Kill running sessions
+ - Unified interface via BaseSessionManager
  """

- from zwarm.sessions.manager import (
-     CodexSession,
-     CodexSessionManager,
+ from zwarm.sessions.base import (
+     BaseSessionManager,
+     CodexSession,  # Alias for Session (backwards compat)
+     Session,
      SessionMessage,
      SessionStatus,
  )
+ from zwarm.sessions.manager import CodexSessionManager
+
+ # Available adapters
+ AVAILABLE_ADAPTERS = ["codex", "claude"]

  __all__ = [
-     "CodexSession",
-     "CodexSessionManager",
+     # Base classes
+     "BaseSessionManager",
+     "Session",
      "SessionMessage",
      "SessionStatus",
+     # Backwards compatibility
+     "CodexSession",
+     # Adapters
+     "CodexSessionManager",
+     # Registry
+     "AVAILABLE_ADAPTERS",
+     # Factory
+     "get_session_manager",
  ]
+
+
+ def get_session_manager(adapter: str, state_dir: str = ".zwarm") -> BaseSessionManager:
+     """
+     Factory function to get a session manager for the given adapter.
+
+     Args:
+         adapter: Adapter name ("codex" or "claude")
+         state_dir: State directory path
+
+     Returns:
+         Session manager instance
+
+     Raises:
+         ValueError: If adapter is not recognized
+     """
+     if adapter == "codex":
+         return CodexSessionManager(state_dir)
+     elif adapter == "claude":
+         from zwarm.sessions.claude import ClaudeSessionManager
+         return ClaudeSessionManager(state_dir)
+     else:
+         raise ValueError(f"Unknown adapter: {adapter}. Available: {AVAILABLE_ADAPTERS}")
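
With the factory in place, callers can stay adapter-agnostic. A short usage sketch of `get_session_manager` as defined above:

    from zwarm.sessions import get_session_manager

    codex_mgr = get_session_manager("codex")  # CodexSessionManager
    claude_mgr = get_session_manager("claude", state_dir=".zwarm")  # ClaudeSessionManager

    # Unknown adapters fail fast:
    # get_session_manager("gemini") raises ValueError: Unknown adapter: gemini. Available: ['codex', 'claude']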