PyPI - claude-in-codex - Versions diffs - 0.6.0__py3-none-any.whl - Mend

claude-in-codex 0.6.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16)

claude_in_codex/__init__.py +5 -0
claude_in_codex/claude.py +381 -0
claude_in_codex/cli_contract.py +123 -0
claude_in_codex/config.py +295 -0
claude_in_codex/context.py +310 -0
claude_in_codex/jobs.py +603 -0
claude_in_codex/normalize.py +268 -0
claude_in_codex/preflight.py +94 -0
claude_in_codex/py.typed +0 -0
claude_in_codex/schemas.py +405 -0
claude_in_codex/server.py +2087 -0
claude_in_codex-0.6.0.dist-info/METADATA +253 -0
claude_in_codex-0.6.0.dist-info/RECORD +16 -0
claude_in_codex-0.6.0.dist-info/WHEEL +4 -0
claude_in_codex-0.6.0.dist-info/entry_points.txt +2 -0
claude_in_codex-0.6.0.dist-info/licenses/LICENSE +21 -0

claude_in_codex/__init__.py ADDED Viewed

@@ -0,0 +1,5 @@
+"""claude-in-codex: call Claude Code from Codex for bounded, read-only critique."""
+from importlib.metadata import version
+# Package version, looked up from the installed distribution's metadata at import
+# time. NOTE(review): importlib.metadata.version raises PackageNotFoundError when
+# the distribution is not installed (e.g. running from a bare source checkout).
+__version__ = version("claude-in-codex")

claude_in_codex/claude.py ADDED Viewed

@@ -0,0 +1,381 @@
+"""Build and run the `claude` CLI invocation; classify failures."""
+from __future__ import annotations
+import contextlib
+import json
+import os
+import signal
+import subprocess
+import time
+from dataclasses import dataclass
+from typing import TYPE_CHECKING
+import anyio
+from anyio.to_thread import run_sync
+from claude_in_codex import cli_contract, preflight
+from claude_in_codex.config import (
+    INDEPENDENT_CRITIC_PROMPT,
+    access_flags,
+    config_mode_flags,
+    is_env_placeholder,
+)
+from claude_in_codex.schemas import ErrorInfo
+# Repair hint attached to every budget_exceeded error built by classify_failure.
+_BUDGET_REPAIR = (
+    "Raise max_budget_usd or reduce context. For small prompts, try at least "
+    "$0.10-$0.20; lower best-effort budgets can spend and still stop before a "
+    "useful answer."
+)
+# config_mode values treated as login-backed: for these, _claude_subprocess_env
+# strips the direct-credential env vars below; any other mode inherits the
+# parent environment unchanged.
+_LOGIN_MODES = frozenset({"inherit", "scoped", "safe"})
+# Anthropic direct-credential env vars removed for the login-backed modes.
+_LOGIN_CREDENTIAL_ENV_VARS = ("ANTHROPIC_API_KEY", "ANTHROPIC_AUTH_TOKEN")
+if TYPE_CHECKING:
+    from claude_in_codex.preflight import FlagSupport
+@dataclass
+class ClaudeRun:
+    """Outcome of one `claude` subprocess invocation, as built by run_claude_async."""
+    # Captured standard output; empty when the run timed out or never started.
+    stdout: str
+    # Captured standard error, or a sentinel set by run_claude_async:
+    # "claude_not_found" (spawn failed) or "timeout".
+    stderr: str
+    # Process return code; 127 when spawning failed, -9 when the run timed out.
+    exit_code: int
+    # Wall-clock duration in milliseconds, measured with time.monotonic().
+    elapsed_ms: int
+    # True only when the run was killed for exceeding its timeout.
+    timed_out: bool
+def _claude_subprocess_env(config_mode: str | None) -> dict[str, str] | None:
+    """Build the environment override for a `claude` subprocess, if one is needed.
+    For login-backed modes the child must authenticate through Claude Code's
+    OAuth/session path, so the Anthropic direct-credential variables are left out
+    of its environment even when the MCP server itself was started with stale or
+    placeholder values for them. Every other mode (notably bare, which depends on
+    those credentials) gets None, meaning "inherit the parent environment".
+    """
+    if config_mode in _LOGIN_MODES:
+        return {
+            name: value
+            for name, value in os.environ.items()
+            if name not in _LOGIN_CREDENTIAL_ENV_VARS
+        }
+    return None
+def _gate_optional(tokens: list[str], fs: FlagSupport) -> tuple[list[str], list[str]]:
+    """Drop HELP_GATED flags the installed `claude` does not advertise in --help.
+    Walks `tokens` left to right. A gated flag that is unsupported is removed
+    together with its value token (when it takes one) and recorded in the dropped
+    list. A gated flag that IS supported is copied together with its value in one
+    step, so the value is never re-scanned as if it were a flag: otherwise a
+    caller-supplied value that happens to equal an unsupported gated flag name
+    (e.g. `--model --effort`) would be dropped and swallow the token after it.
+    Tokens that are not gated flags are copied one at a time; ALWAYS_SEND flags
+    are never in HELP_GATED_FLAGS, so they always survive.
+    Returns (kept_tokens, dropped_flags)."""
+    kept: list[str] = []
+    dropped: list[str] = []
+    i = 0
+    while i < len(tokens):
+        token = tokens[i]
+        # None => not a gated flag; True/False => gated, with/without a value.
+        takes_value = cli_contract.HELP_GATED_FLAGS.get(token)
+        # Number of argv slots this token occupies (flag plus optional value).
+        width = 2 if takes_value else 1
+        if takes_value is not None and not preflight.is_supported(token, fs):
+            dropped.append(token)
+        else:
+            # Slicing tolerates a value-taking flag that is the last token.
+            kept.extend(tokens[i : i + width])
+        i += width
+    return kept, dropped
+def build_command(
+    prompt: str,
+    config_mode: str,
+    access: str,
+    model: str | None,
+    max_budget_usd: float,
+    effort: str | None = None,
+    flag_support: FlagSupport | None = None,
+) -> tuple[list[str], list[str]]:
+    """Assemble the argv for one `claude` run. Returns (cmd, dropped_optional_flags).
+    Flags that carry a guarantee are always emitted. HELP_GATED flags (depth or
+    cosmetic only) are filtered out when the installed CLI does not list them, so
+    a minor upstream change degrades the run instead of aborting a paid one. The
+    dropped list feeds Meta.compat_warnings.
+    `prompt` is accepted for interface symmetry but never placed on argv: the
+    runner pipes it over stdin, which keeps gathered diffs/context out of local
+    process listings."""
+    del prompt
+    support = preflight.flag_support() if flag_support is None else flag_support
+    # --no-chrome turns off the "Claude in Chrome" integration; left on, it could
+    # open an interactive picker and hang an unattended run until the timeout,
+    # burning both the timeout and the spend without producing an answer.
+    argv: list[str] = [
+        cli_contract.CLAUDE_BIN,
+        *cli_contract.CORE_INVOCATION,
+        "--no-chrome",
+    ]
+    argv.extend(config_mode_flags(config_mode))
+    argv.extend(access_flags(access))
+    argv.extend(("--append-system-prompt", INDEPENDENT_CRITIC_PROMPT))
+    argv.extend(("--max-budget-usd", f"{max_budget_usd}"))
+    # An effort value outside VALID_EFFORTS is silently omitted.
+    if effort and effort in cli_contract.VALID_EFFORTS:
+        argv.extend(("--effort", effort))
+    if model:
+        argv.extend(("--model", model))
+    cmd, dropped = _gate_optional(argv, support)
+    return cmd, dropped
+def auth_status(
+    timeout_seconds: int = 10, *, config_mode: str | None
+) -> tuple[bool | None, str | None]:
+    """Check login state via `claude auth status`; this never makes a paid call.
+    Returns (logged_in, detail). When the probe itself cannot run (binary missing,
+    timeout, other spawn failure) the result is (None, None) so callers can report
+    "unknown" instead of a misleading False. Otherwise logged_in mirrors whether
+    the CLI exited 0.
+    detail is a fixed, NON-identifying sentence rather than the CLI's own output:
+    `claude auth status` prints the account email and organization, which must
+    not leak into shared logs/transcripts. The boolean already carries the
+    machine-readable truth, so the raw text is discarded on purpose."""
+    argv = [cli_contract.CLAUDE_BIN, *cli_contract.AUTH_STATUS_ARGS]
+    try:
+        completed = subprocess.run(
+            argv,
+            capture_output=True,
+            text=True,
+            timeout=timeout_seconds,
+            check=False,
+            env=_claude_subprocess_env(config_mode),
+        )
+    except (OSError, subprocess.SubprocessError):
+        return None, None
+    if completed.returncode == 0:
+        return True, "Claude CLI reports an authenticated session."
+    return False, "Claude CLI reports no authenticated session; run `claude /login`."
+def _kill_process_tree(proc: subprocess.Popen) -> None:
+    """Best-effort SIGKILL of `proc` and its descendants; no-op if it already exited.
+    On POSIX the whole process group is killed (the child was started as its own
+    session leader). Where process groups do not exist (e.g. Windows), or when
+    the group kill fails because the group is gone or not ours, only the process
+    itself is killed."""
+    if proc.poll() is not None:
+        return
+    group_kill = getattr(os, "killpg", None)
+    try:
+        if group_kill is None:  # pragma: no cover - non-POSIX fallback
+            proc.kill()
+        else:
+            group_kill(os.getpgid(proc.pid), signal.SIGKILL)
+    except (ProcessLookupError, PermissionError):
+        # Group kill was not possible; fall back to the single process and
+        # tolerate it having exited in the meantime.
+        with contextlib.suppress(ProcessLookupError):
+            proc.kill()
+async def run_claude_async(
+    cmd: list[str],
+    cwd: str,
+    timeout_seconds: int,
+    stdin_text: str | None = None,
+    *,
+    config_mode: str,
+) -> ClaudeRun:
+    """Run `claude` as a subprocess, returning a ClaudeRun.
+    The subprocess is started in its own session (process group) so that, on a
+    timeout OR an MCP request cancellation, we can terminate the whole tree
+    rather than orphaning a paid Claude run.
+    `stdin_text`, when given, is written to the child's stdin; when None no stdin
+    pipe is created. `config_mode` selects the child environment via
+    _claude_subprocess_env. Special results: a spawn failure yields
+    ClaudeRun("", "claude_not_found", 127, ...); a timeout yields
+    ClaudeRun("", "timeout", -9, ..., timed_out=True) and discards any partial
+    output. Cancellation kills the process tree and re-raises."""
+    start = time.monotonic()
+    try:
+        proc = subprocess.Popen(
+            cmd,
+            cwd=cwd,
+            stdin=subprocess.PIPE if stdin_text is not None else None,
+            stdout=subprocess.PIPE,
+            stderr=subprocess.PIPE,
+            text=True,
+            encoding="utf-8",
+            env=_claude_subprocess_env(config_mode),
+            start_new_session=True,
+        )
+    except OSError:
+        # NOTE(review): every OSError is reported as claude_not_found, including
+        # ones unrelated to the binary (e.g. a missing or unreadable cwd) —
+        # confirm that is intended.
+        elapsed = int((time.monotonic() - start) * 1000)
+        return ClaudeRun("", "claude_not_found", 127, elapsed, False)
+    def _wait() -> tuple[str, str, bool]:
+        # Blocking wait, executed in a worker thread. Returns (stdout, stderr,
+        # timed_out).
+        try:
+            out, err = proc.communicate(input=stdin_text, timeout=timeout_seconds)
+            return out, err, False
+        except subprocess.TimeoutExpired:
+            # Kill first, then drain the pipes so the child is reaped.
+            _kill_process_tree(proc)
+            out, err = proc.communicate()
+            return out, err, True
+    try:
+        # abandon_on_cancel=True lets this await be cancelled without waiting for
+        # the worker thread; the handler below then kills the child.
+        out, err, timed_out = await run_sync(_wait, abandon_on_cancel=True)
+    except anyio.get_cancelled_exc_class():
+        _kill_process_tree(proc)
+        raise
+    elapsed = int((time.monotonic() - start) * 1000)
+    if timed_out:
+        return ClaudeRun("", "timeout", -9, elapsed, True)
+    return ClaudeRun(out, err, proc.returncode, elapsed, False)
+def _auth_repair_for(config_mode: str | None) -> str:
+    """Pick the repair hint for a "not authenticated" failure in `config_mode`.
+    bare mode points at ANTHROPIC_API_KEY (or switching to a login-backed mode),
+    login-backed modes point at `claude /login`, and an unknown or absent mode
+    gets a hint covering both routes."""
+    if config_mode == "bare":
+        return (
+            "Set a valid ANTHROPIC_API_KEY, or use config_mode inherit/scoped/safe "
+            "after `claude /login`."
+        )
+    if config_mode in _LOGIN_MODES:
+        return "Run `claude /login`; the attempted config_mode uses the Claude login path."
+    return "Run `claude /login`, or set a valid ANTHROPIC_API_KEY for config_mode=bare."
+def _api_key_repair_for(config_mode: str | None) -> str:
+    """Pick the repair hint for an "invalid API key" failure in `config_mode`.
+    An unexpanded placeholder in the server's own environment takes precedence
+    over the mode-specific hints."""
+    # A literal `${ANTHROPIC_API_KEY}` means the host never expanded the env
+    # substitution; that is not a rotated/revoked key, so "set a valid key" would
+    # send the user in the wrong direction.
+    raw_key = os.environ.get("ANTHROPIC_API_KEY")
+    if is_env_placeholder(raw_key):
+        return (
+            "ANTHROPIC_API_KEY is a literal ${...} placeholder; your MCP host is not "
+            "expanding env substitutions. Use an env_vars passthrough list, or set a "
+            "literal key."
+        )
+    if config_mode in _LOGIN_MODES:
+        return (
+            "The attempted config_mode does not rely on ANTHROPIC_API_KEY; unset or fix "
+            "ANTHROPIC_API_KEY, then rerun claude_status before retrying."
+        )
+    # bare mode and any unknown/absent mode share the same hint.
+    return (
+        "Set a valid ANTHROPIC_API_KEY, or use config_mode inherit/scoped/safe "
+        "after `claude /login`."
+    )
+def _has_logged_out_signal(blob: str) -> bool:
+    """Whether `blob` contains Claude's explicit logged-out wording.
+    The match is case-sensitive; callers pass already-lowercased text."""
+    # Deliberately narrow: a bare "/login" also shows up in reviewed content and
+    # in URLs echoed by Claude, so only the full prompt phrasings count.
+    phrases = ("not logged in", "please run /login")
+    return any(phrase in blob for phrase in phrases)
+def _has_invalid_api_key_signal(blob: str) -> bool:
+    """Whether `blob` contains one of the known invalid-API-key phrasings.
+    The match is case-sensitive; callers pass already-lowercased text."""
+    phrases = (
+        "api_key_invalid",
+        "invalid api key",
+        "anthropic_api_key is invalid",
+    )
+    return any(phrase in blob for phrase in phrases)
+def classify_failure(run: ClaudeRun, *, config_mode: str | None = None) -> ErrorInfo:
+    """Map a failed ClaudeRun to an ErrorInfo (code, message, repair hint).
+    Checks run in a fixed order and the first match wins:
+    1. the "claude_not_found" stderr sentinel, then the timed_out flag;
+    2. if stdout parses as a JSON object that is flagged is_error or carries a
+       non-success subtype, classify from its subtype/result (auth, API key,
+       budget, permission, retryable, contract drift, else generic);
+    3. otherwise scan stdout/stderr text for auth, API-key, budget, and finally
+       contract-drift signatures, falling back to a generic nonzero_exit.
+    `config_mode` only influences the wording of the auth/API-key repair hints."""
+    env = None
+    # stdout is expected to be a JSON envelope; anything unparsable leaves env None.
+    with contextlib.suppress(json.JSONDecodeError, ValueError, TypeError):
+        env = json.loads(run.stdout)
+    if run.stderr == "claude_not_found":
+        return ErrorInfo(
+            code="claude_not_found",
+            message="The `claude` CLI was not found on PATH.",
+            repair="Install Claude Code and ensure `claude` is on PATH.",
+        )
+    if run.timed_out:
+        return ErrorInfo(
+            code="timeout",
+            message="claude exceeded the timeout.",
+            repair="Narrow the scope/focus or raise timeout_seconds.",
+            retryable=True,
+        )
+    # Structured path: the envelope itself reports an error.
+    if isinstance(env, dict) and (
+        env.get("is_error") or env.get("subtype") not in cli_contract.SUCCESS_SUBTYPES
+    ):
+        subtype = str(env.get("subtype") or "").lower()
+        result = str(env.get("result") or "")
+        # structured_blob holds only envelope fields; combined_blob adds stderr.
+        structured_blob = f"{subtype}\n{result}".lower()
+        combined_blob = f"{structured_blob}\n{run.stderr}".lower()
+        if _has_logged_out_signal(combined_blob):
+            return ErrorInfo(
+                code="claude_auth_required",
+                message="claude is not authenticated.",
+                repair=_auth_repair_for(config_mode),
+            )
+        if _has_invalid_api_key_signal(structured_blob):
+            return ErrorInfo(
+                code="api_key_invalid",
+                message="ANTHROPIC_API_KEY is invalid.",
+                repair=_api_key_repair_for(config_mode),
+            )
+        # NOTE(review): the probes below are plain substring tests, so "auth"
+        # also matches e.g. "author" and "rate" matches e.g. "generate" — confirm
+        # this breadth is acceptable for the envelope's result text.
+        if "auth" in structured_blob or "login" in structured_blob:
+            return ErrorInfo(
+                code="claude_auth_required",
+                message="claude is not authenticated.",
+                repair=_auth_repair_for(config_mode),
+            )
+        if "budget" in structured_blob:
+            return ErrorInfo(
+                code="budget_exceeded",
+                message="claude reached the max-budget stop threshold "
+                "(a best-effort limit, not a hard cap).",
+                repair=_BUDGET_REPAIR,
+                retryable=True,
+            )
+        if "permission" in structured_blob or "denied" in structured_blob:
+            return ErrorInfo(
+                code="claude_permission_error",
+                message="claude was denied a requested permission.",
+                repair="Use access=toolless, or allow the needed read-only tools.",
+            )
+        if "rate" in structured_blob or "overloaded" in structured_blob:
+            return ErrorInfo(
+                code="nonzero_exit",
+                message=f"claude reported a retryable error: {result[:200]}",
+                repair="Retry later, or reduce request size.",
+                retryable=True,
+            )
+        if cli_contract.is_contract_drift(result, subtype):
+            return contract_changed_error()
+        # Generic envelope error; the message carries at most 200 chars of detail.
+        detail = result.strip() or subtype or "unknown error"
+        return ErrorInfo(
+            code="nonzero_exit",
+            message=f"claude reported an error: {detail[:200]}",
+            repair="Inspect the error; retry with a smaller or corrected request.",
+        )
+    # Unstructured path: no error envelope, so scan the raw text instead.
+    extra = ""
+    if isinstance(env, dict):
+        extra = f"{env.get('subtype', '')} {env.get('result', '')}"
+    blob = f"{extra}\n{run.stdout}\n{run.stderr}".lower()
+    if _has_logged_out_signal(blob):
+        return ErrorInfo(
+            code="claude_auth_required",
+            message="claude is not authenticated.",
+            repair=_auth_repair_for(config_mode),
+        )
+    if _has_invalid_api_key_signal(blob):
+        return ErrorInfo(
+            code="api_key_invalid",
+            message="ANTHROPIC_API_KEY is invalid.",
+            repair=_api_key_repair_for(config_mode),
+        )
+    if "budget" in blob:
+        return ErrorInfo(
+            code="budget_exceeded",
+            message="claude reached the max-budget stop threshold "
+            "(a best-effort limit, not a hard cap).",
+            repair=_BUDGET_REPAIR,
+            retryable=True,
+        )
+    # An unknown flag / invalid value means the CLI contract drifted from what this
+    # plugin sends. Check last so an auth/budget message is never misread as drift.
+    if cli_contract.is_contract_drift(run.stderr, run.stdout):
+        return contract_changed_error()
+    return ErrorInfo(
+        code="nonzero_exit",
+        message=f"claude exited {run.exit_code}: {run.stderr.strip()[:200]}",
+        repair="Inspect the error; retry with a smaller request.",
+    )
+def contract_changed_error() -> ErrorInfo:
+    """Build the canonical cli_contract_changed error.
+    Kept in one place so contract drift reads the same whether it is detected on
+    the sync, envelope, or async-job path."""
+    message = (
+        "claude rejected a flag or value this plugin sent — its CLI "
+        "contract likely changed for your installed version."
+    )
+    repair = (
+        "Update claude-in-codex (or pin claude to a supported version); "
+        "run claude_status to check the version."
+    )
+    return ErrorInfo(code="cli_contract_changed", message=message, repair=repair)

claude_in_codex/cli_contract.py ADDED Viewed

@@ -0,0 +1,123 @@
+"""Single source of truth for the external `claude` CLI contract.
+Every assumption this server makes about the `claude` CLI — its flags,
+subcommands, JSON-envelope keys, accepted effort levels, supported major
+versions, and the stderr phrasings that mean the contract drifted — lives here so
+an upstream breaking change is a one-file, greppable, testable edit. See
+COMPATIBILITY.md for the assumption -> upstream-source map.
+"""
+from __future__ import annotations
+# Executable name used as argv[0] for every invocation and probe.
+CLAUDE_BIN = "claude"
+# Core invocation that CANNOT be dropped: -p (print mode) + JSON output. If these
+# disappear upstream the server cannot function, so a run must fail loudly rather
+# than silently degrade.
+CORE_INVOCATION = ("-p", "--output-format", "json")
+# NOTE(review): presumably the conventional end-of-options separator; it is not
+# referenced in this module — confirm where it is consumed.
+END_OF_OPTIONS = "--"
+# Subcommands / probes (free; no paid call).
+VERSION_ARGS = ("--version",)
+AUTH_STATUS_ARGS = ("auth", "status", "--text")
+HELP_ARGS = ("--help",)
+# --- Flag classes (see Item 5 of the resilience plan / COMPATIBILITY.md) --------
+# ALWAYS_SEND: guarantee-bearing flags, sent unconditionally and NEVER gated on
+# `--help` parsing. If upstream removes/renames one, `claude` rejects it at
+# arg-parse BEFORE any model call (zero spend) and classify_failure() labels it
+# cli_contract_changed. Gating these on the (inherently fuzzy) --help parse could
+# silently drop a security/cost/behavioral guarantee, so we never do. All are long
+# flags (the diagnostic in claude_status checks them against parsed --help).
+ALWAYS_SEND_FLAGS = frozenset(
+    {
+        "--output-format",  # core JSON output
+        "--no-chrome",  # no interactive picker hanging an unattended run
+        "--append-system-prompt",  # the independent-critic guardrails
+        "--max-budget-usd",  # best-effort spend stop threshold
+        "--no-session-persistence",  # avoid storing sensitive review prompts/results on disk
+        "--tools",  # read-only / no-tool guarantee
+        "--strict-mcp-config",
+        "--mcp-config",  # strip the user's MCP fleet (security boundary)
+        "--setting-sources",  # scoped-mode isolation
+        "--bare",  # bare-mode isolation
+        "--safe-mode",  # OAuth-preserving customization/hook isolation
+    }
+)
+# HELP_GATED: dropping one only reduces depth or relies on a still-present primary
+# guard — never a safety/cost regression. The value is whether the flag takes an
+# argument (so the gate skips the value token too). These are the ONLY flags gated
+# on `claude --help`; a false negative here merely drops a harmless flag.
+HELP_GATED_FLAGS = {
+    "--effort": True,  # reasoning depth only
+    "--model": True,  # falls back to the configured default model
+    "--disallowed-tools": True,  # defense-in-depth; --tools is the primary allowlist
+}
+# Cache TTL for the `claude --help` probe, so a long-lived server re-probes after
+# an in-place CLI upgrade instead of trusting a stale snapshot forever.
+HELP_CACHE_TTL_SECONDS = 300
+# --- Reasoning effort -----------------------------------------------------------
+# Effort levels accepted for --effort; callers are expected to omit the flag for
+# any value outside this tuple.
+VALID_EFFORTS = ("low", "medium", "high", "xhigh", "max")
+DEFAULT_EFFORT = "xhigh"
+# --- Supported `claude` major version(s) ----------------------------------------
+# A set (not a single int) so a future major can be added without a code change,
+# and overridable via env so a user can opt into an untested major themselves.
+SUPPORTED_MAJORS = frozenset({2})
+# Name of the overriding env var. NOTE(review): the value format is parsed
+# outside this module — confirm before documenting it for users.
+SUPPORTED_MAJORS_ENV = "CLAUDE_IN_CODEX_SUPPORTED_MAJORS"
+# --- JSON envelope keys read from `claude -p --output-format json` ---------------
+# normalize.py / apply_cost_usage parse these tolerantly with .get(); listing them
+# here keeps the consumed surface greppable and gives the golden-envelope test a
+# canonical reference.
+# Envelope "subtype" values that mean success. None is included so an envelope
+# with no "subtype" key (where .get() yields None) is not treated as an error.
+SUCCESS_SUBTYPES = (None, "success")
+ENVELOPE_KEYS = frozenset(
+    {
+        "is_error",
+        "subtype",
+        "result",
+        "total_cost_usd",
+        "usage",
+        "session_id",
+        "modelUsage",
+        "permission_denials",
+    }
+)
+USAGE_KEYS = frozenset(
+    {
+        "input_tokens",
+        "output_tokens",
+        "cache_read_input_tokens",
+        "cache_creation_input_tokens",
+    }
+)
+# --- Contract-drift stderr signatures -------------------------------------------
+# Phrasings a CLI prints when it rejects a flag or value we sent. Matching any
+# (case-insensitive) reclassifies an otherwise-generic failure as
+# cli_contract_changed, telling the user the plugin needs an update for their CLI
+# rather than leaving a confusing nonzero_exit.
+CONTRACT_DRIFT_STDERR_PATTERNS = (
+    "unknown option",
+    "unknown flag",
+    "unknown argument",
+    "unrecognized option",
+    "unrecognized argument",
+    "no such option",
+    "invalid choice",
+    "invalid value",
+    "unexpected argument",
+)
+def is_contract_drift(*texts: str | None) -> bool:
+    """Report whether any of `texts` contains a contract-drift signature.
+    None and empty strings are skipped; the remaining texts are joined and
+    compared case-insensitively against CONTRACT_DRIFT_STDERR_PATTERNS. Shared by
+    every failure path (sync classify_failure, the zero-exit is_error envelope,
+    and the async job error) so drift is labelled the same wherever `claude`
+    surfaces it."""
+    haystack = "\n".join(filter(None, texts)).lower()
+    for signature in CONTRACT_DRIFT_STDERR_PATTERNS:
+        if signature in haystack:
+            return True
+    return False