npm - @ictechgy/context-guard - Versions diffs - 0.4.8 → 0.4.10 - Mend

@ictechgy/context-guard 0.4.8 → 0.4.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (54)

package/CHANGELOG.md +29 -0
package/README.ko.md +92 -37
package/README.md +111 -37
package/docs/benchmark-fixtures/token-savings-12task-baseline.prompt.example.md +7 -0
package/docs/benchmark-fixtures/token-savings-12task-contextguard.prompt.example.md +7 -0
package/docs/benchmark-fixtures/token-savings-12task.tasks.example.json +182 -0
package/docs/benchmark-fixtures/token-savings-12task.variants.example.json +10 -0
package/docs/distribution.md +10 -7
package/docs/experimental-benchmark-fixtures.md +8 -1
package/package.json +3 -6
package/packaging/homebrew/context-guard.rb.template +1 -1
package/plugins/context-guard/.claude-plugin/plugin.json +1 -1
package/plugins/context-guard/README.ko.md +9 -6
package/plugins/context-guard/README.md +27 -12
package/plugins/context-guard/bin/context-guard +113 -26
package/plugins/context-guard/bin/context-guard-artifact +542 -46
package/plugins/context-guard/bin/context-guard-cache-score +380 -0
package/plugins/context-guard/bin/context-guard-compress +146 -1
package/plugins/context-guard/bin/context-guard-cost +783 -4
package/plugins/context-guard/bin/context-guard-experiments +2211 -121
package/plugins/context-guard/bin/context-guard-failed-nudge +3 -0
package/plugins/context-guard/bin/context-guard-filter +163 -7
package/plugins/context-guard/bin/context-guard-guard-read +3 -0
package/plugins/context-guard/bin/context-guard-pack +602 -43
package/plugins/context-guard/bin/context-guard-rewrite-bash +3 -0
package/plugins/context-guard/bin/context-guard-setup +165 -31
package/plugins/context-guard/bin/context-guard-statusline +490 -283
package/plugins/context-guard/bin/context-guard-statusline-merged +5 -0
package/plugins/context-guard/bin/context-guard-tool-prune +241 -1
package/plugins/context-guard/lib/context_guard_commands.py +206 -0
package/plugins/context-guard/skills/setup/SKILL.md +1 -0
package/context-guard-kit/README.md +0 -91
package/context-guard-kit/benchmark_runner.py +0 -2401
package/context-guard-kit/claude_transcript_cost_audit.py +0 -2346
package/context-guard-kit/context_compress.py +0 -695
package/context-guard-kit/context_escrow.py +0 -935
package/context-guard-kit/context_filter.py +0 -637
package/context-guard-kit/context_guard_cli.py +0 -325
package/context-guard-kit/context_guard_diet.py +0 -1711
package/context-guard-kit/context_pack.py +0 -2713
package/context-guard-kit/cost_guard.py +0 -2349
package/context-guard-kit/experimental_registry.py +0 -2339
package/context-guard-kit/failed_attempt_nudge.py +0 -567
package/context-guard-kit/guard_large_read.py +0 -690
package/context-guard-kit/hook_secret_patterns.py +0 -43
package/context-guard-kit/read_symbol.py +0 -483
package/context-guard-kit/rewrite_bash_for_token_budget.py +0 -501
package/context-guard-kit/sanitize_output.py +0 -725
package/context-guard-kit/settings.example.json +0 -67
package/context-guard-kit/setup_wizard.py +0 -2515
package/context-guard-kit/statusline.sh +0 -362
package/context-guard-kit/statusline_merged.sh +0 -157
package/context-guard-kit/tool_schema_pruner.py +0 -837
package/context-guard-kit/trim_command_output.py +0 -1449

package/plugins/context-guard/bin/context-guard-statusline CHANGED

@@ -6,223 +6,161 @@ if [[ -t 0 ]]; then
   exit 0
 fi
-statusline_input_tmp=''
-statusline_tmp_base() {
-  local candidate="${TMPDIR:-/tmp}" resolved
-  if [[ "$candidate" != "/" ]]; then
-    candidate="${candidate%/}"
-  fi
-  if [[ -z "$candidate" || "$candidate" != /* || ! -d "$candidate" || ! -w "$candidate" ]]; then
-    candidate="/tmp"
-  fi
-  if resolved=$(cd "$candidate" 2>/dev/null && pwd -P); then
-    if [[ "$resolved" != "/" ]]; then
-      resolved="${resolved%/}"
-    fi
-    printf '%s\n' "${resolved:-/}"
-  else
-    printf '/tmp\n'
-  fi
-}
-statusline_input_max_bytes() {
-  local raw="${CONTEXT_GUARD_STATUSLINE_INPUT_MAX_BYTES:-${CLAUDE_TOKEN_STATUSLINE_INPUT_MAX_BYTES:-65536}}" max=65536
-  if [[ "$raw" =~ ^[0-9]+$ ]] && (( ${#raw} <= 7 )); then
-    max=$((10#$raw))
-  fi
-  if (( max < 1 || max > 1048576 )); then
-    max=65536
-  fi
-  printf '%s\n' "$max"
-}
-statusline_context_warn_threshold() {
-  local raw="${CONTEXT_GUARD_STATUSLINE_CTX_WARN:-${CLAUDE_TOKEN_STATUSLINE_CTX_WARN:-80}}" threshold=80
-  if [[ "$raw" =~ ^[0-9]{1,3}$ ]]; then
-    threshold=$((10#$raw))
-    if (( threshold < 1 )); then
-      threshold=1
-    elif (( threshold > 100 )); then
-      threshold=100
-    fi
-  fi
-  printf '%s\n' "$threshold"
-}
-read_bounded_statusline_input() {
-  local max input_len tmp_base
-  max=$(statusline_input_max_bytes)
-  tmp_base=$(statusline_tmp_base)
-  statusline_input_tmp=$(mktemp "$tmp_base/context-guard-statusline.XXXXXX") || {
-    printf '[input-error] could not create statusline input buffer\n'
-    exit 0
-  }
-  trap 'rm -f "${statusline_input_tmp:-}"' EXIT
-  LC_ALL=C head -c "$((max + 1))" >"$statusline_input_tmp" 2>/dev/null || true
-  input_len=$(LC_ALL=C wc -c <"$statusline_input_tmp" | tr -d '[:space:]')
-  if (( input_len > max )); then
-    printf '[input-too-large] Claude statusline JSON exceeds %s bytes\n' "$max"
-    exit 0
-  fi
-  input=$(cat "$statusline_input_tmp" 2>/dev/null || true)
-  rm -f "$statusline_input_tmp"
-  statusline_input_tmp=''
-  trap - EXIT
-}
-read_bounded_statusline_input
-if ! command -v jq >/dev/null 2>&1; then
-  echo "[needs-jq] install jq for Claude token statusline"
+if ! command -v python3 >/dev/null 2>&1; then
+  echo "[needs-python3] install python3 for Claude token statusline"
   exit 0
 fi
-jq_get() {
-  jq -r "$1 // empty" <<<"$input" 2>/dev/null || true
-}
-strip_terminal_sequences() {
-  if command -v perl >/dev/null 2>&1; then
-    perl -pe 's/\e\][^\a\e]*(?:\a|\e\\)//g; s/\e[@-_][0-?]*[ -\/]*[@-~]//g'
-  else
-    cat
-  fi
-}
-sanitize_status() {
-  # Statusline values may come from untrusted workspace metadata; keep one-line printable text.
-  local cleaned
-  cleaned=$(printf '%s' "$1" \
-    | strip_terminal_sequences \
-    | LC_ALL=C tr '\r\n' '  ' \
-    | LC_ALL=C tr -d '\000-\010\013\014\016-\037\177-\237' \
-    | cut -c 1-160)
-  if printf '%s' "$cleaned" | LC_ALL=C grep -Eiq '(gh[pousr]_|github_pat_|glpat-|xox[abprs]-|AKIA|ASIA|sk-|npm_|AIza|Bearer[[:space:]]|Basic[[:space:]])'; then
-    printf '[redacted]'
-  else
-    printf '%s' "$cleaned"
-  fi
-}
-git_head_branch() {
-  # Keep the statusline cheap and non-blocking: do not invoke `git` here.  Some
-  # workspaces have slow network filesystems, hydrated-on-demand git objects, or
-  # broken config; reading .git/HEAD is enough for a best-effort branch label.
-  local current="$1"
-  local dotgit gitdir_line gitdir head_file head_line branch
-  [[ -n "$current" && -d "$current" ]] || return 1
-  current=$(cd "$current" 2>/dev/null && pwd -P) || return 1
-  while [[ -n "$current" ]]; do
-    head_file=''
-    dotgit="$current/.git"
-    if [[ -d "$dotgit" && ! -L "$dotgit" ]]; then
-      head_file="$dotgit/HEAD"
-    elif [[ -f "$dotgit" && ! -L "$dotgit" ]]; then
-      IFS= read -r gitdir_line <"$dotgit" 2>/dev/null || gitdir_line=''
-      if [[ "$gitdir_line" == gitdir:\ * ]]; then
-        gitdir="${gitdir_line#gitdir: }"
-        [[ "$gitdir" == /* ]] || gitdir="$current/$gitdir"
-        if gitdir=$(cd "$gitdir" 2>/dev/null && pwd -P) && [[ -f "$gitdir/HEAD" && ! -L "$gitdir/HEAD" ]]; then
-          head_file="$gitdir/HEAD"
-        fi
-      fi
-    fi
-    if [[ -n "$head_file" && -f "$head_file" && ! -L "$head_file" ]]; then
-      IFS= read -r head_line <"$head_file" 2>/dev/null || return 1
-      if [[ "$head_line" == ref:\ refs/heads/* ]]; then
-        branch="${head_line#ref: refs/heads/}"
-        [[ -n "$branch" ]] && printf '%s\n' "$branch"
-        return 0
-      fi
-      if [[ "$head_line" =~ ^[0-9a-fA-F]{7,40}$ ]]; then
-        printf '%s\n' "${head_line:0:12}"
-        return 0
-      fi
-      return 1
-    fi
-    [[ "$current" == "/" ]] && break
-    current="${current%/*}"
-    [[ -n "$current" ]] || current="/"
-  done
-  return 1
-}
-model=$(jq_get '.model.display_name')
-model=${model:-$(jq_get '.model.id')}
-model=${model:-unknown}
-model=$(sanitize_status "$model")
-context_raw=$(jq_get '.context_window.used_percentage')
-context_is_numeric=0
-if [[ -n "$context_raw" ]]; then
-  if context_pct=$(LC_NUMERIC=C printf '%.0f' "$context_raw" 2>/dev/null); then
-    if [[ "$context_pct" =~ ^-?[0-9]+$ ]]; then
-      context_is_numeric=1
-    else
-      context_pct=$(sanitize_status "$context_raw")
-    fi
-  else
-    context_pct=$(sanitize_status "$context_raw")
-  fi
-else
-  context_pct="?"
-fi
-context_label="${context_pct}%"
-if (( context_is_numeric )); then
-  context_warn_threshold=$(statusline_context_warn_threshold)
-  if (( context_pct >= context_warn_threshold )); then
-    context_label="${context_label} ⚠"
-  fi
-fi
-cost=$(jq_get '.cost.total_cost_usd')
-if [[ -n "$cost" ]]; then
-  cost=$(printf '$%.3f' "$cost" 2>/dev/null || sanitize_status "$cost")
-else
-  cost='n/a'
-fi
-cwd=$(jq_get '.workspace.current_dir')
-dir=${cwd##*/}
-dir=${dir:-.}
-dir=$(sanitize_status "$dir")
-branch=''
-branch_dir=${cwd:-$PWD}
-b=$(git_head_branch "$branch_dir" 2>/dev/null || true)
-if [[ -n "$b" ]]; then
-  b=$(sanitize_status "$b")
-  branch=" | ${b}"
-fi
+read -r -d '' CONTEXT_GUARD_STATUSLINE_PY <<'PYEOF' || true
+from __future__ import annotations
-# Cache metrics from the transcript tail (best-effort, fast — reads only the last 1MB).
-# Stays empty when transcript is unavailable or python3 fails so the status line never breaks.
-# NOTE: keep the token-key list and usage-extraction shape in sync with claude_transcript_cost_audit.py
-# so the statusline metric matches the audit metric for the same transcript.
-metrics_label=''
-transcript_path=$(jq_get '.transcript_path')
-if [[ -n "$transcript_path" && -r "$transcript_path" ]] && command -v python3 >/dev/null 2>&1; then
-  transcript_metrics=$(python3 - "$transcript_path" 2>/dev/null <<'PYEOF' || true
+import hashlib
 import json
+import math
 import os
+import re
 import stat
 import sys
+import time
+from typing import Any
-path = sys.argv[1] if len(sys.argv) > 1 else ""
-if not path:
-    sys.exit(0)
-# Bounded tail read so the statusline never stalls on huge transcripts.
 TAIL_BYTES = 1024 * 1024
 MAX_RECORDS = 300
+CACHE_SCHEMA_VERSION = 1
+DEFAULT_CACHE_TTL_SECONDS = 2.0
+MAX_CACHE_TTL_SECONDS = 30.0
+MAX_CACHE_BYTES = 4096
+METRIC_RE = re.compile(r"^\d+(?:\.\d)?$")
+SECRET_RE = re.compile(
+    r"(gh[pousr]_|github_pat_|glpat-|xox[abprs]-|AKIA|ASIA|sk-|npm_|AIza|Bearer\s|Basic\s)",
+    re.IGNORECASE,
+)
+OSC_RE = re.compile(r"\x1b\][^\x07\x1b]*(?:\x07|\x1b\\)")
+CSI_RE = re.compile(r"\x1b[@-_][0-?]*[ -/]*[@-~]")
+CONTROL_RE = re.compile(r"[\x00-\x08\x0b\x0c\x0e-\x1f\x7f-\x9f]")
+def _bounded_int_env(primary: str, legacy: str, default: int, *, lower: int, upper: int) -> int:
+    raw = os.environ.get(primary, os.environ.get(legacy, str(default)))
+    value = default
+    if raw.isdigit() and len(raw) <= 7:
+        value = int(raw, 10)
+    if value < lower or value > upper:
+        return default
+    return value
+def statusline_input_max_bytes() -> int:
+    return _bounded_int_env(
+        "CONTEXT_GUARD_STATUSLINE_INPUT_MAX_BYTES",
+        "CLAUDE_TOKEN_STATUSLINE_INPUT_MAX_BYTES",
+        65536,
+        lower=1,
+        upper=1048576,
+    )
+def statusline_context_warn_threshold() -> int:
+    raw = os.environ.get(
+        "CONTEXT_GUARD_STATUSLINE_CTX_WARN",
+        os.environ.get("CLAUDE_TOKEN_STATUSLINE_CTX_WARN", "80"),
+    )
+    threshold = 80
+    if re.fullmatch(r"\d{1,3}", raw or ""):
+        threshold = int(raw, 10)
+        if threshold < 1:
+            threshold = 1
+        elif threshold > 100:
+            threshold = 100
+    return threshold
+def _json_tostring(value: Any) -> str:
+    if value is None:
+        return ""
+    if isinstance(value, bool):
+        return "true" if value else "false"
+    if isinstance(value, (dict, list)):
+        return json.dumps(value, ensure_ascii=False, separators=(",", ":"))
+    return str(value)
+def _get_path(data: dict[str, Any], *keys: str) -> str:
+    cur: Any = data
+    for key in keys:
+        if not isinstance(cur, dict):
+            return ""
+        cur = cur.get(key)
+    return _json_tostring(cur)
+def strip_terminal_sequences(value: str) -> str:
+    value = OSC_RE.sub("", value)
+    return CSI_RE.sub("", value)
+def sanitize_status(value: str) -> str:
+    cleaned = strip_terminal_sequences(str(value))
+    cleaned = cleaned.replace("\r", " ").replace("\n", " ")
+    cleaned = CONTROL_RE.sub("", cleaned)[:160]
+    if SECRET_RE.search(cleaned):
+        return "[redacted]"
+    return cleaned
-def _int_or_zero(value):
-    """transcript usage 토큰값을 정수로 강제. bool은 int 서브클래스이므로 별도 차단."""
+def git_head_branch(current: str) -> str | None:
+    if not current or not os.path.isdir(current):
+        return None
+    try:
+        current = os.path.realpath(current)
+    except Exception:
+        return None
+    while current:
+        head_file = ""
+        dotgit = os.path.join(current, ".git")
+        if os.path.isdir(dotgit) and not os.path.islink(dotgit):
+            head_file = os.path.join(dotgit, "HEAD")
+        elif os.path.isfile(dotgit) and not os.path.islink(dotgit):
+            try:
+                with open(dotgit, "r", encoding="utf-8", errors="replace") as fh:
+                    gitdir_line = fh.readline().rstrip("\n")
+            except OSError:
+                gitdir_line = ""
+            if gitdir_line.startswith("gitdir: "):
+                gitdir = gitdir_line[len("gitdir: ") :]
+                if not os.path.isabs(gitdir):
+                    gitdir = os.path.join(current, gitdir)
+                try:
+                    gitdir = os.path.realpath(gitdir)
+                except Exception:
+                    gitdir = ""
+                candidate = os.path.join(gitdir, "HEAD") if gitdir else ""
+                if candidate and os.path.isfile(candidate) and not os.path.islink(candidate):
+                    head_file = candidate
+        if head_file and os.path.isfile(head_file) and not os.path.islink(head_file):
+            try:
+                with open(head_file, "r", encoding="utf-8", errors="replace") as fh:
+                    head_line = fh.readline().strip()
+            except OSError:
+                return None
+            if head_line.startswith("ref: refs/heads/"):
+                branch = head_line[len("ref: refs/heads/") :]
+                return branch or None
+            if re.fullmatch(r"[0-9a-fA-F]{7,40}", head_line or ""):
+                return head_line[:12]
+            return None
+        parent = os.path.dirname(current)
+        if parent == current:
+            break
+        current = parent or os.sep
+    return None
+def _int_or_zero(value: Any) -> int:
+    """Coerce transcript usage token values. bool is an int subclass, so block it."""
     if isinstance(value, bool):
         return 0
     if isinstance(value, int):
@@ -230,18 +168,12 @@ def _int_or_zero(value):
     return 0
-def _extract_usage(record):
-    """transcript record에서 알려진 usage 객체 1개만 꺼낸다.
-    Claude Code transcript JSONL은 record 당 한 번의 LLM 호출 usage를 다음 중 한 자리에
-    넣는 것이 일반적이다 — top-level "usage", "message.usage", "response.usage".
-    재귀 walk 대신 알려진 경로만 보아야 동일 값이 여러 nested 사본으로 들어왔을 때
-    이중 합산되는 문제를 피할 수 있다.
-    """
+def _extract_usage(record: Any) -> dict[str, Any] | None:
+    """Extract one known transcript usage object without recursively double-counting copies."""
     if not isinstance(record, dict):
         return None
     for path_keys in (("usage",), ("message", "usage"), ("response", "usage")):
-        cur = record
+        cur: Any = record
         for key in path_keys:
             if not isinstance(cur, dict):
                 cur = None
@@ -252,9 +184,7 @@ def _extract_usage(record):
     return None
-input_tokens = cache_read = cache_creation = 0
-def _open_regular_transcript(path):
+def _open_regular_transcript(path: str) -> tuple[int, os.stat_result] | None:
     flags = os.O_RDONLY
     if hasattr(os, "O_CLOEXEC"):
         flags |= os.O_CLOEXEC
@@ -262,26 +192,32 @@ def _open_regular_transcript(path):
         flags |= os.O_NOFOLLOW
     if hasattr(os, "O_NONBLOCK"):
         flags |= os.O_NONBLOCK
-    st = os.lstat(path)
+    try:
+        st = os.lstat(path)
+    except OSError:
+        return None
     if not stat.S_ISREG(st.st_mode):
         return None
-    fd = os.open(path, flags)
+    try:
+        fd = os.open(path, flags)
+    except OSError:
+        return None
     try:
         opened = os.fstat(fd)
         if not stat.S_ISREG(opened.st_mode):
             os.close(fd)
             return None
-        return fd, opened.st_size
+        return fd, opened
     except Exception:
         os.close(fd)
         raise
-def _read_tail(fd, size):
+def _read_tail(fd: int, size: int) -> tuple[bytes, int]:
     read_size = min(size, TAIL_BYTES)
     if size > read_size:
         os.lseek(fd, size - read_size, os.SEEK_SET)
-    chunks = []
+    chunks: list[bytes] = []
     remaining = read_size
     while remaining > 0:
         chunk = os.read(fd, remaining)
@@ -292,71 +228,342 @@ def _read_tail(fd, size):
     return b"".join(chunks), read_size
-try:
-    opened = _open_regular_transcript(path)
-    if opened is None:
-        sys.exit(0)
-    fd, size = opened
+def _cache_ttl_seconds() -> float:
+    raw = os.environ.get("CONTEXT_GUARD_STATUSLINE_CACHE_TTL_SECONDS", "")
+    if raw == "":
+        return DEFAULT_CACHE_TTL_SECONDS
+    try:
+        ttl = float(raw)
+    except (TypeError, ValueError, OverflowError):
+        return DEFAULT_CACHE_TTL_SECONDS
+    if ttl <= 0:
+        return 0.0
+    return min(ttl, MAX_CACHE_TTL_SECONDS)
+def _path_contains(parent: str, child: str) -> bool:
+    try:
+        parent_real = os.path.realpath(parent)
+        child_real = os.path.realpath(child)
+        return os.path.commonpath([parent_real, child_real]) == parent_real
+    except Exception:
+        return False
+def _private_cache_dir(workspace: str) -> str | None:
+    home = os.path.expanduser("~")
+    if not home or not os.path.isabs(home):
+        return None
+    root = os.path.join(home, ".cache", "context-guard", "statusline")
+    if workspace and os.path.isabs(workspace) and os.path.isdir(workspace) and _path_contains(workspace, root):
+        return None
+    try:
+        os.makedirs(root, mode=0o700, exist_ok=True)
+        st = os.lstat(root)
+        if not stat.S_ISDIR(st.st_mode) or stat.S_ISLNK(st.st_mode):
+            return None
+        if hasattr(os, "getuid") and st.st_uid != os.getuid():
+            return None
+        if stat.S_IMODE(st.st_mode) != 0o700:
+            os.chmod(root, 0o700)
+            st = os.lstat(root)
+            if stat.S_IMODE(st.st_mode) != 0o700:
+                return None
+        return root
+    except Exception:
+        return None
+def _identity(path: str, st: os.stat_result) -> dict[str, int | str]:
+    absolute = os.path.abspath(path)
+    path_hash = hashlib.sha256(os.fsencode(absolute)).hexdigest()
+    return {
+        "path_hash": path_hash,
+        "size": int(st.st_size),
+        "mtime_ns": int(getattr(st, "st_mtime_ns", int(st.st_mtime * 1_000_000_000))),
+        "dev": int(getattr(st, "st_dev", 0)),
+        "ino": int(getattr(st, "st_ino", 0)),
+    }
+def _cache_path(identity: dict[str, int | str], workspace_dir: str) -> str | None:
+    root = _private_cache_dir(workspace_dir)
+    if not root:
+        return None
+    return os.path.join(root, f"{identity['path_hash']}.json")
+def _open_no_follow_read(path: str) -> tuple[int, int] | None:
+    flags = os.O_RDONLY
+    if hasattr(os, "O_CLOEXEC"):
+        flags |= os.O_CLOEXEC
+    if hasattr(os, "O_NOFOLLOW"):
+        flags |= os.O_NOFOLLOW
     try:
-        chunk, read_size = _read_tail(fd, size)
-    finally:
+        fd = os.open(path, flags)
+    except OSError:
+        return None
+    try:
+        st = os.fstat(fd)
+        if not stat.S_ISREG(st.st_mode) or st.st_size > MAX_CACHE_BYTES:
+            os.close(fd)
+            return None
+        return fd, int(st.st_size)
+    except Exception:
         os.close(fd)
-    lines = chunk.splitlines()
-    if size > read_size and lines:
-        # First line in the tail window is likely partial; drop it.
-        lines = lines[1:]
-    for raw in lines[-MAX_RECORDS:]:
-        if not raw.strip():
-            continue
+        raise
+def _validated_metric(value: Any, *, minimum: float, maximum: float) -> str | None:
+    if not isinstance(value, str) or not METRIC_RE.match(value):
+        return None
+    try:
+        number = float(value)
+    except (TypeError, ValueError, OverflowError):
+        return None
+    if not math.isfinite(number) or number < minimum or number > maximum:
+        return None
+    return value
+def _metric_parts(cache_pct: Any, reuse_x: Any) -> str | None:
+    cache_pct = _validated_metric(cache_pct, minimum=0.0, maximum=100.0)
+    if cache_pct is None:
+        return None
+    if reuse_x is not None:
+        reuse_x = _validated_metric(reuse_x, minimum=0.0, maximum=1_000_000.0)
+        if reuse_x is None:
+            return None
+    parts = [f"cache_pct={cache_pct}"]
+    if reuse_x:
+        parts.append(f"reuse_x={reuse_x}")
+    return " ".join(parts)
+def _read_cache(identity: dict[str, int | str], workspace_dir: str, ttl: float) -> str | None:
+    if ttl <= 0:
+        return None
+    path = _cache_path(identity, workspace_dir)
+    if not path:
+        return None
+    try:
+        opened = _open_no_follow_read(path)
+        if opened is None:
+            return None
+        fd, size = opened
         try:
-            obj = json.loads(raw)
+            raw = os.read(fd, size + 1)
+        finally:
+            os.close(fd)
+        data = json.loads(raw.decode("utf-8", errors="strict"))
+        if not isinstance(data, dict):
+            return None
+        if data.get("schema_version") != CACHE_SCHEMA_VERSION:
+            return None
+        computed_at = float(data.get("computed_at", 0))
+        now = time.time()
+        if not math.isfinite(computed_at):
+            return None
+        if now - computed_at > ttl or computed_at - now > ttl:
+            return None
+        for key, value in identity.items():
+            if data.get(key) != value:
+                return None
+        return _metric_parts(data.get("cache_pct"), data.get("reuse_x"))
+    except Exception:
+        return None
+def _write_cache(identity: dict[str, int | str], workspace_dir: str, cache_pct: str, reuse_x: str | None) -> None:
+    ttl = _cache_ttl_seconds()
+    if ttl <= 0:
+        return
+    path = _cache_path(identity, workspace_dir)
+    if not path:
+        return
+    payload = {
+        "schema_version": CACHE_SCHEMA_VERSION,
+        **identity,
+        "computed_at": time.time(),
+        "cache_pct": cache_pct,
+        "reuse_x": reuse_x,
+    }
+    raw = (json.dumps(payload, ensure_ascii=False, sort_keys=True, separators=(",", ":")) + "\n").encode("utf-8")
+    if len(raw) > MAX_CACHE_BYTES:
+        return
+    tmp_path = f"{path}.{os.getpid()}.tmp"
+    fd = -1
+    try:
+        flags = os.O_WRONLY | os.O_CREAT | os.O_EXCL
+        if hasattr(os, "O_CLOEXEC"):
+            flags |= os.O_CLOEXEC
+        if hasattr(os, "O_NOFOLLOW"):
+            flags |= os.O_NOFOLLOW
+        fd = os.open(tmp_path, flags, 0o600)
+        os.write(fd, raw)
+        os.close(fd)
+        fd = -1
+        os.replace(tmp_path, path)
+        os.chmod(path, 0o600)
+    except Exception:
+        if fd >= 0:
+            try:
+                os.close(fd)
+            except Exception:
+                pass
+        try:
+            os.unlink(tmp_path)
         except Exception:
-            continue
-        usage = _extract_usage(obj)
-        if not usage:
-            continue
-        input_tokens += _int_or_zero(usage.get("input_tokens"))
-        cr = usage.get("cache_read_input_tokens")
-        if cr is None:
-            cr = usage.get("cacheRead")
-        cache_read += _int_or_zero(cr)
-        cc = usage.get("cache_creation_input_tokens")
-        if cc is None:
-            cc = usage.get("cacheCreation")
-        cache_creation += _int_or_zero(cc)
-    denom = input_tokens + cache_read + cache_creation
-    # Skip the label entirely on empty / cache-cold sessions so the user does not see a
-    # confusing "cache 0%" before the cache has had a chance to warm up.
-    if denom <= 0 or cache_read <= 0:
-        sys.exit(0)
-    pct = max(0.0, min(100.0, cache_read / denom * 100))
-    parts = [f"cache_pct={pct:.0f}"]
-    if cache_creation > 0:
-        parts.append(f"reuse_x={cache_read / cache_creation:.1f}")
-    print(" ".join(parts))
-except Exception:
-    sys.exit(0)
+            pass
+def transcript_metrics(path: str, workspace_dir: str) -> str | None:
+    input_tokens = 0
+    cache_read = 0
+    cache_creation = 0
+    try:
+        opened = _open_regular_transcript(path)
+        if opened is None:
+            return None
+        fd, st = opened
+        size = int(st.st_size)
+        identity = _identity(path, st)
+        cached = _read_cache(identity, workspace_dir, _cache_ttl_seconds())
+        if cached:
+            os.close(fd)
+            return cached
+        try:
+            chunk, read_size = _read_tail(fd, size)
+        finally:
+            os.close(fd)
+        lines = chunk.splitlines()
+        if size > read_size and lines:
+            lines = lines[1:]
+        for raw in lines[-MAX_RECORDS:]:
+            if not raw.strip():
+                continue
+            try:
+                obj = json.loads(raw)
+            except Exception:
+                continue
+            usage = _extract_usage(obj)
+            if not usage:
+                continue
+            input_tokens += _int_or_zero(usage.get("input_tokens"))
+            cr = usage.get("cache_read_input_tokens")
+            if cr is None:
+                cr = usage.get("cacheRead")
+            cache_read += _int_or_zero(cr)
+            cc = usage.get("cache_creation_input_tokens")
+            if cc is None:
+                cc = usage.get("cacheCreation")
+            cache_creation += _int_or_zero(cc)
+        denom = input_tokens + cache_read + cache_creation
+        if denom <= 0 or cache_read <= 0:
+            return None
+        pct = max(0.0, min(100.0, cache_read / denom * 100))
+        cache_pct = f"{pct:.0f}"
+        reuse_x = f"{cache_read / cache_creation:.1f}" if cache_creation > 0 else None
+        _write_cache(identity, workspace_dir, cache_pct, reuse_x)
+        parts = [f"cache_pct={cache_pct}"]
+        if reuse_x:
+            parts.append(f"reuse_x={reuse_x}")
+        return " ".join(parts)
+    except Exception:
+        return None
+def _load_payload(raw: bytes) -> dict[str, Any]:
+    try:
+        data = json.loads(raw.decode("utf-8", errors="strict"))
+    except Exception:
+        return {}
+    return data if isinstance(data, dict) else {}
+def _rounded_context(raw: str) -> tuple[str, bool]:
+    if not raw:
+        return "?", False
+    try:
+        number = float(raw)
+    except (TypeError, ValueError, OverflowError):
+        return sanitize_status(raw), False
+    if not math.isfinite(number):
+        return sanitize_status(raw), False
+    rendered = f"{number:.0f}"
+    if re.fullmatch(r"-?\d+", rendered):
+        return rendered, True
+    return sanitize_status(raw), False
+def render_statusline(payload: dict[str, Any]) -> str:
+    model_display = _get_path(payload, "model", "display_name")
+    model_id = _get_path(payload, "model", "id")
+    context_raw = _get_path(payload, "context_window", "used_percentage")
+    cost_raw = _get_path(payload, "cost", "total_cost_usd")
+    cwd = _get_path(payload, "workspace", "current_dir")
+    transcript_path = _get_path(payload, "transcript_path")
+    model = sanitize_status(model_display or model_id or "unknown")
+    context_pct, context_is_numeric = _rounded_context(context_raw)
+    context_label = f"{context_pct}%"
+    if context_is_numeric and int(context_pct) >= statusline_context_warn_threshold():
+        context_label = f"{context_label} ⚠"
+    if cost_raw:
+        try:
+            cost_number = float(cost_raw)
+            if not math.isfinite(cost_number):
+                raise ValueError("non-finite cost")
+            cost = f"${cost_number:.3f}"
+        except (TypeError, ValueError, OverflowError):
+            cost = sanitize_status(cost_raw)
+    else:
+        cost = "n/a"
+    dir_label = os.path.basename(cwd) if cwd else "."
+    dir_label = sanitize_status(dir_label or ".")
+    branch_label = ""
+    branch_dir = cwd or os.getcwd()
+    branch = git_head_branch(branch_dir)
+    if branch:
+        branch_label = f" | {sanitize_status(branch)}"
+    metrics_label = ""
+    if transcript_path and os.access(transcript_path, os.R_OK):
+        raw_metrics = transcript_metrics(transcript_path, cwd)
+        if raw_metrics:
+            cache_pct = ""
+            reuse_x = ""
+            for metric in raw_metrics.split():
+                if metric.startswith("cache_pct="):
+                    cache_pct = metric[len("cache_pct=") :]
+                elif metric.startswith("reuse_x="):
+                    reuse_x = metric[len("reuse_x=") :]
+            if cache_pct:
+                metrics_label = f" | cache {sanitize_status(cache_pct)}%"
+                if reuse_x:
+                    metrics_label += f" | reuse {sanitize_status(reuse_x)}x"
+    return f"[{model}] {dir_label}{branch_label} | ctx {context_label} | cost {cost}{metrics_label}"
+def main() -> int:
+    max_bytes = statusline_input_max_bytes()
+    raw = sys.stdin.buffer.read(max_bytes + 1)
+    if len(raw) > max_bytes:
+        print(f"[input-too-large] Claude statusline JSON exceeds {max_bytes} bytes")
+        return 0
+    print(render_statusline(_load_payload(raw)))
+    return 0
+try:
+    raise SystemExit(main())
+except BrokenPipeError:
+    raise SystemExit(0)
 PYEOF
-  )
-  if [[ -n "$transcript_metrics" ]]; then
-    cache_pct=''
-    reuse_x=''
-    for metric in $transcript_metrics; do
-      case "$metric" in
-        cache_pct=*) cache_pct="${metric#cache_pct=}" ;;
-        reuse_x=*) reuse_x="${metric#reuse_x=}" ;;
-      esac
-    done
-    if [[ -n "$cache_pct" ]]; then
-      cache_pct=$(sanitize_status "$cache_pct")
-      metrics_label=" | cache ${cache_pct}%"
-      if [[ -n "$reuse_x" ]]; then
-        reuse_x=$(sanitize_status "$reuse_x")
-        metrics_label+=" | reuse ${reuse_x}x"
-      fi
-    fi
-  fi
-fi
-# Keep it one line and cheap: this script runs locally and should not do expensive git status.
-echo "[$model] ${dir}${branch} | ctx ${context_label} | cost ${cost}${metrics_label}"
+exec python3 -c "$CONTEXT_GUARD_STATUSLINE_PY" "$@"