npm - @ictechgy/context-guard - Versions diffs - 0.4.0 - Mend

@ictechgy/context-guard 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (71) hide show

package/CHANGELOG.md +49 -0
package/LICENSE +201 -0
package/NOTICE +4 -0
package/README.ko.md +353 -0
package/README.md +353 -0
package/context-guard-kit/README.md +76 -0
package/context-guard-kit/benchmark_runner.py +1898 -0
package/context-guard-kit/claude_transcript_cost_audit.py +1591 -0
package/context-guard-kit/context_compress.py +543 -0
package/context-guard-kit/context_escrow.py +919 -0
package/context-guard-kit/context_guard_cli.py +149 -0
package/context-guard-kit/context_guard_diet.py +1036 -0
package/context-guard-kit/context_pack.py +929 -0
package/context-guard-kit/failed_attempt_nudge.py +567 -0
package/context-guard-kit/guard_large_read.py +690 -0
package/context-guard-kit/hook_secret_patterns.py +43 -0
package/context-guard-kit/read_symbol.py +483 -0
package/context-guard-kit/rewrite_bash_for_token_budget.py +501 -0
package/context-guard-kit/sanitize_output.py +725 -0
package/context-guard-kit/settings.example.json +67 -0
package/context-guard-kit/setup_wizard.py +1724 -0
package/context-guard-kit/statusline.sh +362 -0
package/context-guard-kit/statusline_merged.sh +157 -0
package/context-guard-kit/tool_schema_pruner.py +837 -0
package/context-guard-kit/trim_command_output.py +1098 -0
package/docs/distribution.md +55 -0
package/package.json +70 -0
package/packaging/homebrew/context-guard.rb.template +34 -0
package/plugins/context-guard/.claude-plugin/plugin.json +41 -0
package/plugins/context-guard/LICENSE +201 -0
package/plugins/context-guard/NOTICE +4 -0
package/plugins/context-guard/README.ko.md +135 -0
package/plugins/context-guard/README.md +135 -0
package/plugins/context-guard/bin/claude-read-symbol +6 -0
package/plugins/context-guard/bin/claude-sanitize-output +6 -0
package/plugins/context-guard/bin/claude-token-artifact +6 -0
package/plugins/context-guard/bin/claude-token-audit +6 -0
package/plugins/context-guard/bin/claude-token-bench +6 -0
package/plugins/context-guard/bin/claude-token-diet +6 -0
package/plugins/context-guard/bin/claude-token-failed-nudge +6 -0
package/plugins/context-guard/bin/claude-token-guard-read +6 -0
package/plugins/context-guard/bin/claude-token-rewrite-bash +6 -0
package/plugins/context-guard/bin/claude-token-setup +6 -0
package/plugins/context-guard/bin/claude-token-statusline +6 -0
package/plugins/context-guard/bin/claude-token-statusline-merged +6 -0
package/plugins/context-guard/bin/claude-trim-output +6 -0
package/plugins/context-guard/bin/context-guard +149 -0
package/plugins/context-guard/bin/context-guard-artifact +919 -0
package/plugins/context-guard/bin/context-guard-audit +1591 -0
package/plugins/context-guard/bin/context-guard-bench +1898 -0
package/plugins/context-guard/bin/context-guard-compress +543 -0
package/plugins/context-guard/bin/context-guard-diet +1036 -0
package/plugins/context-guard/bin/context-guard-failed-nudge +567 -0
package/plugins/context-guard/bin/context-guard-guard-read +690 -0
package/plugins/context-guard/bin/context-guard-pack +929 -0
package/plugins/context-guard/bin/context-guard-read-symbol +483 -0
package/plugins/context-guard/bin/context-guard-rewrite-bash +501 -0
package/plugins/context-guard/bin/context-guard-sanitize-output +725 -0
package/plugins/context-guard/bin/context-guard-setup +1724 -0
package/plugins/context-guard/bin/context-guard-statusline +362 -0
package/plugins/context-guard/bin/context-guard-statusline-merged +157 -0
package/plugins/context-guard/bin/context-guard-tool-prune +837 -0
package/plugins/context-guard/bin/context-guard-trim-output +1098 -0
package/plugins/context-guard/brief/README.md +65 -0
package/plugins/context-guard/brief/brief-mode.lite.md +29 -0
package/plugins/context-guard/brief/brief-mode.standard.md +31 -0
package/plugins/context-guard/brief/brief-mode.ultra.md +32 -0
package/plugins/context-guard/lib/hook_secret_patterns.py +43 -0
package/plugins/context-guard/skills/audit/SKILL.md +39 -0
package/plugins/context-guard/skills/optimize/SKILL.md +48 -0
package/plugins/context-guard/skills/setup/SKILL.md +40 -0

package/context-guard-kit/claude_transcript_cost_audit.py ADDED Viewed

@@ -0,0 +1,1591 @@
+#!/usr/bin/env python3
+"""Best-effort Claude Code transcript usage auditor.
+Claude Code transcript schemas may change. This script scans JSONL objects for
+common token/cost fields rather than relying on one exact schema. It reports
+parse/read skips so totals are not mistaken for billing-authoritative data.
+"""
+from __future__ import annotations
+import argparse
+import datetime as _dt
+import errno
+import hashlib
+import json
+import math
+import os
+import re
+import shlex
+import stat
+import sys
+from collections import Counter, defaultdict
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Any, BinaryIO, Iterable
+# Canonical token buckets paired with the raw transcript keys that feed them.
+# add_token_groups() probes each bucket's keys in order and uses the first
+# key that holds a usable numeric value.
+TOKEN_KEY_GROUPS: tuple[tuple[str, tuple[str, ...]], ...] = (
+    ("input", ("input_tokens",)),
+    ("output", ("output_tokens",)),
+    ("cache_creation", ("cache_creation_input_tokens", "cacheCreation")),
+    ("cache_read", ("cache_read_input_tokens", "cacheRead")),
+)
+# Bucket names emitted by stable_token_counter() / stable_token_presence().
+KNOWN_TOKEN_BUCKETS = {bucket for bucket, _ in TOKEN_KEY_GROUPS}
+# Spellings of a metric "type" attribute mapped to canonical bucket names.
+# normalize_token_bucket() returns unknown spellings unchanged.
+TOKEN_TYPE_ALIASES = {
+    "input": "input",
+    "input_tokens": "input",
+    "output": "output",
+    "output_tokens": "output",
+    "cacheRead": "cache_read",
+    "cache_read": "cache_read",
+    "cache_read_input_tokens": "cache_read",
+    "cacheCreation": "cache_creation",
+    "cache_creation": "cache_creation",
+    "cache_creation_input_tokens": "cache_creation",
+}
+# Cost keys probed per dict by add_usage(); the first valid value wins.
+COST_KEYS = ("total_cost_usd", "cost_usd", "costUSD")
+# Keys passed to first_string() to label usage by model / query source.
+MODEL_KEYS = ("model", "model_id", "modelId")
+QUERY_SOURCE_KEYS = ("query_source", "querySource")
+# NOTE(review): presumably identify the feasibility report format and its
+# producer; their use is outside this excerpt -- confirm.
+FEASIBILITY_SCHEMA_VERSION = "contextguard.metric-feasibility.v1.1"
+FEASIBILITY_PRODUCER = "context-guard-audit"
+# Maximum number of messages kept by UsageSummary.note_error().
+MAX_ERROR_EXAMPLES = 20
+# Minimum interpreter recursion limit that parse_json_line() enforces.
+JSON_PARSE_RECURSION_LIMIT = 10_000
+# Size of each handle.read() call in iter_bounded_lines().
+READ_CHUNK_BYTES = 64 * 1024
+# Defaults for ScanLimits: 50 MiB per file, 2 MiB per JSONL record.
+DEFAULT_MAX_FILE_BYTES = 50 * 1024 * 1024
+DEFAULT_MAX_LINE_BYTES = 2 * 1024 * 1024
+# NOTE(review): presumably the upper bounds accepted for user-supplied scan
+# limits (2 GiB / 128 MiB); the call site is not visible here -- confirm.
+MAX_FILE_BYTES_LIMIT = 2 * 1024 * 1024 * 1024
+MAX_LINE_BYTES_LIMIT = 128 * 1024 * 1024
+# Case-insensitive heuristic for credential-looking text: vendor token
+# prefixes, Bearer/Basic headers, JWT-shaped strings, user:password@ URLs,
+# password/user CLI flags and key=value secrets.  Used by sanitize_label(),
+# path_component_contains_secret() and prompt_segments_for_record().
+SECRET_VALUE_RE = re.compile(
+    r"(?i)(gh[pousr]_[A-Za-z0-9_]{8,}|github_pat_[A-Za-z0-9_]{20,}|"
+    r"xox[abprs]-[A-Za-z0-9-]{8,}|(?:AKIA|ASIA)[0-9A-Z]{8,}|"
+    r"AIza[0-9A-Za-z_\-]{8,}|Bearer\s+[A-Za-z0-9._~+/=-]+|"
+    r"Basic\s+[A-Za-z0-9._~+/=-]+|"
+    r"sk-ant-[A-Za-z0-9_-]{12,}|sk-[A-Za-z0-9_-]{12,}|glpat-[A-Za-z0-9_-]{12,}|"
+    r"npm_[A-Za-z0-9]{20,}|eyJ[A-Za-z0-9_-]+\.[A-Za-z0-9_-]+\.[A-Za-z0-9_-]+|"
+    r"[a-z][a-z0-9+.-]*://[^/\s:@]+:[^/\s@]+@|"
+    r"(?:--password|-p)\s+\S+|(?:-u|--user)\s+\S+:\S+|"
+    r"(api[_-]?key|token|secret|password)=\S+)"
+)
+# Replacement returned by sanitize_path_component() for secret-looking parts.
+REDACTED_PATH_COMPONENT = "[REDACTED-PATH-COMPONENT]"
+# Dict keys that collect_record_hints() scans for commands and tool names.
+COMMAND_KEYS = ("command", "cmd")
+TOOL_NAME_KEYS = ("tool_name", "toolName", "tool")
+# Maximum number of samples PromptCacheAudit.observe() retains.
+PROMPT_AUDIT_MAX_RECORDS = 200
+# Per-record byte budget and segment cap in prompt_segments_for_record().
+PROMPT_AUDIT_MAX_TEXT_BYTES = 32 * 1024
+PROMPT_AUDIT_MAX_SEGMENTS_PER_RECORD = 32
+# How many leading / trailing segments observe() hashes per record.
+PROMPT_AUDIT_PREFIX_SEGMENTS = 3
+PROMPT_AUDIT_TAIL_SEGMENTS = 3
+# NOTE(review): the next four values are not referenced in this excerpt;
+# presumably thresholds for the cache-friendliness findings -- confirm.
+PROMPT_AUDIT_MIN_RECORDS = 3
+PROMPT_PREFIX_VOLATILE_THRESHOLD = 0.66
+PROMPT_PREFIX_TAIL_CHURN_DELTA = 0.34
+PROMPT_AUDIT_MAX_FINDINGS = 5
+# Hex digest length requested from stable_hash() for each prompt segment.
+PROMPT_SEGMENT_HASH_CHARS = 16
+# Traversal caps for extract_prompt_texts() / collect_content_text().
+PROMPT_AUDIT_MAX_TEXT_VALUES = 64
+PROMPT_AUDIT_MAX_ROOT_NODES = 4096
+PROMPT_AUDIT_MAX_CONTENT_NODES = 2048
+PROMPT_AUDIT_MAX_DEPTH = 64
+# Lower-cased "role" values treated as user prompts by extract_prompt_texts().
+USER_PROMPT_ROLES = {"user", "human"}
+# Content-block "type" values whose "text" collect_content_text() collects.
+TEXT_BLOCK_TYPES = {"text", "input_text"}
+def push_bounded(
+    stack: list[tuple[Any, int]],
+    items: Iterable[Any],
+    depth: int,
+    *,
+    visited: int,
+    max_nodes: int,
+) -> bool:
+    """Push traversal children without letting broad structures grow unbounded."""
+    budget = max(0, max_nodes - visited - len(stack))
+    if budget <= 0:
+        return True
+    pushed = 0
+    capped = False
+    for item in items:
+        if pushed >= budget:
+            capped = True
+            break
+        stack.append((item, depth))
+        pushed += 1
+    return capped
+@dataclass(frozen=True)
+class PromptSegmentSample:
+    """Immutable per-record prompt fingerprint built by PromptCacheAudit.observe()."""
+    # Truncated hashes of the record's leading prompt segments.
+    prefix_hashes: tuple[str, ...]
+    # Truncated hashes of the record's trailing prompt segments.
+    tail_hashes: tuple[str, ...]
+    # Number of segments extracted for the record.
+    segment_count: int
+    # Bytes of sanitized prompt text sampled for the record.
+    bytes_sampled: int
+    # Number of secret-pattern substitutions made while sampling.
+    redactions: int
+@dataclass
+class RecordUsage:
+    """Usage extracted from one transcript record; returned by add_usage()."""
+    # Token totals per bucket for this record.
+    tokens: Counter[str] = field(default_factory=Counter)
+    # Sum of the cost values found in this record.
+    cost_usd: float = 0.0
+    # Command labels produced by collect_record_hints().
+    commands: set[str] = field(default_factory=set)
+    # Sanitized tool names produced by collect_record_hints().
+    tools: set[str] = field(default_factory=set)
+@dataclass
+class PromptCacheAudit:
+    sampled_records: int = 0
+    analyzed_prompt_records: int = 0
+    capped_records: int = 0
+    prompt_collection_capped_records: int = 0
+    total_segments: int = 0
+    total_bytes_sampled: int = 0
+    redacted_segments: int = 0
+    samples: list[PromptSegmentSample] = field(default_factory=list)
+    def observe(self, root: Any) -> None:
+        self.sampled_records += 1
+        segments, bytes_sampled, redactions, collection_capped = prompt_segments_for_record(root)
+        if collection_capped:
+            self.prompt_collection_capped_records += 1
+        if not segments:
+            return
+        if len(self.samples) >= PROMPT_AUDIT_MAX_RECORDS:
+            self.capped_records += 1
+            return
+        self.analyzed_prompt_records += 1
+        self.total_segments += len(segments)
+        self.total_bytes_sampled += bytes_sampled
+        self.redacted_segments += redactions
+        self.samples.append(PromptSegmentSample(
+            prefix_hashes=tuple(stable_hash(segment, PROMPT_SEGMENT_HASH_CHARS) for segment in segments[:PROMPT_AUDIT_PREFIX_SEGMENTS]),
+            tail_hashes=tuple(stable_hash(segment, PROMPT_SEGMENT_HASH_CHARS) for segment in segments[-PROMPT_AUDIT_TAIL_SEGMENTS:]),
+            segment_count=len(segments),
+            bytes_sampled=bytes_sampled,
+            redactions=redactions,
+        ))
+@dataclass
+class UsageSummary:
+    """Running totals for a scan: counts, token/cost sums and breakdowns."""
+    # File and record counters, including skipped inputs.
+    files: int = 0
+    records: int = 0
+    skipped_files: int = 0
+    skipped_records: int = 0
+    # Example error messages, capped by note_error().
+    parse_errors: list[str] = field(default_factory=list)
+    # Token totals per bucket and total cost across all records.
+    tokens: Counter[str] = field(default_factory=Counter)
+    cost_usd: float = 0.0
+    # Token breakdowns keyed by sanitized model / query-source label.
+    by_model: dict[str, Counter[str]] = field(default_factory=lambda: defaultdict(Counter))
+    by_query_source: dict[str, Counter[str]] = field(default_factory=lambda: defaultdict(Counter))
+    # Token and cost totals keyed by file label.
+    by_file: Counter[str] = field(default_factory=Counter)
+    cost_by_file: Counter[str] = field(default_factory=Counter)
+    # Number of records in which each command / tool label appeared.
+    by_command: Counter[str] = field(default_factory=Counter)
+    by_tool: Counter[str] = field(default_factory=Counter)
+    # Number of dicts in which each token bucket was present.
+    token_field_presence: Counter[str] = field(default_factory=Counter)
+    # Number of dicts that contributed a cost value.
+    cost_field_count: int = 0
+    prompt_cache_audit: PromptCacheAudit = field(default_factory=PromptCacheAudit)
+    # NOTE(review): presumably a memo for a derived cache-friendliness report;
+    # it is not read or written in this excerpt -- confirm.
+    cache_friendliness_cache: dict[str, Any] | None = field(default=None, init=False, repr=False)
+    @property
+    def total_tokens(self) -> int:
+        """Sum of all token buckets."""
+        return sum(self.tokens.values())
+    @property
+    def cache_hit_rate(self) -> float:
+        """Input-side share of cache_read = cache_read / (input + cache_read + cache_creation).
+        Because cache_creation is part of the denominator, the ratio can look low
+        in sessions that have just created a new prefix. Interpret it as an
+        input-cost savings indicator rather than a classic hit rate (hits relative
+        to the cacheable pool). Returns 0.0 when denom == 0.
+        """
+        cr = self.tokens.get("cache_read", 0)
+        cc = self.tokens.get("cache_creation", 0)
+        inp = self.tokens.get("input", 0)
+        denom = cr + cc + inp
+        return (cr / denom) if denom > 0 else 0.0
+    @property
+    def cache_amortization(self) -> float:
+        """cache_read / cache_creation. Approximate average reuse multiple, in tokens.
+        The value is undefined when cache_creation == 0, so 0.0 is returned (the
+        cache_amortization_defined flag is exposed alongside to signal that it is
+        undefined). If the same prefix is reused N times without changing length,
+        the token ratio is also about N; in sessions where the prefix length
+        changes, note that this is a token-ratio approximation, not an exact call count.
+        """
+        cc = self.tokens.get("cache_creation", 0)
+        cr = self.tokens.get("cache_read", 0)
+        return (cr / cc) if cc > 0 else 0.0
+    @property
+    def cache_amortization_defined(self) -> bool:
+        """Whether cache_amortization is meaningful. True only when cache_creation > 0."""
+        return self.tokens.get("cache_creation", 0) > 0
+    def note_error(self, message: str) -> None:
+        """Record *message* unless MAX_ERROR_EXAMPLES messages are already stored."""
+        if len(self.parse_errors) < MAX_ERROR_EXAMPLES:
+            self.parse_errors.append(message)
+def iter_jsonl_files(paths: Iterable[str]) -> Iterable[Path]:
+    seen: set[Path] = set()
+    for raw in paths:
+        path = Path(raw).expanduser()
+        root = path.resolve()
+        candidates: Iterable[Path]
+        if path.is_file() and path.suffix in {".jsonl", ".json"}:
+            candidates = [path]
+        elif path.is_dir():
+            candidates = (
+                candidate
+                for pattern in ("*.jsonl", "*.json")
+                for candidate in path.rglob(pattern)
+            )
+        else:
+            continue
+        for candidate in candidates:
+            if candidate.is_symlink():
+                # The scanner opens candidates with O_NOFOLLOW and will skip
+                # this path.  Do not let a rejected link reserve its target's
+                # dedupe key and suppress a later real transcript in scope.
+                yield candidate
+                continue
+            resolved = candidate.resolve()
+            try:
+                resolved.relative_to(root if path.is_dir() else root.parent)
+            except ValueError:
+                continue
+            if resolved in seen:
+                continue
+            seen.add(resolved)
+            yield candidate
+def walk(obj: Any) -> Iterable[dict[str, Any]]:
+    stack = [obj]
+    while stack:
+        current = stack.pop()
+        if isinstance(current, dict):
+            yield current
+            stack.extend(current.values())
+        elif isinstance(current, list):
+            stack.extend(current)
+def first_string(obj: dict[str, Any], keys: Iterable[str]) -> str | None:
+    for key in keys:
+        val = obj.get(key)
+        if isinstance(val, str):
+            return val
+        if isinstance(val, dict):
+            nested = val.get("id") or val.get("name")
+            if isinstance(nested, str):
+                return nested
+    return None
+MAX_METRIC_VALUE = 10**18
+def finite_nonnegative_number(value: Any, *, clamp_negative: bool) -> int | float | None:
+    if isinstance(value, bool):
+        return None
+    if isinstance(value, int):
+        if value < 0 and not clamp_negative:
+            return None
+        return min(max(value, 0), MAX_METRIC_VALUE)
+    if isinstance(value, float):
+        if not math.isfinite(value) or (value < 0 and not clamp_negative):
+            return None
+        return min(max(value, 0.0), float(MAX_METRIC_VALUE))
+    return None
+def normalize_token_bucket(raw: str) -> str:
+    return TOKEN_TYPE_ALIASES.get(raw, raw)
+def stable_token_counter(tokens: Counter[str]) -> dict[str, int]:
+    return {bucket: tokens[bucket] for bucket in sorted(KNOWN_TOKEN_BUCKETS) if tokens.get(bucket, 0) != 0}
+def stable_token_presence(presence: Counter[str]) -> dict[str, int]:
+    return {bucket: presence[bucket] for bucket in sorted(KNOWN_TOKEN_BUCKETS) if presence.get(bucket, 0) > 0}
+def add_token_groups(local_tokens: Counter[str], d: dict[str, Any]) -> set[str]:
+    present: set[str] = set()
+    for bucket, keys in TOKEN_KEY_GROUPS:
+        for raw_key in keys:
+            val = d.get(raw_key)
+            metric = finite_nonnegative_number(val, clamp_negative=True)
+            if metric is not None:
+                local_tokens[bucket] += int(metric)
+                present.add(bucket)
+                break
+    return present
+def sanitize_label(value: str, limit: int = 120) -> str:
+    compact = " ".join(value.strip().split())
+    compact = SECRET_VALUE_RE.sub("[REDACTED]", compact)
+    if len(compact) > limit:
+        compact = compact[: limit - 15].rstrip() + " ...[truncated]"
+    return compact
+def stable_hash(value: str, length: int = 12) -> str:
+    return hashlib.sha256(value.encode("utf-8", errors="replace")).hexdigest()[:length]
+def truncate_utf8(text: str, max_bytes: int) -> tuple[str, bool]:
+    raw = text.encode("utf-8", errors="replace")
+    if len(raw) <= max_bytes:
+        return text, False
+    return raw[:max_bytes].decode("utf-8", errors="ignore"), True
+def collect_content_text(value: Any, out: list[str]) -> bool:
+    """Collect allowlisted text blocks without recursive descent.
+    Returns True when collection hit a bounded traversal cap. Deep or very broad
+    transcript shapes should downgrade cache-friendliness evidence instead of
+    crashing the whole audit.
+    Non-blank strings are appended to *out* in place; collection stops once
+    *out* holds PROMPT_AUDIT_MAX_TEXT_VALUES entries.
+    """
+    capped = False
+    visited = 0
+    # Explicit LIFO stack of (node, depth) pairs replaces recursion.
+    stack: list[tuple[Any, int]] = [(value, 0)]
+    while stack and len(out) < PROMPT_AUDIT_MAX_TEXT_VALUES:
+        current, depth = stack.pop()
+        visited += 1
+        if visited > PROMPT_AUDIT_MAX_CONTENT_NODES or depth > PROMPT_AUDIT_MAX_DEPTH:
+            capped = True
+            break
+        if isinstance(current, str):
+            # Whitespace-only strings are skipped.
+            if current.strip():
+                out.append(current)
+            continue
+        if isinstance(current, list):
+            if depth >= PROMPT_AUDIT_MAX_DEPTH:
+                capped = True
+                continue
+            # Push in reverse so pop() visits the list in its original order.
+            capped = push_bounded(
+                stack,
+                reversed(current),
+                depth + 1,
+                visited=visited,
+                max_nodes=PROMPT_AUDIT_MAX_CONTENT_NODES,
+            ) or capped
+            continue
+        if not isinstance(current, dict):
+            continue
+        block_type = current.get("type")
+        # A typed text block contributes only its "text"; nothing else in the
+        # dict is inspected.
+        if block_type in TEXT_BLOCK_TYPES and isinstance(current.get("text"), str):
+            stack.append((current.get("text"), depth + 1))
+            continue
+        if depth >= PROMPT_AUDIT_MAX_DEPTH:
+            capped = True
+            continue
+        # Other dicts: only "content" and a string "text" are followed.
+        # "text" is pushed last, so it is popped before "content".
+        if "content" in current:
+            capped = push_bounded(
+                stack,
+                (current.get("content"),),
+                depth + 1,
+                visited=visited,
+                max_nodes=PROMPT_AUDIT_MAX_CONTENT_NODES,
+            ) or capped
+        if isinstance(current.get("text"), str):
+            capped = push_bounded(
+                stack,
+                (current.get("text"),),
+                depth + 1,
+                visited=visited,
+                max_nodes=PROMPT_AUDIT_MAX_CONTENT_NODES,
+            ) or capped
+    # Unprocessed nodes or a full output list both count as a cap.
+    if stack or len(out) >= PROMPT_AUDIT_MAX_TEXT_VALUES:
+        capped = True
+    return capped
+def extract_prompt_texts(root: Any) -> tuple[list[str], bool]:
+    """Best-effort prompt text extraction from allowlisted user/prompt shapes.
+    Returns ``(texts, capped)`` where *capped* is True when a node, depth or
+    text-count limit cut the traversal short.
+    """
+    texts: list[str] = []
+    capped = False
+    visited = 0
+    # Explicit LIFO stack of (node, depth) pairs replaces recursion.
+    stack: list[tuple[Any, int]] = [(root, 0)]
+    while stack and len(texts) < PROMPT_AUDIT_MAX_TEXT_VALUES:
+        current, depth = stack.pop()
+        visited += 1
+        if visited > PROMPT_AUDIT_MAX_ROOT_NODES or depth > PROMPT_AUDIT_MAX_DEPTH:
+            capped = True
+            break
+        if isinstance(current, dict):
+            role = current.get("role")
+            role_text = str(role).lower() if isinstance(role, str) else ""
+            if role_text in USER_PROMPT_ROLES:
+                # User-role dict: gather text from content/text/prompt only.
+                if "content" in current:
+                    capped = collect_content_text(current.get("content"), texts) or capped
+                if isinstance(current.get("text"), str):
+                    capped = collect_content_text(current.get("text"), texts) or capped
+                if isinstance(current.get("prompt"), str):
+                    capped = collect_content_text(current.get("prompt"), texts) or capped
+                # Role-scoped content was handled above; do not re-walk it and
+                # risk duplicating text blocks.
+                continue
+            # Dicts without a user role: a non-blank string "prompt" is
+            # collected directly, then all values are queued for inspection.
+            prompt = current.get("prompt")
+            if isinstance(prompt, str) and prompt.strip():
+                texts.append(prompt)
+            if depth >= PROMPT_AUDIT_MAX_DEPTH:
+                capped = True
+                continue
+            capped = push_bounded(
+                stack,
+                current.values(),
+                depth + 1,
+                visited=visited,
+                max_nodes=PROMPT_AUDIT_MAX_ROOT_NODES,
+            ) or capped
+        elif isinstance(current, list):
+            if depth >= PROMPT_AUDIT_MAX_DEPTH:
+                capped = True
+                continue
+            # Push in reverse so pop() visits the list in its original order.
+            capped = push_bounded(
+                stack,
+                reversed(current),
+                depth + 1,
+                visited=visited,
+                max_nodes=PROMPT_AUDIT_MAX_ROOT_NODES,
+            ) or capped
+    # Unprocessed nodes or a full text list both count as a cap.
+    if stack or len(texts) >= PROMPT_AUDIT_MAX_TEXT_VALUES:
+        capped = True
+    return texts, capped
+def prompt_segments_for_record(root: Any) -> tuple[list[str], int, int, bool]:
+    """Split a record's prompt text into redacted, whitespace-compacted segments.
+    Returns ``(segments, bytes_sampled, redactions, collection_capped)``.
+    At most PROMPT_AUDIT_MAX_TEXT_BYTES of text and
+    PROMPT_AUDIT_MAX_SEGMENTS_PER_RECORD segments are taken per record.
+    """
+    texts, collection_capped = extract_prompt_texts(root)
+    if not texts:
+        return [], 0, 0, collection_capped
+    budget = PROMPT_AUDIT_MAX_TEXT_BYTES
+    segments: list[str] = []
+    bytes_sampled = 0
+    redactions = 0
+    for text in texts:
+        if budget <= 0 or len(segments) >= PROMPT_AUDIT_MAX_SEGMENTS_PER_RECORD:
+            break
+        # Clip to the remaining byte budget first, then redact the clipped text.
+        clipped, _truncated = truncate_utf8(text, budget)
+        sanitized, count = SECRET_VALUE_RE.subn("[REDACTED]", clipped)
+        redactions += count
+        # The budget is charged with the size of the sanitized text.
+        bytes_sampled += len(sanitized.encode("utf-8", errors="replace"))
+        budget = max(0, PROMPT_AUDIT_MAX_TEXT_BYTES - bytes_sampled)
+        # One segment per non-blank line, whitespace-collapsed, max 512 bytes.
+        for raw_line in sanitized.splitlines():
+            compact = " ".join(raw_line.strip().split())
+            if not compact:
+                continue
+            segment, _ = truncate_utf8(compact, 512)
+            segments.append(segment)
+            if len(segments) >= PROMPT_AUDIT_MAX_SEGMENTS_PER_RECORD:
+                break
+        # Fallback: if no segment exists yet but the text is non-blank, use
+        # the whole compacted text as a single segment.
+        if not segments and sanitized.strip():
+            segment, _ = truncate_utf8(" ".join(sanitized.strip().split()), 512)
+            if segment:
+                segments.append(segment)
+    return segments, bytes_sampled, redactions, collection_capped
+def safe_resolve(path: Path) -> Path:
+    try:
+        return path.resolve()
+    except (OSError, RuntimeError):
+        return path.absolute()
+def path_component_contains_secret(component: str) -> bool:
+    return bool(component and component not in {".", ".."} and SECRET_VALUE_RE.search(component))
+def sanitize_path_component(component: str) -> str:
+    if not component or component in {".", ".."}:
+        return component
+    if not path_component_contains_secret(component):
+        return component
+    return REDACTED_PATH_COMPONENT
+def sanitize_path_text(path: str) -> str:
+    return "/".join(sanitize_path_component(component) for component in path.replace(os.sep, "/").split("/"))
+def display_path_hash(path: Path) -> str:
+    return stable_hash(sanitize_path_text(str(safe_resolve(path))))
+def path_label(path: Path, show_paths: bool = False) -> str:
+    if show_paths:
+        return sanitize_path_text(str(path))
+    name = sanitize_label(sanitize_path_component(path.name or "transcript"), 80)
+    return f"{name}#path:{display_path_hash(path)}"
+def command_label(command: str, show_commands: bool = False) -> str:
+    sanitized = sanitize_label(command)
+    if show_commands:
+        return sanitized
+    try:
+        argv = shlex.split(sanitized)
+    except ValueError:
+        argv = sanitized.split()
+    if not argv:
+        category = "command"
+    elif len(argv) >= 3 and argv[0] in {"python", "python3"} and argv[1] == "-m":
+        category = " ".join(argv[:3])
+    elif len(argv) >= 2 and argv[0] in {"npm", "pnpm", "yarn", "bun"} and argv[1] in {"run", "run-script"}:
+        category = " ".join(argv[:3]) if len(argv) >= 3 else " ".join(argv[:2])
+    else:
+        category = argv[0]
+    return f"{category}#cmd:{stable_hash(sanitized)}"
+def bounded_int(value: object, default: int, minimum: int, maximum: int) -> int:
+    try:
+        number = int(value)
+    except (TypeError, ValueError, OverflowError):
+        return default
+    return min(max(number, minimum), maximum)
+def require_scan_limit(parser: argparse.ArgumentParser, option: str, value: int, maximum: int) -> int:
+    if value < 1 or value > maximum:
+        parser.error(f"{option} must be between 1 and {maximum}")
+    return value
+def os_error_summary(exc: OSError) -> str:
+    """Return OSError metadata without embedding raw filenames from str(exc)."""
+    parts = [exc.__class__.__name__]
+    if exc.errno is not None:
+        parts.append(f"errno={exc.errno}")
+    message = sanitize_label(str(exc.strerror or ""), 160)
+    if message:
+        parts.append(message)
+    return ": ".join(parts)
+@dataclass(frozen=True)
+class ScanLimits:
+    """Immutable size limits applied by scan()."""
+    # Files larger than this are skipped whole.
+    max_file_bytes: int = DEFAULT_MAX_FILE_BYTES
+    # JSONL records longer than this are skipped individually.
+    max_line_bytes: int = DEFAULT_MAX_LINE_BYTES
+def open_regular_no_symlink(file: Path):
+    """Open a transcript candidate only if it is still a regular non-symlink file.
+    Returns a binary read handle.  Raises OSError (ELOOP or EINVAL) when the
+    path is a symlink, is not a regular file, or no longer matches the
+    opened descriptor.
+    """
+    # Inspect the path itself (no symlink following) before opening.
+    before = file.lstat()
+    if stat.S_ISLNK(before.st_mode):
+        raise OSError(errno.ELOOP, "transcript file must not be a symlink", str(file))
+    if not stat.S_ISREG(before.st_mode):
+        raise OSError(errno.EINVAL, "transcript file must be a regular file", str(file))
+    flags = os.O_RDONLY
+    # Add each hardening flag only where the platform defines it.
+    for optional_flag in ("O_CLOEXEC", "O_NOFOLLOW", "O_NONBLOCK"):
+        flags |= getattr(os, optional_flag, 0)
+    fd = os.open(file, flags)
+    try:
+        # The descriptor must be the same file seen before and after the
+        # open; otherwise the path was swapped in between.
+        opened = os.fstat(fd)
+        after = file.lstat()
+        if (
+            not stat.S_ISREG(opened.st_mode)
+            or not os.path.samestat(before, opened)
+            or not os.path.samestat(after, opened)
+        ):
+            raise OSError(errno.ELOOP, "transcript file changed while opening", str(file))
+        return os.fdopen(fd, "rb")
+    except Exception:
+        # Close the raw descriptor on any failure before re-raising.
+        os.close(fd)
+        raise
+def iter_bounded_lines(handle: BinaryIO, max_line_bytes: int) -> Iterable[tuple[int, str | None]]:
+    """Yield decoded lines without retaining an oversized JSONL record in memory.
+    `None` means the record exceeded `max_line_bytes` and was skipped after the
+    iterator consumed bytes up to the next newline.  This keeps transcript audit
+    robust when a corrupted trace contains one huge single-line payload.
+    Each item is ``(line_no, text)`` with 1-based line numbers; decoded text
+    keeps its trailing newline and invalid UTF-8 is replaced.
+    """
+    line_no = 1
+    buffer = bytearray()
+    # True while the current line has already exceeded max_line_bytes.
+    oversized = False
+    while True:
+        chunk = handle.read(READ_CHUNK_BYTES)
+        if not chunk:
+            # End of input: flush a final line that has no trailing newline.
+            if oversized:
+                yield line_no, None
+            elif buffer:
+                yield line_no, buffer.decode("utf-8", errors="replace")
+            break
+        start = 0
+        while start < len(chunk):
+            newline = chunk.find(b"\n", start)
+            end = len(chunk) if newline == -1 else newline + 1
+            piece = chunk[start:end]
+            if not oversized:
+                # The size check counts the newline byte when it is present.
+                if len(buffer) + len(piece) > max_line_bytes:
+                    buffer.clear()
+                    oversized = True
+                else:
+                    buffer.extend(piece)
+            if newline == -1:
+                # The line continues into the next chunk.
+                break
+            if oversized:
+                yield line_no, None
+            else:
+                yield line_no, buffer.decode("utf-8", errors="replace")
+                buffer.clear()
+            # Reset per-line state for the next line.
+            line_no += 1
+            oversized = False
+            start = end
+def collect_record_hints(root: Any, show_commands: bool = False) -> tuple[set[str], set[str]]:
+    commands: set[str] = set()
+    tools: set[str] = set()
+    for d in walk(root):
+        for key in COMMAND_KEYS:
+            value = d.get(key)
+            if isinstance(value, str) and value.strip():
+                commands.add(command_label(value, show_commands=show_commands))
+        for key in TOOL_NAME_KEYS:
+            value = d.get(key)
+            if isinstance(value, str) and value.strip():
+                name = sanitize_label(value, 80)
+                if name and len(name.split()) <= 4:
+                    tools.add(name)
+    return commands, tools
+def add_usage(
+    summary: UsageSummary,
+    root: Any,
+    file: Path | None = None,
+    show_paths: bool = False,
+    show_commands: bool = False,
+) -> RecordUsage:
+    """Fold one parsed transcript record into *summary*.
+    Token and cost fields are gathered from every dict reachable from *root*.
+    Returns the per-record totals together with the command and tool labels
+    found in the record.
+    """
+    # Record-level model / query source act as fallbacks for nested dicts.
+    root_model = None
+    root_query_source = None
+    if isinstance(root, dict):
+        root_model = first_string(root, MODEL_KEYS)
+        root_query_source = first_string(root, QUERY_SOURCE_KEYS)
+    record = RecordUsage()
+    summary.prompt_cache_audit.observe(root)
+    for d in walk(root):
+        local_tokens: Counter[str] = Counter()
+        present_buckets = add_token_groups(local_tokens, d)
+        # OpenTelemetry-style records sometimes use {name, value, attributes.type}.
+        name = d.get("name") or d.get("metric")
+        if name == "claude_code.token.usage":
+            # Take the first of value / sum / count that is not None.
+            value = d.get("value")
+            if value is None:
+                value = d.get("sum")
+            if value is None:
+                value = d.get("count")
+            attrs = d.get("attributes") or {}
+            token_type = attrs.get("type", "unknown") if isinstance(attrs, dict) else "unknown"
+            metric = finite_nonnegative_number(value, clamp_negative=True)
+            if metric is not None:
+                bucket = normalize_token_bucket(str(token_type))
+                local_tokens[bucket] += int(metric)
+                present_buckets.add(bucket)
+        for bucket in present_buckets:
+            summary.token_field_presence[bucket] += 1
+        if local_tokens:
+            summary.tokens.update(local_tokens)
+            record.tokens.update(local_tokens)
+            # Attribute to the dict's own labels, else the record's, else "unknown".
+            model = sanitize_label(first_string(d, MODEL_KEYS) or root_model or "unknown", 80)
+            query_source = sanitize_label(first_string(d, QUERY_SOURCE_KEYS) or root_query_source or "unknown", 80)
+            summary.by_model[model].update(local_tokens)
+            summary.by_query_source[query_source].update(local_tokens)
+        # Only the first valid cost key per dict is counted; negative costs
+        # are rejected rather than clamped.
+        for key in COST_KEYS:
+            val = d.get(key)
+            metric = finite_nonnegative_number(val, clamp_negative=False)
+            if metric is not None:
+                cost = float(metric)
+                summary.cost_usd += cost
+                record.cost_usd += cost
+                summary.cost_field_count += 1
+                break
+    commands, tools = collect_record_hints(root, show_commands=show_commands)
+    record.commands = commands
+    record.tools = tools
+    record_total = sum(record.tokens.values())
+    # Per-file totals are recorded only for records with tokens or cost.
+    if file is not None and (record_total or record.cost_usd):
+        file_key = path_label(file, show_paths=show_paths)
+        summary.by_file[file_key] += record_total
+        summary.cost_by_file[file_key] += record.cost_usd
+    # Each distinct label is counted once per record.
+    for command in commands:
+        summary.by_command[command] += 1
+    for tool in tools:
+        summary.by_tool[tool] += 1
+    return record
+def parse_json_line(line: str) -> Any:
+    # Python 3.11's json decoder can hit the interpreter recursion limit on
+    # deeply nested transcript payloads before our iterative walker sees them.
+    # Raise the process limit enough for realistic hostile fixtures, while still
+    # treating too-deep input as a skipped parse record instead of crashing.
+    if sys.getrecursionlimit() < JSON_PARSE_RECURSION_LIMIT:
+        sys.setrecursionlimit(JSON_PARSE_RECURSION_LIMIT)
+    return json.loads(line)
+def scan(
+    paths: list[str],
+    show_paths: bool = False,
+    show_commands: bool = False,
+    limits: ScanLimits | None = None,
+) -> UsageSummary:
+    limits = limits or ScanLimits()
+    summary = UsageSummary()
+    for file in iter_jsonl_files(paths):
+        summary.files += 1
+        try:
+            with open_regular_no_symlink(file) as handle:
+                size = os.fstat(handle.fileno()).st_size
+                if size > limits.max_file_bytes:
+                    summary.skipped_files += 1
+                    summary.note_error(
+                        f"{path_label(file, show_paths=show_paths)}: skipped oversized transcript file "
+                        f"({size} bytes > {limits.max_file_bytes})"
+                    )
+                    continue
+                for line_no, line in iter_bounded_lines(handle, limits.max_line_bytes):
+                    if line is None:
+                        summary.skipped_records += 1
+                        summary.note_error(
+                            f"{path_label(file, show_paths=show_paths)}:{line_no}: "
+                            f"skipped oversized JSONL record (> {limits.max_line_bytes} bytes)"
+                        )
+                        continue
+                    line = line.strip()
+                    if not line:
+                        continue
+                    try:
+                        obj = parse_json_line(line)
+                    except json.JSONDecodeError as exc:
+                        summary.skipped_records += 1
+                        summary.note_error(f"{path_label(file, show_paths=show_paths)}:{line_no}: JSON parse error: {exc.msg}")
+                        continue
+                    except RecursionError as exc:
+                        summary.skipped_records += 1
+                        summary.note_error(f"{path_label(file, show_paths=show_paths)}:{line_no}: JSON parse error: nested JSON exceeds supported depth")
+                        continue
+                    summary.records += 1
+                    add_usage(summary, obj, file, show_paths=show_paths, show_commands=show_commands)
+        except OSError as exc:
+            summary.skipped_files += 1
+            summary.note_error(f"{path_label(file, show_paths=show_paths)}: read error: {os_error_summary(exc)}")
+            continue
+    return summary
+def print_counter(title: str, counter: Counter[str], top: int) -> None:
+    print(f"\n{title}")
+    for key, val in counter.most_common(top):
+        print(f"  {key:24s} {val:12d}")
+def counter_json(counter: Counter[str], top: int) -> list[dict[str, Any]]:
+    return [{"name": key, "value": val} for key, val in counter.most_common(top)]
+def utc_now_iso() -> str:
+    return _dt.datetime.now(_dt.timezone.utc).replace(microsecond=0).isoformat().replace("+00:00", "Z")
+def availability_status(*, present: bool, skipped: bool = False, partial: bool = False) -> str:
+    if present and partial:
+        return "partial"
+    if present:
+        return "available"
+    if skipped:
+        return "partial"
+    return "missing"
+# Three-state grade for measurement evidence. It is an auxiliary axis, orthogonal to
+# status (available/partial/missing), that tells GUIs/consumers *how* a value became known.
+EVIDENCE_OBSERVED = "observed"
+EVIDENCE_INFERRED = "inferred"
+EVIDENCE_UNAVAILABLE = "unavailable"
+def evidence_class(*, observed: bool, inferable: bool = False) -> str:
+    """관측/추론/불가 3-상태 증거 등급을 반환한다.
+    - observed: transcript 필드에서 직접 읽은 값.
+    - inferred: 관측값에서 문서화된 공식으로 파생한 값(추정치).
+    - unavailable: scan 데이터만으로는 판별할 수 없는 값.
+    observed가 우선한다. 직접 관측이 없고 inferable한 경우에만 inferred로, 둘 다
+    아니면 unavailable로 분류해 보수적 측정 원칙을 지킨다.
+    """
+    if observed:
+        return EVIDENCE_OBSERVED
+    if inferable:
+        return EVIDENCE_INFERRED
+    return EVIDENCE_UNAVAILABLE
+def build_headroom_availability(summary: UsageSummary) -> dict[str, Any]:
+    """Context-window headroom 가용성/증거 등급을 보수적으로 분류한다.
+    transcript JSON에는 live `context_window`/잔여 토큰 정보가 없으므로 과거 scan
+    만으로는 headroom을 관측하거나 추론할 수 없다. 따라서 status는 기존 context와
+    동일하게 "missing", evidence는 "unavailable"로 둔다. live statusline snapshot을
+    입력으로 받는 미래 surface에서는 observed로 승급될 수 있음을 contract로 남긴다.
+    """
+    return {
+        "status": "missing",
+        "evidence": EVIDENCE_UNAVAILABLE,
+        "reason": (
+            "Transcript scans do not carry live context-window or remaining-token data, "
+            "so context headroom cannot be observed or conservatively inferred from history alone."
+        ),
+        "observable_via": "live_statusline_snapshot",
+    }
+def scan_integrity(summary: UsageSummary) -> dict[str, Any]:
+    skipped = summary.skipped_files + summary.skipped_records
+    complete = skipped == 0 and not summary.parse_errors
+    return {
+        "status": "complete" if complete else "partial",
+        "files_scanned": summary.files,
+        "records_scanned": summary.records,
+        "skipped_files": summary.skipped_files,
+        "skipped_records": summary.skipped_records,
+        "parse_error_count": len(summary.parse_errors),
+        "complete": complete,
+        "reason": (
+            "All candidate transcript files/records were parsed within configured limits."
+            if complete
+            else "Some transcript files or records were skipped; downstream GUI surfaces should label totals as partial."
+        ),
+    }
+def build_metric_availability(summary: UsageSummary) -> dict[str, Any]:
+    token_presence = stable_token_presence(summary.token_field_presence)
+    has_any_token = bool(token_presence)
+    has_cache_read = summary.token_field_presence.get("cache_read", 0) > 0
+    has_cache_creation = summary.token_field_presence.get("cache_creation", 0) > 0
+    has_cache_any = has_cache_read or has_cache_creation
+    cache_partial = has_cache_any and not (has_cache_read and has_cache_creation)
+    skipped = bool(summary.skipped_files or summary.skipped_records or summary.parse_errors)
+    has_input = summary.token_field_presence.get("input", 0) > 0
+    has_output = summary.token_field_presence.get("output", 0) > 0
+    return {
+        "tokens": {
+            "status": availability_status(present=has_any_token, skipped=skipped and not has_any_token, partial=skipped and has_any_token),
+            "present_fields": token_presence,
+            "evidence": evidence_class(observed=has_any_token),
+        },
+        "input": {
+            "status": availability_status(present=has_input, partial=skipped and has_input),
+            "present_count": summary.token_field_presence.get("input", 0),
+            "evidence": evidence_class(observed=has_input),
+        },
+        "output": {
+            "status": availability_status(present=has_output, partial=skipped and has_output),
+            "present_count": summary.token_field_presence.get("output", 0),
+            "evidence": evidence_class(observed=has_output),
+        },
+        "cache": {
+            "status": availability_status(present=has_cache_any, partial=cache_partial or (skipped and has_cache_any)),
+            "present_fields": {
+                "cache_read": summary.token_field_presence.get("cache_read", 0),
+                "cache_creation": summary.token_field_presence.get("cache_creation", 0),
+            },
+            "zero_values_observed": {
+                "cache_read": has_cache_read and summary.tokens.get("cache_read", 0) == 0,
+                "cache_creation": has_cache_creation and summary.tokens.get("cache_creation", 0) == 0,
+            },
+            # 원시 cache 토큰 수는 관측값(observed)이지만, share/reuse 비율은 관측값에서
+            # 파생한 추정값(inferred)이므로 별도로 분류해 노출한다.
+            "evidence": evidence_class(observed=has_cache_any),
+            "derived": {
+                "cache_read_share": {
+                    "evidence": evidence_class(observed=False, inferable=has_cache_any),
+                    "value": summary.cache_hit_rate if has_cache_any else None,
+                },
+                "cache_reuse_ratio": {
+                    "evidence": evidence_class(observed=False, inferable=summary.cache_amortization_defined),
+                    "value": summary.cache_amortization if summary.cache_amortization_defined else None,
+                },
+            },
+        },
+        "cost": {
+            "status": availability_status(present=summary.cost_field_count > 0, partial=skipped and summary.cost_field_count > 0),
+            "present_count": summary.cost_field_count,
+            "observed_cost_usd": summary.cost_usd,
+            "evidence": evidence_class(observed=summary.cost_field_count > 0),
+        },
+        "context": {
+            "status": "missing",
+            "evidence": EVIDENCE_UNAVAILABLE,
+            "reason": (
+                "Transcript scans do not include live Claude Code context_window data. "
+                "Pass a live statusline snapshot in a future surface to populate context availability."
+            ),
+        },
+        "headroom": build_headroom_availability(summary),
+    }
+def segment_stability(samples: list[PromptSegmentSample], attr: str, window: int) -> tuple[float, int, int]:
+    stabilities: list[float] = []
+    unique_total = 0
+    observed_positions = 0
+    for pos in range(window):
+        values: list[str] = []
+        for sample in samples:
+            hashes = getattr(sample, attr)
+            if len(hashes) > pos:
+                values.append(hashes[pos])
+        if not values:
+            continue
+        counts = Counter(values)
+        observed_positions += 1
+        unique_total += len(counts)
+        stabilities.append(max(counts.values()) / len(values))
+    if not stabilities:
+        return 0.0, 0, 0
+    return sum(stabilities) / len(stabilities), unique_total, observed_positions
+def segment_position_stats(samples: list[PromptSegmentSample], attr: str, window: int) -> list[dict[str, Any]]:
+    stats: list[dict[str, Any]] = []
+    for pos in range(window):
+        values: list[str] = []
+        for sample in samples:
+            hashes = getattr(sample, attr)
+            if len(hashes) > pos:
+                values.append(hashes[pos])
+        if not values:
+            continue
+        counts = Counter(values)
+        stability = max(counts.values()) / len(values)
+        stats.append({
+            "position": pos,
+            "stability": stability,
+            "volatile_share": 1.0 - stability,
+            "unique_hashes": len(counts),
+        })
+    return stats
+def prompt_window_overlap_counts(samples: list[PromptSegmentSample]) -> tuple[int, int]:
+    """Return (non_overlapping, overlapping) prefix/tail evidence counts.
+    Prefix and tail segment windows are independent evidence only when the
+    sampled prompt has enough segments for the configured windows not to share
+    positions. Short prompts are still useful, but prefix-vs-tail deltas from
+    overlapping windows are lower-confidence diagnostics.
+    """
+    non_overlapping = 0
+    overlapping = 0
+    for sample in samples:
+        if sample.segment_count >= PROMPT_AUDIT_PREFIX_SEGMENTS + PROMPT_AUDIT_TAIL_SEGMENTS:
+            non_overlapping += 1
+        else:
+            overlapping += 1
+    return non_overlapping, overlapping
+def build_cache_friendliness(summary: UsageSummary) -> dict[str, Any]:
+    """Build the heuristic prompt cache-friendliness report for a scan summary.
+    The report compares how much user-prompt segment hashes churn in the prefix
+    window versus the tail window of the sampled prompts held in
+    ``summary.prompt_cache_audit``.
+    Returns:
+        A dict with ``status``, ``confidence``, ``evidence``, sampling counters,
+        ``signals``, ``findings`` and ``caveats``. When there are no samples the
+        layout signals are ``None`` and ``findings`` is empty. Otherwise at most
+        PROMPT_AUDIT_MAX_FINDINGS findings are returned; the only finding
+        produced here is "volatile-content-near-prefix".
+    """
+    audit = summary.prompt_cache_audit
+    # Any skipped file/record, parse error, or capped prompt record means the
+    # evidence is incomplete.
+    skipped = bool(
+        summary.skipped_files
+        or summary.skipped_records
+        or summary.parse_errors
+        or audit.capped_records
+        or audit.prompt_collection_capped_records
+    )
+    samples = audit.samples
+    if not samples:
+        # No prompt samples: layout cannot be judged, so only the provider cache
+        # telemetry signals are passed through.
+        return {
+            "status": "partial" if skipped else "missing",
+            "confidence": "partial" if skipped else "unavailable",
+            "evidence": EVIDENCE_UNAVAILABLE,
+            "heuristic": True,
+            "sampled_records": audit.sampled_records,
+            "analyzed_prompt_records": 0,
+            "non_overlapping_prompt_records": 0,
+            "overlapping_prompt_records": 0,
+            "prefix_tail_windows_overlap": False,
+            "prompt_collection_capped_records": audit.prompt_collection_capped_records,
+            "skipped_evidence": skipped,
+            "segment_window": {"prefix_segments": PROMPT_AUDIT_PREFIX_SEGMENTS, "tail_segments": PROMPT_AUDIT_TAIL_SEGMENTS},
+            "signals": {
+                "stable_prefix_share": None,
+                "volatile_prefix_share": None,
+                "volatile_tail_share": None,
+                "cache_reuse_ratio": summary.cache_amortization if summary.cache_amortization_defined else None,
+                "cache_read_share": summary.cache_hit_rate,
+            },
+            "findings": [],
+            "caveats": [
+                "No allowlisted user prompt text was found in scanned transcript records; cache layout cannot be inferred.",
+                "Deep or broad prompt content structures are bounded and skipped rather than recursively expanded.",
+                "Provider cache token fields, when present, remain diagnostic telemetry rather than ContextGuard-caused token reduction.",
+            ],
+        }
+    prefix_stability, prefix_unique, prefix_positions = segment_stability(samples, "prefix_hashes", PROMPT_AUDIT_PREFIX_SEGMENTS)
+    tail_stability, tail_unique, tail_positions = segment_stability(samples, "tail_hashes", PROMPT_AUDIT_TAIL_SEGMENTS)
+    prefix_position_stats = segment_position_stats(samples, "prefix_hashes", PROMPT_AUDIT_PREFIX_SEGMENTS)
+    non_overlapping_prompt_records, overlapping_prompt_records = prompt_window_overlap_counts(samples)
+    prefix_tail_windows_overlap = overlapping_prompt_records > 0
+    # Volatility is the complement of the averaged per-position stability.
+    volatile_prefix = 1.0 - prefix_stability
+    volatile_tail = 1.0 - tail_stability
+    # The single most volatile prefix position, or None when no position was observed.
+    most_volatile_prefix = max(prefix_position_stats, key=lambda item: item["volatile_share"], default=None)
+    max_prefix_position_volatile = float(most_volatile_prefix["volatile_share"]) if most_volatile_prefix else 0.0
+    analyzed = audit.analyzed_prompt_records
+    # Downgrade to partial on incomplete evidence, too few analyzed records, or
+    # when no sample has independent prefix and tail windows.
+    status = "available"
+    if skipped or analyzed < PROMPT_AUDIT_MIN_RECORDS or non_overlapping_prompt_records == 0:
+        status = "partial"
+    confidence = "partial" if status == "partial" or prefix_tail_windows_overlap else "observed"
+    # Trigger 1: the prefix window as a whole churns, and clearly more than the tail.
+    average_prefix_churn = (
+        volatile_prefix >= PROMPT_PREFIX_VOLATILE_THRESHOLD
+        and (volatile_prefix - volatile_tail) >= PROMPT_PREFIX_TAIL_CHURN_DELTA
+    )
+    # Trigger 2: a single prefix position churns, and clearly more than the tail.
+    early_prefix_churn = (
+        max_prefix_position_volatile >= PROMPT_PREFIX_VOLATILE_THRESHOLD
+        and (max_prefix_position_volatile - volatile_tail) >= PROMPT_PREFIX_TAIL_CHURN_DELTA
+    )
+    findings: list[dict[str, Any]] = []
+    if analyzed >= PROMPT_AUDIT_MIN_RECORDS and (average_prefix_churn or early_prefix_churn):
+        findings.append({
+            "id": "volatile-content-near-prefix",
+            "severity": "P1",
+            "confidence": confidence,
+            "title": "Volatile content appears near prompt prefix",
+            "reason": (
+                "Observed user prompt segment hashes churn much more near the prefix than in the tail window; "
+                "provider cache telemetry is used only as corroborating diagnostic context."
+            ),
+            "action": "Move generated logs, diffs, file evidence, and run-specific context after stable instructions and reusable policy text.",
+            "heuristic": True,
+            "evidence": {
+                "records": analyzed,
+                "non_overlapping_prompt_records": non_overlapping_prompt_records,
+                "overlapping_prompt_records": overlapping_prompt_records,
+                "prefix_tail_windows_overlap": prefix_tail_windows_overlap,
+                "confidence": confidence,
+                "prefix_positions": prefix_positions,
+                "tail_positions": tail_positions,
+                "prefix_unique_hashes": prefix_unique,
+                "tail_unique_hashes": tail_unique,
+                "volatile_prefix_share": round(volatile_prefix, 4),
+                "volatile_tail_share": round(volatile_tail, 4),
+                "max_prefix_position_volatile_share": round(max_prefix_position_volatile, 4),
+                "max_prefix_position": most_volatile_prefix["position"] if most_volatile_prefix else None,
+                # The window-average trigger is reported in preference to the single-position one.
+                "trigger": "prefix_window_average" if average_prefix_churn else "early_prefix_position",
+                "cache_creation": summary.tokens.get("cache_creation", 0),
+                "cache_read": summary.tokens.get("cache_read", 0),
+            },
+        })
+    findings = findings[:PROMPT_AUDIT_MAX_FINDINGS]
+    return {
+        "status": status,
+        "confidence": confidence,
+        "evidence": EVIDENCE_OBSERVED,
+        "heuristic": True,
+        "sampled_records": audit.sampled_records,
+        "analyzed_prompt_records": analyzed,
+        "non_overlapping_prompt_records": non_overlapping_prompt_records,
+        "overlapping_prompt_records": overlapping_prompt_records,
+        "prefix_tail_windows_overlap": prefix_tail_windows_overlap,
+        "capped_records": audit.capped_records,
+        "prompt_collection_capped_records": audit.prompt_collection_capped_records,
+        "skipped_evidence": skipped,
+        "total_segments": audit.total_segments,
+        "total_bytes_sampled": audit.total_bytes_sampled,
+        "redacted_segments": audit.redacted_segments,
+        "segment_window": {"prefix_segments": PROMPT_AUDIT_PREFIX_SEGMENTS, "tail_segments": PROMPT_AUDIT_TAIL_SEGMENTS},
+        "thresholds": {
+            "min_records": PROMPT_AUDIT_MIN_RECORDS,
+            "prefix_volatile_threshold": PROMPT_PREFIX_VOLATILE_THRESHOLD,
+            "prefix_tail_churn_delta": PROMPT_PREFIX_TAIL_CHURN_DELTA,
+        },
+        "signals": {
+            "stable_prefix_share": round(prefix_stability, 4),
+            "volatile_prefix_share": round(volatile_prefix, 4),
+            "volatile_tail_share": round(volatile_tail, 4),
+            "max_prefix_position_volatile_share": round(max_prefix_position_volatile, 4),
+            "cache_reuse_ratio": summary.cache_amortization if summary.cache_amortization_defined else None,
+            "cache_read_share": summary.cache_hit_rate,
+        },
+        "findings": findings,
+        "caveats": [
+            "Prompt layout findings are heuristic and based on bounded redacted user-message segment hashes, not raw prompt text or exact provider cache-prefix state.",
+            "When prefix and tail segment windows overlap in short prompts, cache-friendliness findings are partial-confidence diagnostics.",
+            "Deep or broad prompt content structures are bounded and make cache-friendliness evidence partial.",
+            "Provider cache read/write fields are diagnostic telemetry and do not prove ContextGuard-caused token reduction.",
+            "Unknown transcript prompt schemas are skipped rather than inferred aggressively.",
+        ],
+    }
+def cache_friendliness_for_summary(summary: UsageSummary) -> dict[str, Any]:
+    if summary.cache_friendliness_cache is None:
+        summary.cache_friendliness_cache = build_cache_friendliness(summary)
+    return summary.cache_friendliness_cache
+def build_metric_caveats(summary: UsageSummary) -> list[str]:
+    caveats = [
+        "Values are observed from local Claude Code transcript JSON/JSONL fields and are not official billing records.",
+        "Claude Code transcript schemas may change; skipped files/records and parse errors reduce confidence.",
+        "cache-read share is cache_read / (input + cache_read + cache_creation), not a provider billing hit-rate.",
+        "reuse ratio is cache_read / cache_creation when cache_creation is non-zero; it is undefined for cache-cold sessions.",
+        "each metric carries an evidence class: observed (read from transcript fields), inferred "
+        "(derived via a documented formula), or unavailable (not determinable from a historical scan).",
+        "context headroom is unavailable from transcript scans; it requires a live statusline snapshot to be observed.",
+    ]
+    if summary.cost_field_count == 0:
+        caveats.append("No cost fields were observed; use Claude Console or official billing exports for invoice-grade cost.")
+    if not (summary.token_field_presence.get("cache_read") or summary.token_field_presence.get("cache_creation")):
+        caveats.append("No cache fields were observed; hide cache UI or label cache availability as missing.")
+    if summary.skipped_files or summary.skipped_records:
+        caveats.append("Some transcript files or records were skipped, so hotspot rankings may be incomplete.")
+    return caveats
+def feasibility_json(
+    summary: UsageSummary,
+    top: int = 15,
+    include_recommendations: bool = False,
+    limits: ScanLimits | None = None,
+    *,
+    generated_at: str | None = None,
+) -> dict[str, Any]:
+    generated_at = generated_at or utc_now_iso()
+    base = summary_json(summary, top, include_recommendations=include_recommendations, limits=limits)
+    availability = build_metric_availability(summary)
+    integrity = scan_integrity(summary)
+    stable_tokens = stable_token_counter(summary.tokens)
+    stable_total_tokens = sum(stable_tokens.values())
+    cache_friendliness = cache_friendliness_for_summary(summary)
+    return {
+        "schema_version": FEASIBILITY_SCHEMA_VERSION,
+        "producer": FEASIBILITY_PRODUCER,
+        "generated_at": generated_at,
+        "consumer_contract": {
+            "stable_top_level_fields": [
+                "schema_version",
+                "producer",
+                "generated_at",
+                "source_kind",
+                "source_freshness",
+                "scan_integrity",
+                "metric_availability",
+                "metric_caveats",
+                "redaction_mode",
+                "context_availability",
+                "headroom_availability",
+                "cache_friendliness",
+                "totals",
+            ],
+            "diagnostic_fields": ["summary"],
+            "summary_contract": (
+                "summary is the legacy audit JSON payload for diagnostics and backward compatibility; "
+                "new GUI prototypes should bind to stable top-level feasibility fields first."
+            ),
+        },
+        "source_kind": "historical_transcript_scan",
+        "source_freshness": {
+            "status": "snapshot_at_scan_time",
+            "live": False,
+            "generated_at": generated_at,
+            "description": "Local transcript files were scanned when this report was generated; this is not a live statusline snapshot.",
+        },
+        "scan_integrity": integrity,
+        "metric_availability": availability,
+        "metric_caveats": build_metric_caveats(summary),
+        "redaction_mode": {
+            "paths": "basename_plus_stable_hash_by_default",
+            "commands": "command_category_plus_stable_hash_by_default",
+            "secret_like_values": "pattern_redacted",
+            "raw_path_and_command_flags": ["--show-paths", "--show-commands"],
+        },
+        "context_availability": availability["context"],
+        "headroom_availability": availability["headroom"],
+        "cache_friendliness": cache_friendliness,
+        "totals": {
+            "total_tokens": stable_total_tokens,
+            "tokens": stable_tokens,
+            "cost_usd_observed": summary.cost_usd,
+            "cache_read_share": summary.cache_hit_rate,
+            "cache_reuse_ratio": summary.cache_amortization if summary.cache_amortization_defined else None,
+        },
+        "summary": base,
+    }
+def recommendation(
+    ident: str,
+    title: str,
+    reason: str,
+    action: str,
+    priority: str,
+    evidence: dict[str, Any],
+) -> dict[str, Any]:
+    return {
+        "id": ident,
+        "priority": priority,
+        "title": title,
+        "reason": reason,
+        "action": action,
+        "evidence": evidence,
+    }
+def build_recommendations(summary: UsageSummary, top: int) -> list[dict[str, Any]]:
+    """Derive recommendations from the token, cache, command, file and model data in ``summary``.
+    Args:
+        summary: Scan result to analyse.
+        top: How many of the most common command hints to inspect for test runners.
+    Returns:
+        Recommendation dicts in the order the checks run below. When no tokens
+        were observed the list holds only the "no-usage-found" entry.
+    """
+    recs: list[dict[str, Any]] = []
+    total = max(0, summary.total_tokens)
+    if total == 0:
+        # Nothing to analyse; this early return also guards the ratio divisions below.
+        recs.append(recommendation(
+            "no-usage-found",
+            "No token usage found in scanned transcripts",
+            "The scanner did not find recognizable Claude Code usage fields.",
+            "Verify the transcript path or run again against ~/.claude/projects after more Claude Code activity.",
+            "P2",
+            {"files_scanned": summary.files, "records": summary.records},
+        ))
+        return recs
+    output_tokens = summary.tokens.get("output", 0)
+    input_tokens = summary.tokens.get("input", 0)
+    cache_creation = summary.tokens.get("cache_creation", 0)
+    cache_read = summary.tokens.get("cache_read", 0)
+    output_ratio = output_tokens / total
+    input_ratio = input_tokens / total
+    # Promote the first prompt-layout finding, if any, to a recommendation.
+    cache_friendliness = cache_friendliness_for_summary(summary)
+    for finding in cache_friendliness.get("findings", []):
+        if isinstance(finding, dict) and finding.get("id") == "volatile-content-near-prefix":
+            # Copy the evidence so the finding's own dict is not mutated.
+            evidence = dict(finding.get("evidence") or {})
+            evidence["heuristic"] = True
+            if finding.get("confidence"):
+                evidence["confidence"] = finding.get("confidence")
+            rec = recommendation(
+                "move-volatile-context-after-stable-prefix",
+                "Volatile context appears before stable prompt prefix",
+                str(finding.get("reason") or "Observed prompt prefix churn is higher than tail churn."),
+                str(finding.get("action") or "Move run-specific context after stable instructions."),
+                str(finding.get("severity") or "P1"),
+                evidence,
+            )
+            rec["heuristic"] = True
+            if finding.get("confidence"):
+                rec["confidence"] = finding.get("confidence")
+            recs.append(rec)
+            break
+    # Output-heavy usage: large absolute output or a large share of all tokens.
+    if output_tokens >= 5_000 or output_ratio >= 0.35:
+        recs.append(recommendation(
+            "trim-output-heavy-sessions",
+            "Output tokens are a major hotspot",
+            f"Output accounts for {output_ratio:.0%} of observed tokens.",
+            "Enable/keep Bash output trimming and add runner-aware failure extraction for repeated test/build commands.",
+            "P0",
+            {"output_tokens": output_tokens, "total_tokens": total},
+        ))
+    # Input-heavy usage: large absolute input or a large share of all tokens.
+    if input_tokens >= 5_000 or input_ratio >= 0.45:
+        recs.append(recommendation(
+            "reduce-large-reads",
+            "Input tokens are a major hotspot",
+            f"Input accounts for {input_ratio:.0%} of observed tokens.",
+            "Prefer diff-first review, symbol-scoped reads, and large-file read guards before sending whole files to Claude.",
+            "P0",
+            {"input_tokens": input_tokens, "total_tokens": total},
+        ))
+    # Substantial cache writes that were read back less than half as often.
+    if (
+        cache_creation >= 10_000
+        and cache_read >= 1
+        and summary.cache_amortization < 0.5
+    ):
+        recs.append(recommendation(
+            "improve-prompt-cache-reuse",
+            "Prompt cache reuse looks low",
+            (
+                f"Cache amortization is {summary.cache_amortization:.2f}x "
+                f"(cache_read={cache_read}, cache_creation={cache_creation}); each cached prefix is barely re-served."
+            ),
+            "Keep stable instructions early, move volatile context later, and avoid editing large instruction files during active sessions.",
+            "P1",
+            {
+                "cache_creation": cache_creation,
+                "cache_read": cache_read,
+                "cache_amortization": round(summary.cache_amortization, 4),
+                "cache_hit_rate": round(summary.cache_hit_rate, 4),
+            },
+        ))
+    # Very large cache writes with moderate reuse: suggest evaluating the longer TTL.
+    if cache_creation >= 50_000 and 1.0 <= summary.cache_amortization < 5.0:
+        recs.append(recommendation(
+            "evaluate-1h-ttl-cache",
+            "Cache writes are large; evaluate the 1h TTL cache beta",
+            (
+                f"Heuristic only — cache amortization {summary.cache_amortization:.2f}x with "
+                f"{cache_creation} write tokens; absolute write cost is high and reuse is moderate. "
+                "This metric does not inspect timestamps, so confirm reuse spans >5min in a sample "
+                "session before enabling 1h TTL."
+            ),
+            (
+                "If sessions reuse the same prefix beyond the 5-minute default TTL, evaluate the 1h prompt cache "
+                "beta (write 2x, read 0.1x). It pays off when reuse spans the gap between two 5-min cache writes."
+            ),
+            "P2",
+            {
+                "cache_creation": cache_creation,
+                "cache_read": cache_read,
+                "cache_amortization": round(summary.cache_amortization, 4),
+                "cache_hit_rate": round(summary.cache_hit_rate, 4),
+                "heuristic": True,
+            },
+        ))
+    # Heavy cache reads: remind consumers that provider caching is not token reduction.
+    if cache_read >= 10_000 and summary.cache_hit_rate >= 0.5:
+        rec = recommendation(
+            "separate-cache-discounts-from-token-reduction",
+            "Provider cache reuse is visible, but it is not token reduction",
+            (
+                f"Cache read share is {summary.cache_hit_rate:.0%}; this can reduce provider input cost/latency, "
+                "but the prompt content may still be sent logically and should not be counted as ContextGuard token reduction."
+            ),
+            (
+                "Report cache_read/cache_creation separately from bytes avoided by local guards, and keep stable cached "
+                "instructions before volatile evidence to preserve provider-cache eligibility."
+            ),
+            "P2",
+            {
+                "cache_read": cache_read,
+                "cache_creation": cache_creation,
+                "cache_hit_rate": round(summary.cache_hit_rate, 4),
+                "cache_amortization": round(summary.cache_amortization, 4) if summary.cache_amortization_defined else None,
+                "provider_cache_telemetry_only": True,
+            },
+        )
+        rec["heuristic"] = True
+        recs.append(rec)
+    # Recommend runner-aware summaries for the first test-runner command among the top hints.
+    for command, record_count in summary.by_command.most_common(top):
+        lowered = command.lower()
+        if any(marker in lowered for marker in ("pytest", "jest", "vitest", "go test", "cargo test", "npm test", "pnpm test", "yarn test")):
+            recs.append(recommendation(
+                "runner-aware-test-summary",
+                "Test command appears in transcript records",
+                "A test command category was observed in transcript records; token totals are session-level, not precise per-command billing.",
+                "Route this command through runner-aware failure extraction so Claude sees failing test names, file:line, assertion text, and rerun commands only.",
+                "P0",
+                {"command_hint": command, "record_count": record_count},
+            ))
+            break
+    # Only the single largest file is examined, although three are fetched.
+    top_files = summary.by_file.most_common(3)
+    if top_files:
+        largest_file, largest_tokens = top_files[0]
+        if largest_tokens >= max(1_000, total * 0.25):
+            recs.append(recommendation(
+                "inspect-costliest-transcript",
+                "One transcript file dominates observed usage",
+                "A single transcript file accounts for a large share of observed tokens.",
+                "Inspect this session first, then use /clear between unrelated tasks or /compact during long-running work.",
+                "P1",
+                {"file": largest_file, "tokens": largest_tokens, "share": round(largest_tokens / total, 3)},
+            ))
+    if summary.by_model:
+        # Collapse each model's per-bucket token counts into a single total.
+        model_totals = Counter({model: sum(tokens.values()) for model, tokens in summary.by_model.items()})
+        model, model_tokens = model_totals.most_common(1)[0]
+        if model != "unknown" and model_tokens >= max(2_000, total * 0.5):
+            recs.append(recommendation(
+                "route-heavy-work-by-model",
+                "One model carries most observed token usage",
+                "A single model dominates the observed transcript tokens.",
+                "Use lower-cost/auxiliary models for broad search, logs, and first-pass summaries; reserve Claude for final reasoning and edits.",
+                "P1",
+                {"model": model, "tokens": model_tokens, "share": round(model_tokens / total, 3)},
+            ))
+    # Flag scan gaps last so consumers know the advice above may be incomplete.
+    if summary.skipped_files or summary.skipped_records:
+        recs.append(recommendation(
+            "fix-transcript-scan-gaps",
+            "Some transcript data was skipped",
+            "Skipped records can hide token hotspots and make recommendations less reliable.",
+            "Review parse warnings and rerun with a narrower path if malformed or unrelated JSON files are mixed in.",
+            "P2",
+            {"skipped_files": summary.skipped_files, "skipped_records": summary.skipped_records},
+        ))
+    return recs
+def summary_json(
+    summary: UsageSummary,
+    top: int = 15,
+    include_recommendations: bool = False,
+    limits: ScanLimits | None = None,
+) -> dict[str, Any]:
+    limits = limits or ScanLimits()
+    data = {
+        "files": summary.files,
+        "records": summary.records,
+        "skipped_files": summary.skipped_files,
+        "skipped_records": summary.skipped_records,
+        "parse_errors": summary.parse_errors,
+        "scan_limits": {
+            "max_file_bytes": limits.max_file_bytes,
+            "max_line_bytes": limits.max_line_bytes,
+        },
+        "total_tokens": summary.total_tokens,
+        "tokens": dict(summary.tokens),
+        "cache_metrics": {
+            "cache_hit_rate": round(summary.cache_hit_rate, 4),
+            "cache_amortization": round(summary.cache_amortization, 4),
+            "cache_amortization_defined": summary.cache_amortization_defined,
+            "cache_read_tokens": summary.tokens.get("cache_read", 0),
+            "cache_creation_tokens": summary.tokens.get("cache_creation", 0),
+            "input_tokens": summary.tokens.get("input", 0),
+        },
+        "cost_usd_observed": summary.cost_usd,
+        "by_model": {k: dict(v) for k, v in summary.by_model.items()},
+        "by_query_source": {k: dict(v) for k, v in summary.by_query_source.items()},
+        "top_files": counter_json(summary.by_file, top),
+        "top_commands": counter_json(summary.by_command, top),
+        "top_tools": counter_json(summary.by_tool, top),
+        "cache_friendliness": cache_friendliness_for_summary(summary),
+    }
+    if include_recommendations:
+        data["recommendations"] = build_recommendations(summary, top)
+    return data
+def print_recommendations(summary: UsageSummary, top: int) -> None:
+    print("\nRecommendations")
+    for idx, rec in enumerate(build_recommendations(summary, top), 1):
+        print(f"{idx}. [{rec['priority']}] {rec['title']}")
+        print(f"   reason: {rec['reason']}")
+        print(f"   action: {rec['action']}")
+        if rec.get("evidence"):
+            print(f"   evidence: {json.dumps(rec['evidence'], ensure_ascii=False, sort_keys=True)}")
+def main() -> int:
+    parser = argparse.ArgumentParser()
+    parser.add_argument("paths", nargs="*", default=[os.path.expanduser("~/.claude/projects")])
+    parser.add_argument("--top", type=int, default=15)
+    parser.add_argument("--json", action="store_true")
+    parser.add_argument(
+        "--feasibility-json",
+        action="store_true",
+        help="emit a GUI-consumable local metric availability report with schema, freshness, caveats, and redaction metadata",
+    )
+    parser.add_argument("--recommend", action="store_true", help="Print concrete token-saving recommendations")
+    parser.add_argument(
+        "--show-paths",
+        action="store_true",
+        help="Show transcript paths instead of basename+hash labels; local debugging only; secret-shaped path components remain redacted",
+    )
+    parser.add_argument("--show-commands", action="store_true", help="Show redacted command strings instead of command category+hash labels")
+    parser.add_argument(
+        "--max-file-bytes",
+        type=int,
+        default=DEFAULT_MAX_FILE_BYTES,
+        help="skip transcript files larger than this many bytes (default: 50 MiB)",
+    )
+    parser.add_argument(
+        "--max-line-bytes",
+        type=int,
+        default=DEFAULT_MAX_LINE_BYTES,
+        help="skip individual JSONL records larger than this many bytes (default: 2 MiB)",
+    )
+    args = parser.parse_args()
+    limits = ScanLimits(
+        max_file_bytes=require_scan_limit(parser, "--max-file-bytes", args.max_file_bytes, MAX_FILE_BYTES_LIMIT),
+        max_line_bytes=require_scan_limit(parser, "--max-line-bytes", args.max_line_bytes, MAX_LINE_BYTES_LIMIT),
+    )
+    summary = scan(args.paths, show_paths=args.show_paths, show_commands=args.show_commands, limits=limits)
+    if args.feasibility_json:
+        print(json.dumps(
+            feasibility_json(summary, args.top, include_recommendations=args.recommend, limits=limits),
+            indent=2,
+            sort_keys=True,
+        ))
+        return 0
+    if args.json:
+        print(json.dumps(
+            summary_json(summary, args.top, include_recommendations=args.recommend, limits=limits),
+            indent=2,
+            sort_keys=True,
+        ))
+        return 0
+    print("Claude Code transcript usage audit")
+    print(
+        f"files_scanned={summary.files} records={summary.records} "
+        f"skipped_files={summary.skipped_files} skipped_records={summary.skipped_records}"
+    )
+    print(f"scan_limits=max_file_bytes:{limits.max_file_bytes} max_line_bytes:{limits.max_line_bytes}")
+    print(f"observed_total_tokens={summary.total_tokens}")
+    if summary.cost_usd:
+        print(f"observed_cost_usd={summary.cost_usd:.4f}")
+    if summary.parse_errors:
+        print("\nWarnings")
+        for warning in summary.parse_errors:
+            print(f"  - {warning}")
+    print_counter("Token buckets", summary.tokens, args.top)
+    print("\nCache reuse")
+    print(f"  cache_hit_rate           {summary.cache_hit_rate:.2%}")
+    if summary.cache_amortization_defined:
+        print(f"  cache_amortization       {summary.cache_amortization:.2f}x")
+    else:
+        print("  cache_amortization       n/a (no cache writes observed)")
+    print(f"  cache_read_tokens        {summary.tokens.get('cache_read', 0):12d}")
+    print(f"  cache_creation_tokens    {summary.tokens.get('cache_creation', 0):12d}")
+    cache_friendliness = cache_friendliness_for_summary(summary)
+    if cache_friendliness.get("status") != "missing":
+        signals = cache_friendliness.get("signals", {})
+        print("\nCache friendliness")
+        print(f"  status                  {cache_friendliness.get('status')}")
+        print(f"  heuristic               {str(cache_friendliness.get('heuristic')).lower()}")
+        print(f"  analyzed_prompt_records {cache_friendliness.get('analyzed_prompt_records', 0):12d}")
+        stable_prefix = signals.get("stable_prefix_share")
+        volatile_prefix = signals.get("volatile_prefix_share")
+        volatile_tail = signals.get("volatile_tail_share")
+        if stable_prefix is not None:
+            print(f"  stable_prefix_share     {stable_prefix:.2%}")
+        if volatile_prefix is not None:
+            print(f"  volatile_prefix_share   {volatile_prefix:.2%}")
+        if volatile_tail is not None:
+            print(f"  volatile_tail_share     {volatile_tail:.2%}")
+        for finding in cache_friendliness.get("findings", []):
+            if isinstance(finding, dict):
+                print(f"  finding                 [{finding.get('severity')}] {finding.get('id')}: {finding.get('title')}")
+    model_totals = Counter({model: sum(tokens.values()) for model, tokens in summary.by_model.items()})
+    print_counter("By model", model_totals, args.top)
+    source_totals = Counter({src: sum(tokens.values()) for src, tokens in summary.by_query_source.items()})
+    print_counter("By query_source", source_totals, args.top)
+    print_counter("Top transcript files", summary.by_file, args.top)
+    print_counter("Top command hints observed", summary.by_command, args.top)
+    print_counter("Top tools observed", summary.by_tool, args.top)
+    if args.recommend:
+        print_recommendations(summary, args.top)
+    return 0
+if __name__ == "__main__":  # only when executed as a script, not on import
+    raise SystemExit(main())  # main()'s return value becomes the process exit status