npm - @seanyao/roll - Versions diffs - 0.5.0 → 2.602.1 - Mend

@seanyao/roll 0.5.0 → 2.602.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (181) hide show

package/CHANGELOG.md +717 -0
package/LICENSE +21 -0
package/README.md +65 -165
package/bin/dream-test-quality-scan +110 -0
package/bin/roll +14897 -815
package/conventions/config.yaml +17 -1
package/conventions/global/AGENTS.md +146 -100
package/conventions/global/CLAUDE.md +1 -21
package/conventions/global/GEMINI.md +8 -22
package/conventions/global/project_rules.md +9 -0
package/conventions/templates/backend-service/AGENTS.md +30 -81
package/conventions/templates/backend-service/GEMINI.md +3 -3
package/conventions/templates/backend-service/project_rules.md +16 -0
package/conventions/templates/cli/AGENTS.md +31 -58
package/conventions/templates/cli/CLAUDE.md +3 -5
package/conventions/templates/cli/GEMINI.md +3 -3
package/conventions/templates/cli/project_rules.md +16 -0
package/conventions/templates/frontend-only/AGENTS.md +29 -64
package/conventions/templates/frontend-only/GEMINI.md +3 -3
package/conventions/templates/frontend-only/project_rules.md +14 -0
package/conventions/templates/fullstack/AGENTS.md +31 -79
package/conventions/templates/fullstack/CLAUDE.md +1 -1
package/conventions/templates/fullstack/GEMINI.md +3 -3
package/conventions/templates/fullstack/project_rules.md +15 -0
package/lib/README.md +42 -0
package/lib/__pycache__/github_sync.cpython-314.pyc +0 -0
package/lib/__pycache__/loop-fmt.cpython-314.pyc +0 -0
package/lib/__pycache__/loop_result_eval.cpython-314.pyc +0 -0
package/lib/__pycache__/loop_unstick.cpython-314.pyc +0 -0
package/lib/__pycache__/model_prices.cpython-314.pyc +0 -0
package/lib/__pycache__/prices_fetcher.cpython-314.pyc +0 -0
package/lib/__pycache__/roll-home.cpython-314.pyc +0 -0
package/lib/__pycache__/roll-loop-status.cpython-314.pyc +0 -0
package/lib/__pycache__/roll_git.cpython-314.pyc +0 -0
package/lib/__pycache__/roll_render.cpython-314.pyc +0 -0
package/lib/__pycache__/slides-render.cpython-314.pyc +0 -0
package/lib/agent_usage/README.md +49 -0
package/lib/agent_usage/__init__.py +108 -0
package/lib/agent_usage/__pycache__/__init__.cpython-314.pyc +0 -0
package/lib/agent_usage/__pycache__/gemini.cpython-314.pyc +0 -0
package/lib/agent_usage/__pycache__/kimi.cpython-314.pyc +0 -0
package/lib/agent_usage/__pycache__/openai.cpython-314.pyc +0 -0
package/lib/agent_usage/__pycache__/pi.cpython-314.pyc +0 -0
package/lib/agent_usage/__pycache__/pi_emit.cpython-314.pyc +0 -0
package/lib/agent_usage/__pycache__/qwen.cpython-314.pyc +0 -0
package/lib/agent_usage/gemini.py +127 -0
package/lib/agent_usage/kimi.py +278 -0
package/lib/agent_usage/kimi_emit.py +123 -0
package/lib/agent_usage/openai.py +126 -0
package/lib/agent_usage/pi.py +200 -0
package/lib/agent_usage/pi_emit.py +135 -0
package/lib/agent_usage/qwen.py +128 -0
package/lib/backfill-pi-usage.py +243 -0
package/lib/changelog_audit.py +155 -0
package/lib/changelog_generate.py +263 -0
package/lib/context_feed_budget.sh +194 -0
package/lib/github_sync.py +876 -0
package/lib/i18n/README.md +54 -0
package/lib/i18n/agent.sh +75 -0
package/lib/i18n/alert.sh +20 -0
package/lib/i18n/backlog.sh +96 -0
package/lib/i18n/brief.sh +5 -0
package/lib/i18n/changelog.sh +5 -0
package/lib/i18n/ci.sh +15 -0
package/lib/i18n/debug.sh +0 -0
package/lib/i18n/doctor.sh +44 -0
package/lib/i18n/dream.sh +0 -0
package/lib/i18n/init.sh +91 -0
package/lib/i18n/lang.sh +10 -0
package/lib/i18n/loop.sh +140 -0
package/lib/i18n/migrate.sh +74 -0
package/lib/i18n/offboard.sh +31 -0
package/lib/i18n/onboard.sh +0 -0
package/lib/i18n/peer.sh +41 -0
package/lib/i18n/peer_help.sh +25 -0
package/lib/i18n/peer_reset.sh +7 -0
package/lib/i18n/peer_status.sh +5 -0
package/lib/i18n/prices.sh +3 -0
package/lib/i18n/prices_refresh.sh +17 -0
package/lib/i18n/prices_show.sh +7 -0
package/lib/i18n/propose.sh +0 -0
package/lib/i18n/release.sh +0 -0
package/lib/i18n/research.sh +0 -0
package/lib/i18n/review_pr.sh +0 -0
package/lib/i18n/sentinel.sh +0 -0
package/lib/i18n/setup.sh +3 -0
package/lib/i18n/shared.sh +157 -0
package/lib/i18n/skills/roll-brief.sh +47 -0
package/lib/i18n/skills/roll-build.sh +97 -0
package/lib/i18n/skills/roll-design.sh +18 -0
package/lib/i18n/skills/roll-fix.sh +53 -0
package/lib/i18n/skills/roll-loop.sh +28 -0
package/lib/i18n/skills/roll-onboard.sh +33 -0
package/lib/i18n/skills_catalog.sh +30 -0
package/lib/i18n/slides.sh +3 -0
package/lib/i18n/slides_build.sh +38 -0
package/lib/i18n/slides_delete.sh +19 -0
package/lib/i18n/slides_list.sh +14 -0
package/lib/i18n/slides_logs.sh +12 -0
package/lib/i18n/slides_new.sh +15 -0
package/lib/i18n/slides_preview.sh +14 -0
package/lib/i18n/slides_templates.sh +7 -0
package/lib/i18n/status.sh +21 -0
package/lib/i18n/update.sh +24 -0
package/lib/i18n.sh +211 -0
package/lib/loop-exit-summary.py +393 -0
package/lib/loop-fmt.py +589 -0
package/lib/loop_pick_agent.py +316 -0
package/lib/loop_result_eval.py +469 -0
package/lib/loop_unstick.py +180 -0
package/lib/model_prices.py +186 -0
package/lib/prices/README.md +35 -0
package/lib/prices/snapshot-2026-05-22.json +22 -0
package/lib/prices/snapshot-2026-05-23-deepseek.json +15 -0
package/lib/prices/snapshot-2026-05-23-kimi.json +14 -0
package/lib/prices_fetcher.py +285 -0
package/lib/roll-backlog.py +225 -0
package/lib/roll-brief.py +286 -0
package/lib/roll-help.py +158 -0
package/lib/roll-home.py +556 -0
package/lib/roll-init.py +156 -0
package/lib/roll-loop-status.py +1683 -0
package/lib/roll-loop-story.py +191 -0
package/lib/roll-onboard-render.py +378 -0
package/lib/roll-peer.py +252 -0
package/lib/roll-plan-validate.py +386 -0
package/lib/roll-setup.py +102 -0
package/lib/roll-status.py +367 -0
package/lib/roll_git.py +41 -0
package/lib/roll_render.py +414 -0
package/lib/slides/components/README.md +123 -0
package/lib/slides/components/cards-2.html +9 -0
package/lib/slides/components/cards-3.html +9 -0
package/lib/slides/components/cards-4.html +9 -0
package/lib/slides/components/compare.html +22 -0
package/lib/slides/components/highlight.html +9 -0
package/lib/slides/components/pipeline.html +12 -0
package/lib/slides/components/plain.html +7 -0
package/lib/slides/components/quote.html +4 -0
package/lib/slides/components/timeline.html +9 -0
package/lib/slides/templates/introduction-v3.html +571 -0
package/lib/slides/templates/pitch.html +0 -0
package/lib/slides-render.py +778 -0
package/lib/slides-validate.py +357 -0
package/lib/test_quality_gate.py +143 -0
package/package.json +8 -7
package/skills/roll-.changelog/SKILL.md +406 -33
package/skills/roll-.clarify/SKILL.md +5 -2
package/skills/roll-.dream/SKILL.md +374 -0
package/skills/roll-.echo/SKILL.md +5 -2
package/skills/roll-.qa/SKILL.md +57 -3
package/skills/roll-.review/SKILL.md +42 -3
package/skills/roll-brief/SKILL.md +209 -0
package/skills/roll-build/SKILL.md +308 -63
package/skills/roll-debug/SKILL.md +341 -162
package/skills/roll-debug/injectable-bb.js +263 -0
package/skills/roll-deck/SKILL.md +296 -0
package/skills/roll-design/ENGINEERING_CHECKLIST.md +1 -1
package/skills/roll-design/SKILL.md +727 -94
package/skills/roll-doc/SKILL.md +595 -0
package/skills/roll-doctor/SKILL.md +192 -0
package/skills/roll-fix/SKILL.md +149 -32
package/skills/{roll-jot → roll-idea}/SKILL.md +18 -10
package/skills/roll-loop/SKILL.md +578 -0
package/skills/roll-notes/SKILL.md +103 -0
package/skills/roll-onboard/SKILL.md +234 -0
package/skills/roll-peer/SKILL.md +336 -0
package/skills/roll-propose/SKILL.md +157 -0
package/skills/roll-review-pr/SKILL.md +58 -0
package/skills/roll-sentinel/SKILL.md +11 -2
package/skills/roll-spar/SKILL.md +8 -6
package/template/.github/workflows/ci.yml +5 -2
package/template/AGENTS.md +20 -74
package/skills/roll-research/SKILL.md +0 -307
package/skills/roll-research/references/schema.json +0 -162
package/skills/roll-research/scripts/md_to_pdf.py +0 -289
package/tools/roll-fetch/SKILL.md +0 -182
package/tools/roll-fetch/package.json +0 -15
package/tools/roll-fetch/smart-web-fetch.js +0 -558
package/tools/roll-probe/SKILL.md +0 -84
/package/template/{BACKLOG.md → .roll/backlog.md} +0 -0

package/lib/roll-peer.py ADDED Viewed

@@ -0,0 +1,252 @@
+#!/usr/bin/env python3
+"""roll-peer — v2 terminal view for `roll peer` (US-VIEW-009).
+Renders a cross-agent review log as a turn-based ROUND transcript:
+eyebrow + subject + proposer/reviewer overview + ROUND N sections
+(each carrying agent turns with weight chips) + final VERDICT line
++ artifact path / next-step hint.
+NO_COLOR=1 falls through to glyph + weight + spacing only.
+"""
+from __future__ import annotations
+import argparse
+import os
+import sys
+_LIB_DIR = os.path.dirname(os.path.realpath(__file__))
+if _LIB_DIR not in sys.path:
+    sys.path.insert(0, _LIB_DIR)
+import roll_render
+from roll_render import c, row, COLS
+# ════════════════════════════════════════════════════════════════════════════
+# Agent palette — each agent gets a stable color so reviewer/proposer pairs
+# read at a glance across rounds. Unknown agents fall back to fg.
+# ════════════════════════════════════════════════════════════════════════════
+# Lower-case agent name → palette key. Looked up by _agent_c(), which falls
+# back to "fg" for any name not listed here.
+_AGENT_COLOR = {
+    "claude":   "blue",
+    "codex":    "pink",
+    "kimi":     "amber",
+    "deepseek": "green",
+    "agy":      "purple",   # Antigravity (formerly Gemini CLI)
+    "pi":       "yellow",
+    "opencode": "muted",
+    "trae":     "fg",
+}
+# Weight chip — (glyph, color, label) per turn.weight
+# Weights missing from this table are rendered by _weight_chip() with a "·"
+# glyph in the "muted" color, using the raw weight string as the label.
+_WEIGHTS = {
+    "concern": ("●", "amber", "concern"),
+    "nit":     ("○", "dim",   "nit"),
+    "ack":     ("✓", "green", "ack"),
+    "block":   ("✗", "red",   "block"),
+}
+def _agent_c(name: str) -> str:
+    return _AGENT_COLOR.get(name.lower(), "fg")
+# ════════════════════════════════════════════════════════════════════════════
+# Fixture data (test-only; opt in via ROLL_RENDER_FIXTURE=1)
+# Illustrative cross-agent review: claude proposes, codex reviews
+# ════════════════════════════════════════════════════════════════════════════
+# Header fields: "trigger" feeds _eyebrow(); "story", "title", "pr" and
+# "diff_stat" feed _subject(); "proposer" and "reviewer" feed _pair_overview().
+_FIXTURE_SUBJECT = {
+    "story":     "US-AUTH-014",
+    "title":     "Session refresh fallback when refresh-token API 5xx",
+    "pr":        "#412",
+    "diff_stat": "+184 −37 · 6 files",
+    "trigger":   "complexity=large",
+    "proposer":  "claude",
+    "reviewer":  "codex",
+}
+# One entry per round: "n" and "hint" go to _round_header(); each item of
+# "turns" is an (agent, weight, body) tuple handed to _turn().
+_FIXTURE_ROUNDS = [
+    {
+        "n": 1,
+        "hint": "first pass — proposer ships, reviewer probes",
+        "turns": [
+            ("claude", "concern",
+             "Refresh path swallows 503 silently — caller sees a stale session "
+             "without any signal that re-auth is needed."),
+            ("codex",  "nit",
+             "Naming: `tryRefresh` reads as best-effort, but the retry budget "
+             "actually escalates. Suggest `refreshWithBackoff`."),
+            ("codex",  "block",
+             "Backoff jitter uses Math.random — flakes integration tests. "
+             "Inject the rng so tests can pin it."),
+        ],
+    },
+    {
+        "n": 2,
+        "hint": "proposer revises, reviewer signs off",
+        "turns": [
+            ("claude", "ack",
+             "Renamed to `refreshWithBackoff`; threaded `rng` through the "
+             "config object. Added a test that pins seed 42."),
+            ("codex",  "ack",
+             "Looks right — retries fire 3× with jitter, surfaces 503 to "
+             "caller after budget exhausted. Approving."),
+        ],
+    },
+]
+# _verdict() renders "approved" as a green check; any other "outcome" value is
+# shown as "changes requested". "reason" is printed on the line below.
+_FIXTURE_VERDICT = {
+    "outcome": "approved",
+    "reason":  "2 rounds · 5 turns · all blocks resolved",
+}
+# Path printed by _footer() after the "artifact" label.
+_FIXTURE_ARTIFACT = ".roll/peer/logs/20260519_213700_claude_codex.md"
+# (label, hint) pairs printed by _footer() as the numbered NEXT list.
+_FIXTURE_NEXT = [
+    ("Continue execution",   "claude resumes work on US-AUTH-014"),
+    ("Inspect log",          "open the artifact above to replay the transcript"),
+]
+# ════════════════════════════════════════════════════════════════════════════
+# Render primitives
+# ════════════════════════════════════════════════════════════════════════════
+def _divider(char: str = "─") -> None:
+    print(c("dim", char * min(COLS, 80)))
+def _eyebrow(trigger: str) -> None:
+    left = ("  " + c("blue", "PEER", bold=True) +
+            c("dim", "  ·  ") +
+            c("dim", "roll peer · cross-agent review"))
+    right = c("purple", trigger, bold=True) + "  "
+    print(row(left, right))
+def _subject(subj: dict) -> None:
+    story = c("blue", subj["story"], bold=True)
+    title = c("fg",   subj["title"])
+    pr    = c("amber", subj["pr"], bold=True)
+    diff  = c("muted", subj["diff_stat"])
+    line  = "  " + story + c("muted", "  ·  ") + title
+    print(line)
+    print("  " + pr + c("muted", "   ") + diff)
+def _pair_overview(subj: dict) -> None:
+    p_name = subj["proposer"]
+    r_name = subj["reviewer"]
+    p_c = _agent_c(p_name)
+    r_c = _agent_c(r_name)
+    proposer = c("dim", "proposer ") + c(p_c, p_name, bold=True)
+    reviewer = c("dim", "reviewer ") + c(r_c, r_name, bold=True)
+    sep = c("muted", "  →  ")
+    print("  " + proposer + sep + reviewer)
+def _round_header(n: int, hint: str) -> None:
+    label = c("pink", f"ROUND {n}", bold=True)
+    print()
+    print("  " + label + c("muted", "  ·  ") + c("dim", hint))
+def _weight_chip(weight: str) -> str:
+    glyph, color, label = _WEIGHTS.get(weight, ("·", "muted", weight))
+    return c(color, glyph + " " + label, bold=(weight in ("ack", "block")))
+def _turn(agent: str, weight: str, body: str) -> None:
+    agent_c = _agent_c(agent)
+    name = c(agent_c, agent, bold=True)
+    chip = _weight_chip(weight)
+    # First line: agent  chip
+    print("    " + name + c("muted", "  ") + chip)
+    # Body wrapped with hanging indent so long sentences stay readable.
+    _print_wrapped(body, indent=6, width=min(COLS, 80))
+def _print_wrapped(s: str, *, indent: int, width: int) -> None:
+    avail = max(20, width - indent)
+    line = ""
+    pad = " " * indent
+    for word in s.split():
+        if line and len(line) + 1 + len(word) > avail:
+            print(pad + c("dim", line))
+            line = word
+        else:
+            line = (line + " " + word) if line else word
+    if line:
+        print(pad + c("dim", line))
+def _verdict(v: dict) -> None:
+    outcome = v["outcome"]
+    if outcome == "approved":
+        glyph, color, label = "✓", "green", "approved"
+    else:
+        glyph, color, label = "✗", "red", "changes requested"
+    head = c(color, f"{glyph} VERDICT", bold=True) + c("muted", "  ·  ") + c(color, label)
+    print()
+    print("  " + head)
+    print("  " + c("dim", v["reason"]))
+def _footer(artifact: str, next_steps: list) -> None:
+    print()
+    print("  " + c("dim", "artifact ") + c("muted", artifact))
+    print()
+    print("  " + c("pink", "NEXT", bold=True) + c("dim", "  ·  下一步"))
+    for i, (label, hint) in enumerate(next_steps, start=1):
+        num = c("dim", f"  {i}.")
+        print(f"{num} {c('fg', label, bold=True)}")
+        print("     " + c("dim", hint))
+    _divider("═")
+# ════════════════════════════════════════════════════════════════════════════
+# Top-level render
+# ════════════════════════════════════════════════════════════════════════════
+def render_fixture() -> None:
+    _eyebrow(_FIXTURE_SUBJECT["trigger"])
+    _divider()
+    print()
+    _subject(_FIXTURE_SUBJECT)
+    print()
+    _pair_overview(_FIXTURE_SUBJECT)
+    for rd in _FIXTURE_ROUNDS:
+        _round_header(rd["n"], rd["hint"])
+        for agent, weight, body in rd["turns"]:
+            _turn(agent, weight, body)
+    _verdict(_FIXTURE_VERDICT)
+    _footer(_FIXTURE_ARTIFACT, _FIXTURE_NEXT)
+# ════════════════════════════════════════════════════════════════════════════
+# Entry point
+# ════════════════════════════════════════════════════════════════════════════
+def main() -> None:
+    ap = argparse.ArgumentParser(add_help=False)
+    ap.add_argument("--no-color", dest="no_color", action="store_true")
+    ap.add_argument("--en",       action="store_true")
+    ap.add_argument("--zh",       action="store_true")
+    args, _ = ap.parse_known_args()
+    if args.no_color or os.environ.get("NO_COLOR") or not sys.stdout.isatty():
+        roll_render.USE_COLOR = False
+    # FIX-076: this standalone entrypoint only knows how to render the fixture
+    # transcript (for UI tests). Real peer review is orchestrated by bin/roll
+    # and never invokes this main(). Require an explicit opt-in so a stray
+    # `python3 lib/roll-peer.py` invocation can't masquerade as live output.
+    if not os.environ.get("ROLL_RENDER_FIXTURE"):
+        print("Error: lib/roll-peer.py only renders fixture data; "
+              "set ROLL_RENDER_FIXTURE=1 to use it (test-only).",
+              file=sys.stderr)
+        sys.exit(2)
+    render_fixture()
+if __name__ == "__main__":
+    main()

package/lib/roll-plan-validate.py ADDED Viewed

@@ -0,0 +1,386 @@
+#!/usr/bin/env python3
+"""
+US-ONBOARD-007: onboard-plan.yaml validator.
+Validates that a plan file produced by $roll-onboard is structurally complete,
+fresh (generated_at within 24h), and version-compatible with the consuming
+bin/roll. Called by `roll init --apply` before any side effects.
+Usage:
+    python3 roll-plan-validate.py <path-to-plan.yaml>
+Exit codes:
+    0   plan is valid
+    1   schema / required field error
+    2   plan is stale (generated_at > 24h)
+    3   plan version not supported
+    4   plan file unreadable / not YAML
+Error messages are written to stderr in both English and Chinese.
+Schema (v1):
+    version: 1
+    generated_at: ISO 8601 timestamp (UTC or with tz offset)
+    project_understanding:
+      type: backend-service | frontend-only | fullstack | cli
+      description: str
+      domains: [str]
+      key_modules: [str]
+    scope:
+      approved: [str]  # subset of {backlog, features, domain, briefs}
+      declined: [str]
+    include_existing: [str]
+    privacy:
+      gitignore_dot_roll: bool
+    sync_targets: [str]
+    enable_loop: bool
+US-ONBOARD-016 — Phase 2 analysis sections (all OPTIONAL, pure-incremental,
+backward compatible; an old plan that omits them still validates). When
+present, each is validated for structure:
+    domain_model:
+      bounded_contexts:
+        - name: str
+          aggregates: [str]
+          ubiquitous_language: [str]   # or [{term, definition}]
+    tech_analysis:
+      stack: [str]
+      dependencies: [str]
+      architecture_notes: [str]
+      risks:
+        - description: str
+          severity: LOW | MEDIUM | HIGH   # optional
+          evidence: detected | inferred   # optional
+    test_assessment:
+      current_layers:     [<claim>]
+      gaps:               [<claim>]
+      recommended_actions:[<claim>]
+ANTI-HALLUCINATION HARD CONSTRAINT (the heart of US-ONBOARD-016):
+Every test_assessment claim MUST be a mapping carrying an `evidence` key whose
+value is exactly `detected` or `inferred`. A schema validator cannot re-run the
+filesystem scan, so the data contract is the lever: free-floating untagged
+strings (e.g. a hallucinated "needs more E2E tests") are REJECTED. When a scan
+finds nothing the skill must still emit a tagged claim such as
+`{claim: "none detected", evidence: detected}` — never invent filler. A scan
+that ran and returned zero matches is a genuine detection, so "none detected"
+carries `evidence: detected` (not a third enum value).
+"""
+from __future__ import annotations
+import sys
+from datetime import datetime, timezone, timedelta
+from pathlib import Path
+try:
+    import yaml  # PyYAML
+except ImportError:
+    print(
+        "[plan-validate] PyYAML not installed. Install with: pip install pyyaml\n"
+        "[plan-validate] PyYAML 未安装，请运行: pip install pyyaml",
+        file=sys.stderr,
+    )
+    sys.exit(4)
+# Plan schema versions accepted by validate_version(); any other value makes
+# main() exit with code 3.
+SUPPORTED_VERSIONS = {1}
+# Oldest generated_at, in hours, that validate_freshness() still accepts.
+MAX_AGE_HOURS = 24
+# Allowed values of project_understanding.type.
+VALID_PROJECT_TYPES = {"backend-service", "frontend-only", "fullstack", "cli"}
+# Allowed entries of scope.approved.
+VALID_SCOPE_ITEMS = {"backlog", "features", "domain", "briefs"}
+# US-ONBOARD-016: anti-hallucination evidence tags. Every test_assessment claim
+# must carry one of these; risks[].evidence (when present) uses the same enum.
+VALID_EVIDENCE = {"detected", "inferred"}
+# test_assessment buckets whose entries are evidence-tagged claims.
+TEST_ASSESSMENT_CLAIM_KEYS = ("current_layers", "gaps", "recommended_actions")
+# Optional severity enum for tech_analysis.risks[].severity.
+VALID_RISK_SEVERITY = {"LOW", "MEDIUM", "HIGH"}
+def err(msg_en: str, msg_zh: str = "") -> None:
+    """Print bilingual error to stderr."""
+    print(f"[plan-validate] {msg_en}", file=sys.stderr)
+    if msg_zh:
+        print(f"[plan-validate] {msg_zh}", file=sys.stderr)
+def validate_required_top_level(plan: dict) -> list[str]:
+    """Return list of missing/invalid top-level fields."""
+    errors = []
+    required = ["version", "generated_at", "project_understanding", "scope", "privacy"]
+    for key in required:
+        if key not in plan:
+            errors.append(f"missing required field: {key}")
+    return errors
+def validate_version(plan: dict) -> list[str]:
+    v = plan.get("version")
+    if not isinstance(v, int):
+        return [f"version must be int, got {type(v).__name__}"]
+    if v not in SUPPORTED_VERSIONS:
+        return [f"version {v} not supported (supported: {sorted(SUPPORTED_VERSIONS)})"]
+    return []
+def validate_freshness(plan: dict) -> tuple[list[str], bool]:
+    """Returns (errors, is_stale). Stale uses exit code 2."""
+    raw = plan.get("generated_at")
+    if not raw:
+        return ["generated_at missing"], False
+    try:
+        if isinstance(raw, datetime):
+            ts = raw
+        else:
+            ts = datetime.fromisoformat(str(raw).replace("Z", "+00:00"))
+    except (ValueError, TypeError) as e:
+        return [f"generated_at not a valid ISO 8601 timestamp: {e}"], False
+    if ts.tzinfo is None:
+        ts = ts.replace(tzinfo=timezone.utc)
+    now = datetime.now(timezone.utc)
+    age = now - ts
+    if age > timedelta(hours=MAX_AGE_HOURS):
+        return [
+            f"plan is stale: generated {age.total_seconds() / 3600:.1f}h ago "
+            f"(max allowed: {MAX_AGE_HOURS}h)"
+        ], True
+    if age < timedelta(seconds=-300):
+        # Plan in future >5 min — clock skew or fabricated timestamp
+        return [
+            f"plan timestamp is in the future (clock skew?): generated_at={ts.isoformat()}"
+        ], False
+    return [], False
+def validate_project_understanding(plan: dict) -> list[str]:
+    errors = []
+    pu = plan.get("project_understanding")
+    if not isinstance(pu, dict):
+        return ["project_understanding must be a mapping"]
+    t = pu.get("type")
+    if t is None:
+        errors.append("project_understanding.type missing")
+    elif t not in VALID_PROJECT_TYPES:
+        errors.append(
+            f"project_understanding.type='{t}' not in {sorted(VALID_PROJECT_TYPES)}"
+        )
+    if "description" not in pu:
+        errors.append("project_understanding.description missing")
+    return errors
+def validate_scope(plan: dict) -> list[str]:
+    errors = []
+    scope = plan.get("scope")
+    if not isinstance(scope, dict):
+        return ["scope must be a mapping"]
+    approved = scope.get("approved", [])
+    if not isinstance(approved, list):
+        errors.append("scope.approved must be a list")
+    else:
+        for item in approved:
+            if item not in VALID_SCOPE_ITEMS:
+                errors.append(
+                    f"scope.approved contains unknown item '{item}' "
+                    f"(valid: {sorted(VALID_SCOPE_ITEMS)})"
+                )
+    return errors
+def validate_privacy(plan: dict) -> list[str]:
+    errors = []
+    privacy = plan.get("privacy")
+    if not isinstance(privacy, dict):
+        return ["privacy must be a mapping"]
+    g = privacy.get("gitignore_dot_roll")
+    if not isinstance(g, bool):
+        errors.append(
+            f"privacy.gitignore_dot_roll must be bool, got {type(g).__name__}"
+        )
+    return errors
+def validate_domain_model(plan: dict) -> list[str]:
+    """US-ONBOARD-016: validate the optional domain_model section.
+    Absent → no errors (pure-incremental). When present it must be a mapping
+    with a bounded_contexts list; each context is a mapping with a name and
+    list-typed aggregates / ubiquitous_language.
+    """
+    errors: list[str] = []
+    if "domain_model" not in plan:
+        return errors
+    dm = plan.get("domain_model")
+    if not isinstance(dm, dict):
+        return ["domain_model must be a mapping"]
+    contexts = dm.get("bounded_contexts")
+    if contexts is None:
+        return ["domain_model.bounded_contexts missing"]
+    if not isinstance(contexts, list):
+        return ["domain_model.bounded_contexts must be a list"]
+    for i, ctx in enumerate(contexts):
+        where = f"domain_model.bounded_contexts[{i}]"
+        if not isinstance(ctx, dict):
+            errors.append(f"{where} must be a mapping")
+            continue
+        if not ctx.get("name"):
+            errors.append(f"{where}.name missing or empty")
+        for list_key in ("aggregates", "ubiquitous_language"):
+            if list_key in ctx and not isinstance(ctx[list_key], list):
+                errors.append(f"{where}.{list_key} must be a list")
+    return errors
+def _validate_evidence_value(value, where: str) -> list[str]:
+    """Shared check: a value must be exactly one of VALID_EVIDENCE."""
+    if value is None:
+        return [f"{where}.evidence missing (must be one of {sorted(VALID_EVIDENCE)})"]
+    if value not in VALID_EVIDENCE:
+        return [
+            f"{where}.evidence='{value}' invalid "
+            f"(must be one of {sorted(VALID_EVIDENCE)})"
+        ]
+    return []
+def validate_tech_analysis(plan: dict) -> list[str]:
+    """US-ONBOARD-016: validate the optional tech_analysis section.
+    Absent → no errors. When present: stack / dependencies / architecture_notes
+    (if given) must be lists; risks (if given) must be a list of mappings each
+    with a description, an optional severity in VALID_RISK_SEVERITY, and an
+    optional evidence tag in VALID_EVIDENCE.
+    """
+    errors: list[str] = []
+    if "tech_analysis" not in plan:
+        return errors
+    ta = plan.get("tech_analysis")
+    if not isinstance(ta, dict):
+        return ["tech_analysis must be a mapping"]
+    for list_key in ("stack", "dependencies", "architecture_notes"):
+        if list_key in ta and not isinstance(ta[list_key], list):
+            errors.append(f"tech_analysis.{list_key} must be a list")
+    if "risks" in ta:
+        risks = ta["risks"]
+        if not isinstance(risks, list):
+            errors.append("tech_analysis.risks must be a list")
+        else:
+            for i, risk in enumerate(risks):
+                where = f"tech_analysis.risks[{i}]"
+                if not isinstance(risk, dict):
+                    errors.append(f"{where} must be a mapping")
+                    continue
+                if not risk.get("description"):
+                    errors.append(f"{where}.description missing or empty")
+                sev = risk.get("severity")
+                if sev is not None and sev not in VALID_RISK_SEVERITY:
+                    errors.append(
+                        f"{where}.severity='{sev}' invalid "
+                        f"(must be one of {sorted(VALID_RISK_SEVERITY)})"
+                    )
+                if "evidence" in risk:
+                    errors += _validate_evidence_value(risk["evidence"], where)
+    return errors
+def validate_test_assessment(plan: dict) -> list[str]:
+    """US-ONBOARD-016 anti-hallucination HARD constraint.
+    Absent → no errors. When present, every entry in current_layers / gaps /
+    recommended_actions MUST be a mapping carrying an `evidence` tag of exactly
+    `detected` or `inferred`. This is the mechanical lever: untagged free-text
+    claims (hallucinated filler) are rejected. An empty bucket is allowed — that
+    is how "the section ran but had nothing in this dimension" is expressed; the
+    skill represents a zero-result scan as a tagged `{claim: "none detected",
+    evidence: detected}` entry rather than inventing a recommendation.
+    """
+    errors: list[str] = []
+    if "test_assessment" not in plan:
+        return errors
+    ta = plan.get("test_assessment")
+    if not isinstance(ta, dict):
+        return ["test_assessment must be a mapping"]
+    for key in TEST_ASSESSMENT_CLAIM_KEYS:
+        if key not in ta:
+            continue
+        claims = ta[key]
+        if not isinstance(claims, list):
+            errors.append(f"test_assessment.{key} must be a list")
+            continue
+        for i, claim in enumerate(claims):
+            where = f"test_assessment.{key}[{i}]"
+            if not isinstance(claim, dict):
+                errors.append(
+                    f"{where} must be a mapping carrying an 'evidence' tag "
+                    f"(got {type(claim).__name__}); untagged claims are rejected "
+                    f"to block unverifiable filler"
+                )
+                continue
+            errors += _validate_evidence_value(claim.get("evidence"), where)
+    return errors
+def main(argv: list[str]) -> int:
+    if len(argv) < 2:
+        err("usage: roll-plan-validate.py <plan.yaml>", "用法: roll-plan-validate.py <plan.yaml>")
+        return 4
+    path = Path(argv[1])
+    if not path.is_file():
+        err(f"plan file not found: {path}", f"未找到 plan 文件：{path}")
+        return 4
+    try:
+        with path.open("r", encoding="utf-8") as f:
+            plan = yaml.safe_load(f)
+    except (yaml.YAMLError, OSError) as e:
+        err(f"failed to parse plan as YAML: {e}", "无法解析 plan YAML")
+        return 4
+    if not isinstance(plan, dict):
+        err("plan must be a top-level mapping", "plan 顶层必须是 mapping")
+        return 1
+    schema_errors: list[str] = []
+    schema_errors += validate_required_top_level(plan)
+    schema_errors += validate_version(plan)
+    schema_errors += validate_project_understanding(plan)
+    schema_errors += validate_scope(plan)
+    schema_errors += validate_privacy(plan)
+    # US-ONBOARD-016: optional Phase 2 analysis sections (validated only when
+    # present so old plans stay compatible).
+    schema_errors += validate_domain_model(plan)
+    schema_errors += validate_tech_analysis(plan)
+    schema_errors += validate_test_assessment(plan)
+    freshness_errors, is_stale = validate_freshness(plan)
+    # Version errors take precedence — if version is wrong, the rest of the
+    # validation may be unreliable.
+    version_errors = [e for e in schema_errors if e.startswith("version")]
+    if version_errors:
+        for e in version_errors:
+            err(e)
+        return 3
+    if is_stale:
+        for e in freshness_errors:
+            err(e, "plan 已过期，请重新运行 $roll-onboard 生成新 plan")
+        return 2
+    all_errors = [e for e in schema_errors if not e.startswith("version")] + [
+        e for e in freshness_errors if not is_stale
+    ]
+    if all_errors:
+        for e in all_errors:
+            err(e)
+        return 1
+    # Valid — silent success (bash caller treats exit 0 as OK).
+    return 0
+if __name__ == "__main__":
+    sys.exit(main(sys.argv))