npm - xp-gate - Versions diffs - 0.5.1 - Mend

xp-gate 0.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (90) hide show

package/adapter-common.sh +192 -0
package/adapters/cpp.sh +76 -0
package/adapters/dart.sh +41 -0
package/adapters/flutter.sh +41 -0
package/adapters/go.sh +59 -0
package/adapters/iac.sh +189 -0
package/adapters/java.sh +191 -0
package/adapters/kotlin.sh +77 -0
package/adapters/objectivec.sh +38 -0
package/adapters/powershell.sh +138 -0
package/adapters/python.sh +104 -0
package/adapters/shell.sh +55 -0
package/adapters/swift.sh +44 -0
package/adapters/typescript.sh +61 -0
package/bin/xp-gate.js +157 -0
package/hooks/adapter-common.sh +192 -0
package/hooks/pre-commit +1667 -0
package/hooks/pre-push +395 -0
package/lib/__tests__/detect-deps.test.js +209 -0
package/lib/__tests__/doctor.test.js +448 -0
package/lib/__tests__/download-skill.test.js +281 -0
package/lib/__tests__/init.test.js +327 -0
package/lib/__tests__/install-skill.test.js +326 -0
package/lib/__tests__/migrate.test.js +212 -0
package/lib/__tests__/rollback.test.js +183 -0
package/lib/__tests__/ui-detector.test.ts +200 -0
package/lib/__tests__/uninstall-skill.test.js +189 -0
package/lib/__tests__/uninstall.test.js +589 -0
package/lib/__tests__/update-skill.test.js +276 -0
package/lib/detect-deps.js +157 -0
package/lib/doctor.js +370 -0
package/lib/download-skill.js +96 -0
package/lib/init.js +367 -0
package/lib/install-skill.js +184 -0
package/lib/migrate.js +120 -0
package/lib/rollback.js +78 -0
package/lib/ui-detector.ts +99 -0
package/lib/uninstall-skill.js +69 -0
package/lib/uninstall.js +401 -0
package/lib/update-skill.js +90 -0
package/package.json +39 -0
package/plugins/claude-code/.claude-plugin/plugin.json +21 -0
package/plugins/claude-code/bin/delphi-review-guard.sh +68 -0
package/plugins/claude-code/bin/xp-gate-check +47 -0
package/plugins/claude-code/hooks/hooks.json +37 -0
package/skills/delphi-review/.delphi-config.json.example +45 -0
package/skills/delphi-review/AGENTS.md +54 -0
package/skills/delphi-review/INSTALL.md +152 -0
package/skills/delphi-review/SKILL.md +371 -0
package/skills/delphi-review/evals/evals.json +82 -0
package/skills/delphi-review/opencode.json.delphi.example +56 -0
package/skills/delphi-review/references/code-walkthrough.md +486 -0
package/skills/ralph-loop/SKILL.md +330 -0
package/skills/ralph-loop/evals/evals.json +311 -0
package/skills/ralph-loop/evolution-history.json +59 -0
package/skills/ralph-loop/evolution-log.md +16 -0
package/skills/ralph-loop/references/components/memory.md +55 -0
package/skills/ralph-loop/references/components/middleware.md +54 -0
package/skills/ralph-loop/references/components/skill-invocations.md +39 -0
package/skills/ralph-loop/references/components/system-prompt.md +24 -0
package/skills/ralph-loop/references/components/tool-descriptions.md +32 -0
package/skills/ralph-loop/references/phase-2-build-ralph.md +89 -0
package/skills/ralph-loop/templates/progress-log.md +36 -0
package/skills/sprint-flow/SKILL.md +600 -0
package/skills/sprint-flow/evals/evals.json +78 -0
package/skills/sprint-flow/evolution-history.json +39 -0
package/skills/sprint-flow/evolution-log.md +23 -0
package/skills/sprint-flow/references/components/memory.md +87 -0
package/skills/sprint-flow/references/components/middleware.md +72 -0
package/skills/sprint-flow/references/components/skill-invocations.md +104 -0
package/skills/sprint-flow/references/components/system-prompt.md +27 -0
package/skills/sprint-flow/references/components/tool-descriptions.md +96 -0
package/skills/sprint-flow/references/phase-0-think.md +115 -0
package/skills/sprint-flow/references/phase-1-plan.md +178 -0
package/skills/sprint-flow/references/phase-2-build.md +198 -0
package/skills/sprint-flow/references/phase-3-review.md +213 -0
package/skills/sprint-flow/references/phase-4-uat.md +125 -0
package/skills/sprint-flow/references/phase-5-feedback.md +100 -0
package/skills/sprint-flow/references/phase-6-ship.md +193 -0
package/skills/sprint-flow/references/phase-7-land.md +140 -0
package/skills/sprint-flow/references/phase-8-cleanup.md +192 -0
package/skills/sprint-flow/templates/emergent-issues-template.md +120 -0
package/skills/sprint-flow/templates/pain-document-template.md +115 -0
package/skills/sprint-flow/templates/sprint-summary-template.md +120 -0
package/skills/test-specification-alignment/AGENTS.md +59 -0
package/skills/test-specification-alignment/SKILL.md +605 -0
package/skills/test-specification-alignment/evals/evals.json +75 -0
package/skills/test-specification-alignment/references/alignment-verification-algorithm.md +493 -0
package/skills/test-specification-alignment/references/phase2-constraint-enforcement.md +431 -0
package/skills/test-specification-alignment/references/specification-format.md +348 -0

package/skills/ralph-loop/SKILL.md ADDED Viewed

@@ -0,0 +1,330 @@
+---
+name: ralph-loop
+description: >
+  Default Phase 2 BUILD mode for Sprint-Flow. Processes ONE REQ at a time from
+  specification.yaml with clean isolated context per subagent dispatch, persists
+  memory via git history + classified learnings, runs full regression tests on each
+  REQ, and only commits on verification pass. Designed to reduce token consumption
+  from linear context accumulation to per-REQ fixed budgets (40-67% savings).
+  This token-constrained mode is the default — every Phase 2 BUILD uses it automatically.
+  Use `--mode parallel` to opt into the legacy all-at-once mode if needed.
+maturity: stable
+---
+# Ralph Loop — Default REQ-Level Iterative Build
+## 核心原则
+| 原则 | 说明 |
+|------|------|
+| **每次迭代 = 全新上下文** | 每个 REQ dispatch 独立 subagent，不累积历史对话 |
+| **一次只处理一个 REQ** | 小粒度执行，避免大任务吞掉整个 context window |
+| **失败不提交** | 验证不通过的代码不 commit，保持代码库绿色 |
+| **全量回归测试** | 每个 REQ 完成后运行 ALL tests（不只是 @test REQ-XXX），检测跨 REQ 回归 |
+| **Git 持久记忆** | 代码变更 + checkpoint 天然持久，不需要在 prompt 里反复解释 |
+| **浓缩型分类学习** | permanent（架构级）+ contextual（最近 3 条）双层 learnings |
+| **AGENTS.md 统一更新** | orchestrator 统一写，subagent 不直接修改 — 无竞态 |
+## 作为 Phase 2 默认行为
+Ralph Loop 是 Sprint-Flow **Phase 2 BUILD 的默认模式**：
+```
+Sprint-Flow Phase 2 (默认):
+  ralph-loop → 逐 REQ 迭代 → 每次干净上下文 → 全量回归 → token 节约 40-67%
+Sprint-Flow Phase 2 --mode parallel (可选):
+  dispatching-parallel-agents → 所有需求一次性并行 → 上下文线性增长
+```
+**为什么它是默认**: 每个 Sprint 都受 token limit 约束。累积模式在 3+ REQs 时限流频率显著上升。ralph-loop 确保每个 REQ 的 token 预算独立可控。
+**切换回并行模式**: `/sprint-flow "需求" --mode parallel`
+---
+## 完整流程
+```
+Phase 0: 准备 → 读取 specification.yaml → 构建依赖图 → 拓扑排序
+    │
+    ▼
+Phase 1: 迭代循环 (max_iterations=15 默认)
+    │
+    ├── 取下一个 READY REQ（依赖已满足，优先级最高）
+    │
+    ├── 测试基础设施检查
+    │     1. 检查 test-utils.ts（或等效文件）是否存在
+    │     2. 检查必需接口契约：createTestApp()、withTestDb()
+    │     3. 不存在或接口缺失 → dispatch "生成测试基础设施" subagent
+    │        retry max 2 → 仍失败 → BLOCK 或 fallback inline 生成
+    │     4. 与业务代码合并为同一 commit
+    │
+    ├── 注入测试基础设施摘要到业务代码 subagent context：
+    │     【已有测试基础设施】test-utils.ts 已存在，导出以下 API：
+    │     - createTestApp(): 创建应用实例 + 真实测试依赖
+    │     - withTestDb(): 测试数据库生命周期（seed + cleanup）
+    │     必须 import 这些函数，禁止重新手搓同名 helper。
+    │
+    ├── Dispatch 独立 subagent
+    │     使用: task(category="unspecified-high", load_skills=["test-driven-development"], timeout=300)
+    │     Context:
+    │       - 当前 REQ + 所有 AC
+    │       - permanent learnings（架构决策，始终传入）
+    │       - contextual learnings（最近 3 条）
+    │       - retry-failures（仅 retry 时注入失败原因）
+    │       - AGENTS.md（项目约定）
+    │       - git log --oneline -5
+    │       - 【TDD 铁律】RED → GREEN → REFACTOR。任何模块必须先写测试再写实现。
+    │       - 【Mock 边界】（覆盖 TDD skill 默认策略）
+    │           ✅ MOCK: 外部 HTTP API、LLM 调用、第三方平台（钉钉/微信）
+    │           ✅ MOCK: 时间/随机数/UUID（注入依赖）
+    │           ❌ NO MOCK: 数据库操作（用真实测试库或 sqlite-in-memory）
+    │           ❌ NO MOCK: HTTP 路由（用 app.inject() 真实注入）
+    │           ❌ NO MOCK: 模板引擎（用真实 Nunjucks/Jinja 渲染）
+    │           ❌ NO MOCK: 纯业务逻辑（用真实输入输出）
+    │       - 【Mock 密度上限】测试中 mock/spy/fn 引用行数 > 总测试行数 30% 时，
+    │           必须添加 // @mock-justified: <至少10字符理由> 注释说明为何无法用集成测试。
+    │
+    ├── Subagent 完成 → 三层验证
+    │     ├── L1: typecheck + lint → FAIL? → retry
+    │     ├── L1b: 测试先行比率 ≥ 40% → FAIL? → retry
+    │     ├── L2: 全量测试（ALL tests）→ FAIL? → retry
+    │     └── L3: coverage ≥ 80% → FAIL? → retry
+    │
+    ├── PASS → git commit → 标记 done
+    │        → 写 learnings（分类为 permanent/contextual）
+    │        → 调用 `gstack/learn` 及时总结经验教训
+    │        → orchestrator 统一更新 AGENTS.md
+    │        → 原子写 checkpoint
+    │        → 继续下一个 READY REQ
+    │
+    └── FAIL → retry（max 3，注入上次错误摘要）
+         └── 仍失败 → BLOCK → 依赖级联 → 用户决策
+             │
+             ▼
+终止条件:
+  - 所有 REQ done → COMPLETE → 返回 Phase 3 REVIEW
+  - max_iterations 达到 → PARTIAL → 保留 done commits
+  - BLOCK → WAIT_USER → skip/manual/stop/rollback
+```
+---
+## 输入格式 (specification.yaml)
+```yaml
+specification:
+  requirements:
+    - id: REQ-001
+      description: "创建 User Model 和数据库迁移"
+      acceptance_criteria:
+        - id: AC-001-01
+          criteria: "User model 包含 email (unique), password_hash, created_at"
+        - id: AC-001-02
+          criteria: "Migration 成功执行"
+      priority: 1
+      status: pending
+    - id: REQ-002
+      description: "实现密码加密工具函数"
+      depends_on: [REQ-001]
+      acceptance_criteria:
+        - id: AC-002-01
+          criteria: "hashPassword() 返回 bcrypt hash"
+        - id: AC-002-02
+          criteria: "verifyPassword() 正确比对明文和 hash"
+      priority: 2
+      status: pending
+```
+**每个 REQ 自动作为一个迭代单元**，其所有 `AC-XXX-XX` 作为验收标准。
+---
+## 依赖排序
+1. **拓扑排序**：对所有 pending REQs 构建依赖图（基于 `depends_on`）
+2. **Kahn's algorithm**：执行拓扑排序，检测循环依赖
+3. **同层按 priority**：同一拓扑层内的 REQ 按 `priority` 升序排列
+4. **循环依赖**：→ BLOCK + 报告循环链（`REQ-A → REQ-B → REQ-C → REQ-A`）
+---
+## Learnings 分类
+| 分类 | 内容 | 传递策略 | 升级条件 |
+|------|------|---------|---------|
+| **permanent** | 架构决策、接口约定、全局约定 | 始终传入（每个 REQ context）| (1) 被 ≥2 个 REQ 引用<br>(2) 涉及模块接口/数据结构<br>(3) 用户手动标记 |
+| **contextual** | 实现细节、一次性 gotchas、临时技巧 | 滑动窗口（最近 3 条） | 满足 permanent 条件自动升级，否则 3 条后过期 |
+**自动升级示例**：
+- `"migration files must be in src/migrations/"` → 第 2 个 REQ 也引用 → 升级为 permanent
+- `"use bcrypt 不要使用 md5"` → 安全规范 → 自动 permanent
+- `"第 42 行有个 off-by-one"` → 仅影响单个 REQ → 保持 contextual
+---
+## AGENTS.md 更新机制
+**由 orchestrator 统一执行，不由 subagent 各自写**：
+1. subagent 完成后输出 `agentmd_addition` 字段
+2. orchestrator 读取当前 AGENTS.md
+3. orchestrator append `## ralph-loop: [REQ-XXX title] (auto-added)` 段
+4. orchestrator 将 AGENTS.md 变更纳入 git commit
+当 AGENTS.md > 500 行时触发归档：保留最近 6 个月 entries，更早的归档到 `.sprint-state/ralph-loop/agents-archive/`。
+---
+## 三层验证 Gate
+每个 REQ 完成后执行：
+| 层级 | 范围 | 工具 | 失败行为 |
+|------|------|------|---------|
+| L1 | 变更文件 | `lsp_diagnostics` + linter | retry |
+| L1b | 测试先行比率 | 新增测试行数 / (新增测试 + 新增实现) ≥ 40% | retry |
+| L2 | **全量测试**（不只是 @test REQ-XXX） | 项目测试框架 | retry |
+| L3 | 整体覆盖率 ≥ 80% | coverage report | retry |
+---
+## 状态机
+```
+PENDING → test_infra_check → [infra needed?] → test_infra_dispatch
+                                       │                    │
+                                       │ FAIL               │ pass
+                                       │ (max 2 retry)      │
+                                       ▼                    ▼
+                                   BLOCK/fallback      test_infra_ready → in_progress → done (commit)
+                                       │                  │
+                                       │  depend not met  │ all done → COMPLETE
+                                       │  ┌───────────────┘
+                                       ▼  │
+                                    PENDING (waiting)
+                                       │
+                                       │  fail
+                                       ▼
+                                    RETRY (n<3, 注入上次错误)
+                                       │
+                                       │  n≥3
+                                       ▼
+                                    BLOCKED → 用户决策 (skip/manual/stop/rollback)
+                                       │
+                                       │  依赖上游 blocked → 自动 blocked(含依赖链)
+                                       ▼
+                                    auto-blocked REQs
+```
+**REQ 状态转换规则**：
+| 从 | 到 | 触发 |
+|---|---|---|
+| pending | test_infra_check | 拓扑排序轮到 + 依赖已满足 |
+| test_infra_check | test_infra_dispatch | test-utils.ts 不存在或接口缺失 |
+| test_infra_check | in_progress | test-utils.ts 已存在且接口完整 |
+| test_infra_dispatch | test_infra_ready | 测试基础设施生成完成 |
+| test_infra_dispatch | blocked | retry max 2 仍失败 |
+| test_infra_dispatch | test_infra_ready | fallback inline 生成成功（记录 warning）|
+| test_infra_ready | in_progress | 测试基础设施就绪，dispatch 业务代码 subagent |
+| in_progress | done | L1+L1b+L2+L3 全部通过 |
+| in_progress | retry | 验证失败, n<3 |
+| retry | done | 验证通过 |
+| retry | blocked | n≥3 仍失败 |
+| pending | blocked(auto) | 上游依赖 blocked |
+| blocked | skipped | 用户选择跳过 |
+| blocked | done | 用户手动修复后确认 |
+| 任意 | partial | 用户选择停止 |
+| 任意 | rollback | 用户选择回滚 (git reset) |
+**崩溃恢复**：启动时检测 checkpoint → 跳过已 done REQs → 从下一个 pending 继续。已 commit 的 REQ 不需要重做。
+---
+## Retry 策略
+| 轮次 | 注入上下文 | 超时 |
+|------|-----------|------|
+| 第 1 次 | 标准上下文 | 300s |
+| 第 2 次 | 标准 + 上次失败摘要 (linter+tests) | 300s |
+| 第 3 次 | 标准 + 前两次失败摘要 + "请使用不同实现方式" | 300s |
+---
+## 与 Sprint-Flow 集成
+**默认启用**：Phase 2 BUILD 自动使用 ralph-loop 模式。
+```bash
+/sprint-flow "开发用户登录"
+# → Phase 2 自动使用 ralph-loop 模式
+/sprint-flow "开发小改动" --mode parallel
+# → 可选：切换回旧有的并行模式
+```
+Phase 0, 1, 3-8 行为完全不变.
+**与 test-specification-alignment 完全兼容**：
+- Test alignment 仍解析 specification.yaml (REQ/AC 不变)
+- 仍查找 `@test REQ-XXX` / `@covers AC-XXX-XX`
+- PARTIAL 状态下仅检查已 done REQs
+---
+## Output Format (MANDATORY)
+```json
+{
+  "skill_name": "ralph-loop",
+  "version": "2.0.0",
+  "specification_source": "specification.yaml",
+  "topology_order": ["REQ-001", "REQ-002", "REQ-003"],
+  "requirements": { "total": 6, "done": 4, "pending": 1, "blocked": 1, "skipped": 0 },
+  "current_requirement": { "id": "REQ-005", "status": "done", "retry_count": 0 },
+  "learnings": {
+    "permanent": ["Auth middleware must run before validation"],
+    "contextual": ["migration files must be in src/migrations/"]
+  },
+  "status": "running",
+  "checkpoint_at": "2026-05-08T10:30:00Z"
+}
+```
+**Eval assertions**: `done + pending + blocked + skipped == total`, `iteration <= max_iterations`.
+---
+## Anti-Patterns
+| ❌ 错误 | ✅ 正确 |
+|---|---|
+| 一个 REQ 包含所有需求 | 每个 REQ ≤ 1 context window |
+| 验证失败仍 commit | 不提交 |
+| 只跑 @test REQ-XXX | 全量回归测试 |
+| priority 排序忽略 depends_on | 拓扑排序 + 同层 priority |
+| retry 不注入失败原因 | 每次 retry 注入上次错误 |
+| subagent 各自写 AGENTS.md | orchestrator 统一更新 |
+| progress.log 写长篇大论 | 3-5 行结构化摘要 |
+---
+## Token Savings
+| REQ 数量 | 并行模式（`--mode parallel`，上下文累积） | ralph-loop | 节约 |
+|---------|---------|-----------|------|
+| 3 | ~15k | ~9k | 40% |
+| 5 | ~50k | ~25k | 50% |
+| 10 | ~150k | ~50k | 67% |
+> 原理: 并行模式 = sum(i × cost_i)（上下文随 REQ 数量线性累积）, ralph-loop = sum(cost_i)（每个 REQ 独立固定预算）
+---
+## References
+- [Design Doc: ralph-loop v3.0](docs/ralph-loop-design.md) — 完整设计文档 + Delphi 评审记录
+- [Phase 2 Integration](references/phase-2-build-ralph.md) — Sprint-Flow 集成细节
+- [Progress Log Template](templates/progress-log.md)

package/skills/ralph-loop/evals/evals.json ADDED Viewed

@@ -0,0 +1,311 @@
+[
+  {
+    "id": "ralph-001",
+    "name": "specification.yaml 作为输入源验证",
+    "description": "验证 ralph-loop 使用 specification.yaml 中的 REQ 作为迭代单元，而非 stories.json",
+    "input": {
+      "specification": {
+        "requirements": [
+          { "id": "REQ-001", "description": "创建 User Model", "acceptance_criteria": [{ "id": "AC-001-01", "criteria": "email unique" }], "status": "pending" },
+          { "id": "REQ-002", "description": "实现密码加密", "depends_on": ["REQ-001"], "status": "pending" }
+        ]
+      }
+    },
+    "expected": {
+      "input_source": "specification.yaml",
+      "iteration_units": ["REQ-001", "REQ-002"],
+      "no_stories_json": true
+    }
+  },
+  {
+    "id": "ralph-002",
+    "name": "拓扑排序 + 依赖顺序",
+    "description": "验证 REQ 按 depends_on 拓扑排序，同层按 priority 升序",
+    "input": {
+      "requirements": [
+        { "id": "REQ-003", "depends_on": ["REQ-002"], "priority": 3 },
+        { "id": "REQ-001", "depends_on": [], "priority": 1 },
+        { "id": "REQ-002", "depends_on": ["REQ-001"], "priority": 2 }
+      ]
+    },
+    "expected": {
+      "sorted_order": ["REQ-001", "REQ-002", "REQ-003"],
+      "algorithm": "Kahn's topological sort"
+    }
+  },
+  {
+    "id": "ralph-003",
+    "name": "循环依赖检测",
+    "description": "REQ 存在循环依赖时 → BLOCK + 报告循环链",
+    "input": {
+      "requirements": [
+        { "id": "REQ-001", "depends_on": ["REQ-002"] },
+        { "id": "REQ-002", "depends_on": ["REQ-003"] },
+        { "id": "REQ-003", "depends_on": ["REQ-001"] }
+      ]
+    },
+    "expected": {
+      "status": "blocked",
+      "cycle_detected": true,
+      "cycle_chain": "REQ-001 → REQ-002 → REQ-003 → REQ-001"
+    }
+  },
+  {
+    "id": "ralph-004",
+    "name": "Learnings 双层分类 — permanent 自动升级",
+    "description": "被 ≥2 个 REQ 引用的 learnings 自动升级为 permanent",
+    "input": {
+      "learnings": [
+        { "id": 1, "text": "migration files in src/migrations/", "ref_count": 1, "scope": "contextual" },
+        { "id": 2, "text": "Auth middleware before validation", "ref_count": 3, "scope": "interface" }
+      ]
+    },
+    "expected": {
+      "permanent": [
+        { "id": 2, "reason": "ref_count >= 2 OR scope == interface" }
+      ],
+      "contextual": [
+        { "id": 1, "reason": "ref_count < 2 AND scope != interface" }
+      ]
+    }
+  },
+  {
+    "id": "ralph-005",
+    "name": "Subagent 上下文隔离 — 不传递历史对话",
+    "description": "每个 subagent context 仅包含：当前 REQ + AC + permanent/contextual/retry-failures + AGENTS.md + git log -5",
+    "input": {
+      "current_req": "REQ-003",
+      "learnings": { "permanent": ["rule1"], "contextual": ["tip1", "tip2"] },
+      "agents_md": "project conventions",
+      "git_log": "commit1, commit2"
+    },
+    "expected": {
+      "context_sources": ["current_req", "acceptance_criteria", "permanent_learnings", "contextual_learnings", "agents_md", "git_log"],
+      "no_historical_dialogue": true,
+      "context_is_bounded": true
+    }
+  },
+  {
+    "id": "ralph-006",
+    "name": "三层验证 Gate — 失败不提交",
+    "description": "验证失败 → 不 commit → retry（L1: typecheck+lint, L2: all tests, L3: coverage）",
+    "input": {
+      "verification": { "l1": "fail", "l2": "skipped", "l3": "skipped" },
+      "retry_count": 0,
+      "max_retries": 3
+    },
+    "expected": {
+      "committed": false,
+      "retry": true,
+      "new_retry_count": 1,
+      "run_all_tests_on_next_try": true
+    }
+  },
+  {
+    "id": "ralph-007",
+    "name": "全量回归测试 — 不只跑 @test REQ-XXX",
+    "description": "REQ-003 完成后，L2 验证跑 ALL tests（包括 @test REQ-001, @test REQ-002），不只跑 @test REQ-003",
+    "input": {
+      "current_req": "REQ-003",
+      "available_tests": ["test_REQ-001", "test_REQ-002", "test_REQ-003"],
+      "test_scope": "all"
+    },
+    "expected": {
+      "tests_run": ["test_REQ-001", "test_REQ-002", "test_REQ-003"],
+      "scope": "full_regression",
+      "not_just_current_req": true
+    }
+  },
+  {
+    "id": "ralph-008",
+    "name": "Retry 失败上下文注入",
+    "description": "retry 时注入上次失败的错误摘要，不是重复相同上下文",
+    "input": {
+      "retry_count": 1,
+      "last_failure": { "linter": ["unused-var at line 42"], "tests": ["test_login fails: 401 != 200"] }
+    },
+    "expected": {
+      "context_extended": true,
+      "failure_summary": "Linter: unused-var at line 42. Tests: test_login fails",
+      "instruction": "请使用不同的实现方式"
+    }
+  },
+  {
+    "id": "ralph-009",
+    "name": "BLOCK 状态 — 依赖级联",
+    "description": "上游 REQ-001 blocked → REQ-002, REQ-003 自动 blocked(含依赖链)",
+    "input": {
+      "requirements": [
+        { "id": "REQ-001", "status": "blocked", "reason": "max_retry_exceeded" },
+        { "id": "REQ-002", "depends_on": ["REQ-001"], "status": "pending" },
+        { "id": "REQ-003", "depends_on": ["REQ-002"], "status": "pending" }
+      ]
+    },
+    "expected": {
+      "REQ-001_status": "blocked",
+      "REQ-002_status": "blocked(auto)",
+      "REQ-003_status": "blocked(auto)",
+      "dependency_chain": "REQ-001(blocked) → REQ-002 → REQ-003"
+    }
+  },
+  {
+    "id": "ralph-010",
+    "name": "PARTIAL 状态行为",
+    "description": "部分完成时：已 done commits 保留，Phase 3 仅检查 done REQs",
+    "input": {
+      "reqs_done": 4,
+      "reqs_total": 6,
+      "reqs_blocked": 1,
+      "reqs_skipped": 1,
+      "status": "partial"
+    },
+    "expected": {
+      "commits_retained": true,
+      "phase3_scope": "done_reqs_only",
+      "spec_alignment_scope": "partial",
+      "report": "4/6 REQ 完成，1 blocked，1 skipped"
+    }
+  },
+  {
+    "id": "ralph-011",
+    "name": "AGENTS.md 由 orchestrator 统一更新",
+    "description": "subagent 不直接写 AGENTS.md，输出 agentmd_addition 字段给 orchestrator",
+    "input": {
+      "subagent_output": { "agentmd_addition": "## ralph-loop: REQ-003 (api endpoint)\n- Patterns: REST CRUD" },
+      "orchestrator_action": "read_agents_md → append → commit"
+    },
+    "expected": {
+      "agents_md_updated_by": "orchestrator",
+      "no_subagent_direct_write": true,
+      "no_race_condition": true
+    }
+  },
+  {
+    "id": "ralph-012",
+    "name": "状态输出格式 — v3.0",
+    "description": "输出 JSON 必须符合 v3.0 state format",
+    "input": {
+      "output": {
+        "skill_name": "ralph-loop",
+        "version": "2.0.0",
+        "specification_source": "specification.yaml",
+        "requirements": { "total": 6, "done": 2, "pending": 3, "blocked": 1, "skipped": 0 },
+        "learnings": { "permanent": ["..."], "contextual": ["..."] },
+        "topology_order": ["REQ-001", "REQ-002", "REQ-003"]
+      }
+    },
+    "expected": {
+      "valid": true,
+      "assertions": [
+        "done + pending + blocked + skipped == total",
+        "learnings has permanent and contextual arrays",
+        "topology_order exists and is non-empty"
+      ]
+    }
+  },
+  {
+    "id": "ralph-013",
+    "name": "崩溃恢复 — checkpoint 机制",
+    "description": "主进程崩溃后，从 checkpoint 恢复，跳过已 done REQs",
+    "input": {
+      "checkpoint": {
+        "iteration": 3,
+        "done_reqs": ["REQ-001", "REQ-002"],
+        "last_commit": "ralph-loop: REQ-002"
+      },
+      "recover_from": "crash"
+    },
+    "expected": {
+      "next_req": "REQ-003",
+      "skip_reqs": ["REQ-001", "REQ-002"],
+      "commits_retained": true,
+      "no_redo_committed": true
+    }
+  },
+  {
+    "id": "ralph-014",
+    "name": "REQ 粒度过大检测",
+    "description": "REQ 超时 2 次后 BLOCK + 提示用户拆分",
+    "input": {
+      "req": "REQ-004",
+      "timeout_count": 2,
+      "max_timeout": 300
+    },
+    "expected": {
+      "status": "blocked",
+      "message": "REQ-004 过大，建议拆分为多个子 REQ",
+      "user_options": ["split", "skip", "continue"]
+    }
+  },
+  {
+    "id": "ralph-015",
+    "name": "Subagent dispatch — OpenCode task()",
+    "description": "验证 dispatch 使用 task() 工具，带正确 input contract",
+    "input": {
+      "req": "REQ-001",
+      "dispatch_method": "task(category=unspecified-high, load_skills=[test-driven-development], timeout=300)",
+      "context": {
+        "requirement": "REQ-001: 创建 User Model",
+        "permanent_learnings": ["auth middleware before validation"],
+        "contextual_learnings": ["migration files in src/migrations/"],
+        "agents_md": "project conventions",
+        "git_log": "commit1, commit2, commit3"
+      }
+    },
+    "expected": {
+      "dispatched": true,
+      "timeout_configured": true,
+      "skills_loaded": ["test-driven-development"],
+      "context_bounded": true
+    }
+  },
+  {
+    "id": "ralph-016",
+    "name": "首次 REQ，无 test-utils.ts — dispatch test-infra 子任务",
+    "description": "验证首个 REQ 执行时，若 test-utils.ts 不存在，先 dispatch 测试基础设施 subagent，不直接 dispatch 业务代码",
+    "input": {
+      "req": "REQ-001",
+      "test_utils_exists": false,
+      "infra_check_result": "missing"
+    },
+    "expected": {
+      "test_infra_dispatched": true,
+      "business_code_dispatched": false,
+      "infra_action": "generate_new",
+      "infra_max_retries": 2
+    }
+  },
+  {
+    "id": "ralph-017",
+    "name": "后续 REQ，test-utils.ts 已存在且接口完整 — 跳过 test-infra",
+    "description": "验证后续 REQ 执行时，若 test-utils.ts 已存在且导出 createTestApp() 和 withTestDb()，直接 dispatch 业务代码",
+    "input": {
+      "req": "REQ-003",
+      "test_utils_exists": true,
+      "exports": ["createTestApp", "withTestDb"],
+      "infra_check_result": "complete"
+    },
+    "expected": {
+      "test_infra_dispatched": false,
+      "business_code_dispatched": true,
+      "infra_summary_injected": true
+    }
+  },
+  {
+    "id": "ralph-018",
+    "name": "test-utils.ts 存在但接口不完整 — dispatch test-infra 增量补充",
+    "description": "验证 test-utils.ts 存在但缺少必需接口（如只有 createTestApp 缺少 withTestDb）时，dispatch test-infra 增量补充",
+    "input": {
+      "req": "REQ-002",
+      "test_utils_exists": true,
+      "exports": ["createTestApp"],
+      "missing_exports": ["withTestDb"],
+      "infra_check_result": "partial"
+    },
+    "expected": {
+      "test_infra_dispatched": true,
+      "business_code_dispatched": false,
+      "infra_action": "incremental_add_missing_exports"
+    }
+  }
+]