gsd-lite 0.3.2 → 0.3.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -7,6 +7,25 @@ const fs = require('node:fs');
7
7
  const path = require('node:path');
8
8
  const os = require('node:os');
9
9
 
10
+ /**
11
+ * Walk from startDir up to filesystem root looking for a .gsd directory.
12
+ * Returns the absolute path to .gsd if found, or null.
13
+ */
14
+ function findGsdDir(startDir) {
15
+ let dir = startDir;
16
+ while (true) {
17
+ const candidate = path.join(dir, '.gsd');
18
+ try {
19
+ fs.statSync(candidate);
20
+ return candidate;
21
+ } catch {
22
+ const parent = path.dirname(dir);
23
+ if (parent === dir) return null; // reached filesystem root
24
+ dir = parent;
25
+ }
26
+ }
27
+ }
28
+
10
29
  let input = '';
11
30
  const stdinTimeout = setTimeout(() => process.exit(0), 3000);
12
31
  process.stdin.setEncoding('utf8');
@@ -17,13 +36,14 @@ process.stdin.on('end', () => {
17
36
  const data = JSON.parse(input);
18
37
  const model = data.model?.display_name || 'Claude';
19
38
  const cwd = data.workspace?.current_dir || process.cwd();
20
- const session = data.session_id || '';
39
+ const session = String(data.session_id || '').replace(/[^a-zA-Z0-9_-]/g, '');
40
+ if (!session) process.exit(0); // Reject empty session ID to avoid bridge file collision
21
41
  const remaining = data.context_window?.remaining_percentage;
22
42
 
23
43
  // Current GSD task from state.json
24
44
  let task = '';
25
45
  let hasGsd = false;
26
- const gsdDir = path.join(cwd, '.gsd');
46
+ const gsdDir = findGsdDir(cwd);
27
47
  try {
28
48
  const state = JSON.parse(fs.readFileSync(path.join(gsdDir, 'state.json'), 'utf8'));
29
49
  hasGsd = true;
@@ -64,26 +84,30 @@ process.stdin.on('end', () => {
64
84
  }));
65
85
  fs.renameSync(tmpBridge, bridgePath);
66
86
  }
67
- } catch {
68
- // Silent fail bridge is best-effort
87
+ } catch (e) {
88
+ if (process.env.GSD_DEBUG) process.stderr.write(`gsd-statusline: bridge write failed: ${e.message}\n`);
69
89
  }
70
90
  }
71
91
 
72
- // Also write to .gsd/.context-health for MCP server reads (skip if unchanged)
73
- try {
74
- const healthPath = path.join(gsdDir, '.context-health');
75
- const current = fs.readFileSync(healthPath, 'utf8').trim();
76
- if (current !== String(remaining)) {
77
- fs.writeFileSync(healthPath, String(remaining));
78
- }
79
- } catch {
80
- // File doesn't exist yet or .gsd/ missing — ensure dir exists then atomic write
92
+ // Also write to .gsd/.context-health for MCP server reads (atomic, skip if unchanged)
93
+ // Only write if a .gsd directory was found — never create .gsd from the hook
94
+ if (gsdDir) {
81
95
  try {
82
- fs.mkdirSync(gsdDir, { recursive: true });
83
- const tmpHealth = path.join(gsdDir, `.context-health.${process.pid}.tmp`);
84
- fs.writeFileSync(tmpHealth, String(remaining));
85
- fs.renameSync(tmpHealth, path.join(gsdDir, '.context-health'));
86
- } catch { /* silent */ }
96
+ const healthPath = path.join(gsdDir, '.context-health');
97
+ let needsHealthWrite = true;
98
+ try {
99
+ const current = fs.readFileSync(healthPath, 'utf8').trim();
100
+ if (current === String(remaining)) needsHealthWrite = false;
101
+ } catch { /* file doesn't exist yet */ }
102
+ if (needsHealthWrite) {
103
+ fs.mkdirSync(gsdDir, { recursive: true });
104
+ const tmpHealth = path.join(gsdDir, `.context-health.${process.pid}-${Date.now()}.tmp`);
105
+ fs.writeFileSync(tmpHealth, String(remaining));
106
+ fs.renameSync(tmpHealth, healthPath);
107
+ }
108
+ } catch (e) {
109
+ if (process.env.GSD_DEBUG) process.stderr.write(`gsd-statusline: context-health write failed: ${e.message}\n`);
110
+ }
87
111
  }
88
112
 
89
113
  // Progress bar (10 segments)
@@ -108,7 +132,7 @@ process.stdin.on('end', () => {
108
132
  } else {
109
133
  process.stdout.write(`\x1b[2m${model}\x1b[0m \u2502 \x1b[2m${dirname}\x1b[0m${ctx}`);
110
134
  }
111
- } catch {
112
- // Silent fail
135
+ } catch (e) {
136
+ if (process.env.GSD_DEBUG) process.stderr.write(`gsd-statusline: ${e.message}\n`);
113
137
  }
114
138
  });
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "gsd-lite",
3
- "version": "0.3.2",
3
+ "version": "0.3.6",
4
4
  "description": "AI orchestration tool for Claude Code — GSD management shell + Superpowers quality core",
5
5
  "type": "module",
6
6
  "bin": {
@@ -0,0 +1,166 @@
1
+ # Evidence 系统规格参考
2
+
3
+ ## 概述
4
+
5
+ Evidence 是 GSD-Lite 的验证证据系统,用于记录 task 和 phase 的执行/审查证据。存储在 `state.json` 的 `evidence` 字段中,以 key-value 对象形式组织。
6
+
7
+ ## Evidence 对象结构
8
+
9
+ `state.evidence` 是一个扁平对象,key 为 evidence ID,value 为 evidence 数据对象。
10
+
11
+ ```json
12
+ {
13
+ "evidence": {
14
+ "ev:test:phase-1": {
15
+ "id": "ev:test:phase-1",
16
+ "scope": "task:1.2",
17
+ "type": "test",
18
+ ...
19
+ },
20
+ "ev:lint:2.3": {
21
+ "id": "ev:lint:2.3",
22
+ "scope": "task:2.3",
23
+ "type": "lint",
24
+ ...
25
+ }
26
+ }
27
+ }
28
+ ```
29
+
30
+ ### 必需字段
31
+
32
+ | 字段 | 类型 | 约束 | 说明 |
33
+ |------|------|------|------|
34
+ | `id` | string | 非空 | evidence 唯一标识符 |
35
+ | `scope` | string | 非空 | 作用域标识,格式见下方 |
36
+
37
+ ### 验证规则
38
+
39
+ `addEvidence()` 入参校验:
40
+ - `id` 必须是非空字符串
41
+ - `data` 必须是非 null 的普通对象
42
+ - `data.scope` 必须是字符串
43
+
44
+ `state.evidence` 整体校验 (`validateState()`):
45
+ - 必须是普通对象 (isPlainObject)
46
+
47
+ ## ID 格式约定
48
+
49
+ Evidence ID 采用 `ev:<type>:<scope>` 格式:
50
+
51
+ ```
52
+ ev:test:phase-1 # phase 级测试证据
53
+ ev:lint:phase-2 # phase 级 lint 证据
54
+ ev:test:users-update # task 级测试证据
55
+ ev:typecheck:phase-2 # phase 级类型检查证据
56
+ ```
57
+
58
+ 此格式为约定 (convention),由 executor/reviewer 生成时遵守。系统不强制校验 ID 格式。
59
+
60
+ ## Scope 格式
61
+
62
+ Scope 标识 evidence 所属的作用域。核心格式为 `task:X.Y`:
63
+
64
+ ```
65
+ task:1.2 -> phase 1, task 2
66
+ task:2.3 -> phase 2, task 3
67
+ task:3.1 -> phase 3, task 1
68
+ ```
69
+
70
+ ### parseScopePhase 解析
71
+
72
+ `parseScopePhase(scope)` 从 scope 字符串提取 phase 编号:
73
+
74
+ - 正则: `/^task:(\d+)\./`
75
+ - `"task:1.2"` -> 返回 `1`
76
+ - `"task:2.3"` -> 返回 `2`
77
+ - `"phase:1"` -> 返回 `null` (不匹配 task: 前缀)
78
+ - `null`/`undefined` -> 返回 `null`
79
+
80
+ 此函数用于 evidence 归档时判断 evidence 所属 phase。
81
+
82
+ 来源: `parseScopePhase()` in `src/tools/state.js`
83
+
84
+ ## 容量限制与自动裁剪
85
+
86
+ ### MAX_EVIDENCE_ENTRIES
87
+
88
+ - 硬限制: `200` 条
89
+ - 定义位置: `src/tools/state.js` 顶层常量
90
+
91
+ ### 自动裁剪触发
92
+
93
+ `addEvidence()` 每次添加 evidence 后检查:
94
+
95
+ ```
96
+ if (Object.keys(state.evidence).length > MAX_EVIDENCE_ENTRIES) {
97
+ -> 调用 _pruneEvidenceFromState(state, currentPhase, gsdDir)
98
+ }
99
+ ```
100
+
101
+ ### 裁剪逻辑
102
+
103
+ `_pruneEvidenceFromState(state, currentPhase, gsdDir)`:
104
+
105
+ 1. 遍历所有 evidence 条目
106
+ 2. 对每条 evidence 调用 `parseScopePhase(entry.scope)` 提取 phase 编号
107
+ 3. 如果 `phaseNum !== null && phaseNum < currentPhase` -> 标记为待归档
108
+ 4. 其余保留 (包括 scope 无法解析的条目)
109
+
110
+ 规则: 仅保留当前 phase 的 evidence,归档所有更早 phase 的 evidence。
111
+
112
+ ## 归档生命周期
113
+
114
+ ### 归档路径
115
+
116
+ `.gsd/evidence-archive.json`
117
+
118
+ ### 归档流程
119
+
120
+ ```
121
+ _pruneEvidenceFromState()
122
+ -> 分离 toArchive / toKeep
123
+ -> 读取现有 evidence-archive.json (不存在则 {})
124
+ -> Object.assign(archive, toArchive) 合并
125
+ -> writeJson(archivePath, archive) 写入归档文件
126
+ -> state.evidence = toKeep 更新内存中的 state
127
+ ```
128
+
129
+ ### 触发时机
130
+
131
+ 1. `addEvidence()` — 当 evidence 数量超过 MAX_EVIDENCE_ENTRIES 时自动触发
132
+ 2. `phaseComplete()` — phase 完成后主动触发 (在 phase lifecycle 转换为 accepted 之后)
133
+ 3. `pruneEvidence()` — 显式调用的外部接口
134
+
135
+ ### 归档特性
136
+
137
+ - 归档是追加式的: 新归档条目与已有归档 merge
138
+ - 归档后 state.evidence 中的对应条目被移除
139
+ - 归档文件持久保存,不会被自动清理
140
+
141
+ ## Evidence 来源
142
+
143
+ ### Executor 结果
144
+
145
+ `handleExecutorResult()` 处理 executor 返回的 evidence:
146
+
147
+ 1. `result.evidence` 数组写入 task 的 `evidence_refs`
148
+ 2. 对数组中每个符合条件的条目 (有 `id` 和 `scope` 字符串字段) 调用 `addEvidence()` 存入 `state.evidence`
149
+ 3. outcome 为 `checkpointed` / `blocked` / `failed` 时均会保存 evidence_refs
150
+
151
+ ### Reviewer 结果
152
+
153
+ `handleReviewerResult()` 处理 reviewer 返回的 evidence:
154
+
155
+ 1. 同样遍历 `result.evidence` 数组
156
+ 2. 对符合条件的条目调用 `addEvidence()` 存入 `state.evidence`
157
+
158
+ ### Task 上的 evidence_refs
159
+
160
+ 每个 task 对象有 `evidence_refs` 数组字段:
161
+ - 类型: `Array` (validateState 要求)
162
+ - 初始值: `[]`
163
+ - 更新时机: executor checkpointed / blocked / failed 时从 result.evidence 覆写
164
+ - 清空时机: `propagateInvalidation()` 或 reviewer 标记 rework 时清空为 `[]`
165
+
166
+ 来源: `addEvidence()`, `_pruneEvidenceFromState()`, `pruneEvidence()`, `phaseComplete()` in `src/tools/state.js`; `handleExecutorResult()`, `handleReviewerResult()` in `src/tools/orchestrator.js`
@@ -0,0 +1,162 @@
1
+ # Execution Loop -- Canonical Specification
2
+
3
+ 本文件是执行循环的唯一 source of truth。所有 command 文件 (start.md, prd.md, resume.md) 引用此文件。
4
+
5
+ ---
6
+
7
+ ### 11.1 — 加载 phase 计划
8
+
9
+ ```
10
+ for each pending phase:
11
+ 加载 phase 计划 + todo DAG
12
+ ```
13
+
14
+ ### 11.2 — 选择 runnable task
15
+
16
+ 选择条件:
17
+ - `lifecycle` 属于 `{pending, needs_revalidation}`
18
+ - `requires` 中每个依赖都满足对应 gate
19
+ - 不被 unresolved blocker 阻塞
20
+ - 未超过 retry 上限
21
+
22
+ 如果 0 个 runnable task 且 phase 未完成:
23
+ ```
24
+ ├── 全部 blocked → workflow_mode = awaiting_user,展示所有 blocker
25
+ └── 全部等待 review → 触发 batch review (L1) 或等待 L2 review 完成
26
+ ```
27
+
28
+ ### 11.3 — 构建 executor 上下文 + 串行派发
29
+
30
+ executor 上下文传递协议 (orchestrator → executor):
31
+ ```
32
+ ├── task_spec: 从 phases/*.md 提取当前 task 的规格段落
33
+ ├── research_decisions: 从 research_basis 引用的 decision 摘要
34
+ ├── predecessor_outputs: 前置依赖 task 的 files_changed + checkpoint_commit
35
+ ├── project_conventions: CLAUDE.md 路径 (executor 自行读取)
36
+ ├── workflows: 需加载的工作流文件路径 (如 tdd-cycle.md)
37
+ └── constraints: retry_count / level / review_required
38
+ ```
39
+
40
+ 派发 `executor` 子代理执行单个 task。
41
+
42
+ ### 11.4 — 处理 executor 结果
43
+
44
+ 严格按 agent result contract 处理:
45
+ ```
46
+ ├── checkpointed → 写入 checkpoint commit + evidence refs → 进入审查 (11.5)
47
+ ├── blocked → 写入 blocked_reason / unblock_condition
48
+ │ → 编排器检查 decisions 数组,能自动回答则重新派发
49
+ │ → 不能回答 → workflow_mode = awaiting_user,向用户转达
50
+ ├── failed → retry_count + 1
51
+ │ → 未超限 → 重新派发 executor
52
+ │ → 超限 (3次) 或返回 [FAILED] 且错误指纹重复
53
+ │ 或修复尝试未收敛 → 触发 debugger (见下方)
54
+ ```
55
+
56
+ **Debugger 触发流程:**
57
+ 1. 编排器派发 `debugger` 子代理,传入: 错误信息 + executor 修复尝试记录 + 相关代码路径
58
+ 2. debugger 返回: 根因分析 + 修复方向建议
59
+ 3. 编排器决定:
60
+ - 带修复方向重新派发 executor
61
+ - 标记 task failed
62
+ - 标记 phase failed
63
+
64
+ **Decisions 累积:**
65
+ - executor 返回 `[DECISION]` → 编排器追加到 `state.json` 的 `decisions` 数组
66
+ - 每条 decision 记录: `id` / `task` / `summary` / `phase`
67
+ - decisions 跨 task、跨 phase、跨 `/clear` + `/gsd:resume` 持久保留
68
+ - 编排器收到 `[BLOCKED]` 时,先查 `decisions` 数组尝试自动回答
69
+
70
+ ### 11.5 — 分层审查
71
+
72
+ ```
73
+ ├── L0: checkpoint commit 后可直接 accepted (无需 reviewer)
74
+ ├── L1: phase 结束后批量 reviewer 审查
75
+ │ → 派发 reviewer 子代理,scope = phase
76
+ └── L2: checkpoint commit 后立即独立审查
77
+ → 派发 reviewer 子代理,scope = task
78
+ → 未 accepted 前不释放其下游依赖
79
+ ```
80
+
81
+ **审查级别运行时重分类:**
82
+ - executor 报告 `contract_changed: true` + 涉及 auth/payment/public API → 自动升级为 L2
83
+ - executor 标注 `[LEVEL-UP]` → 编排器采纳
84
+ - 不主动降级 (安全优先)
85
+
86
+ ### 11.6 — 处理 reviewer 结果
87
+
88
+ ```
89
+ ├── 无 Critical → 更新 accepted 状态 + evidence refs
90
+ └── 有 Critical → 标记返工 task + 失效传播 → 重新审查 (最多 3 轮)
91
+ ```
92
+
93
+ **返工失效传播规则:**
94
+ - 返工修改了 contract / schema / shared behavior:
95
+ → 所有直接和间接依赖 task → `needs_revalidation`
96
+ → 清空其旧 `evidence_refs`
97
+ → 已 accepted 则退回到 `checkpointed` 或 `pending_review`
98
+ - 返工只影响局部实现、外部契约未变:
99
+ → 下游 task 保持现状
100
+ → 但受影响验证范围必须重跑并刷新 evidence
101
+ - 触发判定: `contract_changed` (executor 运行时报告) 是主触发源
102
+ `invalidate_downstream_on_change` (planner 静态标记) 是预判辅助
103
+ → executor 报告 `contract_changed: true` → 一定传播
104
+ → planner 标记但 executor 报告 false → 不传播 (以运行时实际为准)
105
+
106
+ ### 11.7 — Phase handoff gate
107
+
108
+ <HARD-GATE id="phase-handoff">
109
+ 所有条件必须满足才能进入下一 phase:
110
+ - [ ] 所有 required task = `accepted`
111
+ - [ ] required review = `passed`
112
+ - [ ] critical issues = 0
113
+ - [ ] tests/lint/typecheck 满足计划验证条件
114
+ - [ ] 方向校验: 当前阶段产出是否仍与 plan.md 中的项目目标一致?
115
+
116
+ → 全部满足 → 自动进入下一阶段
117
+ → 任一不满足 → 标注问题,尝试修复,3 次失败停止
118
+ → 方向漂移 → workflow_mode = awaiting_user,展示偏差让用户决定
119
+ </HARD-GATE>
120
+
121
+ ### 11.8 — 批量更新 state.json
122
+
123
+ 阶段完成后,编排器批量更新 state.json:
124
+ - 更新 phase lifecycle → `accepted`
125
+ - 更新 phase_handoff 信息
126
+ - 归档旧 phase 的 evidence (仅保留当前 phase)
127
+ - 推进 `current_phase` 到下一个 pending phase
128
+
129
+ **规则:** 只有编排器写 state.json,避免并发竞态。
130
+
131
+ ### 11.9 — 上下文检查
132
+
133
+ 每次派发子代理前和阶段切换时检查上下文健康度:
134
+
135
+ ```
136
+ remaining <= 35%:
137
+ 1. 保存完整状态到 state.json
138
+ 2. workflow_mode = awaiting_clear
139
+ 3. 输出: "上下文剩余 <=35%,已保存进度。请执行 /clear 然后 /gsd:resume 继续"
140
+ 4. 停止执行
141
+
142
+ remaining <= 25%:
143
+ 1. 紧急保存状态到 state.json
144
+ 2. workflow_mode = awaiting_clear
145
+ 3. 输出: "上下文即将耗尽,已保存进度。请立即执行 /clear 然后 /gsd:resume"
146
+ 4. 立即停止
147
+ ```
148
+
149
+ ---
150
+
151
+ ## 依赖门槛语义 (Gate-aware dependencies)
152
+
153
+ ```json
154
+ { "kind": "task", "id": "2.2", "gate": "checkpoint" } // 低风险内部串接
155
+ { "kind": "task", "id": "2.3", "gate": "accepted" } // 默认安全门槛
156
+ { "kind": "phase", "id": 2, "gate": "phase_complete" } // 跨 phase 依赖
157
+ ```
158
+
159
+ - `checkpoint` — 允许依赖未独立验收的实现检查点;只适合低风险内部串接
160
+ - `accepted` — 默认安全门槛;适合共享行为、公共接口、L2 风险任务
161
+ - `phase_complete` — 跨 phase 依赖;只有 phase handoff 完成后才释放
162
+ - 默认值: 如果 planner 没显式放宽,则依赖按 `accepted` 处理
@@ -0,0 +1,84 @@
1
+ # 审查级别分类参考
2
+
3
+ ## 静态分类 (计划时)
4
+
5
+ | 级别 | 适用场景 | 审查方式 |
6
+ |------|---------|---------|
7
+ | L0 | 无运行时语义变化 (docs/config/style) | checkpoint 后直接 accepted |
8
+ | L1 | 普通编码任务 (默认) | phase 结束后批量审查 |
9
+ | L2 | 高风险 (auth/payment/public API/DB migration) | checkpoint 后立即独立审查 |
10
+
11
+ ## 运行时重分类
12
+
13
+ 触发条件 (L1 -> L2 升级):
14
+ 1. executor 报告 `contract_changed: true` 且 task name 匹配敏感关键词
15
+ 2. executor decisions 中包含 `[LEVEL-UP]` 标注 (字符串或 `decision.summary` 中包含)
16
+
17
+ 敏感关键词正则 (`SENSITIVE_KEYWORDS`):
18
+
19
+ ```
20
+ /\b(auth|payment|security|public.?api|login|token|credential|session|oauth)\b/i
21
+ ```
22
+
23
+ 规则: 只升不降 (安全优先)。当前级别为 L2 或 L3 时直接保持不变。
24
+
25
+ ## 决策树
26
+
27
+ ```
28
+ task.level 当前值?
29
+ ├── L2 或 L3 -> 保持不变 (不降级)
30
+ └── L0 或 L1
31
+ ├── executor decisions 含 [LEVEL-UP]? -> 升级为 L2
32
+ ├── contract_changed: true + task.name 匹配敏感关键词? -> 升级为 L2
33
+ └── 否 -> 保持当前级别
34
+ ```
35
+
36
+ 来源: `reclassifyReviewLevel()` in `src/tools/state.js`
37
+
38
+ ## 审查流程
39
+
40
+ ### L0 流程
41
+
42
+ ```
43
+ executor checkpointed
44
+ -> handleExecutorResult 检测 reviewLevel === 'L0'
45
+ -> auto_accepted = true
46
+ -> 编排器直接 accepted (persist lifecycle: 'accepted', done +1)
47
+ -> 释放下游依赖
48
+ ```
49
+
50
+ 不派发 reviewer。`review_required: false` 的 task 同样走此路径。
51
+
52
+ ### L1 流程
53
+
54
+ ```
55
+ executor checkpointed
56
+ -> workflow_mode 保持 'executing_task'
57
+ -> 继续执行其他 task
58
+ -> phase 内所有 runnable task 完成后
59
+ -> selectRunnableTask 返回 { mode: 'trigger_review' }
60
+ -> 编排器设置 workflow_mode = 'reviewing_phase'
61
+ -> 派发 reviewer (scope='phase', review_level='L1-batch')
62
+ -> 批量审查所有 checkpointed task (排除 L0)
63
+ ```
64
+
65
+ ### L2 流程
66
+
67
+ ```
68
+ executor checkpointed
69
+ -> handleExecutorResult 检测 reviewLevel === 'L2' && review_required !== false
70
+ -> 设置 current_review = { scope: 'task', scope_id: task.id, stage: 'spec' }
71
+ -> workflow_mode = 'reviewing_task'
72
+ -> 派发 reviewer (scope='task', review_level='L2')
73
+ -> 审查通过后才释放下游依赖
74
+ ```
75
+
76
+ ## Reviewer 结果处理
77
+
78
+ | 审查结果 | 编排器行为 |
79
+ |----------|-----------|
80
+ | 无 critical issues | accepted_tasks 标记为 `accepted`; phase_review.status = `accepted` |
81
+ | 有 critical issues | rework_tasks 标记为 `needs_revalidation`; phase_review.status = `rework_required` |
82
+ | critical + `invalidates_downstream` | 触发 `propagateInvalidation`: 所有下游依赖 task -> `needs_revalidation` + 清空 evidence_refs |
83
+
84
+ 来源: `handleReviewerResult()` in `src/tools/orchestrator.js`, `reviewer.md` in `agents/`