sillyspec 3.18.2 → 3.18.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (40) hide show
  1. package/docs/brainstorm-plan-contract.md +64 -0
  2. package/docs/plan-execute-contract.md +123 -0
  3. package/docs/revision-mode.md +115 -0
  4. package/docs/sillyspec/file-lifecycle.md +13 -4
  5. package/docs/workflow-contract-regression.md +106 -0
  6. package/package.json +1 -1
  7. package/packages/dashboard/dist/assets/{index-DpLHK4jv.js → index-Bq_Z2hne.js} +568 -568
  8. package/packages/dashboard/dist/assets/{index-BcM2J-hv.css → index-O2W5RV4z.css} +1 -1
  9. package/packages/dashboard/dist/index.html +16 -16
  10. package/packages/dashboard/src/components/PipelineStage.vue +22 -2
  11. package/packages/dashboard/src/components/PipelineView.vue +10 -2
  12. package/packages/dashboard/src/components/StageBadge.vue +17 -3
  13. package/packages/dashboard/src/components/StepCard.vue +7 -2
  14. package/src/change-risk-profile.js +167 -0
  15. package/src/contract-matrix.js +278 -0
  16. package/src/db.js +6 -0
  17. package/src/endpoint-extractor.js +315 -0
  18. package/src/index.js +53 -6
  19. package/src/init.js +31 -4
  20. package/src/knowledge-match.js +130 -0
  21. package/src/progress.js +464 -11
  22. package/src/run.js +287 -7
  23. package/src/scan-postcheck.js +34 -2
  24. package/src/stage-contract.js +86 -6
  25. package/src/stages/brainstorm.js +23 -0
  26. package/src/stages/execute.js +158 -4
  27. package/src/stages/plan.js +82 -0
  28. package/src/stages/scan.js +40 -0
  29. package/src/stages/verify.js +63 -2
  30. package/src/worktree.js +264 -35
  31. package/test/brainstorm-plan-contract.test.mjs +273 -0
  32. package/test/contract-artifacts.test.mjs +323 -0
  33. package/test/knowledge-match.test.mjs +231 -0
  34. package/test/plan-execute-contract.test.mjs +330 -0
  35. package/test/platform-failure-samples.test.mjs +4 -0
  36. package/test/revision-v1.test.mjs +1145 -0
  37. package/test/scan-knowledge.test.mjs +175 -0
  38. package/test/scan-postcheck.test.mjs +3 -0
  39. package/test/spec-dir.test.mjs +8 -3
  40. package/test/stage-definitions.test.mjs +1 -1
@@ -0,0 +1,330 @@
1
+ /**
2
+ * Plan → Execute Contract v1 测试
3
+ *
4
+ * 验证 plan.md 到 execute 的契约:
5
+ * 1. 各复杂度场景的 plan 校验通过
6
+ * 2. 非法 plan 被正确拒绝
7
+ * 3. execute 不复用旧 task
8
+ */
9
+ import { validatePlanForExecute } from '../src/stages/execute.js'
10
+
11
+ let failed = 0
12
+ const failures = []
13
+
14
+ function assert(condition, msg) {
15
+ if (!condition) {
16
+ failed++
17
+ failures.push(msg)
18
+ console.log(` ❌ FAIL: ${msg}`)
19
+ } else {
20
+ console.log(` ✅ PASS: ${msg}`)
21
+ }
22
+ }
23
+
24
+ console.log('=== Plan → Execute Contract v1 测试 ===\n')
25
+
26
+ // ─────────────────────────────────────────
27
+ // Case 1: none plan(最小变更)通过
28
+ // ─────────────────────────────────────────
29
+ console.log('--- Case 1: none plan contract 通过 ---')
30
+ {
31
+ const plan = `# Plan
32
+
33
+ ## Wave 1
34
+ - [ ] task-01: 修复 typo
35
+ `
36
+ const result = validatePlanForExecute(plan)
37
+ assert(result.ok, 'none plan 应校验通过')
38
+ assert(result.tasks.length === 1, `应有 1 个 task,实际 ${result.tasks.length}`)
39
+ assert(result.waves.length === 1, `应有 1 个 wave,实际 ${result.waves.length}`)
40
+ }
41
+
42
+ // ─────────────────────────────────────────
43
+ // Case 2: light plan 通过
44
+ // ─────────────────────────────────────────
45
+ console.log('\n--- Case 2: light plan contract 通过 ---')
46
+ {
47
+ const plan = `# Plan
48
+
49
+ ## Wave 1
50
+ - [ ] task-01: 添加 API 端点
51
+ - [ ] task-02: 添加前端调用
52
+ `
53
+ const result = validatePlanForExecute(plan)
54
+ assert(result.ok, 'light plan 应校验通过')
55
+ assert(result.tasks.length === 2, `应有 2 个 task,实际 ${result.tasks.length}`)
56
+ }
57
+
58
+ // ─────────────────────────────────────────
59
+ // Case 3: full plan with waves 通过
60
+ // ─────────────────────────────────────────
61
+ console.log('\n--- Case 3: full plan wave contract 通过 ---')
62
+ {
63
+ const plan = `# Plan
64
+
65
+ ## Wave 1: 基础设施
66
+ - [ ] task-01: 数据库 schema
67
+ - 修改: db/migrate/001.sql
68
+ - [ ] task-02: 模型定义
69
+
70
+ ## Wave 2: 业务逻辑
71
+ - [ ] task-03: API 实现
72
+ - [ ] task-04: 业务规则
73
+
74
+ ## Wave 3: 测试
75
+ - [ ] task-05: 集成测试
76
+ - 参考: tests/integration/
77
+ `
78
+ const result = validatePlanForExecute(plan)
79
+ assert(result.ok, 'full plan 应校验通过')
80
+ assert(result.tasks.length === 5, `应有 5 个 task,实际 ${result.tasks.length}`)
81
+ assert(result.waves.length === 3, `应有 3 个 wave,实际 ${result.waves.length}`)
82
+ assert(result.tasks[0].index === 1, 'task-01 index 应为 1')
83
+ assert(result.tasks[4].index === 5, 'task-05 index 应为 5')
84
+ }
85
+
86
+ // ─────────────────────────────────────────
87
+ // Case 4: 无 checkbox task 失败
88
+ // ─────────────────────────────────────────
89
+ console.log('\n--- Case 4: 无 checkbox task 失败 ---')
90
+ {
91
+ const plan = `# Plan
92
+
93
+ 这个 plan 只有描述,没有任何 task。
94
+
95
+ ## 注意事项
96
+ - 设计文档已就绪
97
+ `
98
+ const result = validatePlanForExecute(plan)
99
+ assert(!result.ok, '无 checkbox task 应失败')
100
+ assert(result.errors.some(e => e.includes('checkbox task')), '错误应提到 checkbox task')
101
+ }
102
+
103
+ // ─────────────────────────────────────────
104
+ // Case 5: task id 重复失败
105
+ // ─────────────────────────────────────────
106
+ console.log('\n--- Case 5: task id 重复失败 ---')
107
+ {
108
+ const plan = `# Plan
109
+
110
+ ## Wave 1
111
+ - [ ] task-01: 第一个任务
112
+ - [ ] task-01: 重复的任务
113
+ `
114
+ const result = validatePlanForExecute(plan)
115
+ assert(!result.ok, 'task id 重复应失败')
116
+ assert(result.errors.some(e => e.includes('重复')), '错误应提到重复')
117
+ }
118
+
119
+ // ─────────────────────────────────────────
120
+ // Case 6: task id 不连续失败
121
+ // ─────────────────────────────────────────
122
+ console.log('\n--- Case 6: task id 不连续失败 ---')
123
+ {
124
+ const plan = `# Plan
125
+
126
+ ## Wave 1
127
+ - [ ] task-01: 第一个
128
+ - [ ] task-03: 跳过了第二个
129
+ `
130
+ const result = validatePlanForExecute(plan)
131
+ assert(!result.ok, 'task id 不连续应失败')
132
+ assert(result.errors.some(e => e.includes('不连续')), '错误应提到不连续')
133
+ }
134
+
135
+ // ─────────────────────────────────────────
136
+ // Case 7: 空 plan 失败
137
+ // ─────────────────────────────────────────
138
+ console.log('\n--- Case 7: 空 plan 失败 ---')
139
+ {
140
+ const result1 = validatePlanForExecute('')
141
+ assert(!result1.ok, '空字符串应失败')
142
+
143
+ const result2 = validatePlanForExecute(null)
144
+ assert(!result2.ok, 'null 应失败')
145
+
146
+ const result3 = validatePlanForExecute(' ')
147
+ assert(!result3.ok, '纯空格应失败')
148
+ }
149
+
150
+ // ─────────────────────────────────────────
151
+ // Case 8: task name 非空
152
+ // ─────────────────────────────────────────
153
+ console.log('\n--- Case 8: task name 为空失败 ---')
154
+ {
155
+ // 注意:parseWavesFromPlan 在 task name 为空字符串时可能不触发
156
+ // 这个 case 验证 validator 能检测到空 name
157
+ const plan = `# Plan
158
+
159
+ ## Wave 1
160
+ - [ ] task-01:
161
+ `
162
+ const result = validatePlanForExecute(plan)
163
+ // task name 为空时 trim 后为空
164
+ if (result.tasks.length > 0 && !result.tasks[0].name.trim()) {
165
+ assert(!result.ok, 'task name 为空应失败')
166
+ } else {
167
+ // 如果 parser 把空 name 过滤了,那至少 plan 能解析
168
+ console.log(' ℹ️ parser 过滤了空 name,跳过此 case')
169
+ }
170
+ }
171
+
172
+ // ─────────────────────────────────────────
173
+ // Case 9: task 无 id 只有 warning
174
+ // ─────────────────────────────────────────
175
+ console.log('\n--- Case 9: task 无 id 只有 warning ---')
176
+ {
177
+ const plan = `# Plan
178
+
179
+ ## Wave 1
180
+ - [ ] 实现登录功能
181
+ `
182
+ const result = validatePlanForExecute(plan)
183
+ // 无 id 的 task 只产生 warning,不阻止执行
184
+ assert(result.ok, '无 id task 不应阻止执行')
185
+ assert(result.warnings.length > 0, '应有 warning 关于缺少 task id')
186
+ }
187
+
188
+ // ─────────────────────────────────────────
189
+ // Case 10: 连续 id 从 1 开始
190
+ // ─────────────────────────────────────────
191
+ console.log('\n--- Case 10: task-02 起始不报不连续(兼容) ---')
192
+ {
193
+ const plan = `# Plan
194
+
195
+ ## Wave 1
196
+ - [ ] task-02: 第二个
197
+ - [ ] task-03: 第三个
198
+ `
199
+ const result = validatePlanForExecute(plan)
200
+ // 从 task-02 开始,ids[0]=2 ≠ 1,不触发连续性检查
201
+ assert(result.ok, 'task-02 起始不应报不连续')
202
+ }
203
+
204
+ // ─────────────────────────────────────────
205
+ // Case 11: 子行信息解析正确
206
+ // ─────────────────────────────────────────
207
+ console.log('\n--- Case 11: 子行信息(修改/参考)解析正确 ---')
208
+ {
209
+ const plan = `# Plan
210
+
211
+ ## Wave 1
212
+ - [ ] task-01: 实现功能
213
+ - 修改: src/auth.js
214
+ - 参考: docs/auth.md
215
+ - 步骤: 1. 创建模型 2. 写中间件
216
+ `
217
+ const result = validatePlanForExecute(plan)
218
+ assert(result.ok, '有子行的 plan 应校验通过')
219
+ assert(result.tasks[0].file === 'src/auth.js', 'task file 应为 src/auth.js')
220
+ assert(result.tasks[0].reference === 'docs/auth.md', 'task reference 应为 docs/auth.md')
221
+ }
222
+
223
+ // ─────────────────────────────────────────
224
+ // Case 12: 多 Wave 各自有 task
225
+ // ─────────────────────────────────────────
226
+ console.log('\n--- Case 12: 多 Wave 各自有 task ---')
227
+ {
228
+ const plan = `# Plan
229
+
230
+ ## Wave 1
231
+ - [ ] task-01: A
232
+
233
+ ## Wave 2
234
+ - [ ] task-02: B
235
+
236
+ ## Wave 3
237
+ - [ ] task-03: C
238
+ `
239
+ const result = validatePlanForExecute(plan)
240
+ assert(result.ok, '多 Wave plan 应校验通过')
241
+ assert(result.waves.length === 3, '应有 3 个 wave')
242
+ assert(result.waves[0].tasks.length === 1, 'wave 1 应有 1 task')
243
+ assert(result.waves[2].tasks[0].index === 3, 'wave 3 task 应为 task-03')
244
+ }
245
+
246
+ // ─────────────────────────────────────────
247
+ // Plan Postcheck Contract: valid none plan 通过
248
+ // ─────────────────────────────────────────
249
+ console.log('\n--- Plan Postcheck: valid none plan 通过 ---')
250
+ {
251
+ const plan = `# Plan\n\n## Wave 1\n- [ ] task-01: 修复 bug\n`
252
+ const result = validatePlanForExecute(plan)
253
+ assert(result.ok, 'none plan 应通过 postcheck contract')
254
+ assert(result.errors.length === 0, '不应有 errors')
255
+ }
256
+
257
+ // ─────────────────────────────────────────
258
+ // Plan Postcheck Contract: valid light plan 通过
259
+ // ─────────────────────────────────────────
260
+ console.log('\n--- Plan Postcheck: valid light plan 通过 ---')
261
+ {
262
+ const plan = `# Plan\n\n## Wave 1\n- [ ] task-01: API\n- [ ] task-02: 前端\n`
263
+ const result = validatePlanForExecute(plan)
264
+ assert(result.ok, 'light plan 应通过 postcheck contract')
265
+ }
266
+
267
+ // ─────────────────────────────────────────
268
+ // Plan Postcheck Contract: valid full plan 通过
269
+ // ─────────────────────────────────────────
270
+ console.log('\n--- Plan Postcheck: valid full plan 通过 ---')
271
+ {
272
+ const plan = `# Plan\n\n## Wave 1\n- [ ] task-01: A\n## Wave 2\n- [ ] task-02: B\n## Wave 3\n- [ ] task-03: C\n`
273
+ const result = validatePlanForExecute(plan)
274
+ assert(result.ok, 'full plan 应通过 postcheck contract')
275
+ assert(result.waves.length === 3, '应有 3 个 wave')
276
+ }
277
+
278
+ // ─────────────────────────────────────────
279
+ // Plan Postcheck Contract: missing checkbox 失败
280
+ // ─────────────────────────────────────────
281
+ console.log('\n--- Plan Postcheck: missing checkbox 失败 ---')
282
+ {
283
+ const plan = `# Plan\n\n只有描述没有 task。\n`
284
+ const result = validatePlanForExecute(plan)
285
+ assert(!result.ok, '无 checkbox 应不通过 postcheck')
286
+ assert(result.errors.length > 0, '应有 errors')
287
+ assert(result.errors.some(e => e.includes('checkbox task')), '应有 checkbox task 错误')
288
+ }
289
+
290
+ // ─────────────────────────────────────────
291
+ // Plan Postcheck Contract: warning 不阻断
292
+ // ─────────────────────────────────────────
293
+ console.log('\n--- Plan Postcheck: warning 不阻断 completed ---')
294
+ {
295
+ const plan = `# Plan\n\n## Wave 1\n- [ ] 实现功能(无 task id)\n`
296
+ const result = validatePlanForExecute(plan)
297
+ assert(result.ok, '有 warning 但应通过 postcheck(不阻断 completed)')
298
+ assert(result.warnings.length > 0, '应有 warning')
299
+ }
300
+
301
+ // ─────────────────────────────────────────
302
+ // Plan Postcheck Contract: id 重复失败
303
+ // ─────────────────────────────────────────
304
+ console.log('\n--- Plan Postcheck: task id 重复失败 ---')
305
+ {
306
+ const plan = `# Plan\n\n## Wave 1\n- [ ] task-01: A\n- [ ] task-01: B\n`
307
+ const result = validatePlanForExecute(plan)
308
+ assert(!result.ok, 'id 重复应不通过 postcheck')
309
+ }
310
+
311
+ // ─────────────────────────────────────────
312
+ // Plan Postcheck Contract: id 不连续失败
313
+ // ─────────────────────────────────────────
314
+ console.log('\n--- Plan Postcheck: task id 不连续失败 ---')
315
+ {
316
+ const plan = `# Plan\n\n## Wave 1\n- [ ] task-01: A\n- [ ] task-03: C\n`
317
+ const result = validatePlanForExecute(plan)
318
+ assert(!result.ok, 'id 不连续应不通过 postcheck')
319
+ }
320
+
321
+ // ── 结果 ──
322
+ console.log(`\n${'='.repeat(50)}`)
323
+ console.log(`✅ 通过: ${12 - failed} ❌ 失败: ${failed}`)
324
+ if (failures.length > 0) {
325
+ console.log(`失败项:`)
326
+ failures.forEach(f => console.log(` - ${f}`))
327
+ }
328
+ console.log(`${'='.repeat(50)}`)
329
+
330
+ if (failed > 0) process.exit(1)
@@ -167,6 +167,10 @@ console.log('\n=== Test 5: 正常成功场景 ===')
167
167
  // 在 specDir 写 local.yaml
168
168
  writeFileSync(join(specDir, 'local.yaml'), 'build: echo ok\ntest: echo ok\n')
169
169
 
170
+ // 创建 knowledge 目录和 INDEX.md(scan 已产出知识)
171
+ mkdirSync(join(specDir, 'knowledge'), { recursive: true })
172
+ writeFileSync(join(specDir, 'knowledge', 'INDEX.md'), '# Knowledge Index\n')
173
+
170
174
  const { runScanPostCheck } = await import('../src/scan-postcheck.js')
171
175
  const result = runScanPostCheck({ cwd, specDir })
172
176