principles-disciple 1.8.2 → 1.9.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/openclaw.plugin.json +4 -4
- package/package.json +1 -1
- package/src/core/pain-context-extractor.ts +286 -0
- package/src/core/pain.ts +83 -1
- package/src/hooks/lifecycle.ts +7 -6
- package/src/hooks/llm.ts +7 -6
- package/src/hooks/pain.ts +5 -6
- package/src/hooks/subagent.ts +5 -6
- package/src/service/evolution-worker.ts +59 -2
- package/templates/langs/en/skills/ai-sprint-orchestration/EXAMPLES.md +63 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/REFERENCE.md +136 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/SKILL.md +67 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/agent-registry.json +214 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +107 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +107 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +105 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +108 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/workflow-v1-acceptance-checklist.md +58 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/workflow-v1.4-work-unit-handoff.md +190 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/runtime/.gitignore +2 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/archive.mjs +310 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/contract-enforcement.mjs +683 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/decision.mjs +604 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/state-store.mjs +32 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/task-specs.mjs +707 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/run.mjs +3419 -0
- package/templates/langs/en/skills/pd-auditor/SKILL.md +61 -0
- package/templates/langs/en/skills/pd-daily/SKILL.md +1 -1
- package/templates/langs/en/skills/pd-diagnostician/SKILL.md +370 -0
- package/templates/langs/en/skills/pd-explorer/SKILL.md +65 -0
- package/templates/langs/en/skills/pd-grooming/SKILL.md +1 -1
- package/templates/langs/en/skills/pd-implementer/SKILL.md +68 -0
- package/templates/langs/en/skills/pd-mentor/SKILL.md +1 -1
- package/templates/langs/en/skills/pd-pain-signal/SKILL.md +37 -0
- package/templates/langs/en/skills/pd-planner/SKILL.md +65 -0
- package/templates/langs/zh/core/PRINCIPLES.md +7 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/EXAMPLES.md +63 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/REFERENCE.md +136 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/SKILL.md +67 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/agent-registry.json +214 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +107 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +107 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +105 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +108 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/workflow-v1-acceptance-checklist.md +58 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/workflow-v1.4-work-unit-handoff.md +190 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/runtime/.gitignore +2 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/archive.mjs +310 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/contract-enforcement.mjs +683 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/decision.mjs +604 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/state-store.mjs +32 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/task-specs.mjs +707 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/run.mjs +3419 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/test/archive.test.mjs +230 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/test/contract-enforcement.test.mjs +672 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/test/decision.test.mjs +1321 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/test/run.test.mjs +1419 -0
- package/templates/langs/zh/skills/pd-auditor/SKILL.md +1 -1
- package/templates/langs/zh/skills/pd-daily/SKILL.md +1 -1
- package/templates/langs/zh/skills/pd-diagnostician/SKILL.md +37 -23
- package/templates/langs/zh/skills/pd-explorer/SKILL.md +1 -1
- package/templates/langs/zh/skills/pd-grooming/SKILL.md +1 -1
- package/templates/langs/zh/skills/pd-implementer/SKILL.md +1 -1
- package/templates/langs/zh/skills/pd-mentor/SKILL.md +1 -1
- package/templates/langs/zh/skills/pd-pain-signal/SKILL.md +37 -0
- package/templates/langs/zh/skills/pd-planner/SKILL.md +1 -1
- package/tests/core/pain-context-extractor.test.ts +278 -0
- package/tests/core/pain.test.ts +100 -1
- package/tests/hooks/pain.test.ts +1 -1
- package/templates/langs/en/skills/pain/SKILL.md +0 -19
- package/templates/langs/zh/skills/pain/SKILL.md +0 -19
- package/templates/langs/zh/skills/pd-reporter/SKILL.md +0 -78
- package/templates/langs/zh/skills/pd-reviewer/SKILL.md +0 -66
|
@@ -0,0 +1,65 @@
|
|
|
1
|
+
---
|
|
2
|
+
name: pd-planner
|
|
3
|
+
description: Movie-script-style planning to break complex tasks into executable steps. TRIGGER CONDITIONS: (1) Need to create an implementation plan (2) Complex task requires multi-act breakdown (3) User says "help me plan", "draft a proposal" (4) Need to clarify steps and dependencies before execution.
|
|
4
|
+
disable-model-invocation: true
|
|
5
|
+
---
|
|
6
|
+
|
|
7
|
+
# Planner
|
|
8
|
+
|
|
9
|
+
You are a professional planning expert. Your task is to break down complex tasks into executable steps.
|
|
10
|
+
|
|
11
|
+
## Planning Method
|
|
12
|
+
|
|
13
|
+
Use a movie-script-style planning framework:
|
|
14
|
+
|
|
15
|
+
### Act 1: Understanding
|
|
16
|
+
- **Scene Setting**: Clarify objectives, constraints, resources
|
|
17
|
+
- **Character Analysis**: Identify all participants and their capabilities
|
|
18
|
+
- **Conflict Identification**: Clarify core conflicts to resolve
|
|
19
|
+
|
|
20
|
+
### Act 2: Decomposition
|
|
21
|
+
- **Act Breakdown**: Break the task into 3-7 acts (key steps)
|
|
22
|
+
- **Sub-tasks within Acts**: Each act contains 3-5 sub-tasks
|
|
23
|
+
- **Verification Points**: Verify output at the end of each act
|
|
24
|
+
|
|
25
|
+
### Act 3: Prioritization
|
|
26
|
+
- **Dependencies**: Identify task dependencies
|
|
27
|
+
- **Risk Ordering**: Front-load high-risk tasks
|
|
28
|
+
- **Resource Allocation**: Ensure critical resources are available
|
|
29
|
+
|
|
30
|
+
## Output Format
|
|
31
|
+
|
|
32
|
+
### Plan Document
|
|
33
|
+
|
|
34
|
+
**Task Objective**: [Clear objective statement]
|
|
35
|
+
|
|
36
|
+
**Constraints**:
|
|
37
|
+
- Time constraints: [Time limits]
|
|
38
|
+
- Resource constraints: [Available resources]
|
|
39
|
+
- Risk constraints: [Risks to avoid]
|
|
40
|
+
|
|
41
|
+
**Act 1: Understanding**
|
|
42
|
+
- Scene: [Current situation]
|
|
43
|
+
- Characters: [Stakeholders]
|
|
44
|
+
- Conflict: [Core problem]
|
|
45
|
+
|
|
46
|
+
**Act 2: Decomposition**
|
|
47
|
+
|
|
48
|
+
**Act 1**: [Title]
|
|
49
|
+
- Step 1.1: [Specific action]
|
|
50
|
+
- Step 1.2: [Specific action]
|
|
51
|
+
- Step 1.3: [Specific action]
|
|
52
|
+
- Verification: [Success criteria]
|
|
53
|
+
|
|
54
|
+
**Acts 2-N**: [Same structure as Act 1, repeated for each remaining act]
|
|
55
|
+
|
|
56
|
+
**Act 3: Prioritization**
|
|
57
|
+
- Sequence: [Recommended execution order]
|
|
58
|
+
- Parallel opportunities: [Tasks that can run in parallel]
|
|
59
|
+
- Checkpoints: [Key verification points]
|
|
60
|
+
|
|
61
|
+
**Risk Assessment**: [Potential issues and mitigations]
|
|
62
|
+
|
|
63
|
+
---
|
|
64
|
+
|
|
65
|
+
Please follow this framework to create a plan and output a structured execution script.
|
|
@@ -0,0 +1,7 @@
|
|
|
1
|
+
### P-10: 流程即权限 (Process as Authority)
|
|
2
|
+
- **Trigger**: 当智能体拥有技术能力直接执行某项操作时
|
|
3
|
+
- **Constraint (Must)**: 必须检查是否存在约定的流程。有流程则必须遵循,即使技术上可以绕过
|
|
4
|
+
- **Constraint (Forbidden)**: 禁止以"技术上可行"为由绕过约定流程
|
|
5
|
+
- **Verification**: 操作前自问:"这个操作有没有约定的流程?我是否在遵循它?"
|
|
6
|
+
- **Exceptions**: 紧急情况下可跳过流程,但事后必须补全流程记录
|
|
7
|
+
- **Source**: 2026-03-13 直接推送 main 分支事件
|
|
@@ -0,0 +1,63 @@
|
|
|
1
|
+
# AI 冲刺编排示例
|
|
2
|
+
|
|
3
|
+
## 示例 1:baseline + validation
|
|
4
|
+
|
|
5
|
+
```powershell
|
|
6
|
+
node scripts/run.mjs --self-check
|
|
7
|
+
node scripts/run.mjs --help
|
|
8
|
+
node scripts/run.mjs --task workflow-validation-minimal
|
|
9
|
+
node scripts/run.mjs --task workflow-validation-minimal-verify
|
|
10
|
+
```
|
|
11
|
+
|
|
12
|
+
## 示例 2:自定义 runtime 根目录
|
|
13
|
+
|
|
14
|
+
```powershell
|
|
15
|
+
node scripts/run.mjs --task workflow-validation-minimal --runtime-root D:/Temp/ai-sprint-runtime
|
|
16
|
+
```
|
|
17
|
+
|
|
18
|
+
## 示例 3:失败分类
|
|
19
|
+
|
|
20
|
+
- `workflow bug`:package-local script 仍然写回 repo-root `ops/ai-sprints`
|
|
21
|
+
- `agent behavior issue`:reviewer 漏掉 `VERDICT`,或 `DIMENSIONS` 格式错误
|
|
22
|
+
- `environment issue`:`acpx` 缺失,或 workspace 不可写
|
|
23
|
+
- `sample-spec issue`:validation spec 要求的字段,当前 sample / product 还没有实现
|
|
24
|
+
|
|
25
|
+
## 示例 4:何时停止
|
|
26
|
+
|
|
27
|
+
如果问题属于以下情况,完成分类后立刻停止本轮:
|
|
28
|
+
|
|
29
|
+
- 问题属于 `packages/openclaw-plugin`
|
|
30
|
+
- 问题依赖 `D:/Code/openclaw`
|
|
31
|
+
- 修复需要扩展 dashboard / stageGraph / 自优化 sprint
|
|
32
|
+
- 问题属于 sample-side 或 product-side 缺口,而不是 workflow plumbing
|
|
33
|
+
|
|
34
|
+
## 示例 5:从复杂 bugfix 模板开始
|
|
35
|
+
|
|
36
|
+
1. 复制 `references/specs/bugfix-complex-template.json`
|
|
37
|
+
2. 替换 `taskContract` 中的所有占位符
|
|
38
|
+
3. 把 `executionScope` 收窄到最小且有用的一轮
|
|
39
|
+
4. 用编辑后的 spec 运行打包入口:
|
|
40
|
+
|
|
41
|
+
```powershell
|
|
42
|
+
node scripts/run.mjs --task custom-bugfix --task-spec D:/path/to/your-bugfix-spec.json
|
|
43
|
+
```
|
|
44
|
+
|
|
45
|
+
## 示例 6:从复杂 feature 模板开始
|
|
46
|
+
|
|
47
|
+
1. 复制 `references/specs/feature-complex-template.json`
|
|
48
|
+
2. 填写 `Goal`、`In scope`、`Out of scope`、`Validation commands` 和 `Expected artifacts`
|
|
49
|
+
3. 确认 spec 不要求在当前里程碑之外完成 product-side 闭环
|
|
50
|
+
4. 运行:
|
|
51
|
+
|
|
52
|
+
```powershell
|
|
53
|
+
node scripts/run.mjs --task custom-feature --task-spec D:/path/to/your-feature-spec.json
|
|
54
|
+
```
|
|
55
|
+
|
|
56
|
+
## 示例 7:continuation 前先看 checkpoint summary
|
|
57
|
+
|
|
58
|
+
当一轮以 `revise` 结束时,优先检查:
|
|
59
|
+
|
|
60
|
+
- `stages/<stage>/checkpoint-summary.md`
|
|
61
|
+
- `stages/<stage>/handoff.json`
|
|
62
|
+
|
|
63
|
+
下一轮应该把 checkpoint summary 当作主 carry-forward,上下文不够时才回退到完整 decision 文本。
|
|
@@ -0,0 +1,136 @@
|
|
|
1
|
+
# AI 冲刺编排参考
|
|
2
|
+
|
|
3
|
+
## 包结构
|
|
4
|
+
|
|
5
|
+
- `scripts/run.mjs`:package-local orchestrator 入口
|
|
6
|
+
- `scripts/lib/`:decision、contract validation、state store、spec loading、archive helper
|
|
7
|
+
- `references/specs/`:内置 validation spec
|
|
8
|
+
- `references/agent-registry.json`:package-local 的 agent/model 注册表
|
|
9
|
+
- `references/workflow-v1-acceptance-checklist.md`:handoff 检查清单
|
|
10
|
+
- `runtime/`:运行产物默认目录
|
|
11
|
+
|
|
12
|
+
## Runtime 结构
|
|
13
|
+
|
|
14
|
+
默认 runtime 根目录:
|
|
15
|
+
|
|
16
|
+
- `packages/openclaw-plugin/templates/langs/<lang>/skills/ai-sprint-orchestration/runtime`
|
|
17
|
+
|
|
18
|
+
子目录:
|
|
19
|
+
|
|
20
|
+
- `runs/<run-id>/`
|
|
21
|
+
- `archive/<run-id>/`
|
|
22
|
+
- `tmp/sprint-agent/<run-id>/...`
|
|
23
|
+
|
|
24
|
+
也可以通过以下方式覆盖:
|
|
25
|
+
|
|
26
|
+
- `--runtime-root <path>`
|
|
27
|
+
- `AI_SPRINT_RUNTIME_ROOT=<path>`
|
|
28
|
+
|
|
29
|
+
## 自检
|
|
30
|
+
|
|
31
|
+
在新安装环境中先跑:
|
|
32
|
+
|
|
33
|
+
- `node scripts/run.mjs --self-check`
|
|
34
|
+
|
|
35
|
+
它会检查:
|
|
36
|
+
|
|
37
|
+
- package-local references 是否存在
|
|
38
|
+
- built-in spec 是否能加载
|
|
39
|
+
- `agent-registry.json` 是否存在
|
|
40
|
+
- `acpx` 是否可调用
|
|
41
|
+
- runtime 根目录是否可写
|
|
42
|
+
|
|
43
|
+
## 内置 spec
|
|
44
|
+
|
|
45
|
+
- `workflow-validation-minimal`
|
|
46
|
+
- `workflow-validation-minimal-verify`
|
|
47
|
+
- `bugfix-complex-template`(使用前需复制并填写)
|
|
48
|
+
- `feature-complex-template`(使用前需复制并填写)
|
|
49
|
+
|
|
50
|
+
其中两个 `workflow-validation-*` spec 用来做 package 自检,验证的是 workflow 包本身,不是产品功能;两个 `*-complex-template` 是模板,需要复制并填写最小 task contract 后才能用于实际任务。
|
|
51
|
+
|
|
52
|
+
## 关键产物
|
|
53
|
+
|
|
54
|
+
每次运行重点看:
|
|
55
|
+
|
|
56
|
+
- `sprint.json`
|
|
57
|
+
- `timeline.md`
|
|
58
|
+
- `latest-summary.md`
|
|
59
|
+
- `decision.md`
|
|
60
|
+
- `scorecard.json`
|
|
61
|
+
|
|
62
|
+
重要持久化字段:
|
|
63
|
+
|
|
64
|
+
- `outputQuality`
|
|
65
|
+
- `qualityReasons`
|
|
66
|
+
- `validation`
|
|
67
|
+
- `nextRunRecommendation`
|
|
68
|
+
- `failureClassification`
|
|
69
|
+
- `failureSource`
|
|
70
|
+
- `recommendedNextAction`
|
|
71
|
+
|
|
72
|
+
每个 stage 的 carry-forward 产物:
|
|
73
|
+
|
|
74
|
+
- `checkpoint-summary.md`
|
|
75
|
+
|
|
76
|
+
下一轮 continuation 应优先读取 `checkpoint-summary.md`,只有在不够用时才退回到完整的 `decision.md` 或 `handoff.json`。
|
|
77
|
+
|
|
78
|
+
## 失败分类
|
|
79
|
+
|
|
80
|
+
只能使用其中一个:
|
|
81
|
+
|
|
82
|
+
- `workflow bug`:编排逻辑、产物布局、CLI、validation、持久化问题
|
|
83
|
+
- `agent behavior issue`:workflow prompt / contract 正确,但 agent 输出质量或格式漂移
|
|
84
|
+
- `environment issue`:二进制缺失、权限、文件系统、PATH、runtime 访问问题
|
|
85
|
+
- `sample-spec issue`:spec 本身有问题,或暴露了不应在当前里程碑修的 sample-side / product-side 缺口
|
|
86
|
+
|
|
87
|
+
## 复杂任务的最小 task contract
|
|
88
|
+
|
|
89
|
+
复杂 bugfix 和 feature spec 必须显式提供:
|
|
90
|
+
|
|
91
|
+
- `Goal`
|
|
92
|
+
- `In scope`
|
|
93
|
+
- `Out of scope`
|
|
94
|
+
- `Validation commands`
|
|
95
|
+
- `Expected artifacts`
|
|
96
|
+
|
|
97
|
+
如果这些字段缺失,或者仍然是占位内容,packaged skill 会直接拒绝启动 sprint。
|
|
98
|
+
|
|
99
|
+
## 执行范围限制
|
|
100
|
+
|
|
101
|
+
复杂 spec 可以额外定义:
|
|
102
|
+
|
|
103
|
+
- `maxFiles`
|
|
104
|
+
- `maxChecks`
|
|
105
|
+
- `maxDeliverables`
|
|
106
|
+
|
|
107
|
+
producer 在改代码前,应先在 worklog 里声明 `PLANNED_FILES`、`PLANNED_CHECKS` 和 `DELIVERABLES`。如果一轮会超出范围,就缩小这一轮,而不是强行把大改塞进一次执行。
|
|
108
|
+
|
|
109
|
+
## 同步规则
|
|
110
|
+
|
|
111
|
+
事实来源仍然是:
|
|
112
|
+
|
|
113
|
+
- 仓库中位于 `packages/openclaw-plugin/templates/langs/zh/skills/ai-sprint-orchestration` 的副本
|
|
114
|
+
|
|
115
|
+
只有当变更影响以下内容时,才同步 packaged copy:
|
|
116
|
+
|
|
117
|
+
- package-local CLI 行为
|
|
118
|
+
- validation 行为
|
|
119
|
+
- 产物布局
|
|
120
|
+
- package-local references 或 runtime 假设
|
|
121
|
+
|
|
122
|
+
不要盲目镜像所有上游 orchestrator 修改。
|
|
123
|
+
|
|
124
|
+
## 下一阶段架构方向
|
|
125
|
+
|
|
126
|
+
这个 package 现在已经支持更细粒度的 `work-unit` 上下文约束。关键 work-unit 字段包括:
|
|
127
|
+
|
|
128
|
+
- `workUnitId`
|
|
129
|
+
- `workUnitGoal`
|
|
130
|
+
- `allowedFiles`
|
|
131
|
+
- `unitChecks`
|
|
132
|
+
- `unitDeliverables`
|
|
133
|
+
- `unitSummary`
|
|
134
|
+
- `carryForwardSummary`
|
|
135
|
+
|
|
136
|
+
continuation 默认优先读取更短的 `carryForwardSummary`,而不是回放整段历史 decision。目标是把跨 unit 传递的上下文压缩到最小必要信息,降低长运行过程里的上下文漂移。
|
|
@@ -0,0 +1,67 @@
|
|
|
1
|
+
---
|
|
2
|
+
name: ai-sprint-orchestration
|
|
3
|
+
description: 使用打包好的 AI 冲刺编排器推进多阶段开发任务,内置基线检查、工作流验证、失败分类和 workflow-only 迭代纪律。
|
|
4
|
+
---
|
|
5
|
+
|
|
6
|
+
# AI 冲刺编排
|
|
7
|
+
|
|
8
|
+
当任务较大、需要多阶段推进,或者大概率会经历多轮 review / continuation 时,使用这个 skill。
|
|
9
|
+
这个 skill 自带一份可直接运行的编排器打包副本,代理可以直接从当前 skill 目录启动,而不需要去仓库里寻找内部脚本入口。
|
|
10
|
+
|
|
11
|
+
## 适用场景
|
|
12
|
+
|
|
13
|
+
- 需要调研、实现、评审三段推进的复杂缺陷修复
|
|
14
|
+
- 需要显式 producer / reviewer 决策门控的功能开发
|
|
15
|
+
- 使用内置 validation spec 做 workflow 自检
|
|
16
|
+
- 需要产物持久化和可恢复能力的长时任务
|
|
17
|
+
|
|
18
|
+
## 不适用场景
|
|
19
|
+
|
|
20
|
+
- 很小的单文件修改或简单文档修补
|
|
21
|
+
- `packages/openclaw-plugin` 里的 product-side / sample-side 问题
|
|
22
|
+
- 需要修改 `D:/Code/openclaw` 的任务
|
|
23
|
+
- dashboard、stageGraph、自优化 sprint 或并行编排扩展
|
|
24
|
+
|
|
25
|
+
## 快速开始
|
|
26
|
+
|
|
27
|
+
在当前 skill 包根目录执行:
|
|
28
|
+
|
|
29
|
+
1. 先做 package 烟雾检查:
|
|
30
|
+
`node scripts/run.mjs --self-check`
|
|
31
|
+
`node scripts/run.mjs --help`
|
|
32
|
+
2. 再跑 package-local validation:
|
|
33
|
+
`node scripts/run.mjs --task workflow-validation-minimal`
|
|
34
|
+
`node scripts/run.mjs --task workflow-validation-minimal-verify`
|
|
35
|
+
3. 产物默认落在:
|
|
36
|
+
`runtime/`
|
|
37
|
+
|
|
38
|
+
内部 smoke 标准:
|
|
39
|
+
|
|
40
|
+
- `node scripts/run.mjs --self-check` 通过
|
|
41
|
+
- `workflow-validation-minimal` 至少推进到 producer 完成,并产出结构化 decision 或明确分类的 halt
|
|
42
|
+
- `workflow-validation-minimal-verify` 至少推进到 producer 完成,任何 reviewer 失败都必须被分类,不能保持不透明
|
|
43
|
+
|
|
44
|
+
如果你同时持有源码仓库,也可以额外运行仓库里 `packages/openclaw-plugin/templates/langs/zh/skills/ai-sprint-orchestration/test/` 的 source baseline tests。
|
|
45
|
+
|
|
46
|
+
## 执行规则
|
|
47
|
+
|
|
48
|
+
- 以仓库中的 `packages/openclaw-plugin/templates/langs/zh/skills/ai-sprint-orchestration` 作为代码事实来源;英文目录是分发镜像,不是独立实现分支。
|
|
49
|
+
- 如果一次运行失败,只能归类成以下四类之一:
|
|
50
|
+
- `workflow bug`
|
|
51
|
+
- `agent behavior issue`
|
|
52
|
+
- `environment issue`
|
|
53
|
+
- `sample-spec issue`
|
|
54
|
+
- 如果失败属于 product-side 或 sample-side,完成分类后立刻停止,不继续推进产品闭环修复。
|
|
55
|
+
- 每轮只修一个 workflow-only 问题,然后重跑 baseline 和 validation。
|
|
56
|
+
- 在新环境里第一次跑 validation 前,必须先执行 `node scripts/run.mjs --self-check`。
|
|
57
|
+
- 对复杂 bugfix / feature 任务,必须先复制模板 spec,填好最小 task contract,再启动 sprint。
|
|
58
|
+
|
|
59
|
+
## 输出要求
|
|
60
|
+
|
|
61
|
+
每轮只汇报:
|
|
62
|
+
|
|
63
|
+
- 改了什么
|
|
64
|
+
- 跑了什么
|
|
65
|
+
- 什么失败了
|
|
66
|
+
- 失败归类是什么
|
|
67
|
+
- 下一轮唯一推荐动作
|
|
@@ -0,0 +1,214 @@
|
|
|
1
|
+
{
|
|
2
|
+
"$schema": "agent-registry-v1",
|
|
3
|
+
"description": "Registry of available agents and their supported models for AI sprint orchestrator. All models are FREE. Updated: 2026-04-04.",
|
|
4
|
+
"lastUpdated": "2026-04-04",
|
|
5
|
+
|
|
6
|
+
"agents": {
|
|
7
|
+
"iflow": {
|
|
8
|
+
"command": "iflow --experimental-acp",
|
|
9
|
+
"description": "iFlow CLI with ACP support (智谱 Code Plan / MiniMax Code Plan 付费套餐更稳定,但以下模型全部免费)",
|
|
10
|
+
"version": "0.5.18",
|
|
11
|
+
"models": {
|
|
12
|
+
"glm-4.7": {
|
|
13
|
+
"description": "GLM-4.7 — official recommended model, fast",
|
|
14
|
+
"pricing": "free",
|
|
15
|
+
"recommendedTimeoutSeconds": 1200,
|
|
16
|
+
"features": ["recommended", "fast"],
|
|
17
|
+
"notes": "官方推荐模型,速度快"
|
|
18
|
+
},
|
|
19
|
+
"glm-5": {
|
|
20
|
+
"description": "GLM-5 — 744B parameters, long-context",
|
|
21
|
+
"pricing": "free",
|
|
22
|
+
"recommendedTimeoutSeconds": 1800,
|
|
23
|
+
"features": ["slow", "needs-extra-time"],
|
|
24
|
+
"notes": "744B 参数,运行明显较慢。Review 任务超时必须 ≥ 1800s"
|
|
25
|
+
},
|
|
26
|
+
"qwen3-coder-plus": {
|
|
27
|
+
"description": "Qwen3-Coder-Plus — efficient coding model",
|
|
28
|
+
"pricing": "free",
|
|
29
|
+
"recommendedTimeoutSeconds": 1200,
|
|
30
|
+
"features": ["fast", "coding-optimized"],
|
|
31
|
+
"notes": "通义编码模型"
|
|
32
|
+
},
|
|
33
|
+
"deepseek-v3.2": {
|
|
34
|
+
"description": "DeepSeek V3.2",
|
|
35
|
+
"pricing": "free",
|
|
36
|
+
"recommendedTimeoutSeconds": 1200,
|
|
37
|
+
"features": ["fast"],
|
|
38
|
+
"notes": ""
|
|
39
|
+
},
|
|
40
|
+
"minimax-m2.5": {
|
|
41
|
+
"description": "MiniMax M2.5",
|
|
42
|
+
"pricing": "free",
|
|
43
|
+
"recommendedTimeoutSeconds": 1200,
|
|
44
|
+
"features": ["fast"],
|
|
45
|
+
"notes": ""
|
|
46
|
+
},
|
|
47
|
+
"kimi-k2-thinking": {
|
|
48
|
+
"description": "Kimi K2 Thinking",
|
|
49
|
+
"pricing": "free",
|
|
50
|
+
"recommendedTimeoutSeconds": 1800,
|
|
51
|
+
"features": ["reasoning"],
|
|
52
|
+
"notes": "推理型模型"
|
|
53
|
+
},
|
|
54
|
+
"kimi-k2.5": {
|
|
55
|
+
"description": "Kimi K2.5",
|
|
56
|
+
"pricing": "free",
|
|
57
|
+
"recommendedTimeoutSeconds": 1200,
|
|
58
|
+
"features": ["fast"],
|
|
59
|
+
"notes": ""
|
|
60
|
+
},
|
|
61
|
+
"kimi-k2-0905": {
|
|
62
|
+
"description": "Kimi K2 0905",
|
|
63
|
+
"pricing": "free",
|
|
64
|
+
"recommendedTimeoutSeconds": 1200,
|
|
65
|
+
"features": ["fast"],
|
|
66
|
+
"notes": ""
|
|
67
|
+
},
|
|
68
|
+
"iflow-rome-30ba3b": {
|
|
69
|
+
"description": "iFlow ROME 30BA3B",
|
|
70
|
+
"pricing": "free",
|
|
71
|
+
"recommendedTimeoutSeconds": 1200,
|
|
72
|
+
"features": ["preview"],
|
|
73
|
+
"notes": "预览版本"
|
|
74
|
+
}
|
|
75
|
+
}
|
|
76
|
+
},
|
|
77
|
+
|
|
78
|
+
"opencode": {
|
|
79
|
+
"command": "npx -y opencode-ai acp",
|
|
80
|
+
"description": "OpenCode ACP adapter",
|
|
81
|
+
"version": "1.3.13",
|
|
82
|
+
"models": {
|
|
83
|
+
"minimax-cn-coding-plan/MiniMax-M2.7": {
|
|
84
|
+
"description": "MiniMax M2.7 (Chinese coding plan)",
|
|
85
|
+
"pricing": "free",
|
|
86
|
+
"recommendedTimeoutSeconds": 1200,
|
|
87
|
+
"features": ["fast", "coding-optimized", "stable"],
|
|
88
|
+
"notes": "最稳定的模型,默认 producer 选择"
|
|
89
|
+
},
|
|
90
|
+
"minimax-cn-coding-plan/MiniMax-M2.5": {
|
|
91
|
+
"description": "MiniMax M2.5 (Chinese coding plan)",
|
|
92
|
+
"pricing": "free",
|
|
93
|
+
"recommendedTimeoutSeconds": 1200,
|
|
94
|
+
"features": ["fast", "coding-optimized"],
|
|
95
|
+
"notes": "能力略弱于 M2.7"
|
|
96
|
+
},
|
|
97
|
+
"minimax-cn-coding-plan/MiniMax-M2.7-highspeed": {
|
|
98
|
+
"description": "MiniMax M2.7 highspeed variant",
|
|
99
|
+
"pricing": "free",
|
|
100
|
+
"recommendedTimeoutSeconds": 900,
|
|
101
|
+
"features": ["fast", "highspeed"],
|
|
102
|
+
"notes": "高速变体"
|
|
103
|
+
},
|
|
104
|
+
"minimax-cn-coding-plan/MiniMax-M2": {
|
|
105
|
+
"description": "MiniMax M2 (Chinese coding plan)",
|
|
106
|
+
"pricing": "free",
|
|
107
|
+
"recommendedTimeoutSeconds": 1200,
|
|
108
|
+
"features": ["fast"],
|
|
109
|
+
"notes": "旧版本"
|
|
110
|
+
},
|
|
111
|
+
"minimax-cn-coding-plan/MiniMax-M2.1": {
|
|
112
|
+
"description": "MiniMax M2.1 (Chinese coding plan)",
|
|
113
|
+
"pricing": "free",
|
|
114
|
+
"recommendedTimeoutSeconds": 1200,
|
|
115
|
+
"features": ["fast"],
|
|
116
|
+
"notes": "旧版本"
|
|
117
|
+
}
|
|
118
|
+
}
|
|
119
|
+
},
|
|
120
|
+
|
|
121
|
+
"gemini": {
|
|
122
|
+
"command": "gemini --acp",
|
|
123
|
+
"description": "Gemini CLI with ACP support (全部免费)",
|
|
124
|
+
"models": {
|
|
125
|
+
"gemini-2.5-pro": {
|
|
126
|
+
"description": "Gemini 2.5 Pro — high reasoning capability",
|
|
127
|
+
"pricing": "free",
|
|
128
|
+
"recommendedTimeoutSeconds": 1800,
|
|
129
|
+
"features": ["high-reasoning"],
|
|
130
|
+
"notes": "高推理能力"
|
|
131
|
+
},
|
|
132
|
+
"gemini-2.5-flash": {
|
|
133
|
+
"description": "Gemini 2.5 Flash — fast response",
|
|
134
|
+
"pricing": "free",
|
|
135
|
+
"recommendedTimeoutSeconds": 1200,
|
|
136
|
+
"features": ["fast"],
|
|
137
|
+
"notes": "快速响应"
|
|
138
|
+
},
|
|
139
|
+
"gemini-2.5-flash-lite": {
|
|
140
|
+
"description": "Gemini 2.5 Flash Lite — lightweight",
|
|
141
|
+
"pricing": "free",
|
|
142
|
+
"recommendedTimeoutSeconds": 900,
|
|
143
|
+
"features": ["fast", "lite"],
|
|
144
|
+
"notes": "轻量版本"
|
|
145
|
+
},
|
|
146
|
+
"gemini-3-pro-preview": {
|
|
147
|
+
"description": "Gemini 3 Pro Preview — high reasoning, limited quota",
|
|
148
|
+
"pricing": "free",
|
|
149
|
+
"recommendedTimeoutSeconds": 1800,
|
|
150
|
+
"features": ["high-reasoning", "slow", "limited-quota"],
|
|
151
|
+
"notes": "高推理,但额度有限、很慢"
|
|
152
|
+
},
|
|
153
|
+
"gemini-3-flash-preview": {
|
|
154
|
+
"description": "Gemini 3 Flash Preview",
|
|
155
|
+
"pricing": "free",
|
|
156
|
+
"recommendedTimeoutSeconds": 1200,
|
|
157
|
+
"features": ["fast", "preview"],
|
|
158
|
+
"notes": "预览版本"
|
|
159
|
+
},
|
|
160
|
+
"gemini-3.1-pro-preview": {
|
|
161
|
+
"description": "Gemini 3.1 Pro Preview — high reasoning, limited quota",
|
|
162
|
+
"pricing": "free",
|
|
163
|
+
"recommendedTimeoutSeconds": 1800,
|
|
164
|
+
"features": ["high-reasoning", "slow", "limited-quota"],
|
|
165
|
+
"notes": "高推理,但额度有限、很慢"
|
|
166
|
+
},
|
|
167
|
+
"gemini-3.1-flash-lite-preview": {
|
|
168
|
+
"description": "Gemini 3.1 Flash Lite Preview — lightweight preview",
|
|
169
|
+
"pricing": "free",
|
|
170
|
+
"recommendedTimeoutSeconds": 900,
|
|
171
|
+
"features": ["fast", "lite", "preview"],
|
|
172
|
+
"notes": "轻量预览版本"
|
|
173
|
+
}
|
|
174
|
+
}
|
|
175
|
+
},
|
|
176
|
+
|
|
177
|
+
"qwen": {
|
|
178
|
+
"command": "qwen --acp",
|
|
179
|
+
"description": "Qwen Code CLI with ACP support (全部免费)",
|
|
180
|
+
"models": {
|
|
181
|
+
"qwen3.6-plus": {
|
|
182
|
+
"description": "Qwen 3.6 Plus — efficient hybrid model with leading coding performance, 1M context window",
|
|
183
|
+
"pricing": "free",
|
|
184
|
+
"recommendedTimeoutSeconds": 1200,
|
|
185
|
+
"features": ["fast", "coding-optimized", "long-context"],
|
|
186
|
+
"notes": "高效混合模型,领先编码性能,100 万 token 上下文窗口"
|
|
187
|
+
}
|
|
188
|
+
}
|
|
189
|
+
},
|
|
190
|
+
|
|
191
|
+
"claude": {
|
|
192
|
+
"command": "claude",
|
|
193
|
+
"description": "Claude Code (Anthropic)",
|
|
194
|
+
"version": "2.1.81",
|
|
195
|
+
"models": {
|
|
196
|
+
"GLM-5.1": {
|
|
197
|
+
"description": "GLM-5.1 via Claude Code adapter",
|
|
198
|
+
"pricing": "free",
|
|
199
|
+
"recommendedTimeoutSeconds": 1800,
|
|
200
|
+
"features": ["slow"],
|
|
201
|
+
"notes": "保留给 escalation/global-reviewer 角色。注意:智谱 Code Plan 限额较高,容易触发限流"
|
|
202
|
+
}
|
|
203
|
+
}
|
|
204
|
+
}
|
|
205
|
+
},
|
|
206
|
+
|
|
207
|
+
"_notes": {
|
|
208
|
+
"paid_plans": "智谱 Code Plan 和 MiniMax Code Plan 是付费套餐,但本 registry 只登记免费可用的模型。付费套餐更稳定但不改变模型列表。",
|
|
209
|
+
"codex": "codex-acp 在当前环境无法使用,不登记。",
|
|
210
|
+
"kilocode": "kilocode ACP 是 server 模式(监听端口),不是 headless prompt-response,不兼容 acpx,不登记。",
|
|
211
|
+
"qodercli": "qodercli 没有 --acp 标志,不登记。",
|
|
212
|
+
"model_discovery": "opencode 可通过 'opencode models' 自动列出模型。其他 agent(iflow, gemini, qwen)没有 CLI 列表命令,需手动维护。"
|
|
213
|
+
}
|
|
214
|
+
}
|
|
@@ -0,0 +1,107 @@
|
|
|
1
|
+
{
|
|
2
|
+
"id": "bugfix-complex-template",
|
|
3
|
+
"title": "Complex Bugfix Template - Replace before use",
|
|
4
|
+
"workspace": "__SKILL_PACKAGE_ROOT__",
|
|
5
|
+
"branchWorkspace": "__SKILL_PACKAGE_ROOT__",
|
|
6
|
+
"branch": "main",
|
|
7
|
+
"requiresTaskContract": true,
|
|
8
|
+
"taskContract": {
|
|
9
|
+
"goal": "<describe the bug to fix and the expected behavior after the fix>",
|
|
10
|
+
"inScope": [
|
|
11
|
+
"<target modules or files that may be changed>"
|
|
12
|
+
],
|
|
13
|
+
"outOfScope": [
|
|
14
|
+
"<forbidden modules, unrelated refactors, product-side gaps>"
|
|
15
|
+
],
|
|
16
|
+
"validationCommands": [
|
|
17
|
+
"<command 1>",
|
|
18
|
+
"<command 2>"
|
|
19
|
+
],
|
|
20
|
+
"expectedArtifacts": [
|
|
21
|
+
"decision.md",
|
|
22
|
+
"scorecard.json",
|
|
23
|
+
"<optional task-specific artifact>"
|
|
24
|
+
]
|
|
25
|
+
},
|
|
26
|
+
"executionScope": {
|
|
27
|
+
"maxFiles": 6,
|
|
28
|
+
"maxChecks": 4,
|
|
29
|
+
"maxDeliverables": 3
|
|
30
|
+
},
|
|
31
|
+
"maxRoundsPerStage": 2,
|
|
32
|
+
"maxRuntimeMinutes": 60,
|
|
33
|
+
"stageTimeoutMinutes": 15,
|
|
34
|
+
"stages": ["investigate", "implement-pass-1", "verify"],
|
|
35
|
+
"producer": {
|
|
36
|
+
"agent": "iflow",
|
|
37
|
+
"model": "glm-4.7",
|
|
38
|
+
"timeoutSeconds": 180
|
|
39
|
+
},
|
|
40
|
+
"reviewerA": {
|
|
41
|
+
"agent": "iflow",
|
|
42
|
+
"model": "glm-4.7",
|
|
43
|
+
"timeoutSeconds": 120,
|
|
44
|
+
"focus": "Validate root cause, behavioral change, and code correctness."
|
|
45
|
+
},
|
|
46
|
+
"reviewerB": {
|
|
47
|
+
"agent": "iflow",
|
|
48
|
+
"model": "glm-4.7",
|
|
49
|
+
"timeoutSeconds": 120,
|
|
50
|
+
"focus": "Validate scope control, verification quality, and regression risk."
|
|
51
|
+
},
|
|
52
|
+
"context": [
|
|
53
|
+
"This is a generic complex bugfix sprint template.",
|
|
54
|
+
"Replace all placeholder contract values before running.",
|
|
55
|
+
"Use this template only for workflow-contained bugfix work, not for product-side closure in out-of-scope repositories."
|
|
56
|
+
],
|
|
57
|
+
"stageGoals": {
|
|
58
|
+
"investigate": [
|
|
59
|
+
"Establish the most likely root cause.",
|
|
60
|
+
"Narrow the allowed file set and verification plan.",
|
|
61
|
+
"Produce a bugfix plan that fits one bounded implementation round."
|
|
62
|
+
],
|
|
63
|
+
"implement-pass-1": [
|
|
64
|
+
"Implement the smallest sufficient bugfix within the declared scope.",
|
|
65
|
+
"Run the planned verification commands.",
|
|
66
|
+
"Record evidence that the observed behavior changed."
|
|
67
|
+
],
|
|
68
|
+
"verify": [
|
|
69
|
+
"Verify the fix changed the intended behavior.",
|
|
70
|
+
"Check whether any regression risk remains unverified.",
|
|
71
|
+
"Decide whether the bugfix is ready to stop, continue, or revise."
|
|
72
|
+
]
|
|
73
|
+
},
|
|
74
|
+
"stageCriteria": {
|
|
75
|
+
"investigate": {
|
|
76
|
+
"requiredApprovals": 2,
|
|
77
|
+
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS"],
|
|
78
|
+
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
79
|
+
"scoringDimensions": ["root_cause_quality", "scope_definition"],
|
|
80
|
+
"dimensionThreshold": 3,
|
|
81
|
+
"requiredDeliverables": ["root_cause_hypothesis", "execution_plan", "verification_plan"]
|
|
82
|
+
},
|
|
83
|
+
"implement-pass-1": {
|
|
84
|
+
"requiredApprovals": 2,
|
|
85
|
+
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS", "CONTRACT"],
|
|
86
|
+
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
87
|
+
"scoringDimensions": ["behavior_change", "verification_quality", "scope_control"],
|
|
88
|
+
"dimensionThreshold": 3,
|
|
89
|
+
"requiredDeliverables": ["code_change", "verification_evidence", "risk_summary"]
|
|
90
|
+
},
|
|
91
|
+
"verify": {
|
|
92
|
+
"requiredApprovals": 2,
|
|
93
|
+
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS"],
|
|
94
|
+
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
95
|
+
"scoringDimensions": ["artifact_verification", "residual_risk"],
|
|
96
|
+
"dimensionThreshold": 3,
|
|
97
|
+
"requiredDeliverables": ["verified_behavior_change", "residual_risk_assessment"]
|
|
98
|
+
}
|
|
99
|
+
},
|
|
100
|
+
"stageRoleTimeouts": {
|
|
101
|
+
"investigate": { "producer": 180, "reviewer_a": 120, "reviewer_b": 120 },
|
|
102
|
+
"implement-pass-1": { "producer": 240, "reviewer_a": 120, "reviewer_b": 120 },
|
|
103
|
+
"verify": { "producer": 120, "reviewer_a": 90, "reviewer_b": 90 }
|
|
104
|
+
},
|
|
105
|
+
"continuationSpec": null,
|
|
106
|
+
"recoverySpec": null
|
|
107
|
+
}
|