principles-disciple 1.80.0 → 1.82.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/openclaw.plugin.json +1 -1
- package/package.json +1 -1
- package/src/commands/strategy.ts +0 -18
- package/src/i18n/commands.ts +0 -12
- package/src/index.ts +47 -22
- package/src/service/correction-observer-service.ts +200 -0
- package/src/service/evolution-worker.ts +2 -123
- package/templates/langs/en/core/BOOTSTRAP.md +4 -18
- package/templates/langs/en/skills/bootstrap-tools/SKILL.md +1 -1
- package/templates/langs/en/skills/init-strategy/SKILL.md +1 -1
- package/templates/langs/en/skills/pd-mentor/SKILL.md +8 -23
- package/templates/langs/zh/core/BOOTSTRAP.md +2 -15
- package/templates/langs/zh/skills/bootstrap-tools/SKILL.md +1 -1
- package/templates/langs/zh/skills/init-strategy/SKILL.md +1 -1
- package/templates/langs/zh/skills/pd-mentor/SKILL.md +7 -22
- package/tests/commands/strategy.test.ts +3 -18
- package/tests/service/correction-observer-service.test.ts +331 -0
- package/tests/service/evolution-worker.correction-observer.test.ts +41 -164
- package/templates/langs/en/skills/ai-sprint-orchestration/EXAMPLES.md +0 -63
- package/templates/langs/en/skills/ai-sprint-orchestration/REFERENCE.md +0 -136
- package/templates/langs/en/skills/ai-sprint-orchestration/SKILL.md +0 -67
- package/templates/langs/en/skills/ai-sprint-orchestration/references/agent-registry.json +0 -143
- package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +0 -107
- package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +0 -107
- package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +0 -95
- package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +0 -98
- package/templates/langs/en/skills/ai-sprint-orchestration/references/workflow-v1-acceptance-checklist.md +0 -58
- package/templates/langs/en/skills/ai-sprint-orchestration/references/workflow-v1.4-work-unit-handoff.md +0 -190
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/archive.mjs +0 -310
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/contract-enforcement.mjs +0 -683
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/decision.mjs +0 -604
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/state-store.mjs +0 -32
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/task-specs.mjs +0 -707
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/run.mjs +0 -3455
- package/templates/langs/en/skills/evolve-system/SKILL.md +0 -46
- package/templates/langs/en/skills/manage-okr/SKILL.md +0 -96
- package/templates/langs/en/skills/pd-daily/SKILL.md +0 -199
- package/templates/langs/en/skills/pd-grooming/SKILL.md +0 -46
- package/templates/langs/zh/skills/ai-sprint-orchestration/EXAMPLES.md +0 -63
- package/templates/langs/zh/skills/ai-sprint-orchestration/REFERENCE.md +0 -136
- package/templates/langs/zh/skills/ai-sprint-orchestration/SKILL.md +0 -67
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/agent-registry.json +0 -143
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +0 -107
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +0 -107
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/nocturnal-trinity-quality-enhancement.json +0 -111
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +0 -95
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +0 -98
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/workflow-v1-acceptance-checklist.md +0 -58
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/workflow-v1.4-work-unit-handoff.md +0 -190
- package/templates/langs/zh/skills/ai-sprint-orchestration/runtime/.gitignore +0 -2
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/archive.mjs +0 -310
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/contract-enforcement.mjs +0 -683
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/decision.mjs +0 -604
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/state-store.mjs +0 -32
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/task-specs.mjs +0 -707
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/run.mjs +0 -3455
- package/templates/langs/zh/skills/ai-sprint-orchestration/test/archive.test.mjs +0 -230
- package/templates/langs/zh/skills/ai-sprint-orchestration/test/contract-enforcement.test.mjs +0 -672
- package/templates/langs/zh/skills/ai-sprint-orchestration/test/decision.test.mjs +0 -1321
- package/templates/langs/zh/skills/ai-sprint-orchestration/test/run.test.mjs +0 -1435
- package/templates/langs/zh/skills/evolve-system/SKILL.md +0 -46
- package/templates/langs/zh/skills/manage-okr/SKILL.md +0 -109
- package/templates/langs/zh/skills/pd-daily/SKILL.md +0 -283
- package/templates/langs/zh/skills/pd-grooming/SKILL.md +0 -46
|
@@ -1,143 +0,0 @@
|
|
|
1
|
-
{
|
|
2
|
-
"$schema": "agent-registry-v1",
|
|
3
|
-
"description": "Registry of available agents and their supported models for AI sprint orchestrator. All models are FREE. Updated: 2026-04-04.",
|
|
4
|
-
"lastUpdated": "2026-04-04",
|
|
5
|
-
|
|
6
|
-
"agents": {
|
|
7
|
-
"opencode": {
|
|
8
|
-
"command": "npx -y opencode-ai acp",
|
|
9
|
-
"description": "OpenCode ACP adapter",
|
|
10
|
-
"version": "1.3.13",
|
|
11
|
-
"models": {
|
|
12
|
-
"minimax-cn-coding-plan/MiniMax-M2.7": {
|
|
13
|
-
"description": "MiniMax M2.7 (Chinese coding plan)",
|
|
14
|
-
"pricing": "free",
|
|
15
|
-
"recommendedTimeoutSeconds": 1200,
|
|
16
|
-
"features": ["fast", "coding-optimized", "stable"],
|
|
17
|
-
"notes": "最稳定的模型,默认 producer 选择"
|
|
18
|
-
},
|
|
19
|
-
"minimax-cn-coding-plan/MiniMax-M2.5": {
|
|
20
|
-
"description": "MiniMax M2.5 (Chinese coding plan)",
|
|
21
|
-
"pricing": "free",
|
|
22
|
-
"recommendedTimeoutSeconds": 1200,
|
|
23
|
-
"features": ["fast", "coding-optimized"],
|
|
24
|
-
"notes": "能力略弱于 M2.7"
|
|
25
|
-
},
|
|
26
|
-
"minimax-cn-coding-plan/MiniMax-M2.7-highspeed": {
|
|
27
|
-
"description": "MiniMax M2.7 highspeed variant",
|
|
28
|
-
"pricing": "free",
|
|
29
|
-
"recommendedTimeoutSeconds": 900,
|
|
30
|
-
"features": ["fast", "highspeed"],
|
|
31
|
-
"notes": "高速变体"
|
|
32
|
-
},
|
|
33
|
-
"minimax-cn-coding-plan/MiniMax-M2": {
|
|
34
|
-
"description": "MiniMax M2 (Chinese coding plan)",
|
|
35
|
-
"pricing": "free",
|
|
36
|
-
"recommendedTimeoutSeconds": 1200,
|
|
37
|
-
"features": ["fast"],
|
|
38
|
-
"notes": "旧版本"
|
|
39
|
-
},
|
|
40
|
-
"minimax-cn-coding-plan/MiniMax-M2.1": {
|
|
41
|
-
"description": "MiniMax M2.1 (Chinese coding plan)",
|
|
42
|
-
"pricing": "free",
|
|
43
|
-
"recommendedTimeoutSeconds": 1200,
|
|
44
|
-
"features": ["fast"],
|
|
45
|
-
"notes": "旧版本"
|
|
46
|
-
}
|
|
47
|
-
}
|
|
48
|
-
},
|
|
49
|
-
|
|
50
|
-
"gemini": {
|
|
51
|
-
"command": "gemini --acp",
|
|
52
|
-
"description": "Gemini CLI with ACP support (全部免费)",
|
|
53
|
-
"models": {
|
|
54
|
-
"gemini-2.5-pro": {
|
|
55
|
-
"description": "Gemini 2.5 Pro — high reasoning capability",
|
|
56
|
-
"pricing": "free",
|
|
57
|
-
"recommendedTimeoutSeconds": 1800,
|
|
58
|
-
"features": ["high-reasoning"],
|
|
59
|
-
"notes": "高推理能力"
|
|
60
|
-
},
|
|
61
|
-
"gemini-2.5-flash": {
|
|
62
|
-
"description": "Gemini 2.5 Flash — fast response",
|
|
63
|
-
"pricing": "free",
|
|
64
|
-
"recommendedTimeoutSeconds": 1200,
|
|
65
|
-
"features": ["fast"],
|
|
66
|
-
"notes": "快速响应"
|
|
67
|
-
},
|
|
68
|
-
"gemini-2.5-flash-lite": {
|
|
69
|
-
"description": "Gemini 2.5 Flash Lite — lightweight",
|
|
70
|
-
"pricing": "free",
|
|
71
|
-
"recommendedTimeoutSeconds": 900,
|
|
72
|
-
"features": ["fast", "lite"],
|
|
73
|
-
"notes": "轻量版本"
|
|
74
|
-
},
|
|
75
|
-
"gemini-3-pro-preview": {
|
|
76
|
-
"description": "Gemini 3 Pro Preview — high reasoning, limited quota",
|
|
77
|
-
"pricing": "free",
|
|
78
|
-
"recommendedTimeoutSeconds": 1800,
|
|
79
|
-
"features": ["high-reasoning", "slow", "limited-quota"],
|
|
80
|
-
"notes": "高推理,但额度有限、很慢"
|
|
81
|
-
},
|
|
82
|
-
"gemini-3-flash-preview": {
|
|
83
|
-
"description": "Gemini 3 Flash Preview",
|
|
84
|
-
"pricing": "free",
|
|
85
|
-
"recommendedTimeoutSeconds": 1200,
|
|
86
|
-
"features": ["fast", "preview"],
|
|
87
|
-
"notes": "预览版本"
|
|
88
|
-
},
|
|
89
|
-
"gemini-3.1-pro-preview": {
|
|
90
|
-
"description": "Gemini 3.1 Pro Preview — high reasoning, limited quota",
|
|
91
|
-
"pricing": "free",
|
|
92
|
-
"recommendedTimeoutSeconds": 1800,
|
|
93
|
-
"features": ["high-reasoning", "slow", "limited-quota"],
|
|
94
|
-
"notes": "高推理,但额度有限、很慢"
|
|
95
|
-
},
|
|
96
|
-
"gemini-3.1-flash-lite-preview": {
|
|
97
|
-
"description": "Gemini 3.1 Flash Lite Preview — lightweight preview",
|
|
98
|
-
"pricing": "free",
|
|
99
|
-
"recommendedTimeoutSeconds": 900,
|
|
100
|
-
"features": ["fast", "lite", "preview"],
|
|
101
|
-
"notes": "轻量预览版本"
|
|
102
|
-
}
|
|
103
|
-
}
|
|
104
|
-
},
|
|
105
|
-
|
|
106
|
-
"qwen": {
|
|
107
|
-
"command": "qwen --acp",
|
|
108
|
-
"description": "Qwen Code CLI with ACP support (全部免费)",
|
|
109
|
-
"models": {
|
|
110
|
-
"qwen3.6-plus": {
|
|
111
|
-
"description": "Qwen 3.6 Plus — efficient hybrid model with leading coding performance, 1M context window",
|
|
112
|
-
"pricing": "free",
|
|
113
|
-
"recommendedTimeoutSeconds": 1200,
|
|
114
|
-
"features": ["fast", "coding-optimized", "long-context"],
|
|
115
|
-
"notes": "高效混合模型,领先编码性能,100 万 token 上下文窗口"
|
|
116
|
-
}
|
|
117
|
-
}
|
|
118
|
-
},
|
|
119
|
-
|
|
120
|
-
"claude": {
|
|
121
|
-
"command": "claude",
|
|
122
|
-
"description": "Claude Code (Anthropic)",
|
|
123
|
-
"version": "2.1.81",
|
|
124
|
-
"models": {
|
|
125
|
-
"GLM-5.1": {
|
|
126
|
-
"description": "GLM-5.1 via Claude Code adapter",
|
|
127
|
-
"pricing": "free",
|
|
128
|
-
"recommendedTimeoutSeconds": 1800,
|
|
129
|
-
"features": ["slow"],
|
|
130
|
-
"notes": "保留给 escalation/global-reviewer 角色。注意:智谱 Code Plan 限额较高,容易触发限流"
|
|
131
|
-
}
|
|
132
|
-
}
|
|
133
|
-
}
|
|
134
|
-
},
|
|
135
|
-
|
|
136
|
-
"_notes": {
|
|
137
|
-
"paid_plans": "智谱 Code Plan 和 MiniMax Code Plan 是付费套餐,但本 registry 只登记免费可用的模型。付费套餐更稳定但不改变模型列表。",
|
|
138
|
-
"codex": "codex-acp 在当前环境无法使用,不登记。",
|
|
139
|
-
"kilocode": "kilocode ACP 是 server 模式(监听端口),不是 headless prompt-response,不兼容 acpx,不登记。",
|
|
140
|
-
"qodercli": "qodercli 没有 --acp 标志,不登记。",
|
|
141
|
-
"model_discovery": "opencode 可通过 'opencode models' 自动列出模型。其他 agent(gemini, qwen)没有 CLI 列表命令,需手动维护。"
|
|
142
|
-
}
|
|
143
|
-
}
|
|
@@ -1,107 +0,0 @@
|
|
|
1
|
-
{
|
|
2
|
-
"id": "bugfix-complex-template",
|
|
3
|
-
"title": "Complex Bugfix Template - Replace before use",
|
|
4
|
-
"workspace": "__SKILL_PACKAGE_ROOT__",
|
|
5
|
-
"branchWorkspace": "__SKILL_PACKAGE_ROOT__",
|
|
6
|
-
"branch": "main",
|
|
7
|
-
"requiresTaskContract": true,
|
|
8
|
-
"taskContract": {
|
|
9
|
-
"goal": "<describe the bug to fix and the expected behavior after the fix>",
|
|
10
|
-
"inScope": [
|
|
11
|
-
"<target modules or files that may be changed>"
|
|
12
|
-
],
|
|
13
|
-
"outOfScope": [
|
|
14
|
-
"<forbidden modules, unrelated refactors, product-side gaps>"
|
|
15
|
-
],
|
|
16
|
-
"validationCommands": [
|
|
17
|
-
"<command 1>",
|
|
18
|
-
"<command 2>"
|
|
19
|
-
],
|
|
20
|
-
"expectedArtifacts": [
|
|
21
|
-
"decision.md",
|
|
22
|
-
"scorecard.json",
|
|
23
|
-
"<optional task-specific artifact>"
|
|
24
|
-
]
|
|
25
|
-
},
|
|
26
|
-
"executionScope": {
|
|
27
|
-
"maxFiles": 6,
|
|
28
|
-
"maxChecks": 4,
|
|
29
|
-
"maxDeliverables": 3
|
|
30
|
-
},
|
|
31
|
-
"maxRoundsPerStage": 2,
|
|
32
|
-
"maxRuntimeMinutes": 60,
|
|
33
|
-
"stageTimeoutMinutes": 15,
|
|
34
|
-
"stages": ["investigate", "implement-pass-1", "verify"],
|
|
35
|
-
"producer": {
|
|
36
|
-
"agent": "opencode",
|
|
37
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
38
|
-
"timeoutSeconds": 180
|
|
39
|
-
},
|
|
40
|
-
"reviewerA": {
|
|
41
|
-
"agent": "opencode",
|
|
42
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
43
|
-
"timeoutSeconds": 120,
|
|
44
|
-
"focus": "Validate root cause, behavioral change, and code correctness."
|
|
45
|
-
},
|
|
46
|
-
"reviewerB": {
|
|
47
|
-
"agent": "opencode",
|
|
48
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
49
|
-
"timeoutSeconds": 120,
|
|
50
|
-
"focus": "Validate scope control, verification quality, and regression risk."
|
|
51
|
-
},
|
|
52
|
-
"context": [
|
|
53
|
-
"This is a generic complex bugfix sprint template.",
|
|
54
|
-
"Replace all placeholder contract values before running.",
|
|
55
|
-
"Use this template only for workflow-contained bugfix work, not for product-side closure in out-of-scope repositories."
|
|
56
|
-
],
|
|
57
|
-
"stageGoals": {
|
|
58
|
-
"investigate": [
|
|
59
|
-
"Establish the most likely root cause.",
|
|
60
|
-
"Narrow the allowed file set and verification plan.",
|
|
61
|
-
"Produce a bugfix plan that fits one bounded implementation round."
|
|
62
|
-
],
|
|
63
|
-
"implement-pass-1": [
|
|
64
|
-
"Implement the smallest sufficient bugfix within the declared scope.",
|
|
65
|
-
"Run the planned verification commands.",
|
|
66
|
-
"Record evidence that the observed behavior changed."
|
|
67
|
-
],
|
|
68
|
-
"verify": [
|
|
69
|
-
"Verify the fix changed the intended behavior.",
|
|
70
|
-
"Check whether any regression risk remains unverified.",
|
|
71
|
-
"Decide whether the bugfix is ready to stop, continue, or revise."
|
|
72
|
-
]
|
|
73
|
-
},
|
|
74
|
-
"stageCriteria": {
|
|
75
|
-
"investigate": {
|
|
76
|
-
"requiredApprovals": 2,
|
|
77
|
-
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS"],
|
|
78
|
-
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
79
|
-
"scoringDimensions": ["root_cause_quality", "scope_definition"],
|
|
80
|
-
"dimensionThreshold": 3,
|
|
81
|
-
"requiredDeliverables": ["root_cause_hypothesis", "execution_plan", "verification_plan"]
|
|
82
|
-
},
|
|
83
|
-
"implement-pass-1": {
|
|
84
|
-
"requiredApprovals": 2,
|
|
85
|
-
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS", "CONTRACT"],
|
|
86
|
-
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
87
|
-
"scoringDimensions": ["behavior_change", "verification_quality", "scope_control"],
|
|
88
|
-
"dimensionThreshold": 3,
|
|
89
|
-
"requiredDeliverables": ["code_change", "verification_evidence", "risk_summary"]
|
|
90
|
-
},
|
|
91
|
-
"verify": {
|
|
92
|
-
"requiredApprovals": 2,
|
|
93
|
-
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS"],
|
|
94
|
-
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
95
|
-
"scoringDimensions": ["artifact_verification", "residual_risk"],
|
|
96
|
-
"dimensionThreshold": 3,
|
|
97
|
-
"requiredDeliverables": ["verified_behavior_change", "residual_risk_assessment"]
|
|
98
|
-
}
|
|
99
|
-
},
|
|
100
|
-
"stageRoleTimeouts": {
|
|
101
|
-
"investigate": { "producer": 180, "reviewer_a": 120, "reviewer_b": 120 },
|
|
102
|
-
"implement-pass-1": { "producer": 240, "reviewer_a": 120, "reviewer_b": 120 },
|
|
103
|
-
"verify": { "producer": 120, "reviewer_a": 90, "reviewer_b": 90 }
|
|
104
|
-
},
|
|
105
|
-
"continuationSpec": null,
|
|
106
|
-
"recoverySpec": null
|
|
107
|
-
}
|
|
@@ -1,107 +0,0 @@
|
|
|
1
|
-
{
|
|
2
|
-
"id": "feature-complex-template",
|
|
3
|
-
"title": "Complex Feature Template - Replace before use",
|
|
4
|
-
"workspace": "__SKILL_PACKAGE_ROOT__",
|
|
5
|
-
"branchWorkspace": "__SKILL_PACKAGE_ROOT__",
|
|
6
|
-
"branch": "main",
|
|
7
|
-
"requiresTaskContract": true,
|
|
8
|
-
"taskContract": {
|
|
9
|
-
"goal": "<describe the feature to implement and the user-visible behavior>",
|
|
10
|
-
"inScope": [
|
|
11
|
-
"<allowed modules or files>"
|
|
12
|
-
],
|
|
13
|
-
"outOfScope": [
|
|
14
|
-
"<forbidden scope, unrelated refactors, external product-side work>"
|
|
15
|
-
],
|
|
16
|
-
"validationCommands": [
|
|
17
|
-
"<command 1>",
|
|
18
|
-
"<command 2>"
|
|
19
|
-
],
|
|
20
|
-
"expectedArtifacts": [
|
|
21
|
-
"decision.md",
|
|
22
|
-
"scorecard.json",
|
|
23
|
-
"<optional feature artifact>"
|
|
24
|
-
]
|
|
25
|
-
},
|
|
26
|
-
"executionScope": {
|
|
27
|
-
"maxFiles": 8,
|
|
28
|
-
"maxChecks": 5,
|
|
29
|
-
"maxDeliverables": 4
|
|
30
|
-
},
|
|
31
|
-
"maxRoundsPerStage": 2,
|
|
32
|
-
"maxRuntimeMinutes": 75,
|
|
33
|
-
"stageTimeoutMinutes": 20,
|
|
34
|
-
"stages": ["investigate", "implement-pass-1", "verify"],
|
|
35
|
-
"producer": {
|
|
36
|
-
"agent": "opencode",
|
|
37
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
38
|
-
"timeoutSeconds": 240
|
|
39
|
-
},
|
|
40
|
-
"reviewerA": {
|
|
41
|
-
"agent": "opencode",
|
|
42
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
43
|
-
"timeoutSeconds": 120,
|
|
44
|
-
"focus": "Validate feature behavior, acceptance criteria coverage, and architecture fit."
|
|
45
|
-
},
|
|
46
|
-
"reviewerB": {
|
|
47
|
-
"agent": "opencode",
|
|
48
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
49
|
-
"timeoutSeconds": 120,
|
|
50
|
-
"focus": "Validate implementation scope, verification evidence, and regression risk."
|
|
51
|
-
},
|
|
52
|
-
"context": [
|
|
53
|
-
"This is a generic complex feature sprint template.",
|
|
54
|
-
"Replace all placeholder contract values before running.",
|
|
55
|
-
"Use it for bounded feature delivery with explicit acceptance criteria and verification commands."
|
|
56
|
-
],
|
|
57
|
-
"stageGoals": {
|
|
58
|
-
"investigate": [
|
|
59
|
-
"Clarify feature scope and constraints.",
|
|
60
|
-
"Identify the smallest valuable slice that can be implemented now.",
|
|
61
|
-
"Produce a verification plan aligned with acceptance criteria."
|
|
62
|
-
],
|
|
63
|
-
"implement-pass-1": [
|
|
64
|
-
"Implement the smallest valuable feature slice within the declared scope.",
|
|
65
|
-
"Run the planned verification commands.",
|
|
66
|
-
"Record evidence that the new behavior exists and is bounded."
|
|
67
|
-
],
|
|
68
|
-
"verify": [
|
|
69
|
-
"Verify the feature behaves as intended.",
|
|
70
|
-
"Check whether the acceptance criteria are actually covered by evidence.",
|
|
71
|
-
"Decide whether the feature is ready, needs continuation, or revise."
|
|
72
|
-
]
|
|
73
|
-
},
|
|
74
|
-
"stageCriteria": {
|
|
75
|
-
"investigate": {
|
|
76
|
-
"requiredApprovals": 2,
|
|
77
|
-
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS"],
|
|
78
|
-
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
79
|
-
"scoringDimensions": ["scope_definition", "acceptance_alignment"],
|
|
80
|
-
"dimensionThreshold": 3,
|
|
81
|
-
"requiredDeliverables": ["feature_slice", "acceptance_plan", "verification_plan"]
|
|
82
|
-
},
|
|
83
|
-
"implement-pass-1": {
|
|
84
|
-
"requiredApprovals": 2,
|
|
85
|
-
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS", "CONTRACT"],
|
|
86
|
-
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
87
|
-
"scoringDimensions": ["behavior_delivery", "verification_quality", "scope_control"],
|
|
88
|
-
"dimensionThreshold": 3,
|
|
89
|
-
"requiredDeliverables": ["feature_implementation", "evidence_of_behavior", "risk_summary"]
|
|
90
|
-
},
|
|
91
|
-
"verify": {
|
|
92
|
-
"requiredApprovals": 2,
|
|
93
|
-
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS"],
|
|
94
|
-
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
95
|
-
"scoringDimensions": ["artifact_verification", "acceptance_coverage"],
|
|
96
|
-
"dimensionThreshold": 3,
|
|
97
|
-
"requiredDeliverables": ["acceptance_verified", "residual_risk_assessment"]
|
|
98
|
-
}
|
|
99
|
-
},
|
|
100
|
-
"stageRoleTimeouts": {
|
|
101
|
-
"investigate": { "producer": 180, "reviewer_a": 120, "reviewer_b": 120 },
|
|
102
|
-
"implement-pass-1": { "producer": 300, "reviewer_a": 120, "reviewer_b": 120 },
|
|
103
|
-
"verify": { "producer": 120, "reviewer_a": 90, "reviewer_b": 90 }
|
|
104
|
-
},
|
|
105
|
-
"continuationSpec": null,
|
|
106
|
-
"recoverySpec": null
|
|
107
|
-
}
|
|
@@ -1,111 +0,0 @@
|
|
|
1
|
-
{
|
|
2
|
-
"id": "nocturnal-trinity-quality-enhancement",
|
|
3
|
-
"title": "Enhance nocturnal Trinity prompt quality",
|
|
4
|
-
"description": "Enhance nocturnal Trinity prompt quality — add Dreamer perspective diversity constraints and Scribe rejected-decision analysis",
|
|
5
|
-
"workspace": "/home/csuzngjh/code/principles",
|
|
6
|
-
"branch": "fix/bugs-231-228",
|
|
7
|
-
"requiresTaskContract": true,
|
|
8
|
-
"maxRoundsPerStage": 2,
|
|
9
|
-
"maxRuntimeMinutes": 60,
|
|
10
|
-
"stages": [
|
|
11
|
-
"investigate",
|
|
12
|
-
"implement-pass-1",
|
|
13
|
-
"verify"
|
|
14
|
-
],
|
|
15
|
-
"taskContract": {
|
|
16
|
-
"goal": "Improve nocturnal Trinity output quality by adding perspective diversity to Dreamer and rejected-decision analysis to Scribe",
|
|
17
|
-
"inScope": [
|
|
18
|
-
"nocturnal-trinity.ts prompt modifications",
|
|
19
|
-
"nocturnal-trinity.test.ts assertion updates",
|
|
20
|
-
"nocturnal-arbiter.ts compatibility verification"
|
|
21
|
-
],
|
|
22
|
-
"outOfScope": [
|
|
23
|
-
"Runtime or infrastructure changes",
|
|
24
|
-
"New file creation",
|
|
25
|
-
"Non-Trinity prompt changes"
|
|
26
|
-
],
|
|
27
|
-
"validationCommands": [
|
|
28
|
-
"npx vitest run packages/openclaw-plugin/tests/core/nocturnal --reporter=verbose"
|
|
29
|
-
],
|
|
30
|
-
"expectedArtifacts": [
|
|
31
|
-
"packages/openclaw-plugin/src/core/nocturnal-trinity.ts"
|
|
32
|
-
]
|
|
33
|
-
},
|
|
34
|
-
"producer": {
|
|
35
|
-
"agent": "opencode",
|
|
36
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
37
|
-
"timeoutSeconds": 1800
|
|
38
|
-
},
|
|
39
|
-
"reviewerA": {
|
|
40
|
-
"agent": "opencode",
|
|
41
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
42
|
-
"timeoutSeconds": 1200,
|
|
43
|
-
"role": "code-quality",
|
|
44
|
-
"focus": "Verify prompt changes are minimal, backward-compatible, and don't break existing arbiter validation"
|
|
45
|
-
},
|
|
46
|
-
"reviewerB": {
|
|
47
|
-
"agent": "opencode",
|
|
48
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
49
|
-
"timeoutSeconds": 1200,
|
|
50
|
-
"role": "functional-correctness",
|
|
51
|
-
"focus": "Verify tests pass and the new prompt constraints produce structurally valid Trinity output"
|
|
52
|
-
},
|
|
53
|
-
"escalationReviewer": {
|
|
54
|
-
"agent": "opencode",
|
|
55
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
56
|
-
"timeoutSeconds": 1800
|
|
57
|
-
},
|
|
58
|
-
"stageGoals": {
|
|
59
|
-
"investigate": [
|
|
60
|
-
"Read nocturnal-trinity.ts lines 64-298 (all three prompts) and nocturnal-trinity.test.ts",
|
|
61
|
-
"Identify exact insertion points for Dreamer diversity section and Scribe analysis section",
|
|
62
|
-
"List all test assertions that reference prompt content",
|
|
63
|
-
"Report findings in producer.md"
|
|
64
|
-
],
|
|
65
|
-
"implement-pass-1": [
|
|
66
|
-
"Apply Dreamer perspective diversity constraints to NOCTURNAL_DREAMER_PROMPT",
|
|
67
|
-
"Apply Scribe rejected-decision analysis to NOCTURNAL_SCRIBE_PROMPT",
|
|
68
|
-
"Update test assertions in nocturnal-trinity.test.ts if needed",
|
|
69
|
-
"Run nocturnal-trinity and nocturnal-arbiter tests to verify no breakage"
|
|
70
|
-
],
|
|
71
|
-
"verify": [
|
|
72
|
-
"Run full nocturnal test suite: npx vitest run packages/openclaw-plugin/tests/core/nocturnal --reporter=verbose",
|
|
73
|
-
"Verify all tests pass with 0 failures",
|
|
74
|
-
"Confirm arbiter validation is unchanged",
|
|
75
|
-
"Confirm no new files were created"
|
|
76
|
-
]
|
|
77
|
-
},
|
|
78
|
-
"stageCriteria": {
|
|
79
|
-
"investigate": {
|
|
80
|
-
"scoringDimensions": [
|
|
81
|
-
"completeness",
|
|
82
|
-
"accuracy"
|
|
83
|
-
],
|
|
84
|
-
"dimensionThreshold": 3,
|
|
85
|
-
"requiredDeliverables": [
|
|
86
|
-
"producer.md"
|
|
87
|
-
]
|
|
88
|
-
},
|
|
89
|
-
"implement-pass-1": {
|
|
90
|
-
"scoringDimensions": [
|
|
91
|
-
"correctness",
|
|
92
|
-
"completeness"
|
|
93
|
-
],
|
|
94
|
-
"dimensionThreshold": 3,
|
|
95
|
-
"requiredDeliverables": [
|
|
96
|
-
"producer.md",
|
|
97
|
-
"reviewer-a.md",
|
|
98
|
-
"reviewer-b.md"
|
|
99
|
-
]
|
|
100
|
-
},
|
|
101
|
-
"verify": {
|
|
102
|
-
"scoringDimensions": [
|
|
103
|
-
"correctness"
|
|
104
|
-
],
|
|
105
|
-
"dimensionThreshold": 3,
|
|
106
|
-
"requiredDeliverables": [
|
|
107
|
-
"producer.md"
|
|
108
|
-
]
|
|
109
|
-
}
|
|
110
|
-
}
|
|
111
|
-
}
|
|
@@ -1,95 +0,0 @@
|
|
|
1
|
-
{
|
|
2
|
-
"id": "workflow-validation-minimal-verify",
|
|
3
|
-
"title": "Verify: Workflow v1 infrastructure validation",
|
|
4
|
-
"workspace": "__SKILL_PACKAGE_ROOT__",
|
|
5
|
-
"branchWorkspace": "__SKILL_PACKAGE_ROOT__",
|
|
6
|
-
"branch": "main",
|
|
7
|
-
"integrationPhase": "shadow",
|
|
8
|
-
"maxRoundsPerStage": 1,
|
|
9
|
-
"maxRuntimeMinutes": 15,
|
|
10
|
-
"stageTimeoutMinutes": 5,
|
|
11
|
-
"stages": ["verify"],
|
|
12
|
-
"producer": {
|
|
13
|
-
"agent": "opencode",
|
|
14
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
15
|
-
"timeoutSeconds": 90
|
|
16
|
-
},
|
|
17
|
-
"reviewerA": {
|
|
18
|
-
"agent": "opencode",
|
|
19
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
20
|
-
"timeoutSeconds": 45,
|
|
21
|
-
"role": "artifact_checker",
|
|
22
|
-
"focus": "Verify decision.md and scorecard.json contain expected fields"
|
|
23
|
-
},
|
|
24
|
-
"reviewerB": {
|
|
25
|
-
"agent": "opencode",
|
|
26
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
27
|
-
"timeoutSeconds": 45,
|
|
28
|
-
"role": "recommendation_checker",
|
|
29
|
-
"focus": "Verify nextRunRecommendation is computed and reasonable"
|
|
30
|
-
},
|
|
31
|
-
"context": [
|
|
32
|
-
"=== VERIFY RUN ===",
|
|
33
|
-
"This run verifies the output of workflow-validation-minimal sprint.",
|
|
34
|
-
"",
|
|
35
|
-
"=== VERIFICATION CHECKLIST ===",
|
|
36
|
-
"1. Check sprint directory exists under runtime/runs/<run-id>/",
|
|
37
|
-
"2. Check decision.md exists and contains:",
|
|
38
|
-
" - Outcome: (advance|revise|halt)",
|
|
39
|
-
" - outputQuality: (shadow_complete|production_ready|needs_work)",
|
|
40
|
-
" - qualityReasons: (list of strings)",
|
|
41
|
-
"3. Check scorecard.json exists and contains:",
|
|
42
|
-
" - outputQuality field",
|
|
43
|
-
" - qualityReasons array",
|
|
44
|
-
" - validation object with errorSummary",
|
|
45
|
-
"4. Check nextRunRecommendation is recorded if outputQuality != production_ready",
|
|
46
|
-
"",
|
|
47
|
-
"=== PRODUCER TASK ===",
|
|
48
|
-
"Read the sprint directory from the previous run and report findings.",
|
|
49
|
-
"Use the run-id provided in the stage brief."
|
|
50
|
-
],
|
|
51
|
-
"stageGoals": {
|
|
52
|
-
"verify": [
|
|
53
|
-
"Verify previous run produced valid artifacts.",
|
|
54
|
-
"Confirm outputQuality was persisted correctly.",
|
|
55
|
-
"Confirm nextRunRecommendation was computed."
|
|
56
|
-
]
|
|
57
|
-
},
|
|
58
|
-
"workUnits": {
|
|
59
|
-
"verify": [
|
|
60
|
-
{
|
|
61
|
-
"workUnitId": "verify-artifact-slice",
|
|
62
|
-
"workUnitGoal": "Verify the prior validation run using compact artifact-focused context.",
|
|
63
|
-
"allowedFiles": [
|
|
64
|
-
"runtime/runs",
|
|
65
|
-
"scripts/run.mjs",
|
|
66
|
-
"references/specs/workflow-validation-minimal-verify.json"
|
|
67
|
-
],
|
|
68
|
-
"unitChecks": [
|
|
69
|
-
"node scripts/run.mjs --task workflow-validation-minimal"
|
|
70
|
-
],
|
|
71
|
-
"unitDeliverables": [
|
|
72
|
-
"artifacts verified",
|
|
73
|
-
"fields checked"
|
|
74
|
-
],
|
|
75
|
-
"unitSummary": "Verify persisted workflow artifacts without reopening broad stage history.",
|
|
76
|
-
"carryForwardSummary": "Use prior run id and compact artifact checklist first; avoid long historical replay."
|
|
77
|
-
}
|
|
78
|
-
]
|
|
79
|
-
},
|
|
80
|
-
"stageCriteria": {
|
|
81
|
-
"verify": {
|
|
82
|
-
"requiredApprovals": 2,
|
|
83
|
-
"requiredProducerSections": ["SUMMARY", "EVIDENCE", "CODE_EVIDENCE", "CHECKS"],
|
|
84
|
-
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "NEXT_FOCUS", "CHECKS"],
|
|
85
|
-
"scoringDimensions": ["artifact_verification", "field_correctness"],
|
|
86
|
-
"dimensionThreshold": 3,
|
|
87
|
-
"requiredDeliverables": ["artifacts_verified", "fields_correct"]
|
|
88
|
-
}
|
|
89
|
-
},
|
|
90
|
-
"stageRoleTimeouts": {
|
|
91
|
-
"verify": { "producer": 90, "reviewer_a": 45, "reviewer_b": 45 }
|
|
92
|
-
},
|
|
93
|
-
"continuationSpec": null,
|
|
94
|
-
"recoverySpec": null
|
|
95
|
-
}
|
|
@@ -1,98 +0,0 @@
|
|
|
1
|
-
{
|
|
2
|
-
"id": "workflow-validation-minimal",
|
|
3
|
-
"title": "Workflow v1 Minimal Validation - Test workflow infrastructure without product binding",
|
|
4
|
-
"workspace": "__SKILL_PACKAGE_ROOT__",
|
|
5
|
-
"branchWorkspace": "__SKILL_PACKAGE_ROOT__",
|
|
6
|
-
"branch": "main",
|
|
7
|
-
"integrationPhase": "shadow",
|
|
8
|
-
"maxRoundsPerStage": 2,
|
|
9
|
-
"maxRuntimeMinutes": 20,
|
|
10
|
-
"stageTimeoutMinutes": 4,
|
|
11
|
-
"stages": ["validate"],
|
|
12
|
-
"producer": {
|
|
13
|
-
"agent": "opencode",
|
|
14
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
15
|
-
"timeoutSeconds": 90
|
|
16
|
-
},
|
|
17
|
-
"reviewerA": {
|
|
18
|
-
"agent": "opencode",
|
|
19
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
20
|
-
"timeoutSeconds": 45,
|
|
21
|
-
"role": "schema_checker",
|
|
22
|
-
"focus": "Verify report has all required sections, VERDICT format, DIMENSIONS format"
|
|
23
|
-
},
|
|
24
|
-
"reviewerB": {
|
|
25
|
-
"agent": "opencode",
|
|
26
|
-
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
27
|
-
"timeoutSeconds": 45,
|
|
28
|
-
"role": "quality_checker",
|
|
29
|
-
"focus": "Verify outputQuality is computed correctly, qualityReasons are meaningful"
|
|
30
|
-
},
|
|
31
|
-
"context": [
|
|
32
|
-
"=== WORKFLOW VALIDATION SPRINT ===",
|
|
33
|
-
"This sprint validates the workflow infrastructure itself, NOT any product feature.",
|
|
34
|
-
"",
|
|
35
|
-
"=== VALIDATION GOALS ===",
|
|
36
|
-
"1. Producer produces a valid report with all required sections",
|
|
37
|
-
"2. Reviewers produce valid reports with VERDICT, DIMENSIONS",
|
|
38
|
-
"3. Orchestrator computes outputQuality correctly",
|
|
39
|
-
"4. outputQuality and qualityReasons are persisted to decision.md and scorecard.json",
|
|
40
|
-
"5. nextRunRecommendation is computed and recorded",
|
|
41
|
-
"",
|
|
42
|
-
"=== NO PRODUCT LOGIC ===",
|
|
43
|
-
"Producer task: List 3 files in packages/openclaw-plugin/templates/langs/zh/skills/ai-sprint-orchestration/scripts/ and describe their purpose.",
|
|
44
|
-
"This is intentionally trivial - we are testing the workflow package, not any product task.",
|
|
45
|
-
"",
|
|
46
|
-
"=== SUCCESS CRITERIA FOR THIS RUN ===",
|
|
47
|
-
"- No halt due to workflow infrastructure issues (timeout handling, file I/O, validation)",
|
|
48
|
-
"- decision.md contains outputQuality field",
|
|
49
|
-
"- scorecard.json contains outputQuality and qualityReasons",
|
|
50
|
-
"- If outputQuality is shadow_complete, nextRunRecommendation suggests CONTINUATION or VERIFY"
|
|
51
|
-
],
|
|
52
|
-
"stageGoals": {
|
|
53
|
-
"validate": [
|
|
54
|
-
"Produce a minimal valid producer report.",
|
|
55
|
-
"Reviewers verify schema compliance.",
|
|
56
|
-
"Orchestrator computes and persists outputQuality."
|
|
57
|
-
]
|
|
58
|
-
},
|
|
59
|
-
"workUnits": {
|
|
60
|
-
"validate": [
|
|
61
|
-
{
|
|
62
|
-
"workUnitId": "validate-contract-slice",
|
|
63
|
-
"workUnitGoal": "Validate the minimal workflow package using a single compact work unit.",
|
|
64
|
-
"allowedFiles": [
|
|
65
|
-
"scripts/run.mjs",
|
|
66
|
-
"scripts/lib/task-specs.mjs",
|
|
67
|
-
"references/specs/workflow-validation-minimal.json"
|
|
68
|
-
],
|
|
69
|
-
"unitChecks": [
|
|
70
|
-
"node scripts/run.mjs --self-check"
|
|
71
|
-
],
|
|
72
|
-
"unitDeliverables": [
|
|
73
|
-
"producer report drafted",
|
|
74
|
-
"self-check executed"
|
|
75
|
-
],
|
|
76
|
-
"unitSummary": "Use one small work unit to validate package workflow behavior.",
|
|
77
|
-
"carryForwardSummary": "Prefer compact workflow-only context. Do not expand into product-side closure."
|
|
78
|
-
}
|
|
79
|
-
]
|
|
80
|
-
},
|
|
81
|
-
"stageCriteria": {
|
|
82
|
-
"validate": {
|
|
83
|
-
"requiredApprovals": 2,
|
|
84
|
-
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS"],
|
|
85
|
-
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
86
|
-
"scoringDimensions": ["schema_compliance", "report_completeness"],
|
|
87
|
-
"dimensionThreshold": 3,
|
|
88
|
-
"requiredDeliverables": ["producer_report_complete", "self_check_passed"]
|
|
89
|
-
}
|
|
90
|
-
},
|
|
91
|
-
"stageRoleTimeouts": {
|
|
92
|
-
"validate": { "producer": 60, "reviewer_a": 45, "reviewer_b": 45 }
|
|
93
|
-
},
|
|
94
|
-
"verificationSpec": "workflow-validation-minimal-verify",
|
|
95
|
-
"continuationSpec": null,
|
|
96
|
-
"recoverySpec": null,
|
|
97
|
-
"requireVerify": false
|
|
98
|
-
}
|