principles-disciple 1.8.2 → 1.8.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/openclaw.plugin.json +4 -4
- package/package.json +1 -1
- package/templates/langs/en/skills/ai-sprint-orchestration/EXAMPLES.md +63 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/REFERENCE.md +136 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/SKILL.md +67 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/agent-registry.json +214 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +107 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +107 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +105 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +108 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/workflow-v1-acceptance-checklist.md +58 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/references/workflow-v1.4-work-unit-handoff.md +190 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/runtime/.gitignore +2 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/archive.mjs +310 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/contract-enforcement.mjs +683 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/decision.mjs +604 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/state-store.mjs +32 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/lib/task-specs.mjs +707 -0
- package/templates/langs/en/skills/ai-sprint-orchestration/scripts/run.mjs +3419 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/EXAMPLES.md +63 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/REFERENCE.md +136 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/SKILL.md +67 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/agent-registry.json +214 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +107 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +107 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +105 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +108 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/workflow-v1-acceptance-checklist.md +58 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/references/workflow-v1.4-work-unit-handoff.md +190 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/runtime/.gitignore +2 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/archive.mjs +310 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/contract-enforcement.mjs +683 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/decision.mjs +604 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/state-store.mjs +32 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/lib/task-specs.mjs +707 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/run.mjs +3419 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/test/archive.test.mjs +230 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/test/contract-enforcement.test.mjs +672 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/test/decision.test.mjs +1321 -0
- package/templates/langs/zh/skills/ai-sprint-orchestration/test/run.test.mjs +1419 -0
|
@@ -0,0 +1,107 @@
|
|
|
1
|
+
{
|
|
2
|
+
"id": "feature-complex-template",
|
|
3
|
+
"title": "Complex Feature Template - Replace before use",
|
|
4
|
+
"workspace": "__SKILL_PACKAGE_ROOT__",
|
|
5
|
+
"branchWorkspace": "__SKILL_PACKAGE_ROOT__",
|
|
6
|
+
"branch": "main",
|
|
7
|
+
"requiresTaskContract": true,
|
|
8
|
+
"taskContract": {
|
|
9
|
+
"goal": "<describe the feature to implement and the user-visible behavior>",
|
|
10
|
+
"inScope": [
|
|
11
|
+
"<allowed modules or files>"
|
|
12
|
+
],
|
|
13
|
+
"outOfScope": [
|
|
14
|
+
"<forbidden scope, unrelated refactors, external product-side work>"
|
|
15
|
+
],
|
|
16
|
+
"validationCommands": [
|
|
17
|
+
"<command 1>",
|
|
18
|
+
"<command 2>"
|
|
19
|
+
],
|
|
20
|
+
"expectedArtifacts": [
|
|
21
|
+
"decision.md",
|
|
22
|
+
"scorecard.json",
|
|
23
|
+
"<optional feature artifact>"
|
|
24
|
+
]
|
|
25
|
+
},
|
|
26
|
+
"executionScope": {
|
|
27
|
+
"maxFiles": 8,
|
|
28
|
+
"maxChecks": 5,
|
|
29
|
+
"maxDeliverables": 4
|
|
30
|
+
},
|
|
31
|
+
"maxRoundsPerStage": 2,
|
|
32
|
+
"maxRuntimeMinutes": 75,
|
|
33
|
+
"stageTimeoutMinutes": 20,
|
|
34
|
+
"stages": ["investigate", "implement-pass-1", "verify"],
|
|
35
|
+
"producer": {
|
|
36
|
+
"agent": "iflow",
|
|
37
|
+
"model": "glm-4.7",
|
|
38
|
+
"timeoutSeconds": 240
|
|
39
|
+
},
|
|
40
|
+
"reviewerA": {
|
|
41
|
+
"agent": "iflow",
|
|
42
|
+
"model": "glm-4.7",
|
|
43
|
+
"timeoutSeconds": 120,
|
|
44
|
+
"focus": "Validate feature behavior, acceptance criteria coverage, and architecture fit."
|
|
45
|
+
},
|
|
46
|
+
"reviewerB": {
|
|
47
|
+
"agent": "iflow",
|
|
48
|
+
"model": "glm-4.7",
|
|
49
|
+
"timeoutSeconds": 120,
|
|
50
|
+
"focus": "Validate implementation scope, verification evidence, and regression risk."
|
|
51
|
+
},
|
|
52
|
+
"context": [
|
|
53
|
+
"This is a generic complex feature sprint template.",
|
|
54
|
+
"Replace all placeholder contract values before running.",
|
|
55
|
+
"Use it for bounded feature delivery with explicit acceptance criteria and verification commands."
|
|
56
|
+
],
|
|
57
|
+
"stageGoals": {
|
|
58
|
+
"investigate": [
|
|
59
|
+
"Clarify feature scope and constraints.",
|
|
60
|
+
"Identify the smallest valuable slice that can be implemented now.",
|
|
61
|
+
"Produce a verification plan aligned with acceptance criteria."
|
|
62
|
+
],
|
|
63
|
+
"implement-pass-1": [
|
|
64
|
+
"Implement the smallest valuable feature slice within the declared scope.",
|
|
65
|
+
"Run the planned verification commands.",
|
|
66
|
+
"Record evidence that the new behavior exists and is bounded."
|
|
67
|
+
],
|
|
68
|
+
"verify": [
|
|
69
|
+
"Verify the feature behaves as intended.",
|
|
70
|
+
"Check whether the acceptance criteria are actually covered by evidence.",
|
|
71
|
+
"Decide whether the feature is ready, needs continuation, or needs revision."
|
|
72
|
+
]
|
|
73
|
+
},
|
|
74
|
+
"stageCriteria": {
|
|
75
|
+
"investigate": {
|
|
76
|
+
"requiredApprovals": 2,
|
|
77
|
+
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS"],
|
|
78
|
+
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
79
|
+
"scoringDimensions": ["scope_definition", "acceptance_alignment"],
|
|
80
|
+
"dimensionThreshold": 3,
|
|
81
|
+
"requiredDeliverables": ["feature_slice", "acceptance_plan", "verification_plan"]
|
|
82
|
+
},
|
|
83
|
+
"implement-pass-1": {
|
|
84
|
+
"requiredApprovals": 2,
|
|
85
|
+
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS", "CONTRACT"],
|
|
86
|
+
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
87
|
+
"scoringDimensions": ["behavior_delivery", "verification_quality", "scope_control"],
|
|
88
|
+
"dimensionThreshold": 3,
|
|
89
|
+
"requiredDeliverables": ["feature_implementation", "evidence_of_behavior", "risk_summary"]
|
|
90
|
+
},
|
|
91
|
+
"verify": {
|
|
92
|
+
"requiredApprovals": 2,
|
|
93
|
+
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS"],
|
|
94
|
+
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
95
|
+
"scoringDimensions": ["artifact_verification", "acceptance_coverage"],
|
|
96
|
+
"dimensionThreshold": 3,
|
|
97
|
+
"requiredDeliverables": ["acceptance_verified", "residual_risk_assessment"]
|
|
98
|
+
}
|
|
99
|
+
},
|
|
100
|
+
"stageRoleTimeouts": {
|
|
101
|
+
"investigate": { "producer": 180, "reviewer_a": 120, "reviewer_b": 120 },
|
|
102
|
+
"implement-pass-1": { "producer": 300, "reviewer_a": 120, "reviewer_b": 120 },
|
|
103
|
+
"verify": { "producer": 120, "reviewer_a": 90, "reviewer_b": 90 }
|
|
104
|
+
},
|
|
105
|
+
"continuationSpec": null,
|
|
106
|
+
"recoverySpec": null
|
|
107
|
+
}
|
|
@@ -0,0 +1,105 @@
|
|
|
1
|
+
{
|
|
2
|
+
"id": "workflow-validation-minimal-verify",
|
|
3
|
+
"title": "Verify: Workflow v1 infrastructure validation",
|
|
4
|
+
"workspace": "__SKILL_PACKAGE_ROOT__",
|
|
5
|
+
"branchWorkspace": "__SKILL_PACKAGE_ROOT__",
|
|
6
|
+
"branch": "main",
|
|
7
|
+
"integrationPhase": "shadow",
|
|
8
|
+
"maxRoundsPerStage": 1,
|
|
9
|
+
"maxRuntimeMinutes": 15,
|
|
10
|
+
"stageTimeoutMinutes": 5,
|
|
11
|
+
"stages": ["verify"],
|
|
12
|
+
"producer": {
|
|
13
|
+
"agent": "iflow",
|
|
14
|
+
"model": "glm-4.7",
|
|
15
|
+
"timeoutSeconds": 90
|
|
16
|
+
},
|
|
17
|
+
"reviewerA": {
|
|
18
|
+
"agent": "opencode",
|
|
19
|
+
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
20
|
+
"timeoutSeconds": 45,
|
|
21
|
+
"fallback": {
|
|
22
|
+
"agent": "iflow",
|
|
23
|
+
"model": "glm-4.7",
|
|
24
|
+
"timeoutSeconds": 75
|
|
25
|
+
},
|
|
26
|
+
"role": "artifact_checker",
|
|
27
|
+
"focus": "Verify decision.md and scorecard.json contain expected fields"
|
|
28
|
+
},
|
|
29
|
+
"reviewerB": {
|
|
30
|
+
"agent": "opencode",
|
|
31
|
+
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
32
|
+
"timeoutSeconds": 45,
|
|
33
|
+
"fallback": {
|
|
34
|
+
"agent": "iflow",
|
|
35
|
+
"model": "glm-4.7",
|
|
36
|
+
"timeoutSeconds": 75
|
|
37
|
+
},
|
|
38
|
+
"role": "recommendation_checker",
|
|
39
|
+
"focus": "Verify nextRunRecommendation is computed and reasonable"
|
|
40
|
+
},
|
|
41
|
+
"context": [
|
|
42
|
+
"=== VERIFY RUN ===",
|
|
43
|
+
"This run verifies the output of workflow-validation-minimal sprint.",
|
|
44
|
+
"",
|
|
45
|
+
"=== VERIFICATION CHECKLIST ===",
|
|
46
|
+
"1. Check sprint directory exists under runtime/runs/<run-id>/",
|
|
47
|
+
"2. Check decision.md exists and contains:",
|
|
48
|
+
" - Outcome: (advance|revise|halt)",
|
|
49
|
+
" - outputQuality: (shadow_complete|production_ready|needs_work)",
|
|
50
|
+
" - qualityReasons: (list of strings)",
|
|
51
|
+
"3. Check scorecard.json exists and contains:",
|
|
52
|
+
" - outputQuality field",
|
|
53
|
+
" - qualityReasons array",
|
|
54
|
+
" - validation object with errorSummary",
|
|
55
|
+
"4. Check nextRunRecommendation is recorded if outputQuality != production_ready",
|
|
56
|
+
"",
|
|
57
|
+
"=== PRODUCER TASK ===",
|
|
58
|
+
"Read the sprint directory from the previous run and report findings.",
|
|
59
|
+
"Use the run-id provided in the stage brief."
|
|
60
|
+
],
|
|
61
|
+
"stageGoals": {
|
|
62
|
+
"verify": [
|
|
63
|
+
"Verify previous run produced valid artifacts.",
|
|
64
|
+
"Confirm outputQuality was persisted correctly.",
|
|
65
|
+
"Confirm nextRunRecommendation was computed."
|
|
66
|
+
]
|
|
67
|
+
},
|
|
68
|
+
"workUnits": {
|
|
69
|
+
"verify": [
|
|
70
|
+
{
|
|
71
|
+
"workUnitId": "verify-artifact-slice",
|
|
72
|
+
"workUnitGoal": "Verify the prior validation run using compact artifact-focused context.",
|
|
73
|
+
"allowedFiles": [
|
|
74
|
+
"runtime/runs",
|
|
75
|
+
"scripts/run.mjs",
|
|
76
|
+
"references/specs/workflow-validation-minimal-verify.json"
|
|
77
|
+
],
|
|
78
|
+
"unitChecks": [
|
|
79
|
+
"node scripts/run.mjs --task workflow-validation-minimal"
|
|
80
|
+
],
|
|
81
|
+
"unitDeliverables": [
|
|
82
|
+
"artifacts verified",
|
|
83
|
+
"fields checked"
|
|
84
|
+
],
|
|
85
|
+
"unitSummary": "Verify persisted workflow artifacts without reopening broad stage history.",
|
|
86
|
+
"carryForwardSummary": "Use prior run id and compact artifact checklist first; avoid long historical replay."
|
|
87
|
+
}
|
|
88
|
+
]
|
|
89
|
+
},
|
|
90
|
+
"stageCriteria": {
|
|
91
|
+
"verify": {
|
|
92
|
+
"requiredApprovals": 2,
|
|
93
|
+
"requiredProducerSections": ["SUMMARY", "EVIDENCE", "CODE_EVIDENCE", "CHECKS"],
|
|
94
|
+
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "NEXT_FOCUS", "CHECKS"],
|
|
95
|
+
"scoringDimensions": ["artifact_verification", "field_correctness"],
|
|
96
|
+
"dimensionThreshold": 3,
|
|
97
|
+
"requiredDeliverables": ["artifacts_verified", "fields_correct"]
|
|
98
|
+
}
|
|
99
|
+
},
|
|
100
|
+
"stageRoleTimeouts": {
|
|
101
|
+
"verify": { "producer": 90, "reviewer_a": 45, "reviewer_b": 45 }
|
|
102
|
+
},
|
|
103
|
+
"continuationSpec": null,
|
|
104
|
+
"recoverySpec": null
|
|
105
|
+
}
|
|
@@ -0,0 +1,108 @@
|
|
|
1
|
+
{
|
|
2
|
+
"id": "workflow-validation-minimal",
|
|
3
|
+
"title": "Workflow v1 Minimal Validation - Test workflow infrastructure without product binding",
|
|
4
|
+
"workspace": "__SKILL_PACKAGE_ROOT__",
|
|
5
|
+
"branchWorkspace": "__SKILL_PACKAGE_ROOT__",
|
|
6
|
+
"branch": "main",
|
|
7
|
+
"integrationPhase": "shadow",
|
|
8
|
+
"maxRoundsPerStage": 2,
|
|
9
|
+
"maxRuntimeMinutes": 20,
|
|
10
|
+
"stageTimeoutMinutes": 4,
|
|
11
|
+
"stages": ["validate"],
|
|
12
|
+
"producer": {
|
|
13
|
+
"agent": "iflow",
|
|
14
|
+
"model": "glm-4.7",
|
|
15
|
+
"timeoutSeconds": 90
|
|
16
|
+
},
|
|
17
|
+
"reviewerA": {
|
|
18
|
+
"agent": "opencode",
|
|
19
|
+
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
20
|
+
"timeoutSeconds": 45,
|
|
21
|
+
"fallback": {
|
|
22
|
+
"agent": "iflow",
|
|
23
|
+
"model": "glm-4.7",
|
|
24
|
+
"timeoutSeconds": 75
|
|
25
|
+
},
|
|
26
|
+
"role": "schema_checker",
|
|
27
|
+
"focus": "Verify report has all required sections, VERDICT format, DIMENSIONS format"
|
|
28
|
+
},
|
|
29
|
+
"reviewerB": {
|
|
30
|
+
"agent": "opencode",
|
|
31
|
+
"model": "minimax-cn-coding-plan/MiniMax-M2.7",
|
|
32
|
+
"timeoutSeconds": 45,
|
|
33
|
+
"fallback": {
|
|
34
|
+
"agent": "iflow",
|
|
35
|
+
"model": "glm-4.7",
|
|
36
|
+
"timeoutSeconds": 75
|
|
37
|
+
},
|
|
38
|
+
"role": "quality_checker",
|
|
39
|
+
"focus": "Verify outputQuality is computed correctly, qualityReasons are meaningful"
|
|
40
|
+
},
|
|
41
|
+
"context": [
|
|
42
|
+
"=== WORKFLOW VALIDATION SPRINT ===",
|
|
43
|
+
"This sprint validates the workflow infrastructure itself, NOT any product feature.",
|
|
44
|
+
"",
|
|
45
|
+
"=== VALIDATION GOALS ===",
|
|
46
|
+
"1. Producer produces a valid report with all required sections",
|
|
47
|
+
"2. Reviewers produce valid reports with VERDICT, DIMENSIONS",
|
|
48
|
+
"3. Orchestrator computes outputQuality correctly",
|
|
49
|
+
"4. outputQuality and qualityReasons are persisted to decision.md and scorecard.json",
|
|
50
|
+
"5. nextRunRecommendation is computed and recorded",
|
|
51
|
+
"",
|
|
52
|
+
"=== NO PRODUCT LOGIC ===",
|
|
53
|
+
"Producer task: List 3 files in scripts/ (relative to the skill package root) and describe their purpose.",
|
|
54
|
+
"This is intentionally trivial - we are testing the workflow package, not any product task.",
|
|
55
|
+
"",
|
|
56
|
+
"=== SUCCESS CRITERIA FOR THIS RUN ===",
|
|
57
|
+
"- No halt due to workflow infrastructure issues (timeout handling, file I/O, validation)",
|
|
58
|
+
"- decision.md contains outputQuality field",
|
|
59
|
+
"- scorecard.json contains outputQuality and qualityReasons",
|
|
60
|
+
"- If outputQuality is shadow_complete, nextRunRecommendation suggests CONTINUATION or VERIFY"
|
|
61
|
+
],
|
|
62
|
+
"stageGoals": {
|
|
63
|
+
"validate": [
|
|
64
|
+
"Produce a minimal valid producer report.",
|
|
65
|
+
"Reviewers verify schema compliance.",
|
|
66
|
+
"Orchestrator computes and persists outputQuality."
|
|
67
|
+
]
|
|
68
|
+
},
|
|
69
|
+
"workUnits": {
|
|
70
|
+
"validate": [
|
|
71
|
+
{
|
|
72
|
+
"workUnitId": "validate-contract-slice",
|
|
73
|
+
"workUnitGoal": "Validate the minimal workflow package using a single compact work unit.",
|
|
74
|
+
"allowedFiles": [
|
|
75
|
+
"scripts/run.mjs",
|
|
76
|
+
"scripts/lib/task-specs.mjs",
|
|
77
|
+
"references/specs/workflow-validation-minimal.json"
|
|
78
|
+
],
|
|
79
|
+
"unitChecks": [
|
|
80
|
+
"node scripts/run.mjs --self-check"
|
|
81
|
+
],
|
|
82
|
+
"unitDeliverables": [
|
|
83
|
+
"producer report drafted",
|
|
84
|
+
"self-check executed"
|
|
85
|
+
],
|
|
86
|
+
"unitSummary": "Use one small work unit to validate package workflow behavior.",
|
|
87
|
+
"carryForwardSummary": "Prefer compact workflow-only context. Do not expand into product-side closure."
|
|
88
|
+
}
|
|
89
|
+
]
|
|
90
|
+
},
|
|
91
|
+
"stageCriteria": {
|
|
92
|
+
"validate": {
|
|
93
|
+
"requiredApprovals": 2,
|
|
94
|
+
"requiredProducerSections": ["SUMMARY", "CHANGES", "EVIDENCE", "CODE_EVIDENCE", "KEY_EVENTS", "HYPOTHESIS_MATRIX", "CHECKS", "OPEN_RISKS"],
|
|
95
|
+
"requiredReviewerSections": ["VERDICT", "BLOCKERS", "FINDINGS", "CODE_EVIDENCE", "HYPOTHESIS_MATRIX", "NEXT_FOCUS", "CHECKS"],
|
|
96
|
+
"scoringDimensions": ["schema_compliance", "report_completeness"],
|
|
97
|
+
"dimensionThreshold": 3,
|
|
98
|
+
"requiredDeliverables": ["producer_report_complete", "self_check_passed"]
|
|
99
|
+
}
|
|
100
|
+
},
|
|
101
|
+
"stageRoleTimeouts": {
|
|
102
|
+
"validate": { "producer": 60, "reviewer_a": 45, "reviewer_b": 45 }
|
|
103
|
+
},
|
|
104
|
+
"verificationSpec": "workflow-validation-minimal-verify",
|
|
105
|
+
"continuationSpec": null,
|
|
106
|
+
"recoverySpec": null,
|
|
107
|
+
"requireVerify": false
|
|
108
|
+
}
|
|
@@ -0,0 +1,58 @@
|
|
|
1
|
+
# Workflow v1 Acceptance Checklist
|
|
2
|
+
|
|
3
|
+
## Purpose
|
|
4
|
+
|
|
5
|
+
Use this checklist to validate that the packaged workflow is readable, executable, and safe to hand off to another agent.
|
|
6
|
+
|
|
7
|
+
## Acceptance gates
|
|
8
|
+
|
|
9
|
+
- [ ] Baseline tests are green
|
|
10
|
+
- [ ] `workflow-validation-minimal` completes and writes package-local artifacts
|
|
11
|
+
- [ ] `workflow-validation-minimal-verify` completes and validates the previous run
|
|
12
|
+
- [ ] Every failure is classified into the approved four-category taxonomy
|
|
13
|
+
|
|
14
|
+
## Commands
|
|
15
|
+
|
|
16
|
+
```powershell
|
|
17
|
+
node scripts/run.mjs --self-check
|
|
18
|
+
node scripts/run.mjs --help
|
|
19
|
+
node scripts/run.mjs --task workflow-validation-minimal
|
|
20
|
+
node scripts/run.mjs --task workflow-validation-minimal-verify
|
|
21
|
+
```
|
|
22
|
+
|
|
23
|
+
## Run result record
|
|
24
|
+
|
|
25
|
+
| Field | Value |
|
|
26
|
+
|------|------|
|
|
27
|
+
| runId | |
|
|
28
|
+
| outcome | |
|
|
29
|
+
| outputQuality | |
|
|
30
|
+
| validation | |
|
|
31
|
+
| nextRunRecommendation | |
|
|
32
|
+
| failure classification | |
|
|
33
|
+
|
|
34
|
+
## Required artifact checks
|
|
35
|
+
|
|
36
|
+
- `decision.md` contains `outputQuality`
|
|
37
|
+
- `decision.md` contains `qualityReasons`
|
|
38
|
+
- `decision.md` contains readable validation status
|
|
39
|
+
- `scorecard.json` contains `outputQuality`
|
|
40
|
+
- `scorecard.json` contains `qualityReasons`
|
|
41
|
+
- `scorecard.json` contains `validation`
|
|
42
|
+
- `scorecard.json` contains `nextRunRecommendation`
|
|
43
|
+
|
|
44
|
+
## Failure classification
|
|
45
|
+
|
|
46
|
+
- `workflow bug`
|
|
47
|
+
- `agent behavior issue`
|
|
48
|
+
- `environment issue`
|
|
49
|
+
- `sample-spec issue`
|
|
50
|
+
|
|
51
|
+
## Stop conditions
|
|
52
|
+
|
|
53
|
+
If the run exposes a sample-side or product-side issue:
|
|
54
|
+
|
|
55
|
+
- classify it
|
|
56
|
+
- record evidence
|
|
57
|
+
- stop the run review
|
|
58
|
+
- do not continue into product closure work
|
|
@@ -0,0 +1,190 @@
|
|
|
1
|
+
# Workflow v1.4 Work-Unit Upgrade Handoff
|
|
2
|
+
|
|
3
|
+
## Goal
|
|
4
|
+
|
|
5
|
+
Use the packaged `ai-sprint-orchestration` skill to implement the next architecture upgrade of the workflow itself.
|
|
6
|
+
|
|
7
|
+
This upgrade is **not** about product-side closure. It is about making the orchestrator better at long-running, high-value coding tasks by introducing a finer-grained execution model.
|
|
8
|
+
|
|
9
|
+
The target direction is:
|
|
10
|
+
|
|
11
|
+
- move from `stage -> producer/reviewer`
|
|
12
|
+
- toward `stage -> work units -> producer/reviewer/decision`
|
|
13
|
+
|
|
14
|
+
The key design goals are:
|
|
15
|
+
|
|
16
|
+
- smaller execution units
|
|
17
|
+
- explicit checkpointing
|
|
18
|
+
- forced context reload between units
|
|
19
|
+
- less long-context drift
|
|
20
|
+
|
|
21
|
+
## Current confirmed state
|
|
22
|
+
|
|
23
|
+
The packaged skill is already usable as an internal tool:
|
|
24
|
+
|
|
25
|
+
- package path (on the authoring machine; adjust to your own checkout):
|
|
26
|
+
- `D:/Code/principles/packages/openclaw-plugin/templates/langs/zh/skills/ai-sprint-orchestration`
|
|
27
|
+
- installed path (on the authoring machine; adjust to your own environment):
|
|
28
|
+
- `C:/Users/Administrator/.agents/skills/ai-sprint-orchestration`
|
|
29
|
+
- self-check works
|
|
30
|
+
- package-local validation runs work
|
|
31
|
+
- failure classification is persisted to:
|
|
32
|
+
- `latest-summary.md`
|
|
33
|
+
- `scorecard.json`
|
|
34
|
+
- complex task templates and minimum task contract already exist
|
|
35
|
+
|
|
36
|
+
Remaining instability is mostly:
|
|
37
|
+
|
|
38
|
+
- `agent behavior issue`
|
|
39
|
+
|
|
40
|
+
It is **not** primarily:
|
|
41
|
+
|
|
42
|
+
- pathing
|
|
43
|
+
- packaging
|
|
44
|
+
- runtime-root layout
|
|
45
|
+
- missing acceptance artifacts
|
|
46
|
+
|
|
47
|
+
## Why v1.4 is needed
|
|
48
|
+
|
|
49
|
+
The current workflow already externalizes state and can resume from artifacts, but its granularity is still too coarse for very complex tasks.
|
|
50
|
+
|
|
51
|
+
Today it mainly refreshes context at:
|
|
52
|
+
|
|
53
|
+
- stage level
|
|
54
|
+
- role level
|
|
55
|
+
- round level
|
|
56
|
+
|
|
57
|
+
That is useful, but not yet enough for difficult long-running work where one producer pass can still become too large, too noisy, or too drift-prone.
|
|
58
|
+
|
|
59
|
+
The next upgrade should add a smaller unit below stage:
|
|
60
|
+
|
|
61
|
+
- `workUnitId`
|
|
62
|
+
- `workUnitGoal`
|
|
63
|
+
- `allowedFiles`
|
|
64
|
+
- `unitChecks`
|
|
65
|
+
- `unitDeliverables`
|
|
66
|
+
- `unitSummary`
|
|
67
|
+
- `carryForwardSummary`
|
|
68
|
+
|
|
69
|
+
## Scope
|
|
70
|
+
|
|
71
|
+
### In scope
|
|
72
|
+
|
|
73
|
+
- `packages/openclaw-plugin/templates/langs/zh/skills/ai-sprint-orchestration`
|
|
74
|
+
- `packages/openclaw-plugin/templates/langs/en/skills/ai-sprint-orchestration`
|
|
75
|
+
- workflow docs, specs, prompts, state shape, and summary artifacts
|
|
76
|
+
- package-local validation and workflow-only tests
|
|
77
|
+
|
|
78
|
+
### Out of scope
|
|
79
|
+
|
|
80
|
+
- the rest of `packages/openclaw-plugin` (anything outside the two skill directories listed under "In scope")
|
|
81
|
+
- `D:/Code/openclaw`
|
|
82
|
+
- product-side/sample-side closure
|
|
83
|
+
- dashboard
|
|
84
|
+
- stageGraph
|
|
85
|
+
- self-optimizing sprint
|
|
86
|
+
- parallel orchestrator expansion
|
|
87
|
+
|
|
88
|
+
If validation or implementation exposes product-side or sample-side issues, classify them and stop. Do not drift back into product closure work.
|
|
89
|
+
|
|
90
|
+
## Architectural hypothesis
|
|
91
|
+
|
|
92
|
+
The most valuable next step is **not** a full rewrite.
|
|
93
|
+
|
|
94
|
+
The most valuable next step is to implement a high-value foundation slice:
|
|
95
|
+
|
|
96
|
+
1. define the work-unit contract
|
|
97
|
+
2. define how a stage declares work units
|
|
98
|
+
3. add package-local templates and docs for work-unit-aware tasks
|
|
99
|
+
4. add checkpoint/carry-forward artifacts that are short enough to be reused safely
|
|
100
|
+
5. update prompts so each unit starts from minimal context, not long historical text
|
|
101
|
+
|
|
102
|
+
This means the first v1.4 sprint should prioritize:
|
|
103
|
+
|
|
104
|
+
- work-unit interfaces
|
|
105
|
+
- unit-level artifacts
|
|
106
|
+
- unit-level carry-forward
|
|
107
|
+
- validation of the new context-reload behavior
|
|
108
|
+
|
|
109
|
+
It should **not** try to finish every future v1.4 feature in one pass.
|
|
110
|
+
|
|
111
|
+
## Recommended implementation order
|
|
112
|
+
|
|
113
|
+
### Phase 1: foundation interfaces
|
|
114
|
+
|
|
115
|
+
Define and document the unit contract in specs and references:
|
|
116
|
+
|
|
117
|
+
- `workUnitId`
|
|
118
|
+
- `workUnitGoal`
|
|
119
|
+
- `allowedFiles`
|
|
120
|
+
- `unitChecks`
|
|
121
|
+
- `unitDeliverables`
|
|
122
|
+
- `unitSummary`
|
|
123
|
+
- `carryForwardSummary`
|
|
124
|
+
|
|
125
|
+
Add minimal schema/contract validation for these fields where appropriate.
|
|
126
|
+
|
|
127
|
+
### Phase 2: unit-scoped prompt inputs
|
|
128
|
+
|
|
129
|
+
Update producer/reviewer prompt construction so a unit run receives:
|
|
130
|
+
|
|
131
|
+
- current unit goal
|
|
132
|
+
- allowed files
|
|
133
|
+
- expected checks
|
|
134
|
+
- expected deliverables
|
|
135
|
+
- prior carry-forward summary
|
|
136
|
+
|
|
137
|
+
Prefer short checkpoint summaries over replaying long decision history.
|
|
138
|
+
|
|
139
|
+
### Phase 3: checkpoint and continuation tightening
|
|
140
|
+
|
|
141
|
+
Standardize the artifact that one unit leaves behind for the next:
|
|
142
|
+
|
|
143
|
+
- accomplished
|
|
144
|
+
- blockers
|
|
145
|
+
- next focus
|
|
146
|
+
- verified files
|
|
147
|
+
|
|
148
|
+
Make continuation/revise paths prefer this short artifact.
|
|
149
|
+
|
|
150
|
+
### Phase 4: validation
|
|
151
|
+
|
|
152
|
+
Add or update validation specs and tests so the workflow can prove:
|
|
153
|
+
|
|
154
|
+
- missing task contract is rejected
|
|
155
|
+
- work-unit metadata is loaded correctly
|
|
156
|
+
- continuation reads compact carry-forward context
|
|
157
|
+
- failures still classify cleanly
|
|
158
|
+
|
|
159
|
+
## Success criteria
|
|
160
|
+
|
|
161
|
+
The first v1.4 slice is successful if all of these are true:
|
|
162
|
+
|
|
163
|
+
1. The workflow can express work-unit metadata in package-local specs or templates.
|
|
164
|
+
2. Prompts clearly scope a run to a smaller work unit, not a broad stage-only brief.
|
|
165
|
+
3. Continuation uses compact carry-forward summaries by default.
|
|
166
|
+
4. Baseline tests pass.
|
|
167
|
+
5. Package-local self-check still passes.
|
|
168
|
+
6. Validation runs either pass or fail with an explicit failure classification; no failure is left as an ambiguous workflow-plumbing problem.
|
|
169
|
+
|
|
170
|
+
## Guardrails
|
|
171
|
+
|
|
172
|
+
- Do not rewrite the orchestrator from scratch.
|
|
173
|
+
- Do not introduce a second orchestration system.
|
|
174
|
+
- Do not move back into product/sample closure.
|
|
175
|
+
- Do not increase scope to unrelated features.
|
|
176
|
+
- Prefer one workflow-only architectural improvement per iteration.
|
|
177
|
+
- Preserve the packaged skill as the primary operator entry point.
|
|
178
|
+
|
|
179
|
+
## Suggested starting point for the next thread
|
|
180
|
+
|
|
181
|
+
In the next thread, the first sprint should focus on:
|
|
182
|
+
|
|
183
|
+
- implementing the work-unit contract and carry-forward foundation
|
|
184
|
+
- not the entire future v1.4 roadmap
|
|
185
|
+
|
|
186
|
+
Treat this as a bounded architecture slice:
|
|
187
|
+
|
|
188
|
+
- high value
|
|
189
|
+
- low drift
|
|
190
|
+
- directly useful for future complex coding tasks
|