claude-flow-novice 2.15.6 → 2.15.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude/cfn-extras/agents/google-sheets/google-sheets-coordinator.md +1 -1
- package/.claude/cfn-extras/docs/GOOGLE_SHEETS_CFN_LOOP.md +13 -11
- package/.claude/skills/cfn-loop-orchestration/helpers/gate-check.sh +39 -577
- package/.claude/skills/cfn-loop-orchestration/helpers/parse-test-results.sh +49 -270
- package/.claude/skills/cfn-loop-orchestration/src/helpers/consensus.ts +87 -0
- package/.claude/skills/cfn-loop-orchestration/src/helpers/deliverable-verifier.ts +103 -0
- package/.claude/skills/cfn-loop-orchestration/src/helpers/gate-check.ts +115 -0
- package/.claude/skills/cfn-loop-orchestration/src/helpers/iteration-manager.ts +45 -0
- package/.claude/skills/cfn-loop-orchestration/src/helpers/parse-test-results.ts +372 -0
- package/.claude/skills/cfn-loop-orchestration/src/helpers/timeout-calculator.ts +41 -0
- package/.claude/skills/cfn-loop-orchestration/tests/consensus.test.ts +142 -0
- package/.claude/skills/cfn-loop-orchestration/tests/deliverable-verifier.test.ts +197 -0
- package/.claude/skills/cfn-loop-orchestration/tests/gate-check.test.ts +325 -0
- package/.claude/skills/cfn-loop-orchestration/tests/iteration-manager.test.ts +132 -0
- package/.claude/skills/cfn-loop-orchestration/tests/parse-test-results.test.ts +382 -0
- package/.claude/skills/cfn-loop-orchestration/tests/timeout-calculator.test.ts +118 -0
- package/.claude/skills/cfn-redis-coordination/coverage/clover.xml +1447 -0
- package/.claude/skills/cfn-redis-coordination/coverage/coverage-final.json +13 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/agent-logger.ts.html +1423 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/agent-recovery.ts.html +1447 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/base.css +224 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/block-navigation.js +87 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/completion-reporter.ts.html +1273 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/context-manager.ts.html +1066 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/favicon.png +0 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/index.html +281 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/mode-detector.ts.html +550 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/prettify.css +1 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/prettify.js +2 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/redis-client.ts.html +2047 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/result-collector.ts.html +1396 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/sort-arrow-sprite.png +0 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/sorter.js +210 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/swarm-manager.ts.html +1567 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/task-analyzer.ts.html +1297 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/task-executor.ts.html +1354 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/types.ts.html +790 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov-report/waiting-coordinator.ts.html +1846 -0
- package/.claude/skills/cfn-redis-coordination/coverage/lcov.info +2650 -0
- package/.claude/skills/cfn-redis-coordination/dist/task-analyzer.js +1 -1
- package/.claude/skills/cfn-redis-coordination/src/task-analyzer.ts +1 -1
- package/.claude/skills/cfn-redis-coordination/tests/coordination.test.ts +18 -9
- package/claude-assets/agents/cfn-dev-team/coordinators/cfn-frontend-coordinator.md +13 -72
- package/claude-assets/agents/cfn-dev-team/coordinators/cfn-v3-coordinator.md +5 -65
- package/claude-assets/agents/cfn-dev-team/coordinators/consensus-builder.md +465 -508
- package/claude-assets/agents/cfn-dev-team/coordinators/handoff-coordinator.md +733 -743
- package/claude-assets/agents/cfn-dev-team/coordinators/multi-sprint-coordinator.md +13 -79
- package/claude-assets/agents/cfn-dev-team/dev-ops/docker-specialist.md +13 -18
- package/claude-assets/agents/cfn-dev-team/dev-ops/kubernetes-specialist.md +13 -18
- package/claude-assets/agents/cfn-dev-team/developers/api-gateway-specialist.md +13 -18
- package/claude-assets/agents/cfn-dev-team/developers/backend-developer.md +15 -17
- package/claude-assets/agents/cfn-dev-team/developers/data/data-engineer.md +15 -17
- package/claude-assets/agents/cfn-dev-team/developers/database/database-architect.md +15 -14
- package/claude-assets/agents/cfn-dev-team/developers/frontend/mobile-dev.md +15 -17
- package/claude-assets/agents/cfn-dev-team/developers/frontend/react-frontend-engineer.md +15 -17
- package/claude-assets/agents/cfn-dev-team/developers/frontend/typescript-specialist.md +15 -17
- package/claude-assets/agents/cfn-dev-team/developers/frontend/ui-designer.md +23 -30
- package/claude-assets/agents/cfn-dev-team/developers/graphql-specialist.md +13 -18
- package/claude-assets/agents/cfn-dev-team/developers/rust-developer.md +13 -18
- package/claude-assets/agents/cfn-dev-team/reviewers/code-reviewer.md +312 -317
- package/claude-assets/agents/cfn-dev-team/reviewers/quality/code-quality-validator.md +23 -20
- package/claude-assets/agents/cfn-dev-team/reviewers/quality/perf-analyzer.md +23 -20
- package/claude-assets/agents/cfn-dev-team/reviewers/quality/performance-benchmarker.md +23 -20
- package/claude-assets/agents/cfn-dev-team/reviewers/quality/security-specialist.md +23 -20
- package/claude-assets/agents/cfn-dev-team/testers/api-testing-specialist.md +15 -20
- package/claude-assets/agents/cfn-dev-team/testers/chaos-engineering-specialist.md +15 -20
- package/claude-assets/agents/cfn-dev-team/testers/contract-tester.md +718 -737
- package/claude-assets/agents/cfn-dev-team/testers/integration-tester.md +817 -828
- package/claude-assets/agents/cfn-dev-team/testers/interaction-tester.md +15 -20
- package/claude-assets/agents/cfn-dev-team/testers/load-testing-specialist.md +8 -9
- package/claude-assets/agents/cfn-dev-team/testers/mutation-testing-specialist.md +668 -684
- package/claude-assets/agents/cfn-dev-team/testers/playwright-tester.md +15 -20
- package/claude-assets/agents/cfn-dev-team/testers/tester.md +248 -253
- package/claude-assets/agents/cfn-dev-team/utility/epic-creator.md +13 -18
- package/claude-assets/agents/cfn-dev-team/utility/memory-leak-specialist.md +13 -18
- package/claude-assets/agents/cfn-dev-team/utility/z-ai-specialist.md +13 -18
- package/claude-assets/cfn-extras/agents/google-sheets/google-sheets-coordinator.md +1 -1
- package/claude-assets/cfn-extras/docs/GOOGLE_SHEETS_CFN_LOOP.md +13 -11
- package/claude-assets/skills/cfn-loop-orchestration/helpers/gate-check.sh +39 -577
- package/claude-assets/skills/cfn-loop-orchestration/helpers/parse-test-results.sh +49 -270
- package/claude-assets/skills/cfn-loop-orchestration/src/helpers/consensus.ts +87 -0
- package/claude-assets/skills/cfn-loop-orchestration/src/helpers/deliverable-verifier.ts +103 -0
- package/claude-assets/skills/cfn-loop-orchestration/src/helpers/gate-check.ts +115 -0
- package/claude-assets/skills/cfn-loop-orchestration/src/helpers/iteration-manager.ts +45 -0
- package/claude-assets/skills/cfn-loop-orchestration/src/helpers/parse-test-results.ts +372 -0
- package/claude-assets/skills/cfn-loop-orchestration/src/helpers/timeout-calculator.ts +41 -0
- package/claude-assets/skills/cfn-loop-orchestration/tests/consensus.test.ts +142 -0
- package/claude-assets/skills/cfn-loop-orchestration/tests/deliverable-verifier.test.ts +197 -0
- package/claude-assets/skills/cfn-loop-orchestration/tests/gate-check.test.ts +325 -0
- package/claude-assets/skills/cfn-loop-orchestration/tests/iteration-manager.test.ts +132 -0
- package/claude-assets/skills/cfn-loop-orchestration/tests/parse-test-results.test.ts +382 -0
- package/claude-assets/skills/cfn-loop-orchestration/tests/timeout-calculator.test.ts +118 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/clover.xml +1447 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/coverage-final.json +13 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/agent-logger.ts.html +1423 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/agent-recovery.ts.html +1447 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/base.css +224 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/block-navigation.js +87 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/completion-reporter.ts.html +1273 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/context-manager.ts.html +1066 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/favicon.png +0 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/index.html +281 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/mode-detector.ts.html +550 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/prettify.css +1 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/prettify.js +2 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/redis-client.ts.html +2047 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/result-collector.ts.html +1396 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/sort-arrow-sprite.png +0 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/sorter.js +210 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/swarm-manager.ts.html +1567 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/task-analyzer.ts.html +1297 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/task-executor.ts.html +1354 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/types.ts.html +790 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov-report/waiting-coordinator.ts.html +1846 -0
- package/claude-assets/skills/cfn-redis-coordination/coverage/lcov.info +2650 -0
- package/claude-assets/skills/cfn-redis-coordination/dist/task-analyzer.js +1 -1
- package/claude-assets/skills/cfn-redis-coordination/src/task-analyzer.ts +1 -1
- package/claude-assets/skills/cfn-redis-coordination/tests/coordination.test.ts +18 -9
- package/dist/agents/agent-loader.js +165 -146
- package/dist/agents/agent-loader.js.map +1 -1
- package/package.json +1 -1
- package/scripts/clean-agent-profiles.sh +112 -0
|
@@ -66,25 +66,21 @@ fi
|
|
|
66
66
|
|
|
67
67
|
**Old (Deprecated):**
|
|
68
68
|
```bash
|
|
69
|
-
redis-cli HSET "swarm:${TASK_ID}:confidence:iteration${ITERATION}" \
|
|
70
|
-
"${AGENT_ID}" "0.85"
|
|
71
|
-
```
|
|
72
69
|
|
|
73
70
|
**New (Required):**
|
|
74
71
|
```bash
|
|
75
72
|
# Execute tests and capture output
|
|
76
73
|
TEST_OUTPUT=$(npm test 2>&1)
|
|
77
74
|
|
|
78
|
-
# Parse
|
|
79
|
-
|
|
80
|
-
|
|
75
|
+
# Parse natively (no external dependencies)
|
|
76
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
77
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
78
|
+
TOTAL=$((PASS + FAIL))
|
|
79
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
81
80
|
|
|
82
|
-
#
|
|
83
|
-
|
|
84
|
-
"${AGENT_ID}" "$RESULTS"
|
|
81
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
82
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
85
83
|
|
|
86
|
-
# Signal completion
|
|
87
|
-
redis-cli LPUSH "swarm:${TASK_ID}:completion:${AGENT_ID}" "done"
|
|
88
84
|
```
|
|
89
85
|
|
|
90
86
|
## Post-Edit Validation
|
|
@@ -210,9 +206,14 @@ Remember: Code analysis reveals improvement opportunities. Focus on actionable,
|
|
|
210
206
|
DO NOT report subjective confidence scores. Instead:
|
|
211
207
|
|
|
212
208
|
1. **Execute Tests**: Run test suite defined in success criteria
|
|
213
|
-
|
|
214
|
-
|
|
215
|
-
|
|
209
|
+
# Parse natively (no external dependencies)
|
|
210
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
211
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
212
|
+
TOTAL=$((PASS + FAIL))
|
|
213
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
214
|
+
|
|
215
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
216
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
216
217
|
|
|
217
218
|
**Validation:**
|
|
218
219
|
- ❌ OLD: "Confidence: 0.83 - quality metrics look solid"
|
|
@@ -223,12 +224,14 @@ DO NOT report subjective confidence scores. Instead:
|
|
|
223
224
|
Complete your work and provide test-based validation:
|
|
224
225
|
|
|
225
226
|
1. **Execute Tests**: Run all code quality test suites from success criteria
|
|
226
|
-
|
|
227
|
-
|
|
228
|
-
|
|
229
|
-
|
|
230
|
-
|
|
231
|
-
|
|
227
|
+
# Parse natively (no external dependencies)
|
|
228
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
229
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
230
|
+
TOTAL=$((PASS + FAIL))
|
|
231
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
232
|
+
|
|
233
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
234
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
232
235
|
- Coverage: ≥80%
|
|
233
236
|
- Code smells detected: N
|
|
234
237
|
- Technical debt score: X/10
|
|
@@ -56,25 +56,21 @@ fi
|
|
|
56
56
|
|
|
57
57
|
**Old (Deprecated):**
|
|
58
58
|
```bash
|
|
59
|
-
redis-cli HSET "swarm:${TASK_ID}:confidence:iteration${ITERATION}" \
|
|
60
|
-
"${AGENT_ID}" "0.85"
|
|
61
|
-
```
|
|
62
59
|
|
|
63
60
|
**New (Required):**
|
|
64
61
|
```bash
|
|
65
62
|
# Execute tests and capture output
|
|
66
63
|
TEST_OUTPUT=$(npm test 2>&1)
|
|
67
64
|
|
|
68
|
-
# Parse
|
|
69
|
-
|
|
70
|
-
|
|
65
|
+
# Parse natively (no external dependencies)
|
|
66
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
67
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
68
|
+
TOTAL=$((PASS + FAIL))
|
|
69
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
71
70
|
|
|
72
|
-
#
|
|
73
|
-
|
|
74
|
-
"${AGENT_ID}" "$RESULTS"
|
|
71
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
72
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
75
73
|
|
|
76
|
-
# Signal completion
|
|
77
|
-
redis-cli LPUSH "swarm:${TASK_ID}:completion:${AGENT_ID}" "done"
|
|
78
74
|
```
|
|
79
75
|
|
|
80
76
|
## Mandatory Post-Edit Validation
|
|
@@ -241,9 +237,14 @@ Remember: Optimize for highest impact with reasonable effort. Focus on critical
|
|
|
241
237
|
DO NOT report subjective confidence scores. Instead:
|
|
242
238
|
|
|
243
239
|
1. **Execute Tests**: Run test suite defined in success criteria
|
|
244
|
-
|
|
245
|
-
|
|
246
|
-
|
|
240
|
+
# Parse natively (no external dependencies)
|
|
241
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
242
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
243
|
+
TOTAL=$((PASS + FAIL))
|
|
244
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
245
|
+
|
|
246
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
247
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
247
248
|
|
|
248
249
|
**Validation:**
|
|
249
250
|
- ❌ OLD: "Confidence: 0.86 - analysis is thorough"
|
|
@@ -254,12 +255,14 @@ DO NOT report subjective confidence scores. Instead:
|
|
|
254
255
|
Complete your work and provide test-based validation:
|
|
255
256
|
|
|
256
257
|
1. **Execute Tests**: Run all performance analysis test suites from success criteria
|
|
257
|
-
|
|
258
|
-
|
|
259
|
-
|
|
260
|
-
|
|
261
|
-
|
|
262
|
-
|
|
258
|
+
# Parse natively (no external dependencies)
|
|
259
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
260
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
261
|
+
TOTAL=$((PASS + FAIL))
|
|
262
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
263
|
+
|
|
264
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
265
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
263
266
|
- Coverage: ≥80%
|
|
264
267
|
- Bottlenecks identified: N
|
|
265
268
|
- Expected improvement: X%
|
|
@@ -53,25 +53,21 @@ fi
|
|
|
53
53
|
|
|
54
54
|
**Old (Deprecated):**
|
|
55
55
|
```bash
|
|
56
|
-
redis-cli HSET "swarm:${TASK_ID}:confidence:iteration${ITERATION}" \
|
|
57
|
-
"${AGENT_ID}" "0.85"
|
|
58
|
-
```
|
|
59
56
|
|
|
60
57
|
**New (Required):**
|
|
61
58
|
```bash
|
|
62
59
|
# Execute tests and capture output
|
|
63
60
|
TEST_OUTPUT=$(npm test 2>&1)
|
|
64
61
|
|
|
65
|
-
# Parse
|
|
66
|
-
|
|
67
|
-
|
|
62
|
+
# Parse natively (no external dependencies)
|
|
63
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
64
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
65
|
+
TOTAL=$((PASS + FAIL))
|
|
66
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
68
67
|
|
|
69
|
-
#
|
|
70
|
-
|
|
71
|
-
"${AGENT_ID}" "$RESULTS"
|
|
68
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
69
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
72
70
|
|
|
73
|
-
# Signal completion
|
|
74
|
-
redis-cli LPUSH "swarm:${TASK_ID}:completion:${AGENT_ID}" "done"
|
|
75
71
|
```
|
|
76
72
|
|
|
77
73
|
## 🚨 Mandatory Post-Edit Validation
|
|
@@ -87,9 +83,14 @@ Refer to [.claude/templates/post-edit-validation.md](../templates/post-edit-vali
|
|
|
87
83
|
DO NOT report subjective confidence scores. Instead:
|
|
88
84
|
|
|
89
85
|
1. **Execute Tests**: Run test suite defined in success criteria
|
|
90
|
-
|
|
91
|
-
|
|
92
|
-
|
|
86
|
+
# Parse natively (no external dependencies)
|
|
87
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
88
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
89
|
+
TOTAL=$((PASS + FAIL))
|
|
90
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
91
|
+
|
|
92
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
93
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
93
94
|
|
|
94
95
|
**Validation:**
|
|
95
96
|
- ❌ OLD: "Confidence: 0.88 - benchmarks look good"
|
|
@@ -100,12 +101,14 @@ DO NOT report subjective confidence scores. Instead:
|
|
|
100
101
|
Complete your work and provide test-based validation:
|
|
101
102
|
|
|
102
103
|
1. **Execute Tests**: Run all benchmark test suites from success criteria
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
|
|
108
|
-
|
|
104
|
+
# Parse natively (no external dependencies)
|
|
105
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
106
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
107
|
+
TOTAL=$((PASS + FAIL))
|
|
108
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
109
|
+
|
|
110
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
111
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
109
112
|
- Coverage: ≥80%
|
|
110
113
|
- Performance baseline established: Yes/No
|
|
111
114
|
4. **Store in Redis**: Use test-results key (not confidence key)
|
|
@@ -51,25 +51,21 @@ fi
|
|
|
51
51
|
|
|
52
52
|
**Old (Deprecated):**
|
|
53
53
|
```bash
|
|
54
|
-
redis-cli HSET "swarm:${TASK_ID}:confidence:iteration${ITERATION}" \
|
|
55
|
-
"${AGENT_ID}" "0.85"
|
|
56
|
-
```
|
|
57
54
|
|
|
58
55
|
**New (Required):**
|
|
59
56
|
```bash
|
|
60
57
|
# Execute tests and capture output
|
|
61
58
|
TEST_OUTPUT=$(npm test 2>&1)
|
|
62
59
|
|
|
63
|
-
# Parse
|
|
64
|
-
|
|
65
|
-
|
|
60
|
+
# Parse natively (no external dependencies)
|
|
61
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
62
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
63
|
+
TOTAL=$((PASS + FAIL))
|
|
64
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
66
65
|
|
|
67
|
-
#
|
|
68
|
-
|
|
69
|
-
"${AGENT_ID}" "$RESULTS"
|
|
66
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
67
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
70
68
|
|
|
71
|
-
# Signal completion
|
|
72
|
-
redis-cli LPUSH "swarm:${TASK_ID}:completion:${AGENT_ID}" "done"
|
|
73
69
|
```
|
|
74
70
|
|
|
75
71
|
## 🚨 MANDATORY DOCUMENTATION REDACTION PROTOCOL
|
|
@@ -169,9 +165,14 @@ Security analysis results are captured and processed through structured reportin
|
|
|
169
165
|
DO NOT report subjective confidence scores. Instead:
|
|
170
166
|
|
|
171
167
|
1. **Execute Tests**: Run test suite defined in success criteria
|
|
172
|
-
|
|
173
|
-
|
|
174
|
-
|
|
168
|
+
# Parse natively (no external dependencies)
|
|
169
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
170
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
171
|
+
TOTAL=$((PASS + FAIL))
|
|
172
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
173
|
+
|
|
174
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
175
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
175
176
|
|
|
176
177
|
**Validation:**
|
|
177
178
|
- ❌ OLD: "Confidence: 0.90 - security looks solid"
|
|
@@ -182,12 +183,14 @@ DO NOT report subjective confidence scores. Instead:
|
|
|
182
183
|
Complete your work and provide test-based validation:
|
|
183
184
|
|
|
184
185
|
1. **Execute Tests**: Run all security test suites from success criteria
|
|
185
|
-
|
|
186
|
-
|
|
187
|
-
|
|
188
|
-
|
|
189
|
-
|
|
190
|
-
|
|
186
|
+
# Parse natively (no external dependencies)
|
|
187
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
188
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
189
|
+
TOTAL=$((PASS + FAIL))
|
|
190
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
191
|
+
|
|
192
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
193
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
191
194
|
- Coverage: ≥80%
|
|
192
195
|
- Critical vulnerabilities found: N
|
|
193
196
|
4. **Store in Redis**: Use test-results key (not confidence key)
|
|
@@ -64,25 +64,18 @@ fi
|
|
|
64
64
|
|
|
65
65
|
**Old (Deprecated):**
|
|
66
66
|
```bash
|
|
67
|
-
redis-cli HSET "swarm:${TASK_ID}:confidence:iteration${ITERATION}" \
|
|
68
|
-
"${AGENT_ID}" "0.85"
|
|
69
|
-
```
|
|
70
67
|
|
|
71
68
|
**New (Required):**
|
|
72
69
|
```bash
|
|
73
70
|
# Execute tests and capture output
|
|
74
71
|
TEST_OUTPUT=$(npm test 2>&1)
|
|
75
72
|
|
|
76
|
-
# Parse
|
|
77
|
-
|
|
78
|
-
|
|
79
|
-
|
|
80
|
-
|
|
81
|
-
redis-cli HSET "swarm:${TASK_ID}:test-results:iteration${ITERATION}" \
|
|
82
|
-
"${AGENT_ID}" "$RESULTS"
|
|
73
|
+
# Parse natively (no external dependencies)
|
|
74
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
75
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
76
|
+
TOTAL=$((PASS + FAIL))
|
|
77
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
83
78
|
|
|
84
|
-
# Signal completion
|
|
85
|
-
redis-cli LPUSH "swarm:${TASK_ID}:completion:${AGENT_ID}" "done"
|
|
86
79
|
```
|
|
87
80
|
|
|
88
81
|
## Core Responsibilities
|
|
@@ -761,8 +754,8 @@ Before reporting high confidence:
|
|
|
761
754
|
DO NOT report subjective confidence scores. Instead:
|
|
762
755
|
|
|
763
756
|
1. **Execute Tests**: Run test suite defined in success criteria
|
|
764
|
-
2. **Parse Results**: Use
|
|
765
|
-
3. **Store Results**:
|
|
757
|
+
2. **Parse Results**: Use native bash parsing (grep/awk) for test results
|
|
758
|
+
3. **Store Results**: Return results to Main Chat (Task Mode auto-receives output)
|
|
766
759
|
4. **Pass Rate**: Your API testing passes the gate if tests ≥ threshold (95% standard mode)
|
|
767
760
|
|
|
768
761
|
**Validation:**
|
|
@@ -774,12 +767,14 @@ DO NOT report subjective confidence scores. Instead:
|
|
|
774
767
|
Complete your work and provide test-based validation:
|
|
775
768
|
|
|
776
769
|
1. **Execute Tests**: Run all API test suites from success criteria
|
|
777
|
-
|
|
778
|
-
|
|
779
|
-
|
|
780
|
-
|
|
781
|
-
|
|
782
|
-
|
|
770
|
+
# Parse natively (no external dependencies)
|
|
771
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
772
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
773
|
+
TOTAL=$((PASS + FAIL))
|
|
774
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
775
|
+
|
|
776
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
777
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
783
778
|
- Coverage: ≥80%
|
|
784
779
|
- Contract tests: X/Y passed
|
|
785
780
|
- Security tests: X/Y passed
|
|
@@ -62,25 +62,18 @@ fi
|
|
|
62
62
|
|
|
63
63
|
**Old (Deprecated):**
|
|
64
64
|
```bash
|
|
65
|
-
redis-cli HSET "swarm:${TASK_ID}:confidence:iteration${ITERATION}" \
|
|
66
|
-
"${AGENT_ID}" "0.85"
|
|
67
|
-
```
|
|
68
65
|
|
|
69
66
|
**New (Required):**
|
|
70
67
|
```bash
|
|
71
68
|
# Execute tests and capture output
|
|
72
69
|
TEST_OUTPUT=$(npm test 2>&1)
|
|
73
70
|
|
|
74
|
-
# Parse
|
|
75
|
-
|
|
76
|
-
|
|
77
|
-
|
|
78
|
-
|
|
79
|
-
redis-cli HSET "swarm:${TASK_ID}:test-results:iteration${ITERATION}" \
|
|
80
|
-
"${AGENT_ID}" "$RESULTS"
|
|
71
|
+
# Parse natively (no external dependencies)
|
|
72
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
73
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
74
|
+
TOTAL=$((PASS + FAIL))
|
|
75
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
81
76
|
|
|
82
|
-
# Signal completion
|
|
83
|
-
redis-cli LPUSH "swarm:${TASK_ID}:completion:${AGENT_ID}" "done"
|
|
84
77
|
```
|
|
85
78
|
|
|
86
79
|
## Core Responsibilities
|
|
@@ -922,8 +915,8 @@ phases:
|
|
|
922
915
|
DO NOT report subjective confidence scores. Instead:
|
|
923
916
|
|
|
924
917
|
1. **Execute Tests**: Run test suite defined in success criteria
|
|
925
|
-
2. **Parse Results**: Use
|
|
926
|
-
3. **Store Results**:
|
|
918
|
+
2. **Parse Results**: Use native bash parsing (grep/awk) for test results
|
|
919
|
+
3. **Store Results**: Return results to Main Chat (Task Mode auto-receives output)
|
|
927
920
|
4. **Pass Rate**: Your chaos testing passes the gate if tests ≥ threshold (95% standard mode)
|
|
928
921
|
|
|
929
922
|
**Validation:**
|
|
@@ -935,12 +928,14 @@ DO NOT report subjective confidence scores. Instead:
|
|
|
935
928
|
Complete your work and provide test-based validation:
|
|
936
929
|
|
|
937
930
|
1. **Execute Tests**: Run all chaos experiment test suites from success criteria
|
|
938
|
-
|
|
939
|
-
|
|
940
|
-
|
|
941
|
-
|
|
942
|
-
|
|
943
|
-
|
|
931
|
+
# Parse natively (no external dependencies)
|
|
932
|
+
PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
|
|
933
|
+
FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
|
|
934
|
+
TOTAL=$((PASS + FAIL))
|
|
935
|
+
RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
|
|
936
|
+
|
|
937
|
+
# Return results (Main Chat receives automatically in Task Mode)
|
|
938
|
+
echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
|
|
944
939
|
- Coverage: ≥80%
|
|
945
940
|
- Critical paths covered: X/Y
|
|
946
941
|
- System resilience verified: Yes/No
|