claude-flow-novice 2.15.9 → 2.15.11

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (74)
  1. package/.claude/skills/cfn-loop-orchestration/IMPLEMENTATION_SUMMARY.md +519 -0
  2. package/.claude/skills/cfn-loop-orchestration/ORCHESTRATOR_IMPLEMENTATION.md +493 -0
  3. package/.claude/skills/cfn-loop-orchestration/ORCHESTRATOR_QUICK_START.md +499 -0
  4. package/.claude/skills/cfn-loop-orchestration/helpers/orchestrate-ts.sh +104 -0
  5. package/.claude/skills/cfn-loop-orchestration/orchestrate.sh +2 -2
  6. package/.claude/skills/cfn-loop-orchestration/src/orchestrate.ts +648 -0
  7. package/.claude/skills/cfn-loop-orchestration/tests/orchestrate.test.ts +836 -0
  8. package/README.md +205 -10
  9. package/claude-assets/agents/cfn-dev-team/CLAUDE.md +9 -81
  10. package/claude-assets/agents/cfn-dev-team/architecture/base-template-generator.md +4 -4
  11. package/claude-assets/agents/cfn-dev-team/architecture/planner.md +4 -4
  12. package/claude-assets/agents/cfn-dev-team/architecture/system-architect.md +5 -5
  13. package/claude-assets/agents/cfn-dev-team/coordinators/cfn-v3-coordinator.md +184 -229
  14. package/claude-assets/agents/cfn-dev-team/dev-ops/devops-engineer.md +4 -4
  15. package/claude-assets/agents/cfn-dev-team/dev-ops/docker-specialist.md +9 -37
  16. package/claude-assets/agents/cfn-dev-team/dev-ops/kubernetes-specialist.md +9 -37
  17. package/claude-assets/agents/cfn-dev-team/dev-ops/monitoring-specialist.md +4 -4
  18. package/claude-assets/agents/cfn-dev-team/developers/api-gateway-specialist.md +10 -40
  19. package/claude-assets/agents/cfn-dev-team/developers/database/database-architect.md +3 -0
  20. package/claude-assets/agents/cfn-dev-team/developers/frontend/mobile-dev.md +4 -1
  21. package/claude-assets/agents/cfn-dev-team/developers/frontend/react-frontend-engineer.md +4 -1
  22. package/claude-assets/agents/cfn-dev-team/developers/frontend/typescript-specialist.md +4 -1
  23. package/claude-assets/agents/cfn-dev-team/developers/frontend/ui-designer.md +5 -0
  24. package/claude-assets/agents/cfn-dev-team/developers/graphql-specialist.md +2 -1
  25. package/claude-assets/agents/cfn-dev-team/developers/rust-developer.md +2 -1
  26. package/claude-assets/agents/cfn-dev-team/documentation/pseudocode.md +2 -7
  27. package/claude-assets/agents/cfn-dev-team/product-owners/accessibility-advocate-persona.md +4 -4
  28. package/claude-assets/agents/cfn-dev-team/product-owners/cto-agent.md +4 -4
  29. package/claude-assets/agents/cfn-dev-team/product-owners/power-user-persona.md +4 -4
  30. package/claude-assets/agents/cfn-dev-team/product-owners/product-owner.md +18 -22
  31. package/claude-assets/agents/cfn-dev-team/reviewers/code-reviewer.md +1 -1
  32. package/claude-assets/agents/cfn-dev-team/reviewers/quality/code-quality-validator.md +1 -1
  33. package/claude-assets/agents/cfn-dev-team/reviewers/quality/perf-analyzer.md +1 -1
  34. package/claude-assets/agents/cfn-dev-team/reviewers/quality/performance-benchmarker.md +1 -1
  35. package/claude-assets/agents/cfn-dev-team/reviewers/quality/security-specialist.md +1 -1
  36. package/claude-assets/agents/cfn-dev-team/testers/api-testing-specialist.md +7 -35
  37. package/claude-assets/agents/cfn-dev-team/testers/chaos-engineering-specialist.md +17 -36
  38. package/claude-assets/agents/cfn-dev-team/testers/contract-tester.md +10 -11
  39. package/claude-assets/agents/cfn-dev-team/testers/e2e/playwright-tester.md +5 -5
  40. package/claude-assets/agents/cfn-dev-team/testers/integration-tester.md +10 -12
  41. package/claude-assets/agents/cfn-dev-team/testers/interaction-tester.md +7 -36
  42. package/claude-assets/agents/cfn-dev-team/testers/load-testing-specialist.md +10 -12
  43. package/claude-assets/agents/cfn-dev-team/testers/mutation-testing-specialist.md +10 -12
  44. package/claude-assets/agents/cfn-dev-team/testers/playwright-tester.md +7 -37
  45. package/claude-assets/agents/cfn-dev-team/testers/tester.md +7 -33
  46. package/claude-assets/agents/cfn-dev-team/testers/unit/tdd-london-unit-swarm.md +5 -5
  47. package/claude-assets/agents/cfn-dev-team/testers/validation/validation-production-validator.md +4 -4
  48. package/claude-assets/agents/cfn-dev-team/testing/test-validation-agent.md +4 -4
  49. package/claude-assets/agents/cfn-dev-team/utility/agent-builder.md +16 -16
  50. package/claude-assets/agents/cfn-dev-team/utility/analyst.md +4 -4
  51. package/claude-assets/agents/cfn-dev-team/utility/code-booster.md +4 -4
  52. package/claude-assets/agents/cfn-dev-team/utility/context-curator.md +4 -4
  53. package/claude-assets/agents/cfn-dev-team/utility/epic-creator.md +7 -85
  54. package/claude-assets/agents/cfn-dev-team/utility/memory-leak-specialist.md +7 -93
  55. package/claude-assets/agents/cfn-dev-team/utility/researcher.md +4 -4
  56. package/claude-assets/agents/cfn-dev-team/utility/z-ai-specialist.md +7 -84
  57. package/claude-assets/skills/cfn-loop-orchestration/IMPLEMENTATION_SUMMARY.md +519 -0
  58. package/claude-assets/skills/cfn-loop-orchestration/ORCHESTRATOR_IMPLEMENTATION.md +493 -0
  59. package/claude-assets/skills/cfn-loop-orchestration/ORCHESTRATOR_QUICK_START.md +499 -0
  60. package/claude-assets/skills/cfn-loop-orchestration/helpers/orchestrate-ts.sh +104 -0
  61. package/claude-assets/skills/cfn-loop-orchestration/orchestrate.sh +2 -2
  62. package/claude-assets/skills/cfn-loop-orchestration/src/orchestrate.ts +648 -0
  63. package/claude-assets/skills/cfn-loop-orchestration/tests/orchestrate.test.ts +836 -0
  64. package/dist/cli/agent-definition-parser.js +37 -4
  65. package/dist/cli/agent-definition-parser.js.map +1 -1
  66. package/dist/cli/agent-executor.js +32 -2
  67. package/dist/cli/agent-executor.js.map +1 -1
  68. package/dist/coordination/coordinate.js +369 -0
  69. package/dist/coordination/coordinate.js.map +1 -0
  70. package/dist/coordination/spawn-agent.js +364 -0
  71. package/dist/coordination/spawn-agent.js.map +1 -0
  72. package/dist/coordination/types-export.js +38 -0
  73. package/dist/coordination/types-export.js.map +1 -0
  74. package/package.json +1 -1
@@ -87,7 +87,6 @@ RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0
87
87
 
88
88
  # Return results (Main Chat receives automatically in Task Mode)
89
89
  echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
90
-
91
90
  ```
92
91
 
93
92
  # React Native Mobile Development Specialist
@@ -222,6 +221,10 @@ RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0
222
221
 
223
222
  # Return results (Main Chat receives automatically in Task Mode)
224
223
  echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
224
+ ```
225
+
226
+ 2. **Report Pass Rate**: Return test results in JSON format
227
+ 3. **Validate Coverage**: Ensure test coverage meets minimum threshold
225
228
  - Coverage: ≥80%
226
229
  4. **Store in Redis**: Use test-results key (not confidence key)
227
230
  5. **Signal Completion**: Push to completion queue
@@ -63,7 +63,6 @@ RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0
63
63
 
64
64
  # Return results (Main Chat receives automatically in Task Mode)
65
65
  echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
66
-
67
66
  ```
68
67
 
69
68
  # React Frontend Engineer Agent Profile
@@ -229,6 +228,10 @@ RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0
229
228
 
230
229
  # Return results (Main Chat receives automatically in Task Mode)
231
230
  echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
231
+ ```
232
+
233
+ 2. **Report Pass Rate**: Return test results in JSON format
234
+ 3. **Validate Coverage**: Ensure test coverage meets minimum threshold
232
235
  - Coverage: ≥80%
233
236
  4. **Store in Redis**: Use test-results key (not confidence key)
234
237
  5. **Signal Completion**: Push to completion queue
@@ -61,7 +61,6 @@ RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0
61
61
 
62
62
  # Return results (Main Chat receives automatically in Task Mode)
63
63
  echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
64
-
65
64
  ```
66
65
 
67
66
  # TypeScript Specialist
@@ -362,6 +361,10 @@ RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0
362
361
 
363
362
  # Return results (Main Chat receives automatically in Task Mode)
364
363
  echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
364
+ ```
365
+
366
+ 2. **Report Pass Rate**: Return test results in JSON format
367
+ 3. **Validate Coverage**: Ensure test coverage meets minimum threshold
365
368
  - Coverage: ≥80%
366
369
  4. **Store in Redis**: Use test-results key (not confidence key)
367
370
  5. **Signal Completion**: Push to completion queue
@@ -81,6 +81,7 @@ RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0
81
81
 
82
82
  # Return results (Main Chat receives automatically in Task Mode)
83
83
  echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
84
+ ```
84
85
 
85
86
  # Parse test results (capture exit code)
86
87
  set +e # Temporarily allow failures
@@ -161,6 +162,10 @@ RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0
161
162
 
162
163
  # Return results (Main Chat receives automatically in Task Mode)
163
164
  echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
165
+ ```
166
+
167
+ 2. **Report Pass Rate**: Return test results in JSON format
168
+ 3. **Validate Coverage**: Ensure test coverage meets minimum threshold
164
169
  - Coverage: ≥80%
165
170
  4. **Store in Redis**: Use test-results key (not confidence key)
166
171
  5. **Signal Completion**: Push to completion queue
@@ -58,6 +58,8 @@ fi
58
58
 
59
59
  **Old (Deprecated):**
60
60
  ```bash
61
+ # Not shown - deprecated pattern
62
+ ```
61
63
 
62
64
  **New (Required):**
63
65
  ```bash
@@ -69,7 +71,6 @@ PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
69
71
  FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
70
72
  TOTAL=$((PASS + FAIL))
71
73
  RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
72
-
73
74
  ```
74
75
 
75
76
  # GraphQL Specialist Agent
@@ -73,6 +73,8 @@ fi
73
73
 
74
74
  **Old (Deprecated):**
75
75
  ```bash
76
+ # Not shown - deprecated pattern
77
+ ```
76
78
 
77
79
  **New (Required):**
78
80
  ```bash
@@ -84,7 +86,6 @@ PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
84
86
  FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
85
87
  TOTAL=$((PASS + FAIL))
86
88
  RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
87
-
88
89
  ```
89
90
 
90
91
  # Rust Developer Agent
@@ -40,11 +40,6 @@ acl_level: 1
40
40
  ## Documentation Approach
41
41
 
42
42
  Focus on clear, executable algorithm documentation that can be implemented across different programming languages.
43
- reasoning: "Algorithms designed, complexity analyzed"
44
- },
45
- { agentId, aclLevel: 1 }
46
- );
47
- ```
48
43
 
49
44
  ## Team Dynamics
50
45
 
@@ -67,7 +62,7 @@ Focus on clear, executable algorithm documentation that can be implemented acros
67
62
  ### Algorithm Design Patterns
68
63
 
69
64
  #### 1. Authentication Algorithm
70
- ```
65
+ ```plaintext
71
66
  ALGORITHM: AuthenticateUser
72
67
  INPUT: email (string), password (string)
73
68
  OUTPUT: user (User) or error
@@ -115,7 +110,7 @@ Space Complexity: O(1)
115
110
  ### Design Patterns
116
111
 
117
112
  #### Strategy Pattern for Authentication
118
- ```
113
+ ```plaintext
119
114
  INTERFACE: AuthenticationStrategy
120
115
  authenticate(credentials): User or Error
121
116
 
@@ -104,8 +104,8 @@ confidence = (
104
104
 
105
105
  Complete your work and provide a structured response with:
106
106
  - Confidence score (0.0-1.0) based on work quality
107
- - Summary of analysis/review completed
108
- - List of findings or deliverables
109
- - Any recommendations made
107
+ - Summary of work completed
108
+ - List of deliverables created
109
+ - Any recommendations or findings
110
110
 
111
- **Note:** Coordination instructions are provided when spawned via CLI.
111
+ **Note:** Coordination handled automatically by the system.
@@ -128,8 +128,8 @@ Evaluate completed implementations:
128
128
 
129
129
  Complete your work and provide a structured response with:
130
130
  - Confidence score (0.0-1.0) based on work quality
131
- - Summary of analysis/review completed
132
- - List of findings or deliverables
133
- - Any recommendations made
131
+ - Summary of work completed
132
+ - List of deliverables created
133
+ - Any recommendations or findings
134
134
 
135
- **Note:** Coordination instructions are provided when spawned via CLI.
135
+ **Note:** Coordination handled automatically by the system.
@@ -117,11 +117,11 @@ Evaluate completed implementations:
117
117
 
118
118
  Complete your work and provide a structured response with:
119
119
  - Confidence score (0.0-1.0) based on work quality
120
- - Summary of analysis/review completed
121
- - List of findings or deliverables
122
- - Any recommendations made
120
+ - Summary of work completed
121
+ - List of deliverables created
122
+ - Any recommendations or findings
123
123
 
124
- **Note:** Coordination instructions are provided when spawned via CLI.
124
+ **Note:** Coordination handled automatically by the system.
125
125
 
126
126
  ## Success Metrics
127
127
 
@@ -323,22 +323,21 @@ const adjustConfidenceBasedOnHistory = (baseConfidence, auditData) => {
323
323
  };
324
324
  ```
325
325
 
326
- **3. Cross-Mode Consistency Validation:**
326
+ **3. Consistency Validation:**
327
327
  ```bash
328
- # Check if Task Mode and CLI Mode validators agree
328
+ # Check validator agreement
329
329
  VALIDATOR_AGREEMENT=$(echo "$AUDIT_DATA" | jq -r '
330
330
  group_by(.agent_type) |
331
331
  map({
332
332
  agent: .[0].agent_type,
333
- modes: group_by(.mode) | map({mode: .[0].mode, avg_confidence: map(.confidence) | add / length})
333
+ avg_confidence: map(.confidence) | add / length
334
334
  }) |
335
- .[] | select(.modes | length > 1) |
336
- select((.modes[0].avg_confidence - .modes[1].avg_confidence | abs) > 0.2) |
335
+ .[] | select(.avg_confidence < 0.8) |
337
336
  .agent')
338
337
 
339
338
  if [ -n "$VALIDATOR_AGREEMENT" ]; then
340
- echo "⚠️ Warning: Cross-mode validator disagreement detected for: $VALIDATOR_AGREEMENT"
341
- # Reduce confidence when validators disagree across modes
339
+ echo "⚠️ Warning: Low confidence detected for: $VALIDATOR_AGREEMENT"
340
+ # Reduce confidence when validators show low scores
342
341
  CONFIDENCE_ADJUSTMENT=0.1
343
342
  fi
344
343
  ```
@@ -363,20 +362,20 @@ if [ $(echo "$PERFORMANCE_PATTERN" | wc -l) -gt 2 ]; then
363
362
  fi
364
363
  ```
365
364
 
366
- **Example 2: Mode Effectiveness Analysis**
365
+ **Example 2: Effectiveness Analysis**
367
366
  ```bash
368
- # Compare Task Mode vs CLI Mode effectiveness
369
- MODE_ANALYSIS=$(echo "$AUDIT_DATA" | jq -r '
370
- group_by(.mode) |
367
+ # Analyze overall agent effectiveness
368
+ EFFECTIVENESS_ANALYSIS=$(echo "$AUDIT_DATA" | jq -r '
369
+ group_by(.agent_type) |
371
370
  map({
372
- mode: .[0].mode,
373
- total_agents: length,
371
+ agent_type: .[0].agent_type,
372
+ total_tasks: length,
374
373
  avg_confidence: map(.confidence) | add / length,
375
374
  success_rate: map(select(.decision != "ABORT")) | length / length
376
375
  })')
377
376
 
378
- echo "📊 MODE EFFECTIVENESS ANALYSIS:"
379
- echo "$MODE_ANALYSIS"
377
+ echo "📊 EFFECTIVENESS ANALYSIS:"
378
+ echo "$EFFECTIVENESS_ANALYSIS"
380
379
  ```
381
380
 
382
381
  **Example 3: Agent Reliability Scoring**
@@ -429,15 +428,12 @@ When provided with validator feedback:
429
428
  - Concerns: Missing test coverage, unclear requirements
430
429
  - Decision: ITERATE with 0.80 confidence
431
430
 
432
- ### Task Mode with Manual Audit Retrieval
431
+ ### Audit Data Integration
433
432
 
434
- **Example: Debugging Security Issues**
433
+ **Example: Security Issue Analysis**
435
434
 
436
435
  ```bash
437
- # Task Mode for debugging
438
- /cfn-loop-task "Fix security vulnerability in auth module" --mode=standard
439
-
440
- # Product Owner spawned in Task Mode:
436
+ # Product Owner workflow:
441
437
  # 1. Receives Loop 2 results from coordinator
442
438
  # 2. Optionally retrieves audit data for context
443
439
  # 3. Makes decision with audit insights
@@ -460,7 +456,7 @@ Agent Performance: Recommend involving security-specialist agent in next iterati
460
456
  1. **Pattern Recognition**: Identifies recurring concerns across iterations
461
457
  2. **Agent Reliability**: Tracks which agents perform best on specific task types
462
458
  3. **Confidence Adjustment**: Modifies confidence based on historical success rates
463
- 4. **Cross-Mode Analysis**: Compares performance between Task Mode and CLI Mode
459
+ 4. **Performance Analysis**: Compares agent effectiveness across different scenarios
464
460
  5. **Decision Context**: Provides rich context for strategic decision-making
465
461
 
466
462
  ### Key Features
@@ -314,4 +314,4 @@ Test Execution Summary:
314
314
  - Gate Status: PASS (≥95% in 2/3 suites, ≥80% overall)
315
315
  ```
316
316
 
317
- **Note:** Coordination instructions and success criteria provided when spawned via CLI.
317
+ **Note:** Coordination handled automatically by the system.
@@ -258,4 +258,4 @@ Code Quality Test Execution Summary:
258
258
  - Gate Status: PASS (≥95% overall, actionable debt prioritization provided)
259
259
  ```
260
260
 
261
- **Note:** Coordination instructions and success criteria provided when spawned via CLI.
261
+ **Note:** Coordination handled automatically by the system.
@@ -289,4 +289,4 @@ Performance Analysis Test Summary:
289
289
  - Gate Status: PASS (≥95% in 1/3 suites, actionable recommendations provided)
290
290
  ```
291
291
 
292
- **Note:** Coordination instructions and success criteria provided when spawned via CLI.
292
+ **Note:** Coordination handled automatically by the system.
@@ -133,7 +133,7 @@ Benchmark Test Execution Summary:
133
133
  - Gate Status: PASS (≥95% in 1/3 suites, latency anomalies noted)
134
134
  ```
135
135
 
136
- **Note:** Coordination instructions and success criteria provided when spawned via CLI.
136
+ **Note:** Coordination handled automatically by the system.
137
137
 
138
138
  ## Team Dynamics
139
139
 
@@ -218,7 +218,7 @@ Security Test Execution Summary:
218
218
  - Gate Status: PASS (≥95% overall, zero critical vulnerabilities)
219
219
  ```
220
220
 
221
- **Note:** Coordination instructions and success criteria provided when spawned via CLI.
221
+ **Note:** Coordination handled automatically by the system.
222
222
 
223
223
  ## Success Metrics
224
224
 
@@ -760,43 +760,15 @@ DO NOT report subjective confidence scores. Instead:
760
760
  - ❌ OLD: "Confidence: 0.90 - API tests are comprehensive"
761
761
  - ✅ NEW: "API Tests: 58/60 passed (96.7% pass rate) - 2 schema validation edge cases need work"
762
762
 
763
- ## Completion Protocol (Test-Driven)
763
+ ## Completion Protocol
764
764
 
765
- Complete your work and provide test-based validation:
765
+ Complete your work and provide a structured response with:
766
+ - Confidence score (0.0-1.0) based on work quality
767
+ - Summary of work completed
768
+ - List of deliverables created
769
+ - Any recommendations or findings
766
770
 
767
- 1. **Execute Tests**: Run all API test suites from success criteria
768
-
769
- ```bash
770
- # Parse natively (no external dependencies)
771
- PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
772
- FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
773
- TOTAL=$((PASS + FAIL))
774
- RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
775
-
776
- # Return results (Main Chat receives automatically in Task Mode)
777
- echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
778
- ```
779
-
780
- 2. **Validate Results**:
781
- - Coverage: ≥80%
782
- - Contract tests: X/Y passed
783
- - Security tests: X/Y passed
784
-
785
- 3. **Store Results**: Use test-results key (not confidence key)
786
- 4. **Signal Completion**: Push to completion queue
787
-
788
- **Example Report:**
789
- ```text
790
- API Testing Summary:
791
- - Contract Tests: 20/20 passed (100%)
792
- - Schema Validation Tests: 18/18 passed (100%)
793
- - Security Tests: 12/12 passed (100%)
794
- - Load Tests: 8/10 passed (80%)
795
- - Overall: 58/60 passed (96.7%)
796
- - Coverage: 85.3%
797
- - All Endpoints Tested: Yes
798
- - Gate Status: PASS (≥95% overall, 100% security coverage)
799
- ```
771
+ **Note:** Coordination handled automatically by the system.
800
772
 
801
773
  ## Skill References
802
774
  → **Contract Testing**: `.claude/skills/pact-contract-testing/SKILL.md`
@@ -921,44 +921,15 @@ DO NOT report subjective confidence scores. Instead:
921
921
  - ❌ OLD: "Confidence: 0.92 - chaos tests comprehensive"
922
922
  - ✅ NEW: "Chaos Tests: 46/48 passed (95.8% pass rate) - 2 network partition scenarios need tuning"
923
923
 
924
- ## Completion Protocol (Test-Driven)
924
+ ## Completion Protocol
925
925
 
926
- Complete your work and provide test-based validation:
926
+ Complete your work and provide a structured response with:
927
+ - Confidence score (0.0-1.0) based on work quality
928
+ - Summary of work completed
929
+ - List of deliverables created
930
+ - Any recommendations or findings
927
931
 
928
- 1. **Execute Tests**: Run all chaos experiment test suites from success criteria
929
-
930
- ```bash
931
- # Parse natively (no external dependencies)
932
- PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
933
- FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
934
- TOTAL=$((PASS + FAIL))
935
- RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
936
-
937
- # Return results (Main Chat receives automatically in Task Mode)
938
- echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
939
- ```
940
-
941
- 2. **Validate Results**:
942
- - Coverage: ≥80%
943
- - Critical paths covered: X/Y
944
- - System resilience verified: Yes/No
945
-
946
- 3. **Store Results**: Use test-results key (not confidence key)
947
- 5. **Signal Completion**: Push to completion queue
948
-
949
- **Example Report:**
950
- ```
951
- Chaos Engineering Test Summary:
952
- - Pod Failure Tests: 10/10 passed (100%)
953
- - Network Chaos Tests: 14/16 passed (87.5%)
954
- - Resource Stress Tests: 12/12 passed (100%)
955
- - Disaster Recovery Tests: 10/10 passed (100%)
956
- - Overall: 46/48 passed (95.8%)
957
- - Coverage: 86.2%
958
- - Critical Paths Tested: 12/12 (100%)
959
- - System Resilience Verified: Yes
960
- - Gate Status: PASS (≥95% overall, all critical paths validated)
961
- ```
932
+ **Note:** Coordination handled automatically by the system.
962
933
 
963
934
  ## Deliverables
964
935
 
@@ -982,3 +953,13 @@ Chaos Engineering Test Summary:
982
953
  → **Failure Injection**: `.claude/skills/failure-injection/SKILL.md`
983
954
  → **Gameday Planning**: `.claude/skills/gameday-runbooks/SKILL.md`
984
955
  → **Resilience Testing**: `.claude/skills/resilience-validation/SKILL.md`
956
+
957
+ ## Completion Protocol
958
+
959
+ Complete your work and provide a structured response with:
960
+ - Confidence score (0.0-1.0) based on work quality
961
+ - Summary of work completed
962
+ - List of deliverables created
963
+ - Any recommendations or findings
964
+
965
+ **Note:** Coordination handled automatically by the system.
@@ -93,17 +93,6 @@ echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
93
93
  # Report completion (no confidence score)
94
94
  ```
95
95
 
96
- ### 4. Completion Protocol
97
-
98
- **DO NOT** report confidence scores. Report test metrics:
99
- ```bash
100
- echo "Contract Test Results:"
101
- echo " Total Contracts: 15"
102
- echo " Verified: 15"
103
- echo " Failed: 0"
104
- echo " Pass Rate: 100%"
105
- ```
106
-
107
96
  ---
108
97
 
109
98
  ## Role: Contract Testing Specialist (Loop 2 Validator)
@@ -716,3 +705,13 @@ pip install pact-python
716
705
  - Good: 0.85-0.95 (minor issues, non-breaking)
717
706
  - Poor: <0.85 (breaking changes, contract failures)
718
707
  - Critical: <0.5 (adapter bugs, major contract violations)
708
+
709
+ ## Completion Protocol
710
+
711
+ Complete your work and provide a structured response with:
712
+ - Confidence score (0.0-1.0) based on work quality
713
+ - Summary of work completed
714
+ - List of deliverables created
715
+ - Any recommendations or findings
716
+
717
+ **Note:** Coordination handled automatically by the system.
@@ -107,10 +107,10 @@ await sqlite.memoryAdapter.set(
107
107
  ## Completion Protocol
108
108
 
109
109
  Complete your work and provide a structured response with:
110
- - Confidence score (0.0-1.0) based on test coverage and quality
111
- - Summary of E2E testing completed
112
- - List of test cases executed and results
113
- - Performance metrics and any issues identified
110
+ - Confidence score (0.0-1.0) based on work quality
111
+ - Summary of work completed
112
+ - List of deliverables created
113
+ - Any recommendations or findings
114
114
 
115
- **Note:** Coordination instructions are provided when spawned via CLI.
115
+ **Note:** Coordination handled automatically by the system.
116
116
 
@@ -81,18 +81,6 @@ echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
81
81
  # Report completion (no confidence score)
82
82
  ```
83
83
 
84
- ### 4. Completion Protocol
85
-
86
- **DO NOT** report confidence scores. Report test metrics:
87
- ```bash
88
- echo "Integration Test Results:"
89
- echo " Total Workflows: 12"
90
- echo " Passed: 11"
91
- echo " Failed: 1"
92
- echo " Pass Rate: 92%"
93
- echo " Critical Workflows: 100% (all passed)"
94
- ```
95
-
96
84
  ---
97
85
 
98
86
  ## Role: Integration Testing Specialist (Loop 2 Validator)
@@ -815,3 +803,13 @@ afterAll(async () => {
815
803
  - ✅ **Race Conditions**: Concurrent update tests catch double-spend bugs
816
804
  - ✅ **Cascade Deletion**: Referential integrity tests catch orphaned records
817
805
  - ✅ **Cross-Service**: Orchestration tests catch integration breaks
806
+
807
+ ## Completion Protocol
808
+
809
+ Complete your work and provide a structured response with:
810
+ - Confidence score (0.0-1.0) based on work quality
811
+ - Summary of work completed
812
+ - List of deliverables created
813
+ - Any recommendations or findings
814
+
815
+ **Note:** Coordination handled automatically by the system.
@@ -196,42 +196,13 @@ DO NOT report subjective confidence scores. Instead:
196
196
  - ❌ OLD: "Confidence: 0.87 - interaction tests comprehensive"
197
197
  - ✅ NEW: "Interaction Tests: 52/55 passed (94.5% pass rate) - 3 accessibility edge cases found"
198
198
 
199
- ## Completion Protocol (Test-Driven)
199
+ ## Completion Protocol
200
200
 
201
- Complete your work and provide test-based validation:
201
+ Complete your work and provide a structured response with:
202
+ - Confidence score (0.0-1.0) based on work quality
203
+ - Summary of work completed
204
+ - List of deliverables created
205
+ - Any recommendations or findings
202
206
 
203
- 1. **Execute Tests**: Run all interaction test suites from success criteria
204
- ```bash
205
- # Parse natively (no external dependencies)
206
- PASS=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= passing)' || echo "0")
207
- FAIL=$(echo "$TEST_OUTPUT" | grep -oP '\d+(?= failing)' || echo "0")
208
- TOTAL=$((PASS + FAIL))
209
- RATE=$(awk "BEGIN {if ($TOTAL > 0) printf \"%.2f\", $PASS/$TOTAL; else print \"0.00\"}")
210
-
211
- # Return results (Main Chat receives automatically in Task Mode)
212
- echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
213
- ```
214
-
215
- 2. **Validate Results**:
216
- - Coverage: ≥80%
217
- - WCAG AA compliance: Yes/No
218
- - Critical flows covered: X/Y
219
-
220
- 3. **Store Results**: Use test-results key (not confidence key)
221
- 4. **Signal Completion**: Push to completion queue
222
-
223
- **Example Report:**
224
- ```
225
- Interaction Testing Summary:
226
- - Integration Tests: 24/25 passed (96%)
227
- - E2E User Flow Tests: 18/20 passed (90%)
228
- - Accessibility Tests: 10/10 passed (100%)
229
- - Overall: 52/55 passed (94.5%)
230
- - Coverage: 87.2%
231
- - WCAG AA Compliance: Yes
232
- - Critical Flows: 8/8 (100%)
233
- - Gate Status: PASS (≥95% in 1/3 suites, accessibility validated)
234
- ```
235
-
236
- **Note:** Coordination instructions and success criteria provided when spawned via CLI.
207
+ **Note:** Coordination handled automatically by the system.
237
208
 
@@ -75,18 +75,6 @@ echo "{\"passed\": $PASS, \"failed\": $FAIL, \"pass_rate\": $RATE}"
75
75
  # Report completion (no confidence score)
76
76
  ```
77
77
 
78
- ### 4. Completion Protocol
79
-
80
- **DO NOT** report confidence scores. Report performance metrics:
81
- ```bash
82
- echo "Load Test Results:"
83
- echo " RPS: 1200 (threshold: ≥1000)"
84
- echo " P95 Latency: 450ms (threshold: <500ms)"
85
- echo " P99 Latency: 850ms (threshold: <1000ms)"
86
- echo " Error Rate: 0.1% (threshold: <1%)"
87
- echo " Pass Rate: 100%"
88
- ```
89
-
90
78
  ---
91
79
 
92
80
  ## Core Responsibilities
@@ -535,3 +523,13 @@ Servers Needed = RPS Required / RPS Per Server
535
523
  - Monitoring system resources during tests
536
524
  - Analyzing performance over extended duration
537
525
  - Validating error handling under stress
526
+
527
+ ## Completion Protocol
528
+
529
+ Complete your work and provide a structured response with:
530
+ - Confidence score (0.0-1.0) based on work quality
531
+ - Summary of work completed
532
+ - List of deliverables created
533
+ - Any recommendations or findings
534
+
535
+ **Note:** Coordination handled automatically by the system.
@@ -72,18 +72,6 @@ MUTATION_SCORE=$(echo "$TEST_OUTPUT" | grep -oP 'Mutation score: \K[0-9.]+')
72
72
  # Report completion (no confidence score)
73
73
  ```
74
74
 
75
- ### 4. Completion Protocol
76
-
77
- **DO NOT** report confidence scores. Report mutation metrics:
78
- ```bash
79
- echo "Mutation Testing Results:"
80
- echo " Mutants Generated: 145"
81
- echo " Mutants Killed: 132"
82
- echo " Mutants Survived: 13"
83
- echo " Mutation Score: 91%"
84
- echo " Threshold: 85% (PASS)"
85
- ```
86
-
87
75
  ---
88
76
 
89
77
  ## Role: Mutation Testing Specialist (Loop 2 Validator)
@@ -666,3 +654,13 @@ echo "Consensus: $CONSENSUS"
666
654
  - Prevents false sense of security from high coverage
667
655
  - Identifies boundary condition bugs
668
656
  - Validates logical operator correctness
657
+
658
+ ## Completion Protocol
659
+
660
+ Complete your work and provide a structured response with:
661
+ - Confidence score (0.0-1.0) based on work quality
662
+ - Summary of work completed
663
+ - List of deliverables created
664
+ - Any recommendations or findings
665
+
666
+ **Note:** Coordination handled automatically by the system.