moflo 4.9.21 → 4.9.23

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (194)
  1. package/.claude/agents/analysis/analyze-code-quality.md +0 -121
  2. package/.claude/agents/analysis/code-analyzer.md +5 -26
  3. package/.claude/agents/architecture/system-design/arch-system-design.md +0 -119
  4. package/.claude/agents/base-template-generator.md +0 -1
  5. package/.claude/agents/core/coder.md +0 -22
  6. package/.claude/agents/core/planner.md +0 -16
  7. package/.claude/agents/core/researcher.md +0 -16
  8. package/.claude/agents/core/reviewer.md +0 -17
  9. package/.claude/agents/core/tester.md +0 -19
  10. package/.claude/agents/custom/test-long-runner.md +0 -2
  11. package/.claude/agents/development/dev-backend-api.md +0 -167
  12. package/.claude/agents/development/dev-database.md +43 -0
  13. package/.claude/agents/development/dev-frontend.md +42 -0
  14. package/.claude/agents/devops/ci-cd/ops-cicd-github.md +0 -112
  15. package/.claude/agents/documentation/api-docs/docs-api-openapi.md +0 -111
  16. package/.claude/agents/security/security-auditor.md +45 -0
  17. package/.claude/guidance/shipped/moflo-cli-reference.md +19 -16
  18. package/.claude/guidance/shipped/moflo-core-guidance.md +0 -2
  19. package/.claude/guidance/shipped/moflo-guidance-rules.md +5 -5
  20. package/.claude/guidance/shipped/moflo-spell-runner.md +1 -0
  21. package/.claude/guidance/shipped/moflo-spell-scheduling.md +225 -0
  22. package/.claude/guidance/shipped/moflo-spell-troubleshooting.md +1 -0
  23. package/.claude/helpers/gate.cjs +70 -3
  24. package/.claude/skills/fl/execution-modes.md +38 -15
  25. package/.claude/skills/fl/phases.md +67 -0
  26. package/.claude/skills/spell-schedule/SKILL.md +18 -5
  27. package/README.md +1 -1
  28. package/bin/gate.cjs +70 -3
  29. package/bin/index-guidance.mjs +32 -6
  30. package/bin/lib/retired-files.mjs +146 -0
  31. package/bin/session-start-launcher.mjs +116 -8
  32. package/dist/src/cli/appliance/rvfa-builder.js +1 -1
  33. package/dist/src/cli/commands/agent.js +3 -9
  34. package/dist/src/cli/commands/daemon.js +13 -17
  35. package/dist/src/cli/commands/hooks.js +4 -9
  36. package/dist/src/cli/commands/index.js +2 -0
  37. package/dist/src/cli/commands/retire.js +111 -0
  38. package/dist/src/cli/commands/spell-schedule.js +237 -49
  39. package/dist/src/cli/hooks/reasoningbank/index.js +7 -7
  40. package/dist/src/cli/init/executor.js +26 -54
  41. package/dist/src/cli/init/helpers-generator.js +66 -3
  42. package/dist/src/cli/init/settings-generator.js +17 -6
  43. package/dist/src/cli/mcp-tools/agent-tools.js +9 -27
  44. package/dist/src/cli/mcp-tools/hooks-tools.js +23 -21
  45. package/dist/src/cli/mcp-tools/memory-tools.js +16 -5
  46. package/dist/src/cli/memory/bridge-embedder.js +26 -6
  47. package/dist/src/cli/memory/bridge-entries.js +33 -15
  48. package/dist/src/cli/memory/controllers/semantic-router.js +18 -12
  49. package/dist/src/cli/memory/sona-optimizer.js +6 -6
  50. package/dist/src/cli/neural/domain/services/learning-service.js +3 -3
  51. package/dist/src/cli/services/agent-router.js +2 -5
  52. package/dist/src/cli/services/daemon-autostart-lifecycle.js +62 -0
  53. package/dist/src/cli/services/daemon-dashboard.js +187 -18
  54. package/dist/src/cli/services/daemon-readiness.js +19 -31
  55. package/dist/src/cli/services/ephemeral-namespace-purge.js +61 -33
  56. package/dist/src/cli/services/headless-worker-executor.js +7 -94
  57. package/dist/src/cli/services/hook-block-hash.js +4 -0
  58. package/dist/src/cli/services/worker-daemon.js +40 -66
  59. package/dist/src/cli/shared/events/example-usage.js +6 -6
  60. package/dist/src/cli/shared/hooks/task-hooks.js +8 -8
  61. package/dist/src/cli/spells/core/runner.js +12 -0
  62. package/dist/src/cli/spells/scheduler/scheduler.js +24 -9
  63. package/dist/src/cli/spells/schema/validator.js +2 -1
  64. package/dist/src/cli/spells/schema/validators/top-level.js +18 -0
  65. package/dist/src/cli/version.js +1 -1
  66. package/package.json +5 -2
  67. package/retired-files.json +1989 -0
  68. package/src/cli/data/model-registry.json +2 -2
  69. package/.claude/agents/consensus/byzantine-coordinator.md +0 -63
  70. package/.claude/agents/consensus/crdt-synchronizer.md +0 -997
  71. package/.claude/agents/consensus/gossip-coordinator.md +0 -63
  72. package/.claude/agents/consensus/performance-benchmarker.md +0 -851
  73. package/.claude/agents/consensus/quorum-manager.md +0 -823
  74. package/.claude/agents/consensus/raft-manager.md +0 -63
  75. package/.claude/agents/consensus/security-manager.md +0 -622
  76. package/.claude/agents/data/ml/data-ml-model.md +0 -193
  77. package/.claude/agents/github/code-review-swarm.md +0 -538
  78. package/.claude/agents/github/github-modes.md +0 -172
  79. package/.claude/agents/github/issue-tracker.md +0 -311
  80. package/.claude/agents/github/multi-repo-swarm.md +0 -551
  81. package/.claude/agents/github/pr-manager.md +0 -183
  82. package/.claude/agents/github/project-board-sync.md +0 -508
  83. package/.claude/agents/github/release-manager.md +0 -360
  84. package/.claude/agents/github/release-swarm.md +0 -580
  85. package/.claude/agents/github/repo-architect.md +0 -391
  86. package/.claude/agents/github/swarm-issue.md +0 -566
  87. package/.claude/agents/github/swarm-pr.md +0 -414
  88. package/.claude/agents/github/sync-coordinator.md +0 -426
  89. package/.claude/agents/github/workflow-automation.md +0 -606
  90. package/.claude/agents/goal/code-goal-planner.md +0 -440
  91. package/.claude/agents/goal/goal-planner.md +0 -168
  92. package/.claude/agents/hive-mind/collective-intelligence-coordinator.md +0 -127
  93. package/.claude/agents/hive-mind/queen-coordinator.md +0 -198
  94. package/.claude/agents/hive-mind/scout-explorer.md +0 -233
  95. package/.claude/agents/hive-mind/swarm-memory-manager.md +0 -184
  96. package/.claude/agents/hive-mind/worker-specialist.md +0 -208
  97. package/.claude/agents/neural/safla-neural.md +0 -73
  98. package/.claude/agents/optimization/benchmark-suite.md +0 -665
  99. package/.claude/agents/optimization/load-balancer.md +0 -431
  100. package/.claude/agents/optimization/performance-monitor.md +0 -672
  101. package/.claude/agents/optimization/resource-allocator.md +0 -674
  102. package/.claude/agents/optimization/topology-optimizer.md +0 -808
  103. package/.claude/agents/reasoning/goal-planner.md +0 -67
  104. package/.claude/agents/sona/sona-learning-optimizer.md +0 -74
  105. package/.claude/agents/sparc/architecture.md +0 -472
  106. package/.claude/agents/sparc/pseudocode.md +0 -318
  107. package/.claude/agents/sparc/refinement.md +0 -525
  108. package/.claude/agents/sparc/specification.md +0 -276
  109. package/.claude/agents/specialized/mobile/spec-mobile-react-native.md +0 -225
  110. package/.claude/agents/swarm/adaptive-coordinator.md +0 -391
  111. package/.claude/agents/swarm/hierarchical-coordinator.md +0 -321
  112. package/.claude/agents/swarm/mesh-coordinator.md +0 -383
  113. package/.claude/agents/testing/production-validator.md +0 -395
  114. package/.claude/agents/testing/tdd-london-swarm.md +0 -244
  115. package/.claude/agents/v3/adr-architect.md +0 -184
  116. package/.claude/agents/v3/aidefence-guardian.md +0 -277
  117. package/.claude/agents/v3/claims-authorizer.md +0 -208
  118. package/.claude/agents/v3/collective-intelligence-coordinator.md +0 -988
  119. package/.claude/agents/v3/ddd-domain-expert.md +0 -220
  120. package/.claude/agents/v3/injection-analyst.md +0 -232
  121. package/.claude/agents/v3/memory-specialist.md +0 -987
  122. package/.claude/agents/v3/performance-engineer.md +0 -1225
  123. package/.claude/agents/v3/pii-detector.md +0 -146
  124. package/.claude/agents/v3/reasoningbank-learner.md +0 -213
  125. package/.claude/agents/v3/security-architect-aidefence.md +0 -405
  126. package/.claude/agents/v3/security-architect.md +0 -865
  127. package/.claude/agents/v3/security-auditor.md +0 -771
  128. package/.claude/agents/v3/sparc-orchestrator.md +0 -182
  129. package/.claude/agents/v3/swarm-memory-manager.md +0 -142
  130. package/.claude/agents/v3/v3-integration-architect.md +0 -205
  131. package/.claude/commands/claude-flow-help.md +0 -103
  132. package/.claude/commands/claude-flow-memory.md +0 -107
  133. package/.claude/commands/claude-flow-swarm.md +0 -205
  134. package/.claude/commands/flo-simplify.md +0 -101
  135. package/.claude/commands/github/README.md +0 -11
  136. package/.claude/commands/github/code-review-swarm.md +0 -514
  137. package/.claude/commands/github/code-review.md +0 -25
  138. package/.claude/commands/github/github-modes.md +0 -146
  139. package/.claude/commands/github/github-swarm.md +0 -113
  140. package/.claude/commands/github/issue-tracker.md +0 -284
  141. package/.claude/commands/github/issue-triage.md +0 -25
  142. package/.claude/commands/github/multi-repo-swarm.md +0 -519
  143. package/.claude/commands/github/pr-enhance.md +0 -26
  144. package/.claude/commands/github/pr-manager.md +0 -164
  145. package/.claude/commands/github/project-board-sync.md +0 -471
  146. package/.claude/commands/github/release-manager.md +0 -332
  147. package/.claude/commands/github/release-swarm.md +0 -544
  148. package/.claude/commands/github/repo-analyze.md +0 -25
  149. package/.claude/commands/github/repo-architect.md +0 -361
  150. package/.claude/commands/github/swarm-issue.md +0 -482
  151. package/.claude/commands/github/swarm-pr.md +0 -285
  152. package/.claude/commands/github/sync-coordinator.md +0 -294
  153. package/.claude/commands/github/workflow-automation.md +0 -442
  154. package/.claude/commands/hooks/README.md +0 -11
  155. package/.claude/commands/hooks/overview.md +0 -58
  156. package/.claude/commands/hooks/post-edit.md +0 -117
  157. package/.claude/commands/hooks/post-task.md +0 -112
  158. package/.claude/commands/hooks/pre-edit.md +0 -113
  159. package/.claude/commands/hooks/pre-task.md +0 -111
  160. package/.claude/commands/hooks/session-end.md +0 -118
  161. package/.claude/commands/hooks/setup.md +0 -103
  162. package/.claude/commands/sparc/analyzer.md +0 -42
  163. package/.claude/commands/sparc/architect.md +0 -43
  164. package/.claude/commands/sparc/ask.md +0 -86
  165. package/.claude/commands/sparc/batch-executor.md +0 -44
  166. package/.claude/commands/sparc/code.md +0 -78
  167. package/.claude/commands/sparc/coder.md +0 -44
  168. package/.claude/commands/sparc/debug.md +0 -72
  169. package/.claude/commands/sparc/debugger.md +0 -44
  170. package/.claude/commands/sparc/designer.md +0 -43
  171. package/.claude/commands/sparc/devops.md +0 -98
  172. package/.claude/commands/sparc/docs-writer.md +0 -69
  173. package/.claude/commands/sparc/documenter.md +0 -44
  174. package/.claude/commands/sparc/innovator.md +0 -44
  175. package/.claude/commands/sparc/integration.md +0 -72
  176. package/.claude/commands/sparc/mcp.md +0 -106
  177. package/.claude/commands/sparc/memory-manager.md +0 -44
  178. package/.claude/commands/sparc/optimizer.md +0 -44
  179. package/.claude/commands/sparc/orchestrator.md +0 -116
  180. package/.claude/commands/sparc/post-deployment-monitoring-mode.md +0 -72
  181. package/.claude/commands/sparc/refinement-optimization-mode.md +0 -72
  182. package/.claude/commands/sparc/researcher.md +0 -44
  183. package/.claude/commands/sparc/reviewer.md +0 -44
  184. package/.claude/commands/sparc/security-review.md +0 -69
  185. package/.claude/commands/sparc/sparc-modes.md +0 -139
  186. package/.claude/commands/sparc/sparc.md +0 -99
  187. package/.claude/commands/sparc/spec-pseudocode.md +0 -69
  188. package/.claude/commands/sparc/spell-manager.md +0 -44
  189. package/.claude/commands/sparc/supabase-admin.md +0 -337
  190. package/.claude/commands/sparc/swarm-coordinator.md +0 -44
  191. package/.claude/commands/sparc/tdd.md +0 -44
  192. package/.claude/commands/sparc/tester.md +0 -44
  193. package/.claude/commands/sparc/tutorial.md +0 -68
  194. package/.claude/commands/sparc.md +0 -151
@@ -1,665 +0,0 @@
1
- ---
2
- name: Benchmark Suite
3
- type: agent
4
- category: optimization
5
- description: Comprehensive performance benchmarking, regression detection and performance validation
6
- ---
7
-
8
- # Benchmark Suite Agent
9
-
10
- ## Agent Profile
11
- - **Name**: Benchmark Suite
12
- - **Type**: Performance Optimization Agent
13
- - **Specialization**: Comprehensive performance benchmarking and testing
14
- - **Performance Focus**: Automated benchmarking, regression detection, and performance validation
15
-
16
- ## Core Capabilities
17
-
18
- ### 1. Comprehensive Benchmarking Framework
19
- ```javascript
20
- // Advanced benchmarking system
21
- class ComprehensiveBenchmarkSuite {
22
- constructor() {
23
- this.benchmarks = {
24
- // Core performance benchmarks
25
- throughput: new ThroughputBenchmark(),
26
- latency: new LatencyBenchmark(),
27
- scalability: new ScalabilityBenchmark(),
28
- resource_usage: new ResourceUsageBenchmark(),
29
-
30
- // Swarm-specific benchmarks
31
- coordination: new CoordinationBenchmark(),
32
- load_balancing: new LoadBalancingBenchmark(),
33
- topology: new TopologyBenchmark(),
34
- fault_tolerance: new FaultToleranceBenchmark(),
35
-
36
- // Custom benchmarks
37
- custom: new CustomBenchmarkManager()
38
- };
39
-
40
- this.reporter = new BenchmarkReporter();
41
- this.comparator = new PerformanceComparator();
42
- this.analyzer = new BenchmarkAnalyzer();
43
- }
44
-
45
- // Execute comprehensive benchmark suite
46
- async runBenchmarkSuite(config = {}) {
47
- const suiteConfig = {
48
- duration: config.duration || 300000, // 5 minutes default
49
- iterations: config.iterations || 10,
50
- warmupTime: config.warmupTime || 30000, // 30 seconds
51
- cooldownTime: config.cooldownTime || 10000, // 10 seconds
52
- parallel: config.parallel || false,
53
- baseline: config.baseline || null
54
- };
55
-
56
- const results = {
57
- summary: {},
58
- detailed: new Map(),
59
- baseline_comparison: null,
60
- recommendations: []
61
- };
62
-
63
- // Warmup phase
64
- await this.warmup(suiteConfig.warmupTime);
65
-
66
- // Execute benchmarks
67
- if (suiteConfig.parallel) {
68
- results.detailed = await this.runBenchmarksParallel(suiteConfig);
69
- } else {
70
- results.detailed = await this.runBenchmarksSequential(suiteConfig);
71
- }
72
-
73
- // Generate summary
74
- results.summary = this.generateSummary(results.detailed);
75
-
76
- // Compare with baseline if provided
77
- if (suiteConfig.baseline) {
78
- results.baseline_comparison = await this.compareWithBaseline(
79
- results.detailed,
80
- suiteConfig.baseline
81
- );
82
- }
83
-
84
- // Generate recommendations
85
- results.recommendations = await this.generateRecommendations(results);
86
-
87
- // Cooldown phase
88
- await this.cooldown(suiteConfig.cooldownTime);
89
-
90
- return results;
91
- }
92
-
93
- // Parallel benchmark execution
94
- async runBenchmarksParallel(config) {
95
- const benchmarkPromises = Object.entries(this.benchmarks).map(
96
- async ([name, benchmark]) => {
97
- const result = await this.executeBenchmark(benchmark, name, config);
98
- return [name, result];
99
- }
100
- );
101
-
102
- const results = await Promise.all(benchmarkPromises);
103
- return new Map(results);
104
- }
105
-
106
- // Sequential benchmark execution
107
- async runBenchmarksSequential(config) {
108
- const results = new Map();
109
-
110
- for (const [name, benchmark] of Object.entries(this.benchmarks)) {
111
- const result = await this.executeBenchmark(benchmark, name, config);
112
- results.set(name, result);
113
-
114
- // Brief pause between benchmarks
115
- await this.sleep(1000);
116
- }
117
-
118
- return results;
119
- }
120
- }
121
- ```
122
-
123
- ### 2. Performance Regression Detection
124
- ```javascript
125
- // Advanced regression detection system
126
- class RegressionDetector {
127
- constructor() {
128
- this.detectors = {
129
- statistical: new StatisticalRegressionDetector(),
130
- machine_learning: new MLRegressionDetector(),
131
- threshold: new ThresholdRegressionDetector(),
132
- trend: new TrendRegressionDetector()
133
- };
134
-
135
- this.analyzer = new RegressionAnalyzer();
136
- this.alerting = new RegressionAlerting();
137
- }
138
-
139
- // Detect performance regressions
140
- async detectRegressions(currentResults, historicalData, config = {}) {
141
- const regressions = {
142
- detected: [],
143
- severity: 'none',
144
- confidence: 0,
145
- analysis: {}
146
- };
147
-
148
- // Run multiple detection algorithms
149
- const detectionPromises = Object.entries(this.detectors).map(
150
- async ([method, detector]) => {
151
- const detection = await detector.detect(currentResults, historicalData, config);
152
- return [method, detection];
153
- }
154
- );
155
-
156
- const detectionResults = await Promise.all(detectionPromises);
157
-
158
- // Aggregate detection results
159
- for (const [method, detection] of detectionResults) {
160
- if (detection.regression_detected) {
161
- regressions.detected.push({
162
- method,
163
- ...detection
164
- });
165
- }
166
- }
167
-
168
- // Calculate overall confidence and severity
169
- if (regressions.detected.length > 0) {
170
- regressions.confidence = this.calculateAggregateConfidence(regressions.detected);
171
- regressions.severity = this.calculateSeverity(regressions.detected);
172
- regressions.analysis = await this.analyzer.analyze(regressions.detected);
173
- }
174
-
175
- return regressions;
176
- }
177
-
178
- // Statistical regression detection using change point analysis
179
- async detectStatisticalRegression(metric, historicalData, sensitivity = 0.95) {
180
- // Use CUSUM (Cumulative Sum) algorithm for change point detection
181
- const cusum = this.calculateCUSUM(metric, historicalData);
182
-
183
- // Detect change points
184
- const changePoints = this.detectChangePoints(cusum, sensitivity);
185
-
186
- // Analyze significance of changes
187
- const analysis = changePoints.map(point => ({
188
- timestamp: point.timestamp,
189
- magnitude: point.magnitude,
190
- direction: point.direction,
191
- significance: point.significance,
192
- confidence: point.confidence
193
- }));
194
-
195
- return {
196
- regression_detected: changePoints.length > 0,
197
- change_points: analysis,
198
- cusum_statistics: cusum.statistics,
199
- sensitivity: sensitivity
200
- };
201
- }
202
-
203
- // Machine learning-based regression detection
204
- async detectMLRegression(metrics, historicalData) {
205
- // Train anomaly detection model on historical data
206
- const model = await this.trainAnomalyModel(historicalData);
207
-
208
- // Predict anomaly scores for current metrics
209
- const anomalyScores = await model.predict(metrics);
210
-
211
- // Identify regressions based on anomaly scores
212
- const threshold = this.calculateDynamicThreshold(anomalyScores);
213
- const regressions = anomalyScores.filter(score => score.anomaly > threshold);
214
-
215
- return {
216
- regression_detected: regressions.length > 0,
217
- anomaly_scores: anomalyScores,
218
- threshold: threshold,
219
- regressions: regressions,
220
- model_confidence: model.confidence
221
- };
222
- }
223
- }
224
- ```
225
-
226
- ### 3. Automated Performance Testing
227
- ```javascript
228
- // Comprehensive automated performance testing
229
- class AutomatedPerformanceTester {
230
- constructor() {
231
- this.testSuites = {
232
- load: new LoadTestSuite(),
233
- stress: new StressTestSuite(),
234
- volume: new VolumeTestSuite(),
235
- endurance: new EnduranceTestSuite(),
236
- spike: new SpikeTestSuite(),
237
- configuration: new ConfigurationTestSuite()
238
- };
239
-
240
- this.scheduler = new TestScheduler();
241
- this.orchestrator = new TestOrchestrator();
242
- this.validator = new ResultValidator();
243
- }
244
-
245
- // Execute automated performance test campaign
246
- async runTestCampaign(config) {
247
- const campaign = {
248
- id: this.generateCampaignId(),
249
- config,
250
- startTime: Date.now(),
251
- tests: [],
252
- results: new Map(),
253
- summary: null
254
- };
255
-
256
- // Schedule test execution
257
- const schedule = await this.scheduler.schedule(config.tests, config.constraints);
258
-
259
- // Execute tests according to schedule
260
- for (const scheduledTest of schedule) {
261
- const testResult = await this.executeScheduledTest(scheduledTest);
262
- campaign.tests.push(scheduledTest);
263
- campaign.results.set(scheduledTest.id, testResult);
264
-
265
- // Validate results in real-time
266
- const validation = await this.validator.validate(testResult);
267
- if (!validation.valid) {
268
- campaign.summary = {
269
- status: 'failed',
270
- reason: validation.reason,
271
- failedAt: scheduledTest.name
272
- };
273
- break;
274
- }
275
- }
276
-
277
- // Generate campaign summary
278
- if (!campaign.summary) {
279
- campaign.summary = await this.generateCampaignSummary(campaign);
280
- }
281
-
282
- campaign.endTime = Date.now();
283
- campaign.duration = campaign.endTime - campaign.startTime;
284
-
285
- return campaign;
286
- }
287
-
288
- // Load testing with gradual ramp-up
289
- async executeLoadTest(config) {
290
- const loadTest = {
291
- type: 'load',
292
- config,
293
- phases: [],
294
- metrics: new Map(),
295
- results: {}
296
- };
297
-
298
- // Ramp-up phase
299
- const rampUpResult = await this.executeRampUp(config.rampUp);
300
- loadTest.phases.push({ phase: 'ramp-up', result: rampUpResult });
301
-
302
- // Sustained load phase
303
- const sustainedResult = await this.executeSustainedLoad(config.sustained);
304
- loadTest.phases.push({ phase: 'sustained', result: sustainedResult });
305
-
306
- // Ramp-down phase
307
- const rampDownResult = await this.executeRampDown(config.rampDown);
308
- loadTest.phases.push({ phase: 'ramp-down', result: rampDownResult });
309
-
310
- // Analyze results
311
- loadTest.results = await this.analyzeLoadTestResults(loadTest.phases);
312
-
313
- return loadTest;
314
- }
315
-
316
- // Stress testing to find breaking points
317
- async executeStressTest(config) {
318
- const stressTest = {
319
- type: 'stress',
320
- config,
321
- breakingPoint: null,
322
- degradationCurve: [],
323
- results: {}
324
- };
325
-
326
- let currentLoad = config.startLoad;
327
- let systemBroken = false;
328
-
329
- while (!systemBroken && currentLoad <= config.maxLoad) {
330
- const testResult = await this.applyLoad(currentLoad, config.duration);
331
-
332
- stressTest.degradationCurve.push({
333
- load: currentLoad,
334
- performance: testResult.performance,
335
- stability: testResult.stability,
336
- errors: testResult.errors
337
- });
338
-
339
- // Check if system is breaking
340
- if (this.isSystemBreaking(testResult, config.breakingCriteria)) {
341
- stressTest.breakingPoint = {
342
- load: currentLoad,
343
- performance: testResult.performance,
344
- reason: this.identifyBreakingReason(testResult)
345
- };
346
- systemBroken = true;
347
- }
348
-
349
- currentLoad += config.loadIncrement;
350
- }
351
-
352
- stressTest.results = await this.analyzeStressTestResults(stressTest);
353
-
354
- return stressTest;
355
- }
356
- }
357
- ```
358
-
359
- ### 4. Performance Validation Framework
360
- ```javascript
361
- // Comprehensive performance validation
362
- class PerformanceValidator {
363
- constructor() {
364
- this.validators = {
365
- sla: new SLAValidator(),
366
- regression: new RegressionValidator(),
367
- scalability: new ScalabilityValidator(),
368
- reliability: new ReliabilityValidator(),
369
- efficiency: new EfficiencyValidator()
370
- };
371
-
372
- this.thresholds = new ThresholdManager();
373
- this.rules = new ValidationRuleEngine();
374
- }
375
-
376
- // Validate performance against defined criteria
377
- async validatePerformance(results, criteria) {
378
- const validation = {
379
- overall: {
380
- passed: true,
381
- score: 0,
382
- violations: []
383
- },
384
- detailed: new Map(),
385
- recommendations: []
386
- };
387
-
388
- // Run all validators
389
- const validationPromises = Object.entries(this.validators).map(
390
- async ([type, validator]) => {
391
- const result = await validator.validate(results, criteria[type]);
392
- return [type, result];
393
- }
394
- );
395
-
396
- const validationResults = await Promise.all(validationPromises);
397
-
398
- // Aggregate validation results
399
- for (const [type, result] of validationResults) {
400
- validation.detailed.set(type, result);
401
-
402
- if (!result.passed) {
403
- validation.overall.passed = false;
404
- validation.overall.violations.push(...result.violations);
405
- }
406
-
407
- validation.overall.score += result.score * (criteria[type]?.weight || 1);
408
- }
409
-
410
- // Normalize overall score
411
- const totalWeight = Object.values(criteria).reduce((sum, c) => sum + (c.weight || 1), 0);
412
- validation.overall.score /= totalWeight;
413
-
414
- // Generate recommendations
415
- validation.recommendations = await this.generateValidationRecommendations(validation);
416
-
417
- return validation;
418
- }
419
-
420
- // SLA validation
421
- async validateSLA(results, slaConfig) {
422
- const slaValidation = {
423
- passed: true,
424
- violations: [],
425
- score: 1.0,
426
- metrics: {}
427
- };
428
-
429
- // Validate each SLA metric
430
- for (const [metric, threshold] of Object.entries(slaConfig.thresholds)) {
431
- const actualValue = this.extractMetricValue(results, metric);
432
- const validation = this.validateThreshold(actualValue, threshold);
433
-
434
- slaValidation.metrics[metric] = {
435
- actual: actualValue,
436
- threshold: threshold.value,
437
- operator: threshold.operator,
438
- passed: validation.passed,
439
- deviation: validation.deviation
440
- };
441
-
442
- if (!validation.passed) {
443
- slaValidation.passed = false;
444
- slaValidation.violations.push({
445
- metric,
446
- actual: actualValue,
447
- expected: threshold.value,
448
- severity: threshold.severity || 'medium'
449
- });
450
-
451
- // Reduce score based on violation severity
452
- const severityMultiplier = this.getSeverityMultiplier(threshold.severity);
453
- slaValidation.score -= (validation.deviation * severityMultiplier);
454
- }
455
- }
456
-
457
- slaValidation.score = Math.max(0, slaValidation.score);
458
-
459
- return slaValidation;
460
- }
461
-
462
- // Scalability validation
463
- async validateScalability(results, scalabilityConfig) {
464
- const scalabilityValidation = {
465
- passed: true,
466
- violations: [],
467
- score: 1.0,
468
- analysis: {}
469
- };
470
-
471
- // Linear scalability analysis
472
- if (scalabilityConfig.linear) {
473
- const linearityAnalysis = this.analyzeLinearScalability(results);
474
- scalabilityValidation.analysis.linearity = linearityAnalysis;
475
-
476
- if (linearityAnalysis.coefficient < scalabilityConfig.linear.minCoefficient) {
477
- scalabilityValidation.passed = false;
478
- scalabilityValidation.violations.push({
479
- type: 'linearity',
480
- actual: linearityAnalysis.coefficient,
481
- expected: scalabilityConfig.linear.minCoefficient
482
- });
483
- }
484
- }
485
-
486
- // Efficiency retention analysis
487
- if (scalabilityConfig.efficiency) {
488
- const efficiencyAnalysis = this.analyzeEfficiencyRetention(results);
489
- scalabilityValidation.analysis.efficiency = efficiencyAnalysis;
490
-
491
- if (efficiencyAnalysis.retention < scalabilityConfig.efficiency.minRetention) {
492
- scalabilityValidation.passed = false;
493
- scalabilityValidation.violations.push({
494
- type: 'efficiency_retention',
495
- actual: efficiencyAnalysis.retention,
496
- expected: scalabilityConfig.efficiency.minRetention
497
- });
498
- }
499
- }
500
-
501
- return scalabilityValidation;
502
- }
503
- }
504
- ```
505
-
506
- ## MCP Integration Hooks
507
-
508
- ### Benchmark Execution Integration
509
- ```javascript
510
- // Comprehensive MCP benchmark integration
511
- const benchmarkIntegration = {
512
- // Execute performance benchmarks
513
- async runBenchmarks(config = {}) {
514
- // Run benchmark suite
515
- const benchmarkResult = await mcp.benchmark_run({
516
- suite: config.suite || 'comprehensive'
517
- });
518
-
519
- // Collect detailed metrics during benchmarking
520
- const metrics = await mcp.metrics_collect({
521
- components: ['system', 'agents', 'coordination', 'memory']
522
- });
523
-
524
- // Analyze performance trends
525
- const trends = await mcp.trend_analysis({
526
- metric: 'performance',
527
- period: '24h'
528
- });
529
-
530
- // Cost analysis
531
- const costAnalysis = await mcp.cost_analysis({
532
- timeframe: '24h'
533
- });
534
-
535
- return {
536
- benchmark: benchmarkResult,
537
- metrics,
538
- trends,
539
- costAnalysis,
540
- timestamp: Date.now()
541
- };
542
- },
543
-
544
- // Quality assessment
545
- async assessQuality(criteria) {
546
- const qualityAssessment = await mcp.quality_assess({
547
- target: 'swarm-performance',
548
- criteria: criteria || [
549
- 'throughput',
550
- 'latency',
551
- 'reliability',
552
- 'scalability',
553
- 'efficiency'
554
- ]
555
- });
556
-
557
- return qualityAssessment;
558
- },
559
-
560
- // Error pattern analysis
561
- async analyzeErrorPatterns() {
562
- // Collect system logs
563
- const logs = await this.collectSystemLogs();
564
-
565
- // Analyze error patterns
566
- const errorAnalysis = await mcp.error_analysis({
567
- logs: logs
568
- });
569
-
570
- return errorAnalysis;
571
- }
572
- };
573
- ```
574
-
575
- ## Operational Commands
576
-
577
- ### Benchmarking Commands
578
- ```bash
579
- # Run comprehensive benchmark suite
580
- npx claude-flow benchmark-run --suite comprehensive --duration 300
581
-
582
- # Execute specific benchmark
583
- npx claude-flow benchmark-run --suite throughput --iterations 10
584
-
585
- # Compare with baseline
586
- npx claude-flow benchmark-compare --current <results> --baseline <baseline>
587
-
588
- # Quality assessment
589
- npx claude-flow quality-assess --target swarm-performance --criteria throughput,latency
590
-
591
- # Performance validation
592
- npx claude-flow validate-performance --results <file> --criteria <file>
593
- ```
594
-
595
- ### Regression Detection Commands
596
- ```bash
597
- # Detect performance regressions
598
- npx claude-flow detect-regression --current <results> --historical <data>
599
-
600
- # Set up automated regression monitoring
601
- npx claude-flow regression-monitor --enable --sensitivity 0.95
602
-
603
- # Analyze error patterns
604
- npx claude-flow error-analysis --logs <log-files>
605
- ```
606
-
607
- ## Integration Points
608
-
609
- ### With Other Optimization Agents
610
- - **Performance Monitor**: Provides continuous monitoring data for benchmarking
611
- - **Load Balancer**: Validates load balancing effectiveness through benchmarks
612
- - **Topology Optimizer**: Tests topology configurations for optimal performance
613
-
614
- ### With CI/CD Pipeline
615
- - **Automated Testing**: Integrates with CI/CD for continuous performance validation
616
- - **Quality Gates**: Provides pass/fail criteria for deployment decisions
617
- - **Regression Prevention**: Catches performance regressions before production
618
-
619
- ## Performance Benchmarks
620
-
621
- ### Standard Benchmark Suite
622
- ```javascript
623
- // Comprehensive benchmark definitions
624
- const standardBenchmarks = {
625
- // Throughput benchmarks
626
- throughput: {
627
- name: 'Throughput Benchmark',
628
- metrics: ['requests_per_second', 'tasks_per_second', 'messages_per_second'],
629
- duration: 300000, // 5 minutes
630
- warmup: 30000, // 30 seconds
631
- targets: {
632
- requests_per_second: { min: 1000, optimal: 5000 },
633
- tasks_per_second: { min: 100, optimal: 500 },
634
- messages_per_second: { min: 10000, optimal: 50000 }
635
- }
636
- },
637
-
638
- // Latency benchmarks
639
- latency: {
640
- name: 'Latency Benchmark',
641
- metrics: ['p50', 'p90', 'p95', 'p99', 'max'],
642
- duration: 300000,
643
- targets: {
644
- p50: { max: 100 }, // 100ms
645
- p90: { max: 200 }, // 200ms
646
- p95: { max: 500 }, // 500ms
647
- p99: { max: 1000 }, // 1s
648
- max: { max: 5000 } // 5s
649
- }
650
- },
651
-
652
- // Scalability benchmarks
653
- scalability: {
654
- name: 'Scalability Benchmark',
655
- metrics: ['linear_coefficient', 'efficiency_retention'],
656
- load_points: [1, 2, 4, 8, 16, 32, 64],
657
- targets: {
658
- linear_coefficient: { min: 0.8 },
659
- efficiency_retention: { min: 0.7 }
660
- }
661
- }
662
- };
663
- ```
664
-
665
- This Benchmark Suite agent provides comprehensive automated performance testing, regression detection, and validation capabilities to ensure optimal swarm performance and prevent performance degradation.