moflo 4.9.21 → 4.9.22

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (170)
  1. package/.claude/agents/analysis/analyze-code-quality.md +0 -121
  2. package/.claude/agents/analysis/code-analyzer.md +5 -26
  3. package/.claude/agents/architecture/system-design/arch-system-design.md +0 -119
  4. package/.claude/agents/base-template-generator.md +0 -1
  5. package/.claude/agents/core/coder.md +0 -22
  6. package/.claude/agents/core/planner.md +0 -16
  7. package/.claude/agents/core/researcher.md +0 -16
  8. package/.claude/agents/core/reviewer.md +0 -17
  9. package/.claude/agents/core/tester.md +0 -19
  10. package/.claude/agents/custom/test-long-runner.md +0 -2
  11. package/.claude/agents/development/dev-backend-api.md +0 -167
  12. package/.claude/agents/development/dev-database.md +43 -0
  13. package/.claude/agents/development/dev-frontend.md +42 -0
  14. package/.claude/agents/devops/ci-cd/ops-cicd-github.md +0 -112
  15. package/.claude/agents/documentation/api-docs/docs-api-openapi.md +0 -111
  16. package/.claude/agents/security/security-auditor.md +45 -0
  17. package/.claude/guidance/shipped/moflo-guidance-rules.md +5 -5
  18. package/.claude/helpers/gate.cjs +70 -3
  19. package/.claude/skills/fl/execution-modes.md +38 -15
  20. package/bin/gate.cjs +70 -3
  21. package/bin/lib/retired-files.mjs +146 -0
  22. package/bin/session-start-launcher.mjs +101 -0
  23. package/dist/src/cli/appliance/rvfa-builder.js +1 -1
  24. package/dist/src/cli/commands/agent.js +3 -9
  25. package/dist/src/cli/commands/hooks.js +1 -3
  26. package/dist/src/cli/commands/index.js +2 -0
  27. package/dist/src/cli/commands/retire.js +111 -0
  28. package/dist/src/cli/hooks/reasoningbank/index.js +7 -7
  29. package/dist/src/cli/init/executor.js +26 -54
  30. package/dist/src/cli/init/helpers-generator.js +66 -3
  31. package/dist/src/cli/init/settings-generator.js +12 -0
  32. package/dist/src/cli/mcp-tools/agent-tools.js +9 -27
  33. package/dist/src/cli/mcp-tools/hooks-tools.js +23 -21
  34. package/dist/src/cli/memory/controllers/semantic-router.js +18 -12
  35. package/dist/src/cli/memory/sona-optimizer.js +6 -6
  36. package/dist/src/cli/neural/domain/services/learning-service.js +3 -3
  37. package/dist/src/cli/services/agent-router.js +2 -5
  38. package/dist/src/cli/services/hook-block-hash.js +4 -0
  39. package/dist/src/cli/shared/events/example-usage.js +6 -6
  40. package/dist/src/cli/shared/hooks/task-hooks.js +8 -8
  41. package/dist/src/cli/version.js +1 -1
  42. package/package.json +3 -2
  43. package/retired-files.json +1989 -0
  44. package/src/cli/data/model-registry.json +2 -2
  45. package/.claude/agents/consensus/byzantine-coordinator.md +0 -63
  46. package/.claude/agents/consensus/crdt-synchronizer.md +0 -997
  47. package/.claude/agents/consensus/gossip-coordinator.md +0 -63
  48. package/.claude/agents/consensus/performance-benchmarker.md +0 -851
  49. package/.claude/agents/consensus/quorum-manager.md +0 -823
  50. package/.claude/agents/consensus/raft-manager.md +0 -63
  51. package/.claude/agents/consensus/security-manager.md +0 -622
  52. package/.claude/agents/data/ml/data-ml-model.md +0 -193
  53. package/.claude/agents/github/code-review-swarm.md +0 -538
  54. package/.claude/agents/github/github-modes.md +0 -172
  55. package/.claude/agents/github/issue-tracker.md +0 -311
  56. package/.claude/agents/github/multi-repo-swarm.md +0 -551
  57. package/.claude/agents/github/pr-manager.md +0 -183
  58. package/.claude/agents/github/project-board-sync.md +0 -508
  59. package/.claude/agents/github/release-manager.md +0 -360
  60. package/.claude/agents/github/release-swarm.md +0 -580
  61. package/.claude/agents/github/repo-architect.md +0 -391
  62. package/.claude/agents/github/swarm-issue.md +0 -566
  63. package/.claude/agents/github/swarm-pr.md +0 -414
  64. package/.claude/agents/github/sync-coordinator.md +0 -426
  65. package/.claude/agents/github/workflow-automation.md +0 -606
  66. package/.claude/agents/goal/code-goal-planner.md +0 -440
  67. package/.claude/agents/goal/goal-planner.md +0 -168
  68. package/.claude/agents/hive-mind/collective-intelligence-coordinator.md +0 -127
  69. package/.claude/agents/hive-mind/queen-coordinator.md +0 -198
  70. package/.claude/agents/hive-mind/scout-explorer.md +0 -233
  71. package/.claude/agents/hive-mind/swarm-memory-manager.md +0 -184
  72. package/.claude/agents/hive-mind/worker-specialist.md +0 -208
  73. package/.claude/agents/neural/safla-neural.md +0 -73
  74. package/.claude/agents/optimization/benchmark-suite.md +0 -665
  75. package/.claude/agents/optimization/load-balancer.md +0 -431
  76. package/.claude/agents/optimization/performance-monitor.md +0 -672
  77. package/.claude/agents/optimization/resource-allocator.md +0 -674
  78. package/.claude/agents/optimization/topology-optimizer.md +0 -808
  79. package/.claude/agents/reasoning/goal-planner.md +0 -67
  80. package/.claude/agents/sona/sona-learning-optimizer.md +0 -74
  81. package/.claude/agents/sparc/architecture.md +0 -472
  82. package/.claude/agents/sparc/pseudocode.md +0 -318
  83. package/.claude/agents/sparc/refinement.md +0 -525
  84. package/.claude/agents/sparc/specification.md +0 -276
  85. package/.claude/agents/specialized/mobile/spec-mobile-react-native.md +0 -225
  86. package/.claude/agents/swarm/adaptive-coordinator.md +0 -391
  87. package/.claude/agents/swarm/hierarchical-coordinator.md +0 -321
  88. package/.claude/agents/swarm/mesh-coordinator.md +0 -383
  89. package/.claude/agents/testing/production-validator.md +0 -395
  90. package/.claude/agents/testing/tdd-london-swarm.md +0 -244
  91. package/.claude/agents/v3/adr-architect.md +0 -184
  92. package/.claude/agents/v3/aidefence-guardian.md +0 -277
  93. package/.claude/agents/v3/claims-authorizer.md +0 -208
  94. package/.claude/agents/v3/collective-intelligence-coordinator.md +0 -988
  95. package/.claude/agents/v3/ddd-domain-expert.md +0 -220
  96. package/.claude/agents/v3/injection-analyst.md +0 -232
  97. package/.claude/agents/v3/memory-specialist.md +0 -987
  98. package/.claude/agents/v3/performance-engineer.md +0 -1225
  99. package/.claude/agents/v3/pii-detector.md +0 -146
  100. package/.claude/agents/v3/reasoningbank-learner.md +0 -213
  101. package/.claude/agents/v3/security-architect-aidefence.md +0 -405
  102. package/.claude/agents/v3/security-architect.md +0 -865
  103. package/.claude/agents/v3/security-auditor.md +0 -771
  104. package/.claude/agents/v3/sparc-orchestrator.md +0 -182
  105. package/.claude/agents/v3/swarm-memory-manager.md +0 -142
  106. package/.claude/agents/v3/v3-integration-architect.md +0 -205
  107. package/.claude/commands/claude-flow-help.md +0 -103
  108. package/.claude/commands/claude-flow-memory.md +0 -107
  109. package/.claude/commands/claude-flow-swarm.md +0 -205
  110. package/.claude/commands/flo-simplify.md +0 -101
  111. package/.claude/commands/github/README.md +0 -11
  112. package/.claude/commands/github/code-review-swarm.md +0 -514
  113. package/.claude/commands/github/code-review.md +0 -25
  114. package/.claude/commands/github/github-modes.md +0 -146
  115. package/.claude/commands/github/github-swarm.md +0 -113
  116. package/.claude/commands/github/issue-tracker.md +0 -284
  117. package/.claude/commands/github/issue-triage.md +0 -25
  118. package/.claude/commands/github/multi-repo-swarm.md +0 -519
  119. package/.claude/commands/github/pr-enhance.md +0 -26
  120. package/.claude/commands/github/pr-manager.md +0 -164
  121. package/.claude/commands/github/project-board-sync.md +0 -471
  122. package/.claude/commands/github/release-manager.md +0 -332
  123. package/.claude/commands/github/release-swarm.md +0 -544
  124. package/.claude/commands/github/repo-analyze.md +0 -25
  125. package/.claude/commands/github/repo-architect.md +0 -361
  126. package/.claude/commands/github/swarm-issue.md +0 -482
  127. package/.claude/commands/github/swarm-pr.md +0 -285
  128. package/.claude/commands/github/sync-coordinator.md +0 -294
  129. package/.claude/commands/github/workflow-automation.md +0 -442
  130. package/.claude/commands/hooks/README.md +0 -11
  131. package/.claude/commands/hooks/overview.md +0 -58
  132. package/.claude/commands/hooks/post-edit.md +0 -117
  133. package/.claude/commands/hooks/post-task.md +0 -112
  134. package/.claude/commands/hooks/pre-edit.md +0 -113
  135. package/.claude/commands/hooks/pre-task.md +0 -111
  136. package/.claude/commands/hooks/session-end.md +0 -118
  137. package/.claude/commands/hooks/setup.md +0 -103
  138. package/.claude/commands/sparc/analyzer.md +0 -42
  139. package/.claude/commands/sparc/architect.md +0 -43
  140. package/.claude/commands/sparc/ask.md +0 -86
  141. package/.claude/commands/sparc/batch-executor.md +0 -44
  142. package/.claude/commands/sparc/code.md +0 -78
  143. package/.claude/commands/sparc/coder.md +0 -44
  144. package/.claude/commands/sparc/debug.md +0 -72
  145. package/.claude/commands/sparc/debugger.md +0 -44
  146. package/.claude/commands/sparc/designer.md +0 -43
  147. package/.claude/commands/sparc/devops.md +0 -98
  148. package/.claude/commands/sparc/docs-writer.md +0 -69
  149. package/.claude/commands/sparc/documenter.md +0 -44
  150. package/.claude/commands/sparc/innovator.md +0 -44
  151. package/.claude/commands/sparc/integration.md +0 -72
  152. package/.claude/commands/sparc/mcp.md +0 -106
  153. package/.claude/commands/sparc/memory-manager.md +0 -44
  154. package/.claude/commands/sparc/optimizer.md +0 -44
  155. package/.claude/commands/sparc/orchestrator.md +0 -116
  156. package/.claude/commands/sparc/post-deployment-monitoring-mode.md +0 -72
  157. package/.claude/commands/sparc/refinement-optimization-mode.md +0 -72
  158. package/.claude/commands/sparc/researcher.md +0 -44
  159. package/.claude/commands/sparc/reviewer.md +0 -44
  160. package/.claude/commands/sparc/security-review.md +0 -69
  161. package/.claude/commands/sparc/sparc-modes.md +0 -139
  162. package/.claude/commands/sparc/sparc.md +0 -99
  163. package/.claude/commands/sparc/spec-pseudocode.md +0 -69
  164. package/.claude/commands/sparc/spell-manager.md +0 -44
  165. package/.claude/commands/sparc/supabase-admin.md +0 -337
  166. package/.claude/commands/sparc/swarm-coordinator.md +0 -44
  167. package/.claude/commands/sparc/tdd.md +0 -44
  168. package/.claude/commands/sparc/tester.md +0 -44
  169. package/.claude/commands/sparc/tutorial.md +0 -68
  170. package/.claude/commands/sparc.md +0 -151
@@ -1,665 +0,0 @@
1
- ---
2
- name: Benchmark Suite
3
- type: agent
4
- category: optimization
5
- description: Comprehensive performance benchmarking, regression detection and performance validation
6
- ---
7
-
8
- # Benchmark Suite Agent
9
-
10
- ## Agent Profile
11
- - **Name**: Benchmark Suite
12
- - **Type**: Performance Optimization Agent
13
- - **Specialization**: Comprehensive performance benchmarking and testing
14
- - **Performance Focus**: Automated benchmarking, regression detection, and performance validation
15
-
16
- ## Core Capabilities
17
-
18
- ### 1. Comprehensive Benchmarking Framework
19
- ```javascript
20
- // Advanced benchmarking system
21
- class ComprehensiveBenchmarkSuite {
22
- constructor() {
23
- this.benchmarks = {
24
- // Core performance benchmarks
25
- throughput: new ThroughputBenchmark(),
26
- latency: new LatencyBenchmark(),
27
- scalability: new ScalabilityBenchmark(),
28
- resource_usage: new ResourceUsageBenchmark(),
29
-
30
- // Swarm-specific benchmarks
31
- coordination: new CoordinationBenchmark(),
32
- load_balancing: new LoadBalancingBenchmark(),
33
- topology: new TopologyBenchmark(),
34
- fault_tolerance: new FaultToleranceBenchmark(),
35
-
36
- // Custom benchmarks
37
- custom: new CustomBenchmarkManager()
38
- };
39
-
40
- this.reporter = new BenchmarkReporter();
41
- this.comparator = new PerformanceComparator();
42
- this.analyzer = new BenchmarkAnalyzer();
43
- }
44
-
45
- // Execute comprehensive benchmark suite
46
- async runBenchmarkSuite(config = {}) {
47
- const suiteConfig = {
48
- duration: config.duration || 300000, // 5 minutes default
49
- iterations: config.iterations || 10,
50
- warmupTime: config.warmupTime || 30000, // 30 seconds
51
- cooldownTime: config.cooldownTime || 10000, // 10 seconds
52
- parallel: config.parallel || false,
53
- baseline: config.baseline || null
54
- };
55
-
56
- const results = {
57
- summary: {},
58
- detailed: new Map(),
59
- baseline_comparison: null,
60
- recommendations: []
61
- };
62
-
63
- // Warmup phase
64
- await this.warmup(suiteConfig.warmupTime);
65
-
66
- // Execute benchmarks
67
- if (suiteConfig.parallel) {
68
- results.detailed = await this.runBenchmarksParallel(suiteConfig);
69
- } else {
70
- results.detailed = await this.runBenchmarksSequential(suiteConfig);
71
- }
72
-
73
- // Generate summary
74
- results.summary = this.generateSummary(results.detailed);
75
-
76
- // Compare with baseline if provided
77
- if (suiteConfig.baseline) {
78
- results.baseline_comparison = await this.compareWithBaseline(
79
- results.detailed,
80
- suiteConfig.baseline
81
- );
82
- }
83
-
84
- // Generate recommendations
85
- results.recommendations = await this.generateRecommendations(results);
86
-
87
- // Cooldown phase
88
- await this.cooldown(suiteConfig.cooldownTime);
89
-
90
- return results;
91
- }
92
-
93
- // Parallel benchmark execution
94
- async runBenchmarksParallel(config) {
95
- const benchmarkPromises = Object.entries(this.benchmarks).map(
96
- async ([name, benchmark]) => {
97
- const result = await this.executeBenchmark(benchmark, name, config);
98
- return [name, result];
99
- }
100
- );
101
-
102
- const results = await Promise.all(benchmarkPromises);
103
- return new Map(results);
104
- }
105
-
106
- // Sequential benchmark execution
107
- async runBenchmarksSequential(config) {
108
- const results = new Map();
109
-
110
- for (const [name, benchmark] of Object.entries(this.benchmarks)) {
111
- const result = await this.executeBenchmark(benchmark, name, config);
112
- results.set(name, result);
113
-
114
- // Brief pause between benchmarks
115
- await this.sleep(1000);
116
- }
117
-
118
- return results;
119
- }
120
- }
121
- ```
122
-
123
- ### 2. Performance Regression Detection
124
- ```javascript
125
- // Advanced regression detection system
126
- class RegressionDetector {
127
- constructor() {
128
- this.detectors = {
129
- statistical: new StatisticalRegressionDetector(),
130
- machine_learning: new MLRegressionDetector(),
131
- threshold: new ThresholdRegressionDetector(),
132
- trend: new TrendRegressionDetector()
133
- };
134
-
135
- this.analyzer = new RegressionAnalyzer();
136
- this.alerting = new RegressionAlerting();
137
- }
138
-
139
- // Detect performance regressions
140
- async detectRegressions(currentResults, historicalData, config = {}) {
141
- const regressions = {
142
- detected: [],
143
- severity: 'none',
144
- confidence: 0,
145
- analysis: {}
146
- };
147
-
148
- // Run multiple detection algorithms
149
- const detectionPromises = Object.entries(this.detectors).map(
150
- async ([method, detector]) => {
151
- const detection = await detector.detect(currentResults, historicalData, config);
152
- return [method, detection];
153
- }
154
- );
155
-
156
- const detectionResults = await Promise.all(detectionPromises);
157
-
158
- // Aggregate detection results
159
- for (const [method, detection] of detectionResults) {
160
- if (detection.regression_detected) {
161
- regressions.detected.push({
162
- method,
163
- ...detection
164
- });
165
- }
166
- }
167
-
168
- // Calculate overall confidence and severity
169
- if (regressions.detected.length > 0) {
170
- regressions.confidence = this.calculateAggregateConfidence(regressions.detected);
171
- regressions.severity = this.calculateSeverity(regressions.detected);
172
- regressions.analysis = await this.analyzer.analyze(regressions.detected);
173
- }
174
-
175
- return regressions;
176
- }
177
-
178
- // Statistical regression detection using change point analysis
179
- async detectStatisticalRegression(metric, historicalData, sensitivity = 0.95) {
180
- // Use CUSUM (Cumulative Sum) algorithm for change point detection
181
- const cusum = this.calculateCUSUM(metric, historicalData);
182
-
183
- // Detect change points
184
- const changePoints = this.detectChangePoints(cusum, sensitivity);
185
-
186
- // Analyze significance of changes
187
- const analysis = changePoints.map(point => ({
188
- timestamp: point.timestamp,
189
- magnitude: point.magnitude,
190
- direction: point.direction,
191
- significance: point.significance,
192
- confidence: point.confidence
193
- }));
194
-
195
- return {
196
- regression_detected: changePoints.length > 0,
197
- change_points: analysis,
198
- cusum_statistics: cusum.statistics,
199
- sensitivity: sensitivity
200
- };
201
- }
202
-
203
- // Machine learning-based regression detection
204
- async detectMLRegression(metrics, historicalData) {
205
- // Train anomaly detection model on historical data
206
- const model = await this.trainAnomalyModel(historicalData);
207
-
208
- // Predict anomaly scores for current metrics
209
- const anomalyScores = await model.predict(metrics);
210
-
211
- // Identify regressions based on anomaly scores
212
- const threshold = this.calculateDynamicThreshold(anomalyScores);
213
- const regressions = anomalyScores.filter(score => score.anomaly > threshold);
214
-
215
- return {
216
- regression_detected: regressions.length > 0,
217
- anomaly_scores: anomalyScores,
218
- threshold: threshold,
219
- regressions: regressions,
220
- model_confidence: model.confidence
221
- };
222
- }
223
- }
224
- ```
225
-
226
- ### 3. Automated Performance Testing
227
- ```javascript
228
- // Comprehensive automated performance testing
229
- class AutomatedPerformanceTester {
230
- constructor() {
231
- this.testSuites = {
232
- load: new LoadTestSuite(),
233
- stress: new StressTestSuite(),
234
- volume: new VolumeTestSuite(),
235
- endurance: new EnduranceTestSuite(),
236
- spike: new SpikeTestSuite(),
237
- configuration: new ConfigurationTestSuite()
238
- };
239
-
240
- this.scheduler = new TestScheduler();
241
- this.orchestrator = new TestOrchestrator();
242
- this.validator = new ResultValidator();
243
- }
244
-
245
- // Execute automated performance test campaign
246
- async runTestCampaign(config) {
247
- const campaign = {
248
- id: this.generateCampaignId(),
249
- config,
250
- startTime: Date.now(),
251
- tests: [],
252
- results: new Map(),
253
- summary: null
254
- };
255
-
256
- // Schedule test execution
257
- const schedule = await this.scheduler.schedule(config.tests, config.constraints);
258
-
259
- // Execute tests according to schedule
260
- for (const scheduledTest of schedule) {
261
- const testResult = await this.executeScheduledTest(scheduledTest);
262
- campaign.tests.push(scheduledTest);
263
- campaign.results.set(scheduledTest.id, testResult);
264
-
265
- // Validate results in real-time
266
- const validation = await this.validator.validate(testResult);
267
- if (!validation.valid) {
268
- campaign.summary = {
269
- status: 'failed',
270
- reason: validation.reason,
271
- failedAt: scheduledTest.name
272
- };
273
- break;
274
- }
275
- }
276
-
277
- // Generate campaign summary
278
- if (!campaign.summary) {
279
- campaign.summary = await this.generateCampaignSummary(campaign);
280
- }
281
-
282
- campaign.endTime = Date.now();
283
- campaign.duration = campaign.endTime - campaign.startTime;
284
-
285
- return campaign;
286
- }
287
-
288
- // Load testing with gradual ramp-up
289
- async executeLoadTest(config) {
290
- const loadTest = {
291
- type: 'load',
292
- config,
293
- phases: [],
294
- metrics: new Map(),
295
- results: {}
296
- };
297
-
298
- // Ramp-up phase
299
- const rampUpResult = await this.executeRampUp(config.rampUp);
300
- loadTest.phases.push({ phase: 'ramp-up', result: rampUpResult });
301
-
302
- // Sustained load phase
303
- const sustainedResult = await this.executeSustainedLoad(config.sustained);
304
- loadTest.phases.push({ phase: 'sustained', result: sustainedResult });
305
-
306
- // Ramp-down phase
307
- const rampDownResult = await this.executeRampDown(config.rampDown);
308
- loadTest.phases.push({ phase: 'ramp-down', result: rampDownResult });
309
-
310
- // Analyze results
311
- loadTest.results = await this.analyzeLoadTestResults(loadTest.phases);
312
-
313
- return loadTest;
314
- }
315
-
316
- // Stress testing to find breaking points
317
- async executeStressTest(config) {
318
- const stressTest = {
319
- type: 'stress',
320
- config,
321
- breakingPoint: null,
322
- degradationCurve: [],
323
- results: {}
324
- };
325
-
326
- let currentLoad = config.startLoad;
327
- let systemBroken = false;
328
-
329
- while (!systemBroken && currentLoad <= config.maxLoad) {
330
- const testResult = await this.applyLoad(currentLoad, config.duration);
331
-
332
- stressTest.degradationCurve.push({
333
- load: currentLoad,
334
- performance: testResult.performance,
335
- stability: testResult.stability,
336
- errors: testResult.errors
337
- });
338
-
339
- // Check if system is breaking
340
- if (this.isSystemBreaking(testResult, config.breakingCriteria)) {
341
- stressTest.breakingPoint = {
342
- load: currentLoad,
343
- performance: testResult.performance,
344
- reason: this.identifyBreakingReason(testResult)
345
- };
346
- systemBroken = true;
347
- }
348
-
349
- currentLoad += config.loadIncrement;
350
- }
351
-
352
- stressTest.results = await this.analyzeStressTestResults(stressTest);
353
-
354
- return stressTest;
355
- }
356
- }
357
- ```
358
-
359
- ### 4. Performance Validation Framework
360
- ```javascript
361
- // Comprehensive performance validation
362
- class PerformanceValidator {
363
- constructor() {
364
- this.validators = {
365
- sla: new SLAValidator(),
366
- regression: new RegressionValidator(),
367
- scalability: new ScalabilityValidator(),
368
- reliability: new ReliabilityValidator(),
369
- efficiency: new EfficiencyValidator()
370
- };
371
-
372
- this.thresholds = new ThresholdManager();
373
- this.rules = new ValidationRuleEngine();
374
- }
375
-
376
- // Validate performance against defined criteria
377
- async validatePerformance(results, criteria) {
378
- const validation = {
379
- overall: {
380
- passed: true,
381
- score: 0,
382
- violations: []
383
- },
384
- detailed: new Map(),
385
- recommendations: []
386
- };
387
-
388
- // Run all validators
389
- const validationPromises = Object.entries(this.validators).map(
390
- async ([type, validator]) => {
391
- const result = await validator.validate(results, criteria[type]);
392
- return [type, result];
393
- }
394
- );
395
-
396
- const validationResults = await Promise.all(validationPromises);
397
-
398
- // Aggregate validation results
399
- for (const [type, result] of validationResults) {
400
- validation.detailed.set(type, result);
401
-
402
- if (!result.passed) {
403
- validation.overall.passed = false;
404
- validation.overall.violations.push(...result.violations);
405
- }
406
-
407
- validation.overall.score += result.score * (criteria[type]?.weight || 1);
408
- }
409
-
410
- // Normalize overall score
411
- const totalWeight = Object.values(criteria).reduce((sum, c) => sum + (c.weight || 1), 0);
412
- validation.overall.score /= totalWeight;
413
-
414
- // Generate recommendations
415
- validation.recommendations = await this.generateValidationRecommendations(validation);
416
-
417
- return validation;
418
- }
419
-
420
- // SLA validation
421
- async validateSLA(results, slaConfig) {
422
- const slaValidation = {
423
- passed: true,
424
- violations: [],
425
- score: 1.0,
426
- metrics: {}
427
- };
428
-
429
- // Validate each SLA metric
430
- for (const [metric, threshold] of Object.entries(slaConfig.thresholds)) {
431
- const actualValue = this.extractMetricValue(results, metric);
432
- const validation = this.validateThreshold(actualValue, threshold);
433
-
434
- slaValidation.metrics[metric] = {
435
- actual: actualValue,
436
- threshold: threshold.value,
437
- operator: threshold.operator,
438
- passed: validation.passed,
439
- deviation: validation.deviation
440
- };
441
-
442
- if (!validation.passed) {
443
- slaValidation.passed = false;
444
- slaValidation.violations.push({
445
- metric,
446
- actual: actualValue,
447
- expected: threshold.value,
448
- severity: threshold.severity || 'medium'
449
- });
450
-
451
- // Reduce score based on violation severity
452
- const severityMultiplier = this.getSeverityMultiplier(threshold.severity);
453
- slaValidation.score -= (validation.deviation * severityMultiplier);
454
- }
455
- }
456
-
457
- slaValidation.score = Math.max(0, slaValidation.score);
458
-
459
- return slaValidation;
460
- }
461
-
462
- // Scalability validation
463
- async validateScalability(results, scalabilityConfig) {
464
- const scalabilityValidation = {
465
- passed: true,
466
- violations: [],
467
- score: 1.0,
468
- analysis: {}
469
- };
470
-
471
- // Linear scalability analysis
472
- if (scalabilityConfig.linear) {
473
- const linearityAnalysis = this.analyzeLinearScalability(results);
474
- scalabilityValidation.analysis.linearity = linearityAnalysis;
475
-
476
- if (linearityAnalysis.coefficient < scalabilityConfig.linear.minCoefficient) {
477
- scalabilityValidation.passed = false;
478
- scalabilityValidation.violations.push({
479
- type: 'linearity',
480
- actual: linearityAnalysis.coefficient,
481
- expected: scalabilityConfig.linear.minCoefficient
482
- });
483
- }
484
- }
485
-
486
- // Efficiency retention analysis
487
- if (scalabilityConfig.efficiency) {
488
- const efficiencyAnalysis = this.analyzeEfficiencyRetention(results);
489
- scalabilityValidation.analysis.efficiency = efficiencyAnalysis;
490
-
491
- if (efficiencyAnalysis.retention < scalabilityConfig.efficiency.minRetention) {
492
- scalabilityValidation.passed = false;
493
- scalabilityValidation.violations.push({
494
- type: 'efficiency_retention',
495
- actual: efficiencyAnalysis.retention,
496
- expected: scalabilityConfig.efficiency.minRetention
497
- });
498
- }
499
- }
500
-
501
- return scalabilityValidation;
502
- }
503
- }
504
- ```
505
-
506
- ## MCP Integration Hooks
507
-
508
- ### Benchmark Execution Integration
509
- ```javascript
510
- // Comprehensive MCP benchmark integration
511
- const benchmarkIntegration = {
512
- // Execute performance benchmarks
513
- async runBenchmarks(config = {}) {
514
- // Run benchmark suite
515
- const benchmarkResult = await mcp.benchmark_run({
516
- suite: config.suite || 'comprehensive'
517
- });
518
-
519
- // Collect detailed metrics during benchmarking
520
- const metrics = await mcp.metrics_collect({
521
- components: ['system', 'agents', 'coordination', 'memory']
522
- });
523
-
524
- // Analyze performance trends
525
- const trends = await mcp.trend_analysis({
526
- metric: 'performance',
527
- period: '24h'
528
- });
529
-
530
- // Cost analysis
531
- const costAnalysis = await mcp.cost_analysis({
532
- timeframe: '24h'
533
- });
534
-
535
- return {
536
- benchmark: benchmarkResult,
537
- metrics,
538
- trends,
539
- costAnalysis,
540
- timestamp: Date.now()
541
- };
542
- },
543
-
544
- // Quality assessment
545
- async assessQuality(criteria) {
546
- const qualityAssessment = await mcp.quality_assess({
547
- target: 'swarm-performance',
548
- criteria: criteria || [
549
- 'throughput',
550
- 'latency',
551
- 'reliability',
552
- 'scalability',
553
- 'efficiency'
554
- ]
555
- });
556
-
557
- return qualityAssessment;
558
- },
559
-
560
- // Error pattern analysis
561
- async analyzeErrorPatterns() {
562
- // Collect system logs
563
- const logs = await this.collectSystemLogs();
564
-
565
- // Analyze error patterns
566
- const errorAnalysis = await mcp.error_analysis({
567
- logs: logs
568
- });
569
-
570
- return errorAnalysis;
571
- }
572
- };
573
- ```
574
-
575
- ## Operational Commands
576
-
577
- ### Benchmarking Commands
578
- ```bash
579
- # Run comprehensive benchmark suite
580
- npx claude-flow benchmark-run --suite comprehensive --duration 300
581
-
582
- # Execute specific benchmark
583
- npx claude-flow benchmark-run --suite throughput --iterations 10
584
-
585
- # Compare with baseline
586
- npx claude-flow benchmark-compare --current <results> --baseline <baseline>
587
-
588
- # Quality assessment
589
- npx claude-flow quality-assess --target swarm-performance --criteria throughput,latency
590
-
591
- # Performance validation
592
- npx claude-flow validate-performance --results <file> --criteria <file>
593
- ```
594
-
595
- ### Regression Detection Commands
596
- ```bash
597
- # Detect performance regressions
598
- npx claude-flow detect-regression --current <results> --historical <data>
599
-
600
- # Set up automated regression monitoring
601
- npx claude-flow regression-monitor --enable --sensitivity 0.95
602
-
603
- # Analyze error patterns
604
- npx claude-flow error-analysis --logs <log-files>
605
- ```
606
-
607
- ## Integration Points
608
-
609
- ### With Other Optimization Agents
610
- - **Performance Monitor**: Provides continuous monitoring data for benchmarking
611
- - **Load Balancer**: Validates load balancing effectiveness through benchmarks
612
- - **Topology Optimizer**: Tests topology configurations for optimal performance
613
-
614
- ### With CI/CD Pipeline
615
- - **Automated Testing**: Integrates with CI/CD for continuous performance validation
616
- - **Quality Gates**: Provides pass/fail criteria for deployment decisions
617
- - **Regression Prevention**: Catches performance regressions before production
618
-
619
- ## Performance Benchmarks
620
-
621
- ### Standard Benchmark Suite
622
- ```javascript
623
- // Comprehensive benchmark definitions
624
- const standardBenchmarks = {
625
- // Throughput benchmarks
626
- throughput: {
627
- name: 'Throughput Benchmark',
628
- metrics: ['requests_per_second', 'tasks_per_second', 'messages_per_second'],
629
- duration: 300000, // 5 minutes
630
- warmup: 30000, // 30 seconds
631
- targets: {
632
- requests_per_second: { min: 1000, optimal: 5000 },
633
- tasks_per_second: { min: 100, optimal: 500 },
634
- messages_per_second: { min: 10000, optimal: 50000 }
635
- }
636
- },
637
-
638
- // Latency benchmarks
639
- latency: {
640
- name: 'Latency Benchmark',
641
- metrics: ['p50', 'p90', 'p95', 'p99', 'max'],
642
- duration: 300000,
643
- targets: {
644
- p50: { max: 100 }, // 100ms
645
- p90: { max: 200 }, // 200ms
646
- p95: { max: 500 }, // 500ms
647
- p99: { max: 1000 }, // 1s
648
- max: { max: 5000 } // 5s
649
- }
650
- },
651
-
652
- // Scalability benchmarks
653
- scalability: {
654
- name: 'Scalability Benchmark',
655
- metrics: ['linear_coefficient', 'efficiency_retention'],
656
- load_points: [1, 2, 4, 8, 16, 32, 64],
657
- targets: {
658
- linear_coefficient: { min: 0.8 },
659
- efficiency_retention: { min: 0.7 }
660
- }
661
- }
662
- };
663
- ```
664
-
665
- This Benchmark Suite agent provides comprehensive automated performance testing, regression detection, and validation capabilities to ensure optimal swarm performance and prevent performance degradation.