@claude-flow/cli 3.7.0-alpha.1 → 3.7.0-alpha.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (476)
  1. package/.claude/agents/analysis/analyze-code-quality.md +178 -178
  2. package/.claude/agents/analysis/code-analyzer.md +209 -209
  3. package/.claude/agents/analysis/code-review/analyze-code-quality.md +178 -178
  4. package/.claude/agents/architecture/arch-system-design.md +156 -156
  5. package/.claude/agents/architecture/system-design/arch-system-design.md +154 -154
  6. package/.claude/agents/browser/browser-agent.yaml +182 -182
  7. package/.claude/agents/consensus/byzantine-coordinator.md +62 -62
  8. package/.claude/agents/consensus/crdt-synchronizer.md +996 -996
  9. package/.claude/agents/consensus/gossip-coordinator.md +62 -62
  10. package/.claude/agents/consensus/performance-benchmarker.md +850 -850
  11. package/.claude/agents/consensus/quorum-manager.md +822 -822
  12. package/.claude/agents/consensus/raft-manager.md +62 -62
  13. package/.claude/agents/consensus/security-manager.md +621 -621
  14. package/.claude/agents/core/coder.md +452 -452
  15. package/.claude/agents/core/planner.md +374 -374
  16. package/.claude/agents/core/researcher.md +368 -368
  17. package/.claude/agents/core/reviewer.md +519 -519
  18. package/.claude/agents/core/tester.md +511 -511
  19. package/.claude/agents/custom/test-long-runner.md +44 -44
  20. package/.claude/agents/data/data-ml-model.md +444 -444
  21. package/.claude/agents/data/ml/data-ml-model.md +192 -192
  22. package/.claude/agents/development/backend/dev-backend-api.md +141 -141
  23. package/.claude/agents/development/dev-backend-api.md +344 -344
  24. package/.claude/agents/devops/ci-cd/ops-cicd-github.md +163 -163
  25. package/.claude/agents/devops/ops-cicd-github.md +164 -164
  26. package/.claude/agents/documentation/api-docs/docs-api-openapi.md +173 -173
  27. package/.claude/agents/documentation/docs-api-openapi.md +354 -354
  28. package/.claude/agents/flow-nexus/app-store.md +87 -87
  29. package/.claude/agents/flow-nexus/authentication.md +68 -68
  30. package/.claude/agents/flow-nexus/challenges.md +80 -80
  31. package/.claude/agents/flow-nexus/neural-network.md +87 -87
  32. package/.claude/agents/flow-nexus/payments.md +82 -82
  33. package/.claude/agents/flow-nexus/sandbox.md +75 -75
  34. package/.claude/agents/flow-nexus/swarm.md +75 -75
  35. package/.claude/agents/flow-nexus/user-tools.md +95 -95
  36. package/.claude/agents/flow-nexus/workflow.md +83 -83
  37. package/.claude/agents/github/code-review-swarm.md +377 -377
  38. package/.claude/agents/github/github-modes.md +172 -172
  39. package/.claude/agents/github/issue-tracker.md +575 -575
  40. package/.claude/agents/github/multi-repo-swarm.md +552 -552
  41. package/.claude/agents/github/pr-manager.md +437 -437
  42. package/.claude/agents/github/project-board-sync.md +508 -508
  43. package/.claude/agents/github/release-manager.md +604 -604
  44. package/.claude/agents/github/release-swarm.md +582 -582
  45. package/.claude/agents/github/repo-architect.md +397 -397
  46. package/.claude/agents/github/swarm-issue.md +572 -572
  47. package/.claude/agents/github/swarm-pr.md +427 -427
  48. package/.claude/agents/github/sync-coordinator.md +451 -451
  49. package/.claude/agents/github/workflow-automation.md +902 -902
  50. package/.claude/agents/goal/agent.md +815 -815
  51. package/.claude/agents/goal/goal-planner.md +72 -72
  52. package/.claude/agents/optimization/benchmark-suite.md +664 -664
  53. package/.claude/agents/optimization/load-balancer.md +430 -430
  54. package/.claude/agents/optimization/performance-monitor.md +671 -671
  55. package/.claude/agents/optimization/resource-allocator.md +673 -673
  56. package/.claude/agents/optimization/topology-optimizer.md +807 -807
  57. package/.claude/agents/payments/agentic-payments.md +126 -126
  58. package/.claude/agents/sona/sona-learning-optimizer.md +74 -74
  59. package/.claude/agents/sparc/architecture.md +698 -698
  60. package/.claude/agents/sparc/pseudocode.md +519 -519
  61. package/.claude/agents/sparc/refinement.md +801 -801
  62. package/.claude/agents/sparc/specification.md +477 -477
  63. package/.claude/agents/specialized/mobile/spec-mobile-react-native.md +224 -224
  64. package/.claude/agents/specialized/spec-mobile-react-native.md +226 -226
  65. package/.claude/agents/sublinear/consensus-coordinator.md +337 -337
  66. package/.claude/agents/sublinear/matrix-optimizer.md +184 -184
  67. package/.claude/agents/sublinear/pagerank-analyzer.md +298 -298
  68. package/.claude/agents/sublinear/performance-optimizer.md +367 -367
  69. package/.claude/agents/sublinear/trading-predictor.md +245 -245
  70. package/.claude/agents/swarm/adaptive-coordinator.md +1126 -1126
  71. package/.claude/agents/swarm/hierarchical-coordinator.md +709 -709
  72. package/.claude/agents/swarm/mesh-coordinator.md +962 -962
  73. package/.claude/agents/templates/automation-smart-agent.md +204 -204
  74. package/.claude/agents/templates/base-template-generator.md +289 -289
  75. package/.claude/agents/templates/coordinator-swarm-init.md +89 -89
  76. package/.claude/agents/templates/github-pr-manager.md +176 -176
  77. package/.claude/agents/templates/implementer-sparc-coder.md +258 -258
  78. package/.claude/agents/templates/memory-coordinator.md +186 -186
  79. package/.claude/agents/templates/orchestrator-task.md +138 -138
  80. package/.claude/agents/templates/performance-analyzer.md +198 -198
  81. package/.claude/agents/templates/sparc-coordinator.md +513 -513
  82. package/.claude/agents/testing/production-validator.md +394 -394
  83. package/.claude/agents/testing/tdd-london-swarm.md +243 -243
  84. package/.claude/agents/v3/adr-architect.md +184 -184
  85. package/.claude/agents/v3/aidefence-guardian.md +282 -282
  86. package/.claude/agents/v3/claims-authorizer.md +208 -208
  87. package/.claude/agents/v3/collective-intelligence-coordinator.md +993 -993
  88. package/.claude/agents/v3/ddd-domain-expert.md +220 -220
  89. package/.claude/agents/v3/injection-analyst.md +236 -236
  90. package/.claude/agents/v3/memory-specialist.md +995 -995
  91. package/.claude/agents/v3/performance-engineer.md +1233 -1233
  92. package/.claude/agents/v3/pii-detector.md +151 -151
  93. package/.claude/agents/v3/reasoningbank-learner.md +213 -213
  94. package/.claude/agents/v3/security-architect-aidefence.md +410 -410
  95. package/.claude/agents/v3/security-architect.md +867 -867
  96. package/.claude/agents/v3/security-auditor.md +771 -771
  97. package/.claude/agents/v3/sparc-orchestrator.md +182 -182
  98. package/.claude/agents/v3/swarm-memory-manager.md +157 -157
  99. package/.claude/agents/v3/v3-integration-architect.md +205 -205
  100. package/.claude/commands/agents/README.md +50 -50
  101. package/.claude/commands/agents/agent-capabilities.md +140 -140
  102. package/.claude/commands/agents/agent-coordination.md +28 -28
  103. package/.claude/commands/agents/agent-spawning.md +28 -28
  104. package/.claude/commands/agents/agent-types.md +216 -216
  105. package/.claude/commands/agents/health.md +139 -139
  106. package/.claude/commands/agents/list.md +100 -100
  107. package/.claude/commands/agents/logs.md +130 -130
  108. package/.claude/commands/agents/metrics.md +122 -122
  109. package/.claude/commands/agents/pool.md +127 -127
  110. package/.claude/commands/agents/spawn.md +140 -140
  111. package/.claude/commands/agents/status.md +115 -115
  112. package/.claude/commands/agents/stop.md +102 -102
  113. package/.claude/commands/analysis/COMMAND_COMPLIANCE_REPORT.md +53 -53
  114. package/.claude/commands/analysis/README.md +9 -9
  115. package/.claude/commands/analysis/bottleneck-detect.md +162 -162
  116. package/.claude/commands/analysis/performance-bottlenecks.md +58 -58
  117. package/.claude/commands/analysis/performance-report.md +25 -25
  118. package/.claude/commands/analysis/token-efficiency.md +44 -44
  119. package/.claude/commands/analysis/token-usage.md +25 -25
  120. package/.claude/commands/automation/README.md +9 -9
  121. package/.claude/commands/automation/auto-agent.md +122 -122
  122. package/.claude/commands/automation/self-healing.md +105 -105
  123. package/.claude/commands/automation/session-memory.md +89 -89
  124. package/.claude/commands/automation/smart-agents.md +72 -72
  125. package/.claude/commands/automation/smart-spawn.md +25 -25
  126. package/.claude/commands/automation/workflow-select.md +25 -25
  127. package/.claude/commands/claude-flow-help.md +103 -103
  128. package/.claude/commands/claude-flow-memory.md +107 -107
  129. package/.claude/commands/claude-flow-swarm.md +205 -205
  130. package/.claude/commands/coordination/README.md +9 -9
  131. package/.claude/commands/coordination/agent-spawn.md +25 -25
  132. package/.claude/commands/coordination/init.md +44 -44
  133. package/.claude/commands/coordination/orchestrate.md +43 -43
  134. package/.claude/commands/coordination/spawn.md +45 -45
  135. package/.claude/commands/coordination/swarm-init.md +85 -85
  136. package/.claude/commands/coordination/task-orchestrate.md +25 -25
  137. package/.claude/commands/flow-nexus/app-store.md +123 -123
  138. package/.claude/commands/flow-nexus/challenges.md +119 -119
  139. package/.claude/commands/flow-nexus/login-registration.md +64 -64
  140. package/.claude/commands/flow-nexus/neural-network.md +133 -133
  141. package/.claude/commands/flow-nexus/payments.md +115 -115
  142. package/.claude/commands/flow-nexus/sandbox.md +82 -82
  143. package/.claude/commands/flow-nexus/swarm.md +86 -86
  144. package/.claude/commands/flow-nexus/user-tools.md +151 -151
  145. package/.claude/commands/flow-nexus/workflow.md +114 -114
  146. package/.claude/commands/github/README.md +11 -11
  147. package/.claude/commands/github/code-review-swarm.md +513 -513
  148. package/.claude/commands/github/code-review.md +25 -25
  149. package/.claude/commands/github/github-modes.md +146 -146
  150. package/.claude/commands/github/github-swarm.md +121 -121
  151. package/.claude/commands/github/issue-tracker.md +291 -291
  152. package/.claude/commands/github/issue-triage.md +25 -25
  153. package/.claude/commands/github/multi-repo-swarm.md +518 -518
  154. package/.claude/commands/github/pr-enhance.md +26 -26
  155. package/.claude/commands/github/pr-manager.md +169 -169
  156. package/.claude/commands/github/project-board-sync.md +470 -470
  157. package/.claude/commands/github/release-manager.md +337 -337
  158. package/.claude/commands/github/release-swarm.md +543 -543
  159. package/.claude/commands/github/repo-analyze.md +25 -25
  160. package/.claude/commands/github/repo-architect.md +366 -366
  161. package/.claude/commands/github/swarm-issue.md +481 -481
  162. package/.claude/commands/github/swarm-pr.md +284 -284
  163. package/.claude/commands/github/sync-coordinator.md +300 -300
  164. package/.claude/commands/github/workflow-automation.md +441 -441
  165. package/.claude/commands/hive-mind/README.md +17 -17
  166. package/.claude/commands/hive-mind/hive-mind-consensus.md +8 -8
  167. package/.claude/commands/hive-mind/hive-mind-init.md +18 -18
  168. package/.claude/commands/hive-mind/hive-mind-memory.md +8 -8
  169. package/.claude/commands/hive-mind/hive-mind-metrics.md +8 -8
  170. package/.claude/commands/hive-mind/hive-mind-resume.md +8 -8
  171. package/.claude/commands/hive-mind/hive-mind-sessions.md +8 -8
  172. package/.claude/commands/hive-mind/hive-mind-spawn.md +21 -21
  173. package/.claude/commands/hive-mind/hive-mind-status.md +8 -8
  174. package/.claude/commands/hive-mind/hive-mind-stop.md +8 -8
  175. package/.claude/commands/hive-mind/hive-mind-wizard.md +8 -8
  176. package/.claude/commands/hive-mind/hive-mind.md +27 -27
  177. package/.claude/commands/hooks/README.md +11 -11
  178. package/.claude/commands/hooks/overview.md +57 -57
  179. package/.claude/commands/hooks/post-edit.md +117 -117
  180. package/.claude/commands/hooks/post-task.md +112 -112
  181. package/.claude/commands/hooks/pre-edit.md +113 -113
  182. package/.claude/commands/hooks/pre-task.md +111 -111
  183. package/.claude/commands/hooks/session-end.md +118 -118
  184. package/.claude/commands/hooks/setup.md +102 -102
  185. package/.claude/commands/memory/README.md +9 -9
  186. package/.claude/commands/memory/memory-persist.md +25 -25
  187. package/.claude/commands/memory/memory-search.md +25 -25
  188. package/.claude/commands/memory/memory-usage.md +25 -25
  189. package/.claude/commands/memory/neural.md +47 -47
  190. package/.claude/commands/monitoring/README.md +9 -9
  191. package/.claude/commands/monitoring/agent-metrics.md +25 -25
  192. package/.claude/commands/monitoring/agents.md +44 -44
  193. package/.claude/commands/monitoring/real-time-view.md +25 -25
  194. package/.claude/commands/monitoring/status.md +46 -46
  195. package/.claude/commands/monitoring/swarm-monitor.md +25 -25
  196. package/.claude/commands/optimization/README.md +9 -9
  197. package/.claude/commands/optimization/auto-topology.md +61 -61
  198. package/.claude/commands/optimization/cache-manage.md +25 -25
  199. package/.claude/commands/optimization/parallel-execute.md +25 -25
  200. package/.claude/commands/optimization/parallel-execution.md +49 -49
  201. package/.claude/commands/optimization/topology-optimize.md +25 -25
  202. package/.claude/commands/pair/README.md +260 -260
  203. package/.claude/commands/pair/commands.md +545 -545
  204. package/.claude/commands/pair/config.md +509 -509
  205. package/.claude/commands/pair/examples.md +511 -511
  206. package/.claude/commands/pair/modes.md +347 -347
  207. package/.claude/commands/pair/session.md +406 -406
  208. package/.claude/commands/pair/start.md +208 -208
  209. package/.claude/commands/sparc/analyzer.md +51 -51
  210. package/.claude/commands/sparc/architect.md +53 -53
  211. package/.claude/commands/sparc/ask.md +97 -97
  212. package/.claude/commands/sparc/batch-executor.md +54 -54
  213. package/.claude/commands/sparc/code.md +89 -89
  214. package/.claude/commands/sparc/coder.md +54 -54
  215. package/.claude/commands/sparc/debug.md +83 -83
  216. package/.claude/commands/sparc/debugger.md +54 -54
  217. package/.claude/commands/sparc/designer.md +53 -53
  218. package/.claude/commands/sparc/devops.md +109 -109
  219. package/.claude/commands/sparc/docs-writer.md +80 -80
  220. package/.claude/commands/sparc/documenter.md +54 -54
  221. package/.claude/commands/sparc/innovator.md +54 -54
  222. package/.claude/commands/sparc/integration.md +83 -83
  223. package/.claude/commands/sparc/mcp.md +117 -117
  224. package/.claude/commands/sparc/memory-manager.md +54 -54
  225. package/.claude/commands/sparc/optimizer.md +54 -54
  226. package/.claude/commands/sparc/orchestrator.md +131 -131
  227. package/.claude/commands/sparc/post-deployment-monitoring-mode.md +83 -83
  228. package/.claude/commands/sparc/refinement-optimization-mode.md +83 -83
  229. package/.claude/commands/sparc/researcher.md +54 -54
  230. package/.claude/commands/sparc/reviewer.md +54 -54
  231. package/.claude/commands/sparc/security-review.md +80 -80
  232. package/.claude/commands/sparc/sparc-modes.md +174 -174
  233. package/.claude/commands/sparc/sparc.md +111 -111
  234. package/.claude/commands/sparc/spec-pseudocode.md +80 -80
  235. package/.claude/commands/sparc/supabase-admin.md +348 -348
  236. package/.claude/commands/sparc/swarm-coordinator.md +54 -54
  237. package/.claude/commands/sparc/tdd.md +54 -54
  238. package/.claude/commands/sparc/tester.md +54 -54
  239. package/.claude/commands/sparc/tutorial.md +79 -79
  240. package/.claude/commands/sparc/workflow-manager.md +54 -54
  241. package/.claude/commands/sparc.md +166 -166
  242. package/.claude/commands/stream-chain/pipeline.md +120 -120
  243. package/.claude/commands/stream-chain/run.md +69 -69
  244. package/.claude/commands/swarm/README.md +15 -15
  245. package/.claude/commands/swarm/analysis.md +95 -95
  246. package/.claude/commands/swarm/development.md +96 -96
  247. package/.claude/commands/swarm/examples.md +168 -168
  248. package/.claude/commands/swarm/maintenance.md +102 -102
  249. package/.claude/commands/swarm/optimization.md +117 -117
  250. package/.claude/commands/swarm/research.md +136 -136
  251. package/.claude/commands/swarm/swarm-analysis.md +8 -8
  252. package/.claude/commands/swarm/swarm-background.md +8 -8
  253. package/.claude/commands/swarm/swarm-init.md +19 -19
  254. package/.claude/commands/swarm/swarm-modes.md +8 -8
  255. package/.claude/commands/swarm/swarm-monitor.md +8 -8
  256. package/.claude/commands/swarm/swarm-spawn.md +19 -19
  257. package/.claude/commands/swarm/swarm-status.md +8 -8
  258. package/.claude/commands/swarm/swarm-strategies.md +8 -8
  259. package/.claude/commands/swarm/swarm.md +87 -87
  260. package/.claude/commands/swarm/testing.md +131 -131
  261. package/.claude/commands/training/README.md +9 -9
  262. package/.claude/commands/training/model-update.md +25 -25
  263. package/.claude/commands/training/neural-patterns.md +107 -107
  264. package/.claude/commands/training/neural-train.md +75 -75
  265. package/.claude/commands/training/pattern-learn.md +25 -25
  266. package/.claude/commands/training/specialization.md +62 -62
  267. package/.claude/commands/truth/start.md +142 -142
  268. package/.claude/commands/verify/check.md +49 -49
  269. package/.claude/commands/verify/start.md +127 -127
  270. package/.claude/commands/workflows/README.md +9 -9
  271. package/.claude/commands/workflows/development.md +77 -77
  272. package/.claude/commands/workflows/research.md +62 -62
  273. package/.claude/commands/workflows/workflow-create.md +25 -25
  274. package/.claude/commands/workflows/workflow-execute.md +25 -25
  275. package/.claude/commands/workflows/workflow-export.md +25 -25
  276. package/.claude/helpers/README.md +96 -96
  277. package/.claude/helpers/adr-compliance.sh +186 -186
  278. package/.claude/helpers/auto-commit.sh +178 -178
  279. package/.claude/helpers/auto-memory-hook.mjs +368 -368
  280. package/.claude/helpers/checkpoint-manager.sh +251 -251
  281. package/.claude/helpers/daemon-manager.sh +252 -252
  282. package/.claude/helpers/ddd-tracker.sh +144 -144
  283. package/.claude/helpers/github-safe.js +121 -121
  284. package/.claude/helpers/github-setup.sh +28 -28
  285. package/.claude/helpers/guidance-hook.sh +13 -13
  286. package/.claude/helpers/guidance-hooks.sh +102 -102
  287. package/.claude/helpers/health-monitor.sh +108 -108
  288. package/.claude/helpers/hook-handler.cjs +278 -278
  289. package/.claude/helpers/intelligence.cjs +1031 -1031
  290. package/.claude/helpers/learning-hooks.sh +329 -329
  291. package/.claude/helpers/learning-optimizer.sh +127 -127
  292. package/.claude/helpers/learning-service.mjs +1144 -1144
  293. package/.claude/helpers/memory.js +83 -83
  294. package/.claude/helpers/metrics-db.mjs +488 -488
  295. package/.claude/helpers/pattern-consolidator.sh +86 -86
  296. package/.claude/helpers/perf-worker.sh +160 -160
  297. package/.claude/helpers/post-commit +16 -16
  298. package/.claude/helpers/pre-commit +26 -26
  299. package/.claude/helpers/quick-start.sh +19 -19
  300. package/.claude/helpers/router.js +66 -66
  301. package/.claude/helpers/security-scanner.sh +127 -127
  302. package/.claude/helpers/session.js +135 -135
  303. package/.claude/helpers/setup-mcp.sh +18 -18
  304. package/.claude/helpers/standard-checkpoint-hooks.sh +189 -189
  305. package/.claude/helpers/statusline-hook.sh +21 -21
  306. package/.claude/helpers/statusline.cjs +575 -575
  307. package/.claude/helpers/statusline.js +321 -321
  308. package/.claude/helpers/swarm-comms.sh +353 -353
  309. package/.claude/helpers/swarm-hooks.sh +761 -761
  310. package/.claude/helpers/swarm-monitor.sh +210 -210
  311. package/.claude/helpers/sync-v3-metrics.sh +245 -245
  312. package/.claude/helpers/update-v3-progress.sh +165 -165
  313. package/.claude/helpers/v3-quick-status.sh +57 -57
  314. package/.claude/helpers/v3.sh +110 -110
  315. package/.claude/helpers/validate-v3-config.sh +215 -215
  316. package/.claude/helpers/worker-manager.sh +170 -170
  317. package/.claude/settings.json +182 -182
  318. package/.claude/skills/agentdb-advanced/SKILL.md +550 -550
  319. package/.claude/skills/agentdb-learning/SKILL.md +545 -545
  320. package/.claude/skills/agentdb-memory-patterns/SKILL.md +339 -339
  321. package/.claude/skills/agentdb-optimization/SKILL.md +509 -509
  322. package/.claude/skills/agentdb-vector-search/SKILL.md +339 -339
  323. package/.claude/skills/agentic-jujutsu/SKILL.md +645 -645
  324. package/.claude/skills/aidefence-scan.md +151 -151
  325. package/.claude/skills/aidefence.yaml +297 -297
  326. package/.claude/skills/browser/SKILL.md +204 -204
  327. package/.claude/skills/flow-nexus-neural/SKILL.md +738 -738
  328. package/.claude/skills/flow-nexus-platform/SKILL.md +1157 -1157
  329. package/.claude/skills/flow-nexus-swarm/SKILL.md +610 -610
  330. package/.claude/skills/github-code-review/SKILL.md +1140 -1140
  331. package/.claude/skills/github-multi-repo/SKILL.md +874 -874
  332. package/.claude/skills/github-project-management/SKILL.md +1290 -1277
  333. package/.claude/skills/github-release-management/SKILL.md +1081 -1081
  334. package/.claude/skills/github-workflow-automation/SKILL.md +1065 -1065
  335. package/.claude/skills/hive-mind-advanced/SKILL.md +712 -712
  336. package/.claude/skills/hooks-automation/SKILL.md +1201 -1201
  337. package/.claude/skills/pair-programming/SKILL.md +1202 -1202
  338. package/.claude/skills/performance-analysis/SKILL.md +563 -563
  339. package/.claude/skills/reasoningbank-agentdb/SKILL.md +446 -446
  340. package/.claude/skills/reasoningbank-intelligence/SKILL.md +201 -201
  341. package/.claude/skills/secure-review.md +181 -181
  342. package/.claude/skills/skill-builder/SKILL.md +910 -910
  343. package/.claude/skills/sparc-methodology/SKILL.md +1115 -1115
  344. package/.claude/skills/stream-chain/SKILL.md +563 -563
  345. package/.claude/skills/swarm-advanced/SKILL.md +973 -973
  346. package/.claude/skills/swarm-orchestration/SKILL.md +179 -179
  347. package/.claude/skills/v3-cli-modernization/SKILL.md +871 -871
  348. package/.claude/skills/v3-core-implementation/SKILL.md +796 -796
  349. package/.claude/skills/v3-ddd-architecture/SKILL.md +441 -441
  350. package/.claude/skills/v3-integration-deep/SKILL.md +240 -240
  351. package/.claude/skills/v3-mcp-optimization/SKILL.md +776 -776
  352. package/.claude/skills/v3-memory-unification/SKILL.md +173 -173
  353. package/.claude/skills/v3-performance-optimization/SKILL.md +389 -389
  354. package/.claude/skills/v3-security-overhaul/SKILL.md +81 -81
  355. package/.claude/skills/v3-swarm-coordination/SKILL.md +339 -339
  356. package/.claude/skills/verification-quality/SKILL.md +649 -649
  357. package/.claude/skills/worker-benchmarks/skill.md +135 -135
  358. package/.claude/skills/worker-integration/skill.md +154 -154
  359. package/README.md +393 -391
  360. package/bin/cli.js +220 -220
  361. package/bin/mcp-server.js +224 -224
  362. package/bin/preinstall.cjs +2 -2
  363. package/dist/src/commands/agent-wasm.js +2 -2
  364. package/dist/src/commands/agent-wasm.js.map +1 -1
  365. package/dist/src/commands/completions.js +409 -409
  366. package/dist/src/commands/daemon.d.ts.map +1 -1
  367. package/dist/src/commands/daemon.js +19 -3
  368. package/dist/src/commands/daemon.js.map +1 -1
  369. package/dist/src/commands/doctor.d.ts.map +1 -1
  370. package/dist/src/commands/doctor.js +105 -23
  371. package/dist/src/commands/doctor.js.map +1 -1
  372. package/dist/src/commands/embeddings.js +26 -26
  373. package/dist/src/commands/hive-mind.d.ts.map +1 -1
  374. package/dist/src/commands/hive-mind.js +122 -104
  375. package/dist/src/commands/hive-mind.js.map +1 -1
  376. package/dist/src/commands/hooks.d.ts.map +1 -1
  377. package/dist/src/commands/hooks.js +34 -21
  378. package/dist/src/commands/hooks.js.map +1 -1
  379. package/dist/src/commands/memory.d.ts.map +1 -1
  380. package/dist/src/commands/memory.js +68 -0
  381. package/dist/src/commands/memory.js.map +1 -1
  382. package/dist/src/commands/ruvector/backup.js +23 -23
  383. package/dist/src/commands/ruvector/benchmark.js +31 -31
  384. package/dist/src/commands/ruvector/import.js +14 -14
  385. package/dist/src/commands/ruvector/init.js +115 -115
  386. package/dist/src/commands/ruvector/migrate.js +99 -99
  387. package/dist/src/commands/ruvector/optimize.js +51 -51
  388. package/dist/src/commands/ruvector/setup.js +624 -624
  389. package/dist/src/commands/ruvector/status.js +38 -38
  390. package/dist/src/index.d.ts +5 -1
  391. package/dist/src/index.d.ts.map +1 -1
  392. package/dist/src/index.js +59 -18
  393. package/dist/src/index.js.map +1 -1
  394. package/dist/src/init/claudemd-generator.js +226 -226
  395. package/dist/src/init/executor.d.ts.map +1 -1
  396. package/dist/src/init/executor.js +511 -453
  397. package/dist/src/init/executor.js.map +1 -1
  398. package/dist/src/init/helpers-generator.js +645 -645
  399. package/dist/src/init/settings-generator.d.ts.map +1 -1
  400. package/dist/src/init/settings-generator.js +11 -5
  401. package/dist/src/init/settings-generator.js.map +1 -1
  402. package/dist/src/init/statusline-generator.js +858 -858
  403. package/dist/src/init/types.d.ts +7 -0
  404. package/dist/src/init/types.d.ts.map +1 -1
  405. package/dist/src/init/types.js.map +1 -1
  406. package/dist/src/mcp-tools/agentdb-tools.d.ts +3 -0
  407. package/dist/src/mcp-tools/agentdb-tools.d.ts.map +1 -1
  408. package/dist/src/mcp-tools/agentdb-tools.js +108 -0
  409. package/dist/src/mcp-tools/agentdb-tools.js.map +1 -1
  410. package/dist/src/mcp-tools/hooks-tools.d.ts.map +1 -1
  411. package/dist/src/mcp-tools/hooks-tools.js +4 -2
  412. package/dist/src/mcp-tools/hooks-tools.js.map +1 -1
  413. package/dist/src/mcp-tools/memory-tools.d.ts.map +1 -1
  414. package/dist/src/mcp-tools/memory-tools.js +19 -0
  415. package/dist/src/mcp-tools/memory-tools.js.map +1 -1
  416. package/dist/src/mcp-tools/neural-tools.d.ts.map +1 -1
  417. package/dist/src/mcp-tools/neural-tools.js +14 -1
  418. package/dist/src/mcp-tools/neural-tools.js.map +1 -1
  419. package/dist/src/mcp-tools/security-tools.d.ts.map +1 -1
  420. package/dist/src/mcp-tools/security-tools.js +28 -3
  421. package/dist/src/mcp-tools/security-tools.js.map +1 -1
  422. package/dist/src/mcp-tools/swarm-tools.d.ts.map +1 -1
  423. package/dist/src/mcp-tools/swarm-tools.js +72 -3
  424. package/dist/src/mcp-tools/swarm-tools.js.map +1 -1
  425. package/dist/src/mcp-tools/wasm-agent-tools.js +1 -1
  426. package/dist/src/mcp-tools/wasm-agent-tools.js.map +1 -1
  427. package/dist/src/memory/intelligence.d.ts.map +1 -1
  428. package/dist/src/memory/intelligence.js +28 -3
  429. package/dist/src/memory/intelligence.js.map +1 -1
  430. package/dist/src/memory/memory-bridge.d.ts +69 -0
  431. package/dist/src/memory/memory-bridge.d.ts.map +1 -1
  432. package/dist/src/memory/memory-bridge.js +319 -66
  433. package/dist/src/memory/memory-bridge.js.map +1 -1
  434. package/dist/src/memory/memory-initializer.d.ts +5 -0
  435. package/dist/src/memory/memory-initializer.d.ts.map +1 -1
  436. package/dist/src/memory/memory-initializer.js +369 -363
  437. package/dist/src/memory/memory-initializer.js.map +1 -1
  438. package/dist/src/memory/neural-package-bridge.d.ts +48 -0
  439. package/dist/src/memory/neural-package-bridge.d.ts.map +1 -0
  440. package/dist/src/memory/neural-package-bridge.js +87 -0
  441. package/dist/src/memory/neural-package-bridge.js.map +1 -0
  442. package/dist/src/memory/rabitq-index.js +5 -5
  443. package/dist/src/memory/sona-optimizer.d.ts.map +1 -1
  444. package/dist/src/memory/sona-optimizer.js +1 -0
  445. package/dist/src/memory/sona-optimizer.js.map +1 -1
  446. package/dist/src/parser.d.ts +9 -0
  447. package/dist/src/parser.d.ts.map +1 -1
  448. package/dist/src/parser.js +11 -0
  449. package/dist/src/parser.js.map +1 -1
  450. package/dist/src/runtime/headless.js +28 -28
  451. package/dist/src/ruvector/agent-wasm.d.ts.map +1 -1
  452. package/dist/src/ruvector/agent-wasm.js +4 -1
  453. package/dist/src/ruvector/agent-wasm.js.map +1 -1
  454. package/dist/src/ruvector/index.d.ts +0 -2
  455. package/dist/src/ruvector/index.d.ts.map +1 -1
  456. package/dist/src/ruvector/index.js +8 -2
  457. package/dist/src/ruvector/index.js.map +1 -1
  458. package/dist/src/ruvector/model-router.d.ts +22 -1
  459. package/dist/src/ruvector/model-router.d.ts.map +1 -1
  460. package/dist/src/ruvector/model-router.js +125 -5
  461. package/dist/src/ruvector/model-router.js.map +1 -1
  462. package/dist/src/services/headless-worker-executor.js +84 -84
  463. package/dist/src/transfer/deploy-seraphine.js +23 -23
  464. package/dist/tsconfig.tsbuildinfo +1 -1
  465. package/package.json +5 -4
  466. package/scripts/deploy-ipfs-node.sh +153 -153
  467. package/scripts/postinstall.cjs +153 -153
  468. package/scripts/publish-registry.ts +345 -345
  469. package/scripts/publish.sh +57 -57
  470. package/scripts/setup-ipfs-registry.md +366 -366
  471. package/dist/src/services/event-stream.d.ts.map +0 -1
  472. package/dist/src/services/event-stream.js.map +0 -1
  473. package/dist/src/services/loop-worker-runner.d.ts.map +0 -1
  474. package/dist/src/services/loop-worker-runner.js.map +0 -1
  475. package/dist/src/services/runtime-capabilities.d.ts.map +0 -1
  476. package/dist/src/services/runtime-capabilities.js.map +0 -1
@@ -1,665 +1,665 @@
1
- ---
2
- name: Benchmark Suite
3
- type: agent
4
- category: optimization
5
- description: Comprehensive performance benchmarking, regression detection and performance validation
6
- ---
7
-
8
- # Benchmark Suite Agent
9
-
10
- ## Agent Profile
11
- - **Name**: Benchmark Suite
12
- - **Type**: Performance Optimization Agent
13
- - **Specialization**: Comprehensive performance benchmarking and testing
14
- - **Performance Focus**: Automated benchmarking, regression detection, and performance validation
15
-
16
- ## Core Capabilities
17
-
18
- ### 1. Comprehensive Benchmarking Framework
19
- ```javascript
20
- // Advanced benchmarking system
21
- class ComprehensiveBenchmarkSuite {
22
- constructor() {
23
- this.benchmarks = {
24
- // Core performance benchmarks
25
- throughput: new ThroughputBenchmark(),
26
- latency: new LatencyBenchmark(),
27
- scalability: new ScalabilityBenchmark(),
28
- resource_usage: new ResourceUsageBenchmark(),
29
-
30
- // Swarm-specific benchmarks
31
- coordination: new CoordinationBenchmark(),
32
- load_balancing: new LoadBalancingBenchmark(),
33
- topology: new TopologyBenchmark(),
34
- fault_tolerance: new FaultToleranceBenchmark(),
35
-
36
- // Custom benchmarks
37
- custom: new CustomBenchmarkManager()
38
- };
39
-
40
- this.reporter = new BenchmarkReporter();
41
- this.comparator = new PerformanceComparator();
42
- this.analyzer = new BenchmarkAnalyzer();
43
- }
44
-
45
- // Execute comprehensive benchmark suite
46
- async runBenchmarkSuite(config = {}) {
47
- const suiteConfig = {
48
- duration: config.duration || 300000, // 5 minutes default
49
- iterations: config.iterations || 10,
50
- warmupTime: config.warmupTime || 30000, // 30 seconds
51
- cooldownTime: config.cooldownTime || 10000, // 10 seconds
52
- parallel: config.parallel || false,
53
- baseline: config.baseline || null
54
- };
55
-
56
- const results = {
57
- summary: {},
58
- detailed: new Map(),
59
- baseline_comparison: null,
60
- recommendations: []
61
- };
62
-
63
- // Warmup phase
64
- await this.warmup(suiteConfig.warmupTime);
65
-
66
- // Execute benchmarks
67
- if (suiteConfig.parallel) {
68
- results.detailed = await this.runBenchmarksParallel(suiteConfig);
69
- } else {
70
- results.detailed = await this.runBenchmarksSequential(suiteConfig);
71
- }
72
-
73
- // Generate summary
74
- results.summary = this.generateSummary(results.detailed);
75
-
76
- // Compare with baseline if provided
77
- if (suiteConfig.baseline) {
78
- results.baseline_comparison = await this.compareWithBaseline(
79
- results.detailed,
80
- suiteConfig.baseline
81
- );
82
- }
83
-
84
- // Generate recommendations
85
- results.recommendations = await this.generateRecommendations(results);
86
-
87
- // Cooldown phase
88
- await this.cooldown(suiteConfig.cooldownTime);
89
-
90
- return results;
91
- }
92
-
93
- // Parallel benchmark execution
94
- async runBenchmarksParallel(config) {
95
- const benchmarkPromises = Object.entries(this.benchmarks).map(
96
- async ([name, benchmark]) => {
97
- const result = await this.executeBenchmark(benchmark, name, config);
98
- return [name, result];
99
- }
100
- );
101
-
102
- const results = await Promise.all(benchmarkPromises);
103
- return new Map(results);
104
- }
105
-
106
- // Sequential benchmark execution
107
- async runBenchmarksSequential(config) {
108
- const results = new Map();
109
-
110
- for (const [name, benchmark] of Object.entries(this.benchmarks)) {
111
- const result = await this.executeBenchmark(benchmark, name, config);
112
- results.set(name, result);
113
-
114
- // Brief pause between benchmarks
115
- await this.sleep(1000);
116
- }
117
-
118
- return results;
119
- }
120
- }
121
- ```
122
-
123
- ### 2. Performance Regression Detection
124
- ```javascript
125
- // Advanced regression detection system
126
- class RegressionDetector {
127
- constructor() {
128
- this.detectors = {
129
- statistical: new StatisticalRegressionDetector(),
130
- machine_learning: new MLRegressionDetector(),
131
- threshold: new ThresholdRegressionDetector(),
132
- trend: new TrendRegressionDetector()
133
- };
134
-
135
- this.analyzer = new RegressionAnalyzer();
136
- this.alerting = new RegressionAlerting();
137
- }
138
-
139
- // Detect performance regressions
140
- async detectRegressions(currentResults, historicalData, config = {}) {
141
- const regressions = {
142
- detected: [],
143
- severity: 'none',
144
- confidence: 0,
145
- analysis: {}
146
- };
147
-
148
- // Run multiple detection algorithms
149
- const detectionPromises = Object.entries(this.detectors).map(
150
- async ([method, detector]) => {
151
- const detection = await detector.detect(currentResults, historicalData, config);
152
- return [method, detection];
153
- }
154
- );
155
-
156
- const detectionResults = await Promise.all(detectionPromises);
157
-
158
- // Aggregate detection results
159
- for (const [method, detection] of detectionResults) {
160
- if (detection.regression_detected) {
161
- regressions.detected.push({
162
- method,
163
- ...detection
164
- });
165
- }
166
- }
167
-
168
- // Calculate overall confidence and severity
169
- if (regressions.detected.length > 0) {
170
- regressions.confidence = this.calculateAggregateConfidence(regressions.detected);
171
- regressions.severity = this.calculateSeverity(regressions.detected);
172
- regressions.analysis = await this.analyzer.analyze(regressions.detected);
173
- }
174
-
175
- return regressions;
176
- }
177
-
178
- // Statistical regression detection using change point analysis
179
- async detectStatisticalRegression(metric, historicalData, sensitivity = 0.95) {
180
- // Use CUSUM (Cumulative Sum) algorithm for change point detection
181
- const cusum = this.calculateCUSUM(metric, historicalData);
182
-
183
- // Detect change points
184
- const changePoints = this.detectChangePoints(cusum, sensitivity);
185
-
186
- // Analyze significance of changes
187
- const analysis = changePoints.map(point => ({
188
- timestamp: point.timestamp,
189
- magnitude: point.magnitude,
190
- direction: point.direction,
191
- significance: point.significance,
192
- confidence: point.confidence
193
- }));
194
-
195
- return {
196
- regression_detected: changePoints.length > 0,
197
- change_points: analysis,
198
- cusum_statistics: cusum.statistics,
199
- sensitivity: sensitivity
200
- };
201
- }
202
-
203
- // Machine learning-based regression detection
204
- async detectMLRegression(metrics, historicalData) {
205
- // Train anomaly detection model on historical data
206
- const model = await this.trainAnomalyModel(historicalData);
207
-
208
- // Predict anomaly scores for current metrics
209
- const anomalyScores = await model.predict(metrics);
210
-
211
- // Identify regressions based on anomaly scores
212
- const threshold = this.calculateDynamicThreshold(anomalyScores);
213
- const regressions = anomalyScores.filter(score => score.anomaly > threshold);
214
-
215
- return {
216
- regression_detected: regressions.length > 0,
217
- anomaly_scores: anomalyScores,
218
- threshold: threshold,
219
- regressions: regressions,
220
- model_confidence: model.confidence
221
- };
222
- }
223
- }
224
- ```
225
-
226
- ### 3. Automated Performance Testing
227
- ```javascript
228
- // Comprehensive automated performance testing
229
- class AutomatedPerformanceTester {
230
- constructor() {
231
- this.testSuites = {
232
- load: new LoadTestSuite(),
233
- stress: new StressTestSuite(),
234
- volume: new VolumeTestSuite(),
235
- endurance: new EnduranceTestSuite(),
236
- spike: new SpikeTestSuite(),
237
- configuration: new ConfigurationTestSuite()
238
- };
239
-
240
- this.scheduler = new TestScheduler();
241
- this.orchestrator = new TestOrchestrator();
242
- this.validator = new ResultValidator();
243
- }
244
-
245
- // Execute automated performance test campaign
246
- async runTestCampaign(config) {
247
- const campaign = {
248
- id: this.generateCampaignId(),
249
- config,
250
- startTime: Date.now(),
251
- tests: [],
252
- results: new Map(),
253
- summary: null
254
- };
255
-
256
- // Schedule test execution
257
- const schedule = await this.scheduler.schedule(config.tests, config.constraints);
258
-
259
- // Execute tests according to schedule
260
- for (const scheduledTest of schedule) {
261
- const testResult = await this.executeScheduledTest(scheduledTest);
262
- campaign.tests.push(scheduledTest);
263
- campaign.results.set(scheduledTest.id, testResult);
264
-
265
- // Validate results in real-time
266
- const validation = await this.validator.validate(testResult);
267
- if (!validation.valid) {
268
- campaign.summary = {
269
- status: 'failed',
270
- reason: validation.reason,
271
- failedAt: scheduledTest.name
272
- };
273
- break;
274
- }
275
- }
276
-
277
- // Generate campaign summary
278
- if (!campaign.summary) {
279
- campaign.summary = await this.generateCampaignSummary(campaign);
280
- }
281
-
282
- campaign.endTime = Date.now();
283
- campaign.duration = campaign.endTime - campaign.startTime;
284
-
285
- return campaign;
286
- }
287
-
288
- // Load testing with gradual ramp-up
289
- async executeLoadTest(config) {
290
- const loadTest = {
291
- type: 'load',
292
- config,
293
- phases: [],
294
- metrics: new Map(),
295
- results: {}
296
- };
297
-
298
- // Ramp-up phase
299
- const rampUpResult = await this.executeRampUp(config.rampUp);
300
- loadTest.phases.push({ phase: 'ramp-up', result: rampUpResult });
301
-
302
- // Sustained load phase
303
- const sustainedResult = await this.executeSustainedLoad(config.sustained);
304
- loadTest.phases.push({ phase: 'sustained', result: sustainedResult });
305
-
306
- // Ramp-down phase
307
- const rampDownResult = await this.executeRampDown(config.rampDown);
308
- loadTest.phases.push({ phase: 'ramp-down', result: rampDownResult });
309
-
310
- // Analyze results
311
- loadTest.results = await this.analyzeLoadTestResults(loadTest.phases);
312
-
313
- return loadTest;
314
- }
315
-
316
- // Stress testing to find breaking points
317
- async executeStressTest(config) {
318
- const stressTest = {
319
- type: 'stress',
320
- config,
321
- breakingPoint: null,
322
- degradationCurve: [],
323
- results: {}
324
- };
325
-
326
- let currentLoad = config.startLoad;
327
- let systemBroken = false;
328
-
329
- while (!systemBroken && currentLoad <= config.maxLoad) {
330
- const testResult = await this.applyLoad(currentLoad, config.duration);
331
-
332
- stressTest.degradationCurve.push({
333
- load: currentLoad,
334
- performance: testResult.performance,
335
- stability: testResult.stability,
336
- errors: testResult.errors
337
- });
338
-
339
- // Check if system is breaking
340
- if (this.isSystemBreaking(testResult, config.breakingCriteria)) {
341
- stressTest.breakingPoint = {
342
- load: currentLoad,
343
- performance: testResult.performance,
344
- reason: this.identifyBreakingReason(testResult)
345
- };
346
- systemBroken = true;
347
- }
348
-
349
- currentLoad += config.loadIncrement;
350
- }
351
-
352
- stressTest.results = await this.analyzeStressTestResults(stressTest);
353
-
354
- return stressTest;
355
- }
356
- }
357
- ```
358
-
359
- ### 4. Performance Validation Framework
360
- ```javascript
361
- // Comprehensive performance validation
362
- class PerformanceValidator {
363
- constructor() {
364
- this.validators = {
365
- sla: new SLAValidator(),
366
- regression: new RegressionValidator(),
367
- scalability: new ScalabilityValidator(),
368
- reliability: new ReliabilityValidator(),
369
- efficiency: new EfficiencyValidator()
370
- };
371
-
372
- this.thresholds = new ThresholdManager();
373
- this.rules = new ValidationRuleEngine();
374
- }
375
-
376
- // Validate performance against defined criteria
377
- async validatePerformance(results, criteria) {
378
- const validation = {
379
- overall: {
380
- passed: true,
381
- score: 0,
382
- violations: []
383
- },
384
- detailed: new Map(),
385
- recommendations: []
386
- };
387
-
388
- // Run all validators
389
- const validationPromises = Object.entries(this.validators).map(
390
- async ([type, validator]) => {
391
- const result = await validator.validate(results, criteria[type]);
392
- return [type, result];
393
- }
394
- );
395
-
396
- const validationResults = await Promise.all(validationPromises);
397
-
398
- // Aggregate validation results
399
- for (const [type, result] of validationResults) {
400
- validation.detailed.set(type, result);
401
-
402
- if (!result.passed) {
403
- validation.overall.passed = false;
404
- validation.overall.violations.push(...result.violations);
405
- }
406
-
407
- validation.overall.score += result.score * (criteria[type]?.weight || 1);
408
- }
409
-
410
- // Normalize overall score
411
- const totalWeight = Object.values(criteria).reduce((sum, c) => sum + (c.weight || 1), 0);
412
- validation.overall.score /= totalWeight;
413
-
414
- // Generate recommendations
415
- validation.recommendations = await this.generateValidationRecommendations(validation);
416
-
417
- return validation;
418
- }
419
-
420
- // SLA validation
421
- async validateSLA(results, slaConfig) {
422
- const slaValidation = {
423
- passed: true,
424
- violations: [],
425
- score: 1.0,
426
- metrics: {}
427
- };
428
-
429
- // Validate each SLA metric
430
- for (const [metric, threshold] of Object.entries(slaConfig.thresholds)) {
431
- const actualValue = this.extractMetricValue(results, metric);
432
- const validation = this.validateThreshold(actualValue, threshold);
433
-
434
- slaValidation.metrics[metric] = {
435
- actual: actualValue,
436
- threshold: threshold.value,
437
- operator: threshold.operator,
438
- passed: validation.passed,
439
- deviation: validation.deviation
440
- };
441
-
442
- if (!validation.passed) {
443
- slaValidation.passed = false;
444
- slaValidation.violations.push({
445
- metric,
446
- actual: actualValue,
447
- expected: threshold.value,
448
- severity: threshold.severity || 'medium'
449
- });
450
-
451
- // Reduce score based on violation severity
452
- const severityMultiplier = this.getSeverityMultiplier(threshold.severity);
453
- slaValidation.score -= (validation.deviation * severityMultiplier);
454
- }
455
- }
456
-
457
- slaValidation.score = Math.max(0, slaValidation.score);
458
-
459
- return slaValidation;
460
- }
461
-
462
- // Scalability validation
463
- async validateScalability(results, scalabilityConfig) {
464
- const scalabilityValidation = {
465
- passed: true,
466
- violations: [],
467
- score: 1.0,
468
- analysis: {}
469
- };
470
-
471
- // Linear scalability analysis
472
- if (scalabilityConfig.linear) {
473
- const linearityAnalysis = this.analyzeLinearScalability(results);
474
- scalabilityValidation.analysis.linearity = linearityAnalysis;
475
-
476
- if (linearityAnalysis.coefficient < scalabilityConfig.linear.minCoefficient) {
477
- scalabilityValidation.passed = false;
478
- scalabilityValidation.violations.push({
479
- type: 'linearity',
480
- actual: linearityAnalysis.coefficient,
481
- expected: scalabilityConfig.linear.minCoefficient
482
- });
483
- }
484
- }
485
-
486
- // Efficiency retention analysis
487
- if (scalabilityConfig.efficiency) {
488
- const efficiencyAnalysis = this.analyzeEfficiencyRetention(results);
489
- scalabilityValidation.analysis.efficiency = efficiencyAnalysis;
490
-
491
- if (efficiencyAnalysis.retention < scalabilityConfig.efficiency.minRetention) {
492
- scalabilityValidation.passed = false;
493
- scalabilityValidation.violations.push({
494
- type: 'efficiency_retention',
495
- actual: efficiencyAnalysis.retention,
496
- expected: scalabilityConfig.efficiency.minRetention
497
- });
498
- }
499
- }
500
-
501
- return scalabilityValidation;
502
- }
503
- }
504
- ```
505
-
506
- ## MCP Integration Hooks
507
-
508
- ### Benchmark Execution Integration
509
- ```javascript
510
- // Comprehensive MCP benchmark integration
511
- const benchmarkIntegration = {
512
- // Execute performance benchmarks
513
- async runBenchmarks(config = {}) {
514
- // Run benchmark suite
515
- const benchmarkResult = await mcp.benchmark_run({
516
- suite: config.suite || 'comprehensive'
517
- });
518
-
519
- // Collect detailed metrics during benchmarking
520
- const metrics = await mcp.metrics_collect({
521
- components: ['system', 'agents', 'coordination', 'memory']
522
- });
523
-
524
- // Analyze performance trends
525
- const trends = await mcp.trend_analysis({
526
- metric: 'performance',
527
- period: '24h'
528
- });
529
-
530
- // Cost analysis
531
- const costAnalysis = await mcp.cost_analysis({
532
- timeframe: '24h'
533
- });
534
-
535
- return {
536
- benchmark: benchmarkResult,
537
- metrics,
538
- trends,
539
- costAnalysis,
540
- timestamp: Date.now()
541
- };
542
- },
543
-
544
- // Quality assessment
545
- async assessQuality(criteria) {
546
- const qualityAssessment = await mcp.quality_assess({
547
- target: 'swarm-performance',
548
- criteria: criteria || [
549
- 'throughput',
550
- 'latency',
551
- 'reliability',
552
- 'scalability',
553
- 'efficiency'
554
- ]
555
- });
556
-
557
- return qualityAssessment;
558
- },
559
-
560
- // Error pattern analysis
561
- async analyzeErrorPatterns() {
562
- // Collect system logs
563
- const logs = await this.collectSystemLogs();
564
-
565
- // Analyze error patterns
566
- const errorAnalysis = await mcp.error_analysis({
567
- logs: logs
568
- });
569
-
570
- return errorAnalysis;
571
- }
572
- };
573
- ```
574
-
575
- ## Operational Commands
576
-
577
- ### Benchmarking Commands
578
- ```bash
579
- # Run comprehensive benchmark suite
580
- npx claude-flow benchmark-run --suite comprehensive --duration 300
581
-
582
- # Execute specific benchmark
583
- npx claude-flow benchmark-run --suite throughput --iterations 10
584
-
585
- # Compare with baseline
586
- npx claude-flow benchmark-compare --current <results> --baseline <baseline>
587
-
588
- # Quality assessment
589
- npx claude-flow quality-assess --target swarm-performance --criteria throughput,latency
590
-
591
- # Performance validation
592
- npx claude-flow validate-performance --results <file> --criteria <file>
593
- ```
594
-
595
- ### Regression Detection Commands
596
- ```bash
597
- # Detect performance regressions
598
- npx claude-flow detect-regression --current <results> --historical <data>
599
-
600
- # Set up automated regression monitoring
601
- npx claude-flow regression-monitor --enable --sensitivity 0.95
602
-
603
- # Analyze error patterns
604
- npx claude-flow error-analysis --logs <log-files>
605
- ```
606
-
607
- ## Integration Points
608
-
609
- ### With Other Optimization Agents
610
- - **Performance Monitor**: Provides continuous monitoring data for benchmarking
611
- - **Load Balancer**: Validates load balancing effectiveness through benchmarks
612
- - **Topology Optimizer**: Tests topology configurations for optimal performance
613
-
614
- ### With CI/CD Pipeline
615
- - **Automated Testing**: Integrates with CI/CD for continuous performance validation
616
- - **Quality Gates**: Provides pass/fail criteria for deployment decisions
617
- - **Regression Prevention**: Catches performance regressions before production
618
-
619
- ## Performance Benchmarks
620
-
621
- ### Standard Benchmark Suite
622
- ```javascript
623
- // Comprehensive benchmark definitions
624
- const standardBenchmarks = {
625
- // Throughput benchmarks
626
- throughput: {
627
- name: 'Throughput Benchmark',
628
- metrics: ['requests_per_second', 'tasks_per_second', 'messages_per_second'],
629
- duration: 300000, // 5 minutes
630
- warmup: 30000, // 30 seconds
631
- targets: {
632
- requests_per_second: { min: 1000, optimal: 5000 },
633
- tasks_per_second: { min: 100, optimal: 500 },
634
- messages_per_second: { min: 10000, optimal: 50000 }
635
- }
636
- },
637
-
638
- // Latency benchmarks
639
- latency: {
640
- name: 'Latency Benchmark',
641
- metrics: ['p50', 'p90', 'p95', 'p99', 'max'],
642
- duration: 300000,
643
- targets: {
644
- p50: { max: 100 }, // 100ms
645
- p90: { max: 200 }, // 200ms
646
- p95: { max: 500 }, // 500ms
647
- p99: { max: 1000 }, // 1s
648
- max: { max: 5000 } // 5s
649
- }
650
- },
651
-
652
- // Scalability benchmarks
653
- scalability: {
654
- name: 'Scalability Benchmark',
655
- metrics: ['linear_coefficient', 'efficiency_retention'],
656
- load_points: [1, 2, 4, 8, 16, 32, 64],
657
- targets: {
658
- linear_coefficient: { min: 0.8 },
659
- efficiency_retention: { min: 0.7 }
660
- }
661
- }
662
- };
663
- ```
664
-
1
+ ---
2
+ name: Benchmark Suite
3
+ type: agent
4
+ category: optimization
5
+ description: Comprehensive performance benchmarking, regression detection and performance validation
6
+ ---
7
+
8
+ # Benchmark Suite Agent
9
+
10
+ ## Agent Profile
11
+ - **Name**: Benchmark Suite
12
+ - **Type**: Performance Optimization Agent
13
+ - **Specialization**: Comprehensive performance benchmarking and testing
14
+ - **Performance Focus**: Automated benchmarking, regression detection, and performance validation
15
+
16
+ ## Core Capabilities
17
+
18
+ ### 1. Comprehensive Benchmarking Framework
19
+ ```javascript
20
+ // Advanced benchmarking system
21
+ class ComprehensiveBenchmarkSuite {
22
+ constructor() {
23
+ this.benchmarks = {
24
+ // Core performance benchmarks
25
+ throughput: new ThroughputBenchmark(),
26
+ latency: new LatencyBenchmark(),
27
+ scalability: new ScalabilityBenchmark(),
28
+ resource_usage: new ResourceUsageBenchmark(),
29
+
30
+ // Swarm-specific benchmarks
31
+ coordination: new CoordinationBenchmark(),
32
+ load_balancing: new LoadBalancingBenchmark(),
33
+ topology: new TopologyBenchmark(),
34
+ fault_tolerance: new FaultToleranceBenchmark(),
35
+
36
+ // Custom benchmarks
37
+ custom: new CustomBenchmarkManager()
38
+ };
39
+
40
+ this.reporter = new BenchmarkReporter();
41
+ this.comparator = new PerformanceComparator();
42
+ this.analyzer = new BenchmarkAnalyzer();
43
+ }
44
+
45
+ // Execute comprehensive benchmark suite
46
+ async runBenchmarkSuite(config = {}) {
47
+ const suiteConfig = {
48
+ duration: config.duration || 300000, // 5 minutes default
49
+ iterations: config.iterations || 10,
50
+ warmupTime: config.warmupTime || 30000, // 30 seconds
51
+ cooldownTime: config.cooldownTime || 10000, // 10 seconds
52
+ parallel: config.parallel || false,
53
+ baseline: config.baseline || null
54
+ };
55
+
56
+ const results = {
57
+ summary: {},
58
+ detailed: new Map(),
59
+ baseline_comparison: null,
60
+ recommendations: []
61
+ };
62
+
63
+ // Warmup phase
64
+ await this.warmup(suiteConfig.warmupTime);
65
+
66
+ // Execute benchmarks
67
+ if (suiteConfig.parallel) {
68
+ results.detailed = await this.runBenchmarksParallel(suiteConfig);
69
+ } else {
70
+ results.detailed = await this.runBenchmarksSequential(suiteConfig);
71
+ }
72
+
73
+ // Generate summary
74
+ results.summary = this.generateSummary(results.detailed);
75
+
76
+ // Compare with baseline if provided
77
+ if (suiteConfig.baseline) {
78
+ results.baseline_comparison = await this.compareWithBaseline(
79
+ results.detailed,
80
+ suiteConfig.baseline
81
+ );
82
+ }
83
+
84
+ // Generate recommendations
85
+ results.recommendations = await this.generateRecommendations(results);
86
+
87
+ // Cooldown phase
88
+ await this.cooldown(suiteConfig.cooldownTime);
89
+
90
+ return results;
91
+ }
92
+
93
+ // Parallel benchmark execution
94
+ async runBenchmarksParallel(config) {
95
+ const benchmarkPromises = Object.entries(this.benchmarks).map(
96
+ async ([name, benchmark]) => {
97
+ const result = await this.executeBenchmark(benchmark, name, config);
98
+ return [name, result];
99
+ }
100
+ );
101
+
102
+ const results = await Promise.all(benchmarkPromises);
103
+ return new Map(results);
104
+ }
105
+
106
+ // Sequential benchmark execution
107
+ async runBenchmarksSequential(config) {
108
+ const results = new Map();
109
+
110
+ for (const [name, benchmark] of Object.entries(this.benchmarks)) {
111
+ const result = await this.executeBenchmark(benchmark, name, config);
112
+ results.set(name, result);
113
+
114
+ // Brief pause between benchmarks
115
+ await this.sleep(1000);
116
+ }
117
+
118
+ return results;
119
+ }
120
+ }
121
+ ```
122
+
123
+ ### 2. Performance Regression Detection
124
+ ```javascript
125
+ // Advanced regression detection system
126
+ class RegressionDetector {
127
+ constructor() {
128
+ this.detectors = {
129
+ statistical: new StatisticalRegressionDetector(),
130
+ machine_learning: new MLRegressionDetector(),
131
+ threshold: new ThresholdRegressionDetector(),
132
+ trend: new TrendRegressionDetector()
133
+ };
134
+
135
+ this.analyzer = new RegressionAnalyzer();
136
+ this.alerting = new RegressionAlerting();
137
+ }
138
+
139
+ // Detect performance regressions
140
+ async detectRegressions(currentResults, historicalData, config = {}) {
141
+ const regressions = {
142
+ detected: [],
143
+ severity: 'none',
144
+ confidence: 0,
145
+ analysis: {}
146
+ };
147
+
148
+ // Run multiple detection algorithms
149
+ const detectionPromises = Object.entries(this.detectors).map(
150
+ async ([method, detector]) => {
151
+ const detection = await detector.detect(currentResults, historicalData, config);
152
+ return [method, detection];
153
+ }
154
+ );
155
+
156
+ const detectionResults = await Promise.all(detectionPromises);
157
+
158
+ // Aggregate detection results
159
+ for (const [method, detection] of detectionResults) {
160
+ if (detection.regression_detected) {
161
+ regressions.detected.push({
162
+ method,
163
+ ...detection
164
+ });
165
+ }
166
+ }
167
+
168
+ // Calculate overall confidence and severity
169
+ if (regressions.detected.length > 0) {
170
+ regressions.confidence = this.calculateAggregateConfidence(regressions.detected);
171
+ regressions.severity = this.calculateSeverity(regressions.detected);
172
+ regressions.analysis = await this.analyzer.analyze(regressions.detected);
173
+ }
174
+
175
+ return regressions;
176
+ }
177
+
178
+ // Statistical regression detection using change point analysis
179
+ async detectStatisticalRegression(metric, historicalData, sensitivity = 0.95) {
180
+ // Use CUSUM (Cumulative Sum) algorithm for change point detection
181
+ const cusum = this.calculateCUSUM(metric, historicalData);
182
+
183
+ // Detect change points
184
+ const changePoints = this.detectChangePoints(cusum, sensitivity);
185
+
186
+ // Analyze significance of changes
187
+ const analysis = changePoints.map(point => ({
188
+ timestamp: point.timestamp,
189
+ magnitude: point.magnitude,
190
+ direction: point.direction,
191
+ significance: point.significance,
192
+ confidence: point.confidence
193
+ }));
194
+
195
+ return {
196
+ regression_detected: changePoints.length > 0,
197
+ change_points: analysis,
198
+ cusum_statistics: cusum.statistics,
199
+ sensitivity: sensitivity
200
+ };
201
+ }
202
+
203
+ // Machine learning-based regression detection
204
+ async detectMLRegression(metrics, historicalData) {
205
+ // Train anomaly detection model on historical data
206
+ const model = await this.trainAnomalyModel(historicalData);
207
+
208
+ // Predict anomaly scores for current metrics
209
+ const anomalyScores = await model.predict(metrics);
210
+
211
+ // Identify regressions based on anomaly scores
212
+ const threshold = this.calculateDynamicThreshold(anomalyScores);
213
+ const regressions = anomalyScores.filter(score => score.anomaly > threshold);
214
+
215
+ return {
216
+ regression_detected: regressions.length > 0,
217
+ anomaly_scores: anomalyScores,
218
+ threshold: threshold,
219
+ regressions: regressions,
220
+ model_confidence: model.confidence
221
+ };
222
+ }
223
+ }
224
+ ```
225
+
226
+ ### 3. Automated Performance Testing
227
+ ```javascript
228
+ // Comprehensive automated performance testing
229
+ class AutomatedPerformanceTester {
230
+ constructor() {
231
+ this.testSuites = {
232
+ load: new LoadTestSuite(),
233
+ stress: new StressTestSuite(),
234
+ volume: new VolumeTestSuite(),
235
+ endurance: new EnduranceTestSuite(),
236
+ spike: new SpikeTestSuite(),
237
+ configuration: new ConfigurationTestSuite()
238
+ };
239
+
240
+ this.scheduler = new TestScheduler();
241
+ this.orchestrator = new TestOrchestrator();
242
+ this.validator = new ResultValidator();
243
+ }
244
+
245
+ // Execute automated performance test campaign
246
+ async runTestCampaign(config) {
247
+ const campaign = {
248
+ id: this.generateCampaignId(),
249
+ config,
250
+ startTime: Date.now(),
251
+ tests: [],
252
+ results: new Map(),
253
+ summary: null
254
+ };
255
+
256
+ // Schedule test execution
257
+ const schedule = await this.scheduler.schedule(config.tests, config.constraints);
258
+
259
+ // Execute tests according to schedule
260
+ for (const scheduledTest of schedule) {
261
+ const testResult = await this.executeScheduledTest(scheduledTest);
262
+ campaign.tests.push(scheduledTest);
263
+ campaign.results.set(scheduledTest.id, testResult);
264
+
265
+ // Validate results in real-time
266
+ const validation = await this.validator.validate(testResult);
267
+ if (!validation.valid) {
268
+ campaign.summary = {
269
+ status: 'failed',
270
+ reason: validation.reason,
271
+ failedAt: scheduledTest.name
272
+ };
273
+ break;
274
+ }
275
+ }
276
+
277
+ // Generate campaign summary
278
+ if (!campaign.summary) {
279
+ campaign.summary = await this.generateCampaignSummary(campaign);
280
+ }
281
+
282
+ campaign.endTime = Date.now();
283
+ campaign.duration = campaign.endTime - campaign.startTime;
284
+
285
+ return campaign;
286
+ }
287
+
288
+ // Load testing with gradual ramp-up
289
+ async executeLoadTest(config) {
290
+ const loadTest = {
291
+ type: 'load',
292
+ config,
293
+ phases: [],
294
+ metrics: new Map(),
295
+ results: {}
296
+ };
297
+
298
+ // Ramp-up phase
299
+ const rampUpResult = await this.executeRampUp(config.rampUp);
300
+ loadTest.phases.push({ phase: 'ramp-up', result: rampUpResult });
301
+
302
+ // Sustained load phase
303
+ const sustainedResult = await this.executeSustainedLoad(config.sustained);
304
+ loadTest.phases.push({ phase: 'sustained', result: sustainedResult });
305
+
306
+ // Ramp-down phase
307
+ const rampDownResult = await this.executeRampDown(config.rampDown);
308
+ loadTest.phases.push({ phase: 'ramp-down', result: rampDownResult });
309
+
310
+ // Analyze results
311
+ loadTest.results = await this.analyzeLoadTestResults(loadTest.phases);
312
+
313
+ return loadTest;
314
+ }
315
+
316
+ // Stress testing to find breaking points
317
+ async executeStressTest(config) {
318
+ const stressTest = {
319
+ type: 'stress',
320
+ config,
321
+ breakingPoint: null,
322
+ degradationCurve: [],
323
+ results: {}
324
+ };
325
+
326
+ let currentLoad = config.startLoad;
327
+ let systemBroken = false;
328
+
329
+ while (!systemBroken && currentLoad <= config.maxLoad) {
330
+ const testResult = await this.applyLoad(currentLoad, config.duration);
331
+
332
+ stressTest.degradationCurve.push({
333
+ load: currentLoad,
334
+ performance: testResult.performance,
335
+ stability: testResult.stability,
336
+ errors: testResult.errors
337
+ });
338
+
339
+ // Check if system is breaking
340
+ if (this.isSystemBreaking(testResult, config.breakingCriteria)) {
341
+ stressTest.breakingPoint = {
342
+ load: currentLoad,
343
+ performance: testResult.performance,
344
+ reason: this.identifyBreakingReason(testResult)
345
+ };
346
+ systemBroken = true;
347
+ }
348
+
349
+ currentLoad += config.loadIncrement;
350
+ }
351
+
352
+ stressTest.results = await this.analyzeStressTestResults(stressTest);
353
+
354
+ return stressTest;
355
+ }
356
+ }
357
+ ```
358
+
359
+ ### 4. Performance Validation Framework
360
+ ```javascript
361
+ // Comprehensive performance validation
362
/**
 * Validates performance results against per-category criteria.
 *
 * `validatePerformance` fans out to every entry of `this.validators` and
 * folds the individual results into one weighted verdict. `validateSLA` and
 * `validateScalability` are standalone checks.
 *
 * NOTE(review): the helpers called on `this` (`generateValidationRecommendations`,
 * `extractMetricValue`, `validateThreshold`, `getSeverityMultiplier`,
 * `analyzeLinearScalability`, `analyzeEfficiencyRetention`) are not defined in
 * this class as shown; they must be supplied elsewhere.
 */
class PerformanceValidator {
  constructor() {
    this.validators = {
      sla: new SLAValidator(),
      regression: new RegressionValidator(),
      scalability: new ScalabilityValidator(),
      reliability: new ReliabilityValidator(),
      efficiency: new EfficiencyValidator()
    };

    this.thresholds = new ThresholdManager();
    this.rules = new ValidationRuleEngine();
  }

  /**
   * Run every registered validator and aggregate the outcome.
   *
   * @param {*} results - Forwarded unchanged to each validator.
   * @param {object} [criteria={}] - Keyed by validator type; each entry is
   *   forwarded to that validator and may carry a numeric `weight`.
   * @returns {Promise<object>} `{ overall: { passed, score, violations },
   *   detailed: Map<type, result>, recommendations }`.
   */
  async validatePerformance(results, criteria = {}) {
    const validation = {
      overall: {
        passed: true,
        score: 0,
        violations: []
      },
      detailed: new Map(),
      recommendations: []
    };

    // Missing or falsy weights count as 1 (unchanged from the original rule).
    const weightOf = (type) => criteria?.[type]?.weight || 1;

    // Validators are independent, so run them concurrently.
    const validationResults = await Promise.all(
      Object.entries(this.validators).map(async ([type, validator]) => [
        type,
        await validator.validate(results, criteria?.[type])
      ])
    );

    // Accumulate the weight of every validator that actually contributed, so
    // the normalisation below uses exactly the weights applied to the scores.
    // Summing the weights found in `criteria` instead skews the result as soon
    // as a validator has no criteria entry (or criteria has extra keys).
    let totalWeight = 0;
    for (const [type, result] of validationResults) {
      validation.detailed.set(type, result);

      if (!result.passed) {
        validation.overall.passed = false;
        validation.overall.violations.push(...(result.violations ?? []));
      }

      const weight = weightOf(type);
      validation.overall.score += result.score * weight;
      totalWeight += weight;
    }

    // With no validators registered there is nothing to normalise; keep 0.
    if (totalWeight > 0) {
      validation.overall.score /= totalWeight;
    }

    validation.recommendations = await this.generateValidationRecommendations(validation);

    return validation;
  }

  /**
   * Check each configured SLA threshold against the measured value.
   *
   * @param {*} results - Source passed to `extractMetricValue`.
   * @param {object} slaConfig - Must expose `thresholds`, an object mapping a
   *   metric name to `{ value, operator, severity? }`.
   * @returns {Promise<object>} `{ passed, violations, score, metrics }`; the
   *   score starts at 1.0, drops by `deviation * severityMultiplier` per
   *   violation and is floored at 0.
   */
  async validateSLA(results, slaConfig) {
    const slaValidation = {
      passed: true,
      violations: [],
      score: 1.0,
      metrics: {}
    };

    for (const [metric, threshold] of Object.entries(slaConfig.thresholds)) {
      const actualValue = this.extractMetricValue(results, metric);
      const { passed, deviation } = this.validateThreshold(actualValue, threshold);

      slaValidation.metrics[metric] = {
        actual: actualValue,
        threshold: threshold.value,
        operator: threshold.operator,
        passed,
        deviation
      };

      if (passed) {
        continue;
      }

      // Resolve the severity once so the reported severity and the score
      // penalty always agree (previously the penalty saw `undefined` while
      // the violation was reported as 'medium').
      const severity = threshold.severity || 'medium';

      slaValidation.passed = false;
      slaValidation.violations.push({
        metric,
        actual: actualValue,
        expected: threshold.value,
        severity
      });

      slaValidation.score -= deviation * this.getSeverityMultiplier(severity);
    }

    slaValidation.score = Math.max(0, slaValidation.score);

    return slaValidation;
  }

  /**
   * Check linear scalability and efficiency retention against configured
   * minimums. Each check runs only when its config section is present.
   *
   * @param {*} results - Passed to the analysis helpers.
   * @param {object} scalabilityConfig - Optional `linear.minCoefficient` and
   *   `efficiency.minRetention` sections.
   * @returns {Promise<object>} `{ passed, violations, score, analysis }`.
   *   NOTE(review): `score` is never adjusted here and stays 1.0 even when a
   *   check fails - confirm whether that is intended.
   */
  async validateScalability(results, scalabilityConfig) {
    const scalabilityValidation = {
      passed: true,
      violations: [],
      score: 1.0,
      analysis: {}
    };

    const { linear, efficiency } = scalabilityConfig;

    if (linear) {
      const linearityAnalysis = this.analyzeLinearScalability(results);
      scalabilityValidation.analysis.linearity = linearityAnalysis;

      if (linearityAnalysis.coefficient < linear.minCoefficient) {
        scalabilityValidation.passed = false;
        scalabilityValidation.violations.push({
          type: 'linearity',
          actual: linearityAnalysis.coefficient,
          expected: linear.minCoefficient
        });
      }
    }

    if (efficiency) {
      const efficiencyAnalysis = this.analyzeEfficiencyRetention(results);
      scalabilityValidation.analysis.efficiency = efficiencyAnalysis;

      if (efficiencyAnalysis.retention < efficiency.minRetention) {
        scalabilityValidation.passed = false;
        scalabilityValidation.violations.push({
          type: 'efficiency_retention',
          actual: efficiencyAnalysis.retention,
          expected: efficiency.minRetention
        });
      }
    }

    return scalabilityValidation;
  }
}
504
+ ```
505
+
506
+ ## MCP Integration Hooks
507
+
508
+ ### Benchmark Execution Integration
509
+ ```javascript
510
+ // Comprehensive MCP benchmark integration
511
/**
 * Thin wrappers around the `mcp` benchmark, metrics and analysis tools.
 * `mcp` is expected to be in scope wherever this object is used.
 */
const benchmarkIntegration = {
  /**
   * Run a benchmark suite, then gather supporting metrics and analyses.
   *
   * @param {object} [config={}]
   * @param {string} [config.suite] - Suite name; defaults to 'comprehensive'.
   * @returns {Promise<object>} `{ benchmark, metrics, trends, costAnalysis, timestamp }`.
   */
  async runBenchmarks(config = {}) {
    const benchmarkResult = await mcp.benchmark_run({
      suite: config.suite || 'comprehensive'
    });

    // The calls below are issued one after another, only once the benchmark
    // run has resolved, so they describe the state after the run rather than
    // during it.
    const metrics = await mcp.metrics_collect({
      components: ['system', 'agents', 'coordination', 'memory']
    });

    const trends = await mcp.trend_analysis({
      metric: 'performance',
      period: '24h'
    });

    const costAnalysis = await mcp.cost_analysis({
      timeframe: '24h'
    });

    return {
      benchmark: benchmarkResult,
      metrics,
      trends,
      costAnalysis,
      timestamp: Date.now()
    };
  },

  /**
   * Request a quality assessment of 'swarm-performance'.
   *
   * @param {string[]} [criteria] - Criteria to assess; a falsy value selects
   *   throughput, latency, reliability, scalability and efficiency.
   * @returns {Promise<*>} Whatever `mcp.quality_assess` resolves to.
   */
  async assessQuality(criteria) {
    const qualityAssessment = await mcp.quality_assess({
      target: 'swarm-performance',
      criteria: criteria || [
        'throughput',
        'latency',
        'reliability',
        'scalability',
        'efficiency'
      ]
    });

    return qualityAssessment;
  },

  /**
   * Run error-pattern analysis over system logs.
   *
   * @param {*} [logs] - Logs to analyse. When omitted, they are obtained from
   *   `this.collectSystemLogs()` if the host object provides that method.
   * @returns {Promise<*>} Whatever `mcp.error_analysis` resolves to.
   * @throws {Error} When no logs are passed and no `collectSystemLogs`
   *   method is available.
   */
  async analyzeErrorPatterns(logs) {
    let systemLogs = logs;

    if (systemLogs === undefined) {
      // This object literal does not define collectSystemLogs itself, so the
      // unconditional call used to fail with an opaque TypeError. Use the
      // collector only when one has been attached, and say so otherwise.
      if (typeof this?.collectSystemLogs !== 'function') {
        throw new Error(
          'analyzeErrorPatterns: pass `logs` or provide a collectSystemLogs() method'
        );
      }
      systemLogs = await this.collectSystemLogs();
    }

    const errorAnalysis = await mcp.error_analysis({
      logs: systemLogs
    });

    return errorAnalysis;
  }
};
573
+ ```
574
+
575
+ ## Operational Commands
576
+
577
+ ### Benchmarking Commands
578
+ ```bash
579
+ # Run comprehensive benchmark suite
580
+ npx claude-flow benchmark-run --suite comprehensive --duration 300
581
+
582
+ # Execute specific benchmark
583
+ npx claude-flow benchmark-run --suite throughput --iterations 10
584
+
585
+ # Compare with baseline
586
+ npx claude-flow benchmark-compare --current <results> --baseline <baseline>
587
+
588
+ # Quality assessment
589
+ npx claude-flow quality-assess --target swarm-performance --criteria throughput,latency
590
+
591
+ # Performance validation
592
+ npx claude-flow validate-performance --results <file> --criteria <file>
593
+ ```
594
+
595
+ ### Regression Detection Commands
596
+ ```bash
597
+ # Detect performance regressions
598
+ npx claude-flow detect-regression --current <results> --historical <data>
599
+
600
+ # Set up automated regression monitoring
601
+ npx claude-flow regression-monitor --enable --sensitivity 0.95
602
+
603
+ # Analyze error patterns
604
+ npx claude-flow error-analysis --logs <log-files>
605
+ ```
606
+
607
+ ## Integration Points
608
+
609
+ ### With Other Optimization Agents
610
+ - **Performance Monitor**: Provides continuous monitoring data for benchmarking
611
+ - **Load Balancer**: Validates load balancing effectiveness through benchmarks
612
+ - **Topology Optimizer**: Tests topology configurations for optimal performance
613
+
614
+ ### With CI/CD Pipeline
615
+ - **Automated Testing**: Integrates with CI/CD for continuous performance validation
616
+ - **Quality Gates**: Provides pass/fail criteria for deployment decisions
617
+ - **Regression Prevention**: Catches performance regressions before production
618
+
619
+ ## Performance Benchmarks
620
+
621
+ ### Standard Benchmark Suite
622
+ ```javascript
623
+ // Comprehensive benchmark definitions
624
/**
 * Reference benchmark definitions: which metrics each benchmark reports, how
 * long it runs (milliseconds), and the target bounds per metric.
 */
const standardBenchmarks = (() => {
  // Time units in milliseconds, kept local so no extra names leak out.
  const SECOND_MS = 1000;
  const MINUTE_MS = 60 * SECOND_MS;

  return {
    // Throughput: lower bounds plus the rate considered optimal.
    throughput: {
      name: 'Throughput Benchmark',
      metrics: ['requests_per_second', 'tasks_per_second', 'messages_per_second'],
      duration: 5 * MINUTE_MS,
      warmup: 30 * SECOND_MS,
      targets: {
        requests_per_second: { min: 1000, optimal: 5000 },
        tasks_per_second: { min: 100, optimal: 500 },
        messages_per_second: { min: 10000, optimal: 50000 }
      }
    },

    // Latency: upper bounds per percentile, in milliseconds.
    latency: {
      name: 'Latency Benchmark',
      metrics: ['p50', 'p90', 'p95', 'p99', 'max'],
      duration: 5 * MINUTE_MS,
      targets: {
        p50: { max: 100 },
        p90: { max: 200 },
        p95: { max: 500 },
        p99: { max: 1 * SECOND_MS },
        max: { max: 5 * SECOND_MS }
      }
    },

    // Scalability: measured across doubling load points.
    scalability: {
      name: 'Scalability Benchmark',
      metrics: ['linear_coefficient', 'efficiency_retention'],
      load_points: [1, 2, 4, 8, 16, 32, 64],
      targets: {
        linear_coefficient: { min: 0.8 },
        efficiency_retention: { min: 0.7 }
      }
    }
  };
})();
663
+ ```
664
+
665
665
  This Benchmark Suite agent provides comprehensive automated performance testing, regression detection, and validation capabilities to ensure optimal swarm performance and prevent performance degradation.