agentic-qe 3.4.1 → 3.4.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (496) hide show
  1. package/.claude/skills/.validation/README.md +111 -0
  2. package/.claude/skills/.validation/examples/chaos-engineering-output.example.json +530 -0
  3. package/.claude/skills/.validation/examples/performance-testing-output.example.json +252 -0
  4. package/.claude/skills/.validation/examples/security-testing-output.example.json +413 -0
  5. package/.claude/skills/.validation/examples/testability-scoring-output.example.json +350 -0
  6. package/.claude/skills/.validation/schemas/skill-eval.schema.json +452 -0
  7. package/.claude/skills/.validation/schemas/skill-frontmatter.schema.json +341 -0
  8. package/.claude/skills/.validation/schemas/skill-output-meta.schema.json +199 -0
  9. package/.claude/skills/.validation/schemas/skill-output.template.json +610 -0
  10. package/.claude/skills/.validation/skill-validation-mcp-integration.md +250 -0
  11. package/.claude/skills/.validation/templates/eval.template.yaml +366 -0
  12. package/.claude/skills/.validation/templates/schemas/output.json +145 -0
  13. package/.claude/skills/.validation/templates/security-testing-eval.template.yaml +725 -0
  14. package/.claude/skills/.validation/templates/skill-frontmatter.example.yaml +225 -0
  15. package/.claude/skills/.validation/templates/validate.template.sh +1060 -0
  16. package/.claude/skills/.validation/templates/validator-lib.sh +1031 -0
  17. package/.claude/skills/.validation/test-data/invalid-output.json +5 -0
  18. package/.claude/skills/.validation/test-data/minimal-output.json +9 -0
  19. package/.claude/skills/.validation/test-data/sample-output.json +73 -0
  20. package/.claude/skills/TRUST-TIERS.md +158 -0
  21. package/.claude/skills/a11y-ally/SKILL.md +1664 -1658
  22. package/.claude/skills/a11y-ally/evals/a11y-ally.yaml +376 -0
  23. package/.claude/skills/a11y-ally/schemas/output.json +549 -0
  24. package/.claude/skills/a11y-ally/scripts/validate.sh +690 -0
  25. package/.claude/skills/accessibility-testing/SKILL.md +8 -1
  26. package/.claude/skills/accessibility-testing/evals/accessibility-testing.yaml +719 -0
  27. package/.claude/skills/accessibility-testing/schemas/output.json +776 -0
  28. package/.claude/skills/accessibility-testing/scripts/validate.sh +943 -0
  29. package/.claude/skills/accessibility-testing/test-data/sample-output.json +191 -0
  30. package/.claude/skills/agentic-quality-engineering/SKILL.md +4 -0
  31. package/.claude/skills/agentic-quality-engineering/schemas/output.json +577 -0
  32. package/.claude/skills/api-testing-patterns/SKILL.md +5 -0
  33. package/.claude/skills/api-testing-patterns/evals/api-testing-patterns.yaml +696 -0
  34. package/.claude/skills/api-testing-patterns/schemas/output.json +845 -0
  35. package/.claude/skills/api-testing-patterns/scripts/validate.sh +931 -0
  36. package/.claude/skills/aqe-v2-v3-migration/schemas/output.json +513 -0
  37. package/.claude/skills/aqe-v2-v3-migration/skill.md +4 -0
  38. package/.claude/skills/brutal-honesty-review/SKILL.md +5 -0
  39. package/.claude/skills/brutal-honesty-review/schemas/output.json +291 -0
  40. package/.claude/skills/brutal-honesty-review/scripts/validate.sh +130 -0
  41. package/.claude/skills/bug-reporting-excellence/SKILL.md +5 -0
  42. package/.claude/skills/bug-reporting-excellence/schemas/output.json +288 -0
  43. package/.claude/skills/bug-reporting-excellence/scripts/validate.sh +108 -0
  44. package/.claude/skills/chaos-engineering-resilience/SKILL.md +5 -0
  45. package/.claude/skills/chaos-engineering-resilience/evals/chaos-engineering-resilience.yaml +761 -0
  46. package/.claude/skills/chaos-engineering-resilience/schemas/output.json +1205 -0
  47. package/.claude/skills/chaos-engineering-resilience/scripts/validate.sh +1107 -0
  48. package/.claude/skills/cicd-pipeline-qe-orchestrator/SKILL.md +6 -0
  49. package/.claude/skills/cicd-pipeline-qe-orchestrator/evals/cicd-pipeline-qe-orchestrator.yaml +157 -0
  50. package/.claude/skills/cicd-pipeline-qe-orchestrator/schemas/output.json +542 -0
  51. package/.claude/skills/cicd-pipeline-qe-orchestrator/scripts/validate.sh +310 -0
  52. package/.claude/skills/code-review-quality/SKILL.md +5 -0
  53. package/.claude/skills/code-review-quality/schemas/output.json +264 -0
  54. package/.claude/skills/code-review-quality/scripts/validate.sh +113 -0
  55. package/.claude/skills/compatibility-testing/evals/compatibility-testing.yaml +410 -0
  56. package/.claude/skills/compatibility-testing/schemas/output.json +551 -0
  57. package/.claude/skills/compatibility-testing/scripts/validate.sh +605 -0
  58. package/.claude/skills/compliance-testing/SKILL.md +7 -0
  59. package/.claude/skills/compliance-testing/evals/compliance-testing.yaml +1107 -0
  60. package/.claude/skills/compliance-testing/schemas/output.json +845 -0
  61. package/.claude/skills/compliance-testing/scripts/validate.sh +888 -0
  62. package/.claude/skills/consultancy-practices/SKILL.md +4 -0
  63. package/.claude/skills/consultancy-practices/schemas/output.json +282 -0
  64. package/.claude/skills/context-driven-testing/SKILL.md +3 -0
  65. package/.claude/skills/contract-testing/SKILL.md +5 -0
  66. package/.claude/skills/contract-testing/evals/contract-testing.yaml +748 -0
  67. package/.claude/skills/contract-testing/schemas/output.json +638 -0
  68. package/.claude/skills/contract-testing/scripts/validate.sh +1033 -0
  69. package/.claude/skills/database-testing/SKILL.md +5 -0
  70. package/.claude/skills/database-testing/evals/database-testing.yaml +968 -0
  71. package/.claude/skills/database-testing/schemas/output.json +1446 -0
  72. package/.claude/skills/database-testing/scripts/validate.sh +1099 -0
  73. package/.claude/skills/exploratory-testing-advanced/SKILL.md +3 -0
  74. package/.claude/skills/holistic-testing-pact/SKILL.md +3 -0
  75. package/.claude/skills/localization-testing/SKILL.md +6 -0
  76. package/.claude/skills/localization-testing/evals/localization-testing.yaml +544 -0
  77. package/.claude/skills/localization-testing/schemas/output.json +325 -0
  78. package/.claude/skills/localization-testing/scripts/validate.sh +131 -0
  79. package/.claude/skills/mobile-testing/SKILL.md +6 -0
  80. package/.claude/skills/mobile-testing/evals/mobile-testing.yaml +537 -0
  81. package/.claude/skills/mobile-testing/schemas/output.json +318 -0
  82. package/.claude/skills/mobile-testing/scripts/validate.sh +127 -0
  83. package/.claude/skills/mutation-testing/SKILL.md +8 -1
  84. package/.claude/skills/mutation-testing/evals/mutation-testing.yaml +652 -0
  85. package/.claude/skills/mutation-testing/schemas/output.json +707 -0
  86. package/.claude/skills/mutation-testing/scripts/validate.sh +992 -0
  87. package/.claude/skills/mutation-testing/test-data/sample-output.json +295 -0
  88. package/.claude/skills/n8n-expression-testing/SKILL.md +6 -0
  89. package/.claude/skills/n8n-expression-testing/evals/n8n-expression-testing.yaml +450 -0
  90. package/.claude/skills/n8n-expression-testing/schemas/output.json +369 -0
  91. package/.claude/skills/n8n-expression-testing/scripts/validate.sh +162 -0
  92. package/.claude/skills/n8n-integration-testing-patterns/SKILL.md +6 -0
  93. package/.claude/skills/n8n-integration-testing-patterns/evals/n8n-integration-testing-patterns.yaml +522 -0
  94. package/.claude/skills/n8n-integration-testing-patterns/schemas/output.json +291 -0
  95. package/.claude/skills/n8n-integration-testing-patterns/scripts/validate.sh +104 -0
  96. package/.claude/skills/n8n-security-testing/SKILL.md +6 -0
  97. package/.claude/skills/n8n-security-testing/evals/n8n-security-testing.yaml +493 -0
  98. package/.claude/skills/n8n-security-testing/schemas/output.json +293 -0
  99. package/.claude/skills/n8n-security-testing/scripts/validate.sh +120 -0
  100. package/.claude/skills/n8n-trigger-testing-strategies/SKILL.md +6 -0
  101. package/.claude/skills/n8n-trigger-testing-strategies/evals/n8n-trigger-testing-strategies.yaml +500 -0
  102. package/.claude/skills/n8n-trigger-testing-strategies/schemas/output.json +295 -0
  103. package/.claude/skills/n8n-trigger-testing-strategies/scripts/validate.sh +121 -0
  104. package/.claude/skills/n8n-workflow-testing-fundamentals/SKILL.md +6 -0
  105. package/.claude/skills/n8n-workflow-testing-fundamentals/evals/n8n-workflow-testing-fundamentals.yaml +497 -0
  106. package/.claude/skills/n8n-workflow-testing-fundamentals/schemas/output.json +254 -0
  107. package/.claude/skills/n8n-workflow-testing-fundamentals/scripts/validate.sh +126 -0
  108. package/.claude/skills/performance-analysis/SKILL.md +6 -0
  109. package/.claude/skills/performance-analysis/evals/performance-analysis.yaml +144 -0
  110. package/.claude/skills/performance-analysis/schemas/output.json +588 -0
  111. package/.claude/skills/performance-analysis/scripts/validate.sh +63 -0
  112. package/.claude/skills/performance-testing/SKILL.md +5 -0
  113. package/.claude/skills/performance-testing/evals/performance-testing.yaml +772 -0
  114. package/.claude/skills/performance-testing/schemas/output.json +1184 -0
  115. package/.claude/skills/performance-testing/scripts/validate.sh +1090 -0
  116. package/.claude/skills/qcsd-ideation-swarm/SKILL.md +1759 -1753
  117. package/.claude/skills/qcsd-ideation-swarm/evals/qcsd-ideation-swarm.yaml +138 -0
  118. package/.claude/skills/qcsd-ideation-swarm/schemas/output.json +568 -0
  119. package/.claude/skills/qcsd-ideation-swarm/scripts/validate.sh +56 -0
  120. package/.claude/skills/qe-chaos-resilience/SKILL.md +6 -0
  121. package/.claude/skills/qe-chaos-resilience/evals/qe-chaos-resilience.yaml +443 -0
  122. package/.claude/skills/qe-chaos-resilience/schemas/output.json +314 -0
  123. package/.claude/skills/qe-chaos-resilience/scripts/validate.sh +401 -0
  124. package/.claude/skills/qe-code-intelligence/SKILL.md +6 -0
  125. package/.claude/skills/qe-code-intelligence/evals/qe-code-intelligence.yaml +459 -0
  126. package/.claude/skills/qe-code-intelligence/schemas/output.json +315 -0
  127. package/.claude/skills/qe-code-intelligence/scripts/validate.sh +408 -0
  128. package/.claude/skills/qe-contract-testing/SKILL.md +6 -0
  129. package/.claude/skills/qe-contract-testing/evals/qe-contract-testing.yaml +513 -0
  130. package/.claude/skills/qe-contract-testing/schemas/output.json +295 -0
  131. package/.claude/skills/qe-contract-testing/scripts/validate.sh +421 -0
  132. package/.claude/skills/qe-coverage-analysis/SKILL.md +6 -0
  133. package/.claude/skills/qe-coverage-analysis/evals/qe-coverage-analysis.yaml +494 -0
  134. package/.claude/skills/qe-coverage-analysis/schemas/output.json +286 -0
  135. package/.claude/skills/qe-coverage-analysis/scripts/validate.sh +453 -0
  136. package/.claude/skills/qe-defect-intelligence/SKILL.md +6 -0
  137. package/.claude/skills/qe-defect-intelligence/evals/qe-defect-intelligence.yaml +511 -0
  138. package/.claude/skills/qe-defect-intelligence/schemas/output.json +283 -0
  139. package/.claude/skills/qe-defect-intelligence/scripts/validate.sh +466 -0
  140. package/.claude/skills/qe-iterative-loop/SKILL.md +445 -440
  141. package/.claude/skills/qe-iterative-loop/schemas/output.json +264 -0
  142. package/.claude/skills/qe-iterative-loop/scripts/validate.sh +474 -0
  143. package/.claude/skills/qe-learning-optimization/SKILL.md +6 -0
  144. package/.claude/skills/qe-learning-optimization/evals/qe-learning-optimization.yaml +144 -0
  145. package/.claude/skills/qe-learning-optimization/schemas/output.json +288 -0
  146. package/.claude/skills/qe-learning-optimization/scripts/validate.sh +56 -0
  147. package/.claude/skills/qe-quality-assessment/SKILL.md +6 -0
  148. package/.claude/skills/qe-quality-assessment/evals/qe-quality-assessment.yaml +506 -0
  149. package/.claude/skills/qe-quality-assessment/schemas/output.json +550 -0
  150. package/.claude/skills/qe-quality-assessment/scripts/validate.sh +352 -0
  151. package/.claude/skills/qe-requirements-validation/SKILL.md +6 -0
  152. package/.claude/skills/qe-requirements-validation/evals/qe-requirements-validation.yaml +598 -0
  153. package/.claude/skills/qe-requirements-validation/schemas/output.json +587 -0
  154. package/.claude/skills/qe-requirements-validation/scripts/validate.sh +275 -0
  155. package/.claude/skills/qe-security-compliance/SKILL.md +6 -0
  156. package/.claude/skills/qe-security-compliance/evals/qe-security-compliance.yaml +595 -0
  157. package/.claude/skills/qe-security-compliance/schemas/output.json +498 -0
  158. package/.claude/skills/qe-security-compliance/scripts/validate.sh +305 -0
  159. package/.claude/skills/qe-test-execution/SKILL.md +6 -0
  160. package/.claude/skills/qe-test-execution/evals/qe-test-execution.yaml +607 -0
  161. package/.claude/skills/qe-test-execution/schemas/output.json +529 -0
  162. package/.claude/skills/qe-test-execution/scripts/validate.sh +323 -0
  163. package/.claude/skills/qe-test-generation/SKILL.md +6 -0
  164. package/.claude/skills/qe-test-generation/evals/qe-test-generation.yaml +148 -0
  165. package/.claude/skills/qe-test-generation/schemas/output.json +439 -0
  166. package/.claude/skills/qe-test-generation/scripts/validate.sh +56 -0
  167. package/.claude/skills/qe-visual-accessibility/SKILL.md +6 -0
  168. package/.claude/skills/qe-visual-accessibility/evals/qe-visual-accessibility.yaml +142 -0
  169. package/.claude/skills/qe-visual-accessibility/schemas/output.json +491 -0
  170. package/.claude/skills/qe-visual-accessibility/scripts/validate.sh +56 -0
  171. package/.claude/skills/quality-metrics/SKILL.md +6 -0
  172. package/.claude/skills/quality-metrics/evals/quality-metrics.yaml +494 -0
  173. package/.claude/skills/quality-metrics/schemas/output.json +403 -0
  174. package/.claude/skills/quality-metrics/scripts/validate.sh +434 -0
  175. package/.claude/skills/refactoring-patterns/SKILL.md +5 -0
  176. package/.claude/skills/refactoring-patterns/schemas/output.json +475 -0
  177. package/.claude/skills/refactoring-patterns/scripts/validate.sh +241 -0
  178. package/.claude/skills/regression-testing/SKILL.md +6 -0
  179. package/.claude/skills/regression-testing/evals/regression-testing.yaml +504 -0
  180. package/.claude/skills/regression-testing/schemas/output.json +311 -0
  181. package/.claude/skills/regression-testing/scripts/validate.sh +130 -0
  182. package/.claude/skills/risk-based-testing/SKILL.md +6 -0
  183. package/.claude/skills/risk-based-testing/evals/risk-based-testing.yaml +141 -0
  184. package/.claude/skills/risk-based-testing/schemas/output.json +480 -0
  185. package/.claude/skills/risk-based-testing/scripts/validate.sh +56 -0
  186. package/.claude/skills/security-testing/SKILL.md +5 -0
  187. package/.claude/skills/security-testing/evals/security-testing.yaml +789 -0
  188. package/.claude/skills/security-testing/schemas/output.json +879 -0
  189. package/.claude/skills/security-testing/scripts/validate.sh +967 -0
  190. package/.claude/skills/security-visual-testing/SKILL.md +223 -217
  191. package/.claude/skills/security-visual-testing/evals/security-visual-testing.yaml +163 -0
  192. package/.claude/skills/security-visual-testing/schemas/output.json +486 -0
  193. package/.claude/skills/security-visual-testing/scripts/validate.sh +748 -0
  194. package/.claude/skills/sherlock-review/SKILL.md +5 -0
  195. package/.claude/skills/sherlock-review/schemas/output.json +297 -0
  196. package/.claude/skills/sherlock-review/scripts/validate.sh +115 -0
  197. package/.claude/skills/shift-left-testing/SKILL.md +6 -0
  198. package/.claude/skills/shift-left-testing/evals/shift-left-testing.yaml +145 -0
  199. package/.claude/skills/shift-left-testing/schemas/output.json +459 -0
  200. package/.claude/skills/shift-left-testing/scripts/validate.sh +56 -0
  201. package/.claude/skills/shift-right-testing/SKILL.md +6 -0
  202. package/.claude/skills/shift-right-testing/evals/shift-right-testing.yaml +147 -0
  203. package/.claude/skills/shift-right-testing/schemas/output.json +418 -0
  204. package/.claude/skills/shift-right-testing/scripts/validate.sh +56 -0
  205. package/.claude/skills/six-thinking-hats/SKILL.md +3 -0
  206. package/.claude/skills/tdd-london-chicago/SKILL.md +5 -0
  207. package/.claude/skills/tdd-london-chicago/schemas/output.json +444 -0
  208. package/.claude/skills/tdd-london-chicago/scripts/validate.sh +214 -0
  209. package/.claude/skills/technical-writing/SKILL.md +4 -0
  210. package/.claude/skills/technical-writing/schemas/output.json +268 -0
  211. package/.claude/skills/test-automation-strategy/SKILL.md +6 -0
  212. package/.claude/skills/test-automation-strategy/evals/test-automation-strategy.yaml +148 -0
  213. package/.claude/skills/test-automation-strategy/schemas/output.json +444 -0
  214. package/.claude/skills/test-automation-strategy/scripts/validate.sh +195 -0
  215. package/.claude/skills/test-data-management/SKILL.md +6 -0
  216. package/.claude/skills/test-data-management/evals/test-data-management.yaml +504 -0
  217. package/.claude/skills/test-data-management/schemas/output.json +284 -0
  218. package/.claude/skills/test-data-management/scripts/validate.sh +137 -0
  219. package/.claude/skills/test-design-techniques/SKILL.md +6 -0
  220. package/.claude/skills/test-design-techniques/evals/test-design-techniques.yaml +142 -0
  221. package/.claude/skills/test-design-techniques/schemas/output.json +295 -0
  222. package/.claude/skills/test-design-techniques/scripts/validate.sh +91 -0
  223. package/.claude/skills/test-environment-management/SKILL.md +4 -0
  224. package/.claude/skills/test-environment-management/schemas/output.json +310 -0
  225. package/.claude/skills/test-reporting-analytics/SKILL.md +6 -0
  226. package/.claude/skills/test-reporting-analytics/evals/test-reporting-analytics.yaml +155 -0
  227. package/.claude/skills/test-reporting-analytics/schemas/output.json +329 -0
  228. package/.claude/skills/test-reporting-analytics/scripts/validate.sh +77 -0
  229. package/.claude/skills/testability-scoring/SKILL.md +5 -0
  230. package/.claude/skills/testability-scoring/evals/testability-scoring.yaml +814 -0
  231. package/.claude/skills/testability-scoring/schemas/output.json +606 -0
  232. package/.claude/skills/testability-scoring/scripts/validate.sh +891 -0
  233. package/.claude/skills/trust-tier-manifest.json +2333 -0
  234. package/.claude/skills/verification-quality/SKILL.md +6 -0
  235. package/.claude/skills/verification-quality/evals/verification-quality.yaml +150 -0
  236. package/.claude/skills/verification-quality/schemas/output.json +432 -0
  237. package/.claude/skills/verification-quality/scripts/validate.sh +77 -0
  238. package/.claude/skills/visual-testing-advanced/SKILL.md +6 -0
  239. package/.claude/skills/visual-testing-advanced/evals/visual-testing-advanced.yaml +154 -0
  240. package/.claude/skills/visual-testing-advanced/schemas/output.json +294 -0
  241. package/.claude/skills/visual-testing-advanced/scripts/validate.sh +77 -0
  242. package/.claude/skills/xp-practices/SKILL.md +3 -0
  243. package/README.md +39 -2
  244. package/package.json +4 -1
  245. package/scripts/run-skill-eval.ts +1097 -0
  246. package/scripts/test-schema-validation.js +301 -0
  247. package/scripts/update-skill-manifest.ts +751 -0
  248. package/scripts/validate-skill-frontmatter.js +141 -0
  249. package/v3/CHANGELOG.md +21 -0
  250. package/v3/README.md +43 -3
  251. package/v3/assets/agents/v3/qe-test-idea-rewriter.md +375 -375
  252. package/v3/assets/skills/.validation/README.md +111 -0
  253. package/v3/assets/skills/.validation/examples/chaos-engineering-output.example.json +530 -0
  254. package/v3/assets/skills/.validation/examples/performance-testing-output.example.json +252 -0
  255. package/v3/assets/skills/.validation/examples/security-testing-output.example.json +413 -0
  256. package/v3/assets/skills/.validation/examples/testability-scoring-output.example.json +350 -0
  257. package/v3/assets/skills/.validation/schemas/skill-eval.schema.json +452 -0
  258. package/v3/assets/skills/.validation/schemas/skill-frontmatter.schema.json +341 -0
  259. package/v3/assets/skills/.validation/schemas/skill-output-meta.schema.json +199 -0
  260. package/v3/assets/skills/.validation/schemas/skill-output.template.json +610 -0
  261. package/v3/assets/skills/.validation/skill-validation-mcp-integration.md +250 -0
  262. package/v3/assets/skills/.validation/templates/eval.template.yaml +366 -0
  263. package/v3/assets/skills/.validation/templates/schemas/output.json +145 -0
  264. package/v3/assets/skills/.validation/templates/security-testing-eval.template.yaml +725 -0
  265. package/v3/assets/skills/.validation/templates/skill-frontmatter.example.yaml +225 -0
  266. package/v3/assets/skills/.validation/templates/validate.template.sh +1060 -0
  267. package/v3/assets/skills/.validation/templates/validator-lib.sh +1031 -0
  268. package/v3/assets/skills/.validation/test-data/invalid-output.json +5 -0
  269. package/v3/assets/skills/.validation/test-data/minimal-output.json +9 -0
  270. package/v3/assets/skills/.validation/test-data/sample-output.json +73 -0
  271. package/v3/assets/skills/accessibility-testing/SKILL.md +8 -1
  272. package/v3/assets/skills/accessibility-testing/evals/accessibility-testing.yaml +719 -0
  273. package/v3/assets/skills/accessibility-testing/schemas/output.json +776 -0
  274. package/v3/assets/skills/accessibility-testing/scripts/validate.sh +943 -0
  275. package/v3/assets/skills/accessibility-testing/test-data/sample-output.json +191 -0
  276. package/v3/assets/skills/agentic-quality-engineering/SKILL.md +4 -0
  277. package/v3/assets/skills/agentic-quality-engineering/schemas/output.json +577 -0
  278. package/v3/assets/skills/api-testing-patterns/SKILL.md +5 -0
  279. package/v3/assets/skills/api-testing-patterns/evals/api-testing-patterns.yaml +696 -0
  280. package/v3/assets/skills/api-testing-patterns/schemas/output.json +845 -0
  281. package/v3/assets/skills/api-testing-patterns/scripts/validate.sh +931 -0
  282. package/v3/assets/skills/aqe-v2-v3-migration/schemas/output.json +513 -0
  283. package/v3/assets/skills/aqe-v2-v3-migration/skill.md +20 -16
  284. package/v3/assets/skills/bug-reporting-excellence/SKILL.md +5 -0
  285. package/v3/assets/skills/bug-reporting-excellence/schemas/output.json +288 -0
  286. package/v3/assets/skills/bug-reporting-excellence/scripts/validate.sh +108 -0
  287. package/v3/assets/skills/chaos-engineering-resilience/SKILL.md +5 -0
  288. package/v3/assets/skills/chaos-engineering-resilience/evals/chaos-engineering-resilience.yaml +761 -0
  289. package/v3/assets/skills/chaos-engineering-resilience/schemas/output.json +1205 -0
  290. package/v3/assets/skills/chaos-engineering-resilience/scripts/validate.sh +1107 -0
  291. package/v3/assets/skills/code-review-quality/SKILL.md +5 -0
  292. package/v3/assets/skills/code-review-quality/schemas/output.json +264 -0
  293. package/v3/assets/skills/code-review-quality/scripts/validate.sh +113 -0
  294. package/v3/assets/skills/compatibility-testing/evals/compatibility-testing.yaml +410 -0
  295. package/v3/assets/skills/compatibility-testing/schemas/output.json +551 -0
  296. package/v3/assets/skills/compatibility-testing/scripts/validate.sh +605 -0
  297. package/v3/assets/skills/compliance-testing/SKILL.md +7 -0
  298. package/v3/assets/skills/compliance-testing/evals/compliance-testing.yaml +1107 -0
  299. package/v3/assets/skills/compliance-testing/schemas/output.json +845 -0
  300. package/v3/assets/skills/compliance-testing/scripts/validate.sh +888 -0
  301. package/v3/assets/skills/consultancy-practices/SKILL.md +4 -0
  302. package/v3/assets/skills/consultancy-practices/schemas/output.json +282 -0
  303. package/v3/assets/skills/context-driven-testing/SKILL.md +3 -0
  304. package/v3/assets/skills/contract-testing/SKILL.md +5 -0
  305. package/v3/assets/skills/contract-testing/evals/contract-testing.yaml +748 -0
  306. package/v3/assets/skills/contract-testing/schemas/output.json +638 -0
  307. package/v3/assets/skills/contract-testing/scripts/validate.sh +1033 -0
  308. package/v3/assets/skills/database-testing/SKILL.md +5 -0
  309. package/v3/assets/skills/database-testing/evals/database-testing.yaml +968 -0
  310. package/v3/assets/skills/database-testing/schemas/output.json +1446 -0
  311. package/v3/assets/skills/database-testing/scripts/validate.sh +1099 -0
  312. package/v3/assets/skills/exploratory-testing-advanced/SKILL.md +3 -0
  313. package/v3/assets/skills/holistic-testing-pact/SKILL.md +3 -0
  314. package/v3/assets/skills/localization-testing/SKILL.md +6 -0
  315. package/v3/assets/skills/localization-testing/evals/localization-testing.yaml +544 -0
  316. package/v3/assets/skills/localization-testing/schemas/output.json +325 -0
  317. package/v3/assets/skills/localization-testing/scripts/validate.sh +131 -0
  318. package/v3/assets/skills/mobile-testing/SKILL.md +6 -0
  319. package/v3/assets/skills/mobile-testing/evals/mobile-testing.yaml +537 -0
  320. package/v3/assets/skills/mobile-testing/schemas/output.json +318 -0
  321. package/v3/assets/skills/mobile-testing/scripts/validate.sh +127 -0
  322. package/v3/assets/skills/mutation-testing/SKILL.md +8 -1
  323. package/v3/assets/skills/mutation-testing/evals/mutation-testing.yaml +652 -0
  324. package/v3/assets/skills/mutation-testing/schemas/output.json +707 -0
  325. package/v3/assets/skills/mutation-testing/scripts/validate.sh +992 -0
  326. package/v3/assets/skills/mutation-testing/test-data/sample-output.json +295 -0
  327. package/v3/assets/skills/n8n-expression-testing/scripts/validate.sh +162 -0
  328. package/v3/assets/skills/n8n-integration-testing-patterns/scripts/validate.sh +104 -0
  329. package/v3/assets/skills/n8n-security-testing/scripts/validate.sh +120 -0
  330. package/v3/assets/skills/n8n-trigger-testing-strategies/scripts/validate.sh +121 -0
  331. package/v3/assets/skills/n8n-workflow-testing-fundamentals/scripts/validate.sh +126 -0
  332. package/v3/assets/skills/performance-testing/SKILL.md +5 -0
  333. package/v3/assets/skills/performance-testing/evals/performance-testing.yaml +772 -0
  334. package/v3/assets/skills/performance-testing/schemas/output.json +1184 -0
  335. package/v3/assets/skills/performance-testing/scripts/validate.sh +1090 -0
  336. package/v3/assets/skills/qe-chaos-resilience/SKILL.md +6 -0
  337. package/v3/assets/skills/qe-chaos-resilience/evals/qe-chaos-resilience.yaml +443 -0
  338. package/v3/assets/skills/qe-chaos-resilience/schemas/output.json +314 -0
  339. package/v3/assets/skills/qe-chaos-resilience/scripts/validate.sh +401 -0
  340. package/v3/assets/skills/qe-code-intelligence/SKILL.md +6 -0
  341. package/v3/assets/skills/qe-code-intelligence/evals/qe-code-intelligence.yaml +459 -0
  342. package/v3/assets/skills/qe-code-intelligence/schemas/output.json +315 -0
  343. package/v3/assets/skills/qe-code-intelligence/scripts/validate.sh +408 -0
  344. package/v3/assets/skills/qe-contract-testing/SKILL.md +6 -0
  345. package/v3/assets/skills/qe-contract-testing/evals/qe-contract-testing.yaml +513 -0
  346. package/v3/assets/skills/qe-contract-testing/schemas/output.json +295 -0
  347. package/v3/assets/skills/qe-contract-testing/scripts/validate.sh +421 -0
  348. package/v3/assets/skills/qe-coverage-analysis/SKILL.md +6 -0
  349. package/v3/assets/skills/qe-coverage-analysis/evals/qe-coverage-analysis.yaml +494 -0
  350. package/v3/assets/skills/qe-coverage-analysis/schemas/output.json +286 -0
  351. package/v3/assets/skills/qe-coverage-analysis/scripts/validate.sh +453 -0
  352. package/v3/assets/skills/qe-defect-intelligence/SKILL.md +6 -0
  353. package/v3/assets/skills/qe-defect-intelligence/evals/qe-defect-intelligence.yaml +511 -0
  354. package/v3/assets/skills/qe-defect-intelligence/schemas/output.json +283 -0
  355. package/v3/assets/skills/qe-defect-intelligence/scripts/validate.sh +466 -0
  356. package/v3/assets/skills/qe-iterative-loop/SKILL.md +445 -443
  357. package/v3/assets/skills/qe-iterative-loop/schemas/output.json +264 -0
  358. package/v3/assets/skills/qe-iterative-loop/scripts/validate.sh +474 -0
  359. package/v3/assets/skills/qe-learning-optimization/SKILL.md +6 -0
  360. package/v3/assets/skills/qe-learning-optimization/evals/qe-learning-optimization.yaml +144 -0
  361. package/v3/assets/skills/qe-learning-optimization/schemas/output.json +288 -0
  362. package/v3/assets/skills/qe-learning-optimization/scripts/validate.sh +56 -0
  363. package/v3/assets/skills/qe-quality-assessment/SKILL.md +6 -0
  364. package/v3/assets/skills/qe-quality-assessment/evals/qe-quality-assessment.yaml +506 -0
  365. package/v3/assets/skills/qe-quality-assessment/schemas/output.json +550 -0
  366. package/v3/assets/skills/qe-quality-assessment/scripts/validate.sh +352 -0
  367. package/v3/assets/skills/qe-requirements-validation/SKILL.md +6 -0
  368. package/v3/assets/skills/qe-requirements-validation/evals/qe-requirements-validation.yaml +598 -0
  369. package/v3/assets/skills/qe-requirements-validation/schemas/output.json +587 -0
  370. package/v3/assets/skills/qe-requirements-validation/scripts/validate.sh +275 -0
  371. package/v3/assets/skills/qe-security-compliance/SKILL.md +6 -0
  372. package/v3/assets/skills/qe-security-compliance/evals/qe-security-compliance.yaml +595 -0
  373. package/v3/assets/skills/qe-security-compliance/schemas/output.json +498 -0
  374. package/v3/assets/skills/qe-security-compliance/scripts/validate.sh +305 -0
  375. package/v3/assets/skills/qe-test-execution/SKILL.md +6 -0
  376. package/v3/assets/skills/qe-test-execution/evals/qe-test-execution.yaml +607 -0
  377. package/v3/assets/skills/qe-test-execution/schemas/output.json +529 -0
  378. package/v3/assets/skills/qe-test-execution/scripts/validate.sh +323 -0
  379. package/v3/assets/skills/qe-test-generation/SKILL.md +6 -0
  380. package/v3/assets/skills/qe-test-generation/evals/qe-test-generation.yaml +148 -0
  381. package/v3/assets/skills/qe-test-generation/schemas/output.json +439 -0
  382. package/v3/assets/skills/qe-test-generation/scripts/validate.sh +56 -0
  383. package/v3/assets/skills/qe-visual-accessibility/SKILL.md +6 -0
  384. package/v3/assets/skills/qe-visual-accessibility/evals/qe-visual-accessibility.yaml +142 -0
  385. package/v3/assets/skills/qe-visual-accessibility/schemas/output.json +491 -0
  386. package/v3/assets/skills/qe-visual-accessibility/scripts/validate.sh +56 -0
  387. package/v3/assets/skills/quality-metrics/SKILL.md +6 -0
  388. package/v3/assets/skills/quality-metrics/evals/quality-metrics.yaml +494 -0
  389. package/v3/assets/skills/quality-metrics/schemas/output.json +403 -0
  390. package/v3/assets/skills/quality-metrics/scripts/validate.sh +434 -0
  391. package/v3/assets/skills/refactoring-patterns/SKILL.md +5 -0
  392. package/v3/assets/skills/refactoring-patterns/schemas/output.json +475 -0
  393. package/v3/assets/skills/refactoring-patterns/scripts/validate.sh +241 -0
  394. package/v3/assets/skills/regression-testing/SKILL.md +6 -0
  395. package/v3/assets/skills/regression-testing/evals/regression-testing.yaml +504 -0
  396. package/v3/assets/skills/regression-testing/schemas/output.json +311 -0
  397. package/v3/assets/skills/regression-testing/scripts/validate.sh +130 -0
  398. package/v3/assets/skills/risk-based-testing/SKILL.md +6 -0
  399. package/v3/assets/skills/risk-based-testing/evals/risk-based-testing.yaml +141 -0
  400. package/v3/assets/skills/risk-based-testing/schemas/output.json +480 -0
  401. package/v3/assets/skills/risk-based-testing/scripts/validate.sh +56 -0
  402. package/v3/assets/skills/security-testing/SKILL.md +5 -0
  403. package/v3/assets/skills/security-testing/evals/security-testing.yaml +789 -0
  404. package/v3/assets/skills/security-testing/schemas/output.json +879 -0
  405. package/v3/assets/skills/security-testing/scripts/validate.sh +967 -0
  406. package/v3/assets/skills/shift-left-testing/SKILL.md +6 -0
  407. package/v3/assets/skills/shift-left-testing/evals/shift-left-testing.yaml +145 -0
  408. package/v3/assets/skills/shift-left-testing/schemas/output.json +459 -0
  409. package/v3/assets/skills/shift-left-testing/scripts/validate.sh +56 -0
  410. package/v3/assets/skills/shift-right-testing/SKILL.md +6 -0
  411. package/v3/assets/skills/shift-right-testing/evals/shift-right-testing.yaml +147 -0
  412. package/v3/assets/skills/shift-right-testing/schemas/output.json +418 -0
  413. package/v3/assets/skills/shift-right-testing/scripts/validate.sh +56 -0
  414. package/v3/assets/skills/six-thinking-hats/SKILL.md +3 -0
  415. package/v3/assets/skills/tdd-london-chicago/SKILL.md +5 -0
  416. package/v3/assets/skills/tdd-london-chicago/schemas/output.json +444 -0
  417. package/v3/assets/skills/tdd-london-chicago/scripts/validate.sh +214 -0
  418. package/v3/assets/skills/technical-writing/SKILL.md +4 -0
  419. package/v3/assets/skills/technical-writing/schemas/output.json +268 -0
  420. package/v3/assets/skills/test-automation-strategy/SKILL.md +6 -0
  421. package/v3/assets/skills/test-automation-strategy/evals/test-automation-strategy.yaml +148 -0
  422. package/v3/assets/skills/test-automation-strategy/schemas/output.json +444 -0
  423. package/v3/assets/skills/test-automation-strategy/scripts/validate.sh +195 -0
  424. package/v3/assets/skills/test-data-management/SKILL.md +6 -0
  425. package/v3/assets/skills/test-data-management/evals/test-data-management.yaml +504 -0
  426. package/v3/assets/skills/test-data-management/schemas/output.json +284 -0
  427. package/v3/assets/skills/test-data-management/scripts/validate.sh +137 -0
  428. package/v3/assets/skills/test-design-techniques/SKILL.md +6 -0
  429. package/v3/assets/skills/test-design-techniques/evals/test-design-techniques.yaml +142 -0
  430. package/v3/assets/skills/test-design-techniques/schemas/output.json +295 -0
  431. package/v3/assets/skills/test-design-techniques/scripts/validate.sh +91 -0
  432. package/v3/assets/skills/test-environment-management/SKILL.md +4 -0
  433. package/v3/assets/skills/test-environment-management/schemas/output.json +310 -0
  434. package/v3/assets/skills/test-reporting-analytics/SKILL.md +6 -0
  435. package/v3/assets/skills/test-reporting-analytics/evals/test-reporting-analytics.yaml +155 -0
  436. package/v3/assets/skills/test-reporting-analytics/schemas/output.json +329 -0
  437. package/v3/assets/skills/test-reporting-analytics/scripts/validate.sh +77 -0
  438. package/v3/assets/skills/verification-quality/SKILL.md +6 -0
  439. package/v3/assets/skills/verification-quality/evals/verification-quality.yaml +150 -0
  440. package/v3/assets/skills/verification-quality/schemas/output.json +432 -0
  441. package/v3/assets/skills/verification-quality/scripts/validate.sh +77 -0
  442. package/v3/assets/skills/visual-testing-advanced/SKILL.md +6 -0
  443. package/v3/assets/skills/visual-testing-advanced/evals/visual-testing-advanced.yaml +154 -0
  444. package/v3/assets/skills/visual-testing-advanced/schemas/output.json +294 -0
  445. package/v3/assets/skills/visual-testing-advanced/scripts/validate.sh +77 -0
  446. package/v3/assets/skills/xp-practices/SKILL.md +3 -0
  447. package/v3/assets/templates/validation-report.md.hbs +139 -0
  448. package/v3/assets/templates/validation-summary.json +56 -0
  449. package/v3/dist/cli/bundle.js +7368 -3418
  450. package/v3/dist/cli/commands/eval.d.ts +18 -0
  451. package/v3/dist/cli/commands/eval.d.ts.map +1 -0
  452. package/v3/dist/cli/commands/eval.js +505 -0
  453. package/v3/dist/cli/commands/eval.js.map +1 -0
  454. package/v3/dist/cli/commands/validate-swarm.d.ts +16 -0
  455. package/v3/dist/cli/commands/validate-swarm.d.ts.map +1 -0
  456. package/v3/dist/cli/commands/validate-swarm.js +251 -0
  457. package/v3/dist/cli/commands/validate-swarm.js.map +1 -0
  458. package/v3/dist/cli/commands/validate.d.ts +14 -0
  459. package/v3/dist/cli/commands/validate.d.ts.map +1 -0
  460. package/v3/dist/cli/commands/validate.js +408 -0
  461. package/v3/dist/cli/commands/validate.js.map +1 -0
  462. package/v3/dist/cli/index.js +6 -0
  463. package/v3/dist/cli/index.js.map +1 -1
  464. package/v3/dist/index.d.ts +2 -0
  465. package/v3/dist/index.d.ts.map +1 -1
  466. package/v3/dist/index.js +10 -0
  467. package/v3/dist/index.js.map +1 -1
  468. package/v3/dist/init/skills-installer.d.ts +6 -0
  469. package/v3/dist/init/skills-installer.d.ts.map +1 -1
  470. package/v3/dist/init/skills-installer.js +48 -0
  471. package/v3/dist/init/skills-installer.js.map +1 -1
  472. package/v3/dist/learning/index.d.ts +2 -0
  473. package/v3/dist/learning/index.d.ts.map +1 -1
  474. package/v3/dist/learning/index.js +4 -0
  475. package/v3/dist/learning/index.js.map +1 -1
  476. package/v3/dist/learning/skill-validation-learner.d.ts +264 -0
  477. package/v3/dist/learning/skill-validation-learner.d.ts.map +1 -0
  478. package/v3/dist/learning/skill-validation-learner.js +515 -0
  479. package/v3/dist/learning/skill-validation-learner.js.map +1 -0
  480. package/v3/dist/validation/index.d.ts +19 -0
  481. package/v3/dist/validation/index.d.ts.map +1 -0
  482. package/v3/dist/validation/index.js +31 -0
  483. package/v3/dist/validation/index.js.map +1 -0
  484. package/v3/dist/validation/parallel-eval-runner.d.ts +307 -0
  485. package/v3/dist/validation/parallel-eval-runner.d.ts.map +1 -0
  486. package/v3/dist/validation/parallel-eval-runner.js +566 -0
  487. package/v3/dist/validation/parallel-eval-runner.js.map +1 -0
  488. package/v3/dist/validation/swarm-skill-validator.d.ts +282 -0
  489. package/v3/dist/validation/swarm-skill-validator.d.ts.map +1 -0
  490. package/v3/dist/validation/swarm-skill-validator.js +460 -0
  491. package/v3/dist/validation/swarm-skill-validator.js.map +1 -0
  492. package/v3/dist/validation/validation-result-aggregator.d.ts +232 -0
  493. package/v3/dist/validation/validation-result-aggregator.d.ts.map +1 -0
  494. package/v3/dist/validation/validation-result-aggregator.js +630 -0
  495. package/v3/dist/validation/validation-result-aggregator.js.map +1 -0
  496. package/v3/package.json +1 -1
@@ -0,0 +1,595 @@
1
+ # =============================================================================
2
+ # AQE Skill Evaluation Test Suite: QE Security Compliance v1.0.0
3
+ # =============================================================================
4
+ #
5
+ # Comprehensive evaluation suite for the qe-security-compliance skill.
6
+ # Tests SAST scanning, dependency vulnerability checking, compliance auditing,
7
+ # secret detection, and OWASP Top 10 validation.
8
+ #
9
+ # Schema: .claude/skills/.validation/schemas/skill-eval.schema.json
10
+ # Validator: .claude/skills/qe-security-compliance/scripts/validate.sh
11
+ #
12
+ # Coverage:
13
+ # - SAST scanning for code vulnerabilities
14
+ # - Dependency vulnerability analysis
15
+ # - OWASP Top 10 coverage
16
+ # - Compliance auditing (SOC2, GDPR, HIPAA, PCI-DSS)
17
+ # - Secret detection and prevention
18
+ #
19
+ # =============================================================================
20
+
21
+ skill: qe-security-compliance
22
+ version: 1.0.0
23
+ description: >
24
+ Comprehensive evaluation suite for the qe-security-compliance skill.
25
+ Tests SAST and DAST scanning, dependency vulnerability checking, OWASP
26
+ Top 10 validation, compliance auditing for multiple standards, and secret
27
+ detection across codebase and configuration.
28
+
29
+ # =============================================================================
30
+ # Multi-Model Configuration
31
+ # =============================================================================
32
+
33
+ models_to_test:
34
+ - claude-3.5-sonnet
35
+ - claude-3-haiku
36
+
37
+ # =============================================================================
38
+ # MCP Integration Configuration
39
+ # =============================================================================
40
+
41
+ mcp_integration:
42
+ enabled: true
43
+ namespace: skill-validation
44
+
45
+ query_patterns: true
46
+ track_outcomes: true
47
+ store_patterns: true
48
+ share_learning: true
49
+ update_quality_gate: true
50
+
51
+ target_agents:
52
+ - qe-learning-coordinator
53
+ - qe-queen-coordinator
54
+ - qe-security-auditor
55
+ - qe-security-scanner
56
+
57
+ # =============================================================================
58
+ # ReasoningBank Learning Configuration
59
+ # =============================================================================
60
+
61
+ learning:
62
+ store_success_patterns: true
63
+ store_failure_patterns: true
64
+ pattern_ttl_days: 90
65
+ min_confidence_to_store: 0.7
66
+ cross_model_comparison: true
67
+
68
+ # =============================================================================
69
+ # Result Format Configuration
70
+ # =============================================================================
71
+
72
+ result_format:
73
+ json_output: true
74
+ markdown_report: true
75
+ include_raw_output: false
76
+ include_timing: true
77
+ include_token_usage: true
78
+
79
+ # =============================================================================
80
+ # Environment Setup
81
+ # =============================================================================
82
+
83
+ setup:
84
+ required_tools:
85
+ - jq
86
+ environment_variables:
87
+ SECURITY_SCAN_LEVEL: "comprehensive"
88
+ OWASP_ENABLED: "true"
89
+ SECRET_DETECTION: "enabled"
90
+ fixtures: []
91
+
92
+ # =============================================================================
93
+ # TEST CASES
94
+ # =============================================================================
95
+
96
+ test_cases:
97
+ # ---------------------------------------------------------------------------
98
+ # CATEGORY: SAST Scanning
99
+ # ---------------------------------------------------------------------------
100
+
101
+ - id: tc001_sast_sql_injection_detection
102
+ description: "Detect SQL injection vulnerabilities in code"
103
+ category: sast
104
+ priority: critical
105
+
106
+ input:
107
+ prompt: |
108
+ Scan this code for SQL injection vulnerabilities:
109
+
110
+ ```javascript
111
+ app.get('/user/:id', (req, res) => {
112
+ const userId = req.params.id;
113
+ const query = `SELECT * FROM users WHERE id = ${userId}`;
114
+ db.query(query, (err, results) => {
115
+ res.json(results);
116
+ });
117
+ });
118
+ ```
119
+
120
+ VULNERABILITY:
121
+ - Type: SQL Injection
122
+ - Severity: CRITICAL
123
+ - CWE: CWE-89
124
+ - OWASP: A03:2021
125
+ - Fix: Use parameterized query
126
+
127
+ What are all the issues?
128
+ context:
129
+ scan_type: "sql_injection"
130
+ include_remediation: true
131
+
132
+ expected_output:
133
+ must_contain:
134
+ - "SQL injection"
135
+ - "parameterized"
136
+ - "CWE-89"
137
+ - "critical"
138
+ must_not_contain:
139
+ - "secure"
140
+ - "no vulnerability"
141
+ severity_classification: critical
142
+ finding_count:
143
+ min: 1
144
+
145
+ validation:
146
+ schema_check: true
147
+ keyword_match_threshold: 0.8
148
+ reasoning_quality_min: 0.75
149
+
150
+ - id: tc002_sast_xss_detection
151
+ description: "Detect cross-site scripting (XSS) vulnerabilities"
152
+ category: sast
153
+ priority: critical
154
+
155
+ input:
156
+ prompt: |
157
+ Scan for XSS vulnerabilities:
158
+
159
+ ```javascript
160
+ app.get('/profile', (req, res) => {
161
+ const name = req.query.name;
162
+ res.send(`<h1>Welcome, ${name}!</h1>`);
163
+ });
164
+ ```
165
+
166
+ VULNERABILITY:
167
+ - Type: Reflected XSS
168
+ - Severity: HIGH
169
+ - CWE: CWE-79
170
+ - Attack: name=<script>alert('xss')</script>
171
+ - Fix: Escape output or use textContent
172
+
173
+ Identify all issues and fixes.
174
+ context:
175
+ scan_type: "xss"
176
+ include_examples: true
177
+
178
+ expected_output:
179
+ must_contain:
180
+ - "XSS"
181
+ - "escape"
182
+ - "sanitize"
183
+ - "CWE-79"
184
+ severity_classification: critical
185
+
186
+ validation:
187
+ schema_check: true
188
+ keyword_match_threshold: 0.8
189
+
190
+ - id: tc003_sast_hardcoded_secrets
191
+ description: "Detect hardcoded credentials and secrets"
192
+ category: sast
193
+ priority: critical
194
+
195
+ input:
196
+ prompt: |
197
+ Scan for hardcoded secrets:
198
+
199
+ ```javascript
200
+ const API_KEY = 'sk-12345678901234567890';
201
+ const DB_PASSWORD = 'admin123';
202
+ const JWT_SECRET = 'my-secret-key-do-not-share';
203
+
204
+ const credentials = {
205
+ username: 'admin',
206
+ password: 'P@ssw0rd123'
207
+ };
208
+ ```
209
+
210
+ FINDINGS:
211
+ 1. API_KEY: Hardcoded - CRITICAL
212
+ 2. DB_PASSWORD: Hardcoded - CRITICAL
213
+ 3. JWT_SECRET: Hardcoded - CRITICAL
214
+ 4. Credentials object: Hardcoded password - CRITICAL
215
+
216
+ Fix: Move to environment variables, use vault
217
+ context:
218
+ scan_type: "secrets"
219
+ secret_patterns: "all"
220
+
221
+ expected_output:
222
+ must_contain:
223
+ - "secret"
224
+ - "hardcoded"
225
+ - "environment"
226
+ - "credentials"
227
+ must_not_contain:
228
+ - "ok"
229
+ - "no secrets"
230
+ severity_classification: critical
231
+
232
+ validation:
233
+ schema_check: true
234
+ keyword_match_threshold: 0.8
235
+ reasoning_quality_min: 0.75
236
+
237
+ # ---------------------------------------------------------------------------
238
+ # CATEGORY: Dependency Scanning
239
+ # ---------------------------------------------------------------------------
240
+
241
+ - id: tc004_dependency_vulnerability_check
242
+ description: "Detect known vulnerabilities in dependencies"
243
+ category: dependencies
244
+ priority: critical
245
+
246
+ input:
247
+ prompt: |
248
+ Scan dependencies for vulnerabilities:
249
+
250
+ package.json:
251
+ - lodash@4.17.15 (outdated)
252
+ - express@4.16.0 (vulnerable)
253
+ - moment@2.24.0 (has CVEs)
254
+ - axios@0.18.1 (vulnerable)
255
+
256
+ VULNERABLE PACKAGES:
257
+ 1. express@4.16.0: CVE-2018-16487 (HIGH)
258
+ 2. axios@0.18.1: CVE-2020-28168 (HIGH)
259
+ 3. lodash@4.17.15: CVE-2021-23337 (MEDIUM)
260
+ 4. moment@2.24.0: Regular Expression DoS (MEDIUM)
261
+
262
+ Action: Update to latest versions
263
+ context:
264
+ scan_scope: "package.json"
265
+ include_cves: true
266
+
267
+ expected_output:
268
+ must_contain:
269
+ - "vulnerable"
270
+ - "CVE"
271
+ - "dependency"
272
+ - "update"
273
+ must_not_contain:
274
+ - "no vulnerabilities"
275
+ - "all ok"
276
+ severity_classification: critical
277
+
278
+ validation:
279
+ schema_check: true
280
+ keyword_match_threshold: 0.8
281
+
282
+ - id: tc005_outdated_package_detection
283
+ description: "Identify outdated packages needing updates"
284
+ category: dependencies
285
+ priority: high
286
+
287
+ input:
288
+ prompt: |
289
+ Analyze package freshness:
290
+ - lodash@4.17.15 (current: 4.17.21) - 6 minor versions behind
291
+ - express@4.16.0 (current: 4.18.2) - 2 major versions behind
292
+ - jest@24.0.0 (current: 29.0.0) - 5 major versions behind
293
+
294
+ RECOMMENDATIONS:
295
+ 1. CRITICAL: Update express (major version)
296
+ 2. HIGH: Update jest (major version, breaking changes)
297
+ 3. MEDIUM: Update lodash (minor version, backward compatible)
298
+
299
+ How would you prioritize updates?
300
+ context:
301
+ package_analysis: true
302
+ prioritization: true
303
+
304
+ expected_output:
305
+ must_contain:
306
+ - "outdated"
307
+ - "update"
308
+ - "version"
309
+ - "prioritize"
310
+ finding_count:
311
+ min: 1
312
+
313
+ validation:
314
+ schema_check: true
315
+ keyword_match_threshold: 0.75
316
+
317
+ # ---------------------------------------------------------------------------
318
+ # CATEGORY: OWASP Top 10
319
+ # ---------------------------------------------------------------------------
320
+
321
+ - id: tc006_owasp_comprehensive_check
322
+ description: "Check code against full OWASP Top 10 2021"
323
+ category: owasp
324
+ priority: critical
325
+
326
+ input:
327
+ prompt: |
328
+ Scan code for OWASP Top 10 2021 compliance:
329
+
330
+ A01: Broken Access Control
331
+ - Check: Authorization on endpoints
332
+ - Status: FOUND - no authorization check on /admin
333
+
334
+ A02: Cryptographic Failures
335
+ - Check: Weak encryption, plaintext passwords
336
+ - Status: FOUND - passwords stored plaintext
337
+
338
+ A03: Injection (SQL, NoSQL, Command, XSS, LDAP)
339
+ - Check: SQL injection, XSS
340
+ - Status: FOUND - SQL injection vulnerability
341
+
342
+ A07: Authentication Failures
343
+ - Check: Weak passwords, session management
344
+ - Status: OK - using bcrypt and secure sessions
345
+
346
+ A06: Vulnerable Components
347
+ - Check: Known CVEs in dependencies
348
+ - Status: FOUND - 3 vulnerable packages
349
+
350
+ Other categories: OK
351
+
352
+ SUMMARY: 3 critical issues, 2 must fix immediately
353
+ context:
354
+ standard: "owasp-2021"
355
+ categories: "all"
356
+ include_status: true
357
+
358
+ expected_output:
359
+ must_contain:
360
+ - "OWASP"
361
+ - "A01"
362
+ - "A03"
363
+ - "critical"
364
+ - "vulnerability"
365
+ must_not_contain:
366
+ - "no issues"
367
+ - "compliant"
368
+ severity_classification: critical
369
+
370
+ validation:
371
+ schema_check: true
372
+ keyword_match_threshold: 0.8
373
+ reasoning_quality_min: 0.75
374
+
375
+ # ---------------------------------------------------------------------------
376
+ # CATEGORY: Compliance Auditing
377
+ # ---------------------------------------------------------------------------
378
+
379
+ - id: tc007_soc2_compliance_audit
380
+ description: "Audit code for SOC2 compliance"
381
+ category: compliance
382
+ priority: critical
383
+
384
+ input:
385
+ prompt: |
386
+ Audit SOC2 compliance requirements:
387
+
388
+ SECURITY:
389
+ - Access control: PARTIAL (missing admin endpoint protection)
390
+ - Encryption: OK (TLS in transit, AES at rest)
391
+ - Secret management: FAIL (hardcoded secrets)
392
+ - Monitoring: OK (logs captured)
393
+
394
+ AVAILABILITY:
395
+ - Error handling: OK
396
+ - Backup: OK
397
+ - Disaster recovery: PARTIAL (needs testing)
398
+
399
+ PROCESSING INTEGRITY:
400
+ - Input validation: FAIL (SQL injection found)
401
+ - Error handling: OK
402
+ - Audit logging: PARTIAL (some endpoints missing)
403
+
404
+ CONFIDENTIALITY:
405
+ - PII protection: FAIL (no encryption for user data)
406
+ - Access controls: PARTIAL
407
+
408
+ PRIVACY:
409
+ - Data retention: PARTIAL (no policy)
410
+ - User consent: OK
411
+
412
+ COMPLIANCE: 45% - FAIL (multiple critical gaps)
413
+ context:
414
+ standard: "SOC2"
415
+ categories: "all"
416
+ remediation: true
417
+
418
+ expected_output:
419
+ must_contain:
420
+ - "SOC2"
421
+ - "compliance"
422
+ - "fail"
423
+ - "gap"
424
+ - "remediation"
425
+ must_not_contain:
426
+ - "compliant"
427
+ - "pass"
428
+ severity_classification: critical
429
+
430
+ validation:
431
+ schema_check: true
432
+ keyword_match_threshold: 0.8
433
+
434
+ - id: tc008_gdpr_compliance_check
435
+ description: "Verify GDPR compliance for user data handling"
436
+ category: compliance
437
+ priority: critical
438
+
439
+ input:
440
+ prompt: |
441
+ Check GDPR compliance:
442
+
443
+ REQUIREMENTS:
444
+ 1. User consent documented: FAIL (no consent mechanism)
445
+ 2. Privacy policy: OK (published)
446
+ 3. Data retention policy: FAIL (no policy defined)
447
+ 4. Right to deletion: PARTIAL (can delete but full audit trail)
448
+ 5. Data portability: FAIL (no export functionality)
449
+ 6. Breach notification: PARTIAL (process exists, 30-day compliance ok)
450
+ 7. DPA in place: OK (processor agreements signed)
451
+ 8. Privacy by design: FAIL (not implemented)
452
+
453
+ COMPLIANCE: 38% - FAIL
454
+
455
+ What are the top 3 fixes?
456
+ context:
457
+ standard: "GDPR"
458
+ user_data_handling: true
459
+
460
+ expected_output:
461
+ must_contain:
462
+ - "GDPR"
463
+ - "compliance"
464
+ - "consent"
465
+ - "deletion"
466
+ - "fail"
467
+ severity_classification: critical
468
+
469
+ validation:
470
+ schema_check: true
471
+ keyword_match_threshold: 0.8
472
+
473
+ # ---------------------------------------------------------------------------
474
+ # CATEGORY: Security Gate
475
+ # ---------------------------------------------------------------------------
476
+
477
+ - id: tc009_security_gate_enforcement
478
+ description: "Enforce security gates in CI/CD pipeline"
479
+ category: gates
480
+ priority: critical
481
+
482
+ input:
483
+ prompt: |
484
+ Define security gates for merge:
485
+ 1. Critical vulnerabilities: 0 required
486
+ 2. High vulnerabilities: <= 2
487
+ 3. Known CVEs in dependencies: 0
488
+ 4. Hardcoded secrets: 0
489
+ 5. OWASP blocking issues: 0
490
+
491
+ SCAN RESULTS:
492
+ - Critical: 0 ✓
493
+ - High: 1 (express vulnerability) ✗ BLOCK
494
+ - CVEs: 3 ✗ BLOCK
495
+ - Secrets: 1 hardcoded API key ✗ BLOCK
496
+ - OWASP: 2 issues ✗ BLOCK
497
+
498
+ VERDICT: BLOCK MERGE - fail security gates
499
+
500
+ How would you help fix violations?
501
+ context:
502
+ blocking: true
503
+ remediation_guidance: true
504
+
505
+ expected_output:
506
+ must_contain:
507
+ - "security"
508
+ - "gate"
509
+ - "block"
510
+ - "merge"
511
+ must_not_contain:
512
+ - "approve"
513
+ - "pass"
514
+ severity_classification: critical
515
+
516
+ validation:
517
+ schema_check: true
518
+ keyword_match_threshold: 0.8
519
+
520
+ # ---------------------------------------------------------------------------
521
+ # CATEGORY: Negative Tests
522
+ # ---------------------------------------------------------------------------
523
+
524
+ - id: tc010_security_remediation_guidance
525
+ description: "Provide actionable remediation for security findings"
526
+ category: negative
527
+ priority: high
528
+
529
+ input:
530
+ prompt: |
531
+ For each security issue, provide remediation:
532
+
533
+ ISSUE 1: SQL Injection in getUserById()
534
+ REMEDIATION:
535
+ ```javascript
536
+ // BEFORE (vulnerable)
537
+ const query = `SELECT * FROM users WHERE id = ${userId}`;
538
+
539
+ // AFTER (safe)
540
+ const query = 'SELECT * FROM users WHERE id = ?';
541
+ db.query(query, [userId], callback);
542
+ ```
543
+
544
+ ISSUE 2: Hardcoded API Key
545
+ REMEDIATION:
546
+ // BEFORE
547
+ const API_KEY = 'sk-123456789';
548
+
549
+ // AFTER
550
+ const API_KEY = process.env.STRIPE_API_KEY;
551
+ // Set in .env or secrets manager
552
+
553
+ Generate clear fix for each issue found.
554
+ context:
555
+ issue_remediation: true
556
+ code_examples: true
557
+
558
+ expected_output:
559
+ must_contain:
560
+ - "remediation"
561
+ - "before"
562
+ - "after"
563
+ - "fix"
564
+ finding_count:
565
+ min: 1
566
+
567
+ validation:
568
+ schema_check: true
569
+ allow_partial: true
570
+
571
+ # =============================================================================
572
+ # SUCCESS CRITERIA
573
+ # =============================================================================
574
+
575
+ success_criteria:
576
+ pass_rate: 0.8
577
+ critical_pass_rate: 1.0
578
+ avg_reasoning_quality: 0.75
579
+ max_execution_time_ms: 300000
580
+ cross_model_variance: 0.15
581
+
582
+ # =============================================================================
583
+ # METADATA
584
+ # =============================================================================
585
+
586
+ metadata:
587
+ author: "qe-security-auditor"
588
+ created: "2026-02-02"
589
+ last_updated: "2026-02-02"
590
+ coverage_target: >
591
+ SAST scanning for SQL injection, XSS, hardcoded secrets, path traversal,
592
+ insecure crypto, dependency vulnerability analysis with CVE detection,
593
+ OWASP Top 10 2021 comprehensive checking, compliance auditing for SOC2/GDPR,
594
+ security gate enforcement with blocking criteria, and detailed remediation
595
+ guidance with code examples for all identified vulnerabilities.