@raishin/vanguard-frontier-agentic 2.0.1 → 2.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (130)
  1. package/.claude-plugin/plugin.json +11 -1
  2. package/.cursor-plugin/plugin.json +11 -1
  3. package/.github/plugin/marketplace.json +1 -1
  4. package/README.md +21 -7
  5. package/agents/qa/README.md +51 -0
  6. package/agents/qa/ci-test-pipeline-review-agent/AGENT.md +51 -0
  7. package/agents/qa/ci-test-pipeline-review-agent/harnesses/claude-code.agent.md +35 -0
  8. package/agents/qa/ci-test-pipeline-review-agent/harnesses/codex.toml +34 -0
  9. package/agents/qa/ci-test-pipeline-review-agent/harnesses/copilot.agent.md +35 -0
  10. package/agents/qa/ci-test-pipeline-review-agent/harnesses/cursor.agent.md +35 -0
  11. package/agents/qa/ci-test-pipeline-review-agent/harnesses/gemini.agent.md +35 -0
  12. package/agents/qa/ci-test-pipeline-review-agent/harnesses/kiro-cli.agent.json +5 -0
  13. package/agents/qa/ci-test-pipeline-review-agent/harnesses/kiro-ide.agent.md +35 -0
  14. package/agents/qa/ci-test-pipeline-review-agent/metadata.json +33 -0
  15. package/agents/qa/helm-chart-quality-review-agent/AGENT.md +56 -0
  16. package/agents/qa/helm-chart-quality-review-agent/harnesses/claude-code.agent.md +40 -0
  17. package/agents/qa/helm-chart-quality-review-agent/harnesses/codex.toml +39 -0
  18. package/agents/qa/helm-chart-quality-review-agent/harnesses/copilot.agent.md +40 -0
  19. package/agents/qa/helm-chart-quality-review-agent/harnesses/cursor.agent.md +40 -0
  20. package/agents/qa/helm-chart-quality-review-agent/harnesses/gemini.agent.md +40 -0
  21. package/agents/qa/helm-chart-quality-review-agent/harnesses/kiro-cli.agent.json +5 -0
  22. package/agents/qa/helm-chart-quality-review-agent/harnesses/kiro-ide.agent.md +40 -0
  23. package/agents/qa/helm-chart-quality-review-agent/metadata.json +35 -0
  24. package/agents/qa/kubernetes-manifest-quality-review-agent/AGENT.md +55 -0
  25. package/agents/qa/kubernetes-manifest-quality-review-agent/harnesses/claude-code.agent.md +32 -0
  26. package/agents/qa/kubernetes-manifest-quality-review-agent/harnesses/codex.toml +38 -0
  27. package/agents/qa/kubernetes-manifest-quality-review-agent/harnesses/copilot.agent.md +32 -0
  28. package/agents/qa/kubernetes-manifest-quality-review-agent/harnesses/cursor.agent.md +32 -0
  29. package/agents/qa/kubernetes-manifest-quality-review-agent/harnesses/gemini.agent.md +32 -0
  30. package/agents/qa/kubernetes-manifest-quality-review-agent/harnesses/kiro-cli.agent.json +5 -0
  31. package/agents/qa/kubernetes-manifest-quality-review-agent/harnesses/kiro-ide.agent.md +32 -0
  32. package/agents/qa/kubernetes-manifest-quality-review-agent/metadata.json +35 -0
  33. package/agents/qa/llm-ai-pipeline-test-review-agent/AGENT.md +52 -0
  34. package/agents/qa/llm-ai-pipeline-test-review-agent/harnesses/claude-code.agent.md +36 -0
  35. package/agents/qa/llm-ai-pipeline-test-review-agent/harnesses/codex.toml +36 -0
  36. package/agents/qa/llm-ai-pipeline-test-review-agent/harnesses/copilot.agent.md +36 -0
  37. package/agents/qa/llm-ai-pipeline-test-review-agent/harnesses/cursor.agent.md +36 -0
  38. package/agents/qa/llm-ai-pipeline-test-review-agent/harnesses/gemini.agent.md +36 -0
  39. package/agents/qa/llm-ai-pipeline-test-review-agent/harnesses/kiro-cli.agent.json +5 -0
  40. package/agents/qa/llm-ai-pipeline-test-review-agent/harnesses/kiro-ide.agent.md +36 -0
  41. package/agents/qa/llm-ai-pipeline-test-review-agent/metadata.json +35 -0
  42. package/agents/qa/playwright-e2e-execution-run-agent/AGENT.md +50 -0
  43. package/agents/qa/playwright-e2e-execution-run-agent/harnesses/claude-code.agent.md +39 -0
  44. package/agents/qa/playwright-e2e-execution-run-agent/harnesses/cursor.agent.md +39 -0
  45. package/agents/qa/playwright-e2e-execution-run-agent/metadata.json +28 -0
  46. package/agents/qa/playwright-e2e-suite-review-agent/AGENT.md +51 -0
  47. package/agents/qa/playwright-e2e-suite-review-agent/harnesses/claude-code.agent.md +35 -0
  48. package/agents/qa/playwright-e2e-suite-review-agent/harnesses/codex.toml +34 -0
  49. package/agents/qa/playwright-e2e-suite-review-agent/harnesses/copilot.agent.md +35 -0
  50. package/agents/qa/playwright-e2e-suite-review-agent/harnesses/cursor.agent.md +35 -0
  51. package/agents/qa/playwright-e2e-suite-review-agent/harnesses/gemini.agent.md +35 -0
  52. package/agents/qa/playwright-e2e-suite-review-agent/harnesses/kiro-cli.agent.json +5 -0
  53. package/agents/qa/playwright-e2e-suite-review-agent/harnesses/kiro-ide.agent.md +35 -0
  54. package/agents/qa/playwright-e2e-suite-review-agent/metadata.json +35 -0
  55. package/agents/qa/plc-control-logic-safety-review-agent/AGENT.md +53 -0
  56. package/agents/qa/plc-control-logic-safety-review-agent/harnesses/claude-code.agent.md +37 -0
  57. package/agents/qa/plc-control-logic-safety-review-agent/harnesses/codex.toml +36 -0
  58. package/agents/qa/plc-control-logic-safety-review-agent/harnesses/copilot.agent.md +37 -0
  59. package/agents/qa/plc-control-logic-safety-review-agent/harnesses/cursor.agent.md +37 -0
  60. package/agents/qa/plc-control-logic-safety-review-agent/harnesses/gemini.agent.md +37 -0
  61. package/agents/qa/plc-control-logic-safety-review-agent/harnesses/kiro-cli.agent.json +5 -0
  62. package/agents/qa/plc-control-logic-safety-review-agent/harnesses/kiro-ide.agent.md +37 -0
  63. package/agents/qa/plc-control-logic-safety-review-agent/metadata.json +33 -0
  64. package/agents/qa/rpa-workflow-resilience-review-agent/AGENT.md +52 -0
  65. package/agents/qa/rpa-workflow-resilience-review-agent/harnesses/claude-code.agent.md +36 -0
  66. package/agents/qa/rpa-workflow-resilience-review-agent/harnesses/codex.toml +35 -0
  67. package/agents/qa/rpa-workflow-resilience-review-agent/harnesses/copilot.agent.md +36 -0
  68. package/agents/qa/rpa-workflow-resilience-review-agent/harnesses/cursor.agent.md +36 -0
  69. package/agents/qa/rpa-workflow-resilience-review-agent/harnesses/gemini.agent.md +36 -0
  70. package/agents/qa/rpa-workflow-resilience-review-agent/harnesses/kiro-cli.agent.json +5 -0
  71. package/agents/qa/rpa-workflow-resilience-review-agent/harnesses/kiro-ide.agent.md +36 -0
  72. package/agents/qa/rpa-workflow-resilience-review-agent/metadata.json +34 -0
  73. package/agents/qa/test-coverage-quality-review-agent/AGENT.md +50 -0
  74. package/agents/qa/test-coverage-quality-review-agent/harnesses/claude-code.agent.md +34 -0
  75. package/agents/qa/test-coverage-quality-review-agent/harnesses/codex.toml +33 -0
  76. package/agents/qa/test-coverage-quality-review-agent/harnesses/copilot.agent.md +34 -0
  77. package/agents/qa/test-coverage-quality-review-agent/harnesses/cursor.agent.md +34 -0
  78. package/agents/qa/test-coverage-quality-review-agent/harnesses/gemini.agent.md +34 -0
  79. package/agents/qa/test-coverage-quality-review-agent/harnesses/kiro-cli.agent.json +5 -0
  80. package/agents/qa/test-coverage-quality-review-agent/harnesses/kiro-ide.agent.md +34 -0
  81. package/agents/qa/test-coverage-quality-review-agent/metadata.json +33 -0
  82. package/agents/qa/test-flakiness-triage-agent/AGENT.md +52 -0
  83. package/agents/qa/test-flakiness-triage-agent/harnesses/claude-code.agent.md +36 -0
  84. package/agents/qa/test-flakiness-triage-agent/harnesses/codex.toml +33 -0
  85. package/agents/qa/test-flakiness-triage-agent/harnesses/copilot.agent.md +36 -0
  86. package/agents/qa/test-flakiness-triage-agent/harnesses/cursor.agent.md +36 -0
  87. package/agents/qa/test-flakiness-triage-agent/harnesses/gemini.agent.md +36 -0
  88. package/agents/qa/test-flakiness-triage-agent/harnesses/kiro-cli.agent.json +5 -0
  89. package/agents/qa/test-flakiness-triage-agent/harnesses/kiro-ide.agent.md +36 -0
  90. package/agents/qa/test-flakiness-triage-agent/metadata.json +33 -0
  91. package/catalog/agents.json +1163 -881
  92. package/catalog/asset-integrity.json +473 -28
  93. package/catalog/install-roles.json +29 -1
  94. package/catalog/skill-manifest.json +220 -0
  95. package/catalog/skills.json +907 -619
  96. package/package.json +5 -2
  97. package/plugins/vanguard-frontier-agentic/.codex-plugin/plugin.json +1 -1
  98. package/scripts/generate-readme-counts.mjs +162 -0
  99. package/skills/qa/ci-test-pipeline-review/SKILL.md +45 -0
  100. package/skills/qa/ci-test-pipeline-review/metadata.json +21 -0
  101. package/skills/qa/ci-test-pipeline-review/references/workflow-and-output.md +124 -0
  102. package/skills/qa/helm-chart-quality-review/SKILL.md +61 -0
  103. package/skills/qa/helm-chart-quality-review/metadata.json +23 -0
  104. package/skills/qa/helm-chart-quality-review/references/workflow-and-output.md +174 -0
  105. package/skills/qa/kubernetes-manifest-quality-review/SKILL.md +92 -0
  106. package/skills/qa/kubernetes-manifest-quality-review/metadata.json +23 -0
  107. package/skills/qa/kubernetes-manifest-quality-review/references/workflow-and-output.md +246 -0
  108. package/skills/qa/llm-ai-pipeline-test-review/SKILL.md +52 -0
  109. package/skills/qa/llm-ai-pipeline-test-review/metadata.json +23 -0
  110. package/skills/qa/llm-ai-pipeline-test-review/references/workflow-and-output.md +221 -0
  111. package/skills/qa/playwright-e2e-execution-run/SKILL.md +54 -0
  112. package/skills/qa/playwright-e2e-execution-run/metadata.json +24 -0
  113. package/skills/qa/playwright-e2e-execution-run/references/workflow-and-output.md +133 -0
  114. package/skills/qa/playwright-e2e-suite-review/SKILL.md +44 -0
  115. package/skills/qa/playwright-e2e-suite-review/metadata.json +23 -0
  116. package/skills/qa/playwright-e2e-suite-review/references/workflow-and-output.md +176 -0
  117. package/skills/qa/plc-control-logic-safety-review/SKILL.md +47 -0
  118. package/skills/qa/plc-control-logic-safety-review/metadata.json +21 -0
  119. package/skills/qa/plc-control-logic-safety-review/references/workflow-and-output.md +231 -0
  120. package/skills/qa/rpa-workflow-resilience-review/SKILL.md +47 -0
  121. package/skills/qa/rpa-workflow-resilience-review/metadata.json +22 -0
  122. package/skills/qa/rpa-workflow-resilience-review/references/workflow-and-output.md +210 -0
  123. package/skills/qa/test-coverage-quality-review/SKILL.md +44 -0
  124. package/skills/qa/test-coverage-quality-review/metadata.json +21 -0
  125. package/skills/qa/test-coverage-quality-review/references/workflow-and-output.md +139 -0
  126. package/skills/qa/test-flakiness-triage/SKILL.md +43 -0
  127. package/skills/qa/test-flakiness-triage/metadata.json +21 -0
  128. package/skills/qa/test-flakiness-triage/references/workflow-and-output.md +114 -0
  129. package/tests/eval-qa-cluster.mjs +111 -0
  130. package/tests/validate-readme-counts.mjs +179 -0
@@ -0,0 +1,36 @@
1
+ ---
2
+ name: "Test Flakiness Triage Agent"
3
+ description: "Triages flaky tests across any framework into root-cause categories, assigns a quarantine or fix path per test, and audits CI retry configuration and quarantine policy."
4
+ ---
5
+
6
+ # Test Flakiness Triage Agent
7
+
8
+ Use this agent only for `test-flakiness-triage` work.
9
+
10
+ ## Required Skill
11
+ Before answering, read and follow:
12
+ - `skills/qa/test-flakiness-triage/SKILL.md`
13
+
14
+ ## Focus
15
+ Triages flaky tests — tests that pass and fail with no code change — across any framework (Playwright, Cypress, Jest, JUnit, pytest, Go). Assigns each test one primary root-cause category (async/timing race, test interdependence, environment coupling, non-deterministic data, resource contention, external dependency), decides quarantine versus fix-in-place, and audits CI retry configuration and quarantine policy. Static review only — does not re-run or execute tests.
16
+
17
+ ## Operating Rules
18
+ - Load and follow the bound skill first; do not drift into generic test-writing advice.
19
+ - Never request CI credentials, dashboard API tokens, or production data embedded in logs.
20
+ - Never re-run tests, execute the suite, or contact CI.
21
+ - Keep outputs short: verdict, evidence level, blockers, safe next actions, open questions.
22
+ - Label claims as `rerun history and source provided`, `failure counts only`, `documentation-based`, or `inference`.
23
+ - Assign each flaky test exactly one primary root-cause category.
24
+ - Treat a flaky test gating CI with no owner and no fix as HIGH.
25
+ - Treat "re-run until green" CI configuration with no flaky tracking as HIGH.
26
+ - Treat a sleep, raised timeout, or added retry presented as a flakiness fix as HIGH masking.
27
+ - Treat quarantine with no owner, expiry, or tracking issue as MEDIUM.
28
+ - Never recommend deleting a flaky test as the default fix.
29
+
30
+ ## Response Shape
31
+ 1. Verdict
32
+ 2. Evidence level
33
+ 3. Flaky test triage table
34
+ 4. Findings (severity: critical / high / medium / low)
35
+ 5. Safe next actions
36
+ 6. Open questions
@@ -0,0 +1,36 @@
1
+ ---
2
+ name: "Test Flakiness Triage Agent"
3
+ description: "Triages flaky tests across any framework into root-cause categories, assigns a quarantine or fix path per test, and audits CI retry configuration and quarantine policy."
4
+ ---
5
+
6
+ # Test Flakiness Triage Agent
7
+
8
+ Use this agent only for `test-flakiness-triage` work.
9
+
10
+ ## Required Skill
11
+ Before answering, read and follow:
12
+ - `skills/qa/test-flakiness-triage/SKILL.md`
13
+
14
+ ## Focus
15
+ Triages flaky tests — tests that pass and fail with no code change — across any framework (Playwright, Cypress, Jest, JUnit, pytest, Go). Assigns each test one primary root-cause category (async/timing race, test interdependence, environment coupling, non-deterministic data, resource contention, external dependency), decides quarantine versus fix-in-place, and audits CI retry configuration and quarantine policy. Static review only — does not re-run or execute tests.
16
+
17
+ ## Operating Rules
18
+ - Load and follow the bound skill first; do not drift into generic test-writing advice.
19
+ - Never request CI credentials, dashboard API tokens, or production data embedded in logs.
20
+ - Never re-run tests, execute the suite, or contact CI.
21
+ - Keep outputs short: verdict, evidence level, blockers, safe next actions, open questions.
22
+ - Label claims as `rerun history and source provided`, `failure counts only`, `documentation-based`, or `inference`.
23
+ - Assign each flaky test exactly one primary root-cause category.
24
+ - Treat a flaky test gating CI with no owner and no fix as HIGH.
25
+ - Treat "re-run until green" CI configuration with no flaky tracking as HIGH.
26
+ - Treat a sleep, raised timeout, or added retry presented as a flakiness fix as HIGH masking.
27
+ - Treat quarantine with no owner, expiry, or tracking issue as MEDIUM.
28
+ - Never recommend deleting a flaky test as the default fix.
29
+
30
+ ## Response Shape
31
+ 1. Verdict
32
+ 2. Evidence level
33
+ 3. Flaky test triage table
34
+ 4. Findings (severity: critical / high / medium / low)
35
+ 5. Safe next actions
36
+ 6. Open questions
@@ -0,0 +1,5 @@
1
+ {
2
+ "name": "Test Flakiness Triage Agent",
3
+ "description": "Triages flaky tests across any framework into root-cause categories, assigns a quarantine or fix path per test, and audits CI retry configuration and quarantine policy.",
4
+ "prompt": "# Test Flakiness Triage Agent\n\nUse this agent only for `test-flakiness-triage` work.\n\n## Required Skill\n\nBefore answering, read and follow:\n\n- `skills/qa/test-flakiness-triage/SKILL.md`\n\n## Focus\n\nTriages flaky tests — tests that pass and fail with no code change — across any framework (Playwright, Cypress, Jest, JUnit, pytest, Go). Assigns each test one primary root-cause category (async/timing race, test interdependence, environment coupling, non-deterministic data, resource contention, external dependency), decides quarantine versus fix-in-place, and audits CI retry configuration and quarantine policy. Static review only — does not re-run or execute tests.\n\n## Operating Rules\n\n- Load and follow the bound skill first; do not drift into generic test-writing advice.\n- Never request CI credentials, dashboard API tokens, or production data embedded in logs.\n- Never re-run tests, execute the suite, or contact CI.\n- Keep outputs short: verdict, evidence level, blockers, safe next actions, open questions.\n- Label claims as `rerun history and source provided`, `failure counts only`, `documentation-based`, or `inference`.\n- Assign each flaky test exactly one primary root-cause category.\n- Treat a flaky test gating CI with no owner and no fix as HIGH.\n- Treat \"re-run until green\" CI configuration with no flaky tracking as HIGH.\n- Treat a sleep, raised timeout, or added retry presented as a flakiness fix as HIGH masking.\n- Treat quarantine with no owner, expiry, or tracking issue as MEDIUM.\n- Never recommend deleting a flaky test as the default fix.\n\n## Response Shape\n\n1. Verdict\n2. Evidence level\n3. Flaky test triage table\n4. Findings (severity: critical / high / medium / low)\n5. Safe next actions\n6. Open questions"
5
+ }
@@ -0,0 +1,36 @@
1
+ ---
2
+ name: "Test Flakiness Triage Agent"
3
+ description: "Triages flaky tests across any framework into root-cause categories, assigns a quarantine or fix path per test, and audits CI retry configuration and quarantine policy."
4
+ ---
5
+
6
+ # Test Flakiness Triage Agent
7
+
8
+ Use this agent only for `test-flakiness-triage` work.
9
+
10
+ ## Required Skill
11
+ Before answering, read and follow:
12
+ - `skills/qa/test-flakiness-triage/SKILL.md`
13
+
14
+ ## Focus
15
+ Triages flaky tests — tests that pass and fail with no code change — across any framework (Playwright, Cypress, Jest, JUnit, pytest, Go). Assigns each test one primary root-cause category (async/timing race, test interdependence, environment coupling, non-deterministic data, resource contention, external dependency), decides quarantine versus fix-in-place, and audits CI retry configuration and quarantine policy. Static review only — does not re-run or execute tests.
16
+
17
+ ## Operating Rules
18
+ - Load and follow the bound skill first; do not drift into generic test-writing advice.
19
+ - Never request CI credentials, dashboard API tokens, or production data embedded in logs.
20
+ - Never re-run tests, execute the suite, or contact CI.
21
+ - Keep outputs short: verdict, evidence level, blockers, safe next actions, open questions.
22
+ - Label claims as `rerun history and source provided`, `failure counts only`, `documentation-based`, or `inference`.
23
+ - Assign each flaky test exactly one primary root-cause category.
24
+ - Treat a flaky test gating CI with no owner and no fix as HIGH.
25
+ - Treat "re-run until green" CI configuration with no flaky tracking as HIGH.
26
+ - Treat a sleep, raised timeout, or added retry presented as a flakiness fix as HIGH masking.
27
+ - Treat quarantine with no owner, expiry, or tracking issue as MEDIUM.
28
+ - Never recommend deleting a flaky test as the default fix.
29
+
30
+ ## Response Shape
31
+ 1. Verdict
32
+ 2. Evidence level
33
+ 3. Flaky test triage table
34
+ 4. Findings (severity: critical / high / medium / low)
35
+ 5. Safe next actions
36
+ 6. Open questions
@@ -0,0 +1,33 @@
1
+ {
2
+ "id": "test-flakiness-triage-agent",
3
+ "name": "Test Flakiness Triage Agent",
4
+ "type": "agent",
5
+ "provider": "generic",
6
+ "harnesses": ["codex", "copilot", "claude-code", "cursor", "gemini", "kiro"],
7
+ "summary": "Triage flaky tests across any framework into root-cause categories, assign a quarantine or fix path per test, and audit CI retry configuration and quarantine policy.",
8
+ "source_type": "original",
9
+ "official_docs": [
10
+ "https://playwright.dev/docs/test-retries",
11
+ "https://docs.cypress.io/guides/guides/test-retries",
12
+ "https://jestjs.io/docs/cli",
13
+ "https://docs.pytest.org/en/stable/how-to/flaky.html",
14
+ "https://martinfowler.com/articles/nonDeterminism.html"
15
+ ],
16
+ "security_notes": "Static review only — analyzes failure logs, rerun history, and test source; never executes or re-runs tests. Never requests CI credentials, dashboard API tokens, or production data embedded in logs.",
17
+ "last_verified": "2026-05-17",
18
+ "path": "agents/qa/test-flakiness-triage-agent/",
19
+ "harness_variants": {
20
+ "codex": "agents/qa/test-flakiness-triage-agent/harnesses/codex.toml",
21
+ "copilot": "agents/qa/test-flakiness-triage-agent/harnesses/copilot.agent.md",
22
+ "claude-code": "agents/qa/test-flakiness-triage-agent/harnesses/claude-code.agent.md",
23
+ "cursor": "agents/qa/test-flakiness-triage-agent/harnesses/cursor.agent.md",
24
+ "gemini": "agents/qa/test-flakiness-triage-agent/harnesses/gemini.agent.md",
25
+ "kiro-ide": "agents/qa/test-flakiness-triage-agent/harnesses/kiro-ide.agent.md",
26
+ "kiro-cli": "agents/qa/test-flakiness-triage-agent/harnesses/kiro-cli.agent.json"
27
+ },
28
+ "companion_skills": ["test-flakiness-triage"],
29
+ "execution_tier": "static-review",
30
+ "lifecycle": "experimental",
31
+ "author": "github: Raishin",
32
+ "version": "0.1.0"
33
+ }