@jterrats/open-orchestra 0.1.0 → 0.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (187)
  1. package/CHANGELOG.md +53 -0
  2. package/README.md +17 -2
  3. package/dist/assets/web-console.js +743 -0
  4. package/dist/cli.js +157 -4
  5. package/dist/cli.js.map +1 -1
  6. package/dist/collaboration-flows.d.ts +5 -0
  7. package/dist/collaboration-flows.js +256 -0
  8. package/dist/collaboration-flows.js.map +1 -0
  9. package/dist/command-manifest.d.ts +11 -0
  10. package/dist/command-manifest.js +52 -0
  11. package/dist/command-manifest.js.map +1 -0
  12. package/dist/commands.d.ts +31 -0
  13. package/dist/commands.js +644 -2
  14. package/dist/commands.js.map +1 -1
  15. package/dist/constants.d.ts +4 -0
  16. package/dist/constants.js +22 -0
  17. package/dist/constants.js.map +1 -1
  18. package/dist/defaults.d.ts +7 -11
  19. package/dist/defaults.js +7 -625
  20. package/dist/defaults.js.map +1 -1
  21. package/dist/delegation-decision.d.ts +14 -0
  22. package/dist/delegation-decision.js +391 -0
  23. package/dist/delegation-decision.js.map +1 -0
  24. package/dist/detect-commands.d.ts +3 -0
  25. package/dist/detect-commands.js +28 -0
  26. package/dist/detect-commands.js.map +1 -0
  27. package/dist/diagram-validation.d.ts +36 -0
  28. package/dist/diagram-validation.js +118 -0
  29. package/dist/diagram-validation.js.map +1 -0
  30. package/dist/fs-utils.d.ts +2 -0
  31. package/dist/fs-utils.js +75 -6
  32. package/dist/fs-utils.js.map +1 -1
  33. package/dist/health-checks.d.ts +28 -0
  34. package/dist/health-checks.js +219 -0
  35. package/dist/health-checks.js.map +1 -0
  36. package/dist/health-commands.d.ts +2 -0
  37. package/dist/health-commands.js +18 -0
  38. package/dist/health-commands.js.map +1 -0
  39. package/dist/instruction-apply.d.ts +34 -0
  40. package/dist/instruction-apply.js +150 -0
  41. package/dist/instruction-apply.js.map +1 -0
  42. package/dist/instruction-blocks.d.ts +22 -0
  43. package/dist/instruction-blocks.js +120 -0
  44. package/dist/instruction-blocks.js.map +1 -0
  45. package/dist/instruction-imports.d.ts +12 -0
  46. package/dist/instruction-imports.js +45 -0
  47. package/dist/instruction-imports.js.map +1 -0
  48. package/dist/instruction-stale.d.ts +9 -0
  49. package/dist/instruction-stale.js +106 -0
  50. package/dist/instruction-stale.js.map +1 -0
  51. package/dist/instruction-types.d.ts +66 -0
  52. package/dist/instruction-types.js +2 -0
  53. package/dist/instruction-types.js.map +1 -0
  54. package/dist/instruction-updates.d.ts +4 -0
  55. package/dist/instruction-updates.js +5 -0
  56. package/dist/instruction-updates.js.map +1 -0
  57. package/dist/knowledge-base.d.ts +10 -0
  58. package/dist/knowledge-base.js +117 -0
  59. package/dist/knowledge-base.js.map +1 -0
  60. package/dist/mcp-oauth-proxy.d.ts +39 -0
  61. package/dist/mcp-oauth-proxy.js +80 -0
  62. package/dist/mcp-oauth-proxy.js.map +1 -0
  63. package/dist/pr-review.d.ts +20 -0
  64. package/dist/pr-review.js +142 -0
  65. package/dist/pr-review.js.map +1 -0
  66. package/dist/project-detection.d.ts +22 -0
  67. package/dist/project-detection.js +174 -0
  68. package/dist/project-detection.js.map +1 -0
  69. package/dist/prompt-registry.d.ts +56 -0
  70. package/dist/prompt-registry.js +163 -0
  71. package/dist/prompt-registry.js.map +1 -0
  72. package/dist/release-candidate.d.ts +41 -0
  73. package/dist/release-candidate.js +196 -0
  74. package/dist/release-candidate.js.map +1 -0
  75. package/dist/release-commands.d.ts +4 -0
  76. package/dist/release-commands.js +50 -0
  77. package/dist/release-commands.js.map +1 -0
  78. package/dist/roles/ai-support-roles.d.ts +11 -0
  79. package/dist/roles/ai-support-roles.js +67 -0
  80. package/dist/roles/ai-support-roles.js.map +1 -0
  81. package/dist/roles/core-roles.d.ts +11 -0
  82. package/dist/roles/core-roles.js +144 -0
  83. package/dist/roles/core-roles.js.map +1 -0
  84. package/dist/roles/engineering-roles.d.ts +11 -0
  85. package/dist/roles/engineering-roles.js +176 -0
  86. package/dist/roles/engineering-roles.js.map +1 -0
  87. package/dist/roles/governance-roles.d.ts +11 -0
  88. package/dist/roles/governance-roles.js +117 -0
  89. package/dist/roles/governance-roles.js.map +1 -0
  90. package/dist/roles/index.d.ts +11 -0
  91. package/dist/roles/index.js +17 -0
  92. package/dist/roles/index.js.map +1 -0
  93. package/dist/roles/platform-ops-roles.d.ts +11 -0
  94. package/dist/roles/platform-ops-roles.js +158 -0
  95. package/dist/roles/platform-ops-roles.js.map +1 -0
  96. package/dist/roles/qa-ux-roles.d.ts +11 -0
  97. package/dist/roles/qa-ux-roles.js +193 -0
  98. package/dist/roles/qa-ux-roles.js.map +1 -0
  99. package/dist/roles/release-ops-roles.d.ts +11 -0
  100. package/dist/roles/release-ops-roles.js +109 -0
  101. package/dist/roles/release-ops-roles.js.map +1 -0
  102. package/dist/runtime-adapters.d.ts +6 -0
  103. package/dist/runtime-adapters.js +88 -0
  104. package/dist/runtime-adapters.js.map +1 -0
  105. package/dist/runtime-bootstrap.d.ts +12 -0
  106. package/dist/runtime-bootstrap.js +85 -0
  107. package/dist/runtime-bootstrap.js.map +1 -0
  108. package/dist/skills.d.ts +36 -0
  109. package/dist/skills.js +665 -0
  110. package/dist/skills.js.map +1 -0
  111. package/dist/subagent-protocol.d.ts +41 -0
  112. package/dist/subagent-protocol.js +179 -0
  113. package/dist/subagent-protocol.js.map +1 -0
  114. package/dist/telemetry-consent.d.ts +24 -0
  115. package/dist/telemetry-consent.js +95 -0
  116. package/dist/telemetry-consent.js.map +1 -0
  117. package/dist/telemetry-export.d.ts +14 -0
  118. package/dist/telemetry-export.js +126 -0
  119. package/dist/telemetry-export.js.map +1 -0
  120. package/dist/telemetry-records.d.ts +3 -0
  121. package/dist/telemetry-records.js +96 -0
  122. package/dist/telemetry-records.js.map +1 -0
  123. package/dist/telemetry-redaction.d.ts +9 -0
  124. package/dist/telemetry-redaction.js +55 -0
  125. package/dist/telemetry-redaction.js.map +1 -0
  126. package/dist/telemetry-types.d.ts +52 -0
  127. package/dist/telemetry-types.js +2 -0
  128. package/dist/telemetry-types.js.map +1 -0
  129. package/dist/telemetry.d.ts +4 -0
  130. package/dist/telemetry.js +4 -0
  131. package/dist/telemetry.js.map +1 -0
  132. package/dist/types.d.ts +176 -1
  133. package/dist/validation.d.ts +3 -1
  134. package/dist/validation.js +28 -5
  135. package/dist/validation.js.map +1 -1
  136. package/dist/web-api.js +167 -3
  137. package/dist/web-api.js.map +1 -1
  138. package/dist/web-console.js +6 -160
  139. package/dist/web-console.js.map +1 -1
  140. package/dist/workflow-gates.js +4 -2
  141. package/dist/workflow-gates.js.map +1 -1
  142. package/dist/workflow-services.js +125 -67
  143. package/dist/workflow-services.js.map +1 -1
  144. package/dist/workflow-templates.d.ts +10 -0
  145. package/dist/workflow-templates.js +141 -0
  146. package/dist/workflow-templates.js.map +1 -0
  147. package/dist/workspace-classification.d.ts +5 -0
  148. package/dist/workspace-classification.js +127 -0
  149. package/dist/workspace-classification.js.map +1 -0
  150. package/dist/workspace-validator.js +11 -1
  151. package/dist/workspace-validator.js.map +1 -1
  152. package/dist/workspace.d.ts +8 -4
  153. package/dist/workspace.js +111 -4
  154. package/dist/workspace.js.map +1 -1
  155. package/docs/dev-team-specialist-role-profiles.md +171 -0
  156. package/docs/mcp-oauth-proxy-evaluation.md +44 -0
  157. package/docs/multi-agent-orchestrator-backlog.md +413 -1
  158. package/docs/open-orchestra-dogfooding-findings.md +66 -0
  159. package/docs/orchestra-mvp.md +46 -1
  160. package/docs/runtime-adapters.md +86 -0
  161. package/docs/runtime-llm-flow.md +124 -0
  162. package/docs/setup-agents-dogfooding-findings.md +101 -0
  163. package/docs/skill-loading-strategy.md +114 -0
  164. package/docs/source-of-truth-and-agent-learning.md +83 -0
  165. package/package.json +9 -5
  166. package/rules/agent-roles.mdc +30 -0
  167. package/rules/ai-assisted-development.mdc +22 -0
  168. package/skills/agent-learning/SKILL.md +24 -0
  169. package/skills/agent-learning/manifest.json +40 -0
  170. package/skills/backlog-sync/SKILL.md +24 -0
  171. package/skills/backlog-sync/manifest.json +41 -0
  172. package/skills/diagram-export/SKILL.md +35 -0
  173. package/skills/diagram-export/manifest.json +40 -0
  174. package/skills/model-evaluation/SKILL.md +25 -0
  175. package/skills/model-evaluation/manifest.json +41 -0
  176. package/skills/playwright-evidence/SKILL.md +28 -0
  177. package/skills/playwright-evidence/manifest.json +46 -0
  178. package/skills/pr-review/SKILL.md +23 -0
  179. package/skills/pr-review/manifest.json +43 -0
  180. package/skills/prompt-registry/SKILL.md +24 -0
  181. package/skills/prompt-registry/manifest.json +45 -0
  182. package/skills/release-readiness/SKILL.md +25 -0
  183. package/skills/release-readiness/manifest.json +45 -0
  184. package/skills/source-of-truth/SKILL.md +24 -0
  185. package/skills/source-of-truth/manifest.json +47 -0
  186. package/skills/static-analysis/SKILL.md +26 -0
  187. package/skills/static-analysis/manifest.json +46 -0
package/package.json CHANGED
@@ -1,20 +1,21 @@
1
1
  {
2
2
  "name": "@jterrats/open-orchestra",
3
- "version": "0.1.0",
3
+ "version": "0.2.1",
4
4
  "type": "module",
5
5
  "bin": {
6
6
  "orchestra": "bin/orchestra.js"
7
7
  },
8
8
  "scripts": {
9
- "build": "tsc",
9
+ "build": "tsc && npm run build:web",
10
10
  "typecheck": "tsc --noEmit",
11
11
  "test": "npm run build && node --test test/**/*.js extensions/**/*.test.cjs",
12
- "lint": "eslint . && prettier --check \"{bin,scripts,test}/**/*.js\" \"extensions/**/*.{cjs,json,md}\" \"src/**/*.ts\" \"*.json\"",
13
- "format": "prettier --write \"{bin,scripts,test}/**/*.js\" \"extensions/**/*.{cjs,json,md}\" \"src/**/*.ts\" \"*.json\"",
12
+ "lint": "eslint . && prettier --check \"{bin,scripts,test,src}/**/*.js\" \"extensions/**/*.{cjs,json,md}\" \"src/**/*.ts\" \"*.json\"",
13
+ "format": "prettier --write \"{bin,scripts,test,src}/**/*.js\" \"extensions/**/*.{cjs,json,md}\" \"src/**/*.ts\" \"*.json\"",
14
14
  "secret-scan": "node scripts/secret-scan.js",
15
15
  "validate:workflow": "sh -c 'test ! -d .agent-workflow || (npm run build && node bin/orchestra.js validate)'",
16
16
  "precommit": "npm run lint && npm run typecheck && npm run secret-scan && npm test && npm run validate:workflow",
17
- "hooks:install": "git config core.hooksPath .githooks"
17
+ "hooks:install": "git config core.hooksPath .githooks",
18
+ "build:web": "esbuild src/web-console-client.js --bundle --format=esm --platform=browser --target=es2022 --outfile=dist/assets/web-console.js"
18
19
  },
19
20
  "engines": {
20
21
  "node": ">=22"
@@ -22,6 +23,7 @@
22
23
  "devDependencies": {
23
24
  "@eslint/js": "^10.0.1",
24
25
  "@types/node": "^25.6.0",
26
+ "esbuild": "^0.28.0",
25
27
  "eslint": "^10.2.1",
26
28
  "prettier": "^3.8.3",
27
29
  "typescript": "^6.0.3",
@@ -45,8 +47,10 @@
45
47
  "dist/",
46
48
  "rules/",
47
49
  "docs/",
50
+ "skills/",
48
51
  "AGENTS.md",
49
52
  "CLAUDE.md",
53
+ "CHANGELOG.md",
50
54
  "README.md",
51
55
  "package.json"
52
56
  ],
package/rules/agent-roles.mdc CHANGED
@@ -39,16 +39,41 @@ Use roles to force complete thinking, not to create silos. A single agent may co
39
39
  - Does not start coding until acceptance criteria and technical boundaries are clear enough.
40
40
  - Confirms the agreed implementation approach before editing files, except for trivial mechanical changes.
41
41
 
42
+ ## Frontend Specialist
43
+ - Owns browser behavior, component architecture, responsive UI, accessibility implementation, client performance, and visual regression risk.
44
+ - Reviews user-facing web changes against mobile-first flows, WCAG-oriented checks, and Playwright-visible behavior.
45
+ - Blocks frontend changes that cannot be verified in target browsers or viewports.
46
+
47
+ ## Backend Specialist
48
+ - Owns service boundaries, API contracts, domain services, persistence integration, concurrency, and failure modes.
49
+ - Reviews backend changes for secure coding, observability, idempotency, retries, data integrity, and server-side tests.
50
+ - Blocks backend changes with unclear contracts, untested failure modes, or unsafe data handling.
51
+
52
+ ## Mobile Specialist
53
+ - Owns mobile UX, device compatibility, offline behavior, permissions, native or hybrid runtime constraints, and store readiness.
54
+ - Reviews mobile changes with device evidence instead of relying only on desktop responsive checks.
55
+ - Blocks mobile releases without device matrix, runtime constraints, or store readiness evidence when applicable.
56
+
42
57
  ## QA
43
58
  - Owns verification strategy, test coverage, regression risk, and release confidence.
44
59
  - Defines happy paths, failure paths, boundary cases, and non-functional checks.
45
60
  - Challenges work that has implementation but no credible test plan.
46
61
 
62
+ ## SDET / Test Automation Engineer
63
+ - Owns automated test architecture, Playwright fixtures, page objects, resilient locators, and CI test reliability.
64
+ - Converts QA plans and acceptance criteria into repeatable smoke, regression, and evidence-producing tests.
65
+ - Blocks automation-heavy releases when tests are brittle, unisolated, or missing traceable evidence.
66
+
47
67
  ## DevOps
48
68
  - Owns deployment, CI/CD, observability, runtime configuration, rollback, and operational readiness.
49
69
  - Verifies environment segregation, infrastructure as code, migrations, secrets, and runbooks.
50
70
  - Blocks releases that cannot be deployed, monitored, rolled back, or supported.
51
71
 
72
+ ## Platform Engineer
73
+ - Owns internal developer platforms, golden paths, reusable templates, self-service workflows, and platform guardrails.
74
+ - Treats developer experience as a product while preserving security, compliance, cost visibility, and operational control.
75
+ - Blocks cross-repo platform changes without template validation, adoption notes, or self-service smoke evidence.
76
+
52
77
  ## Security
53
78
  - Owns threat modeling, abuse cases, data classification, identity, secrets, and dependency risk.
54
79
  - Reviews authentication, authorization, input handling, logging, encryption, and third-party exposure.
@@ -89,6 +114,11 @@ Use roles to force complete thinking, not to create silos. A single agent may co
89
114
  - Reviews user-facing changes for diagnosability, help text, recovery paths, and support escalation needs.
90
115
  - Feeds production incidents, tickets, and user pain back into Product Owner and QA workflows.
91
116
 
117
+ ## AI Evaluation / Prompt Quality Engineer
118
+ - Owns eval objectives, datasets, rubrics, prompt regression checks, model comparisons, and LLM behavior evidence.
119
+ - Treats prompt, model routing, and provider fallback changes as testable product behavior.
120
+ - Blocks AI behavior changes that rely on subjective review without eval cases, scoring rationale, or accepted residual risk.
121
+
92
122
  ## Compliance / Privacy
93
123
  - Owns regulatory requirements, privacy obligations, retention, consent, auditability, and data processing risk.
94
124
  - Reviews PII, restricted data, data residency, retention policies, access logs, consent, and third-party processors.
package/rules/ai-assisted-development.mdc CHANGED
@@ -29,3 +29,25 @@ AI-generated work must meet the same engineering bar as human-written work. Spee
29
29
  - Discuss the approach with the user before non-trivial AI-assisted implementation.
30
30
  - Explain trade-offs clearly and identify risks introduced by generated code.
31
31
  - If generated code reveals a better or riskier path than agreed, pause and realign before continuing.
32
+
33
+ ## Prompt Registry
34
+
35
+ - Use `.generated-prompts/` as the durable prompt register for generated or substantially changed artifacts.
36
+ - Before creating or substantially changing an artifact, read the relevant register file to preserve conventions, constraints, decisions, and known risks.
37
+ - After substantial changes, add or update one entry for the artifact with task, active role, key decisions, evidence, and the final prompt or a concise prompt summary.
38
+ - Keep only the latest prompt in each entry; rely on git history for prior versions. Do not update entries for typos, formatting-only edits, or single-line mechanical fixes.
39
+
40
+ ## Skill Loading
41
+
42
+ - Keep primary agent instruction files as short indexes plus non-negotiable rules.
43
+ - Load detailed skills only when task signals, active roles, touched paths, or risk areas require them.
44
+ - Prefer skill summaries first; load full skill instructions, assets, scripts, and examples only at execution time.
45
+ - Record selected skills in task context, handoffs, evidence, and final summaries when they materially shaped the work.
46
+
47
+ ## Source of Truth and Learning
48
+
49
+ - Select authoritative source groups before acting: project instructions, backlog, architecture, codebase, quality/security, DevOps/runtime, vendor docs, and agent memory.
50
+ - Prefer local project sources first and official vendor documentation for current APIs, frameworks, cloud services, providers, and tools.
51
+ - When an action fails in a reusable way, record the lesson in `.agent-workflow/agent-lessons.jsonl` with operation, error signature, root cause, fix, prevention, and verification.
52
+ - Before repeating risky operations, search prior lessons for matching tool, command, error signature, or operation.
53
+ - Promote repeated lessons into the relevant skill or rule instead of letting agents rediscover the same failure.
@@ -0,0 +1,24 @@
1
+ # Agent Learning
2
+
3
+ Record reusable failure lessons and promote repeated lessons into skills or rules.
4
+
5
+ ## When To Load
6
+
7
+ - Trigger: `failure`
8
+ - Trigger: `failed`
9
+ - Trigger: `error`
10
+ - Trigger: `syntax`
11
+ - Trigger: `escaping`
12
+ - Trigger: `permission`
13
+ - Trigger: `lesson`
14
+ - Trigger: `learn`
15
+
16
+ ## Procedure
17
+
18
+ - Search relevant lessons before repeating risky operations.
19
+ - After reusable failures, record operation, error signature, root cause, fix, prevention, and verification.
20
+ - Promote repeated lessons into versioned skills or rules after review.
21
+
22
+ ## Evidence
23
+
24
+ - `file`
@@ -0,0 +1,40 @@
1
+ {
2
+ "id": "agent-learning",
3
+ "name": "Agent Learning",
4
+ "summary": "Record reusable failure lessons and promote repeated lessons into skills or rules.",
5
+ "triggers": [
6
+ "failure",
7
+ "failed",
8
+ "error",
9
+ "syntax",
10
+ "escaping",
11
+ "permission",
12
+ "lesson",
13
+ "learn"
14
+ ],
15
+ "roles": [
16
+ "parent",
17
+ "context_curator",
18
+ "toolsmith",
19
+ "developer",
20
+ "qa"
21
+ ],
22
+ "capabilities": [
23
+ "failure-learning",
24
+ "memory-hygiene",
25
+ "repeat-prevention"
26
+ ],
27
+ "riskAreas": [
28
+ "maintainability",
29
+ "governance"
30
+ ],
31
+ "sourceGroups": [
32
+ "agent-memory",
33
+ "codebase"
34
+ ],
35
+ "evidence": [
36
+ "file"
37
+ ],
38
+ "loadBudget": "small",
39
+ "entry": "skills/agent-learning/SKILL.md"
40
+ }
@@ -0,0 +1,24 @@
1
+ # Backlog Sync
2
+
3
+ Keep GitHub issues, local stories, and workflow tasks aligned.
4
+
5
+ ## When To Load
6
+
7
+ - Trigger: `backlog`
8
+ - Trigger: `issue`
9
+ - Trigger: `story`
10
+ - Trigger: `epic`
11
+ - Trigger: `github`
12
+ - Trigger: `acceptance criteria`
13
+ - Trigger: `refine`
14
+
15
+ ## Procedure
16
+
17
+ - Confirm backlog IDs and acceptance criteria before implementation.
18
+ - Keep local tasks, docs, and GitHub issues aligned when one changes.
19
+ - Surface missing refinement as a blocker instead of guessing scope.
20
+
21
+ ## Evidence
22
+
23
+ - `file`
24
+ - `report`
@@ -0,0 +1,41 @@
1
+ {
2
+ "id": "backlog-sync",
3
+ "name": "Backlog Sync",
4
+ "summary": "Keep GitHub issues, local stories, and workflow tasks aligned.",
5
+ "triggers": [
6
+ "backlog",
7
+ "issue",
8
+ "story",
9
+ "epic",
10
+ "github",
11
+ "acceptance criteria",
12
+ "refine"
13
+ ],
14
+ "roles": [
15
+ "product_manager",
16
+ "product_owner",
17
+ "business_analyst",
18
+ "planner",
19
+ "parent"
20
+ ],
21
+ "capabilities": [
22
+ "backlog-management",
23
+ "story-refinement",
24
+ "scope-control"
25
+ ],
26
+ "riskAreas": [
27
+ "governance",
28
+ "scope"
29
+ ],
30
+ "sourceGroups": [
31
+ "product-backlog",
32
+ "project-instructions",
33
+ "agent-memory"
34
+ ],
35
+ "evidence": [
36
+ "file",
37
+ "report"
38
+ ],
39
+ "loadBudget": "small",
40
+ "entry": "skills/backlog-sync/SKILL.md"
41
+ }
@@ -0,0 +1,35 @@
1
+ # Diagram Export
2
+
3
+ Create, validate, and export architecture, workflow, and sequence diagrams.
4
+
5
+ ## When To Load
6
+
7
+ - Trigger: `diagram`
8
+ - Trigger: `mermaid`
9
+ - Trigger: `architecture`
10
+ - Trigger: `flow`
11
+ - Trigger: `sequence`
12
+ - Trigger: `draw.io`
13
+ - Trigger: `lucid`
14
+
15
+ ## Procedure
16
+
17
+ - Identify the diagram purpose and authoritative architecture sources before drawing.
18
+ - Choose the diagram style from the decision matrix before drafting.
19
+ - Prefer text-native diagrams such as Mermaid unless the project requires another format.
20
+ - Run `orchestra diagrams lint --file <diagram.mmd>` for lint-only validation before sharing Mermaid diagrams.
21
+ - Attach evidence with `orchestra diagrams lint --file <diagram.mmd> --task <task-id>` when the diagram supports workflow delivery.
22
+ - If `mmdc` is missing, report the install guidance instead of pretending validation passed.
23
+
24
+ ## Decision Matrix
25
+
26
+ - Architecture boundary or component ownership: C4/container or component diagram.
27
+ - User, business, or agent workflow: flowchart or state diagram.
28
+ - Service/API/message exchange: sequence diagram.
29
+ - Data ownership or relationships: entity relationship diagram.
30
+ - Runtime topology, infrastructure, or deployment: deployment or infrastructure diagram.
31
+
32
+ ## Evidence
33
+
34
+ - `file`
35
+ - `report`
@@ -0,0 +1,40 @@
1
+ {
2
+ "id": "diagram-export",
3
+ "name": "Diagram Export",
4
+ "summary": "Create, validate, and export architecture, workflow, and sequence diagrams.",
5
+ "triggers": [
6
+ "diagram",
7
+ "mermaid",
8
+ "architecture",
9
+ "flow",
10
+ "sequence",
11
+ "draw.io",
12
+ "lucid"
13
+ ],
14
+ "roles": [
15
+ "architect",
16
+ "business_analyst",
17
+ "product_manager",
18
+ "tech_lead",
19
+ "technical_writer"
20
+ ],
21
+ "capabilities": [
22
+ "diagramming",
23
+ "architecture-communication"
24
+ ],
25
+ "riskAreas": [
26
+ "architecture",
27
+ "documentation"
28
+ ],
29
+ "sourceGroups": [
30
+ "architecture",
31
+ "product-backlog",
32
+ "agent-memory"
33
+ ],
34
+ "evidence": [
35
+ "file",
36
+ "report"
37
+ ],
38
+ "loadBudget": "normal",
39
+ "entry": "skills/diagram-export/SKILL.md"
40
+ }
@@ -0,0 +1,25 @@
1
+ # Model Evaluation
2
+
3
+ Run prompt, model, provider-routing, fallback, and rubric evaluations.
4
+
5
+ ## When To Load
6
+
7
+ - Trigger: `model`
8
+ - Trigger: `llm`
9
+ - Trigger: `prompt`
10
+ - Trigger: `provider`
11
+ - Trigger: `fallback`
12
+ - Trigger: `eval`
13
+ - Trigger: `rubric`
14
+ - Trigger: `routing`
15
+
16
+ ## Procedure
17
+
18
+ - Define eval objectives, cases, rubric, and expected behavior before changing prompts or routing.
19
+ - Compare model/provider behavior for material changes and record disagreements.
20
+ - Avoid storing raw sensitive prompts or responses in provenance artifacts.
21
+
22
+ ## Evidence
23
+
24
+ - `report`
25
+ - `file`
@@ -0,0 +1,41 @@
1
+ {
2
+ "id": "model-evaluation",
3
+ "name": "Model Evaluation",
4
+ "summary": "Run prompt, model, provider-routing, fallback, and rubric evaluations.",
5
+ "triggers": [
6
+ "model",
7
+ "llm",
8
+ "prompt",
9
+ "provider",
10
+ "fallback",
11
+ "eval",
12
+ "rubric",
13
+ "routing"
14
+ ],
15
+ "roles": [
16
+ "ai_evaluation_engineer",
17
+ "toolsmith",
18
+ "architect",
19
+ "parent"
20
+ ],
21
+ "capabilities": [
22
+ "llm-evaluation",
23
+ "provider-routing",
24
+ "prompt-quality"
25
+ ],
26
+ "riskAreas": [
27
+ "governance",
28
+ "quality"
29
+ ],
30
+ "sourceGroups": [
31
+ "vendor-docs",
32
+ "agent-memory",
33
+ "quality-security"
34
+ ],
35
+ "evidence": [
36
+ "report",
37
+ "file"
38
+ ],
39
+ "loadBudget": "normal",
40
+ "entry": "skills/model-evaluation/SKILL.md"
41
+ }
@@ -0,0 +1,28 @@
1
+ # Playwright Evidence
2
+
3
+ Plan browser automation and attach screenshots, traces, videos, and reports.
4
+
5
+ ## When To Load
6
+
7
+ - Trigger: `playwright`
8
+ - Trigger: `browser`
9
+ - Trigger: `e2e`
10
+ - Trigger: `screenshot`
11
+ - Trigger: `trace`
12
+ - Trigger: `video`
13
+ - Trigger: `responsive`
14
+ - Trigger: `web`
15
+ - Trigger: `ui`
16
+
17
+ ## Procedure
18
+
19
+ - Plan user-value scenarios from acceptance criteria before writing tests.
20
+ - Use resilient locators and page objects for repeated flows.
21
+ - Attach screenshots, traces, videos, or reports as evidence for release decisions.
22
+
23
+ ## Evidence
24
+
25
+ - `screenshot`
26
+ - `trace`
27
+ - `video`
28
+ - `report`
@@ -0,0 +1,46 @@
1
+ {
2
+ "id": "playwright-evidence",
3
+ "name": "Playwright Evidence",
4
+ "summary": "Plan browser automation and attach screenshots, traces, videos, and reports.",
5
+ "triggers": [
6
+ "playwright",
7
+ "browser",
8
+ "e2e",
9
+ "screenshot",
10
+ "trace",
11
+ "video",
12
+ "responsive",
13
+ "web",
14
+ "ui"
15
+ ],
16
+ "roles": [
17
+ "qa",
18
+ "sdet",
19
+ "frontend_specialist",
20
+ "ux_ui_designer",
21
+ "ux_researcher_accessibility"
22
+ ],
23
+ "capabilities": [
24
+ "e2e-testing",
25
+ "browser-evidence",
26
+ "accessibility-check"
27
+ ],
28
+ "riskAreas": [
29
+ "ux",
30
+ "release"
31
+ ],
32
+ "sourceGroups": [
33
+ "quality-security",
34
+ "codebase",
35
+ "product-backlog",
36
+ "agent-memory"
37
+ ],
38
+ "evidence": [
39
+ "screenshot",
40
+ "trace",
41
+ "video",
42
+ "report"
43
+ ],
44
+ "loadBudget": "normal",
45
+ "entry": "skills/playwright-evidence/SKILL.md"
46
+ }
@@ -0,0 +1,23 @@
1
+ # PR Review
2
+
3
+ Produce review findings, PR summaries, risks, rollout notes, and missing-test gaps.
4
+
5
+ ## When To Load
6
+
7
+ - Trigger: `pr`
8
+ - Trigger: `pull request`
9
+ - Trigger: `review`
10
+ - Trigger: `diff`
11
+ - Trigger: `merge`
12
+ - Trigger: `release summary`
13
+
14
+ ## Procedure
15
+
16
+ - Review behavior, tests, risks, rollout, rollback, and missing evidence before summaries.
17
+ - Lead with findings and blockers, then summarize changes.
18
+ - Reference local files, task context, reviews, and evidence rather than generated claims.
19
+
20
+ ## Evidence
21
+
22
+ - `file`
23
+ - `report`
@@ -0,0 +1,43 @@
1
+ {
2
+ "id": "pr-review",
3
+ "name": "PR Review",
4
+ "summary": "Produce review findings, PR summaries, risks, rollout notes, and missing-test gaps.",
5
+ "triggers": [
6
+ "pr",
7
+ "pull request",
8
+ "review",
9
+ "diff",
10
+ "merge",
11
+ "release summary"
12
+ ],
13
+ "roles": [
14
+ "reviewer_critic",
15
+ "tech_lead",
16
+ "qa",
17
+ "security",
18
+ "release_manager",
19
+ "architect"
20
+ ],
21
+ "capabilities": [
22
+ "review",
23
+ "risk-summary",
24
+ "change-summary"
25
+ ],
26
+ "riskAreas": [
27
+ "release",
28
+ "security",
29
+ "maintainability"
30
+ ],
31
+ "sourceGroups": [
32
+ "codebase",
33
+ "quality-security",
34
+ "product-backlog",
35
+ "agent-memory"
36
+ ],
37
+ "evidence": [
38
+ "file",
39
+ "report"
40
+ ],
41
+ "loadBudget": "normal",
42
+ "entry": "skills/pr-review/SKILL.md"
43
+ }
@@ -0,0 +1,24 @@
1
+ # Prompt Registry
2
+
3
+ Read and update .generated-prompts registers for substantial AI-generated artifacts.
4
+
5
+ ## When To Load
6
+
7
+ - Trigger: `prompt`
8
+ - Trigger: `generated`
9
+ - Trigger: `artifact`
10
+ - Trigger: `code`
11
+ - Trigger: `ui`
12
+ - Trigger: `docs`
13
+ - Trigger: `diagram`
14
+ - Trigger: `eval`
15
+
16
+ ## Procedure
17
+
18
+ - Before substantial generation, read the relevant .generated-prompts register.
19
+ - After substantial changes, update one entry with task, role, decisions, evidence, and prompt summary.
20
+ - Do not update the register for typo-only, formatting-only, or single-line mechanical fixes.
21
+
22
+ ## Evidence
23
+
24
+ - `file`
@@ -0,0 +1,45 @@
1
+ {
2
+ "id": "prompt-registry",
3
+ "name": "Prompt Registry",
4
+ "summary": "Read and update .generated-prompts registers for substantial AI-generated artifacts.",
5
+ "triggers": [
6
+ "prompt",
7
+ "generated",
8
+ "artifact",
9
+ "code",
10
+ "ui",
11
+ "docs",
12
+ "diagram",
13
+ "eval"
14
+ ],
15
+ "roles": [
16
+ "parent",
17
+ "developer",
18
+ "tech_lead",
19
+ "frontend_specialist",
20
+ "backend_specialist",
21
+ "mobile_specialist",
22
+ "sdet",
23
+ "qa",
24
+ "technical_writer",
25
+ "ai_evaluation_engineer"
26
+ ],
27
+ "capabilities": [
28
+ "prompt-memory",
29
+ "artifact-traceability",
30
+ "context-continuity"
31
+ ],
32
+ "riskAreas": [
33
+ "maintainability",
34
+ "governance"
35
+ ],
36
+ "sourceGroups": [
37
+ "agent-memory",
38
+ "codebase"
39
+ ],
40
+ "evidence": [
41
+ "file"
42
+ ],
43
+ "loadBudget": "small",
44
+ "entry": "skills/prompt-registry/SKILL.md"
45
+ }
@@ -0,0 +1,25 @@
1
+ # Release Readiness
2
+
3
+ Validate gates, rollback, observability, support, and customer-impact evidence.
4
+
5
+ ## When To Load
6
+
7
+ - Trigger: `release`
8
+ - Trigger: `deploy`
9
+ - Trigger: `rollback`
10
+ - Trigger: `go-live`
11
+ - Trigger: `readiness`
12
+ - Trigger: `downtime`
13
+ - Trigger: `observability`
14
+
15
+ ## Procedure
16
+
17
+ - Validate gates, evidence, locks, reviews, rollback, observability, and support readiness.
18
+ - Treat missing rollback or unresolved critical QA/security/SRE findings as blockers.
19
+ - Record release evidence and accepted residual risks explicitly.
20
+
21
+ ## Evidence
22
+
23
+ - `command`
24
+ - `report`
25
+ - `file`