claude-code-kit 0.7.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (209) hide show
  1. claude_code_kit-0.7.0.dist-info/METADATA +384 -0
  2. claude_code_kit-0.7.0.dist-info/RECORD +209 -0
  3. claude_code_kit-0.7.0.dist-info/WHEEL +4 -0
  4. claude_code_kit-0.7.0.dist-info/entry_points.txt +4 -0
  5. claude_code_kit-0.7.0.dist-info/licenses/LICENSE +21 -0
  6. claude_kit/__init__.py +10 -0
  7. claude_kit/__main__.py +8 -0
  8. claude_kit/_payload/agents/acceptance-reviewer.md +60 -0
  9. claude_kit/_payload/agents/auditor.md +76 -0
  10. claude_kit/_payload/agents/dependency-scanner.md +84 -0
  11. claude_kit/_payload/agents/developer.md +187 -0
  12. claude_kit/_payload/agents/devils-advocate.md +62 -0
  13. claude_kit/_payload/agents/devops-engineer.md +134 -0
  14. claude_kit/_payload/agents/e2e-tester.md +152 -0
  15. claude_kit/_payload/agents/em-reviewer.md +105 -0
  16. claude_kit/_payload/agents/incident-responder.md +64 -0
  17. claude_kit/_payload/agents/merge-reviewer.md +194 -0
  18. claude_kit/_payload/agents/observability-engineer.md +94 -0
  19. claude_kit/_payload/agents/orchestrator.md +551 -0
  20. claude_kit/_payload/agents/owasp-reviewer.md +76 -0
  21. claude_kit/_payload/agents/policy-validator.md +63 -0
  22. claude_kit/_payload/agents/pr-raiser.md +138 -0
  23. claude_kit/_payload/agents/risk-classifier.md +50 -0
  24. claude_kit/_payload/agents/sdlc-code-reviewer.md +196 -0
  25. claude_kit/_payload/agents/secret-scanner.md +70 -0
  26. claude_kit/_payload/agents/security-reviewer.md +80 -0
  27. claude_kit/_payload/agents/senior-backend-dev.md +199 -0
  28. claude_kit/_payload/agents/senior-frontend-dev.md +181 -0
  29. claude_kit/_payload/agents/senior-tester.md +206 -0
  30. claude_kit/_payload/agents/spec-doc-writer.md +331 -0
  31. claude_kit/_payload/agents/story-planner.md +56 -0
  32. claude_kit/_payload/agents/technical-architect.md +139 -0
  33. claude_kit/_payload/agents/tester.md +193 -0
  34. claude_kit/_payload/agents/ui-designer.md +73 -0
  35. claude_kit/_payload/agents/unit-tester.md +119 -0
  36. claude_kit/_payload/catalog/mcp.yaml +54 -0
  37. claude_kit/_payload/catalog/org.yaml +145 -0
  38. claude_kit/_payload/catalog/profiles.yaml +96 -0
  39. claude_kit/_payload/catalog/stacks.yaml +96 -0
  40. claude_kit/_payload/commands/init.md +36 -0
  41. claude_kit/_payload/commands/sdlc.md +18 -0
  42. claude_kit/_payload/commands/status.md +20 -0
  43. claude_kit/_payload/hooks/hooks.json +58 -0
  44. claude_kit/_payload/hooks/scripts/audit-log.sh +18 -0
  45. claude_kit/_payload/hooks/scripts/guard-secrets.sh +26 -0
  46. claude_kit/_payload/hooks/scripts/lint-fix.sh +38 -0
  47. claude_kit/_payload/hooks/scripts/load-continuity.sh +32 -0
  48. claude_kit/_payload/hooks/scripts/load-learnings.sh +40 -0
  49. claude_kit/_payload/hooks/scripts/type-check.sh +23 -0
  50. claude_kit/_payload/hooks/scripts/validate-frontmatter.sh +34 -0
  51. claude_kit/_payload/hooks/scripts/validate-settings.sh +21 -0
  52. claude_kit/_payload/hooks/scripts/warn-large-edits.sh +24 -0
  53. claude_kit/_payload/hooks/scripts/warn-missing-tests.sh +24 -0
  54. claude_kit/_payload/hooks/scripts/warn-sensitive-files.sh +30 -0
  55. claude_kit/_payload/hooks/scripts/warn-shared-modules.sh +33 -0
  56. claude_kit/_payload/rules/agent-guardrails.md +83 -0
  57. claude_kit/_payload/rules/agent-memory.md +106 -0
  58. claude_kit/_payload/rules/agent-resilience.md +61 -0
  59. claude_kit/_payload/rules/autonomy-levels.md +30 -0
  60. claude_kit/_payload/rules/code-organization.md +312 -0
  61. claude_kit/_payload/rules/continuity.md +84 -0
  62. claude_kit/_payload/rules/design-patterns.md +422 -0
  63. claude_kit/_payload/rules/devops-observability.md +57 -0
  64. claude_kit/_payload/rules/documentation.md +326 -0
  65. claude_kit/_payload/rules/evals.md +62 -0
  66. claude_kit/_payload/rules/frontend-best-practices.md +157 -0
  67. claude_kit/_payload/rules/goal-setting-and-monitoring.md +72 -0
  68. claude_kit/_payload/rules/human-in-the-loop.md +64 -0
  69. claude_kit/_payload/rules/linting-and-formatting.md +220 -0
  70. claude_kit/_payload/rules/mandatory-workflow.md +309 -0
  71. claude_kit/_payload/rules/model-tiers.md +34 -0
  72. claude_kit/_payload/rules/quality-gates.md +107 -0
  73. claude_kit/_payload/rules/rarv-cycle.md +31 -0
  74. claude_kit/_payload/rules/reasoning-techniques.md +62 -0
  75. claude_kit/_payload/rules/responsive-and-accessibility.md +353 -0
  76. claude_kit/_payload/rules/risk-classification.md +36 -0
  77. claude_kit/_payload/rules/testing.md +417 -0
  78. claude_kit/_payload/rules/tool-design.md +66 -0
  79. claude_kit/_payload/skills/_references/accessibility-checklist.md +160 -0
  80. claude_kit/_payload/skills/_references/orchestration-patterns.md +405 -0
  81. claude_kit/_payload/skills/_references/performance-checklist.md +153 -0
  82. claude_kit/_payload/skills/_references/security-checklist.md +134 -0
  83. claude_kit/_payload/skills/_references/testing-patterns.md +236 -0
  84. claude_kit/_payload/skills/accessibility-review/SKILL.md +56 -0
  85. claude_kit/_payload/skills/api-and-interface-design/SKILL.md +294 -0
  86. claude_kit/_payload/skills/api-integration/SKILL.md +348 -0
  87. claude_kit/_payload/skills/archive-sprint/SKILL.md +31 -0
  88. claude_kit/_payload/skills/backlog/SKILL.md +41 -0
  89. claude_kit/_payload/skills/backlog/item-template.md +20 -0
  90. claude_kit/_payload/skills/browser-testing-with-devtools/SKILL.md +302 -0
  91. claude_kit/_payload/skills/ci-cd-and-automation/SKILL.md +402 -0
  92. claude_kit/_payload/skills/code-review-and-quality/SKILL.md +347 -0
  93. claude_kit/_payload/skills/code-simplification/SKILL.md +331 -0
  94. claude_kit/_payload/skills/component-design/SKILL.md +171 -0
  95. claude_kit/_payload/skills/consolidate-learnings/SKILL.md +55 -0
  96. claude_kit/_payload/skills/context-engineering/SKILL.md +321 -0
  97. claude_kit/_payload/skills/debugging-and-error-recovery/SKILL.md +300 -0
  98. claude_kit/_payload/skills/decision/SKILL.md +46 -0
  99. claude_kit/_payload/skills/decision/adr-template.md +36 -0
  100. claude_kit/_payload/skills/deprecation-and-migration/SKILL.md +207 -0
  101. claude_kit/_payload/skills/documentation-and-adrs/SKILL.md +299 -0
  102. claude_kit/_payload/skills/doubt-driven-development/SKILL.md +243 -0
  103. claude_kit/_payload/skills/execute/SKILL.md +27 -0
  104. claude_kit/_payload/skills/frontend-ui-engineering/SKILL.md +328 -0
  105. claude_kit/_payload/skills/git-workflow-and-versioning/SKILL.md +300 -0
  106. claude_kit/_payload/skills/idea-refine/SKILL.md +178 -0
  107. claude_kit/_payload/skills/idea-refine/examples.md +238 -0
  108. claude_kit/_payload/skills/idea-refine/frameworks.md +99 -0
  109. claude_kit/_payload/skills/idea-refine/refinement-criteria.md +113 -0
  110. claude_kit/_payload/skills/idea-refine/scripts/idea-refine.sh +15 -0
  111. claude_kit/_payload/skills/incident-postmortem/SKILL.md +74 -0
  112. claude_kit/_payload/skills/incremental-implementation/SKILL.md +245 -0
  113. claude_kit/_payload/skills/interview-me/SKILL.md +221 -0
  114. claude_kit/_payload/skills/load-testing/SKILL.md +83 -0
  115. claude_kit/_payload/skills/manual-test/SKILL.md +516 -0
  116. claude_kit/_payload/skills/performance-optimization/SKILL.md +277 -0
  117. claude_kit/_payload/skills/planning-and-task-breakdown/SKILL.md +223 -0
  118. claude_kit/_payload/skills/playwright-verification/SKILL.md +205 -0
  119. claude_kit/_payload/skills/refresh-docs/SKILL.md +63 -0
  120. claude_kit/_payload/skills/remember/SKILL.md +96 -0
  121. claude_kit/_payload/skills/scope/SKILL.md +52 -0
  122. claude_kit/_payload/skills/scope/scope-template.md +82 -0
  123. claude_kit/_payload/skills/sdlc/SKILL.md +83 -0
  124. claude_kit/_payload/skills/security-and-hardening/SKILL.md +368 -0
  125. claude_kit/_payload/skills/security-verification/SKILL.md +209 -0
  126. claude_kit/_payload/skills/shipping-and-launch/SKILL.md +309 -0
  127. claude_kit/_payload/skills/smoke-test/SKILL.md +78 -0
  128. claude_kit/_payload/skills/source-driven-development/SKILL.md +195 -0
  129. claude_kit/_payload/skills/spec-driven-development/SKILL.md +200 -0
  130. claude_kit/_payload/skills/sprint/SKILL.md +67 -0
  131. claude_kit/_payload/skills/sprint/sprint-template.md +90 -0
  132. claude_kit/_payload/skills/test-driven-development/SKILL.md +383 -0
  133. claude_kit/_payload/skills/threat-model/SKILL.md +60 -0
  134. claude_kit/_payload/skills/triage/SKILL.md +87 -0
  135. claude_kit/_payload/skills/ui-ux-design/SKILL.md +71 -0
  136. claude_kit/_payload/skills/unit-test/SKILL.md +237 -0
  137. claude_kit/_payload/skills/using-agent-skills/SKILL.md +180 -0
  138. claude_kit/_payload/templates/CLAUDE.md +238 -0
  139. claude_kit/_payload/templates/CLAUDE.stack.md.tmpl +53 -0
  140. claude_kit/_payload/templates/CONTINUITY.template.md +35 -0
  141. claude_kit/_payload/templates/README.claude-sdlc.md.tmpl +219 -0
  142. claude_kit/_payload/templates/agent-memory/MEMORY.md +30 -0
  143. claude_kit/_payload/templates/agent-memory/api/.gitkeep +0 -0
  144. claude_kit/_payload/templates/agent-memory/architecture/.gitkeep +0 -0
  145. claude_kit/_payload/templates/agent-memory/debugging/.gitkeep +0 -0
  146. claude_kit/_payload/templates/agent-memory/gotchas/.gitkeep +0 -0
  147. claude_kit/_payload/templates/agent-memory/patterns/.gitkeep +0 -0
  148. claude_kit/_payload/templates/agent-memory/performance/.gitkeep +0 -0
  149. claude_kit/_payload/templates/artifacts/adr.md +18 -0
  150. claude_kit/_payload/templates/artifacts/feature-spec.md +29 -0
  151. claude_kit/_payload/templates/artifacts/release-plan.md +23 -0
  152. claude_kit/_payload/templates/artifacts/runbook.md +24 -0
  153. claude_kit/_payload/templates/artifacts/security-review.md +23 -0
  154. claude_kit/_payload/templates/artifacts/test-plan.md +22 -0
  155. claude_kit/_payload/templates/org/README.md +53 -0
  156. claude_kit/_payload/templates/org/agents/data-workflow-agent.md +59 -0
  157. claude_kit/_payload/templates/org/agents/founder-prototype-agent.md +61 -0
  158. claude_kit/_payload/templates/org/agents/internal-tools-builder.md +63 -0
  159. claude_kit/_payload/templates/org/agents/pm-copilot.md +60 -0
  160. claude_kit/_payload/templates/org/agents/support-ticket-engineer.md +63 -0
  161. claude_kit/_payload/templates/org/packs/devops-and-release/README.md +46 -0
  162. claude_kit/_payload/templates/org/packs/devops-and-release/pack.yaml +32 -0
  163. claude_kit/_payload/templates/org/packs/engineering-core/README.md +46 -0
  164. claude_kit/_payload/templates/org/packs/engineering-core/pack.yaml +44 -0
  165. claude_kit/_payload/templates/org/packs/non-engineer-builder/README.md +53 -0
  166. claude_kit/_payload/templates/org/packs/non-engineer-builder/pack.yaml +39 -0
  167. claude_kit/_payload/templates/org/packs/onboarding-and-docs/README.md +49 -0
  168. claude_kit/_payload/templates/org/packs/onboarding-and-docs/pack.yaml +26 -0
  169. claude_kit/_payload/templates/org/packs/product-to-code/README.md +50 -0
  170. claude_kit/_payload/templates/org/packs/product-to-code/pack.yaml +34 -0
  171. claude_kit/_payload/templates/org/packs/quality-and-review/README.md +53 -0
  172. claude_kit/_payload/templates/org/packs/quality-and-review/pack.yaml +40 -0
  173. claude_kit/_payload/templates/org/packs/security-and-compliance/README.md +50 -0
  174. claude_kit/_payload/templates/org/packs/security-and-compliance/pack.yaml +36 -0
  175. claude_kit/_payload/templates/org/rules/ai-working-agreement.md +45 -0
  176. claude_kit/_payload/templates/org/rules/ambiguity-resolution.md +36 -0
  177. claude_kit/_payload/templates/org/rules/branch-and-pr-policy.md +41 -0
  178. claude_kit/_payload/templates/org/rules/compliance-policy.md +50 -0
  179. claude_kit/_payload/templates/org/rules/non-engineer-safe-coding.md +37 -0
  180. claude_kit/_payload/templates/org/rules/pii-policy.md +46 -0
  181. claude_kit/_payload/templates/org/rules/production-data-policy.md +35 -0
  182. claude_kit/_payload/templates/org/rules/prompt-to-task-conversion.md +30 -0
  183. claude_kit/_payload/templates/org/rules/prototype-boundaries.md +40 -0
  184. claude_kit/_payload/templates/org/rules/secrets-policy.md +34 -0
  185. claude_kit/_payload/templates/org/skills/customer-issue-to-fix/SKILL.md +61 -0
  186. claude_kit/_payload/templates/org/skills/feature-from-idea/SKILL.md +56 -0
  187. claude_kit/_payload/templates/org/skills/prompt-to-safe-task/SKILL.md +59 -0
  188. claude_kit/_payload/templates/org/skills/prototype-to-production/SKILL.md +61 -0
  189. claude_kit/_payload/templates/org/skills/repo-onboarding/SKILL.md +60 -0
  190. claude_kit/_payload/templates/settings.json +53 -0
  191. claude_kit/_payload/templates/stacks/backend/python/fastapi/rules/fastapi-patterns.md +64 -0
  192. claude_kit/_payload/templates/stacks/db/mongodb/agents/migration-specialist.md +61 -0
  193. claude_kit/_payload/templates/stacks/db/mongodb/agents/mongodb-specialist.md +59 -0
  194. claude_kit/_payload/templates/stacks/db/mongodb/rules/mongodb-patterns.md +39 -0
  195. claude_kit/_payload/templates/stacks/db/postgres/agents/db-performance-reviewer.md +66 -0
  196. claude_kit/_payload/templates/stacks/db/postgres/agents/migration-specialist.md +56 -0
  197. claude_kit/_payload/templates/stacks/db/postgres/agents/postgres-specialist.md +58 -0
  198. claude_kit/_payload/templates/stacks/db/postgres/rules/database-performance.md +64 -0
  199. claude_kit/_payload/templates/stacks/db/postgres/rules/postgres-patterns.md +43 -0
  200. claude_kit/_payload/templates/stacks/frontend/react/rules/react-patterns.md +63 -0
  201. claude_kit/catalog.py +476 -0
  202. claude_kit/cli.py +327 -0
  203. claude_kit/hooks.py +246 -0
  204. claude_kit/models.py +205 -0
  205. claude_kit/prompts.py +209 -0
  206. claude_kit/render.py +146 -0
  207. claude_kit/scaffold.py +492 -0
  208. claude_kit/upgrader.py +294 -0
  209. claude_kit/validator.py +197 -0
@@ -0,0 +1,193 @@
1
+ ---
2
+ name: tester
3
+ description: Validates backend APIs together with the frontend. Verifies API correctness, request/response behavior, UI rendering against spec, integration, error states, and edge cases. Can be spawned in parallel with a testing lane focus.
4
+ tools: Read, Write, Edit, Bash, Glob, Grep
5
+ permissionMode: acceptEdits
6
+ model: sonnet
7
+ color: lime
8
+ tier: specialist
9
+ ---
10
+
11
+ You are **Agent: Tester** — an integration tester for the project.
12
+
13
+ ## Your Job
14
+
15
+ After code review is approved, validate that the implementation works correctly. Per `CLAUDE.md` §5, **work is not complete without tester validation**.
16
+
17
+ ## Execution Mode
18
+
19
+ You may be spawned by the Orchestrator in one of these modes:
20
+
21
+ - **`api`** — Test backend API endpoints only (status codes, response shapes, validation, auth, tenant/authorization scoping if applicable)
22
+ - **`ui`** — Test frontend UI only (screen states, interactions, design spec compliance, accessibility)
23
+ - **`integration`** — Test end-to-end flows (frontend → API → data layer → API → frontend)
24
+ - **`full`** — Test everything (used for small features or single-stack work)
25
+
26
+ When spawned in a specific mode, **focus exclusively on that testing lane**. The merge-reviewer will verify that all lanes together provide complete coverage.
27
+
28
+ ## MANDATORY: Read Before Testing
29
+
30
+ 1. **`docs/specs/{feature-name}_spec.md`** — approved spec + developer documentation (expected behavior, acceptance criteria, API contracts)
31
+ 2. **`CLAUDE.md`** — engineering delivery rules
32
+ 3. **`.claude/rules/testing.md`** — testing standards
33
+ 4. **`.claude/rules/design-patterns.md`** — verify patterns are applied correctly
34
+ 5. The design spec (if one exists and the mode is `ui`, `integration`, or `full`)
35
+
36
+ ## Input
37
+
38
+ You will receive:
39
+ - Your **testing mode** (api | ui | integration | full)
40
+ - The approved, code-reviewed production code
41
+ - `docs/specs/{feature-name}_spec.md`
42
+ - Optionally, the design spec
43
+
44
+ ---
45
+
46
+ ## Mode: API Testing
47
+
48
+ Test each API endpoint defined in the spec using the project's HTTP testing tools (e.g., curl, httpie, or the project's test client).
49
+
50
+ For each endpoint, verify:
51
+ - [ ] Correct status code (201 create, 200 read, 204 delete, etc.)
52
+ - [ ] Response body matches the expected schema in the spec
53
+ - [ ] Validation errors return appropriate error status with descriptive messages
54
+ - [ ] Unauthenticated requests return 401 (if applicable)
55
+ - [ ] Permission violations return 403 (if applicable)
56
+ - [ ] Not-found returns 404
57
+ - [ ] Duplicates return 409 (if applicable)
58
+ - [ ] Tenant/authorization scoping: User A cannot access User B's data (for multi-tenant/scoped systems)
59
+ - [ ] Rate limiting works on auth/public endpoints (if applicable)
60
+ - [ ] Pagination returns correct metadata (page size, page number, has next, total records) if applicable
61
+ - [ ] Sorting/filtering works as specified
62
+
63
+ ---
64
+
65
+ ## Mode: UI Testing
66
+
67
+ Use the project's browser automation tools (e.g., Chrome DevTools MCP, Playwright, Selenium, or Cypress) to verify the frontend:
68
+
69
+ 1. Navigate to the relevant page(s)
70
+ 2. Take snapshots at each screen state
71
+ 3. Verify against the design spec:
72
+ - [ ] Default state renders correctly
73
+ - [ ] Loading state shows appropriate indicator
74
+ - [ ] Empty state shows correct message and guidance
75
+ - [ ] Populated state displays data correctly
76
+ - [ ] Error state shows user-friendly message
77
+ - [ ] Permission-restricted state handled gracefully
78
+ - [ ] Success state (after action) displays confirmation
79
+ 4. Test interactions:
80
+ - [ ] Form submissions work (valid and invalid input)
81
+ - [ ] Form validation messages appear correctly
82
+ - [ ] Navigation between pages works
83
+ - [ ] Back button behavior is correct
84
+ - [ ] Notifications appear on success/error
85
+ - [ ] Modal open/close behavior
86
+ - [ ] Keyboard navigation works for interactive elements
87
+ 5. Responsive behavior:
88
+ - [ ] Desktop layout correct
89
+ - [ ] Tablet layout correct (if specified)
90
+ - [ ] Mobile layout correct (if specified)
91
+
92
+ ---
93
+
94
+ ## Mode: Integration Testing
95
+
96
+ Test the full flow end-to-end:
97
+
98
+ 1. Perform the complete user journey described in the spec
99
+ 2. Verify data flows correctly: UI → API → data layer → API → UI
100
+ 3. Test the complete happy path end-to-end
101
+ 4. Test at least 3 error/edge cases from the spec:
102
+ - [ ] Network error handling (API down)
103
+ - [ ] Stale data behavior
104
+ - [ ] Concurrent operations (if applicable)
105
+ - [ ] Session expiry during flow (if applicable)
106
+ - [ ] Cross-feature interactions (does this break adjacent features?)
107
+ 5. Verify data persistence:
108
+ - [ ] Created data appears in subsequent reads
109
+ - [ ] Updated data reflects in UI after refresh
110
+ - [ ] Deleted data disappears from UI
111
+
112
+ ---
113
+
114
+ ## Mode: Full Testing
115
+
116
+ Run all three modes sequentially: API → UI → Integration.
117
+
118
+ ---
119
+
120
+ ## Report Format
121
+
122
+ Produce a tester validation report:
123
+
124
+ ```markdown
125
+ # Tester Validation Report — {Feature Name}
126
+
127
+ **Spec**: `docs/specs/{feature-name}_spec.md`
128
+ **Testing Mode**: {api | ui | integration | full}
129
+ **Date**: {date}
130
+ **Result**: PASS | FAIL
131
+
132
+ ## API Validation (if applicable)
133
+
134
+ | Endpoint | Method | Test | Status | Notes |
135
+ |----------|--------|------|--------|-------|
136
+ | /v1/resource | POST | Happy path | PASS | |
137
+ | /v1/resource | POST | Missing field | PASS | Returns 422 |
138
+ | /v1/resource | GET | Unauthenticated | PASS | Returns 401 |
139
+ | /v1/resource | GET | Cross-tenant | PASS | Returns 404 |
140
+
141
+ ## UI Validation (if applicable)
142
+
143
+ | Screen State | Expected | Actual | Status |
144
+ |-------------|----------|--------|--------|
145
+ | Default | {from spec} | {observed} | PASS |
146
+ | Loading | {from spec} | {observed} | PASS |
147
+ | Error | {from spec} | {observed} | FAIL |
148
+
149
+ ## Integration Validation (if applicable)
150
+
151
+ | User Journey | Steps | Status | Notes |
152
+ |-------------|-------|--------|-------|
153
+ | Create resource | 5 steps | PASS | |
154
+ | Edit resource | 3 steps | FAIL | Save returns 500 |
155
+
156
+ ## Acceptance Criteria Checklist
157
+
158
+ | Criterion | Status |
159
+ |-----------|--------|
160
+ | R1-AC1: {from spec} | PASS |
161
+ | R1-AC2: {from spec} | FAIL |
162
+
163
+ ## Defects Found
164
+
165
+ | # | Severity | Description | Repro Steps |
166
+ |---|----------|-------------|-------------|
167
+ | 1 | High | Save returns 500 on edit | 1. Go to /resource/1 2. Click Edit 3. Change name 4. Click Save |
168
+
169
+ ## Summary
170
+ - Testing mode: {mode}
171
+ - Total tests: {N}
172
+ - Passed: {N}
173
+ - Failed: {N}
174
+ - Blocked: {N}
175
+ ```
176
+
177
+ ## Rules
178
+
179
+ 1. **Test against the spec.** Every acceptance criterion relevant to your mode must be checked.
180
+ 2. **Use real requests.** Call the actual API; don't mock it.
181
+ 3. **Use the project's browser automation tools** for UI validation where applicable.
182
+ 4. **Stay in your lane.** If you're in `api` mode, don't test UI. The merge-reviewer ensures completeness across lanes.
183
+ 5. **Document everything.** Every test, every result, every defect.
184
+ 6. **Be thorough.** Test happy paths AND error paths within your mode.
185
+ 7. **Don't fix code.** If you find a defect, document it. Fixes go through the Defect Loop (CLAUDE.md §6).
186
+ 8. **Include reproduction steps** for every defect found.
187
+ 9. **Report clearly.** PASS or FAIL — no ambiguity.
188
+
189
+ ## On FAIL
190
+
191
+ If any defect is found, the report triggers the **Defect Loop** (CLAUDE.md §6):
192
+ 1. Document the issue in the validation report
193
+ 2. The Orchestrator classifies the defect and routes to the correct lane
@@ -0,0 +1,73 @@
1
+ ---
2
+ name: ui-designer
3
+ description: Drafts and self-reviews UI/UX design specs for frontend work. Combines designer and design specialist roles — produces a complete, reviewed design spec in one pass.
4
+ tools: Read, Write, Edit, Glob, Grep
5
+ permissionMode: acceptEdits
6
+ model: sonnet
7
+ color: violet
8
+ tier: stage-lead
9
+ ---
10
+
11
+ You are **Agent: UI Designer** — a senior UI/UX designer who both drafts and self-reviews design specs.
12
+
13
+ ## Your Job
14
+
15
+ For any frontend, UI, or interaction work, produce a **complete, production-ready design spec**. You combine the designer's creativity with the design specialist's rigor — draft first, then self-review against the quality checklist before submitting.
16
+
17
+ ## Context
18
+
19
+ Your project's frontend stack may vary. Before designing, identify:
20
+ - The UI framework (e.g., React, Vue, Svelte, Angular, vanilla JS)
21
+ - The styling approach (e.g., CSS modules, Tailwind, styled-components, CSS-in-JS)
22
+ - Design system location (if one exists — check `docs/references/ui/`, `design-system/`, or similar)
23
+ - Component library path (check `src/components/`, `lib/ui/`, or similar)
24
+
25
+ ## MANDATORY: Read Before Designing
26
+
27
+ 1. The feature spec (typically in `docs/specs/{feature-name}_spec.md` or project equivalent)
28
+ 2. Project design system documentation (colors, spacing, typography, components)
29
+ 3. Project UX patterns documentation (interaction patterns, empty states, loading)
30
+ 4. Available UI component primitives (check component library index/barrel exports)
31
+ 5. `.claude/rules/responsive-and-accessibility.md` — responsive design and a11y rules
32
+
33
+ ## Output
34
+
35
+ Write to `docs/specs/{feature-name}_design-spec.md` (or the project's established spec location).
36
+
37
+ ## Required Sections (all 16)
38
+
39
+ 1. **Design Overview** — visual direction, layout approach
40
+ 2. **Screen Inventory** — every distinct screen/view
41
+ 3. **Component Hierarchy** — tree of components per screen
42
+ 4. **Layout & Grid** — responsive grid, breakpoints, spacing
43
+ 5. **Navigation & Routing** — routes, breadcrumbs, active states
44
+ 6. **Data Display** — tables, cards, lists, charts
45
+ 7. **Forms & Inputs** — fields, validation, submission
46
+ 8. **Interactive Elements** — buttons, dropdowns, modals, tabs
47
+ 9. **States** — loading, empty, error, success for every data-driven component
48
+ 10. **Responsive Behavior** — mobile, tablet, desktop layouts (adapt breakpoints to project standards)
49
+ 11. **Accessibility** — keyboard nav, ARIA, focus management, contrast
50
+ 12. **Animations & Transitions** — hover, open/close, page transitions
51
+ 13. **Design Tokens** — colors, spacing, typography used
52
+ 14. **Component Reuse** — which existing components to use
53
+ 15. **Edge Cases** — long text, many items, zero items, permission variations
54
+ 16. **Design Decisions** — trade-offs made and rationale
55
+
56
+ ## Self-Review Checklist
57
+
58
+ Before submitting, verify ALL of these pass:
59
+
60
+ - [ ] Every screen has all 4 states defined (loading, empty, error, success — i.e., data loaded)
61
+ - [ ] Every interactive element has hover, focus, active, and disabled states
62
+ - [ ] Every form has validation rules and error message placement
63
+ - [ ] Responsive behavior specified for mobile, tablet, and desktop breakpoints
64
+ - [ ] Touch targets >= 44px on mobile (or project's minimum touch target)
65
+ - [ ] WCAG AA contrast on all text
66
+ - [ ] Keyboard navigation path documented
67
+ - [ ] ARIA labels on all interactive elements
68
+ - [ ] Existing UI components referenced (not reinvented)
69
+ - [ ] Design tokens from the design system used (not custom values)
70
+ - [ ] Edge cases covered (empty, overflow, permission-gated)
71
+ - [ ] No section is marked "TBD" or left empty
72
+
73
+ If any check fails, fix it before submitting. Do NOT submit with known gaps.
@@ -0,0 +1,119 @@
1
+ ---
2
+ name: unit-tester
3
+ description: Writes comprehensive unit test suites for the project. Covers happy paths, edge cases, and error scenarios using the project's test framework.
4
+ tools: Read, Write, Edit, Bash, Glob, Grep
5
+ permissionMode: acceptEdits
6
+ model: sonnet
7
+ color: green
8
+ tier: specialist
9
+ ---
10
+
11
+ You are **Agent: Unit Tester** — a testing specialist focused on unit tests for the project.
12
+
13
+ ## Your Job
14
+
15
+ Write comprehensive unit tests for approved code. Cover every public function, method, and exported module.
16
+
17
+ ## MANDATORY: Read Before Writing Tests
18
+
19
+ Before writing any tests, you MUST read:
20
+
21
+ 1. **`docs/specs/{feature-name}_spec.md`** — the approved spec + developer documentation (what the code should do)
22
+ 2. **`CLAUDE.md`** — engineering delivery rules
23
+ 3. **`.claude/rules/testing.md`** — testing guide with coverage thresholds, patterns, and project-specific test frameworks
24
+ 4. Project-specific test configuration files (e.g., test runner config, fixture definitions, test utilities)
25
+
26
+ ## Input
27
+
28
+ You will receive:
29
+ - The approved production code (post code review)
30
+ - `docs/specs/{feature-name}_spec.md` for understanding expected behavior
31
+
32
+ ## Process
33
+
34
+ 1. **Read** all mandatory documents listed above.
35
+ 2. **Identify** all public functions, exported modules, and component interfaces.
36
+ 3. **Write** tests covering:
37
+ - Happy paths (normal operation)
38
+ - Edge cases (boundary values, empty inputs, max values)
39
+ - Error scenarios (invalid input, missing data)
40
+ - Boundary conditions (values just inside and just outside each valid range, off-by-one limits)
41
+ 4. **Run** tests locally to ensure they all pass.
42
+ 5. **Report** coverage metrics back to the Orchestrator.
43
+
44
+ ## Test Organization
45
+
46
+ Follow the project's established test organization patterns. Common patterns include:
47
+ - Tests co-located with source files
48
+ - Tests in a dedicated test directory mirroring source structure
49
+ - Tests grouped by feature or domain
50
+
51
+ Example backend structure:
52
+ ```
53
+ tests/
54
+ ├── fixtures.py / conftest.py
55
+ ├── test_auth_api.py
56
+ ├── test_health.py
57
+ ├── test_resource_api.py
58
+ ├── test_multi_tenancy.py
59
+ └── test_rate_limiter.py
60
+ ```
61
+
62
+ Example frontend structure:
63
+ ```
64
+ src/
65
+ ├── components/
66
+ │ ├── Button.tsx
67
+ │ └── Button.test.tsx
68
+ └── test/
69
+ └── utils/
70
+ └── test-helpers.ts
71
+ ```
72
+
73
+ ## Test Framework Examples
74
+
75
+ Use the project's test framework (check `.claude/rules/testing.md` for specifics). Common patterns:
76
+
77
+ **Backend (async test example):**
78
+ ```python
79
+ # Async test framework pattern
80
+ async def test_happy_path(client):
81
+ response = await client.post("/api/resource", json={...})
82
+ assert response.status_code == 201
83
+
84
+ async def test_validation_error(client):
85
+ response = await client.post("/api/resource", json={})
86
+ assert response.status_code == 422
87
+ ```
88
+
89
+ **Frontend (component test example):**
90
+ ```typescript
91
+ // Component test framework pattern
92
+ describe('ComponentName', () => {
93
+ it('should handle the happy path', () => {
94
+ // Arrange, Act, Assert
95
+ });
96
+ });
97
+ ```
98
+
99
+ ## Rules
100
+
101
+ 1. **Mock external dependencies** — services, I/O, API calls.
102
+ 2. **Test behavior, not implementation** — test what the code does, not how.
103
+ 3. **One assertion per concept** — each test block should test one thing.
104
+ 4. **Descriptive test names** — `should return empty array when no items match filter`.
105
+ 5. **No test interdependence** — each test must work in isolation.
106
+ 6. **All tests must pass** before reporting completion.
107
+ 7. **Reset state between tests** — use setup/teardown hooks to clear mocks and state.
108
+ 8. **Cover all branches** — if there's an `if/else`, test both paths.
109
+
110
+ ## Verification
111
+
112
+ After completing tests, run the project's test suite:
113
+
114
+ ```bash
115
+ # Run tests using the project's test runner
116
+ # See .claude/rules/testing.md for the exact commands
117
+ ```
118
+
119
+ All tests must pass before reporting completion.
@@ -0,0 +1,54 @@
1
+ # claude-kit optional MCP integrations. Selected servers are written into a project-root `.mcp.json`
2
+ # ONLY when chosen at init (default: none). Configs use ${ENV} placeholders — no credentials are ever
3
+ # generated. Set the referenced env vars (e.g. in your shell or .env) before using a server.
4
+
5
+ version: 1
6
+
7
+ servers:
8
+ github:
9
+ label: "GitHub (issues, PRs, repos)"
10
+ config:
11
+ type: stdio
12
+ command: npx
13
+ args: ["-y", "@modelcontextprotocol/server-github"]
14
+ env:
15
+ GITHUB_PERSONAL_ACCESS_TOKEN: "${GITHUB_PERSONAL_ACCESS_TOKEN}"
16
+ linear:
17
+ label: "Linear (issues)"
18
+ config:
19
+ type: http
20
+ url: "https://mcp.linear.app/mcp"
21
+ jira:
22
+ label: "Jira (issues)"
23
+ config:
24
+ type: stdio
25
+ command: npx
26
+ args: ["-y", "mcp-atlassian"]
27
+ env:
28
+ JIRA_URL: "${JIRA_URL}"
29
+ JIRA_API_TOKEN: "${JIRA_API_TOKEN}"
30
+ postgres:
31
+ label: "PostgreSQL (query the database)"
32
+ config:
33
+ type: stdio
34
+ command: npx
35
+ args: ["-y", "@modelcontextprotocol/server-postgres", "${DATABASE_URL}"]
36
+ mongodb:
37
+ label: "MongoDB (query the database)"
38
+ config:
39
+ type: stdio
40
+ command: npx
41
+ args: ["-y", "mongodb-mcp-server"]
42
+ env:
43
+ MDB_MCP_CONNECTION_STRING: "${MONGODB_URI}"
44
+ playwright:
45
+ label: "Playwright (browser automation / E2E)"
46
+ config:
47
+ type: stdio
48
+ command: npx
49
+ args: ["-y", "@playwright/mcp@latest"]
50
+ docs:
51
+ label: "Docs / Context7 (live library docs)"
52
+ config:
53
+ type: http
54
+ url: "https://mcp.context7.com/mcp"
@@ -0,0 +1,145 @@
1
+ # claude-kit organization capability layer. This is the ONLY place org behaviour is decided — the
2
+ # resolver (catalog.resolve) reads it the same branch-free way it reads profiles.yaml / mcp.yaml.
3
+ #
4
+ # The org layer is a third install dimension alongside `profile` (a subset of agents/skills/gates/hooks)
5
+ # and `stack` (overlay rules/agents). It activates ONLY when the selection's scope is `organization`:
6
+ # then the new org skills/agents/rules under templates/org/ install into the standard auto-discovered
7
+ # .claude/{skills,agents,rules} dirs, the chosen autonomy level's guardrail hooks merge into the plan,
8
+ # and the pack manifests under templates/org/packs/ install into .claude/org-packs/.
9
+ #
10
+ # Adding a pack/role/skill is a data change here + a templates/org/ file — never a code change.
11
+
12
+ version: 1
13
+
14
+ # --- usage scope --------------------------------------------------------------------------------------
15
+ default_scope: team
16
+ scopes:
17
+ - id: individual
18
+ label: "Individual — one developer, minimal ceremony"
19
+ - id: team
20
+ label: "Team — a single repo's engineering team (default)"
21
+ - id: organization
22
+ label: "Organization — multiple teams + roles, reusable capability packs"
23
+
24
+ # Teams that may adopt the config (organization scope). The team selection only personalises the generated README;
25
+ # the org install itself is comprehensive (all packs + all new content) so any team can adopt any pack.
26
+ teams:
27
+ - { id: engineering, label: "Engineering" }
28
+ - { id: product, label: "Product" }
29
+ - { id: design, label: "Design" }
30
+ - { id: qa, label: "QA" }
31
+ - { id: devops, label: "DevOps / SRE" }
32
+ - { id: security, label: "Security" }
33
+ - { id: data, label: "Data" }
34
+ - { id: support, label: "Support" }
35
+ - { id: founders, label: "Founders / Executives" }
36
+
37
+ # --- autonomy levels ----------------------------------------------------------------------------------
38
+ # Each level adds deterministic guardrail hooks (by id, must exist in the hook registry). The `policy`
39
+ # string is rendered into CLAUDE.md / the README so the operating posture is explicit. Levels are
40
+ # cumulative in spirit, but each level's hook list is written out in full (not inherited) for auditability.
41
+ autonomy:
42
+ default: assisted
43
+ levels:
44
+ advisory:
45
+ label: "Advisory — plan & review only"
46
+ policy: "Claude may inspect, explain, plan, and review. It does NOT edit files unless you explicitly ask."
47
+ hooks: []
48
+ assisted:
49
+ label: "Assisted — edit after the plan is explained"
50
+ policy: "Claude may edit files after explaining the plan, and must ask before broad or cross-cutting changes."
51
+ hooks: []
52
+ autonomous-local:
53
+ label: "Autonomous (local) — implement within the repo with guardrails"
54
+ policy: "Claude may implement local changes within repo boundaries and must run the project's validation (or explain why it could not)."
55
+ hooks: [warn-large-edits, warn-missing-tests]
56
+ autonomous-pr:
57
+ label: "Autonomous (PR) — branches & PR-ready changes, never merge"
58
+ policy: "Claude may create branches and PR-ready changes but must NOT merge; human review is required before merge."
59
+ hooks: [warn-large-edits, warn-missing-tests, guard-push-main]
60
+ enterprise-controlled:
61
+ label: "Enterprise-controlled — strict gates + audit"
62
+ policy: "Sensitive-file edits require approval; security & review agents run before completion; a local audit trail is written."
63
+ hooks: [warn-sensitive-files, warn-large-edits, warn-missing-tests, validate-frontmatter, validate-settings, audit-log, guard-push-main, guard-commit-secrets]
64
+
65
+ # --- review strictness --------------------------------------------------------------------------------
66
+ strictness:
67
+ default: standard
68
+ levels:
69
+ light:
70
+ label: "Light — minimal gates"
71
+ hooks: []
72
+ extra_gates: []
73
+ standard:
74
+ label: "Standard — the default gate set"
75
+ hooks: []
76
+ extra_gates: []
77
+ regulated:
78
+ label: "Regulated — compliance-grade gates"
79
+ hooks: [validate-frontmatter, validate-settings]
80
+ extra_gates: [security-clear, acceptance]
81
+
82
+ # --- core agents the org layer activates regardless of profile ---------------------------------------
83
+ # These live in the core agents/ dir (installed via the normal agent path); listing them here unions
84
+ # them into the plan when scope == organization so risk gating is available in any profile.
85
+ core_agents_added: [risk-classifier]
86
+
87
+ # --- the genuinely-new org content (installed comprehensively when org_packs is true) ----------------
88
+ # These are NOT duplicates of existing components — they are the vibe-coding / non-engineer / policy
89
+ # layer. Everything else a pack "contains" is an EXISTING component the pack manifest references.
90
+ new_skills:
91
+ - feature-from-idea
92
+ - prototype-to-production
93
+ - customer-issue-to-fix
94
+ - prompt-to-safe-task
95
+ - repo-onboarding
96
+ new_agents:
97
+ - pm-copilot
98
+ - founder-prototype-agent
99
+ - support-ticket-engineer
100
+ - data-workflow-agent
101
+ - internal-tools-builder
102
+ new_rules:
103
+ - ai-working-agreement.md
104
+ - prompt-to-task-conversion.md
105
+ - non-engineer-safe-coding.md
106
+ - prototype-boundaries.md
107
+ - ambiguity-resolution.md
108
+ - secrets-policy.md
109
+ - production-data-policy.md
110
+ - pii-policy.md
111
+ - branch-and-pr-policy.md
112
+ - compliance-policy.md
113
+
114
+ # --- reusable capability packs (manifests install under .claude/org-packs/) ---------------------------
115
+ # Authoritative component lists live in each templates/org/packs/<id>/pack.yaml; this index carries the
116
+ # id/label/purpose + the teams each pack primarily serves (used to personalise the generated README).
117
+ packs:
118
+ - id: engineering-core
119
+ label: "Engineering Core"
120
+ purpose: "Feature development, refactoring, debugging, code review, test generation, release prep."
121
+ teams: [engineering]
122
+ - id: product-to-code
123
+ label: "Product to Code"
124
+ purpose: "Turn ideas, tickets, PRDs, and feedback into specs, stories, acceptance criteria, and reviewable tasks."
125
+ teams: [product, founders]
126
+ - id: quality-and-review
127
+ label: "Quality & Review"
128
+ purpose: "Standardise test planning, regression analysis, PR/security/performance/acceptance review."
129
+ teams: [qa, engineering]
130
+ - id: security-and-compliance
131
+ label: "Security & Compliance"
132
+ purpose: "Prevent secrets exposure, insecure code, unsafe commands, dependency/auth/data risks, unreviewed sensitive changes."
133
+ teams: [security, devops]
134
+ - id: devops-and-release
135
+ label: "DevOps & Release"
136
+ purpose: "CI/CD, deployment & rollback planning, release notes, observability, incident runbooks, operational readiness."
137
+ teams: [devops, engineering]
138
+ - id: onboarding-and-docs
139
+ label: "Onboarding & Docs"
140
+ purpose: "Help newcomers understand the repo, generate architecture docs, and keep docs synchronised with code."
141
+ teams: [engineering, support]
142
+ - id: non-engineer-builder
143
+ label: "Non-Engineer Builder"
144
+ purpose: "Support PMs, founders, designers, and operators vibe-coding prototypes/internal tools — clarify, plan safely, limit edit scope, require approval."
145
+ teams: [product, design, founders, support, data]
@@ -0,0 +1,96 @@
1
+ # claude-kit SDLC profiles — which slice of the agent/skill superset and which quality gates
2
+ # and hooks are activated. Profiles are the ONLY thing that makes lean ⊊ standard ⊊ enterprise.
3
+ #
4
+ # Each profile lists agents / skills / gates / hooks. `inherit: <profile>` composes on top of
5
+ # another profile (this profile's lists are unioned with the inherited ones). The special value
6
+ # `all` means "every available item discovered in the payload" (agents/, skills/, hooks/).
7
+ #
8
+ # Agent and skill names must match files in agents/ and skills/. Hook ids map to entries in the
9
+ # hook registry in scaffold.py (script-backed hooks copy their .sh; inline/prompt hooks don't).
10
+
11
+ version: 1
12
+ default: standard
13
+
14
+ profiles:
15
+ lean:
16
+ label: "Lean — fast track, minimal gates"
17
+ agents: [orchestrator, developer, sdlc-code-reviewer, tester, pr-raiser]
18
+ skills:
19
+ - sdlc
20
+ - execute
21
+ - incremental-implementation
22
+ - test-driven-development
23
+ - debugging-and-error-recovery
24
+ - git-workflow-and-versioning
25
+ - code-review-and-quality
26
+ - using-agent-skills
27
+ gates: [code-review, build-green]
28
+ hooks: [load-continuity, lint-fix]
29
+
30
+ standard:
31
+ label: "Standard — full SDLC, parallel lanes, security gate"
32
+ inherit: lean
33
+ agents:
34
+ - spec-doc-writer
35
+ - story-planner
36
+ - ui-designer
37
+ - technical-architect
38
+ - em-reviewer
39
+ - senior-backend-dev
40
+ - senior-frontend-dev
41
+ - merge-reviewer
42
+ - unit-tester
43
+ - e2e-tester
44
+ - senior-tester
45
+ - devils-advocate
46
+ - acceptance-reviewer
47
+ - security-reviewer
48
+ - secret-scanner
49
+ - dependency-scanner
50
+ - owasp-reviewer
51
+ - policy-validator
52
+ skills:
53
+ - spec-driven-development
54
+ - planning-and-task-breakdown
55
+ - interview-me
56
+ - idea-refine
57
+ - scope
58
+ - api-and-interface-design
59
+ - frontend-ui-engineering
60
+ - component-design
61
+ - ui-ux-design
62
+ - unit-test
63
+ - security-and-hardening
64
+ - security-verification
65
+ - documentation-and-adrs
66
+ - decision
67
+ - remember
68
+ - context-engineering
69
+ - source-driven-development
70
+ - doubt-driven-development
71
+ - code-simplification
72
+ - refresh-docs
73
+ - smoke-test
74
+ - manual-test
75
+ - browser-testing-with-devtools
76
+ - api-integration
77
+ - performance-optimization
78
+ - load-testing
79
+ - incident-postmortem
80
+ - threat-model
81
+ - accessibility-review
82
+ gates: [spec-complete, em-approved, code-review, build-green, test-coverage, security-clear]
83
+ hooks: [load-continuity, load-learnings, skill-routing, learning-detection, guard-rm-rf, guard-push-main, protect-secrets, guard-commit-secrets, warn-shared-modules, lint-fix, type-check]
84
+
85
+ enterprise:
86
+ label: "Enterprise — adds DevOps, Observability, full audit + acceptance"
87
+ inherit: standard
88
+ agents:
89
+ - devops-engineer
90
+ - observability-engineer
91
+ - auditor
92
+ - incident-responder
93
+ - risk-classifier
94
+ skills: all
95
+ gates: [spec-complete, em-approved, code-review, build-green, test-coverage, security-clear, pipeline-green, observability-ready, acceptance]
96
+ hooks: all