@starlein/paperclip-plugin-company-wizard 0.3.18 → 0.3.20

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (48) hide show
  1. package/LICENSE +5 -1
  2. package/README.md +21 -5
  3. package/dist/manifest.js +7 -2
  4. package/dist/manifest.js.map +2 -2
  5. package/dist/ui/index.css +1 -1
  6. package/dist/ui/index.css.map +2 -2
  7. package/dist/ui/index.js +2 -2
  8. package/dist/ui/index.js.map +1 -1
  9. package/dist/worker.js +48 -7
  10. package/dist/worker.js.map +2 -2
  11. package/package.json +17 -16
  12. package/templates/ai-wizard/interview-system.md +1 -1
  13. package/templates/ai-wizard/single-shot-system.md +1 -1
  14. package/templates/modules/accessibility/skills/accessibility-audit.bar.md +11 -0
  15. package/templates/modules/architecture-plan/agents/ui-designer/skills/design-system.bar.md +11 -0
  16. package/templates/modules/architecture-plan/docs/architecture-template.md +1 -1
  17. package/templates/modules/architecture-plan/docs/design-system-template.md +1 -1
  18. package/templates/modules/architecture-plan/skills/architecture-plan.bar.md +11 -0
  19. package/templates/modules/backlog/skills/backlog-health.bar.md +11 -0
  20. package/templates/modules/brand-identity/docs/brand-identity-template.md +1 -1
  21. package/templates/modules/brand-identity/skills/brand-identity.bar.md +11 -0
  22. package/templates/modules/build-api/skills/api-design.bar.md +11 -0
  23. package/templates/modules/ci-cd/skills/ci-cd.bar.md +11 -0
  24. package/templates/modules/codebase-onboarding/skills/codebase-audit.bar.md +11 -0
  25. package/templates/modules/market-analysis/docs/market-analysis-template.md +1 -1
  26. package/templates/modules/market-analysis/skills/market-analysis.bar.md +11 -0
  27. package/templates/modules/monitoring/skills/monitoring.bar.md +11 -0
  28. package/templates/modules/security-audit/skills/security-review.bar.md +11 -0
  29. package/templates/modules/security-audit/skills/threat-model.bar.md +11 -0
  30. package/templates/modules/tech-stack/docs/tech-stack-template.md +1 -1
  31. package/templates/modules/tech-stack/skills/tech-stack.bar.md +11 -0
  32. package/templates/modules/user-testing/docs/user-testing-template.md +1 -1
  33. package/templates/modules/user-testing/skills/user-testing.bar.md +11 -0
  34. package/templates/modules/vision-workshop/docs/vision-template.md +1 -1
  35. package/templates/roles/code-reviewer/DONE.md +10 -0
  36. package/templates/roles/code-reviewer/LENSES.md +11 -0
  37. package/templates/roles/devops/DONE.md +10 -0
  38. package/templates/roles/devops/LENSES.md +12 -0
  39. package/templates/roles/engineer/DONE.md +10 -0
  40. package/templates/roles/product-owner/DONE.md +10 -0
  41. package/templates/roles/product-owner/LENSES.md +11 -0
  42. package/templates/roles/qa/DONE.md +10 -0
  43. package/templates/roles/security-engineer/DONE.md +10 -0
  44. package/templates/roles/security-engineer/LENSES.md +16 -0
  45. package/templates/roles/ui-designer/DONE.md +10 -0
  46. package/templates/roles/ui-designer/LENSES.md +13 -0
  47. package/templates/roles/ux-researcher/DONE.md +10 -0
  48. package/templates/roles/ux-researcher/LENSES.md +14 -0
package/package.json CHANGED
@@ -1,22 +1,9 @@
1
1
  {
2
2
  "name": "@starlein/paperclip-plugin-company-wizard",
3
- "version": "0.3.18",
3
+ "version": "0.3.20",
4
4
  "type": "module",
5
5
  "description": "AI-powered wizard to bootstrap paperclip agent companies from composable templates (for latest paperclip version)",
6
6
  "repository": "https://github.com/starlein/paperclip-plugin-company-wizard",
7
- "scripts": {
8
- "build": "node ./esbuild.config.mjs",
9
- "build:rollup": "rollup -c",
10
- "dev": "node ./esbuild.config.mjs --watch",
11
- "dev:ui": "paperclip-plugin-dev-server --root . --ui-dir dist/ui --port 4177",
12
- "test": "vitest run --config ./vitest.config.ts",
13
- "test:logic": "node --test src/logic/*.test.js src/api/*.test.js",
14
- "typecheck": "tsc --noEmit",
15
- "build:prod": "NODE_ENV=production node ./esbuild.config.mjs",
16
- "publish:npm": "npm publish --access public",
17
- "prepublishOnly": "pnpm build:prod",
18
- "prepare": "husky"
19
- },
20
7
  "publishConfig": {
21
8
  "access": "public",
22
9
  "registry": "https://registry.npmjs.org/"
@@ -40,7 +27,10 @@
40
27
  "plugin",
41
28
  "workspace"
42
29
  ],
43
- "author": "@lx-0 <https://github.com/lx-0>",
30
+ "author": "Sascha Pietrowski <sp@speednetwork.de>",
31
+ "contributors": [
32
+ "Yesterday AI (original @yesterday-ai/paperclip-plugin-company-wizard — template system, assembly logic, API client)"
33
+ ],
44
34
  "license": "MIT",
45
35
  "dependencies": {
46
36
  "class-variance-authority": "^0.7.1",
@@ -74,5 +64,16 @@
74
64
  "@paperclipai/shared": ">=2026.529.0",
75
65
  "react": ">=18",
76
66
  "react-dom": ">=18"
67
+ },
68
+ "scripts": {
69
+ "build": "node ./esbuild.config.mjs",
70
+ "build:rollup": "rollup -c",
71
+ "dev": "node ./esbuild.config.mjs --watch",
72
+ "dev:ui": "paperclip-plugin-dev-server --root . --ui-dir dist/ui --port 4177",
73
+ "test": "vitest run --config ./vitest.config.ts",
74
+ "test:logic": "node --test src/logic/*.test.js src/api/*.test.js",
75
+ "typecheck": "tsc --noEmit",
76
+ "build:prod": "NODE_ENV=production node ./esbuild.config.mjs",
77
+ "publish:npm": "npm publish --access public"
77
78
  }
78
- }
79
+ }
@@ -1,4 +1,4 @@
1
- You are the Clipper AI Wizard — an expert at assembling AI agent teams. You're enthusiastic but concise. Clipper bootstraps AI-agent company workspaces from composable templates.
1
+ You are the Company Wizard — an expert at assembling AI agent teams. You're enthusiastic but concise. Company Wizard bootstraps AI-agent company workspaces from composable templates.
2
2
 
3
3
  You are conducting a guided interview to understand what company to set up.
4
4
 
@@ -1,4 +1,4 @@
1
- You are the Clipper AI Wizard. Clipper bootstraps AI-agent company workspaces from composable templates.
1
+ You are the Company Wizard. Company Wizard bootstraps AI-agent company workspaces from composable templates.
2
2
 
3
3
  Given a natural language description of what the user wants to build, you select the best configuration.
4
4
 
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good accessibility audit:
4
+
5
+ - A `docs/ACCESSIBILITY-AUDIT.md` covering WCAG 2.2 AA across: semantic HTML, keyboard navigation, colour contrast, ARIA usage, images/media, forms, and zoom/responsive behaviour.
6
+ - Each finding has a severity (Critical / Major / Minor), a specific location, and a concrete remediation — Critical and Major findings have follow-up issues created.
7
+
8
+ Not done:
9
+
10
+ - A scan dump with no remediation priorities — a raw list of automated-tool violations with no severity ranking and no recommended fixes is not done.
11
+ - An audit that only runs an automated checker without testing keyboard-only navigation or verifying focus indicators manually.
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good design system deliverable:
4
+
5
+ - Defines reusable tokens (spacing, colour, type, radius) and the components built from them, with usage rules and do/don't examples.
6
+ - States how engineers consume it (where tokens live, naming, theming) so implementation matches the spec without guesswork.
7
+
8
+ Not done:
9
+
10
+ - Tokens with no usage guidance, or one-off values that bypass the scale.
11
+ - A component gallery with no states (hover, focus, disabled, error) defined.
@@ -35,4 +35,4 @@ _APIs between components._
35
35
  | _..._ | _..._ | _..._ |
36
36
 
37
37
  ---
38
- _Generated by Clipper. Fill in during architecture-plan task._
38
+ _Generated by Company Wizard. Fill in during architecture-plan task._
@@ -58,4 +58,4 @@ _Logo usage, iconography, visual tone_
58
58
  | desktop | _1024px_ | _..._ |
59
59
 
60
60
  ---
61
- _Generated by Clipper. Fill in during design-system task._
61
+ _Generated by Company Wizard. Fill in during design-system task._
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good architecture plan:
4
+
5
+ - A `docs/ARCHITECTURE.md` with a system overview (text/ASCII component diagram), data flow through the system, API boundaries (internal and external), deployment model, and key decisions recorded in ADR style with rationale.
6
+ - Decomposed into concrete implementation issues for foundational scaffolding so work can start incrementally.
7
+
8
+ Not done:
9
+
10
+ - A diagram with no data flow or failure modes — components drawn without explaining how data moves or what happens when a dependency is unavailable.
11
+ - Decisions recorded without rationale — "we use a monorepo" with no explanation of why that fits the requirements.
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good backlog health pass:
4
+
5
+ - Every issue created is INVEST-shaped: has a clear title, written acceptance criteria in the description, a priority, a label, and is attached to the correct `projectId` and `goalId` — never a top-level issue with `projectId: null`.
6
+ - The backlog maintains at least 3 unassigned, ready-to-work issues; if the queue drops below that threshold, new ones are created from the roadmap and the action is recorded in daily notes.
7
+
8
+ Not done:
9
+
10
+ - Issues that are not INVEST-shaped — a title with no acceptance criteria, no label, or no project link is not done.
11
+ - Creating duplicate issues without first checking existing open issues, or creating more issues when the goal is already fully decomposed.
@@ -40,4 +40,4 @@ _Communication style, vocabulary preferences, and brand personality traits._
40
40
  _Examples of on-brand vs. off-brand language._
41
41
 
42
42
  ---
43
- _Generated by Clipper. Fill in during brand-identity task._
43
+ _Generated by Company Wizard. Fill in during brand-identity task._
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good brand identity:
4
+
5
+ - A `docs/BRAND-IDENTITY.md` with concrete values and rationale for every element: colour palette (hex/RGB values with contrast ratios), typography (typefaces, size scale, weight usage), logo usage rules (clear space, do's and don'ts), iconography style, and tone of voice.
6
+ - If a tech stack exists, a design tokens file (CSS custom properties or JSON) matching the chosen stack, so the identity is immediately usable in code.
7
+
8
+ Not done:
9
+
10
+ - A palette with no usage rules — listing hex colours without specifying which is primary, when to use each, or whether they meet WCAG AA contrast is not done.
11
+ - Brand choices without rationale — "we picked blue" with no connection to the target audience, brand attributes, or existing constraints.
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good API design:
4
+
5
+ - A `docs/API-DESIGN.md` with a resource model, full endpoint inventory (method, path, auth requirement), authentication strategy, error-handling conventions (consistent error shape), and pagination approach.
6
+ - Every endpoint has: description, parameter types and constraints, request/response schema, example request/response, and possible error codes — generated from source annotations (OpenAPI/Swagger), not maintained by hand.
7
+
8
+ Not done:
9
+
10
+ - Endpoints with no auth or error contract — a list of URLs with no mention of who can call them or what error codes they return is not done.
11
+ - A design that skips input validation at the boundary or uses a different error shape per endpoint.
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good CI/CD setup:
4
+
5
+ - A working pipeline with a CI stage (lint → typecheck → test on every PR and push to main) and a CD stage (deploy on merge to main, smoke tests after deployment), documented in `docs/CI-CD.md` with status badges in the README.
6
+ - Pipelines complete in under 5 minutes (dependency caching in place), action versions pinned to full SHAs, and all secrets stored in GitHub Secrets or equivalent — none in workflow files.
7
+
8
+ Not done:
9
+
10
+ - A pipeline with no rollback path — deploying with no documented procedure for reverting a bad release or re-running the previous successful build is not done.
11
+ - A pipeline that breaks main and is not fixed immediately, or one that stores secrets directly in the workflow YAML.
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good codebase audit:
4
+
5
+ - A `docs/CODEBASE-AUDIT.md` with architecture overview (layers, key components, data flow), tech stack summary, tech debt inventory ranked by severity (critical / major / minor), test coverage assessment identifying untested paths, and recommended cleanup priorities.
6
+ - Followed by concrete, scoped follow-up issues — one per fix — for the top cleanup opportunities.
7
+
8
+ Not done:
9
+
10
+ - An audit with no prioritised tech-debt list — noting "there is some debt" without ranking it by severity or impact is not done.
11
+ - An audit that describes the code structure without assessing test coverage or identifying actionable cleanup items.
@@ -29,4 +29,4 @@
29
29
  _Strategic recommendations based on the analysis above._
30
30
 
31
31
  ---
32
- _Generated by Clipper. Fill in during market-analysis task._
32
+ _Generated by Company Wizard. Fill in during market-analysis task._
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good market analysis:
4
+
5
+ - A `docs/MARKET-ANALYSIS.md` that covers: target market (who the users are and what problem is being solved), a competitor breakdown with each player's strengths and weaknesses, a clear positioning statement with a unique value proposition, and identified market/adoption risks.
6
+ - Each insight is evidence-based and tied to a concrete product decision or follow-up action.
7
+
8
+ Not done:
9
+
10
+ - A competitor list with no positioning takeaway — naming five competitors without explaining how the product differentiates or what the strategic response is.
11
+ - Vague assertions ("the market is growing") with no source, no specifics, and no actionable output.
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good monitoring setup:
4
+
5
+ - Health check endpoints (liveness + readiness) for all services, error tracking with full context (request ID, user, stack trace), structured JSON logs with consistent fields (timestamp, level, service, correlation ID), and alert thresholds for key metrics (error rate, latency, uptime), all documented in `docs/MONITORING.md`.
6
+ - Every alert is symptom-based (user impact), actionable, and has a runbook — no alert fires without a documented response.
7
+
8
+ Not done:
9
+
10
+ - Alerts with no runbook — an alert that fires with no documented steps for what to check or how to respond is not done.
11
+ - Unstructured log strings, or alerts that fire on internal metric movement with no corresponding user-visible impact.
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good security review:
4
+
5
+ - A `docs/SECURITY-REVIEW.md` with findings that include: severity (Critical / High / Medium / Low), exact file path and line number, the evidence (code snippet or reproduction step), and a specific recommended fix.
6
+ - A dependency report with CVE details from `npm audit` or equivalent. Critical and High findings have follow-up issues created.
7
+
8
+ Not done:
9
+
10
+ - A finding with no exploit path, blast radius, or concrete fix — "there may be an injection risk here" without a reproduction path, affected data scope, or remediation is not done.
11
+ - A review that flags secrets exposure as anything lower than Critical.
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good threat model:
4
+
5
+ - A `docs/THREAT-MODEL.md` with a system overview that includes components, data flows, and explicit trust boundaries; STRIDE threats against the identified attack surfaces; a risk rating (Likelihood × Impact) for each threat; and mitigations for every Critical and High risk.
6
+ - Critical and High risks have corresponding follow-up issues with specific remediation tasks.
7
+
8
+ Not done:
9
+
10
+ - A threat list with no trust boundaries or blast-radius — threats listed without identifying which components they affect, what data is at risk, or how far an attacker could move laterally.
11
+ - Risk ratings with no mitigations — identifying threats without recommending controls leaves the model unactionable.
@@ -25,4 +25,4 @@ _What was considered and rejected, and why._
25
25
  | _..._ | _..._ | _..._ |
26
26
 
27
27
  ---
28
- _Generated by Clipper. Fill in during tech-stack task._
28
+ _Generated by Company Wizard. Fill in during tech-stack task._
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good tech stack evaluation:
4
+
5
+ - A `docs/TECH-STACK.md` that lists the chosen technology per layer (language, framework, database, infra) with version, the rationale for each choice, and the alternatives that were considered and rejected.
6
+ - Covers at least: team familiarity, ecosystem maturity, performance trade-offs, and cost for each layer.
7
+
8
+ Not done:
9
+
10
+ - A stack pick with no rationale or rejected alternatives — "we'll use Postgres" with nothing else is not done.
11
+ - A decision that ignores team capabilities or requires paid services without creating an approval request.
@@ -34,4 +34,4 @@ _Prioritized recommendations based on findings above._
34
34
  - [ ] _Issue title — severity, linked finding #_
35
35
 
36
36
  ---
37
- _Generated by Clipper. Fill in during user-testing task._
37
+ _Generated by Company Wizard. Fill in during user-testing task._
@@ -0,0 +1,11 @@
1
+ ## Output / review bar
2
+
3
+ A good usability finding:
4
+
5
+ - Names the task, the observation (with a quote or step trace), the severity, and a concrete recommendation.
6
+ - Distinguishes evidence from interpretation, and reproducible issues from one-offs.
7
+
8
+ Not done:
9
+
10
+ - "Users were confused" with no task, no repro, and no severity.
11
+ - A pass/fail with no evidence attached.
@@ -25,4 +25,4 @@ _How the company achieves that vision._
25
25
  - _What the company explicitly does NOT do_
26
26
 
27
27
  ---
28
- _Generated by Clipper. Fill in during vision-workshop task._
28
+ _Generated by Company Wizard. Fill in during vision-workshop task._
@@ -0,0 +1,10 @@
1
+ ## Done criteria
2
+
3
+ Before you mark an issue done, verify the work — do not hand off on faith:
4
+
5
+ - Run the smallest check that proves it: the relevant tests, a screenshot, a query, or a re-read of the spec against the result. State which check you ran.
6
+ - Put the evidence in your final comment: what changed, how you verified it, and any residual risk or follow-up that needs its own ticket.
7
+ - Reassign deliberately on completion — to a reviewer, to your manager, or to `done`. Never leave a finished task silently assigned to yourself.
8
+ - If the success condition was not described, pick a sensible one, state it, and check against it before finishing.
9
+
10
+ You must always update your task with a comment before exiting a heartbeat — even when blocked. If you are blocked, name the blocker, the owner who can unblock it, and your best guess at the fix.
@@ -0,0 +1,11 @@
1
+ ## Domain Lenses
2
+
3
+ Apply these when reviewing a change. Cite them by name in comments.
4
+
5
+ - **Correctness first** — does it do what it claims, including the edge cases the author did not mention?
6
+ - **Blast radius** — what else does this change touch, and what breaks if it is wrong?
7
+ - **Readability & maintainability** — will the next agent understand this in six months without the author present?
8
+ - **Test adequacy** — do the tests actually exercise the new behaviour, or just the happy path? A green suite that tests nothing is not coverage.
9
+ - **Security smell** — untrusted input reaching shells/SQL/eval, secrets in the diff, broadened permissions; flag and route to the security owner.
10
+ - **Smallest diff** — does the change do one thing? Unrelated churn hides bugs and bloats review.
11
+ - **Approve the change, not the person** — findings cite the code and the risk, never the author.
@@ -0,0 +1,10 @@
1
+ ## Done criteria
2
+
3
+ Before you mark an issue done, verify the work — do not hand off on faith:
4
+
5
+ - Run the smallest check that proves it: the relevant tests, a screenshot, a query, or a re-read of the spec against the result. State which check you ran.
6
+ - Put the evidence in your final comment: what changed, how you verified it, and any residual risk or follow-up that needs its own ticket.
7
+ - Reassign deliberately on completion — to a reviewer, to your manager, or to `done`. Never leave a finished task silently assigned to yourself.
8
+ - If the success condition was not described, pick a sensible one, state it, and check against it before finishing.
9
+
10
+ You must always update your task with a comment before exiting a heartbeat — even when blocked. If you are blocked, name the blocker, the owner who can unblock it, and your best guess at the fix.
@@ -0,0 +1,12 @@
1
+ ## Domain Lenses
2
+
3
+ Apply these when building or operating infrastructure. Cite them by name in comments.
4
+
5
+ - **Error budgets** — reliability is a budget, not a goal of zero; spend it deliberately on change velocity.
6
+ - **MTTR over MTBF** — optimise for fast, safe recovery; a fast rollback beats a rare failure.
7
+ - **Rollback path first** — never ship a change you cannot undo; the rollback is part of the change.
8
+ - **Canary vs full deploy** — expose risk to a small slice first; promote on signal, not on hope.
9
+ - **Observability before launch** — if you cannot see it, you cannot operate it; metrics, logs, and alerts ship with the feature.
10
+ - **Infrastructure as code** — every change is reviewable and versioned; no click-ops in production.
11
+ - **Least-privilege IAM** — no wildcards in production policies; scope and rotate credentials.
12
+ - **Idempotency** — pipelines and scripts must be safe to re-run; partial runs must not corrupt state.
@@ -0,0 +1,10 @@
1
+ ## Done criteria
2
+
3
+ Before you mark an issue done, verify the work — do not hand off on faith:
4
+
5
+ - Run the smallest check that proves it: the relevant tests, a screenshot, a query, or a re-read of the spec against the result. State which check you ran.
6
+ - Put the evidence in your final comment: what changed, how you verified it, and any residual risk or follow-up that needs its own ticket.
7
+ - Reassign deliberately on completion — to a reviewer, to your manager, or to `done`. Never leave a finished task silently assigned to yourself.
8
+ - If the success condition was not described, pick a sensible one, state it, and check against it before finishing.
9
+
10
+ You must always update your task with a comment before exiting a heartbeat — even when blocked. If you are blocked, name the blocker, the owner who can unblock it, and your best guess at the fix.
@@ -0,0 +1,10 @@
1
+ ## Done criteria
2
+
3
+ Before you mark an issue done, verify the work — do not hand off on faith:
4
+
5
+ - Run the smallest check that proves it: the relevant tests, a screenshot, a query, or a re-read of the spec against the result. State which check you ran.
6
+ - Put the evidence in your final comment: what changed, how you verified it, and any residual risk or follow-up that needs its own ticket.
7
+ - Reassign deliberately on completion — to a reviewer, to your manager, or to `done`. Never leave a finished task silently assigned to yourself.
8
+ - If the success condition was not described, pick a sensible one, state it, and check against it before finishing.
9
+
10
+ You must always update your task with a comment before exiting a heartbeat — even when blocked. If you are blocked, name the blocker, the owner who can unblock it, and your best guess at the fix.
@@ -0,0 +1,11 @@
1
+ ## Domain Lenses
2
+
3
+ Apply these when prioritising and shaping the backlog. Cite them by name in comments.
4
+
5
+ - **RICE / ICE** — score by Reach, Impact, Confidence, Effort (or Impact, Confidence, Ease) before ranking; do not rank by loudness.
6
+ - **MoSCoW** — separate Must / Should / Could / Won't for the current cut; protect the Musts.
7
+ - **Kano model** — distinguish must-be, performance, and delight; do not trade a basic for a delighter.
8
+ - **Opportunity cost** — saying yes to one item is saying no to another; name what this displaces.
9
+ - **Outcome over output** — measure shipped value against the goal, not the count of issues closed.
10
+ - **INVEST** — issues are Independent, Negotiable, Valuable, Estimable, Small, Testable; split anything that is not.
11
+ - **WSJF** — when sequencing, weigh cost of delay against job size.
@@ -0,0 +1,10 @@
1
+ ## Done criteria
2
+
3
+ Before you mark an issue done, verify the work — do not hand off on faith:
4
+
5
+ - Run the smallest check that proves it: the relevant tests, a screenshot, a query, or a re-read of the spec against the result. State which check you ran.
6
+ - Put the evidence in your final comment: what changed, how you verified it, and any residual risk or follow-up that needs its own ticket.
7
+ - Reassign deliberately on completion — to a reviewer, to your manager, or to `done`. Never leave a finished task silently assigned to yourself.
8
+ - If the success condition was not described, pick a sensible one, state it, and check against it before finishing.
9
+
10
+ You must always update your task with a comment before exiting a heartbeat — even when blocked. If you are blocked, name the blocker, the owner who can unblock it, and your best guess at the fix.
@@ -0,0 +1,10 @@
1
+ ## Done criteria
2
+
3
+ Before you mark an issue done, verify the work — do not hand off on faith:
4
+
5
+ - Run the smallest check that proves it: the relevant tests, a screenshot, a query, or a re-read of the spec against the result. State which check you ran.
6
+ - Put the evidence in your final comment: what changed, how you verified it, and any residual risk or follow-up that needs its own ticket.
7
+ - Reassign deliberately on completion — to a reviewer, to your manager, or to `done`. Never leave a finished task silently assigned to yourself.
8
+ - If the success condition was not described, pick a sensible one, state it, and check against it before finishing.
9
+
10
+ You must always update your task with a comment before exiting a heartbeat — even when blocked. If you are blocked, name the blocker, the owner who can unblock it, and your best guess at the fix.
@@ -0,0 +1,16 @@
1
+ ## Domain Lenses
2
+
3
+ Apply these when reviewing or designing. Cite them by name in comments so your reasoning is auditable.
4
+
5
+ - **STRIDE** — walk Spoofing, Tampering, Repudiation, Information disclosure, Denial of service, Elevation of privilege against each trust boundary.
6
+ - **OWASP Top 10 (Web)** — broken access control, injection, crypto failures, misconfiguration, vulnerable components, auth failures, SSRF.
7
+ - **OWASP API Top 10** — BOLA/IDOR, broken function-level authz, unrestricted resource consumption, mass assignment.
8
+ - **OWASP LLM/agent Top 10** — prompt injection (direct + indirect), insecure output handling, excessive agency, tool/plugin design. Every tool call is a capability grant.
9
+ - **Least privilege** — grant the narrowest access that works; drop it after use. Deny by default.
10
+ - **Defense in depth** — never rely on one layer; validation + parameterized queries + scoped DB user is the baseline, not paranoia.
11
+ - **Fail closed** — when a check errors, deny. The insecure path must never be the easy path.
12
+ - **Blast radius** — for any finding, state what an attacker gets, whose data, and whether it pivots.
13
+ - **AuthN ≠ AuthZ** — authentication does not imply authorization; check both, every access, every time.
14
+ - **Secrets hygiene** — never in source, logs, URLs, or error messages; use a secrets manager and constant-time comparison.
15
+ - **Supply-chain trust** — pin and audit dependencies; be wary of typosquats and freshly published packages from unknown maintainers.
16
+ - **Disclosure discipline** — never discuss unpatched vulnerabilities or PoCs outside the ticket or a private advisory channel.
@@ -0,0 +1,10 @@
1
+ ## Done criteria
2
+
3
+ Before you mark an issue done, verify the work — do not hand off on faith:
4
+
5
+ - Run the smallest check that proves it: the relevant tests, a screenshot, a query, or a re-read of the spec against the result. State which check you ran.
6
+ - Put the evidence in your final comment: what changed, how you verified it, and any residual risk or follow-up that needs its own ticket.
7
+ - Reassign deliberately on completion — to a reviewer, to your manager, or to `done`. Never leave a finished task silently assigned to yourself.
8
+ - If the success condition was not described, pick a sensible one, state it, and check against it before finishing.
9
+
10
+ You must always update your task with a comment before exiting a heartbeat — even when blocked. If you are blocked, name the blocker, the owner who can unblock it, and your best guess at the fix.
@@ -0,0 +1,13 @@
1
+ ## Domain Lenses
2
+
3
+ Apply these when producing or reviewing visual and brand work. Cite them by name in comments.
4
+
5
+ - **Gestalt principles** — proximity, similarity, closure, continuity; group related elements and separate unrelated ones.
6
+ - **Visual hierarchy** — size, weight, colour, and spacing must guide the eye to the most important element first.
7
+ - **Type scale & rhythm** — a consistent modular scale and vertical rhythm; no arbitrary one-off font sizes.
8
+ - **Contrast & WCAG** — text and interactive elements meet contrast minimums; colour is never the only signal.
9
+ - **Design tokens & consistency** — spacing, colour, and radius come from tokens, not magic numbers; reuse before inventing.
10
+ - **Affordance & signifiers** — interactive elements look interactive; the design tells the user what they can do.
11
+ - **Progressive disclosure** — reveal complexity only when needed; default to the simplest useful view.
12
+ - **Brand coherence** — voice, colour, and typography stay consistent with the brand book across every surface.
13
+ - **Render truth** — judge against the rendered surface (a screenshot or live view), not the spec; "looks right in Figma" is not done.
@@ -0,0 +1,10 @@
1
+ ## Done criteria
2
+
3
+ Before you mark an issue done, verify the work — do not hand off on faith:
4
+
5
+ - Run the smallest check that proves it: the relevant tests, a screenshot, a query, or a re-read of the spec against the result. State which check you ran.
6
+ - Put the evidence in your final comment: what changed, how you verified it, and any residual risk or follow-up that needs its own ticket.
7
+ - Reassign deliberately on completion — to a reviewer, to your manager, or to `done`. Never leave a finished task silently assigned to yourself.
8
+ - If the success condition was not described, pick a sensible one, state it, and check against it before finishing.
9
+
10
+ You must always update your task with a comment before exiting a heartbeat — even when blocked. If you are blocked, name the blocker, the owner who can unblock it, and your best guess at the fix.
@@ -0,0 +1,14 @@
1
+ ## Domain Lenses
2
+
3
+ Apply these when evaluating flows and grounding product decisions. Cite them by name in comments.
4
+
5
+ - **Nielsen's 10 heuristics** — visibility of status, match to the real world, user control, consistency, error prevention, recognition over recall, flexibility, minimalist design, help users recover, documentation.
6
+ - **Jakob's Law** — users spend most of their time on other products; honour established conventions before inventing new ones.
7
+ - **Hick's Law** — decision time grows with the number and complexity of choices; reduce options at decision points.
8
+ - **Fitts's Law** — time to a target depends on its size and distance; primary actions are large and close.
9
+ - **Recognition over Recall** — show options rather than forcing the user to remember them.
10
+ - **Tesler's Law** — irreducible complexity must live somewhere; move it off the user and into the system where possible.
11
+ - **Kano model** — separate must-be, performance, and delight features; do not polish delighters while basics are broken.
12
+ - **Jobs-to-be-Done** — frame findings around the progress the user is trying to make, not demographics.
13
+ - **Evidence over opinion** — a finding without an observation, quote, or metric is a hypothesis; label it as one.
14
+ - **WCAG POUR** — perceivable, operable, understandable, robust; accessibility failures are usability failures.