@appsforgood/next-supabase-kit 0.1.4 → 0.1.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (49)
  1. package/CHANGELOG.md +12 -0
  2. package/DOGFOOD.md +24 -0
  3. package/LOOP_CODING.md +107 -0
  4. package/MAINTAINER_RELEASE.md +100 -0
  5. package/README.md +40 -4
  6. package/REPOSITORY_SETTINGS.md +7 -3
  7. package/SUPPLY_CHAIN.md +5 -5
  8. package/UPGRADE.md +2 -1
  9. package/antigravity/commands/accessibility-pass.toml +16 -0
  10. package/antigravity/commands/browser-qa.toml +18 -0
  11. package/antigravity/commands/distinctiveness-pass.toml +16 -0
  12. package/antigravity/commands/frontend.toml +5 -4
  13. package/antigravity/commands/layout-cleanup.toml +16 -0
  14. package/antigravity/commands/responsive-cleanup.toml +16 -0
  15. package/antigravity/commands/screenshot-critique.toml +16 -0
  16. package/antigravity/commands/ui-audit.toml +17 -0
  17. package/antigravity/commands/ui-polish.toml +17 -0
  18. package/antigravity/plugin.json +9 -0
  19. package/checklists/ui-acceptance-rubric.md +58 -0
  20. package/checklists/ui-detectors.md +75 -0
  21. package/dist/index.js +1090 -411
  22. package/dist/index.js.map +1 -1
  23. package/dist/studio/office/assets/office.css +188 -29
  24. package/dist/studio/office/assets/office.js +72 -50
  25. package/dist/studio/wizard/assets/wizard.css +157 -26
  26. package/dist/studio/wizard/assets/wizard.js +78 -70
  27. package/examples/next-supabase-installed/.agent-kit/agent-roster.json +7 -3
  28. package/examples/next-supabase-installed/.agent-kit/manifest.json +13 -11
  29. package/examples/next-supabase-installed/audit-output.json +22 -2
  30. package/examples/next-supabase-installed/tree.txt +1 -0
  31. package/package.json +28 -7
  32. package/prompts/ui-command-index.md +124 -0
  33. package/research/summaries/agentic-engineering-maturity-levels.md +54 -0
  34. package/rosters/next-supabase-default-council.json +37 -12
  35. package/runtime-skills/ui-improvement-harness/SKILL.md +12 -0
  36. package/schemas/agentic-level.schema.json +47 -0
  37. package/schemas/onboarding-state.schema.json +4 -1
  38. package/skills/ui-improvement-harness.md +96 -0
  39. package/templates/next-supabase/AGENT_ROSTER.md +6 -3
  40. package/templates/next-supabase/ASSISTANT_ADAPTERS.md +3 -1
  41. package/templates/next-supabase/DECISIONS.md +14 -0
  42. package/templates/next-supabase/DESIGN.md +3 -0
  43. package/templates/next-supabase/DOCS.md +7 -1
  44. package/templates/next-supabase/LOOP_CODING.md +98 -0
  45. package/templates/next-supabase/QUALITY_GATES.md +4 -2
  46. package/templates/next-supabase/SKILLS.md +14 -0
  47. package/templates/next-supabase/SPEC.md +5 -1
  48. package/templates/next-supabase/STYLE_GUIDE.md +3 -1
  49. package/templates/next-supabase/TESTING.md +14 -0
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "summary": {
3
- "pass": 62,
3
+ "pass": 66,
4
4
  "warn": 5,
5
5
  "fail": 0
6
6
  },
@@ -19,7 +19,7 @@
19
19
  {
20
20
  "level": "pass",
21
21
  "area": "install",
22
- "message": "Agent kit installed at version 0.1.4."
22
+ "message": "Agent kit installed at version 0.1.6."
23
23
  },
24
24
  {
25
25
  "level": "pass",
@@ -96,6 +96,11 @@
96
96
  "area": "templates",
97
97
  "message": "TESTING.md matches the current bundled template."
98
98
  },
99
+ {
100
+ "level": "pass",
101
+ "area": "templates",
102
+ "message": "LOOP_CODING.md matches the current bundled template."
103
+ },
99
104
  {
100
105
  "level": "pass",
101
106
  "area": "templates",
@@ -186,6 +191,11 @@
186
191
  "area": "agents",
187
192
  "message": ".agent-kit/schemas/onboarding-state.schema.json is present and parseable."
188
193
  },
194
+ {
195
+ "level": "pass",
196
+ "area": "agents",
197
+ "message": ".agent-kit/schemas/agentic-level.schema.json is present and parseable."
198
+ },
189
199
  {
190
200
  "level": "warn",
191
201
  "area": "studio",
@@ -267,6 +277,11 @@
267
277
  "area": "docs",
268
278
  "message": "TESTING.md exists."
269
279
  },
280
+ {
281
+ "level": "pass",
282
+ "area": "docs",
283
+ "message": "LOOP_CODING.md exists."
284
+ },
270
285
  {
271
286
  "level": "pass",
272
287
  "area": "docs",
@@ -351,6 +366,11 @@
351
366
  "message": "No package.json found to verify test scripts.",
352
367
  "remediation": "Add package.json with test, lint, and build scripts appropriate to the stack."
353
368
  },
369
+ {
370
+ "level": "pass",
371
+ "area": "project-reality",
372
+ "message": "No obvious committed secret patterns detected in tracked source files."
373
+ },
354
374
  {
355
375
  "level": "pass",
356
376
  "area": "project-reality",
@@ -14,6 +14,7 @@
14
14
  |-- STYLE_GUIDE.md
15
15
  |-- SECURITY.md
16
16
  |-- TESTING.md
17
+ |-- LOOP_CODING.md
17
18
  |-- DEPLOYMENT.md
18
19
  |-- UPGRADE.md
19
20
  |-- .github
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@appsforgood/next-supabase-kit",
3
- "version": "0.1.4",
3
+ "version": "0.1.6",
4
4
  "description": "Open agent council, skills, prompts, checklists, and markdown templates for Next.js and Supabase projects.",
5
5
  "type": "module",
6
6
  "repository": {
@@ -13,7 +13,8 @@
13
13
  "homepage": "https://github.com/lukey662/agentsandskills#readme",
14
14
  "publishConfig": {
15
15
  "access": "public",
16
- "registry": "https://registry.npmjs.org"
16
+ "registry": "https://registry.npmjs.org",
17
+ "provenance": true
17
18
  },
18
19
  "bin": {
19
20
  "agent-kit": "dist/index.js"
@@ -57,6 +58,8 @@
57
58
  "SUPPLY_CHAIN.md",
58
59
  "BEST_PRACTICE_EVIDENCE.md",
59
60
  "DOGFOOD.md",
61
+ "LOOP_CODING.md",
62
+ "MAINTAINER_RELEASE.md",
60
63
  "RESEARCH_CITATION_POLICY.md",
61
64
  "UPGRADE.md",
62
65
  "SECURITY.md",
@@ -70,8 +73,12 @@
70
73
  "build": "tsup && node scripts/copy-studio-assets.mjs",
71
74
  "dev": "tsx src/cli/index.ts",
72
75
  "typecheck": "tsc --noEmit",
73
- "lint": "tsc --noEmit",
76
+ "lint": "eslint .",
77
+ "lint:fix": "eslint . --fix",
78
+ "format": "prettier --write .",
79
+ "format:check": "prettier --check .",
74
80
  "test": "vitest run",
81
+ "test:coverage": "vitest run --coverage",
75
82
  "test:watch": "vitest",
76
83
  "smoke": "node dist/index.js doctor",
77
84
  "smoke:install": "node scripts/smoke-install.mjs",
@@ -84,20 +91,34 @@
84
91
  "sbom:check": "node scripts/sbom-check.mjs",
85
92
  "sbom:generate": "node scripts/sbom-check.mjs --output sbom.cdx.json",
86
93
  "publish:verify": "node scripts/post-publish-verify.mjs",
94
+ "changeset": "changeset",
95
+ "changeset:version": "changeset version",
87
96
  "release:check": "node scripts/release-check.mjs",
88
- "pack:check": "npm pack --dry-run"
97
+ "pack:check": "npm pack --dry-run",
98
+ "dogfood:init": "node scripts/dogfood-init.mjs",
99
+ "adapter:validate": "node dist/index.js adapter validate all"
89
100
  },
90
101
  "dependencies": {
91
- "@octokit/rest": "^21.1.1",
92
- "commander": "^12.1.0",
102
+ "@clack/prompts": "^1.6.0",
103
+ "@octokit/rest": "^22.0.1",
104
+ "commander": "^14.0.3",
105
+ "picocolors": "^1.1.1",
93
106
  "simple-git": "^3.27.0",
94
- "zod": "^3.24.1"
107
+ "zod": "^4.4.3"
95
108
  },
96
109
  "devDependencies": {
110
+ "@changesets/cli": "^2.31.0",
111
+ "@eslint/js": "^9.39.4",
97
112
  "@types/node": "^25.9.3",
113
+ "@vitest/coverage-v8": "^4.1.9",
114
+ "eslint": "^9.39.4",
115
+ "eslint-config-prettier": "^10.1.8",
116
+ "globals": "^17.7.0",
117
+ "prettier": "^3.9.4",
98
118
  "tsup": "^8.3.5",
99
119
  "tsx": "^4.19.2",
100
120
  "typescript": "^6.0.3",
121
+ "typescript-eslint": "^8.62.1",
101
122
  "vitest": "^4.1.8"
102
123
  },
103
124
  "overrides": {
@@ -0,0 +1,124 @@
1
+ # UI Command Index
2
+
3
+ Use this index to run repeatable UI improvement workflows. These are command-like prompts for any assistant surface and the source of truth for native runtime commands.
4
+
5
+ Canonical sources:
6
+
7
+ - `DESIGN.md`
8
+ - `STYLE_GUIDE.md`
9
+ - `TESTING.md`
10
+ - `QUALITY_GATES.md`
11
+ - `.agent-kit/agent-roster.json`
12
+ - `.agent-kit/skills/ui-improvement-harness.md`
13
+ - `.agent-kit/checklists/ui-detectors.md`
14
+ - `.agent-kit/checklists/ui-acceptance-rubric.md`
15
+ - `.agent-kit/prompts/screenshot-review.md`
16
+ - `.agent-kit/prompts/visual-qa-plan.md`
17
+
18
+ ## `/ui-audit`
19
+
20
+ Audit a target UI surface before release.
21
+
22
+ Required steps:
23
+
24
+ 1. Identify target route, component, workflow, auth state, data state, and risk tier.
25
+ 2. Load product/design context and relevant design brief.
26
+ 3. Review desktop and mobile evidence, or state which evidence must still be captured.
27
+ 4. Run the UI detector checklist.
28
+ 5. Return blockers, majors, minors, preserved capabilities, and required fixes.
29
+
30
+ Required outputs: target surface, risk tier, detector findings by severity, missing evidence, pass/fail verdict.
31
+
32
+ ## `/ui-polish`
33
+
34
+ Improve visual quality without changing product scope.
35
+
36
+ Required steps:
37
+
38
+ 1. Start from detector findings, screenshots, or a named surface.
39
+ 2. Preserve product behavior, auth boundaries, copy claims, and data contracts.
40
+ 3. Improve hierarchy, spacing, density, alignment, component states, and interaction feedback.
41
+ 4. Avoid decorative complexity and generic SaaS defaults.
42
+ 5. Re-run detector and screenshot critique after changes.
43
+
44
+ Required outputs: polish goals, changes made or proposed, detector deltas, screenshots needed, residual risks.
45
+
46
+ ## `/layout-cleanup`
47
+
48
+ Reduce clutter and repair layout structure.
49
+
50
+ Required steps:
51
+
52
+ 1. Identify primary task, secondary tasks, and content hierarchy.
53
+ 2. Remove unnecessary nesting, repeated surfaces, card-within-card patterns, and arbitrary dividers.
54
+ 3. Normalize spacing, grouping, alignment, heading scale, and responsive containers.
55
+ 4. Verify no truncation, overlap, or horizontal overflow remains.
56
+
57
+ Required outputs: layout findings, cleanup actions, preserved workflow, desktop/mobile evidence.
58
+
59
+ ## `/responsive-cleanup`
60
+
61
+ Make a UI work across mobile and desktop.
62
+
63
+ Required steps:
64
+
65
+ 1. Review mobile width, desktop width, and any tablet breakpoint used by the project.
66
+ 2. Verify tap targets, text fit, navigation, primary action visibility, sticky UI, and scroll behavior.
67
+ 3. Verify stateful screens on mobile, not only the happy path.
68
+ 4. Capture or request mobile and desktop screenshots before acceptance.
69
+
70
+ Required outputs: viewports checked, responsive findings, fixes, screenshots, remaining risks.
71
+
72
+ ## `/accessibility-pass`
73
+
74
+ Run a WCAG 2.1 AA-oriented pass on the target UI.
75
+
76
+ Required steps:
77
+
78
+ 1. Check semantics, headings, landmarks, forms, labels, tables, and buttons.
79
+ 2. Check keyboard navigation, visible focus, tab order, escape/close behavior, and skip path when applicable.
80
+ 3. Check contrast, reduced motion, error association, touch targets, and status announcements.
81
+ 4. Keep auth, state, and data-boundary tests separate from visual checks.
82
+
83
+ Required outputs: accessibility findings, severity, fixes, skipped checks, test evidence.
84
+
85
+ ## `/distinctiveness-pass`
86
+
87
+ Prove the UI belongs to this product and does not look generic.
88
+
89
+ Required steps:
90
+
91
+ 1. Compare the first viewport to product category, audience, workflow, and content fingerprint.
92
+ 2. Confirm references were translated into lessons without copying source layouts, copy, assets, or brand marks.
93
+ 3. Remove fake metrics, vague claims, abstract filler, and interchangeable card stacks.
94
+ 4. Re-score distinctiveness and product quality where significant UI work is involved.
95
+
96
+ Required outputs: product-specific evidence, generic-risk findings, source-safety notes, required changes.
97
+
98
+ ## `/screenshot-critique`
99
+
100
+ Review provided screenshots or captured browser screenshots.
101
+
102
+ Required steps:
103
+
104
+ 1. Name each screenshot, viewport, route, auth state, data state, and UI state.
105
+ 2. Run screenshot review, detector checklist, and accessibility risk scan.
106
+ 3. Compare against `DESIGN.md`, `STYLE_GUIDE.md`, and selected creative direction.
107
+ 4. Return concrete fixes, not broad design advice.
108
+
109
+ Required outputs: screenshot inventory, blockers, high-value fixes, accepted areas, missing screenshots.
110
+
111
+ ## `/browser-qa`
112
+
113
+ Run a live browser QA loop for an implemented UI.
114
+
115
+ Required steps:
116
+
117
+ 1. Start or identify the dev/preview server and target routes.
118
+ 2. Open the target with required auth, role, tenant, and data state.
119
+ 3. Capture desktop and mobile screenshots.
120
+ 4. Run detector, screenshot critique, accessibility pass, and responsive cleanup.
121
+ 5. Apply scoped fixes and repeat until acceptance criteria pass.
122
+ 6. Record evidence with `agent-kit session output` when Agent Studio is in use.
123
+
124
+ Required outputs: route, auth state, commands run, screenshots, detector results, fixes, final verdict.
@@ -0,0 +1,54 @@
1
+ # Agentic Engineering Maturity Levels
2
+
3
+ Generated from the Agent Kit iceberg model for setup office gamification, `LOOP_CODING.md`, and maintainer climb planning.
4
+
5
+ ## Summary
6
+
7
+ Agentic engineering maturity is modeled as **levels L3–L8**. The kit **computes L3–L6** from audit, adapter, and setup signals. **L7–L8 are deferred** (never auto-awarded) because reaching them safely depends on stronger eval gates, not on more agent freedom.
8
+
9
+ | Level | Name | Computed? |
10
+ | --- | --- | --- |
11
+ | L3 | AI-native IDE | Yes |
12
+ | L4 | Rules, context, MCP contract | Yes |
13
+ | L5 | Subagents, skills, council specialists | Yes |
14
+ | L6 | Eval loops, hooks, CI gates | Yes (downstream or maintainer profile) |
15
+ | L7 | Overnight / unsupervised teams | No — explore only |
16
+ | L8 | Agents managing agents | No — lab only |
17
+
18
+ ## Base levels (reference)
19
+
20
+ | Lens | Level |
21
+ | --- | --- |
22
+ | What `@appsforgood/next-supabase-kit` ships | High L4 → solid L5 |
23
+ | BaseRepo maintainer day-to-day (gitignored dogfood overlay) | Mid L4 |
24
+ | BaseRepo CI (`release:check`, `adapter:validate`, audit smokes) | Partial L6 |
25
+ | Fresh downstream `init` | ~L4 capability; L3 until context complete |
26
+ | Fresh `init --activate cursor\|codex` | L5 capability when subagents exist |
27
+
28
+ ## When each level was cutting edge (approximate)
29
+
30
+ | Era | Frontier | Became baseline |
31
+ | --- | --- | --- |
32
+ | 2022–2023 | Browser chat, tab completion | Copy-paste only |
33
+ | 2023–2024 | Repo-aware IDE chat (L3) | Autocomplete-only |
34
+ | Late 2024–2025 | AGENTS.md, rules, MCP (L4) | Ad-hoc prompting |
35
+ | 2025–2026 | Subagents, skills, councils (L5) | Single chat for all roles |
36
+ | 2026 now | Eval CI, loop until green (L6) | Manual “run tests when you remember” |
37
+ | 2026 hype | Overnight agent teams (L7) | Not safe as default |
38
+ | 2026+ lab | Meta-orchestration (L8) | Not mainstream production |
39
+
40
+ ## Office and wizard integration
41
+
42
+ - `agent-kit setup` computes level via `computeAgenticLevel()` and returns it on `/api/state`.
43
+ - Agent Office shows **Lcurrent → Ltarget**, an iceberg strip (L3–L8), and top climb steps.
44
+ - The setup wizard's completion screen links to **`LOOP_CODING.md`**, **`agent-kit adapter validate`**, and audit gates.
45
+ - Maintainer source repos use a **maintainer profile** (release-check + dogfood docs) for L6 signals.
46
+
47
+ ## Related assets
48
+
49
+ - `LOOP_CODING.md` — kit-safe loop patterns
50
+ - `schemas/agentic-level.schema.json` — report shape
51
+ - `src/studio/agentic-level.ts` — scoring implementation
52
+ - `research/summaries/maturity-model-patterns.md` — QUALITY_GATES evidence tiers (separate from Agentic L3–L8)
53
+
54
+ Do not conflate **Agentic L3–L8** with **QUALITY_GATES Baseline/Strong/Best-Practice** or **visual QA baseline/strong/mature** — the setup UI labels these separately.
@@ -70,6 +70,7 @@
70
70
  "frontend-distinctiveness-benchmark",
71
71
  "frontend-product-quality-rubric",
72
72
  "frontend-design-system",
73
+ "ui-improvement-harness",
73
74
  "visual-regression-qa",
74
75
  "accessibility-wcag"
75
76
  ],
@@ -95,13 +96,7 @@
95
96
  "voice-tone",
96
97
  "pricing-copy"
97
98
  ],
98
- "skills": [
99
- "positioning-messaging",
100
- "conversion-copywriting",
101
- "landing-page-copy",
102
- "product-voice-tone",
103
- "onboarding-empty-state-copy"
104
- ],
99
+ "skills": ["positioning-messaging", "conversion-copywriting", "landing-page-copy", "product-voice-tone", "onboarding-empty-state-copy"],
105
100
  "handsOffTo": ["frontend-design-lead", "nextjs-engineer", "qa-engineer", "docs-maintainer"]
106
101
  },
107
102
  {
@@ -147,7 +142,19 @@
147
142
  },
148
143
  {
149
144
  "id": "core-change",
150
- "triggers": ["schema", "auth", "rls", "api", "route handler", "server action", "dependency", "upgrade", "release workflow", "package behavior", "cross-layer"],
145
+ "triggers": [
146
+ "schema",
147
+ "auth",
148
+ "rls",
149
+ "api",
150
+ "route handler",
151
+ "server action",
152
+ "dependency",
153
+ "upgrade",
154
+ "release workflow",
155
+ "package behavior",
156
+ "cross-layer"
157
+ ],
151
158
  "sequence": [
152
159
  "planner",
153
160
  "lead-architect",
@@ -171,7 +178,7 @@
171
178
  },
172
179
  {
173
180
  "id": "frontend-change",
174
- "triggers": ["screen", "component", "layout", "design", "responsive", "accessibility", "screenshot"],
181
+ "triggers": ["screen", "component", "layout", "design", "responsive", "accessibility", "screenshot", "ui audit", "ui polish", "browser qa"],
175
182
  "sequence": ["planner", "frontend-design-lead", "marketing-copy-lead", "nextjs-engineer", "qa-engineer", "docs-maintainer"],
176
183
  "council": ["frontend-design-lead", "marketing-copy-lead", "qa-engineer"],
177
184
  "requiredOutputs": [
@@ -183,15 +190,33 @@
183
190
  "design critique verdict",
184
191
  "frontend product-quality scorecard",
185
192
  "domain-specific UI rationale",
193
+ "UI detector findings and severity",
194
+ "UI command workflow applied when polishing or auditing",
186
195
  "visual QA evidence",
187
196
  "state coverage",
188
197
  "accessibility checks",
189
- "desktop/mobile verification"
198
+ "desktop/mobile verification",
199
+ "authenticated screen evidence when applicable"
190
200
  ]
191
201
  },
192
202
  {
193
203
  "id": "marketing-copy",
194
- "triggers": ["copy", "copywriting", "marketing", "positioning", "messaging", "value prop", "value proposition", "landing page", "headline", "cta", "conversion", "onboarding", "empty state", "pricing"],
204
+ "triggers": [
205
+ "copy",
206
+ "copywriting",
207
+ "marketing",
208
+ "positioning",
209
+ "messaging",
210
+ "value prop",
211
+ "value proposition",
212
+ "landing page",
213
+ "headline",
214
+ "cta",
215
+ "conversion",
216
+ "onboarding",
217
+ "empty state",
218
+ "pricing"
219
+ ],
195
220
  "sequence": ["planner", "marketing-copy-lead", "frontend-design-lead", "qa-engineer", "docs-maintainer"],
196
221
  "council": ["marketing-copy-lead", "frontend-design-lead"],
197
222
  "requiredOutputs": [
@@ -219,7 +244,7 @@
219
244
  "Meaningful multi-agent work must record council-session evidence in COUNCIL.md or a structured record that follows .agent-kit/schemas/council-session.schema.json.",
220
245
  "Planner starts planning and ambiguous requests by default.",
221
246
  "Lead Architect must review core changes before implementation.",
222
- "Frontend Design Lead must record reference-set evidence, anti-references, a design critique verdict, a distinctiveness benchmark, and a frontend product-quality scorecard before accepting significant frontend work.",
247
+ "Frontend Design Lead must record reference-set evidence, anti-references, a design critique verdict, a distinctiveness benchmark, a frontend product-quality scorecard, UI detector severity findings, and desktop/mobile screenshot evidence before accepting significant frontend work.",
223
248
  "Marketing Copy Lead must ask discovery questions and record audience, pain, outcome, value proposition, proof, objections, voice/tone, and conversion goal before accepting public-facing or conversion-facing copy.",
224
249
  "Security Reviewer must review auth, data mutation, external-call, dependency, secret, and release-risk changes.",
225
250
  "QA Engineer must verify behavior changes before completion.",
@@ -0,0 +1,12 @@
1
+ ---
2
+ name: ui-improvement-harness
3
+ description: Use when running repeatable UI audit, polish, layout cleanup, responsive cleanup, accessibility, screenshot critique, visual distinctiveness, or live browser QA workflows.
4
+ ---
5
+
6
+ # UI Improvement Harness Runtime Skill
7
+
8
+ Canonical workflow: `skills/ui-improvement-harness.md`.
9
+
10
+ Installed-project canonical workflow: `.agent-kit/skills/ui-improvement-harness.md`.
11
+
12
+ Use the canonical skill before accepting meaningful UI polish, audit, screenshot review, or browser iteration work. Runtime wrappers must not fork the detector, rubric, or command policy.
@@ -0,0 +1,47 @@
1
+ {
2
+ "$schema": "https://json-schema.org/draft/2020-12/schema",
3
+ "$id": "https://agent-skills.dev/schemas/agentic-level.schema.json",
4
+ "title": "Agent Kit Agentic Level Report",
5
+ "type": "object",
6
+ "required": ["currentLevel", "targetLevel", "maintainerProfile", "computedAt", "signals"],
7
+ "additionalProperties": false,
8
+ "properties": {
9
+ "currentLevel": { "type": "integer", "enum": [3, 4, 5, 6] },
10
+ "targetLevel": { "type": "integer", "enum": [3, 4, 5, 6, 7, 8] },
11
+ "maintainerProfile": { "type": "boolean" },
12
+ "computedAt": { "type": "string", "format": "date-time" },
13
+ "maintainerNote": { "type": "string" },
14
+ "signals": {
15
+ "type": "array",
16
+ "items": {
17
+ "type": "object",
18
+ "required": ["id", "level", "label", "pass", "evidence", "remediation"],
19
+ "additionalProperties": false,
20
+ "properties": {
21
+ "id": { "type": "string" },
22
+ "level": { "type": "integer", "enum": [3, 4, 5, 6] },
23
+ "label": { "type": "string" },
24
+ "pass": { "type": "boolean" },
25
+ "evidence": { "type": "string" },
26
+ "remediation": { "type": "string" }
27
+ }
28
+ }
29
+ },
30
+ "climbSteps": {
31
+ "type": "array",
32
+ "items": {
33
+ "type": "object",
34
+ "required": ["id", "level", "label", "pass", "evidence", "remediation"],
35
+ "additionalProperties": false,
36
+ "properties": {
37
+ "id": { "type": "string" },
38
+ "level": { "type": "integer", "enum": [3, 4, 5, 6] },
39
+ "label": { "type": "string" },
40
+ "pass": { "type": "boolean" },
41
+ "evidence": { "type": "string" },
42
+ "remediation": { "type": "string" }
43
+ }
44
+ }
45
+ }
46
+ }
47
+ }
@@ -28,6 +28,9 @@
28
28
  "wizardVersion": { "type": "string" },
29
29
  "ideSurface": { "type": "string", "enum": ["cursor", "copilot", "claude", "codex", "other"] },
30
30
  "ideVerifiedAt": { "type": "string", "format": "date-time" },
31
- "visualQaTier": { "type": "string", "enum": ["baseline", "strong", "mature"] }
31
+ "visualQaTier": { "type": "string", "enum": ["baseline", "strong", "mature"] },
32
+ "targetAgenticLevel": { "type": "integer", "enum": [3, 4, 5, 6, 7, 8] },
33
+ "lastAgenticLevel": { "type": "integer", "enum": [3, 4, 5, 6] },
34
+ "lastAgenticComputedAt": { "type": "string", "format": "date-time" }
32
35
  }
33
36
  }
@@ -0,0 +1,96 @@
1
+ # UI Improvement Harness Skill
2
+
3
+ ## Use When
4
+
5
+ Running operational UI improvement loops for user-facing screens, dashboards, admin flows, app shells, onboarding, marketing surfaces, component systems, or authenticated product workflows.
6
+
7
+ Use this skill when a request asks for UI audit, polish, layout cleanup, responsive cleanup, accessibility pass, screenshot critique, visual distinctiveness, live browser QA, or repeatable frontend improvement workflows.
8
+
9
+ ## Goal
10
+
11
+ Turn frontend quality guidance into repeatable commands. The harness should help agents move from screenshots and browser evidence to concrete fixes, then loop until the deterministic detector findings and review findings are acceptable for the change's release risk.
12
+
13
+ ## Required Inputs
14
+
15
+ - Target surface: route, component, flow, or screenshot set.
16
+ - Product context from `DESIGN.md`, `STYLE_GUIDE.md`, and relevant `.agent-kit/design-briefs/*`.
17
+ - Auth and permission context for protected screens, including role, tenant, and fixture user assumptions.
18
+ - Desktop and mobile viewports for meaningful UI changes.
19
+ - State coverage requirements: default, loading, empty, error, disabled, success, permission, focus, and narrow viewport states where relevant.
20
+ - Existing visual QA tier from `TESTING.md`, or a proposed tier from `.agent-kit/prompts/visual-qa-plan.md`.
21
+
22
+ ## Command Workflows
23
+
24
+ Use `.agent-kit/prompts/ui-command-index.md` as the command index. It defines these command-like workflows:
25
+
26
+ - UI audit: find blockers and major issues before implementation or release.
27
+ - UI polish: improve hierarchy, density, spacing, state feedback, and visual finish without changing product scope.
28
+ - Layout cleanup: remove clutter, nesting, overflow, weak grouping, and inconsistent spacing.
29
+ - Responsive/mobile cleanup: verify mobile hierarchy, tap targets, text fit, navigation, and critical actions.
30
+ - Accessibility pass: verify semantic structure, keyboard path, focus, labels, contrast, motion, and error feedback.
31
+ - Visual distinctiveness pass: prove product specificity and avoid generic AI/SaaS defaults.
32
+ - Screenshot critique: review desktop/mobile/state screenshots against product context and detector findings.
33
+ - Live browser QA loop: inspect the running app, capture evidence, apply scoped fixes, and repeat until acceptance criteria pass.
34
+
35
+ ## Deterministic Detector Checklist
36
+
37
+ Use `.agent-kit/checklists/ui-detectors.md` before and after polish. Treat each finding as `blocker`, `major`, `minor`, or `not-applicable`.
38
+
39
+ Required detector areas:
40
+
41
+ - Crowded layout and excessive competing surfaces.
42
+ - Weak hierarchy or unclear primary action.
43
+ - Inconsistent spacing, density, typography, radius, or alignment.
44
+ - Poor mobile tap targets or unreachable critical actions.
45
+ - Truncation, overflow, overlap, or text that does not fit.
46
+ - Card-within-card patterns and decorative containers that obscure workflow.
47
+ - Generic SaaS or AI-site styling, including abstract decoration that hides missing content.
48
+ - Weak hover, pressed, selected, loading, success, empty, error, disabled, focus, and permission feedback.
49
+ - Missing loading, empty, error, disabled, success, permission, and mobile states where relevant.
50
+ - Accessibility and focus issues, including contrast, labels, landmarks, keyboard order, and motion.
51
+
52
+ ## Acceptance Rubric
53
+
54
+ Use `.agent-kit/checklists/ui-acceptance-rubric.md`.
55
+
56
+ - Blocker findings must be fixed before release.
57
+ - Major findings must be fixed or explicitly accepted with rationale before high-risk UI changes ship.
58
+ - High-risk UI changes require desktop and mobile screenshots plus authenticated or permission-state evidence when the workflow requires login.
59
+ - Screenshot evidence must include the first viewport, primary workflow, and the highest-risk state affected by the change.
60
+ - Visual checks do not replace semantic, keyboard, auth, data-boundary, or regression tests.
61
+
62
+ ## Live Browser QA Loop
63
+
64
+ For implemented UI:
65
+
66
+ 1. Start or identify the app server and route.
67
+ 2. Open the target route with the required auth state or test account.
68
+ 3. Capture desktop and mobile screenshots.
69
+ 4. Run the deterministic detector checklist.
70
+ 5. Run screenshot critique and accessibility pass.
71
+ 6. Apply the smallest scoped fixes.
72
+ 7. Repeat until no blockers remain and major findings are resolved or documented.
73
+ 8. Record evidence with `agent-kit session output` when Agent Studio is in use.
74
+
75
+ For authenticated screens, do not substitute a public landing page screenshot. Use a real signed-in state, a seeded local fixture, or an explicit limitation note that names the missing auth evidence.
76
+
77
+ ## Reject By Default
78
+
79
+ - A UI pass based only on static prose with no screenshot or browser evidence when implementation exists.
80
+ - Desktop-only review for responsive or mobile-risk changes.
81
+ - Public-page review used as evidence for authenticated app screens.
82
+ - Vague polish requests that do not name detector findings or acceptance criteria.
83
+ - Fixes that add decorative cards, gradients, fake metrics, or generic copy instead of clarifying the workflow.
84
+ - Ignoring major detector findings without rationale.
85
+
86
+ ## Review Output
87
+
88
+ Return:
89
+
90
+ - Target surface and auth state reviewed.
91
+ - Commands run or command-like workflows applied.
92
+ - Detector findings by severity.
93
+ - Screenshots and viewports reviewed.
94
+ - Accessibility, responsive, state, and distinctiveness verdicts.
95
+ - Fixes made or required before acceptance.
96
+ - Tests, browser checks, visual QA evidence, and gaps.
@@ -4,7 +4,7 @@ This project uses `.agent-kit/agent-roster.json` as the default council contract
4
4
 
5
5
  ## Default Rule
6
6
 
7
- Planner handles planning by default. Lead Architect reviews core changes before implementation. Frontend Design Lead owns content-first creative direction, reference-led critique, frontend distinctiveness benchmarking, product-quality scoring, and visual QA before significant frontend implementation is accepted. Marketing Copy Lead owns positioning, value proposition, public-facing copy, proof, objections, voice, and CTA hierarchy before conversion-facing copy is accepted. Security Reviewer, QA Engineer, Documentation Maintainer, and Deployment/Observability Engineer join when their trigger areas are touched. Meaningful multi-agent work records council-session evidence in `COUNCIL.md` or a structured record that follows `.agent-kit/schemas/council-session.schema.json`.
7
+ Planner handles planning by default. Lead Architect reviews core changes before implementation. Frontend Design Lead owns content-first creative direction, reference-led critique, frontend distinctiveness benchmarking, product-quality scoring, UI detector severity review, command-based UI polish/audit loops, and visual QA before significant frontend implementation is accepted. Marketing Copy Lead owns positioning, value proposition, public-facing copy, proof, objections, voice, and CTA hierarchy before conversion-facing copy is accepted. Security Reviewer, QA Engineer, Documentation Maintainer, and Deployment/Observability Engineer join when their trigger areas are touched. Meaningful multi-agent work records council-session evidence in `COUNCIL.md` or a structured record that follows `.agent-kit/schemas/council-session.schema.json`.
8
8
 
9
9
  ## Default Workflows
10
10
 
@@ -36,7 +36,7 @@ Handoff order:
36
36
 
37
37
  ### Frontend Change
38
38
 
39
- Use when the request touches screens, components, layout, visual design, accessibility, responsiveness, or screenshot review.
39
+ Use when the request touches screens, components, layout, visual design, accessibility, responsiveness, screenshot review, UI audit, UI polish, or browser QA.
40
40
 
41
41
  Handoff order:
42
42
 
@@ -57,10 +57,13 @@ Required outputs:
57
57
  - Design critique verdict
58
58
  - Frontend product-quality scorecard
59
59
  - Domain-specific UI rationale
60
+ - UI detector findings and severity
61
+ - UI command workflow applied when polishing or auditing
60
62
  - Visual QA evidence
61
63
  - State coverage
62
64
  - Accessibility checks
63
65
  - Desktop/mobile verification
66
+ - Authenticated screen evidence when applicable
64
67
 
65
68
  ### Marketing Copy
66
69
 
@@ -90,7 +93,7 @@ Required outputs:
90
93
  - Each agent must state its decision, risk, and required next handoff.
91
94
  - Each meaningful council session must record workflow, affected layers, required outputs, handoff decisions, risks, evidence, and verification status.
92
95
  - Core changes cannot skip Lead Architect.
93
- - Frontend changes cannot skip content/brand intake, creative-direction rationale, reference-set evidence, distinctiveness benchmark, design critique verdict, product-quality scorecard, visual QA evidence, or Frontend Design Lead review.
96
+ - Frontend changes cannot skip content/brand intake, creative-direction rationale, reference-set evidence, distinctiveness benchmark, design critique verdict, product-quality scorecard, UI detector severity review, visual QA evidence, or Frontend Design Lead review.
94
97
  - Public-facing or conversion-facing copy cannot skip Marketing Copy Lead discovery questions, value proposition, proof, objection, voice/tone, and CTA review.
95
98
  - Auth, data mutation, dependency, external-call, secret, and release-risk changes cannot skip Security Reviewer.
96
99
  - Behavior changes cannot skip QA evidence.
@@ -108,7 +108,9 @@ Validate the structural package with:
108
108
  agent-kit adapter validate antigravity
109
109
  ```
110
110
 
111
- If the local machine has the Antigravity CLI, teams may also run native plugin validation and record that evidence here. Runtime command files are adapters only; `AGENTS.md`, `.agent-kit/agent-roster.json`, `QUALITY_GATES.md`, and Agent Studio sessions remain canonical.
111
+ If the local machine has the Antigravity CLI, teams may also run native plugin validation and record that evidence here. Runtime command files are adapters only; `AGENTS.md`, `.agent-kit/agent-roster.json`, `QUALITY_GATES.md`, `.agent-kit/prompts/ui-command-index.md`, `.agent-kit/checklists/ui-detectors.md`, and Agent Studio sessions remain canonical.
112
+
113
+ The frontend adapter surface includes `/frontend` plus focused UI improvement commands: `/ui-audit`, `/ui-polish`, `/layout-cleanup`, `/responsive-cleanup`, `/accessibility-pass`, `/distinctiveness-pass`, `/screenshot-critique`, and `/browser-qa`. These commands invoke existing Frontend Design Lead, QA, accessibility, screenshot, and documentation gates; they do not replace the council workflow.
112
114
 
113
115
  ## Acceptance Evidence
114
116