opencastle 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +21 -0
- package/README.md +215 -0
- package/bin/cli.mjs +69 -0
- package/dist/cli/adapters/claude-code.d.ts +22 -0
- package/dist/cli/adapters/claude-code.d.ts.map +1 -0
- package/dist/cli/adapters/claude-code.js +237 -0
- package/dist/cli/adapters/claude-code.js.map +1 -0
- package/dist/cli/adapters/cursor.d.ts +20 -0
- package/dist/cli/adapters/cursor.d.ts.map +1 -0
- package/dist/cli/adapters/cursor.js +231 -0
- package/dist/cli/adapters/cursor.js.map +1 -0
- package/dist/cli/adapters/vscode.d.ts +20 -0
- package/dist/cli/adapters/vscode.d.ts.map +1 -0
- package/dist/cli/adapters/vscode.js +132 -0
- package/dist/cli/adapters/vscode.js.map +1 -0
- package/dist/cli/copy.d.ts +14 -0
- package/dist/cli/copy.d.ts.map +1 -0
- package/dist/cli/copy.js +62 -0
- package/dist/cli/copy.js.map +1 -0
- package/dist/cli/dashboard.d.ts +3 -0
- package/dist/cli/dashboard.d.ts.map +1 -0
- package/dist/cli/dashboard.js +183 -0
- package/dist/cli/dashboard.js.map +1 -0
- package/dist/cli/diff.d.ts +3 -0
- package/dist/cli/diff.d.ts.map +1 -0
- package/dist/cli/diff.js +27 -0
- package/dist/cli/diff.js.map +1 -0
- package/dist/cli/eject.d.ts +3 -0
- package/dist/cli/eject.d.ts.map +1 -0
- package/dist/cli/eject.js +27 -0
- package/dist/cli/eject.js.map +1 -0
- package/dist/cli/init.d.ts +3 -0
- package/dist/cli/init.d.ts.map +1 -0
- package/dist/cli/init.js +92 -0
- package/dist/cli/init.js.map +1 -0
- package/dist/cli/manifest.d.ts +14 -0
- package/dist/cli/manifest.d.ts.map +1 -0
- package/dist/cli/manifest.js +34 -0
- package/dist/cli/manifest.js.map +1 -0
- package/dist/cli/mcp.d.ts +14 -0
- package/dist/cli/mcp.d.ts.map +1 -0
- package/dist/cli/mcp.js +35 -0
- package/dist/cli/mcp.js.map +1 -0
- package/dist/cli/prompt.d.ts +12 -0
- package/dist/cli/prompt.d.ts.map +1 -0
- package/dist/cli/prompt.js +104 -0
- package/dist/cli/prompt.js.map +1 -0
- package/dist/cli/run/adapters/claude-code.d.ts +16 -0
- package/dist/cli/run/adapters/claude-code.d.ts.map +1 -0
- package/dist/cli/run/adapters/claude-code.js +82 -0
- package/dist/cli/run/adapters/claude-code.js.map +1 -0
- package/dist/cli/run/adapters/copilot.d.ts +16 -0
- package/dist/cli/run/adapters/copilot.d.ts.map +1 -0
- package/dist/cli/run/adapters/copilot.js +84 -0
- package/dist/cli/run/adapters/copilot.js.map +1 -0
- package/dist/cli/run/adapters/cursor.d.ts +16 -0
- package/dist/cli/run/adapters/cursor.d.ts.map +1 -0
- package/dist/cli/run/adapters/cursor.js +81 -0
- package/dist/cli/run/adapters/cursor.js.map +1 -0
- package/dist/cli/run/adapters/index.d.ts +14 -0
- package/dist/cli/run/adapters/index.d.ts.map +1 -0
- package/dist/cli/run/adapters/index.js +35 -0
- package/dist/cli/run/adapters/index.js.map +1 -0
- package/dist/cli/run/executor.d.ts +15 -0
- package/dist/cli/run/executor.d.ts.map +1 -0
- package/dist/cli/run/executor.js +249 -0
- package/dist/cli/run/executor.js.map +1 -0
- package/dist/cli/run/reporter.d.ts +10 -0
- package/dist/cli/run/reporter.d.ts.map +1 -0
- package/dist/cli/run/reporter.js +112 -0
- package/dist/cli/run/reporter.js.map +1 -0
- package/dist/cli/run/schema.d.ts +28 -0
- package/dist/cli/run/schema.d.ts.map +1 -0
- package/dist/cli/run/schema.js +511 -0
- package/dist/cli/run/schema.js.map +1 -0
- package/dist/cli/run.d.ts +6 -0
- package/dist/cli/run.d.ts.map +1 -0
- package/dist/cli/run.js +123 -0
- package/dist/cli/run.js.map +1 -0
- package/dist/cli/stack-config.d.ts +12 -0
- package/dist/cli/stack-config.d.ts.map +1 -0
- package/dist/cli/stack-config.js +146 -0
- package/dist/cli/stack-config.js.map +1 -0
- package/dist/cli/types.d.ts +169 -0
- package/dist/cli/types.d.ts.map +1 -0
- package/dist/cli/types.js +2 -0
- package/dist/cli/types.js.map +1 -0
- package/dist/cli/update.d.ts +3 -0
- package/dist/cli/update.d.ts.map +1 -0
- package/dist/cli/update.js +50 -0
- package/dist/cli/update.js.map +1 -0
- package/package.json +48 -0
- package/src/cli/adapters/claude-code.ts +287 -0
- package/src/cli/adapters/cursor.ts +377 -0
- package/src/cli/adapters/vscode.ts +168 -0
- package/src/cli/copy.ts +79 -0
- package/src/cli/dashboard.ts +225 -0
- package/src/cli/diff.ts +44 -0
- package/src/cli/eject.ts +39 -0
- package/src/cli/init.ts +120 -0
- package/src/cli/manifest.ts +45 -0
- package/src/cli/mcp.ts +49 -0
- package/src/cli/prompt.ts +115 -0
- package/src/cli/run/adapters/claude-code.ts +95 -0
- package/src/cli/run/adapters/copilot.ts +97 -0
- package/src/cli/run/adapters/cursor.ts +94 -0
- package/src/cli/run/adapters/index.ts +40 -0
- package/src/cli/run/executor.ts +292 -0
- package/src/cli/run/reporter.ts +129 -0
- package/src/cli/run/schema.ts +595 -0
- package/src/cli/run.ts +137 -0
- package/src/cli/stack-config.ts +180 -0
- package/src/cli/types.ts +207 -0
- package/src/cli/update.ts +75 -0
- package/src/dashboard/astro.config.mjs +6 -0
- package/src/dashboard/package-lock.json +5455 -0
- package/src/dashboard/package.json +14 -0
- package/src/dashboard/public/data/delegations.ndjson +35 -0
- package/src/dashboard/public/data/panels.ndjson +13 -0
- package/src/dashboard/public/data/sessions.ndjson +50 -0
- package/src/dashboard/public/icon-192.png +0 -0
- package/src/dashboard/scripts/generate-seed-data.ts +355 -0
- package/src/dashboard/src/layouts/Layout.astro +25 -0
- package/src/dashboard/src/pages/index.astro +1070 -0
- package/src/dashboard/src/styles/dashboard.css +1078 -0
- package/src/dashboard/tsconfig.json +6 -0
- package/src/orchestrator/agent-workflows/README.md +22 -0
- package/src/orchestrator/agent-workflows/bug-fix.md +128 -0
- package/src/orchestrator/agent-workflows/data-pipeline.md +145 -0
- package/src/orchestrator/agent-workflows/database-migration.md +159 -0
- package/src/orchestrator/agent-workflows/feature-implementation.md +223 -0
- package/src/orchestrator/agent-workflows/performance-optimization.md +125 -0
- package/src/orchestrator/agent-workflows/refactoring.md +142 -0
- package/src/orchestrator/agent-workflows/schema-changes.md +164 -0
- package/src/orchestrator/agent-workflows/security-audit.md +148 -0
- package/src/orchestrator/agent-workflows/shared-delivery-phase.md +33 -0
- package/src/orchestrator/agents/api-designer.agent.md +68 -0
- package/src/orchestrator/agents/architect.agent.md +129 -0
- package/src/orchestrator/agents/content-engineer.agent.md +57 -0
- package/src/orchestrator/agents/copywriter.agent.md +95 -0
- package/src/orchestrator/agents/data-expert.agent.md +63 -0
- package/src/orchestrator/agents/database-engineer.agent.md +62 -0
- package/src/orchestrator/agents/developer.agent.md +66 -0
- package/src/orchestrator/agents/devops-expert.agent.md +57 -0
- package/src/orchestrator/agents/documentation-writer.agent.md +60 -0
- package/src/orchestrator/agents/performance-expert.agent.md +58 -0
- package/src/orchestrator/agents/release-manager.agent.md +72 -0
- package/src/orchestrator/agents/researcher.agent.md +145 -0
- package/src/orchestrator/agents/reviewer.agent.md +62 -0
- package/src/orchestrator/agents/security-expert.agent.md +64 -0
- package/src/orchestrator/agents/seo-specialist.agent.md +67 -0
- package/src/orchestrator/agents/team-lead.agent.md +644 -0
- package/src/orchestrator/agents/testing-expert.agent.md +85 -0
- package/src/orchestrator/agents/ui-ux-expert.agent.md +63 -0
- package/src/orchestrator/copilot-instructions.md +3 -0
- package/src/orchestrator/customizations/AGENT-EXPERTISE.md +325 -0
- package/src/orchestrator/customizations/AGENT-FAILURES.md +69 -0
- package/src/orchestrator/customizations/AGENT-PERFORMANCE.md +58 -0
- package/src/orchestrator/customizations/DISPUTES.md +162 -0
- package/src/orchestrator/customizations/KNOWLEDGE-GRAPH.md +10 -0
- package/src/orchestrator/customizations/LESSONS-LEARNED.md +70 -0
- package/src/orchestrator/customizations/README.md +59 -0
- package/src/orchestrator/customizations/agents/agent-registry.md +46 -0
- package/src/orchestrator/customizations/agents/skill-matrix.md +142 -0
- package/src/orchestrator/customizations/logs/README.md +181 -0
- package/src/orchestrator/customizations/logs/delegations.ndjson +1 -0
- package/src/orchestrator/customizations/logs/panels.ndjson +1 -0
- package/src/orchestrator/customizations/logs/sessions.ndjson +1 -0
- package/src/orchestrator/customizations/project/docs-structure.md +23 -0
- package/src/orchestrator/customizations/project/tracker-config.md +45 -0
- package/src/orchestrator/customizations/project.instructions.md +64 -0
- package/src/orchestrator/customizations/stack/api-config.md +37 -0
- package/src/orchestrator/customizations/stack/cms-config.md +26 -0
- package/src/orchestrator/customizations/stack/data-pipeline-config.md +41 -0
- package/src/orchestrator/customizations/stack/database-config.md +44 -0
- package/src/orchestrator/customizations/stack/deployment-config.md +45 -0
- package/src/orchestrator/customizations/stack/testing-config.md +56 -0
- package/src/orchestrator/instructions/ai-optimization.instructions.md +143 -0
- package/src/orchestrator/instructions/general.instructions.md +194 -0
- package/src/orchestrator/mcp.json +55 -0
- package/src/orchestrator/prompts/bootstrap-customizations.prompt.md +235 -0
- package/src/orchestrator/prompts/brainstorm.prompt.md +115 -0
- package/src/orchestrator/prompts/bug-fix.prompt.md +141 -0
- package/src/orchestrator/prompts/create-skill.prompt.md +103 -0
- package/src/orchestrator/prompts/generate-task-spec.prompt.md +154 -0
- package/src/orchestrator/prompts/implement-feature.prompt.md +124 -0
- package/src/orchestrator/prompts/metrics-report.prompt.md +142 -0
- package/src/orchestrator/prompts/quick-refinement.prompt.md +137 -0
- package/src/orchestrator/prompts/resolve-pr-comments.prompt.md +100 -0
- package/src/orchestrator/skills/accessibility-standards/SKILL.md +164 -0
- package/src/orchestrator/skills/agent-hooks/SKILL.md +147 -0
- package/src/orchestrator/skills/agent-memory/SKILL.md +144 -0
- package/src/orchestrator/skills/api-patterns/SKILL.md +106 -0
- package/src/orchestrator/skills/browser-testing/SKILL.md +203 -0
- package/src/orchestrator/skills/code-commenting/SKILL.md +133 -0
- package/src/orchestrator/skills/contentful-cms/SKILL.md +43 -0
- package/src/orchestrator/skills/context-map/SKILL.md +135 -0
- package/src/orchestrator/skills/convex-database/SKILL.md +80 -0
- package/src/orchestrator/skills/data-engineering/SKILL.md +99 -0
- package/src/orchestrator/skills/deployment-infrastructure/SKILL.md +49 -0
- package/src/orchestrator/skills/documentation-standards/SKILL.md +85 -0
- package/src/orchestrator/skills/fast-review/SKILL.md +327 -0
- package/src/orchestrator/skills/frontend-design/SKILL.md +42 -0
- package/src/orchestrator/skills/jira-management/SKILL.md +168 -0
- package/src/orchestrator/skills/memory-merger/SKILL.md +123 -0
- package/src/orchestrator/skills/nextjs-patterns/SKILL.md +75 -0
- package/src/orchestrator/skills/nx-workspace/SKILL.md +192 -0
- package/src/orchestrator/skills/panel-majority-vote/SKILL.md +184 -0
- package/src/orchestrator/skills/panel-majority-vote/panel-report.template.md +38 -0
- package/src/orchestrator/skills/performance-optimization/SKILL.md +101 -0
- package/src/orchestrator/skills/react-development/SKILL.md +117 -0
- package/src/orchestrator/skills/sanity-cms/SKILL.md +18 -0
- package/src/orchestrator/skills/security-hardening/SKILL.md +118 -0
- package/src/orchestrator/skills/self-improvement/SKILL.md +137 -0
- package/src/orchestrator/skills/seo-patterns/SKILL.md +40 -0
- package/src/orchestrator/skills/session-checkpoints/SKILL.md +205 -0
- package/src/orchestrator/skills/slack-notifications/SKILL.md +211 -0
- package/src/orchestrator/skills/strapi-cms/SKILL.md +43 -0
- package/src/orchestrator/skills/supabase-database/SKILL.md +24 -0
- package/src/orchestrator/skills/task-management/SKILL.md +143 -0
- package/src/orchestrator/skills/team-lead-reference/SKILL.md +317 -0
- package/src/orchestrator/skills/teams-notifications/SKILL.md +249 -0
- package/src/orchestrator/skills/testing-workflow/SKILL.md +134 -0
- package/src/orchestrator/skills/validation-gates/SKILL.md +100 -0
|
@@ -0,0 +1,85 @@
|
|
|
1
|
+
---
|
|
2
|
+
description: 'Testing expert for E2E tests, integration tests, browser validation, and Cypress test suites using Chrome DevTools MCP and test file authoring.'
|
|
3
|
+
name: 'Testing Expert'
|
|
4
|
+
model: GPT-5.3-Codex
|
|
5
|
+
tools: ['search/changes', 'search/codebase', 'edit/editFiles', 'web/fetch', 'read/problems', 'execute/getTerminalOutput', 'execute/runInTerminal', 'read/terminalLastCommand', 'read/terminalSelection', 'search', 'execute/testFailure', 'search/usages', 'chrome-devtools/*']
|
|
6
|
+
---
|
|
7
|
+
|
|
8
|
+
# Testing Expert
|
|
9
|
+
|
|
10
|
+
You are an expert tester who validates UI changes using Chrome DevTools MCP automation and writes E2E/integration test suites.
|
|
11
|
+
|
|
12
|
+
## Skills
|
|
13
|
+
|
|
14
|
+
### Capability Slots
|
|
15
|
+
|
|
16
|
+
Resolve via [skill-matrix.md](.github/customizations/agents/skill-matrix.md).
|
|
17
|
+
|
|
18
|
+
- **e2e-testing** — Browser automation tool reference, validation checklist, regression testing, reporting patterns
|
|
19
|
+
- **testing** — Test planning templates, coverage requirements, context management, common mistakes
|
|
20
|
+
|
|
21
|
+
### Direct Skills
|
|
22
|
+
|
|
23
|
+
- **validation-gates** — Shared validation gate definitions (deterministic checks, cache clearing, regression checks)
|
|
24
|
+
|
|
25
|
+
## Context Management
|
|
26
|
+
|
|
27
|
+
- **ONE focus area per session** — don't try to test everything at once
|
|
28
|
+
- **MAX 3 screenshots** — use `evaluate_script()` for most checks
|
|
29
|
+
- **Prefer `evaluate_script()` over `take_snapshot()`** — returns less data
|
|
30
|
+
- **Clear browser state** between unrelated test flows
|
|
31
|
+
|
|
32
|
+
## Test Plan Structure
|
|
33
|
+
|
|
34
|
+
Every test suite must cover:
|
|
35
|
+
1. **Initial State** — Page loads with correct defaults
|
|
36
|
+
2. **User Interactions** — Buttons, dropdowns, filters trigger correct behavior
|
|
37
|
+
3. **State Transitions** — Changing values produces different results
|
|
38
|
+
4. **Edge Cases** — Empty results, boundaries, invalid input
|
|
39
|
+
5. **Integration** — Component interactions, data flow, URL sync
|
|
40
|
+
|
|
41
|
+
## Guidelines
|
|
42
|
+
|
|
43
|
+
- Test behavior, not implementation details
|
|
44
|
+
- Use `data-testid` for reliable element selection
|
|
45
|
+
- Mock external APIs in unit/integration tests
|
|
46
|
+
- Test keyboard navigation and accessibility
|
|
47
|
+
- Ensure deterministic tests — no flaky timing issues
|
|
48
|
+
- Test interactions, not just initial load — change filters, click buttons, verify results update
|
|
49
|
+
- Verify server-side behavior — confirm filter changes trigger new server requests
|
|
50
|
+
- Start the dev server before browser testing
|
|
51
|
+
- Reload between major test flows to prevent stale state
|
|
52
|
+
- **MANDATORY: Test every UI change at all three responsive breakpoints (Mobile 375px, Tablet 768px, Desktop 1440px) — never test at desktop only. Use `mcp_chrome-devtoo_resize_page()` to switch viewports. See the e2e-testing skill (resolved via the skill matrix) for exact commands and per-breakpoint checklists.**
|
|
53
|
+
|
|
54
|
+
## Critical Rules
|
|
55
|
+
|
|
56
|
+
1. **95% minimum coverage** — all new code must meet the coverage threshold
|
|
57
|
+
2. **Test behavior, not implementation** — tests should survive refactors
|
|
58
|
+
3. **Run the full test suite** — never return without running `yarn nx run <project>:test`
|
|
59
|
+
|
|
60
|
+
## Done When
|
|
61
|
+
|
|
62
|
+
- All specified test scenarios pass (including edge cases)
|
|
63
|
+
- Coverage meets project minimum (95% for new code)
|
|
64
|
+
- Browser validation confirms visual correctness at all breakpoints
|
|
65
|
+
- No test flakiness detected (all tests pass 3 consecutive runs)
|
|
66
|
+
- Test files follow project naming and organization conventions
|
|
67
|
+
|
|
68
|
+
## Out of Scope
|
|
69
|
+
|
|
70
|
+
- Fixing application bugs found during testing (report them, don't fix)
|
|
71
|
+
- Refactoring production code for testability (suggest changes only)
|
|
72
|
+
- Writing database migrations or schema changes
|
|
73
|
+
- Performance optimization beyond identifying bottlenecks during testing
|
|
74
|
+
|
|
75
|
+
## Output Contract
|
|
76
|
+
|
|
77
|
+
When completing a task, return a structured summary:
|
|
78
|
+
|
|
79
|
+
1. **Test Files** — List every test file created or modified
|
|
80
|
+
2. **Coverage** — Test count, pass/fail, coverage percentage for affected projects
|
|
81
|
+
3. **Browser Validation** — Screenshots taken and what they prove (for E2E tasks)
|
|
82
|
+
4. **Edge Cases Tested** — List edge cases covered and any known gaps
|
|
83
|
+
5. **Regressions Checked** — Adjacent features/pages verified to still work
|
|
84
|
+
|
|
85
|
+
See **Base Output Contract** in `general.instructions.md` for the standard closing items (Discovered Issues + Lessons Applied).
|
|
@@ -0,0 +1,63 @@
|
|
|
1
|
+
---
|
|
2
|
+
description: 'UI/UX expert for designing and building accessible, consistent React components with deep knowledge of the design system.'
|
|
3
|
+
name: 'UI/UX Expert'
|
|
4
|
+
model: Gemini 3.1 Pro
|
|
5
|
+
tools: ['search/changes', 'search/codebase', 'edit/editFiles', 'web/fetch', 'vscode/getProjectSetupInfo', 'vscode/installExtension', 'vscode/newWorkspace', 'vscode/runCommand', 'read/problems', 'execute/getTerminalOutput', 'execute/runInTerminal', 'read/terminalLastCommand', 'read/terminalSelection', 'search', 'execute/testFailure', 'search/usages', 'chrome-devtools/*']
|
|
6
|
+
---
|
|
7
|
+
|
|
8
|
+
# UI/UX Expert
|
|
9
|
+
|
|
10
|
+
You are an expert UI/UX developer specializing in building accessible, visually consistent React components based on a design system template.
|
|
11
|
+
|
|
12
|
+
## Critical Rules
|
|
13
|
+
|
|
14
|
+
1. **Reference the project template** for design patterns and consistency
|
|
15
|
+
2. **Use CSS Modules + Sass** for component styles, co-located with components
|
|
16
|
+
3. **Place shared components in the UI library** — never in app-specific directories
|
|
17
|
+
|
|
18
|
+
## Skills
|
|
19
|
+
|
|
20
|
+
### Capability Slots
|
|
21
|
+
|
|
22
|
+
Resolve via [skill-matrix.md](.github/customizations/agents/skill-matrix.md).
|
|
23
|
+
|
|
24
|
+
- **design-system** — Design thinking, typography, color/theme, motion, spatial composition, visual quality
|
|
25
|
+
- **ui-library** — Component architecture, TypeScript patterns, hooks, styling, testing
|
|
26
|
+
- **accessibility** — Keyboard navigation, screen reader semantics, contrast, forms, graphics, tables
|
|
27
|
+
- **e2e-testing** — Viewport resize commands and per-breakpoint checklists
|
|
28
|
+
|
|
29
|
+
## Guidelines
|
|
30
|
+
|
|
31
|
+
- Design with mobile-first responsive approach
|
|
32
|
+
- **Validate every UI change at all three breakpoints:** Mobile (375px), Tablet (768px), Desktop (1440px) — load the **e2e-testing** skill (resolved via matrix) for resize commands and per-breakpoint checklists
|
|
33
|
+
- Use semantic HTML before adding ARIA
|
|
34
|
+
- Test with keyboard-only navigation
|
|
35
|
+
- Implement hover, focus, and active states for all interactive elements
|
|
36
|
+
- Use `clsx` for conditional class composition
|
|
37
|
+
- Export all components from the UI library's index
|
|
38
|
+
|
|
39
|
+
## Done When
|
|
40
|
+
|
|
41
|
+
- Components render correctly at all three breakpoints (375px, 768px, 1440px)
|
|
42
|
+
- WCAG 2.2 AA compliance verified (keyboard navigation, contrast, semantics)
|
|
43
|
+
- Components are exported from the UI library index
|
|
44
|
+
- Hover, focus, and active states are implemented for all interactive elements
|
|
45
|
+
- CSS Modules are co-located with components
|
|
46
|
+
|
|
47
|
+
## Out of Scope
|
|
48
|
+
|
|
49
|
+
- Server-side data fetching or API integration
|
|
50
|
+
- Database schema changes or migrations
|
|
51
|
+
- Writing E2E test suites (visual spot-checks during development are in scope)
|
|
52
|
+
- Business logic implementation
|
|
53
|
+
|
|
54
|
+
## Output Contract
|
|
55
|
+
|
|
56
|
+
When completing a task, return a structured summary:
|
|
57
|
+
|
|
58
|
+
1. **Components** — List components created/modified with purpose
|
|
59
|
+
2. **Accessibility** — WCAG checks performed and results
|
|
60
|
+
3. **Responsive** — Breakpoints tested (mobile 375px, tablet 768px, desktop 1440px)
|
|
61
|
+
4. **Visual Evidence** — Screenshots at each breakpoint
|
|
62
|
+
|
|
63
|
+
See **Base Output Contract** in `general.instructions.md` for the standard closing items (Discovered Issues + Lessons Applied).
|
|
@@ -0,0 +1,325 @@
|
|
|
1
|
+
# Agent Expertise Registry
|
|
2
|
+
|
|
3
|
+
Structured tracking of agent performance across sessions. Updated by the Team Lead after task completion.
|
|
4
|
+
|
|
5
|
+
> **Protocol:** See the **agent-memory** skill for update triggers, retrieval protocol, and pruning rules.
|
|
6
|
+
|
|
7
|
+
---
|
|
8
|
+
|
|
9
|
+
## Developer
|
|
10
|
+
|
|
11
|
+
### Strong Areas
|
|
12
|
+
|
|
13
|
+
| Area | Evidence | Last Updated |
|
|
14
|
+
|------|----------|-------------|
|
|
15
|
+
| _(no entries yet)_ | | |
|
|
16
|
+
|
|
17
|
+
### Weak Areas
|
|
18
|
+
|
|
19
|
+
| Area | Evidence | Last Updated |
|
|
20
|
+
|------|----------|-------------|
|
|
21
|
+
| _(no entries yet)_ | | |
|
|
22
|
+
|
|
23
|
+
### File Familiarity
|
|
24
|
+
|
|
25
|
+
_(no entries yet)_
|
|
26
|
+
|
|
27
|
+
---
|
|
28
|
+
|
|
29
|
+
## Testing Expert
|
|
30
|
+
|
|
31
|
+
### Strong Areas
|
|
32
|
+
|
|
33
|
+
| Area | Evidence | Last Updated |
|
|
34
|
+
|------|----------|-------------|
|
|
35
|
+
| _(no entries yet)_ | | |
|
|
36
|
+
|
|
37
|
+
### Weak Areas
|
|
38
|
+
|
|
39
|
+
| Area | Evidence | Last Updated |
|
|
40
|
+
|------|----------|-------------|
|
|
41
|
+
| _(no entries yet)_ | | |
|
|
42
|
+
|
|
43
|
+
### File Familiarity
|
|
44
|
+
|
|
45
|
+
_(no entries yet)_
|
|
46
|
+
|
|
47
|
+
---
|
|
48
|
+
|
|
49
|
+
## Content Engineer
|
|
50
|
+
|
|
51
|
+
### Strong Areas
|
|
52
|
+
|
|
53
|
+
| Area | Evidence | Last Updated |
|
|
54
|
+
|------|----------|-------------|
|
|
55
|
+
| _(no entries yet)_ | | |
|
|
56
|
+
|
|
57
|
+
### Weak Areas
|
|
58
|
+
|
|
59
|
+
| Area | Evidence | Last Updated |
|
|
60
|
+
|------|----------|-------------|
|
|
61
|
+
| _(no entries yet)_ | | |
|
|
62
|
+
|
|
63
|
+
### File Familiarity
|
|
64
|
+
|
|
65
|
+
_(no entries yet)_
|
|
66
|
+
|
|
67
|
+
---
|
|
68
|
+
|
|
69
|
+
## Database Engineer
|
|
70
|
+
|
|
71
|
+
### Strong Areas
|
|
72
|
+
|
|
73
|
+
| Area | Evidence | Last Updated |
|
|
74
|
+
|------|----------|-------------|
|
|
75
|
+
| _(no entries yet)_ | | |
|
|
76
|
+
|
|
77
|
+
### Weak Areas
|
|
78
|
+
|
|
79
|
+
| Area | Evidence | Last Updated |
|
|
80
|
+
|------|----------|-------------|
|
|
81
|
+
| _(no entries yet)_ | | |
|
|
82
|
+
|
|
83
|
+
### File Familiarity
|
|
84
|
+
|
|
85
|
+
_(no entries yet)_
|
|
86
|
+
|
|
87
|
+
---
|
|
88
|
+
|
|
89
|
+
## UI/UX Expert
|
|
90
|
+
|
|
91
|
+
### Strong Areas
|
|
92
|
+
|
|
93
|
+
| Area | Evidence | Last Updated |
|
|
94
|
+
|------|----------|-------------|
|
|
95
|
+
| _(no entries yet)_ | | |
|
|
96
|
+
|
|
97
|
+
### Weak Areas
|
|
98
|
+
|
|
99
|
+
| Area | Evidence | Last Updated |
|
|
100
|
+
|------|----------|-------------|
|
|
101
|
+
| _(no entries yet)_ | | |
|
|
102
|
+
|
|
103
|
+
### File Familiarity
|
|
104
|
+
|
|
105
|
+
_(no entries yet)_
|
|
106
|
+
|
|
107
|
+
---
|
|
108
|
+
|
|
109
|
+
## Performance Expert
|
|
110
|
+
|
|
111
|
+
### Strong Areas
|
|
112
|
+
|
|
113
|
+
| Area | Evidence | Last Updated |
|
|
114
|
+
|------|----------|-------------|
|
|
115
|
+
| _(no entries yet)_ | | |
|
|
116
|
+
|
|
117
|
+
### Weak Areas
|
|
118
|
+
|
|
119
|
+
| Area | Evidence | Last Updated |
|
|
120
|
+
|------|----------|-------------|
|
|
121
|
+
| _(no entries yet)_ | | |
|
|
122
|
+
|
|
123
|
+
### File Familiarity
|
|
124
|
+
|
|
125
|
+
_(no entries yet)_
|
|
126
|
+
|
|
127
|
+
---
|
|
128
|
+
|
|
129
|
+
## Security Expert
|
|
130
|
+
|
|
131
|
+
### Strong Areas
|
|
132
|
+
|
|
133
|
+
| Area | Evidence | Last Updated |
|
|
134
|
+
|------|----------|-------------|
|
|
135
|
+
| _(no entries yet)_ | | |
|
|
136
|
+
|
|
137
|
+
### Weak Areas
|
|
138
|
+
|
|
139
|
+
| Area | Evidence | Last Updated |
|
|
140
|
+
|------|----------|-------------|
|
|
141
|
+
| _(no entries yet)_ | | |
|
|
142
|
+
|
|
143
|
+
### File Familiarity
|
|
144
|
+
|
|
145
|
+
_(no entries yet)_
|
|
146
|
+
|
|
147
|
+
---
|
|
148
|
+
|
|
149
|
+
## Data Expert
|
|
150
|
+
|
|
151
|
+
### Strong Areas
|
|
152
|
+
|
|
153
|
+
| Area | Evidence | Last Updated |
|
|
154
|
+
|------|----------|-------------|
|
|
155
|
+
| _(no entries yet)_ | | |
|
|
156
|
+
|
|
157
|
+
### Weak Areas
|
|
158
|
+
|
|
159
|
+
| Area | Evidence | Last Updated |
|
|
160
|
+
|------|----------|-------------|
|
|
161
|
+
| _(no entries yet)_ | | |
|
|
162
|
+
|
|
163
|
+
### File Familiarity
|
|
164
|
+
|
|
165
|
+
_(no entries yet)_
|
|
166
|
+
|
|
167
|
+
---
|
|
168
|
+
|
|
169
|
+
## DevOps Expert
|
|
170
|
+
|
|
171
|
+
### Strong Areas
|
|
172
|
+
|
|
173
|
+
| Area | Evidence | Last Updated |
|
|
174
|
+
|------|----------|-------------|
|
|
175
|
+
| _(no entries yet)_ | | |
|
|
176
|
+
|
|
177
|
+
### Weak Areas
|
|
178
|
+
|
|
179
|
+
| Area | Evidence | Last Updated |
|
|
180
|
+
|------|----------|-------------|
|
|
181
|
+
| _(no entries yet)_ | | |
|
|
182
|
+
|
|
183
|
+
### File Familiarity
|
|
184
|
+
|
|
185
|
+
_(no entries yet)_
|
|
186
|
+
|
|
187
|
+
---
|
|
188
|
+
|
|
189
|
+
## Architect
|
|
190
|
+
|
|
191
|
+
### Strong Areas
|
|
192
|
+
|
|
193
|
+
| Area | Evidence | Last Updated |
|
|
194
|
+
|------|----------|-------------|
|
|
195
|
+
| _(no entries yet)_ | | |
|
|
196
|
+
|
|
197
|
+
### Weak Areas
|
|
198
|
+
|
|
199
|
+
| Area | Evidence | Last Updated |
|
|
200
|
+
|------|----------|-------------|
|
|
201
|
+
| _(no entries yet)_ | | |
|
|
202
|
+
|
|
203
|
+
### File Familiarity
|
|
204
|
+
|
|
205
|
+
_(no entries yet)_
|
|
206
|
+
|
|
207
|
+
---
|
|
208
|
+
|
|
209
|
+
## Documentation Writer
|
|
210
|
+
|
|
211
|
+
### Strong Areas
|
|
212
|
+
|
|
213
|
+
| Area | Evidence | Last Updated |
|
|
214
|
+
|------|----------|-------------|
|
|
215
|
+
| _(no entries yet)_ | | |
|
|
216
|
+
|
|
217
|
+
### Weak Areas
|
|
218
|
+
|
|
219
|
+
| Area | Evidence | Last Updated |
|
|
220
|
+
|------|----------|-------------|
|
|
221
|
+
| _(no entries yet)_ | | |
|
|
222
|
+
|
|
223
|
+
### File Familiarity
|
|
224
|
+
|
|
225
|
+
_(no entries yet)_
|
|
226
|
+
|
|
227
|
+
---
|
|
228
|
+
|
|
229
|
+
## Researcher
|
|
230
|
+
|
|
231
|
+
### Strong Areas
|
|
232
|
+
|
|
233
|
+
| Area | Evidence | Last Updated |
|
|
234
|
+
|------|----------|-------------|
|
|
235
|
+
| _(no entries yet)_ | | |
|
|
236
|
+
|
|
237
|
+
### Weak Areas
|
|
238
|
+
|
|
239
|
+
| Area | Evidence | Last Updated |
|
|
240
|
+
|------|----------|-------------|
|
|
241
|
+
| _(no entries yet)_ | | |
|
|
242
|
+
|
|
243
|
+
### File Familiarity
|
|
244
|
+
|
|
245
|
+
_(no entries yet)_
|
|
246
|
+
|
|
247
|
+
---
|
|
248
|
+
|
|
249
|
+
## Copywriter
|
|
250
|
+
|
|
251
|
+
### Strong Areas
|
|
252
|
+
|
|
253
|
+
| Area | Evidence | Last Updated |
|
|
254
|
+
|------|----------|-------------|
|
|
255
|
+
| _(no entries yet)_ | | |
|
|
256
|
+
|
|
257
|
+
### Weak Areas
|
|
258
|
+
|
|
259
|
+
| Area | Evidence | Last Updated |
|
|
260
|
+
|------|----------|-------------|
|
|
261
|
+
| _(no entries yet)_ | | |
|
|
262
|
+
|
|
263
|
+
### File Familiarity
|
|
264
|
+
|
|
265
|
+
_(no entries yet)_
|
|
266
|
+
|
|
267
|
+
---
|
|
268
|
+
|
|
269
|
+
## SEO Specialist
|
|
270
|
+
|
|
271
|
+
### Strong Areas
|
|
272
|
+
|
|
273
|
+
| Area | Evidence | Last Updated |
|
|
274
|
+
|------|----------|-------------|
|
|
275
|
+
| _(no entries yet)_ | | |
|
|
276
|
+
|
|
277
|
+
### Weak Areas
|
|
278
|
+
|
|
279
|
+
| Area | Evidence | Last Updated |
|
|
280
|
+
|------|----------|-------------|
|
|
281
|
+
| _(no entries yet)_ | | |
|
|
282
|
+
|
|
283
|
+
### File Familiarity
|
|
284
|
+
|
|
285
|
+
_(no entries yet)_
|
|
286
|
+
|
|
287
|
+
---
|
|
288
|
+
|
|
289
|
+
## API Designer
|
|
290
|
+
|
|
291
|
+
### Strong Areas
|
|
292
|
+
|
|
293
|
+
| Area | Evidence | Last Updated |
|
|
294
|
+
|------|----------|-------------|
|
|
295
|
+
| _(no entries yet)_ | | |
|
|
296
|
+
|
|
297
|
+
### Weak Areas
|
|
298
|
+
|
|
299
|
+
| Area | Evidence | Last Updated |
|
|
300
|
+
|------|----------|-------------|
|
|
301
|
+
| _(no entries yet)_ | | |
|
|
302
|
+
|
|
303
|
+
### File Familiarity
|
|
304
|
+
|
|
305
|
+
_(no entries yet)_
|
|
306
|
+
|
|
307
|
+
---
|
|
308
|
+
|
|
309
|
+
## Release Manager
|
|
310
|
+
|
|
311
|
+
### Strong Areas
|
|
312
|
+
|
|
313
|
+
| Area | Evidence | Last Updated |
|
|
314
|
+
|------|----------|-------------|
|
|
315
|
+
| _(no entries yet)_ | | |
|
|
316
|
+
|
|
317
|
+
### Weak Areas
|
|
318
|
+
|
|
319
|
+
| Area | Evidence | Last Updated |
|
|
320
|
+
|------|----------|-------------|
|
|
321
|
+
| _(no entries yet)_ | | |
|
|
322
|
+
|
|
323
|
+
### File Familiarity
|
|
324
|
+
|
|
325
|
+
_(no entries yet)_
|
|
@@ -0,0 +1,69 @@
|
|
|
1
|
+
````markdown
|
|
2
|
+
# Agent Failure Log (Dead Letter Queue)
|
|
3
|
+
|
|
4
|
+
Structured log of failed agent delegations for diagnosis and retry. Prevents failed work from silently disappearing.
|
|
5
|
+
|
|
6
|
+
> **Review this file at the start of each session.** Check for pending failures that need retry and patterns that indicate systemic issues.
|
|
7
|
+
|
|
8
|
+
---
|
|
9
|
+
|
|
10
|
+
## How to Use This File
|
|
11
|
+
|
|
12
|
+
### When to add an entry
|
|
13
|
+
|
|
14
|
+
Add an entry when **any** of these occur:
|
|
15
|
+
|
|
16
|
+
- A delegated agent fails to complete its task after 2+ attempts
|
|
17
|
+
- A background agent produces output that fails all verification gates
|
|
18
|
+
- _Exception:_ when a panel review BLOCKs 3 times and requires escalation, do **not** add a DLQ entry — **create a dispute record** in `DISPUTES.md` instead (see below)
|
|
19
|
+
- An agent encounters an unrecoverable error (e.g., MCP server down, tool unavailable)
|
|
20
|
+
|
|
21
|
+
> **Disputes vs. DLQ:** When a panel BLOCKs 3 times or agents fundamentally disagree on an approach, create a **dispute record** in `DISPUTES.md` — not a DLQ entry. Disputes package both perspectives and resolution options for human decision-making. DLQ entries are for simple failures (tool errors, timeouts, scope creep).
|
|
22
|
+
|
|
23
|
+
### Entry format
|
|
24
|
+
|
|
25
|
+
```markdown
|
|
26
|
+
### DLQ-XXX: Short description
|
|
27
|
+
|
|
28
|
+
| Field | Value |
|
|
29
|
+
|-------|-------|
|
|
30
|
+
| **Date** | YYYY-MM-DD |
|
|
31
|
+
| **Agent** | Agent name |
|
|
32
|
+
| **Linear Issue** | PREFIX-XX (if applicable) |
|
|
33
|
+
| **Failure Type** | `verification-fail` / `tool-error` / `panel-block` / `timeout` / `scope-creep` |
|
|
34
|
+
| **Attempts** | Number of attempts before logging |
|
|
35
|
+
|
|
36
|
+
**Task:** What was the agent supposed to do?
|
|
37
|
+
|
|
38
|
+
**Failure Details:** What went wrong? Include error messages, failed checks, or panel BLOCK reasons.
|
|
39
|
+
|
|
40
|
+
**Root Cause:** Why did it fail? (if known)
|
|
41
|
+
|
|
42
|
+
**Resolution:** How was it eventually resolved? (or "pending" if unresolved)
|
|
43
|
+
```
|
|
44
|
+
|
|
45
|
+
### Failure types
|
|
46
|
+
|
|
47
|
+
| Type | Description |
|
|
48
|
+
|------|-------------|
|
|
49
|
+
| `verification-fail` | Agent completed but output fails lint/test/build/browser checks |
|
|
50
|
+
| `tool-error` | MCP server down, tool unavailable, API error |
|
|
51
|
+
| `panel-block` | Panel review blocked 3+ times |
|
|
52
|
+
| `timeout` | Agent ran out of context or took too long |
|
|
53
|
+
| `scope-creep` | Agent modified files outside its partition or went off-task |
|
|
54
|
+
|
|
55
|
+
---
|
|
56
|
+
|
|
57
|
+
## Failures
|
|
58
|
+
|
|
59
|
+
<!-- Failures are appended here by the Team Lead during sessions.
|
|
60
|
+
Start numbering from DLQ-001. -->
|
|
61
|
+
|
|
62
|
+
---
|
|
63
|
+
|
|
64
|
+
## Index
|
|
65
|
+
|
|
66
|
+
| ID | Date | Agent | Type | Status |
|
|
67
|
+
|----|------|-------|------|--------|
|
|
68
|
+
|
|
69
|
+
````
|
|
@@ -0,0 +1,58 @@
|
|
|
1
|
+
````markdown
|
|
2
|
+
# Agent Performance Tracking
|
|
3
|
+
|
|
4
|
+
> **Last Updated:** _(auto-updated by metrics-report prompt)_
|
|
5
|
+
|
|
6
|
+
Tracks agent success rates across panel reviews and delegated tasks to inform model routing and panel reviewer selection.
|
|
7
|
+
|
|
8
|
+
## Data Sources
|
|
9
|
+
|
|
10
|
+
Performance data is collected automatically via NDJSON session logs:
|
|
11
|
+
- **Session data:** `customizations/logs/sessions.ndjson` — appended by every agent after each session
|
|
12
|
+
- **Delegation data:** `customizations/logs/delegations.ndjson` — appended by the Team Lead after each delegation
|
|
13
|
+
- **Full reporting:** Run the **metrics-report** prompt to generate a dashboard from all sources
|
|
14
|
+
|
|
15
|
+
## Quick Queries
|
|
16
|
+
|
|
17
|
+
```bash
|
|
18
|
+
# Sessions per agent
|
|
19
|
+
jq -r '.agent' customizations/logs/sessions.ndjson | sort | uniq -c | sort -rn
|
|
20
|
+
|
|
21
|
+
# Outcome counts per agent (success rate = successful sessions / total sessions for that agent)
|
|
22
|
+
jq -r '[.agent, .outcome] | @tsv' customizations/logs/sessions.ndjson | sort | uniq -c
|
|
23
|
+
|
|
24
|
+
# Delegation tier distribution
|
|
25
|
+
jq -r '.tier' customizations/logs/delegations.ndjson | sort | uniq -c
|
|
26
|
+
|
|
27
|
+
# Failed delegations
|
|
28
|
+
jq 'select(.outcome == "failed")' customizations/logs/delegations.ndjson
|
|
29
|
+
```
|
|
30
|
+
|
|
31
|
+
## Panel Review Performance
|
|
32
|
+
|
|
33
|
+
Panel review data is collected automatically via `customizations/logs/panels.ndjson` (appended by the panel runner after each review — see step 7 in the **panel-majority-vote** skill).
|
|
34
|
+
|
|
35
|
+
```bash
|
|
36
|
+
# Total panel reviews
|
|
37
|
+
wc -l customizations/logs/panels.ndjson
|
|
38
|
+
|
|
39
|
+
# Pass vs block rate
|
|
40
|
+
jq -r '.verdict' customizations/logs/panels.ndjson | sort | uniq -c
|
|
41
|
+
|
|
42
|
+
# Reviews by panel key
|
|
43
|
+
jq -r '.panel_key' customizations/logs/panels.ndjson | sort | uniq -c | sort -rn
|
|
44
|
+
|
|
45
|
+
# Reviews that required retries (attempt > 1)
|
|
46
|
+
jq 'select(.attempt > 1)' customizations/logs/panels.ndjson
|
|
47
|
+
|
|
48
|
+
# Average SHOULD-FIX items per review
|
|
49
|
+
jq -s 'if length > 0 then (map(.should_fix) | add) / length else 0 end' customizations/logs/panels.ndjson
|
|
50
|
+
```
|
|
51
|
+
|
|
52
|
+
## Usage
|
|
53
|
+
|
|
54
|
+
Referenced by the **panel-majority-vote** skill for weight assignment:
|
|
55
|
+
- Agents with >80% success rate for similar reviews get a +1 weight bonus
|
|
56
|
+
- This file is the source of truth for that metric
|
|
57
|
+
|
|
58
|
+
````
|