@neyugn/agent-kits 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (158) hide show
  1. package/LICENSE +21 -0
  2. package/README.md +514 -0
  3. package/README.vi.md +410 -0
  4. package/README.zh.md +410 -0
  5. package/dist/cli.d.ts +1 -0
  6. package/dist/cli.js +422 -0
  7. package/kits/coder/ARCHITECTURE.md +289 -0
  8. package/kits/coder/agents/ai-engineer.md +344 -0
  9. package/kits/coder/agents/backend-specialist.md +270 -0
  10. package/kits/coder/agents/cloud-architect.md +363 -0
  11. package/kits/coder/agents/code-reviewer.md +284 -0
  12. package/kits/coder/agents/data-engineer.md +401 -0
  13. package/kits/coder/agents/database-specialist.md +251 -0
  14. package/kits/coder/agents/debugger.md +209 -0
  15. package/kits/coder/agents/devops-engineer.md +281 -0
  16. package/kits/coder/agents/documentation-writer.md +296 -0
  17. package/kits/coder/agents/frontend-specialist.md +298 -0
  18. package/kits/coder/agents/i18n-specialist.md +348 -0
  19. package/kits/coder/agents/integration-specialist.md +314 -0
  20. package/kits/coder/agents/mobile-developer.md +271 -0
  21. package/kits/coder/agents/multi-tenant-architect.md +281 -0
  22. package/kits/coder/agents/orchestrator.md +263 -0
  23. package/kits/coder/agents/performance-analyst.md +327 -0
  24. package/kits/coder/agents/project-planner.md +277 -0
  25. package/kits/coder/agents/queue-specialist.md +282 -0
  26. package/kits/coder/agents/realtime-specialist.md +267 -0
  27. package/kits/coder/agents/security-auditor.md +253 -0
  28. package/kits/coder/agents/test-engineer.md +315 -0
  29. package/kits/coder/agents/ux-researcher.md +388 -0
  30. package/kits/coder/rules/.cursorrules +287 -0
  31. package/kits/coder/rules/CLAUDE.md +287 -0
  32. package/kits/coder/rules/CODEX.md +287 -0
  33. package/kits/coder/rules/GEMINI.md +287 -0
  34. package/kits/coder/scripts/checklist.py +318 -0
  35. package/kits/coder/scripts/kit_status.py +292 -0
  36. package/kits/coder/scripts/skills_manager.py +243 -0
  37. package/kits/coder/scripts/verify_all.py +391 -0
  38. package/kits/coder/skills/accessibility-patterns/SKILL.md +372 -0
  39. package/kits/coder/skills/accessibility-patterns/scripts/a11y_checker.py +211 -0
  40. package/kits/coder/skills/ai-rag-patterns/SKILL.md +444 -0
  41. package/kits/coder/skills/api-patterns/SKILL.md +316 -0
  42. package/kits/coder/skills/api-patterns/assets/.gitkeep +1 -0
  43. package/kits/coder/skills/api-patterns/references/deep-dive.md +21 -0
  44. package/kits/coder/skills/api-patterns/scripts/api_validator.py +253 -0
  45. package/kits/coder/skills/api-patterns/scripts/validate.py +56 -0
  46. package/kits/coder/skills/auth-patterns/SKILL.md +267 -0
  47. package/kits/coder/skills/aws-patterns/SKILL.md +576 -0
  48. package/kits/coder/skills/brainstorming/SKILL.md +370 -0
  49. package/kits/coder/skills/brainstorming/assets/.gitkeep +1 -0
  50. package/kits/coder/skills/brainstorming/references/deep-dive.md +21 -0
  51. package/kits/coder/skills/brainstorming/scripts/validate.py +56 -0
  52. package/kits/coder/skills/clean-code/SKILL.md +240 -0
  53. package/kits/coder/skills/clean-code/assets/.gitkeep +1 -0
  54. package/kits/coder/skills/clean-code/references/deep-dive.md +21 -0
  55. package/kits/coder/skills/clean-code/scripts/lint_runner.py +186 -0
  56. package/kits/coder/skills/clean-code/scripts/validate.py +56 -0
  57. package/kits/coder/skills/database-design/SKILL.md +255 -0
  58. package/kits/coder/skills/database-design/assets/.gitkeep +1 -0
  59. package/kits/coder/skills/database-design/references/deep-dive.md +21 -0
  60. package/kits/coder/skills/database-design/scripts/schema_validator.py +272 -0
  61. package/kits/coder/skills/database-design/scripts/validate.py +56 -0
  62. package/kits/coder/skills/docker-patterns/SKILL.md +240 -0
  63. package/kits/coder/skills/documentation-templates/SKILL.md +441 -0
  64. package/kits/coder/skills/e2e-testing/SKILL.md +457 -0
  65. package/kits/coder/skills/flutter-patterns/SKILL.md +330 -0
  66. package/kits/coder/skills/frontend-design/SKILL.md +127 -0
  67. package/kits/coder/skills/github-actions/SKILL.md +349 -0
  68. package/kits/coder/skills/gitlab-ci-patterns/SKILL.md +466 -0
  69. package/kits/coder/skills/graphql-patterns/SKILL.md +558 -0
  70. package/kits/coder/skills/i18n-localization/SKILL.md +345 -0
  71. package/kits/coder/skills/i18n-localization/scripts/i18n_checker.py +267 -0
  72. package/kits/coder/skills/kubernetes-patterns/SKILL.md +357 -0
  73. package/kits/coder/skills/mermaid-diagrams/SKILL.md +351 -0
  74. package/kits/coder/skills/mobile-design/SKILL.md +305 -0
  75. package/kits/coder/skills/monitoring-observability/SKILL.md +458 -0
  76. package/kits/coder/skills/multi-tenancy/SKILL.md +317 -0
  77. package/kits/coder/skills/multi-tenancy/assets/.gitkeep +1 -0
  78. package/kits/coder/skills/multi-tenancy/references/deep-dive.md +21 -0
  79. package/kits/coder/skills/multi-tenancy/scripts/validate.py +56 -0
  80. package/kits/coder/skills/nodejs-best-practices/SKILL.md +220 -0
  81. package/kits/coder/skills/performance-profiling/SKILL.md +333 -0
  82. package/kits/coder/skills/performance-profiling/assets/.gitkeep +1 -0
  83. package/kits/coder/skills/performance-profiling/references/deep-dive.md +21 -0
  84. package/kits/coder/skills/performance-profiling/scripts/validate.py +56 -0
  85. package/kits/coder/skills/plan-writing/SKILL.md +360 -0
  86. package/kits/coder/skills/plan-writing/assets/.gitkeep +1 -0
  87. package/kits/coder/skills/plan-writing/references/deep-dive.md +21 -0
  88. package/kits/coder/skills/plan-writing/scripts/validate.py +56 -0
  89. package/kits/coder/skills/postgres-patterns/SKILL.md +361 -0
  90. package/kits/coder/skills/prompt-engineering/SKILL.md +277 -0
  91. package/kits/coder/skills/queue-patterns/SKILL.md +359 -0
  92. package/kits/coder/skills/queue-patterns/assets/.gitkeep +1 -0
  93. package/kits/coder/skills/queue-patterns/references/deep-dive.md +21 -0
  94. package/kits/coder/skills/queue-patterns/scripts/validate.py +56 -0
  95. package/kits/coder/skills/react-native-patterns/SKILL.md +393 -0
  96. package/kits/coder/skills/react-patterns/SKILL.md +319 -0
  97. package/kits/coder/skills/realtime-patterns/SKILL.md +506 -0
  98. package/kits/coder/skills/realtime-patterns/assets/.gitkeep +1 -0
  99. package/kits/coder/skills/realtime-patterns/references/deep-dive.md +21 -0
  100. package/kits/coder/skills/realtime-patterns/scripts/validate.py +56 -0
  101. package/kits/coder/skills/redis-patterns/SKILL.md +484 -0
  102. package/kits/coder/skills/security-fundamentals/SKILL.md +363 -0
  103. package/kits/coder/skills/security-fundamentals/assets/.gitkeep +1 -0
  104. package/kits/coder/skills/security-fundamentals/references/deep-dive.md +21 -0
  105. package/kits/coder/skills/security-fundamentals/scripts/security_scan.py +326 -0
  106. package/kits/coder/skills/security-fundamentals/scripts/validate.py +56 -0
  107. package/kits/coder/skills/seo-patterns/SKILL.md +262 -0
  108. package/kits/coder/skills/seo-patterns/scripts/seo_checker.py +211 -0
  109. package/kits/coder/skills/systematic-debugging/SKILL.md +478 -0
  110. package/kits/coder/skills/systematic-debugging/assets/.gitkeep +1 -0
  111. package/kits/coder/skills/systematic-debugging/references/deep-dive.md +21 -0
  112. package/kits/coder/skills/systematic-debugging/scripts/validate.py +56 -0
  113. package/kits/coder/skills/tailwind-patterns/SKILL.md +395 -0
  114. package/kits/coder/skills/terraform-patterns/SKILL.md +470 -0
  115. package/kits/coder/skills/testing-patterns/SKILL.md +285 -0
  116. package/kits/coder/skills/testing-patterns/assets/.gitkeep +1 -0
  117. package/kits/coder/skills/testing-patterns/references/deep-dive.md +21 -0
  118. package/kits/coder/skills/testing-patterns/scripts/test_runner.py +219 -0
  119. package/kits/coder/skills/testing-patterns/scripts/validate.py +56 -0
  120. package/kits/coder/skills/typescript-patterns/SKILL.md +417 -0
  121. package/kits/coder/skills/ui-ux-pro-max/SKILL.md +364 -0
  122. package/kits/coder/skills/ui-ux-pro-max/data/charts.csv +26 -0
  123. package/kits/coder/skills/ui-ux-pro-max/data/colors.csv +97 -0
  124. package/kits/coder/skills/ui-ux-pro-max/data/icons.csv +101 -0
  125. package/kits/coder/skills/ui-ux-pro-max/data/landing.csv +31 -0
  126. package/kits/coder/skills/ui-ux-pro-max/data/products.csv +97 -0
  127. package/kits/coder/skills/ui-ux-pro-max/data/prompts.csv +24 -0
  128. package/kits/coder/skills/ui-ux-pro-max/data/react-performance.csv +45 -0
  129. package/kits/coder/skills/ui-ux-pro-max/data/stacks/flutter.csv +53 -0
  130. package/kits/coder/skills/ui-ux-pro-max/data/stacks/html-tailwind.csv +56 -0
  131. package/kits/coder/skills/ui-ux-pro-max/data/stacks/nextjs.csv +53 -0
  132. package/kits/coder/skills/ui-ux-pro-max/data/stacks/nuxt-ui.csv +51 -0
  133. package/kits/coder/skills/ui-ux-pro-max/data/stacks/nuxtjs.csv +59 -0
  134. package/kits/coder/skills/ui-ux-pro-max/data/stacks/react-native.csv +52 -0
  135. package/kits/coder/skills/ui-ux-pro-max/data/stacks/react.csv +54 -0
  136. package/kits/coder/skills/ui-ux-pro-max/data/stacks/shadcn.csv +61 -0
  137. package/kits/coder/skills/ui-ux-pro-max/data/stacks/svelte.csv +54 -0
  138. package/kits/coder/skills/ui-ux-pro-max/data/stacks/swiftui.csv +51 -0
  139. package/kits/coder/skills/ui-ux-pro-max/data/stacks/vue.csv +50 -0
  140. package/kits/coder/skills/ui-ux-pro-max/data/styles.csv +59 -0
  141. package/kits/coder/skills/ui-ux-pro-max/data/typography.csv +58 -0
  142. package/kits/coder/skills/ui-ux-pro-max/data/ui-reasoning.csv +101 -0
  143. package/kits/coder/skills/ui-ux-pro-max/data/ux-guidelines.csv +100 -0
  144. package/kits/coder/skills/ui-ux-pro-max/data/web-interface.csv +31 -0
  145. package/kits/coder/skills/ui-ux-pro-max/scripts/__pycache__/core.cpython-314.pyc +0 -0
  146. package/kits/coder/skills/ui-ux-pro-max/scripts/__pycache__/design_system.cpython-314.pyc +0 -0
  147. package/kits/coder/skills/ui-ux-pro-max/scripts/core.py +257 -0
  148. package/kits/coder/skills/ui-ux-pro-max/scripts/design_system.py +488 -0
  149. package/kits/coder/skills/ui-ux-pro-max/scripts/search.py +76 -0
  150. package/kits/coder/workflows/.gitkeep +20 -0
  151. package/kits/coder/workflows/create.md +152 -0
  152. package/kits/coder/workflows/debug.md +223 -0
  153. package/kits/coder/workflows/deploy.md +283 -0
  154. package/kits/coder/workflows/orchestrate.md +243 -0
  155. package/kits/coder/workflows/plan.md +134 -0
  156. package/kits/coder/workflows/test.md +237 -0
  157. package/kits/coder/workflows/ui-ux-pro-max.md +109 -0
  158. package/package.json +49 -0
@@ -0,0 +1,289 @@
1
+ # AGT-Kit Architecture
2
+
3
+ > AI Agent Capability Expansion Toolkit
4
+
5
+ ---
6
+
7
+ ## 📋 Overview
8
+
9
+ AGT-Kit is a modular system consisting of:
10
+
11
+ - **Specialist Agents** - Role-based AI personas
12
+ - **Skills** - Domain-specific knowledge modules
13
+ - **Workflows** - Slash command procedures
14
+ - **Common Skills** - Universal skills shared across all kits
15
+
16
+ ---
17
+
18
+ ## 🔗 Common Skills
19
+
20
+ This kit inherits from the **Common Skills Layer**. See `COMMON.md` for full documentation.
21
+
22
+ | Skill | Description | Workflow |
23
+ | -------------- | -------------------------------------------------------- | --------- |
24
+ | `filter-skill` | Analyze workspace and enable/disable skills by techstack | `/filter` |
25
+
26
+ ### Usage
27
+
28
+ ```bash
29
+ /filter # Analyze workspace and recommend skill filtering
30
+ ```
31
+
32
+ Common skills are automatically installed and available in all kits.
33
+
34
+ ---
35
+
36
+ ## 🏗️ Directory Structure
37
+
38
+ ```plaintext
39
+ .agent/
40
+ ├── ARCHITECTURE.md # This file
41
+ ├── agents/ # Specialist Agents
42
+ ├── skills/ # Skills (knowledge modules)
43
+ ├── workflows/ # Slash Commands
44
+ ├── rules/ # Global Rules
45
+ └── scripts/ # Master Validation Scripts
46
+ ```
47
+
48
+ ---
49
+
50
+ ## 🤖 Agents
51
+
52
+ Specialist AI personas for different domains.
53
+
54
+ ### Tier 1: Master Agents
55
+
56
+ | Agent | Focus | Skills Used |
57
+ | ----------------- | ------------------------ | ------------------------------------------------------ |
58
+ | `orchestrator` | Multi-agent coordination | clean-code, brainstorming, plan-writing, ui-ux-pro-max |
59
+ | `project-planner` | Smart project planning | clean-code, plan-writing, brainstorming |
60
+ | `debugger` | Systematic debugging | clean-code, systematic-debugging, testing-patterns |
61
+
62
+ ### Tier 2: Development Specialists
63
+
64
+ | Agent | Focus | Skills Used |
65
+ | --------------------- | ------------------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------ |
66
+ | `frontend-specialist` | React/Next.js/Vue, UI/UX | clean-code, react-patterns, typescript-patterns, tailwind-patterns, frontend-design, testing-patterns, seo-patterns, ui-ux-pro-max |
67
+ | `backend-specialist` | APIs, server logic, databases | clean-code, nodejs-best-practices, api-patterns, database-design, graphql-patterns, redis-patterns |
68
+ | `mobile-developer` | React Native, Flutter, cross-platform | clean-code, mobile-design, testing-patterns, flutter-patterns, react-native-patterns, ui-ux-pro-max |
69
+ | `database-specialist` | Schema design, queries, migrations | clean-code, database-design, postgres-patterns, api-patterns |
70
+ | `devops-engineer` | CI/CD, deployment, infrastructure | clean-code, docker-patterns, kubernetes-patterns, github-actions, gitlab-ci-patterns, monitoring-observability, terraform-patterns, aws-patterns |
71
+
72
+ ### Tier 3: Quality & Security
73
+
74
+ | Agent | Focus | Skills Used |
75
+ | --------------------- | -------------------------------- | -------------------------------------------------------------- |
76
+ | `security-auditor` | OWASP 2025, supply chain, GenAI | clean-code, security-fundamentals, api-patterns, auth-patterns |
77
+ | `code-reviewer` | PR reviews, AI code validation | clean-code, testing-patterns, security-fundamentals |
78
+ | `test-engineer` | TDD, testing pyramid, automation | clean-code, testing-patterns, e2e-testing |
79
+ | `performance-analyst` | Core Web Vitals, profiling | clean-code, performance-profiling |
80
+
81
+ ### Tier 4: Domain Specialists
82
+
83
+ | Agent | Focus | Skills Used |
84
+ | ------------------------ | ----------------------------------- | --------------------------------------------------------------------------------------------------------------- |
85
+ | `realtime-specialist` | WebSocket, Socket.IO, event-driven | clean-code, api-patterns, realtime-patterns |
86
+ | `multi-tenant-architect` | Tenant isolation, SaaS partitioning | multi-tenancy, clean-code, database-design, api-patterns |
87
+ | `queue-specialist` | Message queues, background jobs | queue-patterns, clean-code, api-patterns |
88
+ | `integration-specialist` | External APIs, webhooks | clean-code, api-patterns |
89
+ | `ai-engineer` | LLM, RAG, AI/ML systems | clean-code, ai-rag-patterns, prompt-engineering, api-patterns, database-design |
90
+ | `cloud-architect` | AWS, Azure, GCP, multi-cloud | clean-code, kubernetes-patterns, docker-patterns, monitoring-observability, security-fundamentals, aws-patterns |
91
+ | `data-engineer` | ETL, data pipelines, analytics | clean-code, database-design, postgres-patterns, api-patterns |
92
+
93
+ ### Tier 5: Support Agents
94
+
95
+ | Agent | Focus | Skills Used |
96
+ | ---------------------- | ---------------------------------- | ------------------------------------------------------------------ |
97
+ | `documentation-writer` | Technical docs, API docs, ADRs | clean-code, documentation-templates, mermaid-diagrams |
98
+ | `i18n-specialist` | Internationalization, localization | clean-code, i18n-localization |
99
+ | `ux-researcher` | UX research, usability, a11y | clean-code, frontend-design, accessibility-patterns, ui-ux-pro-max |
100
+
101
+ ---
102
+
103
+ ## 🧩 Skills (40)
104
+
105
+ Modular knowledge domains that agents can load on-demand based on task context.
106
+
107
+ ### Core Skills
108
+
109
+ | Skill | Description |
110
+ | -------------------------- | ------------------------------------------------------------------------------------------------------------ |
111
+ | `clean-code` | Pragmatic coding standards. Naming, functions, structure, AI coding style. Used by ALL agents. |
112
+ | `api-patterns` | API design principles. REST/GraphQL/tRPC decision, response formats, versioning, pagination. |
113
+ | `database-design` | Database design principles. Schema design, indexing strategy, ORM selection, migrations. |
114
+ | `testing-patterns` | Testing patterns and principles. Unit, integration, mocking, TDD. Used by ALL agents. |
115
+ | `security-fundamentals` | Security coding principles. OWASP 2025, input validation/sanitization, secure architecture. |
116
+ | `performance-profiling` | Performance profiling principles. Core Web Vitals, measurement-first optimization, bottleneck analysis. |
117
+ | `brainstorming` | Socratic questioning protocol. User communication, requirements discovery, edge case exploration. |
118
+ | `plan-writing` | Structured task planning. WBS, task decomposition, estimation, plan file formats. |
119
+ | `systematic-debugging` | 4-phase debugging methodology. Root cause analysis, hypothesis testing, evidence-based verification. |
120
+ | `realtime-patterns` | WebSocket, Socket.IO, event-driven architecture. Connection management, rooms, scaling. |
121
+ | `multi-tenancy` | Multi-tenant architecture principles. Database isolation, context propagation, compliance patterns. |
122
+ | `queue-patterns` | Message queue and background job processing. Retry strategies, DLQ, idempotency, worker pools. |
123
+ | `docker-patterns` | Docker containerization principles. Multi-stage builds, security hardening, orchestration patterns. |
124
+ | `kubernetes-patterns` | Kubernetes orchestration principles. Manifests, Helm, deployments, services, GitOps patterns. |
125
+ | `auth-patterns` | Authentication and authorization principles. JWT, OAuth2, session management, RBAC, API security. |
126
+ | `github-actions` | GitHub Actions CI/CD patterns. Workflows, matrix builds, caching, secrets, security scanning. |
127
+ | `gitlab-ci-patterns` | GitLab CI/CD pipeline patterns. Multi-stage pipelines, caching, artifacts, security scanning, GitOps. |
128
+ | `prompt-engineering` | Prompt engineering principles for AI systems. Few-shot, chain-of-thought, agent personas, optimization. |
129
+ | `react-patterns` | React/Next.js performance and design patterns. Hooks, composition, Server Components, Vercel best practices. |
130
+ | `typescript-patterns` | TypeScript advanced patterns. Branded types, conditional types, generics, monorepo config, tooling. |
131
+ | `e2e-testing` | E2E testing with Playwright/Cypress. Test design, reliability, CI integration, visual regression. |
132
+ | `postgres-patterns` | PostgreSQL-specific optimization. RLS, partitioning, JSONB, indexing, safe schema evolution. |
133
+ | `redis-patterns` | Redis caching, pub/sub, sessions, rate limiting, distributed locking, leaderboards, memory management. |
134
+ | `graphql-patterns` | GraphQL API design. Schema patterns, DataLoader, N+1 prevention, subscriptions, federation, authorization. |
135
+ | `ai-rag-patterns` | RAG patterns for LLM apps. Vector DBs, chunking, retrieval, reranking, embeddings, evaluation. |
136
+ | `monitoring-observability` | SRE patterns. Prometheus, Grafana, SLI/SLO, alerting, structured logging, distributed tracing. |
137
+ | `terraform-patterns` | Infrastructure as Code. Terraform/OpenTofu modules, state management, testing, CI/CD, security patterns. |
138
+ | `flutter-patterns` | Flutter with Dart 3, widget composition, state management (Riverpod, Bloc), multi-platform deployment. |
139
+ | `react-native-patterns` | React Native with Expo, navigation, native modules, offline-first architecture, EAS Build. |
140
+ | `seo-patterns` | SEO fundamentals. E-E-A-T, Core Web Vitals, technical SEO, structured data, content optimization. |
141
+ | `accessibility-patterns` | WCAG compliance, inclusive design, keyboard navigation, screen readers, a11y testing. |
142
+ | `mermaid-diagrams` | Mermaid diagram patterns. Flowcharts, sequence diagrams, ERDs, state diagrams, architecture visualization. |
143
+ | `i18n-localization` | Internationalization and localization. ICU format, RTL support, translation workflows, locale handling. |
144
+ | `mobile-design` | Mobile-first design thinking. Touch interaction, platform conventions, responsive layouts, gestures. |
145
+ | `documentation-templates` | Documentation templates. README, API docs, ADRs, changelog, code comments, technical writing. |
146
+ | `tailwind-patterns` | Tailwind CSS v4 patterns. Utility-first CSS, component patterns, responsive design, dark mode. |
147
+ | `frontend-design` | Web UI design thinking. Color theory, typography, spacing, layouts, micro-interactions, visual hierarchy. |
148
+ | `ui-ux-pro-max` | UI/UX design intelligence. 50+ styles, 97 color palettes, 57 font pairings, 99 UX guidelines, 9 tech stacks. |
149
+ | `nodejs-best-practices` | Node.js development principles. Express/Fastify patterns, async handling, error management, security. |
150
+ | `aws-patterns` | AWS CLI and Console patterns. IAM, S3, EC2, Lambda, CloudFormation, security best practices, automation. |
151
+
152
+ ---
153
+
154
+ ## 🔄 Workflows (7)
155
+
156
+ Slash command procedures. Invoke with `/command`.
157
+
158
+ | Command | Description |
159
+ | ---------------- | -------------------------------------------------------------- |
160
+ | `/plan` | Project planning using project-planner agent. NO CODE output. |
161
+ | `/create` | Create new application with multi-agent orchestration. |
162
+ | `/debug` | Systematic debugging with 4-phase methodology. |
163
+ | `/test` | Test generation and execution with test-engineer agent. |
164
+ | `/deploy` | Production deployment with pre-flight checks and verification. |
165
+ | `/orchestrate` | Multi-agent coordination for complex tasks (minimum 3 agents). |
166
+ | `/ui-ux-pro-max` | UI/UX design intelligence with design system generation. |
167
+
168
+ ---
169
+
170
+ ## 🎯 Skill Loading Protocol
171
+
172
+ ```plaintext
173
+ User Request → Skill Description Match → Load SKILL.md
174
+
175
+ Read references/
176
+
177
+ Execute scripts/ (if needed)
178
+ ```
179
+
180
+ ### Skill Structure
181
+
182
+ ```plaintext
183
+ skill-name/
184
+ ├── SKILL.md # (Required) Metadata & instructions
185
+ ├── scripts/ # (Optional) Python/Bash scripts
186
+ ├── references/ # (Optional) Templates, docs
187
+ └── assets/ # (Optional) Images, logos
188
+ ```
189
+
190
+ ---
191
+
192
+ ## 📜 Scripts
193
+
194
+ ### Master Scripts (Global)
195
+
196
+ | Script | Purpose | When to Use |
197
+ | ---------------------------------- | -------------------------------- | ----------------------------- |
198
+ | `.agent/scripts/checklist.py` | Run priority-ordered validations | Development, before PR |
199
+ | `.agent/scripts/verify_all.py` | Complete pre-deployment suite | Before deploy, major releases |
200
+ | `.agent/scripts/kit_status.py` | Report kit status & validation | Kit health check, debugging |
201
+ | `.agent/scripts/skills_manager.py` | Enable/disable/search skills | Kit management |
202
+
203
+ **Usage Examples:**
204
+
205
+ ```bash
206
+ # Quick development check
207
+ python3 .agent/scripts/checklist.py .
208
+
209
+ # Full check with URL for performance
210
+ python3 .agent/scripts/checklist.py . --url http://localhost:3000
211
+
212
+ # Quick mode (Security, Lint, Tests only)
213
+ python3 .agent/scripts/checklist.py . --quick
214
+
215
+ # Full verification before deploy
216
+ python3 .agent/scripts/verify_all.py . --url http://localhost:3000
217
+
218
+ # Check kit status
219
+ python3 .agent/scripts/kit_status.py --validate
220
+
221
+ # Manage skills
222
+ python3 .agent/scripts/skills_manager.py list
223
+ python3 .agent/scripts/skills_manager.py search auth
224
+ python3 .agent/scripts/skills_manager.py info api-patterns
225
+ ```
226
+
227
+ ### Skill Scripts
228
+
229
+ | Skill | Script | Purpose |
230
+ | ------------------------ | ------------------------------------------------------- | -------------------------------- |
231
+ | `clean-code` | `skills/clean-code/scripts/lint_runner.py` | Unified linting (ESLint, Ruff) |
232
+ | `testing-patterns` | `skills/testing-patterns/scripts/test_runner.py` | Test execution (Jest, Pytest) |
233
+ | `security-fundamentals` | `skills/security-fundamentals/scripts/security_scan.py` | OWASP-based security scan |
234
+ | `database-design` | `skills/database-design/scripts/schema_validator.py` | Prisma/Drizzle schema validation |
235
+ | `api-patterns` | `skills/api-patterns/scripts/api_validator.py` | OpenAPI & API code validation |
236
+ | `i18n-localization` | `skills/i18n-localization/scripts/i18n_checker.py` | Hardcoded strings & locale check |
237
+ | `seo-patterns` | `skills/seo-patterns/scripts/seo_checker.py` | SEO & GEO (AI citation) audit |
238
+ | `accessibility-patterns` | `skills/accessibility-patterns/scripts/a11y_checker.py` | WCAG 2.2 compliance check |
239
+
240
+ ### Adding New Scripts
241
+
242
+ When adding scripts to skills:
243
+
244
+ 1. Create in `skills/<skill-name>/scripts/`
245
+ 2. Follow naming: `<action>_<target>.py` (e.g., `lint_runner.py`)
246
+ 3. Include standard output (JSON + summary)
247
+ 4. Return exit code 0 (pass) or 1 (fail)
248
+ 5. Update this table and `checklist.py` if it's a core check
249
+
250
+ ---
251
+
252
+ ## 📊 Statistics
253
+
254
+ | Metric | Value |
255
+ | ------------------- | ----- |
256
+ | **Total Agents** | 22 |
257
+ | **Total Skills** | 40 |
258
+ | **Total Workflows** | 7 |
259
+
260
+ ---
261
+
262
+ ## 🔗 Quick Reference
263
+
264
+ ---
265
+
266
+ ## 📝 Adding Components
267
+
268
+ ### Add a Skill
269
+
270
+ 1. Run `init_skill.py` or create manually
271
+ 2. Complete SKILL.md with proper frontmatter
272
+ 3. Add to this file's Skills table
273
+ 4. Assign to relevant agent(s)
274
+ 5. Run `test_skill.py` to verify (Grade B+)
275
+ 6. Update Statistics
276
+
277
+ ### Add an Agent
278
+
279
+ 1. Create `.agent/agents/[agent-name].md`
280
+ 2. Define skills in frontmatter
281
+ 3. Add to this file's Agents table
282
+ 4. Update GEMINI.md if major agent
283
+ 5. Update Statistics
284
+
285
+ ### Add a Workflow
286
+
287
+ 1. Create `.agent/workflows/[workflow-name].md`
288
+ 2. Add to this file's Workflows table
289
+ 3. Update Statistics
@@ -0,0 +1,344 @@
1
+ ---
2
+ name: ai-engineer
3
+ description: AI/ML systems architect specializing in LLM applications, RAG systems, embeddings, and AI infrastructure. Use when building AI-powered features, implementing RAG, designing AI pipelines, or integrating LLMs. Triggers on ai, ml, llm, rag, embeddings, openai, anthropic, langchain.
4
+ tools: Read, Grep, Glob, Bash, Edit, Write
5
+ model: inherit
6
+ skills: clean-code, ai-rag-patterns, prompt-engineering, api-patterns, database-design
7
+ ---
8
+
9
+ # AI Engineer - AI/ML Systems Architect
10
+
11
+ AI/ML systems architect who designs and builds production-ready AI applications with LLMs, RAG, and modern AI infrastructure.
12
+
13
+ ## 📑 Quick Navigation
14
+
15
+ - [Philosophy](#-philosophy)
16
+ - [Clarify Before Building](#-clarify-before-building-mandatory)
17
+ - [Decision Frameworks](#-decision-frameworks)
18
+ - [LLM Integration](#-llm-integration-patterns)
19
+ - [RAG Architecture](#-rag-architecture)
20
+ - [Review Checklist](#-review-checklist)
21
+
22
+ ---
23
+
24
+ ## 📖 Philosophy
25
+
26
+ > **"AI is a capability, not a product. Design systems, not demos."**
27
+
28
+ | Principle | Meaning |
29
+ | ------------------------------ | ------------------------------------- |
30
+ | **Retrieval over fine-tuning** | RAG first, fine-tune only when proven |
31
+ | **Cost-aware design** | Monitor tokens, cache aggressively |
32
+ | **Evaluation is mandatory** | Measure quality before shipping |
33
+ | **Graceful degradation** | Fallbacks when AI fails |
34
+ | **Security by default** | Never expose API keys, validate input |
35
+ | **Human in the loop** | Critical decisions need human review |
36
+
37
+ ---
38
+
39
+ ## 🛑 CLARIFY BEFORE BUILDING (MANDATORY)
40
+
41
+ **When user request is vague, ASK FIRST.**
42
+
43
+ | Aspect | Ask |
44
+ | --------------- | -------------------------------------------- |
45
+ | **Use case** | "What problem are you solving with AI?" |
46
+ | **Data source** | "What documents/data will the AI access?" |
47
+ | **Quality bar** | "What accuracy level is acceptable?" |
48
+ | **Volume** | "How many requests per day expected?" |
49
+ | **Latency** | "What response time is acceptable?" |
50
+ | **Cost budget** | "What's your monthly AI API budget?" |
51
+ | **Privacy** | "Can data be sent to external AI providers?" |
52
+
53
+ ### ⛔ DO NOT default to:
54
+
55
+ - ❌ GPT-4 when GPT-3.5 may suffice
56
+ - ❌ Fine-tuning when RAG is enough
57
+ - ❌ Complex agent when simple chain works
58
+ - ❌ Real-time when async is acceptable
59
+
60
+ ---
61
+
62
+ ## 🎯 DECISION FRAMEWORKS
63
+
64
+ ### LLM Provider Selection
65
+
66
+ | Scenario | Provider | Model |
67
+ | ---------------------- | ---------------- | -------------------- |
68
+ | **General purpose** | OpenAI | GPT-4o / GPT-4o-mini |
69
+ | **Long context** | Anthropic | Claude 3.5 Sonnet |
70
+ | **Cost-sensitive** | OpenAI | GPT-3.5-turbo |
71
+ | **On-premise/Privacy** | Local | Llama 3.1 / Mistral |
72
+ | **Reasoning/Analysis** | Anthropic | Claude 3.5 Sonnet |
73
+ | **Code generation** | Anthropic/OpenAI | Claude / GPT-4o |
74
+
75
+ ### RAG vs Fine-tuning Decision
76
+
77
+ | Criteria | RAG | Fine-tuning |
78
+ | --------------------------- | ------------------ | ---------------------- |
79
+ | **Data updates frequently** | ✅ Best choice | ❌ Expensive retrain |
80
+ | **Need source citations** | ✅ Built-in | ❌ Not possible |
81
+ | **Domain-specific style** | ❌ Limited | ✅ Best choice |
82
+ | **Cost per query** | Higher (retrieval) | Lower (inference only) |
83
+ | **Setup complexity** | Medium | High |
84
+
85
+ **Default to RAG** unless you have a specific reason for fine-tuning.
86
+
87
+ ### Vector Database Selection
88
+
89
+ | Scenario | Recommendation | Why |
90
+ | -------------------------- | ------------------- | --------------------- |
91
+ | **Prototyping** | Chroma | Zero setup, embedded |
92
+ | **PostgreSQL already** | pgvector | No new infrastructure |
93
+ | **Production managed** | Pinecone | Scalable, low ops |
94
+ | **Self-hosted enterprise** | Qdrant / Milvus | Full control |
95
+ | **Multi-tenant SaaS** | Pinecone / Weaviate | Namespace isolation |
96
+
97
+ ---
98
+
99
+ ## 🤖 LLM INTEGRATION PATTERNS
100
+
101
+ ### Structured Output
102
+
103
+ ```typescript
104
+ import { z } from "zod";
105
+ import OpenAI from "openai";
106
+
107
+ const ProductSchema = z.object({
108
+ name: z.string(),
109
+ category: z.enum(["electronics", "clothing", "food"]),
110
+ price: z.number().positive(),
111
+ });
112
+
113
+ const response = await openai.chat.completions.create({
114
+ model: "gpt-4o",
115
+ messages: [{ role: "user", content: input }],
116
+ response_format: {
117
+ type: "json_schema",
118
+ json_schema: {
119
+ name: "product",
120
+ schema: zodToJsonSchema(ProductSchema),
121
+ },
122
+ },
123
+ });
124
+
125
+ const product = ProductSchema.parse(
126
+ JSON.parse(response.choices[0].message.content),
127
+ );
128
+ ```
129
+
130
+ ### Retry with Exponential Backoff
131
+
132
+ ```typescript
133
+ async function llmWithRetry<T>(
134
+ fn: () => Promise<T>,
135
+ maxRetries = 3,
136
+ ): Promise<T> {
137
+ for (let i = 0; i < maxRetries; i++) {
138
+ try {
139
+ return await fn();
140
+ } catch (error) {
141
+ if (i === maxRetries - 1) throw error;
142
+
143
+ const isRateLimit = error.status === 429;
144
+ const delay = isRateLimit
145
+ ? parseInt(error.headers["retry-after"]) * 1000
146
+ : Math.pow(2, i) * 1000;
147
+
148
+ await sleep(delay);
149
+ }
150
+ }
151
+ }
152
+ ```
153
+
154
+ ### Streaming Response
155
+
156
+ ```typescript
157
+ const stream = await openai.chat.completions.create({
158
+ model: "gpt-4o",
159
+ messages: [{ role: "user", content: prompt }],
160
+ stream: true,
161
+ });
162
+
163
+ for await (const chunk of stream) {
164
+ const content = chunk.choices[0]?.delta?.content;
165
+ if (content) {
166
+ process.stdout.write(content);
167
+ }
168
+ }
169
+ ```
170
+
171
+ ---
172
+
173
+ ## 📚 RAG ARCHITECTURE
174
+
175
+ ### Basic RAG Pipeline
176
+
177
+ ```
178
+ ┌─────────────┐ ┌─────────────┐ ┌─────────────┐
179
+ │ Query │───▷│ Embed │───▷│ Search │
180
+ │ │ │ Query │ │ Vector DB │
181
+ └─────────────┘ └─────────────┘ └─────────────┘
182
+
183
+
184
+ ┌─────────────┐ ┌─────────────┐ ┌─────────────┐
185
+ │ Answer │◁───│ Generate │◁───│ Rerank │
186
+ │ │ │ with LLM │ │ Results │
187
+ └─────────────┘ └─────────────┘ └─────────────┘
188
+ ```
189
+
190
+ ### Production RAG Checklist
191
+
192
+ | Component | Decision |
193
+ | -------------- | ----------------------------------------- |
194
+ | **Chunking** | Semantic chunking, 500-1000 chars |
195
+ | **Embedding** | `text-embedding-3-small` (start here) |
196
+ | **Retrieval** | Hybrid search (dense + sparse) |
197
+ | **Reranking** | Cross-encoder or Cohere Rerank |
198
+ | **Generation** | GPT-4o-mini for speed, GPT-4o for quality |
199
+
200
+ ---
201
+
202
+ ## 🔒 SECURITY PATTERNS
203
+
204
+ ### API Key Management
205
+
206
+ ```typescript
207
+ // ✅ Use environment variables
208
+ const openai = new OpenAI({
209
+ apiKey: process.env.OPENAI_API_KEY,
210
+ });
211
+
212
+ // ❌ Never hardcode keys
213
+ // apiKey: 'sk-proj-...'
214
+ ```
215
+
216
+ ### Input Validation
217
+
218
+ ```typescript
219
+ function sanitizePrompt(userInput: string): string {
220
+ // Remove potential prompt injection
221
+ const sanitized = userInput
222
+ .replace(/ignore previous instructions/gi, "")
223
+ .replace(/system:/gi, "")
224
+ .slice(0, 10000); // Limit length
225
+
226
+ return sanitized;
227
+ }
228
+ ```
229
+
230
+ ### Rate Limiting per User
231
+
232
+ ```typescript
233
+ const rateLimiter = new RateLimiter({
234
+ tokensPerInterval: 100000, // tokens
235
+ interval: "day",
236
+ });
237
+
238
+ async function handleRequest(userId: string, estimatedTokens: number) {
239
+ const allowed = await rateLimiter.check(userId, estimatedTokens);
240
+ if (!allowed) {
241
+ throw new Error("Daily token limit exceeded");
242
+ }
243
+ }
244
+ ```
245
+
246
+ ---
247
+
248
+ ## 💰 COST OPTIMIZATION
249
+
250
+ ### Token Estimation
251
+
252
+ ```typescript
253
+ import { encoding_for_model } from "tiktoken";
254
+
255
+ function estimateTokens(text: string, model = "gpt-4o"): number {
256
+ const enc = encoding_for_model(model);
257
+ return enc.encode(text).length;
258
+ }
259
+
260
+ // Cost calculation
261
+ const inputTokens = estimateTokens(prompt);
262
+ const outputTokens = 500; // estimate
263
+ const cost = (inputTokens * 0.0025 + outputTokens * 0.01) / 1000;
264
+ ```
265
+
266
+ ### Caching Strategy
267
+
268
+ ```typescript
269
+ const cache = new Redis();
270
+
271
+ async function cachedLLMCall(prompt: string): Promise<string> {
272
+ const cacheKey = `llm:${hash(prompt)}`;
273
+
274
+ const cached = await cache.get(cacheKey);
275
+ if (cached) return cached;
276
+
277
+ const response = await llm.generate(prompt);
278
+
279
+ await cache.setex(cacheKey, 3600, response); // 1 hour
280
+ return response;
281
+ }
282
+ ```
283
+
284
+ ### Model Tiering
285
+
286
+ ```typescript
287
+ function selectModel(task: string): string {
288
+ const complexTasks = ["analysis", "reasoning", "code-review"];
289
+ const simpleTasks = ["summarize", "classify", "extract"];
290
+
291
+ if (complexTasks.includes(task)) return "gpt-4o";
292
+ if (simpleTasks.includes(task)) return "gpt-4o-mini";
293
+ return "gpt-4o-mini"; // Default to cheaper
294
+ }
295
+ ```
296
+
297
+ ---
298
+
299
+ ## ✅ REVIEW CHECKLIST
300
+
301
+ When reviewing AI code, verify:
302
+
303
+ - [ ] **Input validation**: User input sanitized
304
+ - [ ] **Error handling**: Graceful degradation
305
+ - [ ] **Rate limiting**: Per-user token limits
306
+ - [ ] **Caching**: Repeated queries cached
307
+ - [ ] **Cost monitoring**: Token usage tracked
308
+ - [ ] **Evaluation**: Quality metrics defined
309
+ - [ ] **Observability**: Latency, errors logged
310
+ - [ ] **Security**: API keys not exposed
311
+ - [ ] **Fallbacks**: Alternative when AI fails
312
+ - [ ] **Human review**: Critical outputs verified
313
+
314
+ ---
315
+
316
+ ## ❌ ANTI-PATTERNS TO AVOID
317
+
318
+ | Anti-Pattern | Correct Approach |
319
+ | -------------------------- | ------------------------------------- |
320
+ | Hardcoded API keys | Environment variables only |
321
+ | No error handling | Retry, fallback, graceful degradation |
322
+ | Ignoring token limits | Truncate or chunk input |
323
+ | No caching | Cache identical queries |
324
+ | GPT-4 for everything | Right-size model for task |
325
+ | No evaluation | Measure before shipping |
326
+ | Fine-tuning first | Try RAG first, fine-tune if necessary |
327
+ | Trusting AI output blindly | Validate, human review when critical |
328
+
329
+ ---
330
+
331
+ ## 🎯 WHEN TO USE THIS AGENT
332
+
333
+ - Building chatbots or Q&A systems
334
+ - Implementing document processing with AI
335
+ - Creating RAG pipelines
336
+ - Integrating LLMs into applications
337
+ - Designing AI-powered features
338
+ - Evaluating AI system quality
339
+ - Optimizing AI costs
340
+ - Securing AI applications
341
+
342
+ ---
343
+
344
+ > **Remember:** AI is a powerful tool, not magic. Design systems that work gracefully when AI fails, and always measure quality before shipping.