multimodel-dev-os 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (105) hide show
  1. package/.ai/agents/README.md +23 -0
  2. package/.ai/agents/coder.md +11 -0
  3. package/.ai/agents/devops.md +8 -0
  4. package/.ai/agents/multimodel-orchestrator.md +105 -0
  5. package/.ai/agents/planner.md +11 -0
  6. package/.ai/agents/qa-tester.md +8 -0
  7. package/.ai/agents/reviewer.md +11 -0
  8. package/.ai/agents/security-auditor.md +8 -0
  9. package/.ai/agents/seo-auditor.md +8 -0
  10. package/.ai/checks/README.md +38 -0
  11. package/.ai/checks/context-budget.md +7 -0
  12. package/.ai/checks/pre-commit.md +8 -0
  13. package/.ai/checks/pre-deploy.md +8 -0
  14. package/.ai/checks/pre-implementation.md +7 -0
  15. package/.ai/checks/regression-checklist.md +8 -0
  16. package/.ai/config.yaml +60 -0
  17. package/.ai/context/README.md +18 -0
  18. package/.ai/context/architecture.md +15 -0
  19. package/.ai/context/business-rules.md +12 -0
  20. package/.ai/context/context-budget.md +12 -0
  21. package/.ai/context/deployment-rules.md +15 -0
  22. package/.ai/context/model-map.md +11 -0
  23. package/.ai/context/project-brief.md +17 -0
  24. package/.ai/context/seo-rules.md +15 -0
  25. package/.ai/prompts/README.md +37 -0
  26. package/.ai/prompts/generate-tests.md +5 -0
  27. package/.ai/prompts/handoff-to-next-model.md +5 -0
  28. package/.ai/prompts/implement-safely.md +5 -0
  29. package/.ai/prompts/plan-first.md +5 -0
  30. package/.ai/prompts/review-diff.md +5 -0
  31. package/.ai/prompts/summarize-session.md +5 -0
  32. package/.ai/session-logs/.gitkeep +1 -0
  33. package/.ai/session-logs/README.md +49 -0
  34. package/.ai/skills/README.md +34 -0
  35. package/.ai/skills/bug-fix.md +9 -0
  36. package/.ai/skills/caveman-bug-fix.md +2 -0
  37. package/.ai/skills/caveman-context-handoff.md +2 -0
  38. package/.ai/skills/caveman-feature-build.md +2 -0
  39. package/.ai/skills/context-routing.md +8 -0
  40. package/.ai/skills/cpanel-deploy.md +9 -0
  41. package/.ai/skills/example-skill.md +38 -0
  42. package/.ai/skills/landing-page-optimization.md +8 -0
  43. package/.ai/skills/model-routing.md +7 -0
  44. package/.ai/skills/nextjs-feature-build.md +9 -0
  45. package/.ai/skills/refactor.md +9 -0
  46. package/.ai/skills/seo-implementation.md +8 -0
  47. package/.ai/templates/AGENTS.caveman.md +12 -0
  48. package/.ai/templates/MEMORY.caveman.md +14 -0
  49. package/.ai/templates/RUNBOOK.caveman.md +22 -0
  50. package/.ai/templates/TASKS.caveman.md +7 -0
  51. package/.ai/templates/bug-report-template.md +14 -0
  52. package/.ai/templates/feature-spec-template.md +14 -0
  53. package/.ai/templates/project-memory-template.md +12 -0
  54. package/.ai/templates/session-log-template.md +16 -0
  55. package/.ai/templates/task-template.md +16 -0
  56. package/AGENTS.md +79 -0
  57. package/LICENSE +21 -0
  58. package/MEMORY.md +42 -0
  59. package/README.md +197 -0
  60. package/RUNBOOK.md +73 -0
  61. package/TASKS.md +28 -0
  62. package/adapters/antigravity/.gemini/settings.json +13 -0
  63. package/adapters/antigravity/AGENTS.md +29 -0
  64. package/adapters/antigravity/setup.md +36 -0
  65. package/adapters/claude/CLAUDE.md +31 -0
  66. package/adapters/claude/setup.md +35 -0
  67. package/adapters/codex/AGENTS.md +27 -0
  68. package/adapters/codex/setup.md +25 -0
  69. package/adapters/cursor/.cursorrules +30 -0
  70. package/adapters/cursor/setup.md +35 -0
  71. package/adapters/gemini/GEMINI.md +31 -0
  72. package/adapters/gemini/setup.md +34 -0
  73. package/adapters/vscode/.vscode/settings.json +21 -0
  74. package/adapters/vscode/setup.md +40 -0
  75. package/bin/multimodel-dev-os.js +267 -0
  76. package/docs/adapters.md +79 -0
  77. package/docs/architecture.md +64 -0
  78. package/docs/caveman-mode.md +74 -0
  79. package/docs/cli-roadmap.md +44 -0
  80. package/docs/faq.md +66 -0
  81. package/docs/installers.md +58 -0
  82. package/docs/multimodel-workflow.md +121 -0
  83. package/docs/npm-publishing.md +74 -0
  84. package/docs/quickstart.md +85 -0
  85. package/docs/testing-v0.2.md +73 -0
  86. package/examples/ecommerce-store/.ai/config.yaml +4 -0
  87. package/examples/ecommerce-store/AGENTS.md +5 -0
  88. package/examples/ecommerce-store/MEMORY.md +4 -0
  89. package/examples/general-app/.ai/config.yaml +4 -0
  90. package/examples/general-app/AGENTS.md +5 -0
  91. package/examples/general-app/MEMORY.md +4 -0
  92. package/examples/nextjs-saas/.ai/config.yaml +4 -0
  93. package/examples/nextjs-saas/AGENTS.md +13 -0
  94. package/examples/nextjs-saas/MEMORY.md +5 -0
  95. package/examples/seo-landing-page/.ai/config.yaml +4 -0
  96. package/examples/seo-landing-page/AGENTS.md +5 -0
  97. package/examples/seo-landing-page/MEMORY.md +5 -0
  98. package/examples/wordpress-site/.ai/config.yaml +4 -0
  99. package/examples/wordpress-site/AGENTS.md +5 -0
  100. package/examples/wordpress-site/MEMORY.md +4 -0
  101. package/package.json +43 -0
  102. package/scripts/install.ps1 +230 -0
  103. package/scripts/install.sh +237 -0
  104. package/scripts/pack-template.sh +39 -0
  105. package/scripts/verify.sh +271 -0
@@ -0,0 +1,23 @@
1
+ # Agents
2
+
3
+ > Agent role definitions and orchestration configuration.
4
+
5
+ ## Purpose
6
+
7
+ This directory defines:
8
+ - Agent roles and their file scopes
9
+ - Orchestration mode (sequential, parallel, supervised)
10
+ - Handoff protocol between agents
11
+
12
+ ## Files
13
+
14
+ | File | Purpose |
15
+ |------|---------|
16
+ | `multimodel-orchestrator.md` | Multi-agent coordination protocol |
17
+ | `{role-name}.md` | Custom role definitions (optional) |
18
+
19
+ ## Quick Reference
20
+
21
+ Define agents in root `.ai/config.yaml`, then detail their coordination here.
22
+
23
+ See `multimodel-orchestrator.md` for the full protocol spec.
@@ -0,0 +1,11 @@
1
+ # Coder Agent Spec
2
+
3
+ > Responsible for writing clean, structured, and modular implementation code based on an approved plan.
4
+
5
+ ## Focus Areas
6
+ - Enforce strict typing and standard style guides.
7
+ - Avoid introducing unused variables or broken imports.
8
+ - Make targeted atomic edits instead of rewriting large file sections.
9
+
10
+ ## Primary Tooling
11
+ - IDE agents, code completion engines, or fast edit tools (e.g. Cursor / Claude)
@@ -0,0 +1,8 @@
1
+ # DevOps Agent Spec
2
+
3
+ > Responsible for managing deployment configurations, CI/CD pipelines, container boundaries, server environments, and rollbacks.
4
+
5
+ ## Focus Areas
6
+ - Enforce strict continuous deployment gating.
7
+ - Manage Dockerfiles, container definitions, and cloud config templates safely.
8
+ - Write robust, fail-safe recovery scripts.
@@ -0,0 +1,105 @@
1
+ # Multimodel Orchestrator Protocol — v0.1
2
+
3
+ > Specification for coordinating multiple AI coding agents on a single project.
4
+ > v0.1 is a **protocol document** — runtime implementation comes in v0.2+.
5
+
6
+ ## Purpose
7
+
8
+ When multiple AI tools work on the same codebase, they need:
9
+ 1. **Role clarity** — who does what
10
+ 2. **File boundaries** — who touches which files
11
+ 3. **Session logging** — how to pass context between agents
12
+ 4. **Conflict prevention** — avoid stepping on each other's changes
13
+
14
+ ## Agent Roles
15
+
16
+ Define agents in `.ai/config.yaml`:
17
+
18
+ ```yaml
19
+ orchestrator:
20
+ agents:
21
+ - name: "architect"
22
+ tool: "claude"
23
+ role: "Design and plan architecture"
24
+ files: ["docs/**", "AGENTS.md", "MEMORY.md"]
25
+ permissions: "read+write"
26
+
27
+ - name: "implementer"
28
+ tool: "cursor"
29
+ role: "Write implementation code"
30
+ files: ["src/**", "lib/**", "tests/**"]
31
+ permissions: "read+write"
32
+
33
+ - name: "reviewer"
34
+ tool: "codex"
35
+ role: "Review code and suggest fixes"
36
+ files: ["**"]
37
+ permissions: "read-only"
38
+ ```
39
+
40
+ ## Execution Modes
41
+
42
+ | Mode | Behavior |
43
+ |------|----------|
44
+ | `sequential` | One agent at a time. Session log required between each. |
45
+ | `parallel` | Multiple agents work simultaneously on different file scopes. |
46
+ | `supervised` | Human reviews each agent's output before the next agent starts. |
47
+
48
+ ## Session Log Protocol
49
+
50
+ When an agent finishes a task, it writes a session log to `.ai/session-logs/`:
51
+
52
+ ### Session Log Format
53
+
54
+ ```markdown
55
+ # Session: {agent_name} → {next_agent}
56
+
57
+ **Timestamp:** {ISO 8601}
58
+ **Agent:** {tool_name} ({role_name})
59
+ **Mode:** {execution_mode}
60
+
61
+ ## Action Summary
62
+ {What was done in 2-3 sentences}
63
+
64
+ ## Files Changed
65
+ - {path} ({created|modified|deleted})
66
+
67
+ ## Next Steps
68
+ 1. {Concrete next action}
69
+ 2. {Another action}
70
+
71
+ ## Blockers
72
+ - {Any blockers, or "None"}
73
+
74
+ ## Context for Next Agent
75
+ {Any important context the next agent needs}
76
+ ```
77
+
78
+ ### Naming Convention
79
+
80
+ ```
81
+ .ai/session-logs/{YYYY-MM-DD}-{agent}-{summary}.md
82
+ ```
83
+
84
+ Example: `.ai/session-logs/2026-05-30-architect-auth-design.md`
85
+
86
+ ## Conflict Prevention Rules
87
+
88
+ 1. **File scoping:** Agents should only modify files in their defined `files` glob
89
+ 2. **Lock files:** If an agent is working on a file, other agents should skip it
90
+ 3. **Pull before push:** Always check for changes before committing
91
+ 4. **Atomic tasks:** Each agent should complete a coherent unit of work
92
+
93
+ ## Current Limitations (v0.1)
94
+
95
+ - No runtime enforcement — this is a convention, not a system
96
+ - No automatic conflict detection
97
+ - No agent-to-agent messaging (use session logs)
98
+ - No parallel execution safeguards
99
+
100
+ ## Roadmap
101
+
102
+ - **v0.2:** CLI that reads config and routes tasks
103
+ - **v0.3:** Automatic session log generation
104
+ - **v0.4:** Conflict detection and resolution
105
+ - **v0.5:** Real-time agent coordination
@@ -0,0 +1,11 @@
1
+ # Planner Agent Spec
2
+
3
+ > Responsible for requirement clarification, researching dependencies, and designing robust step-by-step implementation plans.
4
+
5
+ ## Focus Areas
6
+ - Research before taking action.
7
+ - Outline files to create, modify, or delete.
8
+ - Define a strict verification plan.
9
+
10
+ ## Primary Tooling
11
+ - Reasoning models (e.g. Claude Code / Antigravity with high reasoning)
@@ -0,0 +1,8 @@
1
+ # QA Tester Agent Spec
2
+
3
+ > Responsible for writing comprehensive unit, integration, and E2E test suites, and running regression checks.
4
+
5
+ ## Focus Areas
6
+ - Write unit tests covering edge cases.
7
+ - Validate component routing and user experience.
8
+ - Maintain test coverage budgets.
@@ -0,0 +1,11 @@
1
+ # Reviewer Agent Spec
2
+
3
+ > Responsible for conducting strict pull request reviews, evaluating diff structures, and identifying performance-related code smells.
4
+
5
+ ## Focus Areas
6
+ - Evaluate security vulnerability risks.
7
+ - Look for resource leaks or inefficient algorithms.
8
+ - Enforce coding rules defined in `AGENTS.md`.
9
+
10
+ ## Primary Tooling
11
+ - Codex / large reasoning review assistants
@@ -0,0 +1,8 @@
1
+ # Security Auditor Agent Spec
2
+
3
+ > Responsible for identifying potential security vulnerabilities, reviewing third-party dependencies for CVE issues, and validating input sanitization.
4
+
5
+ ## Focus Areas
6
+ - Enforce strict input sanitization and parameter encoding.
7
+ - Verify JWT verification, auth scopes, and RBAC rules.
8
+ - Prevent inclusion of plain text keys or secrets.
@@ -0,0 +1,8 @@
1
+ # SEO Auditor Agent Spec
2
+
3
+ > Responsible for conducting strict audits on HTML structures, metadata tags, heading hierarchies, and validating conformance with search indexing best practices.
4
+
5
+ ## Focus Areas
6
+ - Enforce exactly one main `<h1>` per page.
7
+ - Audit semantic elements hierarchy.
8
+ - Validate open graph/meta title and description formats.
@@ -0,0 +1,38 @@
1
+ # Checks
2
+
3
+ > Pre- and post-action checks that agents run before/after critical operations.
4
+
5
+ ## What is a Check?
6
+
7
+ A check is a markdown file that defines verification steps an agent should run:
8
+ - Before committing code
9
+ - Before deploying
10
+ - After a migration
11
+ - After a dependency update
12
+
13
+ ## Structure
14
+
15
+ ```
16
+ .ai/checks/
17
+ ├── README.md ← You are here
18
+ ├── pre-commit.md ← Example pre-commit check
19
+ └── your-check.md ← Your custom checks
20
+ ```
21
+
22
+ ## Enabling Checks
23
+
24
+ Set in `.ai/config.yaml`:
25
+
26
+ ```yaml
27
+ checks:
28
+ pre_commit:
29
+ enabled: true
30
+ file: ".ai/checks/pre-commit.md"
31
+ ```
32
+
33
+ ## Creating a Check
34
+
35
+ 1. Create a markdown file in this directory
36
+ 2. Define the check name, trigger, and steps
37
+ 3. Include pass/fail criteria
38
+ 4. Reference it in `.ai/config.yaml`
@@ -0,0 +1,7 @@
1
+ # Context Budget Checks
2
+
3
+ > Active checks to evaluate token and context window state.
4
+
5
+ - [ ] Confirm fewer than 15 active files are included in the prompt
6
+ - [ ] Confirm no build outputs or temp files are passed
7
+ - [ ] Use Caveman Mode for bulk refactorings
@@ -0,0 +1,8 @@
1
+ # Pre-Commit Checks
2
+
3
+ > Self-checklist before committing changes.
4
+
5
+ - [ ] Run linter and verify 0 errors
6
+ - [ ] Run test suite and verify 100% pass
7
+ - [ ] No local machine paths committed
8
+ - [ ] No credentials/secrets in code
@@ -0,0 +1,8 @@
1
+ # Pre-Deploy Checks
2
+
3
+ > Gating checks prior to deploying to staging/production.
4
+
5
+ - [ ] All CI pipeline checks pass successfully
6
+ - [ ] Environment variables configured correctly
7
+ - [ ] Database migrations mapped and tested
8
+ - [ ] Rollback recovery script verified
@@ -0,0 +1,7 @@
1
+ # Pre-Implementation Checks
2
+
3
+ > Self-checklist before modifying codebase files.
4
+
5
+ - [ ] Clear planning document approved
6
+ - [ ] Understand target file boundaries
7
+ - [ ] Verify test suite works locally before any edits
@@ -0,0 +1,8 @@
1
+ # Regression Checklist
2
+
3
+ > Procedures to ensure modifications do not disrupt existing application functionality.
4
+
5
+ - [ ] Check primary user authentication flows
6
+ - [ ] Verify core page loading parameters
7
+ - [ ] Check console log errors
8
+ - [ ] Confirm layout styling holds across sizes
@@ -0,0 +1,60 @@
1
+ # multimodel-dev-os configuration
2
+ # Source of truth for AI operating layer settings
3
+
4
+ project:
5
+ name: null # Your project name
6
+ description: null # One-line description
7
+ version: null # Project version
8
+
9
+ # Mode: "standard" (full templates) or "caveman" (minimal tokens)
10
+ mode: "standard"
11
+
12
+ # Orchestrator configuration
13
+ # See .ai/agents/multimodel-orchestrator.md for the full protocol spec
14
+ orchestrator:
15
+ version: "0.1"
16
+ mode: "sequential" # sequential | parallel | supervised
17
+ session_logs:
18
+ format: "markdown"
19
+ location: ".ai/session-logs/"
20
+ required_fields:
21
+ - agent_name
22
+ - timestamp
23
+ - action_summary
24
+ - files_changed
25
+ - next_steps
26
+
27
+ agents:
28
+ - name: "default"
29
+ tool: "any"
30
+ role: "General development"
31
+ files: ["**"]
32
+ permissions: "read+write"
33
+
34
+ # Adapter configuration
35
+ # Only enable adapters for tools you use
36
+ adapters:
37
+ codex: false
38
+ antigravity: false
39
+ cursor: false
40
+ claude: false
41
+ gemini: false
42
+ vscode: false
43
+
44
+ # Checks configuration
45
+ checks:
46
+ pre_commit:
47
+ enabled: false
48
+ file: ".ai/checks/pre-commit.md"
49
+ post_commit:
50
+ enabled: false
51
+ file: null
52
+
53
+ # Skills
54
+ skills:
55
+ directory: ".ai/skills/"
56
+ auto_load: true
57
+
58
+ # Prompts
59
+ prompts:
60
+ directory: ".ai/prompts/"
@@ -0,0 +1,18 @@
1
+ # Context
2
+
3
+ > Shared project context that AI agents read at session start.
4
+
5
+ ## Purpose
6
+
7
+ Place files here that provide essential background for any AI agent:
8
+ - Architecture decisions not yet in `MEMORY.md`
9
+ - Design documents under active discussion
10
+ - Reference material agents need frequently
11
+ - External specs or API docs relevant to current work
12
+
13
+ ## Guidelines
14
+
15
+ - Keep files under 200 lines each
16
+ - Use markdown for all context files
17
+ - Remove stale context regularly
18
+ - Prefer structured data (tables, lists) over prose
@@ -0,0 +1,15 @@
1
+ # Technical Architecture
2
+
3
+ > High-level technical architecture, system design, data flows, and tech stack configurations.
4
+
5
+ ## Stack Overview
6
+ - Frontend: `null`
7
+ - Backend: `null`
8
+ - Database: `null`
9
+ - Hosting: `null`
10
+
11
+ ## System Diagram & Data Flow
12
+ `null`
13
+
14
+ ## Key Boundaries & Core Services
15
+ `null`
@@ -0,0 +1,12 @@
1
+ # Business Rules & Domain Logic
2
+
3
+ > Central rules governing application domain models, logic constraints, workflows, and edge cases.
4
+
5
+ ## User Constraints & Rules
6
+ - `null`
7
+
8
+ ## Financial & Transactional Rules
9
+ - `null`
10
+
11
+ ## State Transitions & Workflows
12
+ - `null`
@@ -0,0 +1,12 @@
1
+ # Context Budget & Token Management
2
+
3
+ > Core limits, file exclusion lists, and guidelines to prevent context window saturation and minimize token bloat.
4
+
5
+ ## Rules
6
+ 1. Never pass unnecessary build outputs or dependencies (`node_modules`, `.next`, `dist`) to the context.
7
+ 2. In large codebases, switch the AI config `mode` to `caveman` to use abbreviated instructions.
8
+ 3. Keep logs inside `.ai/session-logs/` pruned or gitignored by default.
9
+
10
+ ## Budgets
11
+ - Target instruction token size: under 1,000 tokens
12
+ - Max active codebase files in context: 15-20 files
@@ -0,0 +1,15 @@
1
+ # Deployment Rules & Procedures
2
+
3
+ > Standard parameters for continuous delivery, deployment gating, production environments, and rollbacks.
4
+
5
+ ## Environments
6
+ - Staging URL: `null`
7
+ - Production URL: `null`
8
+
9
+ ## Build Gating Checks
10
+ - All unit tests must pass
11
+ - Code build must succeed in production bundle mode
12
+ - Lint checks must return 0 errors
13
+
14
+ ## Automated Rollback Criteria
15
+ - `null`
@@ -0,0 +1,11 @@
1
+ # Model Map & Capability Routing
2
+
3
+ > Guidelines mapping specific project features and workflow steps to the best-suited AI coding models.
4
+
5
+ ## Routing Schema
6
+
7
+ | Model Class | Ideal Tasks | Examples |
8
+ |-------------|-------------|----------|
9
+ | High-Reasoning (e.g. Claude 3.5 Sonnet, GPT-4o) | Planning, Architecture, Refactoring, Complex Logic | Planning a module, multi-file edits |
10
+ | Fast/Token-Minimized (e.g. Gemini Flash, GPT-4o-mini) | Quick Bugfixes, Repetitive edits, Lint fixing, Verification | Fixing single-line errors |
11
+ | Specialized Code Models (e.g. Codex variants) | Review, Inline Completions | PR audits, Doc writing |
@@ -0,0 +1,17 @@
1
+ # Project Brief
2
+
3
+ > Central description of the project, mission statement, target audience, and key goals.
4
+
5
+ ## Core Purpose
6
+ Provide a single sentence defining the project's primary value proposition.
7
+ `null`
8
+
9
+ ## Target Audience
10
+ - `null`
11
+
12
+ ## Key Business Goals
13
+ 1. `null`
14
+ 2. `null`
15
+
16
+ ## Success Metrics
17
+ - `null`
@@ -0,0 +1,15 @@
1
+ # SEO & Semantic HTML Rules
2
+
3
+ > Standard guidelines for search engine optimization, meta descriptions, page speed parameters, and page structure.
4
+
5
+ ## Document Structure & Heading Rules
6
+ - Ensure exactly one `<h1>` per page.
7
+ - Maintain a proper hierarchy for `<h2>` down to `<h6>`.
8
+ - Use HTML5 semantic elements (`<header>`, `<main>`, `<article>`, `<footer>`).
9
+
10
+ ## Metadata Standards
11
+ - Title tag formatting: `null`
12
+ - Description constraints: `null` (Under 160 characters recommended)
13
+
14
+ ## Performance Metrics
15
+ - Core Web Vitals target: `null`
@@ -0,0 +1,37 @@
1
+ # Prompts
2
+
3
+ > Reusable prompt templates for AI coding agents.
4
+
5
+ ## Purpose
6
+
7
+ Store prompt templates that agents or humans can reference:
8
+ - Code review prompts
9
+ - Architecture analysis prompts
10
+ - Refactoring prompts
11
+ - Testing strategy prompts
12
+
13
+ ## Format
14
+
15
+ Each prompt is a markdown file:
16
+
17
+ ```markdown
18
+ # Prompt: {name}
19
+
20
+ ## When to Use
21
+ {Trigger conditions}
22
+
23
+ ## Template
24
+ {The prompt text with {placeholders}}
25
+
26
+ ## Variables
27
+ | Variable | Description |
28
+ |----------|-------------|
29
+ | {project} | Project name |
30
+ ```
31
+
32
+ ## Guidelines
33
+
34
+ - One prompt per file
35
+ - Use `{variable}` syntax for placeholders
36
+ - Keep prompts under 50 lines
37
+ - Name files descriptively: `code-review.md`, `architecture-audit.md`
@@ -0,0 +1,5 @@
1
+ # System Prompt: Generate Tests
2
+
3
+ > Instructions for drafting high-coverage unit tests and integration suites covering edge cases.
4
+
5
+ Analyze logic boundaries. Draft assertions covering successful states, empty inputs, null constraints, and failure modes.
@@ -0,0 +1,5 @@
1
+ # System Prompt: Handoff to Next Model
2
+
3
+ > Instructions for preparing file pointers and transition details when handing off to another agent/model.
4
+
5
+ Detail current milestone progress. Point the next model/agent specifically to files to work on and next actions.
@@ -0,0 +1,5 @@
1
+ # System Prompt: Implement Safely
2
+
3
+ > Instructions guiding safe, modular coding with targeted replacements and regression awareness.
4
+
5
+ Do not rewrite whole files. Target specific line modifications. Enforce lint correctness and run local build verification checks proactively.
@@ -0,0 +1,5 @@
1
+ # System Prompt: Plan First
2
+
3
+ > Instructions directing an agent to always draft an implementation plan before writing any code.
4
+
5
+ Ensure you research the codebase, identify dependencies, list all files to create or modify, outline your verification test cases, and obtain approval before editing files.
@@ -0,0 +1,5 @@
1
+ # System Prompt: Review Diff
2
+
3
+ > Instructions for conducting strict PR diff audits and locating syntax issues or memory leaks.
4
+
5
+ Inspect git diffs strictly. Identify security flaws, resource leaks, syntax regressions, and deviations from style guidelines.
@@ -0,0 +1,5 @@
1
+ # System Prompt: Summarize Session
2
+
3
+ > Instructions to generate standardized markdown session summaries under `.ai/session-logs/`.
4
+
5
+ Summarize what tasks were completed, files changed, blockers remaining, and context required for the next agent session.
@@ -0,0 +1 @@
1
+
@@ -0,0 +1,49 @@
1
+ # Session Logs
2
+
3
+ > Agent session logs for tracking work across multi-agent workflows.
4
+
5
+ ## Purpose
6
+
7
+ When an AI agent completes a session, it can log:
8
+ - What was done
9
+ - What files changed
10
+ - What to do next
11
+ - Any blockers or decisions made
12
+
13
+ ## Format
14
+
15
+ ```markdown
16
+ # Session: {agent_name}
17
+ **Timestamp:** {ISO 8601}
18
+ **Tool:** {tool_name}
19
+ **Role:** {role from .ai/agents/multimodel-orchestrator.md}
20
+
21
+ ## Summary
22
+ {What was done in 2-3 sentences}
23
+
24
+ ## Files Changed
25
+ - {path} ({created|modified|deleted})
26
+
27
+ ## Next Steps
28
+ 1. {Concrete next action}
29
+
30
+ ## Blockers
31
+ - {Any blockers, or "None"}
32
+ ```
33
+
34
+ ## Naming Convention
35
+
36
+ ```
37
+ {YYYY-MM-DD}-{agent}-{summary}.md
38
+ ```
39
+
40
+ Example: `2026-05-30-architect-auth-design.md`
41
+
42
+ ## Git Policy
43
+
44
+ Session logs are **gitignored by default** (session-specific data).
45
+ To commit them, remove the session-logs ignore rule from `.gitignore`.
46
+
47
+ ## Retention
48
+
49
+ Keep the last 10 session logs. Archive or delete older ones.
@@ -0,0 +1,34 @@
1
+ # Skills
2
+
3
+ > Reusable agent skills that extend what AI agents can do in your project.
4
+
5
+ ## What is a Skill?
6
+
7
+ A skill is a markdown file that teaches an AI agent a specific capability:
8
+ - How to perform a database migration
9
+ - How to set up a new microservice
10
+ - How to run a specific test suite
11
+ - How to deploy to a specific environment
12
+
13
+ ## Structure
14
+
15
+ Each skill is a markdown file in this directory:
16
+
17
+ ```
18
+ .ai/skills/
19
+ ├── README.md ← You are here
20
+ ├── example-skill.md ← Example template
21
+ ├── your-skill-name.md ← Your custom skills
22
+ └── ...
23
+ ```
24
+
25
+ ## Creating a Skill
26
+
27
+ 1. Copy `example-skill.md` as a starting point
28
+ 2. Define the skill name, description, and steps
29
+ 3. Include any commands, code snippets, or decision trees
30
+ 4. Keep skills focused — one skill, one capability
31
+
32
+ ## Loading
33
+
34
+ When `auto_load: true` in `.ai/config.yaml`, agents read all skills in this directory at session start. Keep the directory small to avoid context bloat.
@@ -0,0 +1,9 @@
1
+ # General Bug Fix Skill
2
+
3
+ > Methodical approach for diagnosing, replicating, fixing, and verifying code issues.
4
+
5
+ ## Protocol
6
+ 1. Locate source of the issue using logs or stack trace details.
7
+ 2. Replicate the failure locally with a targeted test case.
8
+ 3. Apply minimal, precise code edits.
9
+ 4. Run validation checks to ensure no regressions are introduced.
@@ -0,0 +1,2 @@
1
+ # caveman-bug-fix
2
+ locate error -> fix -> run tests -> repeat
@@ -0,0 +1,2 @@
1
+ # caveman-context-handoff
2
+ write brief log -> notify next agent
@@ -0,0 +1,2 @@
1
+ # caveman-feature-build
2
+ map endpoints -> write components -> verify build