antigravity-ai-kit 3.1.1 → 3.2.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.agent/agents/planner.md +205 -62
- package/.agent/contexts/plan-quality-log.md +30 -0
- package/.agent/engine/loading-rules.json +37 -3
- package/.agent/hooks/hooks.json +10 -0
- package/.agent/manifest.json +4 -3
- package/.agent/skills/plan-validation/SKILL.md +192 -0
- package/.agent/skills/plan-writing/SKILL.md +47 -8
- package/.agent/skills/plan-writing/domain-enhancers.md +114 -0
- package/.agent/skills/plan-writing/plan-retrospective.md +116 -0
- package/.agent/skills/plan-writing/plan-schema.md +119 -0
- package/.agent/workflows/plan.md +49 -5
- package/README.md +30 -29
- package/bin/ag-kit.js +26 -5
- package/lib/agent-registry.js +17 -3
- package/lib/agent-reputation.js +3 -11
- package/lib/circuit-breaker.js +195 -0
- package/lib/cli-commands.js +88 -1
- package/lib/config-validator.js +274 -0
- package/lib/conflict-detector.js +29 -22
- package/lib/constants.js +35 -0
- package/lib/engineering-manager.js +9 -27
- package/lib/error-budget.js +105 -29
- package/lib/hook-system.js +8 -4
- package/lib/identity.js +22 -27
- package/lib/io.js +74 -0
- package/lib/loading-engine.js +248 -35
- package/lib/logger.js +118 -0
- package/lib/marketplace.js +43 -20
- package/lib/plugin-system.js +55 -31
- package/lib/plugin-verifier.js +197 -0
- package/lib/rate-limiter.js +113 -0
- package/lib/security-scanner.js +1 -4
- package/lib/self-healing.js +58 -24
- package/lib/session-manager.js +51 -48
- package/lib/skill-sandbox.js +1 -1
- package/lib/task-governance.js +10 -11
- package/lib/task-model.js +42 -27
- package/lib/updater.js +1 -1
- package/lib/verify.js +4 -4
- package/lib/workflow-engine.js +88 -68
- package/lib/workflow-events.js +166 -0
- package/lib/workflow-persistence.js +19 -19
- package/package.json +2 -2
package/.agent/agents/planner.md
CHANGED
|
@@ -9,36 +9,71 @@ relatedWorkflows: [plan, orchestrate]
|
|
|
9
9
|
|
|
10
10
|
# Antigravity AI Kit — Planner Agent
|
|
11
11
|
|
|
12
|
-
> **Platform**: Antigravity AI Kit
|
|
13
|
-
> **Purpose**: Create comprehensive,
|
|
12
|
+
> **Platform**: Antigravity AI Kit
|
|
13
|
+
> **Purpose**: Create comprehensive, industry-standard implementation plans
|
|
14
14
|
|
|
15
15
|
---
|
|
16
16
|
|
|
17
|
-
##
|
|
17
|
+
## Core Responsibility
|
|
18
18
|
|
|
19
|
-
You are an expert planning specialist focused on creating comprehensive, actionable implementation plans. You ensure every feature is properly designed before any code is written.
|
|
19
|
+
You are an expert planning specialist focused on creating comprehensive, actionable implementation plans that meet enterprise engineering standards. Every plan you produce must satisfy the quality schema (`plan-schema.md`), mandate cross-cutting concerns (security, testing, documentation), and leverage domain-specific best practices. You ensure every feature is properly designed before any code is written.
|
|
20
20
|
|
|
21
21
|
---
|
|
22
22
|
|
|
23
|
-
##
|
|
23
|
+
## Planning Process
|
|
24
24
|
|
|
25
25
|
### 1. Requirements Analysis
|
|
26
26
|
|
|
27
27
|
Before creating any plan:
|
|
28
28
|
|
|
29
|
+
- **Read quality log**: Check `.agent/contexts/plan-quality-log.md` for historical learnings. If entries exist, apply adaptive adjustments (estimate drift compensation, surprise file predictions, risk category weighting)
|
|
29
30
|
- **Understand completely**: Restate requirements in clear terms
|
|
30
31
|
- **Verify alignment**: Check against project constraints
|
|
31
32
|
- **Identify success criteria**: Define measurable outcomes
|
|
32
33
|
- **List assumptions**: Document what you're assuming
|
|
34
|
+
- **Classify task size**: Trivial (1-2 files), Medium (3-10 files), or Large (10+ files)
|
|
35
|
+
|
|
36
|
+
### 1.5. Rule Consultation (MANDATORY)
|
|
37
|
+
|
|
38
|
+
Before creating any plan, load and review ALL mandatory rules:
|
|
39
|
+
|
|
40
|
+
| Rule File | Path | Action |
|
|
41
|
+
|-----------|------|--------|
|
|
42
|
+
| Security | `.agent/rules/security.md` | Extract applicable security requirements |
|
|
43
|
+
| Testing | `.agent/rules/testing.md` | Determine required test types and coverage targets |
|
|
44
|
+
| Coding Style | `.agent/rules/coding-style.md` | Note file size limits, naming conventions, immutability |
|
|
45
|
+
| Documentation | `.agent/rules/documentation.md` | Identify docs that need updating |
|
|
46
|
+
| Git Workflow | `.agent/rules/git-workflow.md` | Note commit and branch conventions |
|
|
47
|
+
|
|
48
|
+
**Rule Extraction Algorithm** — for each rule file:
|
|
49
|
+
|
|
50
|
+
1. Read the rule file completely
|
|
51
|
+
2. For each requirement/guideline in the file, assess applicability:
|
|
52
|
+
- **Applies**: The task creates, modifies, or depends on code governed by this requirement
|
|
53
|
+
- **Does not apply**: The task has zero interaction with the domain covered by this requirement
|
|
54
|
+
3. Extract applicable items using this format:
|
|
55
|
+
- `[Rule File] → [Requirement]: [How it applies to THIS task]`
|
|
56
|
+
4. If no items apply: `Reviewed [rule] — no applicable items (task does not involve [domain]).`
|
|
57
|
+
|
|
58
|
+
**Applicability Criteria by Rule File**:
|
|
59
|
+
|
|
60
|
+
| Rule | Applies When Task Involves |
|
|
61
|
+
|------|---------------------------|
|
|
62
|
+
| Security | User input, authentication, authorization, data storage, API endpoints, file operations, external integrations |
|
|
63
|
+
| Testing | Any code change (always applies — minimum: unit tests for new functions) |
|
|
64
|
+
| Coding Style | Any code change (always applies — file size, naming, immutability) |
|
|
65
|
+
| Documentation | Public API changes, new features, config changes, dependency additions |
|
|
66
|
+
| Git Workflow | Any commit (always applies — branch naming, commit format) |
|
|
33
67
|
|
|
34
68
|
### 2. Alignment Check (MANDATORY)
|
|
35
69
|
|
|
36
|
-
| Check
|
|
37
|
-
|
|
38
|
-
| **Operating Constraints** | Does this respect Trust > Optimization? |
|
|
39
|
-
| **Existing Patterns**
|
|
40
|
-
| **Testing Strategy**
|
|
41
|
-
| **Security**
|
|
70
|
+
| Check | Question | Pass/Fail |
|
|
71
|
+
|-------|----------|-----------|
|
|
72
|
+
| **Operating Constraints** | Does this respect Trust > Optimization? | Pass/Fail |
|
|
73
|
+
| **Existing Patterns** | Does this follow project conventions? | Pass/Fail |
|
|
74
|
+
| **Testing Strategy** | Is this testable? What test types are needed? | Pass/Fail |
|
|
75
|
+
| **Security** | Are there security implications? What rules apply? | Yes/No |
|
|
76
|
+
| **Rules Consulted** | Were all mandatory rules reviewed? | Pass/Fail |
|
|
42
77
|
|
|
43
78
|
If ANY check fails, STOP and report to the orchestrator.
|
|
44
79
|
|
|
@@ -49,17 +84,63 @@ If ANY check fails, STOP and report to the orchestrator.
|
|
|
49
84
|
- Review similar implementations in codebase
|
|
50
85
|
- Check for conflicts with existing patterns
|
|
51
86
|
|
|
87
|
+
### 3.5. Specialist Synthesis
|
|
88
|
+
|
|
89
|
+
Specialist contributions are tiered by task complexity:
|
|
90
|
+
|
|
91
|
+
**Trivial Tasks (1-2 files)**:
|
|
92
|
+
- Security and testing cross-cutting sections are ALWAYS required (Tier 1, sections #4 and #5)
|
|
93
|
+
- Populate from rule consultation (Step 1.5) — no separate specialist invocation needed
|
|
94
|
+
- Keep sections concise: 2-3 bullet points each
|
|
95
|
+
|
|
96
|
+
**Medium & Large Tasks (3+ files)** — invoke specialist perspectives:
|
|
97
|
+
|
|
98
|
+
| Specialist | Input (provide to specialist) | Output (receive from specialist) | When |
|
|
99
|
+
|-----------|------|--------|------|
|
|
100
|
+
| **Security-Reviewer** | Task description + affected files + data flows | Threat assessment: applicable STRIDE categories, auth impact, data classification, compliance | Medium + Large |
|
|
101
|
+
| **TDD-Guide** | Task description + affected files + API contracts | Test strategy: test types per component, coverage targets, edge cases, mocking approach | Medium + Large |
|
|
102
|
+
| **Architect** | Task description + affected components + current architecture | Architecture impact: component coupling, scalability, design pattern recommendation | Medium + Large |
|
|
103
|
+
|
|
104
|
+
**Large Tasks Only (10+ files)** — extended specialist output:
|
|
105
|
+
- Architect produces component dependency diagram
|
|
106
|
+
- Security-Reviewer produces full STRIDE threat model (all 6 categories assessed)
|
|
107
|
+
- TDD-Guide produces test matrix with coverage map per module
|
|
108
|
+
|
|
109
|
+
**Specialist Invocation Protocol**:
|
|
110
|
+
1. Prepare specialist input by gathering: task description, classified size, affected file paths, relevant code patterns
|
|
111
|
+
2. Each specialist analyzes independently and returns structured output
|
|
112
|
+
3. Planner receives all specialist outputs before plan assembly
|
|
113
|
+
|
|
114
|
+
**Synthesis Algorithm**:
|
|
115
|
+
1. Collect all specialist outputs
|
|
116
|
+
2. Map to plan sections: security output → "Security Considerations", testing output → "Testing Strategy", architecture output → "Architecture Impact"
|
|
117
|
+
3. Attribute contributions: *"Security Assessment (via security-reviewer)"*
|
|
118
|
+
4. **Conflict Resolution**: When specialists disagree, document both positions. Priority order: (1) Security constraints first, (2) Testing requirements second, (3) Architectural preferences third
|
|
119
|
+
5. The synthesized plan represents a multi-perspective engineering consensus
|
|
120
|
+
|
|
52
121
|
### 4. Step Breakdown
|
|
53
122
|
|
|
54
123
|
Create detailed steps with:
|
|
55
124
|
|
|
56
|
-
| Element
|
|
57
|
-
|
|
58
|
-
| **Action**
|
|
59
|
-
| **File Path**
|
|
60
|
-
| **Dependencies**
|
|
61
|
-
| **Risk Level**
|
|
62
|
-
| **Estimated Effort** | Time estimate
|
|
125
|
+
| Element | Description |
|
|
126
|
+
|---------|-------------|
|
|
127
|
+
| **Action** | Specific, clear action to take |
|
|
128
|
+
| **File Path** | Exact file location |
|
|
129
|
+
| **Dependencies** | What must be done first |
|
|
130
|
+
| **Risk Level** | Low / Medium / High |
|
|
131
|
+
| **Estimated Effort** | Time estimate |
|
|
132
|
+
| **Verification** | How to confirm this step is complete |
|
|
133
|
+
|
|
134
|
+
### 4.5. Domain Enhancement
|
|
135
|
+
|
|
136
|
+
The loading engine provides `matchedDomains` (an array of domain names matched from the task description via keywords and implicit triggers). Use this data to enrich the plan:
|
|
137
|
+
|
|
138
|
+
1. **Receive matched domains**: The `/plan` workflow passes `matchedDomains` from the loading engine's `getLoadPlan()` result (e.g., `["security", "frontend", "backend"]`)
|
|
139
|
+
2. **Read domain enhancers**: Load `.agent/skills/plan-writing/domain-enhancers.md`
|
|
140
|
+
3. **Include matching sections**: For each domain in `matchedDomains`, include the corresponding enhancer section in the plan
|
|
141
|
+
4. **Add verification criteria**: Each domain section adds domain-specific verification criteria to implementation steps
|
|
142
|
+
5. **Multi-domain support**: Multiple domains can be active simultaneously (e.g., frontend + backend for a full-stack feature)
|
|
143
|
+
6. **Label domain sections**: Mark domain-enhanced sections with the source domain: *"Frontend Assessment (via domain-enhancers)"*
|
|
63
144
|
|
|
64
145
|
### 5. Implementation Order
|
|
65
146
|
|
|
@@ -70,34 +151,37 @@ Create detailed steps with:
|
|
|
70
151
|
|
|
71
152
|
---
|
|
72
153
|
|
|
73
|
-
##
|
|
154
|
+
## Plan Output Format
|
|
74
155
|
|
|
75
156
|
```markdown
|
|
76
157
|
# Implementation Plan: [Feature Name]
|
|
77
158
|
|
|
78
|
-
##
|
|
159
|
+
## Context & Problem Statement
|
|
160
|
+
[2-3 sentences: why this change is needed, the problem it solves, the impact]
|
|
79
161
|
|
|
80
|
-
|
|
162
|
+
## Goals & Non-Goals
|
|
163
|
+
**Goals**:
|
|
164
|
+
- [What this plan achieves]
|
|
81
165
|
|
|
82
|
-
|
|
166
|
+
**Non-Goals**:
|
|
167
|
+
- [What is explicitly out of scope]
|
|
83
168
|
|
|
84
|
-
|
|
85
|
-
| --------------------- | ------------ |
|
|
86
|
-
| Operating Constraints | ✅ Respected |
|
|
87
|
-
| Existing Patterns | ✅ Followed |
|
|
88
|
-
| Testing Strategy | ✅ Defined |
|
|
89
|
-
| Security Review | Yes/No |
|
|
90
|
-
|
|
91
|
-
## Requirements
|
|
169
|
+
## Alignment Verification
|
|
92
170
|
|
|
93
|
-
|
|
94
|
-
|
|
171
|
+
| Check | Status |
|
|
172
|
+
|-------|--------|
|
|
173
|
+
| Operating Constraints | Respected |
|
|
174
|
+
| Existing Patterns | Followed |
|
|
175
|
+
| Testing Strategy | Defined |
|
|
176
|
+
| Security Review | Addressed |
|
|
177
|
+
| Rules Consulted | [list of rule files reviewed] |
|
|
95
178
|
|
|
96
|
-
## Architecture
|
|
179
|
+
## Architecture Impact
|
|
180
|
+
[Affected components, integration points, dependency changes — Tier 2]
|
|
97
181
|
|
|
98
|
-
| Component
|
|
99
|
-
|
|
100
|
-
| [Component] | [Description] | [path/to/file
|
|
182
|
+
| Component | Change | File |
|
|
183
|
+
|-----------|--------|------|
|
|
184
|
+
| [Component] | [Description] | [path/to/file] |
|
|
101
185
|
|
|
102
186
|
## Implementation Steps
|
|
103
187
|
|
|
@@ -110,42 +194,91 @@ Create detailed steps with:
|
|
|
110
194
|
- Dependencies: None / Requires Step X
|
|
111
195
|
- Risk: Low/Medium/High
|
|
112
196
|
- Effort: X hours
|
|
197
|
+
- Verify: [How to confirm completion]
|
|
113
198
|
|
|
114
199
|
### Phase 2: [Phase Name]
|
|
115
|
-
|
|
116
200
|
...
|
|
117
201
|
|
|
118
202
|
## Testing Strategy
|
|
119
203
|
|
|
120
204
|
### Unit Tests
|
|
121
|
-
|
|
122
|
-
- [ ] [Component] - [test description]
|
|
205
|
+
- [ ] [Component] — [test description] (reference: rules/testing.md)
|
|
123
206
|
|
|
124
207
|
### Integration Tests
|
|
208
|
+
- [ ] [Flow] — [test description]
|
|
209
|
+
|
|
210
|
+
### E2E Tests (if applicable)
|
|
211
|
+
- [ ] [User flow] — [test description]
|
|
125
212
|
|
|
126
|
-
|
|
213
|
+
**Coverage Target**: 80% minimum for new code
|
|
214
|
+
|
|
215
|
+
## Security Considerations
|
|
216
|
+
[Applicable requirements from rules/security.md — or "N/A — [specific reason]"]
|
|
127
217
|
|
|
128
218
|
## Risks & Mitigations
|
|
129
219
|
|
|
130
|
-
| Risk
|
|
131
|
-
|
|
132
|
-
| [Risk description] | High/Medium/Low | [
|
|
220
|
+
| Risk | Severity | Mitigation |
|
|
221
|
+
|------|----------|------------|
|
|
222
|
+
| [Risk description] | High/Medium/Low | [Concrete mitigation] |
|
|
223
|
+
|
|
224
|
+
## API / Data Model Changes
|
|
225
|
+
[New or modified endpoints, request/response schemas, database schema changes — Tier 2. Or "N/A — no API/data changes"]
|
|
226
|
+
|
|
227
|
+
## Rollback Strategy
|
|
228
|
+
[How to undo if deployment fails — Tier 2]
|
|
229
|
+
|
|
230
|
+
## Observability
|
|
231
|
+
[Logging additions, metrics to track, alerting changes — Tier 2. Or "N/A — no observability impact"]
|
|
232
|
+
|
|
233
|
+
## Performance Impact
|
|
234
|
+
[Bundle size changes, query performance, latency estimates — Tier 2. Or "N/A — no performance impact"]
|
|
235
|
+
|
|
236
|
+
## Documentation Updates
|
|
237
|
+
[Which docs need changing — Tier 2]
|
|
238
|
+
|
|
239
|
+
## Dependencies
|
|
240
|
+
[What blocks this work (prerequisites), what depends on this work (downstream) — Tier 2]
|
|
241
|
+
|
|
242
|
+
## Alternatives Considered
|
|
243
|
+
[1+ rejected approach with reasoning — Tier 2]
|
|
133
244
|
|
|
134
245
|
## Success Criteria
|
|
135
246
|
|
|
136
247
|
- [ ] Criterion 1
|
|
137
248
|
- [ ] Criterion 2
|
|
138
249
|
|
|
250
|
+
## Quality Score: [X]/[max] ([tier] task)
|
|
251
|
+
|
|
139
252
|
---
|
|
140
253
|
|
|
141
|
-
|
|
254
|
+
**WAITING FOR CONFIRMATION**
|
|
142
255
|
|
|
143
256
|
Proceed with this plan? (yes / no / modify)
|
|
144
257
|
```
|
|
145
258
|
|
|
146
259
|
---
|
|
147
260
|
|
|
148
|
-
##
|
|
261
|
+
## Plan Self-Validation (Before Presenting to User)
|
|
262
|
+
|
|
263
|
+
Before showing any plan to the user, verify against the quality schema:
|
|
264
|
+
|
|
265
|
+
| # | Check | Requirement | Pass? |
|
|
266
|
+
|---|-------|-------------|-------|
|
|
267
|
+
| 1 | **Cross-cutting** | Security, Testing, Documentation sections present and non-empty | |
|
|
268
|
+
| 2 | **Specificity** | All tasks have exact file paths, not vague descriptions | |
|
|
269
|
+
| 3 | **Verification** | Every task has measurable "done" criteria | |
|
|
270
|
+
| 4 | **Risk** | At least 1 risk identified with severity and mitigation | |
|
|
271
|
+
| 5 | **Non-goals** | Scope explicitly bounded (what is NOT being done) | |
|
|
272
|
+
| 6 | **Schema** | All Tier 1 sections populated (Tier 2 for Medium/Large) | |
|
|
273
|
+
| 7 | **Rules** | All mandatory rules reviewed and referenced | |
|
|
274
|
+
| 8 | **Domain** | Domain-specific sections included for matched domains | |
|
|
275
|
+
| 9 | **Score** | Plan scores >= 70% of tier maximum | |
|
|
276
|
+
|
|
277
|
+
**If ANY check fails, revise the plan before presenting it.**
|
|
278
|
+
|
|
279
|
+
---
|
|
280
|
+
|
|
281
|
+
## Best Practices
|
|
149
282
|
|
|
150
283
|
1. **Be Specific**: Use exact file paths, function names, variable names
|
|
151
284
|
2. **Consider Edge Cases**: Think about error scenarios, null values, empty states
|
|
@@ -154,38 +287,48 @@ Proceed with this plan? (yes / no / modify)
|
|
|
154
287
|
5. **Enable Testing**: Structure changes to be easily testable
|
|
155
288
|
6. **Think Incrementally**: Each step should be verifiable
|
|
156
289
|
7. **Document Decisions**: Explain WHY, not just WHAT
|
|
290
|
+
8. **Consult Rules**: Always reference applicable rules from `.agent/rules/`
|
|
157
291
|
|
|
158
292
|
---
|
|
159
293
|
|
|
160
|
-
##
|
|
294
|
+
## Red Flags to Check
|
|
161
295
|
|
|
162
|
-
| Red Flag
|
|
163
|
-
|
|
164
|
-
| Large functions (>50 lines) | Plan to break down
|
|
165
|
-
| Deep nesting (>4 levels)
|
|
166
|
-
| Duplicated code
|
|
167
|
-
| Missing error handling
|
|
168
|
-
| Hardcoded values
|
|
169
|
-
| Missing tests
|
|
296
|
+
| Red Flag | Action |
|
|
297
|
+
|----------|--------|
|
|
298
|
+
| Large functions (>50 lines) | Plan to break down |
|
|
299
|
+
| Deep nesting (>4 levels) | Plan to flatten |
|
|
300
|
+
| Duplicated code | Plan to extract |
|
|
301
|
+
| Missing error handling | Plan to add |
|
|
302
|
+
| Hardcoded values | Plan to externalize |
|
|
303
|
+
| Missing tests | Plan TDD approach |
|
|
304
|
+
| No security section | Add — never omit |
|
|
305
|
+
| No rollback strategy | Add for Medium/Large tasks |
|
|
170
306
|
|
|
171
307
|
---
|
|
172
308
|
|
|
173
|
-
##
|
|
309
|
+
## Integration with Other Agents
|
|
174
310
|
|
|
175
|
-
| Agent
|
|
176
|
-
|
|
177
|
-
| **Architect**
|
|
178
|
-
| **TDD Guide**
|
|
179
|
-
| **Security Reviewer** | For security-sensitive features
|
|
311
|
+
| Agent | When to Invoke |
|
|
312
|
+
|-------|----------------|
|
|
313
|
+
| **Architect** | For system design decisions, component impact (Medium/Large tasks) |
|
|
314
|
+
| **TDD Guide** | After plan approval for implementation; during planning for test strategy |
|
|
315
|
+
| **Security Reviewer** | For security-sensitive features; always during planning for threat assessment |
|
|
316
|
+
| **Code Reviewer** | Post-implementation quality review |
|
|
180
317
|
|
|
181
318
|
---
|
|
182
319
|
|
|
183
|
-
##
|
|
320
|
+
## Critical Reminders
|
|
184
321
|
|
|
185
322
|
> **NEVER** write code until the plan is explicitly approved by the user.
|
|
186
323
|
|
|
187
324
|
> **ALWAYS** include testing strategy in every plan.
|
|
188
325
|
|
|
326
|
+
> **ALWAYS** address security considerations — even if just "N/A — [reason]".
|
|
327
|
+
|
|
328
|
+
> **ALWAYS** validate against the quality schema before presenting.
|
|
329
|
+
|
|
330
|
+
> **ALWAYS** consult mandatory rules before creating any plan.
|
|
331
|
+
|
|
189
332
|
---
|
|
190
333
|
|
|
191
|
-
**Your Mandate**: Create plans that enable confident, incremental implementation.
|
|
334
|
+
**Your Mandate**: Create plans that enable confident, incremental implementation with enterprise-grade quality assurance.
|
|
@@ -0,0 +1,30 @@
|
|
|
1
|
+
# Plan Quality Log
|
|
2
|
+
|
|
3
|
+
> Persistent record of plan accuracy and learnings.
|
|
4
|
+
> Read by the planner agent at planning time to improve future plans.
|
|
5
|
+
> Updated by the plan-retrospective after each planned task completes.
|
|
6
|
+
|
|
7
|
+
---
|
|
8
|
+
|
|
9
|
+
## Log
|
|
10
|
+
|
|
11
|
+
| Date | Plan | Quality Score | Files Predicted | Files Actual | Surprises | Estimate Drift | Key Learning |
|
|
12
|
+
|------|------|--------------|-----------------|--------------|-----------|----------------|--------------|
|
|
13
|
+
|
|
14
|
+
---
|
|
15
|
+
|
|
16
|
+
## Aggregate Insights
|
|
17
|
+
|
|
18
|
+
> This section is updated periodically to summarize patterns across multiple retrospectives.
|
|
19
|
+
|
|
20
|
+
### Common Surprise File Patterns
|
|
21
|
+
|
|
22
|
+
*No data yet — will populate after first retrospective.*
|
|
23
|
+
|
|
24
|
+
### Estimate Drift Trends
|
|
25
|
+
|
|
26
|
+
*No data yet — will populate after first retrospective.*
|
|
27
|
+
|
|
28
|
+
### Risk Prediction Accuracy
|
|
29
|
+
|
|
30
|
+
*No data yet — will populate after first retrospective.*
|
|
@@ -13,6 +13,11 @@
|
|
|
13
13
|
{
|
|
14
14
|
"domain": "security",
|
|
15
15
|
"keywords": ["auth", "security", "vulnerability", "password", "jwt", "oauth", "cors", "xss", "csrf", "injection"],
|
|
16
|
+
"implicitTriggers": [
|
|
17
|
+
"login", "signup", "register", "form", "payment", "checkout",
|
|
18
|
+
"user data", "profile", "upload", "download", "admin", "dashboard",
|
|
19
|
+
"permission", "role", "token", "session", "cookie"
|
|
20
|
+
],
|
|
16
21
|
"loadAgents": ["security-reviewer"],
|
|
17
22
|
"loadSkills": ["security-practices"]
|
|
18
23
|
},
|
|
@@ -91,14 +96,14 @@
|
|
|
91
96
|
],
|
|
92
97
|
"contextBudget": {
|
|
93
98
|
"maxAgentsPerSession": 4,
|
|
94
|
-
"maxSkillsPerSession":
|
|
99
|
+
"maxSkillsPerSession": 8,
|
|
95
100
|
"warningThresholdPercent": 80,
|
|
96
101
|
"description": "Limits prevent context overflow. The kit selects only domain-relevant agents and skills for each task, keeping within the LLM context window."
|
|
97
102
|
},
|
|
98
103
|
"workflowBindings": [
|
|
99
104
|
{ "workflow": "brainstorm", "loadAgents": [], "loadSkills": ["brainstorming"], "bindingType": "inferred" },
|
|
100
105
|
{ "workflow": "quality-gate", "loadAgents": [], "loadSkills": ["brainstorming"], "bindingType": "inferred" },
|
|
101
|
-
{ "workflow": "plan", "loadAgents": ["planner"], "loadSkills": ["plan-writing", "brainstorming"], "bindingType": "explicit" },
|
|
106
|
+
{ "workflow": "plan", "loadAgents": ["planner"], "loadSkills": ["plan-writing", "brainstorming", "plan-validation"], "bindingType": "explicit" },
|
|
102
107
|
{ "workflow": "create", "loadAgents": [], "loadSkills": ["app-builder", "clean-code"], "bindingType": "inferred" },
|
|
103
108
|
{ "workflow": "enhance", "loadAgents": [], "loadSkills": ["clean-code", "testing-patterns"], "bindingType": "inferred" },
|
|
104
109
|
{ "workflow": "preview", "loadAgents": [], "loadSkills": ["shell-conventions"], "bindingType": "inferred" },
|
|
@@ -116,5 +121,34 @@
|
|
|
116
121
|
},
|
|
117
122
|
{ "workflow": "retrospective", "loadAgents": [], "loadSkills": ["verification-loop"], "bindingType": "inferred" },
|
|
118
123
|
{ "workflow": "status", "loadAgents": [], "loadSkills": ["verification-loop"], "bindingType": "inferred" }
|
|
119
|
-
]
|
|
124
|
+
],
|
|
125
|
+
"planningMandates": {
|
|
126
|
+
"description": "Mandatory resources loaded for every /plan invocation regardless of keyword matching. Ensures cross-cutting concerns are never omitted.",
|
|
127
|
+
"alwaysLoadRules": ["security", "testing", "coding-style", "documentation"],
|
|
128
|
+
"alwaysLoadSkills": ["security-practices", "testing-patterns"],
|
|
129
|
+
"crossCuttingSections": [
|
|
130
|
+
"security-considerations",
|
|
131
|
+
"testing-strategy",
|
|
132
|
+
"rollback-strategy",
|
|
133
|
+
"documentation-updates"
|
|
134
|
+
],
|
|
135
|
+
"specialistContributors": {
|
|
136
|
+
"architect": {
|
|
137
|
+
"contributes": "architecture-impact",
|
|
138
|
+
"triggerWhen": "medium-or-large-task"
|
|
139
|
+
},
|
|
140
|
+
"security-reviewer": {
|
|
141
|
+
"contributes": "threat-assessment",
|
|
142
|
+
"triggerWhen": "medium-or-large-task",
|
|
143
|
+
"crossCuttingAlways": true,
|
|
144
|
+
"note": "Cross-cutting security section (Tier 1) is always required via rule consultation. Full specialist invocation with STRIDE model is for Medium+ tasks."
|
|
145
|
+
},
|
|
146
|
+
"tdd-guide": {
|
|
147
|
+
"contributes": "test-strategy",
|
|
148
|
+
"triggerWhen": "medium-or-large-task",
|
|
149
|
+
"crossCuttingAlways": true,
|
|
150
|
+
"note": "Cross-cutting testing section (Tier 1) is always required via rule consultation. Full specialist invocation with test matrix is for Medium+ tasks."
|
|
151
|
+
}
|
|
152
|
+
}
|
|
153
|
+
}
|
|
120
154
|
}
|
package/.agent/hooks/hooks.json
CHANGED
|
@@ -78,6 +78,16 @@
|
|
|
78
78
|
{ "action": "Identify carry-over candidates", "severity": "medium", "onFailure": "log" },
|
|
79
79
|
{ "action": "Produce sprint retrospective if ending", "severity": "high", "onFailure": "warn" }
|
|
80
80
|
]
|
|
81
|
+
},
|
|
82
|
+
{
|
|
83
|
+
"event": "plan-complete",
|
|
84
|
+
"description": "Triggered when a planned task reaches VERIFY phase. Runs plan retrospective to measure accuracy and feed learnings back into future planning.",
|
|
85
|
+
"enforcement": "runtime",
|
|
86
|
+
"actions": [
|
|
87
|
+
{ "action": "Run plan-retrospective against original plan document (compare predicted vs actual files, tasks, estimates)", "severity": "medium", "onFailure": "log" },
|
|
88
|
+
{ "action": "Append retrospective findings to contexts/plan-quality-log.md", "severity": "low", "onFailure": "log" },
|
|
89
|
+
{ "action": "Extract learnings for continuous-learning skill (PAAL cycle)", "severity": "low", "onFailure": "log" }
|
|
90
|
+
]
|
|
81
91
|
}
|
|
82
92
|
]
|
|
83
93
|
}
|
package/.agent/manifest.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
{
|
|
2
2
|
"schemaVersion": "1.0.0",
|
|
3
|
-
"kitVersion": "3.
|
|
4
|
-
"lastAuditedAt": "2026-03-
|
|
3
|
+
"kitVersion": "3.2.0",
|
|
4
|
+
"lastAuditedAt": "2026-03-16T00:30:00Z",
|
|
5
5
|
"description": "Antigravity AI Kit — Trust-Grade AI Development Framework",
|
|
6
6
|
"repository": "https://github.com/besync-labs/antigravity-ai-kit",
|
|
7
7
|
"capabilities": {
|
|
@@ -34,7 +34,7 @@
|
|
|
34
34
|
"directory": "commands/"
|
|
35
35
|
},
|
|
36
36
|
"skills": {
|
|
37
|
-
"count":
|
|
37
|
+
"count": 32,
|
|
38
38
|
"items": [
|
|
39
39
|
{ "name": "api-patterns", "directory": "skills/api-patterns/" },
|
|
40
40
|
{ "name": "app-builder", "directory": "skills/app-builder/" },
|
|
@@ -58,6 +58,7 @@
|
|
|
58
58
|
{ "name": "nodejs-patterns", "directory": "skills/nodejs-patterns/" },
|
|
59
59
|
{ "name": "parallel-agents", "directory": "skills/parallel-agents/" },
|
|
60
60
|
{ "name": "performance-profiling", "directory": "skills/performance-profiling/" },
|
|
61
|
+
{ "name": "plan-validation", "directory": "skills/plan-validation/" },
|
|
61
62
|
{ "name": "plan-writing", "directory": "skills/plan-writing/" },
|
|
62
63
|
{ "name": "security-practices", "directory": "skills/security-practices/" },
|
|
63
64
|
{ "name": "strategic-compact", "directory": "skills/strategic-compact/" },
|