@nano-step/skill-manager 5.6.0 → 5.6.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/utils.d.ts +1 -1
- package/dist/utils.js +1 -1
- package/package.json +1 -1
- package/private-catalog.json +5 -0
- package/skills/deep-design/SKILL.md +402 -0
- package/skills/deep-design/evals/evals.json +23 -0
- package/skills/deep-design/skill.json +7 -0
- package/skills/feature-analysis/SKILL.md +290 -0
- package/skills/feature-analysis/skill.json +15 -0
- package/skills/nano-brain/AGENTS_SNIPPET.md +0 -9
- package/skills/nano-brain/skill.json +7 -0
- package/skills/pr-code-reviewer/CHANGELOG.md +287 -0
- package/skills/pr-code-reviewer/RESEARCH.md +60 -0
- package/skills/pr-code-reviewer/SKILL.md +530 -0
- package/skills/pr-code-reviewer/assets/config.json +47 -0
- package/skills/pr-code-reviewer/checklists/backend-express.md +357 -0
- package/skills/pr-code-reviewer/checklists/ci-cd.md +428 -0
- package/skills/pr-code-reviewer/checklists/consumer-search-matrix.md +339 -0
- package/skills/pr-code-reviewer/checklists/database.md +382 -0
- package/skills/pr-code-reviewer/checklists/frontend-vue-nuxt.md +426 -0
- package/skills/pr-code-reviewer/checklists/review-checklist.md +116 -0
- package/skills/pr-code-reviewer/references/framework-rules/express.md +39 -0
- package/skills/pr-code-reviewer/references/framework-rules/nestjs.md +41 -0
- package/skills/pr-code-reviewer/references/framework-rules/typeorm.md +52 -0
- package/skills/pr-code-reviewer/references/framework-rules/typescript.md +50 -0
- package/skills/pr-code-reviewer/references/framework-rules/vue-nuxt.md +53 -0
- package/skills/pr-code-reviewer/references/nano-brain-integration.md +61 -0
- package/skills/pr-code-reviewer/references/performance-patterns.md +26 -0
- package/skills/pr-code-reviewer/references/quality-patterns.md +25 -0
- package/skills/pr-code-reviewer/references/report-template.md +167 -0
- package/skills/pr-code-reviewer/references/security-patterns.md +31 -0
- package/skills/pr-code-reviewer/references/subagent-prompts.md +323 -0
- package/skills/pr-code-reviewer/skill.json +15 -0
- package/skills/rri-t-testing/SKILL.md +224 -0
- package/skills/rri-t-testing/assets/rri-t-coverage-dashboard.md +138 -0
- package/skills/rri-t-testing/assets/rri-t-memory-protocol.md +271 -0
- package/skills/rri-t-testing/assets/rri-t-persona-interview.md +249 -0
- package/skills/rri-t-testing/assets/rri-t-quality-scorecard.md +122 -0
- package/skills/rri-t-testing/assets/rri-t-risk-matrix.md +87 -0
- package/skills/rri-t-testing/assets/rri-t-stress-matrix.md +100 -0
- package/skills/rri-t-testing/assets/rri-t-test-case.md +181 -0
- package/skills/rri-t-testing/assets/rri-t-testability-gate.md +131 -0
- package/skills/rri-t-testing/assets/rri-t-traceability-matrix.md +105 -0
- package/skills/rri-t-testing/skill.json +9 -0
package/dist/utils.d.ts
CHANGED
package/dist/utils.js
CHANGED
|
@@ -13,7 +13,7 @@ exports.writeText = writeText;
|
|
|
13
13
|
const path_1 = __importDefault(require("path"));
|
|
14
14
|
const os_1 = __importDefault(require("os"));
|
|
15
15
|
const fs_extra_1 = __importDefault(require("fs-extra"));
|
|
16
|
-
exports.MANAGER_VERSION = "5.6.
|
|
16
|
+
exports.MANAGER_VERSION = "5.6.1";
|
|
17
17
|
async function detectOpenCodePaths() {
|
|
18
18
|
const homeConfig = path_1.default.join(os_1.default.homedir(), ".config", "opencode");
|
|
19
19
|
const cwd = process.cwd();
|
package/package.json
CHANGED
package/private-catalog.json
CHANGED
|
@@ -19,6 +19,11 @@
|
|
|
19
19
|
"version": "7.1.0",
|
|
20
20
|
"description": "PR review with MANDATORY cross-repo consumer search, nano-brain code intelligence, and better-context structural analysis. READ-ONLY — no comments, pushes, or code fixes."
|
|
21
21
|
},
|
|
22
|
+
{
|
|
23
|
+
"name": "deep-design",
|
|
24
|
+
"version": "1.0.0",
|
|
25
|
+
"description": "Multi-agent planning pipeline: Metis + Oracle → Synthesis → OpenSpec → Momus review"
|
|
26
|
+
},
|
|
22
27
|
{
|
|
23
28
|
"name": "rri-t-testing",
|
|
24
29
|
"version": "1.0.0",
|
|
@@ -0,0 +1,402 @@
|
|
|
1
|
+
---
|
|
2
|
+
name: deep-design
|
|
3
|
+
description: "MANDATORY for any non-trivial feature planning. Multi-agent pipeline: Metis (scope/risk) + Oracle (architecture) in parallel → synthesis → OpenSpec proposal → Momus review. MUST USE when: user describes a feature that touches multiple services or modules, user wants to plan/design/architect before coding, user says 'plan this', 'design this', 'think this through', 'spec this out', 'deep design', 'let me get this right', 'before we start coding', 'rethink how X works', 'migrate from X to Y', 'add multi-tenancy/billing/auth/permissions/real-time/encryption/caching', user describes any system that needs architectural decisions, user mentions wanting a proposal or spec, user wants to avoid mistakes on a complex feature. Also triggers on: 'plan out the migration', 'design a system for', 'I want to add [complex feature]... need to think through', 'this is a big change', 'let me get the design reviewed', 'before anyone writes code'. When in doubt about whether to use this skill, USE IT — it's better to over-plan than to start coding a complex feature without a reviewed design."
|
|
4
|
+
compatibility: "OpenCode"
|
|
5
|
+
metadata:
|
|
6
|
+
version: "1.0.0"
|
|
7
|
+
---
|
|
8
|
+
|
|
9
|
+
# Deep Design Pipeline
|
|
10
|
+
|
|
11
|
+
## Overview
|
|
12
|
+
|
|
13
|
+
A 5-phase orchestration pipeline that turns a user's feature idea into a reviewed, implementation-ready OpenSpec proposal. The pipeline ensures nothing gets missed — hidden complexity is surfaced, architecture is validated, and the final proposal is stress-tested by an expert reviewer before a single line of code is written.
|
|
14
|
+
|
|
15
|
+
**Pipeline at a glance:**
|
|
16
|
+
|
|
17
|
+
```
|
|
18
|
+
User describes feature
|
|
19
|
+
│
|
|
20
|
+
▼
|
|
21
|
+
┌───────────────────────────────┐
|
|
22
|
+
│ Phase 1: PARALLEL ANALYSIS │
|
|
23
|
+
│ │
|
|
24
|
+
│ ┌─────────┐ ┌──────────┐ │
|
|
25
|
+
│ │ Metis │ │ Oracle │ │
|
|
26
|
+
│ │ (scope, │ │ (arch, │ │
|
|
27
|
+
│ │ risks, │ │ design, │ │
|
|
28
|
+
│ │ phases) │ │ MVA) │ │
|
|
29
|
+
│ └────┬────┘ └────┬─────┘ │
|
|
30
|
+
│ └──────┬───────┘ │
|
|
31
|
+
└──────────────┼────────────────┘
|
|
32
|
+
▼
|
|
33
|
+
┌──────────────────────────────┐
|
|
34
|
+
│ Phase 2: SYNTHESIS │
|
|
35
|
+
│ Merge insights, resolve │
|
|
36
|
+
│ conflicts, produce refined │
|
|
37
|
+
│ design brief │
|
|
38
|
+
└──────────────┬───────────────┘
|
|
39
|
+
▼
|
|
40
|
+
┌──────────────────────────────┐
|
|
41
|
+
│ Phase 3: OPENSPEC PROPOSAL │
|
|
42
|
+
│ proposal.md, design.md, │
|
|
43
|
+
│ specs/, tasks.md │
|
|
44
|
+
└──────────────┬───────────────┘
|
|
45
|
+
▼
|
|
46
|
+
┌──────────────────────────────┐
|
|
47
|
+
│ Phase 4: MOMUS REVIEW │
|
|
48
|
+
│ Expert critique of the │
|
|
49
|
+
│ proposal — gaps, risks, │
|
|
50
|
+
│ missing scenarios │
|
|
51
|
+
└──────────────┬───────────────┘
|
|
52
|
+
▼
|
|
53
|
+
┌──────────────────────────────┐
|
|
54
|
+
│ Phase 5: DELIVER │
|
|
55
|
+
│ Present proposal + review │
|
|
56
|
+
│ to user for approval │
|
|
57
|
+
└──────────────────────────────┘
|
|
58
|
+
```
|
|
59
|
+
|
|
60
|
+
**Cost note:** This pipeline fires three expensive agents (Metis, Oracle, Momus — all claude-opus-4-6-thinking). It is designed for non-trivial features where getting the design right matters more than speed. Every feature gets the full treatment.
|
|
61
|
+
|
|
62
|
+
---
|
|
63
|
+
|
|
64
|
+
## Input
|
|
65
|
+
|
|
66
|
+
The user provides a feature description. This can range from a single sentence ("add real-time collaboration") to a detailed brief. The skill works with whatever level of detail is given — Metis and Oracle will independently identify what's missing.
|
|
67
|
+
|
|
68
|
+
If the user's description is too vague to act on (e.g., "make it better"), ask ONE clarifying question before starting the pipeline. Otherwise, start immediately.
|
|
69
|
+
|
|
70
|
+
## Phase 1: Parallel Analysis (Metis + Oracle)
|
|
71
|
+
|
|
72
|
+
Fire both agents simultaneously using `run_in_background=true`. They analyze the same feature description independently — this diversity of perspective is the point.
|
|
73
|
+
|
|
74
|
+
### Metis Prompt
|
|
75
|
+
|
|
76
|
+
```
|
|
77
|
+
task(
|
|
78
|
+
subagent_type="metis",
|
|
79
|
+
run_in_background=true,
|
|
80
|
+
load_skills=["nano-brain"],
|
|
81
|
+
description="Deep design: Metis scope/risk analysis for [feature]",
|
|
82
|
+
prompt="""
|
|
83
|
+
CONTEXT: The user wants to build: [paste user's feature description verbatim].
|
|
84
|
+
The codebase is at [project root]. Use nano-brain memory_query to check for
|
|
85
|
+
past decisions or context related to this feature area. If the codebase is not
|
|
86
|
+
accessible at the given path, work with the described tech stack — do not stall
|
|
87
|
+
on codebase discovery.
|
|
88
|
+
|
|
89
|
+
ROLE: You are a pre-planning consultant. Your job is to find what the user
|
|
90
|
+
hasn't thought of yet — the hidden complexities, the scope risks, the things
|
|
91
|
+
that will blow up at 2am if nobody plans for them.
|
|
92
|
+
|
|
93
|
+
ANALYZE AND RETURN:
|
|
94
|
+
|
|
95
|
+
1. HIDDEN COMPLEXITIES
|
|
96
|
+
- What non-obvious technical challenges does this feature involve?
|
|
97
|
+
- What edge cases will bite during implementation?
|
|
98
|
+
- What existing systems will this interact with unexpectedly?
|
|
99
|
+
|
|
100
|
+
2. SCOPE RISKS
|
|
101
|
+
- Where is scope likely to creep?
|
|
102
|
+
- What looks simple but is actually hard?
|
|
103
|
+
- What dependencies exist that could block progress?
|
|
104
|
+
|
|
105
|
+
3. PHASING ADVICE
|
|
106
|
+
- What's the natural decomposition into phases?
|
|
107
|
+
- What should be built first to de-risk the rest?
|
|
108
|
+
- What can be deferred to a v2 without compromising v1?
|
|
109
|
+
|
|
110
|
+
4. MISSING REQUIREMENTS
|
|
111
|
+
- What has the user not mentioned that they'll definitely need?
|
|
112
|
+
- What error handling, edge cases, or failure modes are unaddressed?
|
|
113
|
+
|
|
114
|
+
5. QUESTIONS FOR THE USER
|
|
115
|
+
- What critical decisions need user input before design can proceed?
|
|
116
|
+
- List max 3-5 questions, ranked by impact.
|
|
117
|
+
|
|
118
|
+
FORMAT: Use clear headers and bullet points. Be specific to THIS feature
|
|
119
|
+
in THIS codebase — no generic advice.
|
|
120
|
+
"""
|
|
121
|
+
)
|
|
122
|
+
```
|
|
123
|
+
|
|
124
|
+
### Oracle Prompt
|
|
125
|
+
|
|
126
|
+
```
|
|
127
|
+
task(
|
|
128
|
+
subagent_type="oracle",
|
|
129
|
+
run_in_background=true,
|
|
130
|
+
load_skills=["nano-brain"],
|
|
131
|
+
description="Deep design: Oracle architecture validation for [feature]",
|
|
132
|
+
prompt="""
|
|
133
|
+
CONTEXT: The user wants to build: [paste user's feature description verbatim].
|
|
134
|
+
The codebase is at [project root]. Use nano-brain memory_query and code_context
|
|
135
|
+
to understand existing architecture before making recommendations. If the
|
|
136
|
+
codebase is not accessible at the given path, work with the described tech
|
|
137
|
+
stack — do not stall on codebase discovery.
|
|
138
|
+
|
|
139
|
+
ROLE: You are a senior architect validating the design of this feature.
|
|
140
|
+
Your job is to ensure the architecture is sound, identify the minimum viable
|
|
141
|
+
approach, and answer the hard design questions before code is written.
|
|
142
|
+
|
|
143
|
+
ANALYZE AND RETURN:
|
|
144
|
+
|
|
145
|
+
1. ARCHITECTURE VALIDATION
|
|
146
|
+
- Does this feature fit cleanly into the existing architecture?
|
|
147
|
+
- What architectural patterns should it follow (based on what exists)?
|
|
148
|
+
- Where are the integration points with existing systems?
|
|
149
|
+
- Are there architectural anti-patterns to avoid?
|
|
150
|
+
|
|
151
|
+
2. DESIGN QUESTIONS & ANSWERS
|
|
152
|
+
- What are the key design decisions for this feature?
|
|
153
|
+
- For each decision, recommend an approach with reasoning.
|
|
154
|
+
- Note where multiple valid approaches exist and which you'd pick.
|
|
155
|
+
|
|
156
|
+
3. MINIMUM VIABLE APPROACH (MVA)
|
|
157
|
+
- What is the smallest version of this feature that delivers value?
|
|
158
|
+
- What can be cut from v1 without losing the core value proposition?
|
|
159
|
+
- What technical shortcuts are acceptable vs. which create tech debt?
|
|
160
|
+
|
|
161
|
+
4. SECURITY & PERFORMANCE CONSIDERATIONS
|
|
162
|
+
- Any security implications? (auth, data exposure, injection risks)
|
|
163
|
+
- Any performance concerns? (N+1 queries, memory, concurrency)
|
|
164
|
+
- Any data integrity risks?
|
|
165
|
+
|
|
166
|
+
5. TECHNOLOGY RECOMMENDATIONS
|
|
167
|
+
- Should this use existing libraries/tools or introduce new ones?
|
|
168
|
+
- Are there proven patterns in the codebase to reuse?
|
|
169
|
+
|
|
170
|
+
FORMAT: Use clear headers and bullet points. Be specific to THIS feature
|
|
171
|
+
in THIS codebase. Recommend concrete approaches, not abstract principles.
|
|
172
|
+
"""
|
|
173
|
+
)
|
|
174
|
+
```
|
|
175
|
+
|
|
176
|
+
**After firing both:** Continue to Phase 2 when both complete. Do NOT proceed until you have both results — end your response and wait for the `<system-reminder>` notifications if needed.
|
|
177
|
+
|
|
178
|
+
## Phase 2: Synthesis
|
|
179
|
+
|
|
180
|
+
This phase is performed by you (the orchestrator), not a subagent. You have both Metis and Oracle results. Your job is to merge them into a single coherent design brief.
|
|
181
|
+
|
|
182
|
+
### How to Synthesize
|
|
183
|
+
|
|
184
|
+
1. **Identify agreements** — Where Metis and Oracle align, that's high-confidence. Note these as settled decisions.
|
|
185
|
+
|
|
186
|
+
2. **Resolve conflicts** — Where they disagree, use these heuristics:
|
|
187
|
+
- **Architecture/technology choices** → Prefer Oracle (it's the architect)
|
|
188
|
+
- **Scope risks and hidden complexity** → Prefer Metis (it's the risk analyst)
|
|
189
|
+
- **Timeline/phasing** → Prefer Metis's caution over Oracle's optimism
|
|
190
|
+
- **Security concerns** → Prefer whichever is MORE conservative
|
|
191
|
+
- **If genuinely unclear** → Flag as open question for the user
|
|
192
|
+
- **Document every conflict resolution** in a table (Topic / Metis Said / Oracle Said / Resolution) so the user can override your judgment
|
|
193
|
+
|
|
194
|
+
3. **Merge phasing + MVA** — Combine Metis's phasing advice with Oracle's MVA recommendation into a single implementation roadmap.
|
|
195
|
+
|
|
196
|
+
4. **Consolidate questions** — Deduplicate questions from both agents. If Metis and Oracle both flagged the same uncertainty, that's a critical question.
|
|
197
|
+
|
|
198
|
+
5. **Produce a Design Brief** — Write a structured summary (not a file yet — this feeds Phase 3):
|
|
199
|
+
|
|
200
|
+
```markdown
|
|
201
|
+
## Design Brief: [Feature Name]
|
|
202
|
+
|
|
203
|
+
### Settled Decisions
|
|
204
|
+
- [Decision 1]: [Approach] (agreed by both Metis and Oracle)
|
|
205
|
+
- [Decision 2]: ...
|
|
206
|
+
|
|
207
|
+
### Architecture Approach
|
|
208
|
+
[Oracle's recommended architecture, validated against Metis's complexity analysis]
|
|
209
|
+
|
|
210
|
+
### Implementation Phases
|
|
211
|
+
- **Phase 1 (MVP):** [What to build first — Oracle's MVA + Metis's de-risking order]
|
|
212
|
+
- **Phase 2:** [What comes next]
|
|
213
|
+
- **Phase 3 (if applicable):** [Deferred items]
|
|
214
|
+
|
|
215
|
+
### Key Risks & Mitigations
|
|
216
|
+
- [Risk from Metis] → [Mitigation from Oracle or your judgment]
|
|
217
|
+
- ...
|
|
218
|
+
|
|
219
|
+
### Open Questions for User
|
|
220
|
+
1. [Most impactful question]
|
|
221
|
+
2. ...
|
|
222
|
+
|
|
223
|
+
### Security & Performance Notes
|
|
224
|
+
[From Oracle's analysis]
|
|
225
|
+
```
|
|
226
|
+
|
|
227
|
+
**Present the Design Brief to the user.** Ask them to answer the open questions and confirm the approach before proceeding to Phase 3. Do NOT proceed to OpenSpec without user confirmation.
|
|
228
|
+
|
|
229
|
+
If the user has answers/feedback, incorporate them into the brief before moving on.
|
|
230
|
+
|
|
231
|
+
## Phase 3: OpenSpec Proposal
|
|
232
|
+
|
|
233
|
+
With the user-approved Design Brief in hand, create a formal OpenSpec change. Use the existing OpenSpec workflow — do not reinvent it.
|
|
234
|
+
|
|
235
|
+
### Steps
|
|
236
|
+
|
|
237
|
+
1. **Create the change:**
|
|
238
|
+
```bash
|
|
239
|
+
openspec new change "<feature-name-kebab-case>"
|
|
240
|
+
```
|
|
241
|
+
|
|
242
|
+
2. **Get artifact status and instructions:**
|
|
243
|
+
```bash
|
|
244
|
+
openspec status --change "<name>" --json
|
|
245
|
+
```
|
|
246
|
+
|
|
247
|
+
3. **Create artifacts in dependency order.** For each artifact:
|
|
248
|
+
```bash
|
|
249
|
+
openspec instructions <artifact-id> --change "<name>" --json
|
|
250
|
+
```
|
|
251
|
+
Use the template from instructions, but fill it with content from the Design Brief.
|
|
252
|
+
|
|
253
|
+
4. **Key artifact mapping from Design Brief:**
|
|
254
|
+
|
|
255
|
+
| Design Brief Section | OpenSpec Artifact |
|
|
256
|
+
|---------------------|-------------------|
|
|
257
|
+
| Settled Decisions + Architecture Approach | `design.md` |
|
|
258
|
+
| Implementation Phases | `tasks.md` (with checkboxes) |
|
|
259
|
+
| The "why" + scope | `proposal.md` |
|
|
260
|
+
| Security/Performance + Requirements | `specs/<capability>/spec.md` |
|
|
261
|
+
| Key Risks & Mitigations | `design.md` (Risks section) |
|
|
262
|
+
|
|
263
|
+
5. **Validate the proposal:**
|
|
264
|
+
```bash
|
|
265
|
+
openspec validate "<name>" --strict --no-interactive
|
|
266
|
+
```
|
|
267
|
+
Fix any validation errors before proceeding.
|
|
268
|
+
|
|
269
|
+
### Writing Guidelines
|
|
270
|
+
|
|
271
|
+
- **proposal.md**: Focus on WHY this feature exists and WHAT changes. Pull from the user's original description + Metis's scope analysis.
|
|
272
|
+
- **design.md**: Capture Oracle's architecture recommendations, the settled decisions, and risk mitigations. This is the technical "how."
|
|
273
|
+
- **tasks.md**: Break implementation phases into concrete checkboxed tasks. Use Metis's phasing advice for ordering. Each task should be independently completable.
|
|
274
|
+
- **specs/**: Write formal requirements with scenarios (WHEN/THEN format). Cover the happy path, error cases, and edge cases that Metis identified.
|
|
275
|
+
|
|
276
|
+
After all artifacts are created and validated, proceed to Phase 4.
|
|
277
|
+
|
|
278
|
+
## Phase 4: Momus Review
|
|
279
|
+
|
|
280
|
+
Fire Momus to stress-test the proposal. Momus is an expert reviewer — it will find gaps, ambiguities, and missing scenarios that slipped through.
|
|
281
|
+
|
|
282
|
+
### Momus Prompt
|
|
283
|
+
|
|
284
|
+
```
|
|
285
|
+
task(
|
|
286
|
+
subagent_type="momus",
|
|
287
|
+
load_skills=["nano-brain"],
|
|
288
|
+
description="Deep design: Momus review of [feature] proposal",
|
|
289
|
+
prompt="""
|
|
290
|
+
CONTEXT: We've completed a multi-agent planning pipeline for a new feature.
|
|
291
|
+
The OpenSpec proposal is at: openspec/changes/<name>/
|
|
292
|
+
|
|
293
|
+
ARTIFACTS TO REVIEW:
|
|
294
|
+
- proposal.md: [paste path]
|
|
295
|
+
- design.md: [paste path]
|
|
296
|
+
- tasks.md: [paste path]
|
|
297
|
+
- specs/: [paste path(s)]
|
|
298
|
+
|
|
299
|
+
Read ALL artifacts before reviewing.
|
|
300
|
+
|
|
301
|
+
ROLE: You are an expert reviewer evaluating this proposal for implementation
|
|
302
|
+
readiness. Your job is to find what's missing, what's ambiguous, and what
|
|
303
|
+
will cause problems during implementation.
|
|
304
|
+
|
|
305
|
+
REVIEW CRITERIA:
|
|
306
|
+
|
|
307
|
+
1. COMPLETENESS
|
|
308
|
+
- Are all requirements covered by specs with scenarios?
|
|
309
|
+
- Are error cases and edge cases addressed?
|
|
310
|
+
- Are there implicit assumptions that should be explicit?
|
|
311
|
+
- Is anything mentioned in the proposal but missing from tasks?
|
|
312
|
+
|
|
313
|
+
2. CLARITY
|
|
314
|
+
- Can a developer pick up tasks.md and start working without asking questions?
|
|
315
|
+
- Are design decisions in design.md clear and well-reasoned?
|
|
316
|
+
- Are spec scenarios specific enough to be testable?
|
|
317
|
+
|
|
318
|
+
3. VERIFIABILITY
|
|
319
|
+
- Can each requirement be verified (tested/checked)?
|
|
320
|
+
- Are acceptance criteria clear for each task?
|
|
321
|
+
- Are there measurable success criteria?
|
|
322
|
+
|
|
323
|
+
4. RISKS & GAPS
|
|
324
|
+
- What failure modes are unaddressed?
|
|
325
|
+
- What happens if a dependency is unavailable?
|
|
326
|
+
- Are there race conditions, data consistency issues, or security gaps?
|
|
327
|
+
- Is the task ordering correct? Are there hidden dependencies between tasks?
|
|
328
|
+
|
|
329
|
+
5. SCOPE ASSESSMENT
|
|
330
|
+
- Is the scope appropriate for the stated goals?
|
|
331
|
+
- Is anything over-engineered for v1?
|
|
332
|
+
- Is anything under-specified that will cause scope creep?
|
|
333
|
+
|
|
334
|
+
OUTPUT FORMAT:
|
|
335
|
+
|
|
336
|
+
## Review Summary
|
|
337
|
+
[1-2 sentence overall assessment: ready / needs work / major concerns]
|
|
338
|
+
|
|
339
|
+
## Critical Issues (must fix before implementation)
|
|
340
|
+
- [Issue]: [Why it matters] → [Suggested fix]
|
|
341
|
+
|
|
342
|
+
## Recommendations (should fix)
|
|
343
|
+
- [Issue]: [Why it matters] → [Suggested fix]
|
|
344
|
+
|
|
345
|
+
## Minor Notes (nice to have)
|
|
346
|
+
- [Observation]
|
|
347
|
+
|
|
348
|
+
## Verdict
|
|
349
|
+
[APPROVED / APPROVED WITH CONDITIONS / NEEDS REVISION]
|
|
350
|
+
[If needs revision, list the specific items that must be addressed]
|
|
351
|
+
"""
|
|
352
|
+
)
|
|
353
|
+
```
|
|
354
|
+
|
|
355
|
+
**After Momus completes:**
|
|
356
|
+
|
|
357
|
+
- If **APPROVED**: Proceed to Phase 5.
|
|
358
|
+
- If **APPROVED WITH CONDITIONS**: Apply the fixes to the OpenSpec artifacts, then proceed to Phase 5. No need to re-run Momus unless the fixes are substantial.
|
|
359
|
+
- If **NEEDS REVISION**: Apply the critical fixes, re-validate with `openspec validate`, and present the updated proposal to the user. Ask if they want to re-run Momus or proceed.
|
|
360
|
+
|
|
361
|
+
## Phase 5: Deliver to User
|
|
362
|
+
|
|
363
|
+
Present the final result to the user. This is the handoff — they decide what happens next.
|
|
364
|
+
|
|
365
|
+
### What to Present
|
|
366
|
+
|
|
367
|
+
```markdown
|
|
368
|
+
## Deep Design Complete: [Feature Name]
|
|
369
|
+
|
|
370
|
+
### Pipeline Summary
|
|
371
|
+
- ✅ Metis: Identified [N] hidden complexities, [N] scope risks
|
|
372
|
+
- ✅ Oracle: Validated architecture, recommended [approach]
|
|
373
|
+
- ✅ Synthesis: Resolved [N] conflicts, produced design brief
|
|
374
|
+
- ✅ OpenSpec: Created proposal at `openspec/changes/<name>/`
|
|
375
|
+
- ✅ Momus: [APPROVED / APPROVED WITH CONDITIONS]
|
|
376
|
+
|
|
377
|
+
### Proposal Location
|
|
378
|
+
`openspec/changes/<name>/`
|
|
379
|
+
- `proposal.md` — Why and what
|
|
380
|
+
- `design.md` — Architecture and decisions
|
|
381
|
+
- `tasks.md` — Implementation checklist ([N] tasks across [N] phases)
|
|
382
|
+
- `specs/` — Formal requirements with scenarios
|
|
383
|
+
|
|
384
|
+
### Momus Review Highlights
|
|
385
|
+
[Top 2-3 findings from Momus, if any]
|
|
386
|
+
|
|
387
|
+
### Next Steps
|
|
388
|
+
- **To implement:** `/opsx-apply <name>` or ask me to start implementation
|
|
389
|
+
- **To modify:** Edit any artifact directly or ask me to adjust
|
|
390
|
+
- **To explore further:** `/opsx-explore <name>` to think through specific aspects
|
|
391
|
+
```
|
|
392
|
+
|
|
393
|
+
---
|
|
394
|
+
|
|
395
|
+
## Guardrails
|
|
396
|
+
|
|
397
|
+
- **Never skip a phase.** Every feature gets the full pipeline.
|
|
398
|
+
- **Never proceed past Phase 2 without user confirmation.** The Design Brief is a checkpoint.
|
|
399
|
+
- **Never auto-implement.** This skill produces a reviewed proposal — implementation is a separate decision.
|
|
400
|
+
- **Always validate OpenSpec artifacts** before running Momus. Don't waste an expensive review on invalid specs.
|
|
401
|
+
- **Always use `load_skills=["nano-brain"]`** when firing Metis, Oracle, and Momus so they can access project memory and code intelligence.
|
|
402
|
+
- **Always collect all background results** before synthesizing. Never synthesize with partial data.
|
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
{
|
|
2
|
+
"skill_name": "deep-design",
|
|
3
|
+
"evals": [
|
|
4
|
+
{
|
|
5
|
+
"id": 1,
|
|
6
|
+
"prompt": "I want to add real-time notifications to our app. Users should get notified when someone comments on their post, when they get a new follower, and when there's a system announcement. We're using a NestJS backend with PostgreSQL and a React frontend.",
|
|
7
|
+
"expected_output": "Full deep-design pipeline execution: Metis + Oracle fired in parallel, synthesis produces design brief with user checkpoint, OpenSpec proposal created with all artifacts, Momus review completed, final delivery with next steps.",
|
|
8
|
+
"files": []
|
|
9
|
+
},
|
|
10
|
+
{
|
|
11
|
+
"id": 2,
|
|
12
|
+
"prompt": "We need to migrate our authentication from session-based to JWT tokens. The app currently uses express-session with Redis store. About 50k daily active users. Can't have any downtime during migration.",
|
|
13
|
+
"expected_output": "Full deep-design pipeline execution with emphasis on: Metis identifying migration risks and zero-downtime phasing, Oracle recommending JWT architecture and security considerations, synthesis resolving migration strategy, OpenSpec proposal with phased tasks, Momus reviewing for migration gaps.",
|
|
14
|
+
"files": []
|
|
15
|
+
},
|
|
16
|
+
{
|
|
17
|
+
"id": 3,
|
|
18
|
+
"prompt": "Plan a multi-tenant billing system. Each tenant has their own subscription plan, usage metering, and invoice generation. We need Stripe integration. Some tenants are on custom enterprise deals with negotiated rates.",
|
|
19
|
+
"expected_output": "Full deep-design pipeline execution with emphasis on: Metis surfacing hidden complexity around custom enterprise pricing and usage metering edge cases, Oracle validating Stripe integration architecture and data model, synthesis producing comprehensive design brief, OpenSpec with detailed specs covering billing scenarios, Momus catching financial edge cases.",
|
|
20
|
+
"files": []
|
|
21
|
+
}
|
|
22
|
+
]
|
|
23
|
+
}
|