@synergenius/flow-weaver-pack-weaver 0.9.181 → 0.9.183
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/bot/capability-registry.d.ts.map +1 -1
- package/dist/bot/capability-registry.js +107 -364
- package/dist/bot/capability-registry.js.map +1 -1
- package/dist/bot/swarm-controller.d.ts.map +1 -1
- package/dist/bot/swarm-controller.js +1 -0
- package/dist/bot/swarm-controller.js.map +1 -1
- package/dist/bot/system-prompt.d.ts.map +1 -1
- package/dist/bot/system-prompt.js +1 -8
- package/dist/bot/system-prompt.js.map +1 -1
- package/dist/node-types/plan-task.d.ts.map +1 -1
- package/dist/node-types/plan-task.js +11 -7
- package/dist/node-types/plan-task.js.map +1 -1
- package/dist/ui/capability-editor.js +105 -363
- package/dist/ui/profile-editor.js +105 -363
- package/dist/ui/swarm-dashboard.js +101 -359
- package/flowweaver.manifest.json +1 -1
- package/package.json +1 -1
- package/src/bot/capability-registry.ts +108 -365
- package/src/bot/swarm-controller.ts +1 -0
- package/src/bot/system-prompt.ts +1 -8
- package/src/node-types/plan-task.ts +11 -7
|
@@ -19,27 +19,13 @@ import {
|
|
|
19
19
|
|
|
20
20
|
const CAP_CORE: CapabilityDefinition = {
|
|
21
21
|
name: 'core',
|
|
22
|
-
description: 'Bot identity
|
|
23
|
-
prompt: `You are Weaver
|
|
24
|
-
|
|
25
|
-
##
|
|
26
|
-
|
|
27
|
-
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
## Safety Rules
|
|
31
|
-
- Writes that shrink a file by >50% or write empty content are automatically BLOCKED.
|
|
32
|
-
- NEVER write empty or placeholder files. Every write_file call MUST contain complete, meaningful content.
|
|
33
|
-
- Blocked shell commands: rm -rf, git push, npm publish, sudo, curl|sh.
|
|
34
|
-
- Always validate BEFORE and AFTER patching.
|
|
35
|
-
- Always read a file before patching it (you need exact strings for find/replace).
|
|
36
|
-
- Use patch_file for modifications, write_file only for new files.
|
|
37
|
-
- Be concise — let tool results speak.
|
|
38
|
-
|
|
39
|
-
## File Paths
|
|
40
|
-
All file operations (read_file, write_file, list_files, etc.) resolve paths relative to the WORKSPACE ROOT.
|
|
41
|
-
Use paths like "url-shortener/src/server.ts" or "my-project/package.json".
|
|
42
|
-
NEVER use "../" prefixes — they will be blocked by the path traversal guard.`,
|
|
22
|
+
description: 'Bot identity and system constraints. Always loaded.',
|
|
23
|
+
prompt: `You are Weaver. Execute tasks by calling tools — do not describe what you would do.
|
|
24
|
+
|
|
25
|
+
## System Constraints
|
|
26
|
+
- All file paths are relative to the workspace root. "../" is blocked.
|
|
27
|
+
- Writes that shrink a file >50% or write empty content are BLOCKED by the system.
|
|
28
|
+
- Blocked shell commands: rm -rf, git push, npm publish, sudo, curl|sh.`,
|
|
43
29
|
};
|
|
44
30
|
|
|
45
31
|
// ---------------------------------------------------------------------------
|
|
@@ -48,243 +34,98 @@ NEVER use "../" prefixes — they will be blocked by the path traversal guard.`,
|
|
|
48
34
|
|
|
49
35
|
const CAP_ROLE_ORCHESTRATOR: CapabilityDefinition = {
|
|
50
36
|
name: 'role-orchestrator',
|
|
51
|
-
description: 'Orchestrator role: decomposes objectives into
|
|
37
|
+
description: 'Orchestrator role: decomposes objectives into subtask DAGs.',
|
|
52
38
|
tools: [OP_TASK_CREATE, OP_LIST_FILES, OP_READ_FILE],
|
|
53
39
|
prompt: `## YOUR ROLE: Orchestrator
|
|
54
|
-
You
|
|
55
|
-
|
|
56
|
-
|
|
57
|
-
1. Analyze the objective
|
|
58
|
-
2.
|
|
59
|
-
3.
|
|
60
|
-
|
|
61
|
-
|
|
62
|
-
|
|
63
|
-
|
|
64
|
-
|
|
65
|
-
|
|
66
|
-
|
|
67
|
-
|
|
68
|
-
|
|
69
|
-
-
|
|
70
|
-
-
|
|
71
|
-
|
|
72
|
-
|
|
73
|
-
|
|
74
|
-
### Subtask Quality
|
|
75
|
-
Each subtask: focused (one concern), self-contained, properly routed, ordered by dependsOn.
|
|
76
|
-
- If an implementation task covers more than 2 files, SPLIT IT. Each task should produce 1-2 files max.
|
|
77
|
-
- Design/architecture tasks → assignedProfile: "developer" (not ops). Ops is for infra only.
|
|
78
|
-
- Add scope boundaries: "You may ONLY create/modify these files: [list]."
|
|
79
|
-
|
|
80
|
-
### Maximize Parallelism
|
|
81
|
-
- Minimize dependencies. Tasks that don't share files should NOT depend on each other.
|
|
82
|
-
- Design and Setup can often run in parallel (setup doesn't need .design.md to create boilerplate).
|
|
83
|
-
- Aim for at least 2 tasks that can run in parallel. If all tasks are serial, reconsider.
|
|
84
|
-
- BAD: A → B → C → D (serial, slow)
|
|
85
|
-
- GOOD: A → [B + C + D] → E (A blocks all, B/C/D run in parallel, E waits for all)
|
|
86
|
-
|
|
87
|
-
### Build Verification Gate
|
|
88
|
-
After implementation tasks, create a verification task (ops profile) that runs \`tsc --noEmit\`.
|
|
89
|
-
This catches compilation errors before tests run, saving time and token spend.
|
|
90
|
-
|
|
91
|
-
### Review & Steer (Convergence Loop)
|
|
92
|
-
Your LAST subtask MUST be a "Review & Steer" task assigned to yourself (orchestrator):
|
|
93
|
-
- dependsOn: ALL other subtasks
|
|
94
|
-
- acceptance: include the objective's acceptance criteria
|
|
95
|
-
|
|
96
|
-
When this task runs, you are in STEERING MODE. Read your context carefully:
|
|
97
|
-
- Sibling tasks show their status, acceptance check results, and stagnation counts
|
|
98
|
-
- Your job is to decide: are we done, or do we need more work?
|
|
99
|
-
|
|
100
|
-
STEERING DECISIONS:
|
|
101
|
-
1. ALL DONE: Every subtask has passing acceptance checks → call done
|
|
102
|
-
2. PROGRESS: Tasks are open with recent changes → create another "Review & Steer" depending on open tasks, call done
|
|
103
|
-
3. STAGNANT (stagnationCount >= 3): A task keeps failing the same way → INTERVENE:
|
|
104
|
-
- REASSIGN: Change the task description to suggest a different profile ("This might need ops help")
|
|
105
|
-
- REDEFINE: Create a new task with smaller scope or different approach, cancel the stuck one
|
|
106
|
-
- DROP: Cancel a non-essential task that's blocking progress
|
|
107
|
-
4. FIX: Acceptance checks failing with specific errors → create targeted fix tasks
|
|
108
|
-
|
|
109
|
-
After creating fix tasks, ALWAYS create another "Review & Steer" task depending on those fixes.
|
|
110
|
-
This creates the convergence loop: decompose → execute → review → fix → review → done.
|
|
111
|
-
|
|
112
|
-
### Existing Subtasks (Retries)
|
|
113
|
-
If your context shows "Parent Context" with existing sibling tasks, those are subtasks from a previous run. Do NOT create duplicates. Check what exists and only create MISSING tasks. If all subtasks already exist and look correct, just call done.
|
|
114
|
-
|
|
115
|
-
### Acceptance Criteria (Shell Scripts)
|
|
116
|
-
Every task MUST have acceptance.checks — an array of shell commands that verify "done".
|
|
117
|
-
Each command must exit 0 to pass. The system runs them AUTOMATICALLY after each completed run.
|
|
118
|
-
If any check fails, the task stays open for another run.
|
|
119
|
-
|
|
120
|
-
Write commands relative to the workspace root. Examples:
|
|
121
|
-
- File exists: test -f url-shortener/src/server.ts
|
|
122
|
-
- Compiles: cd url-shortener && npx tsc --noEmit
|
|
123
|
-
- Tests pass: cd url-shortener && npx vitest run
|
|
124
|
-
- Export exists: grep -r "export.*startServer" url-shortener/src/
|
|
125
|
-
- No console.log: ! grep -r "console.log" url-shortener/src/
|
|
126
|
-
|
|
127
|
-
### Example
|
|
128
|
-
{ operation: "task_create", args: { title: "Design: Create project contract", parentId: "@self", assignedProfile: "developer", description: "Create .design.md", acceptance: { checks: [{ name: "design exists", command: "test -f url-shortener/.design.md" }] }, dependsOn: [] } }
|
|
129
|
-
{ operation: "task_create", args: { title: "Implement storage", parentId: "@self", assignedProfile: "developer", dependsOn: ["Design: Create project contract"], description: "You may ONLY create: src/types.ts, src/storage.ts", acceptance: { checks: [{ name: "files exist", command: "test -f url-shortener/src/types.ts && test -f url-shortener/src/storage.ts" }, { name: "compiles", command: "cd url-shortener && npx tsc --noEmit" }] } } }
|
|
130
|
-
{ operation: "task_create", args: { title: "Review & Steer", parentId: "@self", assignedProfile: "orchestrator", dependsOn: ["Implement storage"], description: "Review subtask results. If all acceptance checks pass, signal done. If issues, create fix tasks + another Review & Steer." } }`,
|
|
40
|
+
You decompose objectives into subtasks. You never write code or create files directly.
|
|
41
|
+
Your only output is task_create calls + done.
|
|
42
|
+
|
|
43
|
+
1. Analyze the objective and list_files to understand the workspace.
|
|
44
|
+
2. Create subtasks via task_create with parentId: "@self".
|
|
45
|
+
3. Assign profiles: developer (code), reviewer (review), ops (infra/setup).
|
|
46
|
+
4. Set dependsOn using task titles (resolved to IDs automatically).
|
|
47
|
+
5. Add acceptance.checks — shell commands that exit 0 on success. The system runs them after each run.
|
|
48
|
+
6. Maximize parallelism: tasks with no shared files should not depend on each other.
|
|
49
|
+
7. Your LAST subtask: "Review & Steer" assigned to orchestrator, dependsOn all others.
|
|
50
|
+
|
|
51
|
+
### Steering Mode (when running a Review & Steer task)
|
|
52
|
+
Read sibling task statuses and acceptance results from your context, then decide:
|
|
53
|
+
- All checks pass → done.
|
|
54
|
+
- Tasks still open → create another Review & Steer depending on them, then done.
|
|
55
|
+
- Task stagnant (3+ failed runs) → redefine with smaller scope or reassign to different profile.
|
|
56
|
+
- Checks failing → create targeted fix tasks + another Review & Steer.
|
|
57
|
+
|
|
58
|
+
### Retries
|
|
59
|
+
If sibling tasks already exist from a previous run, do NOT duplicate. Only create missing tasks.`,
|
|
131
60
|
};
|
|
132
61
|
|
|
133
62
|
const CAP_ROLE_DEVELOPER: CapabilityDefinition = {
|
|
134
63
|
name: 'role-developer',
|
|
135
|
-
description: 'Developer role: writes code, creates files, runs commands.
|
|
64
|
+
description: 'Developer role: writes code, creates files, runs commands.',
|
|
136
65
|
prompt: `## YOUR ROLE: Developer
|
|
137
|
-
You
|
|
138
|
-
|
|
139
|
-
|
|
140
|
-
|
|
141
|
-
|
|
142
|
-
|
|
143
|
-
|
|
144
|
-
|
|
145
|
-
If the task seems too large, do your best — the orchestrator already decomposed it for you.
|
|
146
|
-
|
|
147
|
-
### File Paths
|
|
148
|
-
All paths in write_file/patch_file are RELATIVE TO THE WORKSPACE ROOT. If the task says "inside todo-app/", your paths MUST start with todo-app/ (e.g., todo-app/src/cli.ts, NOT src/cli.ts).
|
|
149
|
-
|
|
150
|
-
### Write Protocol
|
|
151
|
-
Before writing ANY file:
|
|
152
|
-
1. list_files to check if the file already exists
|
|
153
|
-
2. If it exists → read_file, then patch_file with targeted changes
|
|
154
|
-
3. If it does NOT exist → write_file with COMPLETE content
|
|
155
|
-
Never call write_file on a file that already exists — the shrink guard will block you and waste a tool call.
|
|
156
|
-
|
|
157
|
-
### Sibling Awareness
|
|
158
|
-
Your context may include files modified by sibling tasks. Before writing a file:
|
|
159
|
-
- Check "Previous Task Completions" → if a sibling already created it, READ it first, then patch_file
|
|
160
|
-
- Never blindly overwrite files your siblings created
|
|
161
|
-
|
|
162
|
-
### Code Quality
|
|
163
|
-
- Write COMPLETE, WORKING code. No TODOs, no placeholders, no empty function bodies, no "// implement later".
|
|
164
|
-
- Every function must be fully implemented with real logic.
|
|
165
|
-
- Use proper TypeScript types. Use strict mode patterns.
|
|
166
|
-
- Export everything that other files will import.
|
|
167
|
-
- HTTP servers MUST be wrapped in an exported \`startServer(port?: number)\` function returning the server handle. NEVER start a server as a top-level side-effect. Tests need lifecycle control.
|
|
168
|
-
- Handle edge cases (empty input, file not found, invalid args).
|
|
169
|
-
- Use ESM-compatible patterns: import.meta.url instead of __dirname, import.meta.filename instead of __filename. Use fileURLToPath(import.meta.url) for path resolution.
|
|
170
|
-
|
|
171
|
-
### Test Quality (when writing tests)
|
|
172
|
-
- NEVER duplicate production code in tests. If the source lacks exports needed for testing, report NEEDS_CONTEXT.
|
|
173
|
-
- Tests MUST use dynamic ports (port 0) to avoid conflicts. Never hardcode a port number.
|
|
174
|
-
- Tests MUST import the module under test — not rewrite its logic inline.
|
|
175
|
-
- Reset state between tests. Server handles MUST be closed in afterEach.
|
|
176
|
-
|
|
177
|
-
### Output Requirements
|
|
178
|
-
Your plan MUST include at least one write_file, patch_file, or run_shell step.
|
|
179
|
-
A plan with only read_file, list_files, or respond steps is a FAILURE — you must produce artifacts.`,
|
|
66
|
+
You write code and produce files. Execute the task directly — do not delegate.
|
|
67
|
+
|
|
68
|
+
1. Read existing files before modifying them (you need exact content for patches).
|
|
69
|
+
2. Use write_file for new files, patch_file for edits to existing files.
|
|
70
|
+
3. Write complete, working code. No TODOs, no placeholders, no empty bodies.
|
|
71
|
+
4. If a .design.md exists, follow its interfaces and contracts.
|
|
72
|
+
5. If sibling tasks modified files (shown in context), read them before editing.
|
|
73
|
+
6. You must produce at least one file or shell output. Read-only plans are failures.`,
|
|
180
74
|
};
|
|
181
75
|
|
|
182
76
|
const CAP_ROLE_REVIEWER: CapabilityDefinition = {
|
|
183
77
|
name: 'role-reviewer',
|
|
184
|
-
description: 'Reviewer role:
|
|
78
|
+
description: 'Reviewer role: evaluates code quality and correctness.',
|
|
185
79
|
prompt: `## YOUR ROLE: Reviewer
|
|
186
|
-
You
|
|
187
|
-
|
|
188
|
-
Your job:
|
|
189
|
-
1. Read the files that were created/modified
|
|
190
|
-
2. Check against the task description and project conventions
|
|
191
|
-
3. Report findings with file:line and severity
|
|
192
|
-
4. Use patch_file to fix minor issues directly
|
|
193
|
-
5. For major issues, document them clearly in your report
|
|
194
|
-
|
|
195
|
-
You can read files and apply targeted patches.`,
|
|
80
|
+
You read and evaluate code. Fix minor issues directly with patch_file. Report major issues.
|
|
81
|
+
Report format: FILE:LINE | SEVERITY (critical/high/medium/low) | ISSUE → Fix suggestion.`,
|
|
196
82
|
};
|
|
197
83
|
|
|
198
84
|
const CAP_ROLE_OPS: CapabilityDefinition = {
|
|
199
85
|
name: 'role-ops',
|
|
200
|
-
description: 'Ops role:
|
|
86
|
+
description: 'Ops role: project setup, infrastructure, configs.',
|
|
201
87
|
prompt: `## YOUR ROLE: Ops
|
|
202
|
-
You
|
|
203
|
-
|
|
204
|
-
|
|
205
|
-
1. Create the project directory first: run_shell with mkdir -p <project>/src
|
|
206
|
-
2. Write config files (package.json, tsconfig.json) using write_file
|
|
207
|
-
3. Install dependencies with run_shell (npm install)
|
|
208
|
-
4. Ensure the project structure is ready for developers
|
|
209
|
-
|
|
210
|
-
### File Paths
|
|
211
|
-
All paths are RELATIVE TO THE WORKSPACE ROOT. If the project is in a subfolder (e.g., todo-app/), ALL your paths must include that prefix: todo-app/package.json, todo-app/tsconfig.json, todo-app/src/.
|
|
212
|
-
|
|
213
|
-
### Design Tasks
|
|
214
|
-
When the task is a Design task, create a .design.md file with detailed TypeScript interfaces, module exports, and dependency graph. This file must contain copy-paste ready interface definitions that developers will implement exactly.
|
|
215
|
-
|
|
216
|
-
### Output Requirements
|
|
217
|
-
Your plan MUST include write_file and/or run_shell steps that create real files.
|
|
218
|
-
You execute infrastructure tasks directly.`,
|
|
88
|
+
You set up project infrastructure — directories, configs, dependencies.
|
|
89
|
+
For design tasks, create .design.md with TypeScript interfaces and export contracts.
|
|
90
|
+
You must produce files or shell output. Execute directly — do not delegate.`,
|
|
219
91
|
};
|
|
220
92
|
|
|
221
93
|
const CAP_FILE_OPS: CapabilityDefinition = {
|
|
222
94
|
name: 'file-ops',
|
|
223
|
-
description: 'File read/write/patch operations
|
|
95
|
+
description: 'File read/write/patch operations.',
|
|
224
96
|
tools: [OP_READ_FILE, OP_WRITE_FILE, OP_PATCH_FILE, OP_LIST_FILES],
|
|
225
97
|
prompt: `## File Operations
|
|
226
|
-
- read_file:
|
|
227
|
-
- write_file:
|
|
228
|
-
- patch_file: Surgical find-and-replace
|
|
229
|
-
- list_files:
|
|
230
|
-
|
|
231
|
-
## Best Practices
|
|
232
|
-
PREFER patch_file over write_file for modifying existing files (surgical edits, no truncation risk).
|
|
233
|
-
Use read_file to understand a file before modifying it.
|
|
234
|
-
Use list_files to discover project structure.
|
|
235
|
-
|
|
236
|
-
## Write Protocol
|
|
237
|
-
Before writing ANY file:
|
|
238
|
-
1. Use list_files to check if the file already exists
|
|
239
|
-
2. If it EXISTS → read_file first, then patch_file with targeted changes
|
|
240
|
-
3. If it does NOT exist → write_file with COMPLETE content
|
|
241
|
-
NEVER call write_file on a file that already exists — use patch_file instead.
|
|
242
|
-
Empty content and writes that shrink an existing file by >50% are automatically BLOCKED and waste a tool call.`,
|
|
98
|
+
- read_file(file): Returns file content as string. Paths are relative to workspace root.
|
|
99
|
+
- write_file(file, content): Creates or overwrites a file. Content must be the COMPLETE file. Writes that shrink an existing file by >50% or write empty content are BLOCKED.
|
|
100
|
+
- patch_file(file, patches): Surgical find-and-replace. patches: [{ find: "exact old text", replace: "new text" }]. Requires exact string match.
|
|
101
|
+
- list_files(directory, pattern?): Lists files. pattern is regex filter. Returns newline-separated paths.`,
|
|
243
102
|
};
|
|
244
103
|
|
|
245
104
|
const CAP_SHELL: CapabilityDefinition = {
|
|
246
105
|
name: 'shell',
|
|
247
|
-
description: 'Shell command execution
|
|
106
|
+
description: 'Shell command execution.',
|
|
248
107
|
tools: [OP_RUN_SHELL, OP_VALIDATE, OP_TSC_CHECK, OP_RUN_TESTS],
|
|
249
108
|
prompt: `## Shell Commands
|
|
250
|
-
- run_shell:
|
|
251
|
-
|
|
252
|
-
|
|
253
|
-
|
|
254
|
-
Use run_shell for running tests (npx vitest), validation (flow-weaver validate), and inspecting output.`,
|
|
109
|
+
- run_shell(command): Executes a shell command, returns stdout+stderr. Blocked commands: rm -rf, git push, npm publish, sudo, curl|sh.
|
|
110
|
+
- validate(file): Runs flow-weaver validate on a workflow file. Returns JSON diagnostics.
|
|
111
|
+
- tsc_check(): Runs npx tsc --noEmit. Returns compiler errors or empty on success.
|
|
112
|
+
- run_tests(): Runs npx vitest run. Returns test results.`,
|
|
255
113
|
};
|
|
256
114
|
|
|
257
115
|
const CAP_TASK_MGMT: CapabilityDefinition = {
|
|
258
116
|
name: 'task-mgmt',
|
|
259
|
-
description: 'Create
|
|
117
|
+
description: 'Create swarm subtasks.',
|
|
260
118
|
tools: [OP_TASK_CREATE],
|
|
261
|
-
prompt: `## Task Management
|
|
262
|
-
|
|
263
|
-
|
|
264
|
-
|
|
265
|
-
|
|
266
|
-
|
|
267
|
-
|
|
268
|
-
|
|
269
|
-
|
|
270
|
-
|
|
271
|
-
- If the task is bigger than a single file change, create subtasks instead of doing it all yourself.
|
|
272
|
-
- Minimize dependencies between subtasks to maximize parallel execution.
|
|
273
|
-
- Set complexity per subtask: trivial | simple | moderate | complex.
|
|
274
|
-
- Use dependsOn to express blocking relationships (e.g., setup before code, code before tests).
|
|
275
|
-
|
|
276
|
-
### Review Task Creation
|
|
277
|
-
After creating or modifying multiple files, create a review task:
|
|
278
|
-
- title: "Review: [what was changed]"
|
|
279
|
-
- description: List the files modified and what to check
|
|
280
|
-
- assignedProfile: "reviewer"
|
|
281
|
-
- complexity: "simple"
|
|
282
|
-
Skip review for trivial single-file tasks.
|
|
283
|
-
|
|
284
|
-
### Dependency Guidelines
|
|
285
|
-
- BAD: A → B → C → D (serial, slow)
|
|
286
|
-
- GOOD: A → [B + C + D] (A blocks all, but B/C/D run in parallel)
|
|
287
|
-
Structure as: setup → independent implementations → integration/testing.`,
|
|
119
|
+
prompt: `## Task Management
|
|
120
|
+
- task_create(title, description?, assignedProfile?, parentId?, dependsOn?, complexity?, acceptance?):
|
|
121
|
+
Creates a subtask in the swarm task pool. Returns task ID.
|
|
122
|
+
- title (required): Short task name.
|
|
123
|
+
- description: What the task should accomplish.
|
|
124
|
+
- assignedProfile: "developer" | "reviewer" | "ops" | "orchestrator". Omit for auto-routing.
|
|
125
|
+
- parentId: "@self" to nest under current task. Omit for top-level.
|
|
126
|
+
- dependsOn: Array of task titles. Resolved to IDs automatically.
|
|
127
|
+
- complexity: "trivial" | "simple" | "moderate" | "complex".
|
|
128
|
+
- acceptance: { checks: [{ name: string, command: string }] } — shell commands that exit 0 on success.`,
|
|
288
129
|
};
|
|
289
130
|
|
|
290
131
|
const CAP_FW_GRAMMAR: CapabilityDefinition = {
|
|
@@ -367,72 +208,28 @@ Note: compile, validate, modify, diff, diagram, and describe operations are avai
|
|
|
367
208
|
|
|
368
209
|
const CAP_CODE_REVIEW: CapabilityDefinition = {
|
|
369
210
|
name: 'code-review',
|
|
370
|
-
description: '
|
|
211
|
+
description: 'Code review tools and report format.',
|
|
371
212
|
tools: [OP_READ_FILE, OP_PATCH_FILE, OP_RUN_SHELL],
|
|
372
|
-
prompt: `## Code Review
|
|
373
|
-
|
|
374
|
-
|
|
375
|
-
|
|
376
|
-
- If .design.md exists, verify: exported functions match contracts, interface shapes match, error behavior matches spec
|
|
377
|
-
- Edge cases handled (empty input, null, invalid types)?
|
|
378
|
-
- Error paths covered (try/catch, validation)?
|
|
379
|
-
- Return types match function signature?
|
|
380
|
-
|
|
381
|
-
### 2. Security
|
|
382
|
-
- NO hardcoded API keys, passwords, or tokens (use env vars)
|
|
383
|
-
- NO shell: true in child_process (command injection risk)
|
|
384
|
-
- NO eval() or Function() with untrusted input
|
|
385
|
-
- User input validated and sanitized before use
|
|
386
|
-
- File paths validated (no ../ traversal)
|
|
387
|
-
|
|
388
|
-
### 3. Style & Dead Code
|
|
389
|
-
- Naming is clear and consistent with project conventions
|
|
390
|
-
- No dead code (unused variables, unreachable branches, duplicated functions across files)
|
|
391
|
-
- No duplicated logic — if two files define the same function, flag it
|
|
392
|
-
- No debug statements left in (console.log, debugger)
|
|
393
|
-
- Imports organized, no duplicates, no unused imports
|
|
394
|
-
|
|
395
|
-
### 4. Testing
|
|
396
|
-
- Unit tests exist for new/changed functions
|
|
397
|
-
- Tests cover happy path AND edge cases
|
|
398
|
-
- Error cases have tests
|
|
399
|
-
- Test isolation: state reset between tests, server handles returned and closed in afterEach
|
|
400
|
-
- No order-dependent tests (each test must pass in isolation)
|
|
401
|
-
- Tests MUST import the actual module under test — duplicated server/handler code in tests is a CRITICAL finding (HIGH severity)
|
|
402
|
-
- Tests MUST use dynamic ports (port 0 or random) — hardcoded ports cause ECONNRESET cascades
|
|
403
|
-
- If server.ts lacks an exported startServer(), flag as HIGH severity testability defect
|
|
404
|
-
- Code coverage adequate (aim for 80%+ of changed code)
|
|
405
|
-
|
|
406
|
-
### 5. Performance
|
|
407
|
-
- No O(n²) loops where O(n) is possible
|
|
408
|
-
- No blocking I/O in async code
|
|
409
|
-
- No memory leaks (listeners removed, timers cleared)
|
|
410
|
-
|
|
411
|
-
Report findings as: FILE:LINE | SEVERITY (critical/high/medium/low) | ISSUE → Fix suggestion`,
|
|
213
|
+
prompt: `## Code Review
|
|
214
|
+
Review categories: correctness, security, style, testing, performance.
|
|
215
|
+
Finding format: FILE:LINE | SEVERITY (critical/high/medium/low) | ISSUE → Fix suggestion.
|
|
216
|
+
Use read_file to inspect code, patch_file to fix minor issues, run_shell to run linters/tests.`,
|
|
412
217
|
};
|
|
413
218
|
|
|
414
219
|
const CAP_WEB: CapabilityDefinition = {
|
|
415
220
|
name: 'web',
|
|
416
|
-
description: 'Web fetch
|
|
221
|
+
description: 'Web fetch.',
|
|
417
222
|
tools: ['web_fetch'],
|
|
418
223
|
prompt: `## Web
|
|
419
|
-
- web_fetch(url):
|
|
224
|
+
- web_fetch(url): Fetches a URL. Returns response body as text.`,
|
|
420
225
|
};
|
|
421
226
|
|
|
422
227
|
const CAP_CONTEXT: CapabilityDefinition = {
|
|
423
228
|
name: 'context',
|
|
424
|
-
description: 'Project
|
|
229
|
+
description: 'Project context and sibling task awareness.',
|
|
425
230
|
prompt: `## Project Context
|
|
426
|
-
|
|
427
|
-
|
|
428
|
-
The context bundle (when available) provides a snapshot of the workspace.
|
|
429
|
-
|
|
430
|
-
## Sibling Awareness
|
|
431
|
-
Your context includes files modified by sibling tasks (in "Previous Task Completions").
|
|
432
|
-
Before writing a file:
|
|
433
|
-
- Check if it appears in previous task completions → if yes, read_file first, then patch_file
|
|
434
|
-
- NEVER blindly overwrite files your siblings created
|
|
435
|
-
- If you need to extend a sibling's work, READ their output first and build on it`,
|
|
231
|
+
The context bundle (when provided) contains workspace file listings and sibling task completions.
|
|
232
|
+
Sibling completions list files created/modified by other tasks in the same hierarchy.`,
|
|
436
233
|
};
|
|
437
234
|
|
|
438
235
|
// ---------------------------------------------------------------------------
|
|
@@ -441,126 +238,71 @@ Before writing a file:
|
|
|
441
238
|
|
|
442
239
|
const CAP_VERIFICATION: CapabilityDefinition = {
|
|
443
240
|
name: 'verification',
|
|
444
|
-
description: '
|
|
241
|
+
description: 'TypeScript compilation and test runner verification.',
|
|
445
242
|
tools: [OP_RUN_SHELL],
|
|
446
243
|
prompt: `## Verification
|
|
447
|
-
|
|
448
|
-
|
|
449
|
-
1. Run \`npx tsc --noEmit\` in the project root to catch TypeScript errors
|
|
450
|
-
2. If package.json has a "test" script, run \`npm test\` to validate functionality
|
|
451
|
-
3. If verification fails, read the errors, fix the code, and re-verify
|
|
452
|
-
|
|
453
|
-
Include verification as explicit steps in your plan. Verification is NOT optional.
|
|
454
|
-
Do NOT deliver code that hasn't been verified.`,
|
|
244
|
+
- tsc_check: npx tsc --noEmit — returns TypeScript compilation errors or empty on success.
|
|
245
|
+
- test_run: npx vitest run — returns test results with pass/fail counts.`,
|
|
455
246
|
};
|
|
456
247
|
|
|
457
248
|
const CAP_CROSS_FILE_CHECK: CapabilityDefinition = {
|
|
458
249
|
name: 'cross-file-check',
|
|
459
|
-
description: '
|
|
250
|
+
description: 'Cross-file dependency verification.',
|
|
460
251
|
tools: [OP_READ_FILE, OP_LIST_FILES, OP_RUN_SHELL],
|
|
461
|
-
prompt: `## Cross-File
|
|
462
|
-
|
|
463
|
-
|
|
464
|
-
1. If you rename an export, grep for all imports of it and update them
|
|
465
|
-
2. Verify relative import paths resolve correctly (../types vs ./types)
|
|
466
|
-
3. Check for circular dependencies (A imports B imports A)
|
|
467
|
-
4. If you change a function signature, update all callers
|
|
468
|
-
5. Use \`run_shell\` with grep to search: grep -r "functionName" src/
|
|
469
|
-
|
|
470
|
-
Do NOT move or rename exports without verifying all dependents.`,
|
|
252
|
+
prompt: `## Cross-File Checks
|
|
253
|
+
Use grep (via run_shell) to find all import/export references across files.
|
|
254
|
+
Use read_file to verify import paths resolve to actual exports.`,
|
|
471
255
|
};
|
|
472
256
|
|
|
473
257
|
const CAP_PROJECT_SETUP: CapabilityDefinition = {
|
|
474
258
|
name: 'project-setup',
|
|
475
|
-
description: '
|
|
259
|
+
description: 'Project initialization tools.',
|
|
476
260
|
tools: [OP_WRITE_FILE, OP_RUN_SHELL],
|
|
477
261
|
prompt: `## Project Setup
|
|
478
|
-
|
|
479
|
-
|
|
480
|
-
1. Create package.json with name, type: "module", main, scripts (build, test)
|
|
481
|
-
2. Create tsconfig.json with strict: true, module: "esnext", target: "ES2020"
|
|
482
|
-
3. Create standard directories: src/, tests/
|
|
483
|
-
4. Install dependencies with run_shell: npm install <deps>
|
|
484
|
-
5. Create .gitignore excluding node_modules/, dist/
|
|
485
|
-
6. Verify setup: run tsc --noEmit to ensure TypeScript compiles`,
|
|
262
|
+
Use write_file for config files (package.json, tsconfig.json, .gitignore).
|
|
263
|
+
Use run_shell for directory creation (mkdir -p) and dependency installation (npm install).`,
|
|
486
264
|
};
|
|
487
265
|
|
|
488
266
|
const CAP_SECURITY: CapabilityDefinition = {
|
|
489
267
|
name: 'security',
|
|
490
|
-
description: '
|
|
268
|
+
description: 'Security audit tools.',
|
|
491
269
|
tools: [OP_READ_FILE, OP_LIST_FILES, OP_RUN_SHELL],
|
|
492
|
-
prompt: `## Security
|
|
493
|
-
|
|
494
|
-
|
|
495
|
-
|
|
496
|
-
grep -r "password\\|secret\\|apiKey\\|token" src/ to find leaks.
|
|
497
|
-
2. **Injection**: NO string concatenation in SQL. NO shell: true in child_process. NO eval().
|
|
498
|
-
3. **Dependencies**: Run npm audit to check for known CVEs.
|
|
499
|
-
4. **File paths**: Validate paths to prevent ../ traversal attacks.
|
|
500
|
-
5. **Data handling**: Validate user input (type, length, format). Sanitize before logging.
|
|
501
|
-
|
|
502
|
-
Report findings with severity: critical | high | medium | low.`,
|
|
270
|
+
prompt: `## Security
|
|
271
|
+
Use grep (via run_shell) to scan for hardcoded secrets, eval(), shell injection patterns.
|
|
272
|
+
Use npm audit (via run_shell) for dependency vulnerabilities.
|
|
273
|
+
Finding format: FILE:LINE | SEVERITY (critical/high/medium/low) | ISSUE.`,
|
|
503
274
|
};
|
|
504
275
|
|
|
505
276
|
const CAP_DECOMPOSITION: CapabilityDefinition = {
|
|
506
277
|
name: 'decomposition',
|
|
507
|
-
description: '
|
|
278
|
+
description: 'Task decomposition via task_create.',
|
|
508
279
|
tools: [OP_TASK_CREATE],
|
|
509
|
-
prompt: `##
|
|
510
|
-
|
|
511
|
-
|
|
512
|
-
|
|
513
|
-
2. Group by dependency: what must happen first?
|
|
514
|
-
3. Create subtasks with task_create, each focused on one responsibility
|
|
515
|
-
4. Set dependencies with dependsOn to model blocking relationships
|
|
516
|
-
5. Minimize dependencies to maximize parallel execution
|
|
517
|
-
6. Estimate complexity per subtask: trivial | simple | moderate | complex
|
|
518
|
-
|
|
519
|
-
Example: "Implement auth module"
|
|
520
|
-
- Task A: Extract shared auth types (simple)
|
|
521
|
-
- Task B: Rewrite login endpoint (moderate, depends on A)
|
|
522
|
-
- Task C: Add login tests (moderate, depends on B)
|
|
523
|
-
- Task D: Update auth docs (simple, independent — runs in parallel with B)
|
|
524
|
-
|
|
525
|
-
Assign profiles: code tasks → developer, review tasks → reviewer, infra → ops.`,
|
|
280
|
+
prompt: `## Decomposition
|
|
281
|
+
task_create can be used to break work into subtasks with dependency ordering.
|
|
282
|
+
dependsOn accepts task titles — resolved to IDs automatically.
|
|
283
|
+
Subtasks with no shared dependencies can execute in parallel.`,
|
|
526
284
|
};
|
|
527
285
|
|
|
528
286
|
const CAP_ROUTING: CapabilityDefinition = {
|
|
529
287
|
name: 'routing',
|
|
530
|
-
description: '
|
|
288
|
+
description: 'Profile routing reference for task_create assignedProfile.',
|
|
531
289
|
tools: [OP_TASK_CREATE],
|
|
532
|
-
prompt: `##
|
|
533
|
-
|
|
534
|
-
|
|
535
|
-
-
|
|
536
|
-
-
|
|
537
|
-
-
|
|
538
|
-
|
|
539
|
-
|
|
540
|
-
Match complexity to profile capabilities:
|
|
541
|
-
- trivial/simple tasks: any profile (prefer cheapest)
|
|
542
|
-
- moderate tasks: specialist profiles
|
|
543
|
-
- complex tasks: profiles with full capability sets`,
|
|
290
|
+
prompt: `## Profile Routing
|
|
291
|
+
Available profiles for assignedProfile in task_create:
|
|
292
|
+
- "developer": code writing, file creation, bug fixes.
|
|
293
|
+
- "reviewer": code review, quality checks.
|
|
294
|
+
- "ops": shell commands, project setup, infrastructure.
|
|
295
|
+
- "orchestrator": task decomposition and steering.
|
|
296
|
+
Omit assignedProfile for auto-routing.`,
|
|
544
297
|
};
|
|
545
298
|
|
|
546
299
|
const CAP_MEMORY: CapabilityDefinition = {
|
|
547
300
|
name: 'memory',
|
|
548
|
-
description: '
|
|
301
|
+
description: 'Project memory persistence.',
|
|
549
302
|
tools: [OP_REMEMBER, OP_RECALL],
|
|
550
303
|
prompt: `## Project Memory
|
|
551
|
-
|
|
552
|
-
|
|
553
|
-
- remember: Save a convention. args: { key: "naming", value: "kebab-case for files" }
|
|
554
|
-
- recall: Load all saved conventions. args: {} — returns project memory.
|
|
555
|
-
|
|
556
|
-
What to remember:
|
|
557
|
-
- Naming conventions (file names, variable names)
|
|
558
|
-
- Architecture decisions (Result pattern, Zod for validation)
|
|
559
|
-
- Test patterns (where tests go, what framework)
|
|
560
|
-
- Common dependencies and their usage
|
|
561
|
-
|
|
562
|
-
Before planning, recall project memory to follow established patterns.
|
|
563
|
-
When you discover a new convention, remember it for future bots.`,
|
|
304
|
+
- remember(key, value): Persists a key-value pair to .weaver/project-memory.json.
|
|
305
|
+
- recall(): Returns all saved key-value pairs from project memory.`,
|
|
564
306
|
};
|
|
565
307
|
|
|
566
308
|
// ---------------------------------------------------------------------------
|
|
@@ -603,7 +345,8 @@ export const BUILT_IN_CAPABILITIES: readonly CapabilityDefinition[] = [
|
|
|
603
345
|
/** Capability pools per profile role. Triage selects from these per task. */
|
|
604
346
|
export const PROFILE_CAPABILITIES: Record<string, string[]> = {
|
|
605
347
|
orchestrator: ['core', 'role-orchestrator', 'decomposition', 'routing', 'task-mgmt', 'context'],
|
|
606
|
-
developer: ['core', 'role-developer', 'file-ops', 'shell', 'verification', 'cross-file-check', '
|
|
348
|
+
developer: ['core', 'role-developer', 'file-ops', 'shell', 'verification', 'cross-file-check', 'context'],
|
|
349
|
+
'fw-developer': ['core', 'role-developer', 'file-ops', 'shell', 'verification', 'cross-file-check', 'fw-grammar', 'fw-validate', 'fw-cli', 'context'],
|
|
607
350
|
reviewer: ['core', 'role-reviewer', 'code-review', 'security', 'context'],
|
|
608
351
|
ops: ['core', 'role-ops', 'file-ops', 'shell', 'project-setup', 'verification', 'context'],
|
|
609
352
|
};
|
|
@@ -787,6 +787,7 @@ export class SwarmController {
|
|
|
787
787
|
const taskJson = JSON.stringify({
|
|
788
788
|
id: task.id,
|
|
789
789
|
parentId: task.parentId,
|
|
790
|
+
assignedProfile: task.assignedProfile,
|
|
790
791
|
instruction: prompt,
|
|
791
792
|
mode: task.context.files.length > 0 ? 'modify' : 'create',
|
|
792
793
|
targets: task.context.files.length > 0 ? task.context.files : undefined,
|
package/src/bot/system-prompt.ts
CHANGED
|
@@ -298,14 +298,7 @@ function formatBotOperations(cliCommands: CliCommandDoc[]): string {
|
|
|
298
298
|
}
|
|
299
299
|
|
|
300
300
|
export function buildBotSystemPrompt(contextBundle?: string, _cliCommands?: CliCommandDoc[], projectDir?: string, sections?: Set<PromptSection>): string {
|
|
301
|
-
let prompt =
|
|
302
|
-
|
|
303
|
-
Writes that shrink a file by >50% or write empty content are automatically BLOCKED.
|
|
304
|
-
Blocked shell commands: rm -rf, git push, npm publish, sudo, curl|sh.
|
|
305
|
-
Always validate BEFORE and AFTER patching.
|
|
306
|
-
Always read a file before patching it (you need exact strings for find/replace).
|
|
307
|
-
Use patch_file for modifications, write_file only for new files.
|
|
308
|
-
Be concise in your text responses — let tool results speak.`;
|
|
301
|
+
let prompt = '';
|
|
309
302
|
|
|
310
303
|
// Load project plan file if it exists — this is the vision spec that guides all work
|
|
311
304
|
if (projectDir) {
|