@vpxa/aikit 0.1.17 → 0.1.18
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/package.json +1 -1
- package/packages/server/dist/tools/flow.tools.js +1 -1
- package/packages/server/dist/version-check.js +1 -1
- package/scaffold/adapters/copilot.mjs +12 -4
- package/scaffold/definitions/bodies.mjs +66 -26
- package/scaffold/definitions/models.mjs +32 -17
- package/scaffold/general/agents/Architect-Reviewer-Alpha.agent.md +1 -1
- package/scaffold/general/agents/Architect-Reviewer-Beta.agent.md +1 -1
- package/scaffold/general/agents/Code-Reviewer-Alpha.agent.md +1 -1
- package/scaffold/general/agents/Code-Reviewer-Beta.agent.md +1 -1
- package/scaffold/general/agents/Debugger.agent.md +1 -1
- package/scaffold/general/agents/Documenter.agent.md +1 -1
- package/scaffold/general/agents/Explorer.agent.md +1 -1
- package/scaffold/general/agents/Frontend.agent.md +1 -1
- package/scaffold/general/agents/Implementer.agent.md +1 -1
- package/scaffold/general/agents/Orchestrator.agent.md +73 -44
- package/scaffold/general/agents/Planner.agent.md +12 -1
- package/scaffold/general/agents/README.md +17 -17
- package/scaffold/general/agents/Refactor.agent.md +1 -1
- package/scaffold/general/agents/Researcher-Alpha.agent.md +1 -1
- package/scaffold/general/agents/Researcher-Beta.agent.md +1 -1
- package/scaffold/general/agents/Researcher-Delta.agent.md +1 -1
- package/scaffold/general/agents/Researcher-Gamma.agent.md +1 -1
- package/scaffold/general/agents/Security.agent.md +1 -1
package/package.json
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
import{getToolMeta as e}from"../tool-metadata.js";import{basename as
|
|
1
|
+
import{getToolMeta as e}from"../tool-metadata.js";import{existsSync as t}from"node:fs";import{basename as n,join as r,resolve as i}from"node:path";import{z as a}from"zod";import{readFile as o}from"node:fs/promises";import{createLogger as s,serializeError as c}from"../../../core/dist/index.js";import{homedir as l}from"node:os";const u=s(`flow-tools`);function d(e){return{content:[{type:`text`,text:e}]}}function f(e){return e instanceof Error?e.message:String(e)}function p(s,p){let m=p.sources?.[0]?.path??process.cwd(),h=r(p.stateDir??r(p.sources[0].path,`.aikit-state`),`flows`),g=r(h,`registry.json`),_=r(h,`state.json`);function v(e,t){return i(y(e),t).replaceAll(`\\`,`/`)}function y(e){if(e.sourceType===`builtin`){let r=n(e.installPath),a=i(m,`.github`,`flows`,r);if(t(a))return a.replaceAll(`\\`,`/`);let o=i(l(),`.copilot`,`flows`,r);return t(o)?o.replaceAll(`\\`,`/`):a.replaceAll(`\\`,`/`)}return e.installPath.replaceAll(`\\`,`/`)}async function b(){let{FlowRegistryManager:e,FlowStateMachine:t}=await import(`../../../flows/dist/index.js`);return{registry:new e(g),stateMachine:new t(_)}}let x=e(`flow_list`);s.registerTool(`flow_list`,{title:x.title,description:`List all installed flows and their steps`,annotations:x.annotations,inputSchema:{}},async()=>{try{let{registry:e,stateMachine:t}=await b(),n=e.list(),r=t.getStatus(),i={flows:n.map(e=>({name:e.name,version:e.version,source:e.source,sourceType:e.sourceType,format:e.format,steps:e.manifest.steps.map(e=>e.id)})),activeFlow:r.success&&r.data?{flow:r.data.flow,status:r.data.status,currentStep:r.data.currentStep}:null};return d(JSON.stringify(i,null,2))}catch(e){return u.error(`flow_list failed`,c(e)),d(`Error: ${f(e)}`)}});let S=e(`flow_info`);s.registerTool(`flow_info`,{title:S.title,description:`Show detailed information about a specific flow`,annotations:S.annotations,inputSchema:{name:a.string().describe(`Flow name to get info for`)}},async({name:e})=>{try{let{registry:t}=await b(),n=t.get(e);if(!n)return d(`Flow "${e}" not found. Use flow_list to see available flows.`);let r={name:n.name,version:n.version,description:n.manifest.description,source:n.source,sourceType:n.sourceType,format:n.format,installPath:y(n),registeredAt:n.registeredAt,updatedAt:n.updatedAt,steps:n.manifest.steps.map(e=>({id:e.id,name:e.name,skill:v(n,e.skill),produces:e.produces,requires:e.requires,description:e.description})),agents:n.manifest.agents,artifactsDir:n.manifest.artifacts_dir,install:n.manifest.install};return d(JSON.stringify(r,null,2))}catch(e){return u.error(`flow_info failed`,c(e)),d(`Error: ${f(e)}`)}});let C=e(`flow_start`);s.registerTool(`flow_start`,{title:C.title,description:`Start a flow. Sets the active flow and positions at the first step.`,annotations:C.annotations,inputSchema:{flow:a.string().describe(`Flow name to start (use flow_list to see options)`)}},async({flow:e})=>{try{let{registry:t,stateMachine:n}=await b(),r=t.get(e);if(!r)return d(`Flow "${e}" not found. Use flow_list to see available flows.`);let i=n.start(r.name,r.manifest);if(!i.success||!i.data)return d(`Cannot start: ${i.error}`);let a=i.data,o=r.manifest.steps.find(e=>e.id===a.currentStep),s={started:!0,flow:a.flow,currentStep:a.currentStep,currentStepSkill:r&&o?v(r,o.skill):null,currentStepDescription:o?.description??null,totalSteps:r.manifest.steps.length,stepSequence:r.manifest.steps.map(e=>e.id),artifactsDir:r.manifest.artifacts_dir};return d(JSON.stringify(s,null,2))}catch(e){return u.error(`flow_start failed`,c(e)),d(`Error: ${f(e)}`)}});let w=e(`flow_step`);s.registerTool(`flow_step`,{title:w.title,description:`Advance the active flow: complete current step and move to next, skip current step, or redo current step.`,annotations:w.annotations,inputSchema:{action:a.enum([`next`,`skip`,`redo`]).describe(`next: mark current step done and advance. skip: skip current step. redo: repeat current step.`)}},async({action:e})=>{try{let{registry:t,stateMachine:n}=await b(),r=n.load();if(!r)return d(`No active flow. Use flow_start first.`);let i=t.get(r.flow);if(!i)return d(`Flow "${r.flow}" not found in registry.`);let a=n.step(e,i.manifest);if(!a.success||!a.data)return d(`Cannot ${e}: ${a.error}`);let o=a.data,s=o.currentStep?i.manifest.steps.find(e=>e.id===o.currentStep):null,c={flow:o.flow,status:o.status,action:e,currentStep:o.currentStep,currentStepSkill:i&&s?v(i,s.skill):null,currentStepDescription:s?.description??null,completedSteps:o.completedSteps,skippedSteps:o.skippedSteps,totalSteps:i.manifest.steps.length,remaining:i.manifest.steps.filter(e=>!o.completedSteps.includes(e.id)&&!o.skippedSteps.includes(e.id)&&e.id!==o.currentStep).map(e=>e.id)};return d(JSON.stringify(c,null,2))}catch(e){return u.error(`flow_step failed`,c(e)),d(`Error: ${f(e)}`)}});let T=e(`flow_status`);s.registerTool(`flow_status`,{title:T.title,description:`Show the current flow execution state — which flow is active, current step, completed steps, and artifacts.`,annotations:T.annotations,inputSchema:{}},async()=>{try{let{registry:e,stateMachine:t}=await b(),n=t.getStatus();if(!n.success||!n.data)return d(`No active flow. Use flow_start to begin one, or flow_list to see available flows.`);let r=n.data,i=e.get(r.flow),a=i?.manifest.steps.find(e=>e.id===r.currentStep),o=i&&a?v(i,a.skill):null,s={flow:r.flow,status:r.status,currentStep:r.currentStep,currentStepSkill:o,skillPath:o,currentStepDescription:a?.description??null,completedSteps:r.completedSteps,skippedSteps:r.skippedSteps,artifacts:r.artifacts,startedAt:r.startedAt,updatedAt:r.updatedAt,totalSteps:i?.manifest.steps.length??0,progress:i?`${r.completedSteps.length+r.skippedSteps.length}/${i.manifest.steps.length}`:`unknown`};return d(JSON.stringify(s,null,2))}catch(e){return u.error(`flow_status failed`,c(e)),d(`Error: ${f(e)}`)}});let E=e(`flow_read_skill`);s.registerTool(`flow_read_skill`,{title:E.title===`flow_read_skill`?`Flow Read Skill`:E.title,description:`Read the skill or instruction content for a flow step. If step is omitted, reads the current step.`,annotations:E.title===`flow_read_skill`?{readOnlyHint:!0,idempotentHint:!0}:E.annotations,inputSchema:{step:a.string().optional().describe(`Step id or name to read. Defaults to the current step.`)}},async({step:e})=>{try{let{registry:t,stateMachine:n}=await b(),r=n.getStatus();if(!r.success||!r.data)return d(`No active flow. Use flow_start to begin one, or flow_list to see available flows.`);let i=r.data,a=t.get(i.flow);if(!a)return d(`Flow "${i.flow}" not found in registry.`);let s=e??i.currentStep;if(!s)return d(`No current step is available for the active flow.`);let c=a.manifest.steps.find(e=>e.id===s||e.name===s);return d(c?await o(v(a,c.skill),`utf-8`):`Step "${s}" not found in flow "${i.flow}".`)}catch(e){return u.error(`flow_read_skill failed`,c(e)),e instanceof Error&&`code`in e&&e.code===`ENOENT`?d(`Could not read skill file: ${e.message}`):d(`Error: ${f(e)}`)}});let D=e(`flow_reset`);s.registerTool(`flow_reset`,{title:D.title,description:`Reset the active flow, clearing all state. Use to start over or switch to a different flow.`,annotations:D.annotations,inputSchema:{}},async()=>{try{let{stateMachine:e}=await b(),t=e.reset();return t.success?d(`Flow state reset. Use flow_start to begin a new flow.`):d(`Reset failed: ${t.error}`)}catch(e){return u.error(`flow_reset failed`,c(e)),d(`Error: ${f(e)}`)}})}export{p as registerFlowTools};
|
|
@@ -1 +1 @@
|
|
|
1
|
-
import{existsSync as e,readFileSync as t}from"node:fs";import{dirname as n,resolve as r}from"node:path";import{fileURLToPath as i}from"node:url";import{createLogger as a}from"../../core/dist/index.js";import{
|
|
1
|
+
import{existsSync as e,readFileSync as t}from"node:fs";import{dirname as n,resolve as r}from"node:path";import{fileURLToPath as i}from"node:url";import{createLogger as a}from"../../core/dist/index.js";import{homedir as o}from"node:os";import{execFile as s}from"node:child_process";const c=a(`server`);function l(){let e=r(n(i(import.meta.url)),`..`,`..`,`..`,`package.json`);try{return JSON.parse(t(e,`utf-8`)).version??`0.0.0`}catch{return`0.0.0`}}function u(e,t){let n=e.split(`.`).map(Number),r=t.split(`.`).map(Number);for(let e=0;e<3;e++){let t=(n[e]??0)-(r[e]??0);if(t!==0)return t>0?1:-1}return 0}function d(){let e=l();fetch(`https://registry.npmjs.org/@vpxa/aikit/latest`,{signal:AbortSignal.timeout(5e3)}).then(e=>{if(e.ok)return e.json()}).then(t=>{if(!t||typeof t!=`object`)return;let n=t.version;n&&u(e,n)<0&&c.warn(`Update available`,{currentVersion:e,latestVersion:n,updateCommand:`aikit upgrade`})}).catch(()=>{})}function f(){try{let n=r(o(),`.copilot`,`.aikit-scaffold.json`);return e(n)?JSON.parse(t(n,`utf-8`)).version??null:null}catch{return null}}function p(){try{let n=r(process.cwd(),`.github`,`.aikit-scaffold.json`);return e(n)?JSON.parse(t(n,`utf-8`)).version??null:null}catch{return null}}let m=`idle`,h=null;function g(){return{state:m,error:h}}function _(){try{let t=l(),a=f(),o=p();if(!(a!=null&&a!==t)&&!(o!=null&&o!==t)||m===`pending`||m===`success`)return;m=`pending`,h=null,c.info(`Scaffold version mismatch — auto-upgrading`,{serverVersion:t,userScaffoldVersion:a,workspaceScaffoldVersion:o});let u=r(n(i(import.meta.url)),`..`,`..`,`..`,`bin`,`aikit.mjs`);if(!e(u)){m=`failed`,h=`aikit CLI binary not found at ${u}`,c.warn(`Cannot auto-upgrade: aikit CLI binary not found`,{binPath:u});return}s(process.execPath,[u,`upgrade`],{timeout:3e4,windowsHide:!0},(e,t,n)=>{e?(m=`failed`,h=e.message,c.warn(`Auto-upgrade failed`,{error:e.message,stderr:n?.slice(0,500)})):(m=`success`,h=null,c.info(`Auto-upgrade complete`))}).unref()}catch(e){m=`failed`,h=e instanceof Error?e.message:String(e),c.warn(`Auto-upgrade check failed`,{error:h})}}export{_ as autoUpgradeScaffold,d as checkForUpdates,l as getCurrentVersion,g as getUpgradeState};
|
|
@@ -64,8 +64,14 @@ function buildToolsYaml(toolRole) {
|
|
|
64
64
|
}
|
|
65
65
|
|
|
66
66
|
function copilotModel(agentName) {
|
|
67
|
-
const
|
|
68
|
-
|
|
67
|
+
const models = MODELS[agentName];
|
|
68
|
+
if (!models) return 'Auto (copilot)';
|
|
69
|
+
if (Array.isArray(models)) {
|
|
70
|
+
if (models.length === 0) return 'Auto (copilot)';
|
|
71
|
+
if (models.length === 1) return models[0];
|
|
72
|
+
return `[${models.join(', ')}]`;
|
|
73
|
+
}
|
|
74
|
+
return models;
|
|
69
75
|
}
|
|
70
76
|
|
|
71
77
|
const FLOWS_SECTION = [
|
|
@@ -84,13 +90,15 @@ function buildAgentTable() {
|
|
|
84
90
|
if (def.variants) {
|
|
85
91
|
for (const suffix of VARIANT_GROUPS[name] || []) {
|
|
86
92
|
const fullName = `${name}-${suffix}`;
|
|
87
|
-
const
|
|
93
|
+
const models = MODELS[fullName] || MODELS[name];
|
|
94
|
+
const model = Array.isArray(models) ? models[0] : models || 'Unknown';
|
|
88
95
|
const varDef = def.variants[suffix] || {};
|
|
89
96
|
const desc = varDef.description || def.description;
|
|
90
97
|
rows.push(`| **${fullName}** | ${desc} | ${model} | ${def.category} |`);
|
|
91
98
|
}
|
|
92
99
|
} else {
|
|
93
|
-
const
|
|
100
|
+
const models = MODELS[name];
|
|
101
|
+
const model = Array.isArray(models) ? models[0] : models || 'Unknown';
|
|
94
102
|
rows.push(`| **${name}** | ${def.description} | ${model} | ${def.category} |`);
|
|
95
103
|
}
|
|
96
104
|
}
|
|
@@ -40,26 +40,43 @@ ${agentTable}
|
|
|
40
40
|
3. After review: \`evidence_map({ action: "gate", task_id })\` → YIELD/HOLD/HARD_BLOCK
|
|
41
41
|
4. Auto-upgrade tier if unknowns reveal contract/security issues
|
|
42
42
|
|
|
43
|
-
##
|
|
43
|
+
## Flow-Driven Development
|
|
44
44
|
|
|
45
|
-
|
|
46
|
-
1. Read onboard artifacts → parse goal → identify affected subsystems → \`forge_classify\`
|
|
47
|
-
2. Research: <5 files direct, 5-15 Explorer→Researcher, >15 multiple parallel
|
|
48
|
-
3. Draft plan: 3-10 phases, agent assignments, TDD steps, dependency graph
|
|
49
|
-
4. Batch independent phases for parallel execution
|
|
50
|
-
5. **🛑 STOP — user approval required**
|
|
45
|
+
Orchestrator uses the flow system for structured development. Flows define the step sequence — Orchestrator adds multi-agent orchestration, quality gates, and review protocols on top.
|
|
51
46
|
|
|
52
|
-
###
|
|
47
|
+
### Flow Selection
|
|
53
48
|
|
|
54
|
-
|
|
49
|
+
| Situation | Flow | Steps |
|
|
50
|
+
|-----------|------|-------|
|
|
51
|
+
| Bug fix, small feature, refactoring | \`aikit:basic\` | assess → implement → verify |
|
|
52
|
+
| New feature, major change, multi-file | \`aikit:advanced\` | spec → plan → task → execute → verify |
|
|
53
|
+
| Custom/specialized work | Check \`flow_list\` | Follow flow-specific steps |
|
|
55
54
|
|
|
56
|
-
|
|
57
|
-
2. ✅ Task decomposition table produced? (show user: task → files → agent → parallel batch)
|
|
58
|
-
3. ✅ Independence Check passed per pair? (shared files? shared state? ordering dependency? → must be "No" for parallel)
|
|
59
|
-
4. ✅ Each task ≤ 3 files? (if not, split further)
|
|
60
|
-
5. ✅ Parallel batches identified? (tasks with no dependencies MUST be in same batch)
|
|
55
|
+
**If multiple flows could apply and user hasn't specified → ask user to choose.**
|
|
61
56
|
|
|
62
|
-
|
|
57
|
+
### Session Start Flow Check
|
|
58
|
+
|
|
59
|
+
1. \`flow_status\` — check for active flow
|
|
60
|
+
2. If active:
|
|
61
|
+
- Note current step name and skill path
|
|
62
|
+
- Read the current step skill with \`flow_read_skill\`
|
|
63
|
+
- Follow its instructions
|
|
64
|
+
- When complete: \`flow_step({ action: 'next' })\`
|
|
65
|
+
3. If no active flow:
|
|
66
|
+
- \`flow_list\` — check ALL available flows (builtin + custom)
|
|
67
|
+
- Recommend appropriate flow based on task scope
|
|
68
|
+
- \`flow_start({ flow: '<name>' })\` after user confirms
|
|
69
|
+
|
|
70
|
+
### Orchestrator Protocols (apply during ALL flow steps)
|
|
71
|
+
|
|
72
|
+
**PRE-DISPATCH GATE — complete ALL before ANY \`runSubagent\` call:**
|
|
73
|
+
1. ✅ \`multi-agents-development\` skill loaded?
|
|
74
|
+
2. ✅ Task decomposition table produced?
|
|
75
|
+
3. ✅ Independence Check passed per pair?
|
|
76
|
+
4. ✅ Each task ≤ 3 files?
|
|
77
|
+
5. ✅ Parallel batches identified?
|
|
78
|
+
|
|
79
|
+
**Decomposition output format:**
|
|
63
80
|
|
|
64
81
|
\`\`\`
|
|
65
82
|
Batch 1 (parallel):
|
|
@@ -69,23 +86,35 @@ Batch 2 (after batch 1):
|
|
|
69
86
|
Task C: [agent] → [file5] — [goal] (depends on A)
|
|
70
87
|
\`\`\`
|
|
71
88
|
|
|
72
|
-
**
|
|
73
|
-
1. **Scope** — exact files
|
|
89
|
+
**Subagent prompt template:**
|
|
90
|
+
1. **Scope** — exact files + boundary
|
|
74
91
|
2. **Goal** — acceptance criteria, testable
|
|
75
|
-
3. **Arch Context** —
|
|
76
|
-
4. **Constraints** — patterns, conventions
|
|
92
|
+
3. **Arch Context** — code snippets from \`compact()\`/\`digest()\`
|
|
93
|
+
4. **Constraints** — patterns, conventions
|
|
77
94
|
5. **FORGE** — tier + evidence requirements
|
|
78
95
|
6. **Self-Review** — checklist before declaring status
|
|
79
96
|
|
|
80
|
-
**Subagent status protocol
|
|
97
|
+
**Subagent status protocol:** \`DONE\` | \`DONE_WITH_CONCERNS\` | \`NEEDS_CONTEXT\` | \`BLOCKED\`
|
|
81
98
|
|
|
82
|
-
**
|
|
99
|
+
**Additional Orchestrator requirements during flow execution:**
|
|
100
|
+
- Apply the PRE-DISPATCH GATE before any subagent dispatch, regardless of flow
|
|
101
|
+
- Apply FORGE at classification and verification points; pass tier/evidence expectations into subagents and gate with \`evidence_map\`
|
|
102
|
+
- Enforce delegation rules at all times — Orchestrator never implements code directly
|
|
103
|
+
- Use the subagent prompt template for every dispatch so step-specific flow instructions are grounded in actual code context
|
|
83
104
|
|
|
84
|
-
|
|
85
|
-
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
|
|
105
|
+
**Per-step review cycle:** Dispatch → Code Review (Alpha+Beta) → Arch Review (if boundary changes) → Security (if applicable) → \`evidence_map\` gate → **🛑 STOP — present results**
|
|
106
|
+
|
|
107
|
+
### Flow MCP Tools
|
|
108
|
+
|
|
109
|
+
| Tool | Purpose |
|
|
110
|
+
|------|---------|
|
|
111
|
+
| \`flow_list\` | List installed flows and active flow |
|
|
112
|
+
| \`flow_info\` | Get detailed flow info including steps |
|
|
113
|
+
| \`flow_start\` | Start a named flow |
|
|
114
|
+
| \`flow_step\` | Advance: next, skip, or redo current step |
|
|
115
|
+
| \`flow_status\` | Check current execution state |
|
|
116
|
+
| \`flow_reset\` | Clear flow state to start over |
|
|
117
|
+
| \`flow_read_skill\` | Read the skill content for the current step |
|
|
89
118
|
|
|
90
119
|
## Emergency: STOP → ASSESS → CONTAIN → RECOVER → DOCUMENT
|
|
91
120
|
|
|
@@ -228,6 +257,17 @@ At session start, check for an active flow:
|
|
|
228
257
|
5. **Dependency Graph** — For each phase, list dependencies. Group into parallel batches
|
|
229
258
|
6. **Present** — Show plan with open questions, complexity estimate, parallel batch layout
|
|
230
259
|
|
|
260
|
+
## Flow Integration
|
|
261
|
+
|
|
262
|
+
When activated as part of a flow (e.g., \`aikit:advanced\` plan step or \`aikit:basic\` assess step):
|
|
263
|
+
1. Check \`flow_status\` for current step context
|
|
264
|
+
2. Read the step's skill file for specific instructions
|
|
265
|
+
3. Follow skill instructions while applying Planner methodology
|
|
266
|
+
4. Produce required artifacts (as specified by the flow step's \`produces\` field)
|
|
267
|
+
5. When complete, report to Orchestrator (do NOT call \`flow_step\` — let Orchestrator advance)
|
|
268
|
+
|
|
269
|
+
When no flow is active, operate autonomously following normal Planner methodology.
|
|
270
|
+
|
|
231
271
|
## Subagent Output Relay
|
|
232
272
|
|
|
233
273
|
When subagents complete, their visual outputs (from \`present\`) are NOT visible to the user.
|
|
@@ -11,29 +11,44 @@
|
|
|
11
11
|
|
|
12
12
|
export const MODELS = {
|
|
13
13
|
// ─── Single-role agents ───────────────────────────────────────────────
|
|
14
|
-
Orchestrator: 'Claude Opus 4.6',
|
|
15
|
-
Planner: 'Claude Opus 4.6',
|
|
16
|
-
Implementer:
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
|
|
14
|
+
Orchestrator: ['Claude Opus 4.6 (copilot)', 'GPT-5.4 (copilot)', 'Auto (copilot)'],
|
|
15
|
+
Planner: ['Claude Opus 4.6 (copilot)', 'GPT-5.4 (copilot)', 'Auto (copilot)'],
|
|
16
|
+
Implementer: [
|
|
17
|
+
'GPT-5.4 (copilot)',
|
|
18
|
+
'Gemini 3.1 Pro (Preview) (copilot)',
|
|
19
|
+
'GPT-5.3-Codex (copilot)',
|
|
20
|
+
'Auto (copilot)',
|
|
21
|
+
],
|
|
22
|
+
Frontend: [
|
|
23
|
+
'Gemini 3.1 Pro (Preview) (copilot)',
|
|
24
|
+
'GPT-5.4 (copilot)',
|
|
25
|
+
'GPT-5.3-Codex (copilot)',
|
|
26
|
+
'Auto (copilot)',
|
|
27
|
+
],
|
|
28
|
+
Debugger: [
|
|
29
|
+
'Claude Opus 4.6 (copilot)',
|
|
30
|
+
'GPT-5.4 (copilot)',
|
|
31
|
+
'GPT-5.3-Codex (copilot)',
|
|
32
|
+
'Auto (copilot)',
|
|
33
|
+
],
|
|
34
|
+
Refactor: ['GPT-5.4 (copilot)', 'GPT-5.3-Codex (copilot)', 'Auto (copilot)'],
|
|
35
|
+
Security: ['Claude Opus 4.6 (copilot)', 'GPT-5.4 (copilot)', 'Auto (copilot)'],
|
|
36
|
+
Documenter: ['GPT-5.4 (copilot)', 'Gemini 3.1 Pro (Preview) (copilot)', 'Auto (copilot)'],
|
|
37
|
+
Explorer: ['Gemini 3 Flash (Preview) (copilot)', 'Claude Haiku 4.5 (copilot)', 'Auto (copilot)'],
|
|
23
38
|
|
|
24
39
|
// ─── Researcher variants (4 models for multi-model decision protocol) ────────────
|
|
25
|
-
'Researcher-Alpha': 'Claude Opus 4.6',
|
|
26
|
-
'Researcher-Beta': 'Claude Sonnet 4.6',
|
|
27
|
-
'Researcher-Gamma': 'GPT-5.4',
|
|
28
|
-
'Researcher-Delta': 'Gemini 3.1 Pro (Preview)',
|
|
40
|
+
'Researcher-Alpha': ['Claude Opus 4.6 (copilot)', 'Auto (copilot)'],
|
|
41
|
+
'Researcher-Beta': ['Claude Sonnet 4.6 (copilot)', 'Auto (copilot)'],
|
|
42
|
+
'Researcher-Gamma': ['GPT-5.4 (copilot)', 'Auto (copilot)'],
|
|
43
|
+
'Researcher-Delta': ['Gemini 3.1 Pro (Preview) (copilot)', 'Auto (copilot)'],
|
|
29
44
|
|
|
30
45
|
// ─── Code-Reviewer variants (2 models for dual review) ───────────────
|
|
31
|
-
'Code-Reviewer-Alpha': 'GPT-5.4',
|
|
32
|
-
'Code-Reviewer-Beta': 'Claude Opus 4.6',
|
|
46
|
+
'Code-Reviewer-Alpha': ['GPT-5.4 (copilot)', 'Auto (copilot)'],
|
|
47
|
+
'Code-Reviewer-Beta': ['Claude Opus 4.6 (copilot)', 'Auto (copilot)'],
|
|
33
48
|
|
|
34
49
|
// ─── Architect-Reviewer variants (2 models for dual review) ──────────
|
|
35
|
-
'Architect-Reviewer-Alpha': 'GPT-5.4',
|
|
36
|
-
'Architect-Reviewer-Beta': 'Claude Opus 4.6',
|
|
50
|
+
'Architect-Reviewer-Alpha': ['GPT-5.4 (copilot)', 'Auto (copilot)'],
|
|
51
|
+
'Architect-Reviewer-Beta': ['Claude Opus 4.6 (copilot)', 'Auto (copilot)'],
|
|
37
52
|
};
|
|
38
53
|
|
|
39
54
|
/**
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Primary architecture reviewer'
|
|
3
3
|
argument-hint: Files, PR, or subsystem to architecture-review
|
|
4
4
|
tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: GPT-5.4 (copilot)
|
|
5
|
+
model: [GPT-5.4 (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Architect-Reviewer-Alpha - The Structural Guardian
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Architecture reviewer variant — different LLM perspective for dual review'
|
|
3
3
|
argument-hint: Files, PR, or subsystem to architecture-review
|
|
4
4
|
tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: Claude Opus 4.6 (copilot)
|
|
5
|
+
model: [Claude Opus 4.6 (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Architect-Reviewer-Beta - The Structural Guardian
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Primary code reviewer'
|
|
3
3
|
argument-hint: File path, PR, or code to review
|
|
4
4
|
tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: GPT-5.4 (copilot)
|
|
5
|
+
model: [GPT-5.4 (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Code-Reviewer-Alpha - The Quality Guardian
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Code reviewer variant — different LLM perspective for dual review'
|
|
3
3
|
argument-hint: File path, PR, or code to review
|
|
4
4
|
tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: Claude Opus 4.6 (copilot)
|
|
5
|
+
model: [Claude Opus 4.6 (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Code-Reviewer-Beta - The Quality Guardian
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Expert debugger that diagnoses issues, traces errors, and provides solutions'
|
|
3
3
|
argument-hint: Error message, stack trace, or description of issue
|
|
4
4
|
tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalSelection, read/terminalLastCommand, agent/runSubagent, edit/createFile, edit/editFiles, search/changes, search/codebase, search/usages, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: Claude Opus 4.6 (copilot)
|
|
5
|
+
model: [Claude Opus 4.6 (copilot), GPT-5.4 (copilot), GPT-5.3-Codex (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Debugger - The Problem Solver
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Documentation specialist that creates and maintains comprehensive project documentation'
|
|
3
3
|
argument-hint: Component, API, feature, or area to document
|
|
4
4
|
tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, edit/createFile, edit/editFiles, edit/rename, edit/createDirectory, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: GPT-5.4 (copilot)
|
|
5
|
+
model: [GPT-5.4 (copilot), Gemini 3.1 Pro (Preview) (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Documenter - The Knowledge Keeper
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Rapid codebase exploration to find files, usages, dependencies, and structural context'
|
|
3
3
|
argument-hint: Find files, usages, and context related to: {topic or goal}
|
|
4
4
|
tools: [read/problems, read/readFile, search/changes, search/codebase, search/usages, search/fileSearch, search/listDirectory, search/textSearch, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: Gemini 3 Flash (Preview) (copilot)
|
|
5
|
+
model: [Gemini 3 Flash (Preview) (copilot), Claude Haiku 4.5 (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Explorer - The Rapid Scout
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'UI/UX specialist for React, styling, responsive design, and frontend implementation'
|
|
3
3
|
argument-hint: UI component, styling task, or frontend feature
|
|
4
4
|
tools: [execute/createAndRunTask, execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, edit/createFile, edit/editFiles, edit/rename, edit/createDirectory, search/changes, search/codebase, search/usages, todo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: Gemini 3.1 Pro (Preview) (copilot)
|
|
5
|
+
model: [Gemini 3.1 Pro (Preview) (copilot), GPT-5.4 (copilot), GPT-5.3-Codex (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Frontend - The UI Specialist
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Persistent implementation agent that writes code following TDD practices until all tasks are complete'
|
|
3
3
|
argument-hint: Implementation task, feature, or phase from plan
|
|
4
4
|
tools: [execute/createAndRunTask, execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, edit/createFile, edit/editFiles, edit/rename, edit/createDirectory, search/changes, search/codebase, search/usages, todo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: GPT-5.4 (copilot)
|
|
5
|
+
model: [GPT-5.4 (copilot), Gemini 3.1 Pro (Preview) (copilot), GPT-5.3-Codex (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Implementer - The Code Builder
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
description: 'Master conductor that orchestrates the full development lifecycle: Planning → Implementation → Review → Recovery → Commit'
|
|
3
3
|
tools: [vscode/memory, vscode/runCommand, vscode/switchAgent, execute/killTerminal, execute/createAndRunTask, execute/runInTerminal, read/terminalSelection, read/terminalLastCommand, read/problems, read/readFile, agent/runSubagent, edit/createFile, edit/editFiles, edit/rename, edit/createDirectory, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, todo, search/searchSubagent, search/textSearch, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, vscode/askQuestions, vscode/resolveMemoryFileUri, aikit/*]
|
|
4
|
-
model: Claude Opus 4.6 (copilot)
|
|
4
|
+
model: [Claude Opus 4.6 (copilot), GPT-5.4 (copilot), Auto (copilot)]
|
|
5
5
|
---
|
|
6
6
|
|
|
7
7
|
# Orchestrator - The Master Conductor
|
|
@@ -21,23 +21,23 @@ You orchestrate the full development lifecycle: **planning → implementation
|
|
|
21
21
|
|
|
22
22
|
| Agent | Purpose | Model | Category |
|
|
23
23
|
|-------|---------|-------|----------|
|
|
24
|
-
| **Orchestrator** | Master conductor that orchestrates the full development lifecycle: Planning → Implementation → Review → Recovery → Commit | Claude Opus 4.6 | orchestration |
|
|
25
|
-
| **Planner** | Autonomous planner that researches codebases and writes comprehensive TDD implementation plans | Claude Opus 4.6 | orchestration |
|
|
26
|
-
| **Implementer** | Persistent implementation agent that writes code following TDD practices until all tasks are complete | GPT-5.4 | implementation |
|
|
27
|
-
| **Frontend** | UI/UX specialist for React, styling, responsive design, and frontend implementation | Gemini 3.1 Pro (Preview) | implementation |
|
|
28
|
-
| **Refactor** | Code refactoring specialist that improves structure, readability, and maintainability | GPT-5.4 | implementation |
|
|
29
|
-
| **Debugger** | Expert debugger that diagnoses issues, traces errors, and provides solutions | Claude Opus 4.6 | diagnostics |
|
|
30
|
-
| **Security** | Security specialist that analyzes code for vulnerabilities and compliance | Claude Opus 4.6 | diagnostics |
|
|
31
|
-
| **Documenter** | Documentation specialist that creates and maintains comprehensive project documentation | GPT-5.4 | documentation |
|
|
32
|
-
| **Explorer** | Rapid codebase exploration to find files, usages, dependencies, and structural context | Gemini 3 Flash (Preview) | exploration |
|
|
33
|
-
| **Researcher-Alpha** | Primary deep research agent — also serves as default Researcher | Claude Opus 4.6 | research |
|
|
34
|
-
| **Researcher-Beta** | Research variant — pragmatic analysis with focus on trade-offs and edge cases | Claude Sonnet 4.6 | research |
|
|
35
|
-
| **Researcher-Gamma** | Research variant — broad pattern matching across domains and technologies | GPT-5.4 | research |
|
|
36
|
-
| **Researcher-Delta** | Research variant — implementation feasibility and performance implications | Gemini 3.1 Pro (Preview) | research |
|
|
37
|
-
| **Code-Reviewer-Alpha** | Primary code reviewer | GPT-5.4 | review |
|
|
38
|
-
| **Code-Reviewer-Beta** | Code reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 | review |
|
|
39
|
-
| **Architect-Reviewer-Alpha** | Primary architecture reviewer | GPT-5.4 | review |
|
|
40
|
-
| **Architect-Reviewer-Beta** | Architecture reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 | review |
|
|
24
|
+
| **Orchestrator** | Master conductor that orchestrates the full development lifecycle: Planning → Implementation → Review → Recovery → Commit | Claude Opus 4.6 (copilot) | orchestration |
|
|
25
|
+
| **Planner** | Autonomous planner that researches codebases and writes comprehensive TDD implementation plans | Claude Opus 4.6 (copilot) | orchestration |
|
|
26
|
+
| **Implementer** | Persistent implementation agent that writes code following TDD practices until all tasks are complete | GPT-5.4 (copilot) | implementation |
|
|
27
|
+
| **Frontend** | UI/UX specialist for React, styling, responsive design, and frontend implementation | Gemini 3.1 Pro (Preview) (copilot) | implementation |
|
|
28
|
+
| **Refactor** | Code refactoring specialist that improves structure, readability, and maintainability | GPT-5.4 (copilot) | implementation |
|
|
29
|
+
| **Debugger** | Expert debugger that diagnoses issues, traces errors, and provides solutions | Claude Opus 4.6 (copilot) | diagnostics |
|
|
30
|
+
| **Security** | Security specialist that analyzes code for vulnerabilities and compliance | Claude Opus 4.6 (copilot) | diagnostics |
|
|
31
|
+
| **Documenter** | Documentation specialist that creates and maintains comprehensive project documentation | GPT-5.4 (copilot) | documentation |
|
|
32
|
+
| **Explorer** | Rapid codebase exploration to find files, usages, dependencies, and structural context | Gemini 3 Flash (Preview) (copilot) | exploration |
|
|
33
|
+
| **Researcher-Alpha** | Primary deep research agent — also serves as default Researcher | Claude Opus 4.6 (copilot) | research |
|
|
34
|
+
| **Researcher-Beta** | Research variant — pragmatic analysis with focus on trade-offs and edge cases | Claude Sonnet 4.6 (copilot) | research |
|
|
35
|
+
| **Researcher-Gamma** | Research variant — broad pattern matching across domains and technologies | GPT-5.4 (copilot) | research |
|
|
36
|
+
| **Researcher-Delta** | Research variant — implementation feasibility and performance implications | Gemini 3.1 Pro (Preview) (copilot) | research |
|
|
37
|
+
| **Code-Reviewer-Alpha** | Primary code reviewer | GPT-5.4 (copilot) | review |
|
|
38
|
+
| **Code-Reviewer-Beta** | Code reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 (copilot) | review |
|
|
39
|
+
| **Architect-Reviewer-Alpha** | Primary architecture reviewer | GPT-5.4 (copilot) | review |
|
|
40
|
+
| **Architect-Reviewer-Beta** | Architecture reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 (copilot) | review |
|
|
41
41
|
|
|
42
42
|
**Parallelism**: Read-only agents run in parallel freely. File-modifying agents run in parallel ONLY on completely different files. Max 4 concurrent file-modifying agents.
|
|
43
43
|
|
|
@@ -57,26 +57,43 @@ You orchestrate the full development lifecycle: **planning → implementation
|
|
|
57
57
|
3. After review: `evidence_map({ action: "gate", task_id })` → YIELD/HOLD/HARD_BLOCK
|
|
58
58
|
4. Auto-upgrade tier if unknowns reveal contract/security issues
|
|
59
59
|
|
|
60
|
-
##
|
|
60
|
+
## Flow-Driven Development
|
|
61
61
|
|
|
62
|
-
|
|
63
|
-
1. Read onboard artifacts → parse goal → identify affected subsystems → `forge_classify`
|
|
64
|
-
2. Research: <5 files direct, 5-15 Explorer→Researcher, >15 multiple parallel
|
|
65
|
-
3. Draft plan: 3-10 phases, agent assignments, TDD steps, dependency graph
|
|
66
|
-
4. Batch independent phases for parallel execution
|
|
67
|
-
5. **🛑 STOP — user approval required**
|
|
62
|
+
Orchestrator uses the flow system for structured development. Flows define the step sequence — Orchestrator adds multi-agent orchestration, quality gates, and review protocols on top.
|
|
68
63
|
|
|
69
|
-
###
|
|
64
|
+
### Flow Selection
|
|
70
65
|
|
|
71
|
-
|
|
66
|
+
| Situation | Flow | Steps |
|
|
67
|
+
|-----------|------|-------|
|
|
68
|
+
| Bug fix, small feature, refactoring | `aikit:basic` | assess → implement → verify |
|
|
69
|
+
| New feature, major change, multi-file | `aikit:advanced` | spec → plan → task → execute → verify |
|
|
70
|
+
| Custom/specialized work | Check `flow_list` | Follow flow-specific steps |
|
|
72
71
|
|
|
73
|
-
|
|
74
|
-
2. ✅ Task decomposition table produced? (show user: task → files → agent → parallel batch)
|
|
75
|
-
3. ✅ Independence Check passed per pair? (shared files? shared state? ordering dependency? → must be "No" for parallel)
|
|
76
|
-
4. ✅ Each task ≤ 3 files? (if not, split further)
|
|
77
|
-
5. ✅ Parallel batches identified? (tasks with no dependencies MUST be in same batch)
|
|
72
|
+
**If multiple flows could apply and user hasn't specified → ask user to choose.**
|
|
78
73
|
|
|
79
|
-
|
|
74
|
+
### Session Start Flow Check
|
|
75
|
+
|
|
76
|
+
1. `flow_status` — check for active flow
|
|
77
|
+
2. If active:
|
|
78
|
+
- Note current step name and skill path
|
|
79
|
+
- Read the current step skill with `flow_read_skill`
|
|
80
|
+
- Follow its instructions
|
|
81
|
+
- When complete: `flow_step({ action: 'next' })`
|
|
82
|
+
3. If no active flow:
|
|
83
|
+
- `flow_list` — check ALL available flows (builtin + custom)
|
|
84
|
+
- Recommend appropriate flow based on task scope
|
|
85
|
+
- `flow_start({ flow: '<name>' })` after user confirms
|
|
86
|
+
|
|
87
|
+
### Orchestrator Protocols (apply during ALL flow steps)
|
|
88
|
+
|
|
89
|
+
**PRE-DISPATCH GATE — complete ALL before ANY `runSubagent` call:**
|
|
90
|
+
1. ✅ `multi-agents-development` skill loaded?
|
|
91
|
+
2. ✅ Task decomposition table produced?
|
|
92
|
+
3. ✅ Independence Check passed per pair?
|
|
93
|
+
4. ✅ Each task ≤ 3 files?
|
|
94
|
+
5. ✅ Parallel batches identified?
|
|
95
|
+
|
|
96
|
+
**Decomposition output format:**
|
|
80
97
|
|
|
81
98
|
```
|
|
82
99
|
Batch 1 (parallel):
|
|
@@ -86,23 +103,35 @@ Batch 2 (after batch 1):
|
|
|
86
103
|
Task C: [agent] → [file5] — [goal] (depends on A)
|
|
87
104
|
```
|
|
88
105
|
|
|
89
|
-
**
|
|
90
|
-
1. **Scope** — exact files
|
|
106
|
+
**Subagent prompt template:**
|
|
107
|
+
1. **Scope** — exact files + boundary
|
|
91
108
|
2. **Goal** — acceptance criteria, testable
|
|
92
|
-
3. **Arch Context** —
|
|
93
|
-
4. **Constraints** — patterns, conventions
|
|
109
|
+
3. **Arch Context** — code snippets from `compact()`/`digest()`
|
|
110
|
+
4. **Constraints** — patterns, conventions
|
|
94
111
|
5. **FORGE** — tier + evidence requirements
|
|
95
112
|
6. **Self-Review** — checklist before declaring status
|
|
96
113
|
|
|
97
|
-
**Subagent status protocol
|
|
114
|
+
**Subagent status protocol:** `DONE` | `DONE_WITH_CONCERNS` | `NEEDS_CONTEXT` | `BLOCKED`
|
|
115
|
+
|
|
116
|
+
**Additional Orchestrator requirements during flow execution:**
|
|
117
|
+
- Apply the PRE-DISPATCH GATE before any subagent dispatch, regardless of flow
|
|
118
|
+
- Apply FORGE at classification and verification points; pass tier/evidence expectations into subagents and gate with `evidence_map`
|
|
119
|
+
- Enforce delegation rules at all times — Orchestrator never implements code directly
|
|
120
|
+
- Use the subagent prompt template for every dispatch so step-specific flow instructions are grounded in actual code context
|
|
98
121
|
|
|
99
|
-
**Per-
|
|
122
|
+
**Per-step review cycle:** Dispatch → Code Review (Alpha+Beta) → Arch Review (if boundary changes) → Security (if applicable) → `evidence_map` gate → **🛑 STOP — present results**
|
|
123
|
+
|
|
124
|
+
### Flow MCP Tools
|
|
100
125
|
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
126
|
+
| Tool | Purpose |
|
|
127
|
+
|------|---------|
|
|
128
|
+
| `flow_list` | List installed flows and active flow |
|
|
129
|
+
| `flow_info` | Get detailed flow info including steps |
|
|
130
|
+
| `flow_start` | Start a named flow |
|
|
131
|
+
| `flow_step` | Advance: next, skip, or redo current step |
|
|
132
|
+
| `flow_status` | Check current execution state |
|
|
133
|
+
| `flow_reset` | Clear flow state to start over |
|
|
134
|
+
| `flow_read_skill` | Read the skill content for the current step |
|
|
106
135
|
|
|
107
136
|
## Emergency: STOP → ASSESS → CONTAIN → RECOVER → DOCUMENT
|
|
108
137
|
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
description: 'Autonomous planner that researches codebases and writes comprehensive TDD implementation plans'
|
|
3
3
|
tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, edit/createFile, edit/editFiles, edit/rename, edit/createDirectory, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, todo, search/searchSubagent, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
4
|
-
model: Claude Opus 4.6 (copilot)
|
|
4
|
+
model: [Claude Opus 4.6 (copilot), GPT-5.4 (copilot), Auto (copilot)]
|
|
5
5
|
---
|
|
6
6
|
|
|
7
7
|
# Planner - The Strategic Architect
|
|
@@ -38,6 +38,17 @@ You are the **Planner**, autonomous planner that researches codebases and writes
|
|
|
38
38
|
5. **Dependency Graph** — For each phase, list dependencies. Group into parallel batches
|
|
39
39
|
6. **Present** — Show plan with open questions, complexity estimate, parallel batch layout
|
|
40
40
|
|
|
41
|
+
## Flow Integration
|
|
42
|
+
|
|
43
|
+
When activated as part of a flow (e.g., `aikit:advanced` plan step or `aikit:basic` assess step):
|
|
44
|
+
1. Check `flow_status` for current step context
|
|
45
|
+
2. Read the step's skill file for specific instructions
|
|
46
|
+
3. Follow skill instructions while applying Planner methodology
|
|
47
|
+
4. Produce required artifacts (as specified by the flow step's `produces` field)
|
|
48
|
+
5. When complete, report to Orchestrator (do NOT call `flow_step` — let Orchestrator advance)
|
|
49
|
+
|
|
50
|
+
When no flow is active, operate autonomously following normal Planner methodology.
|
|
51
|
+
|
|
41
52
|
## Subagent Output Relay
|
|
42
53
|
|
|
43
54
|
When subagents complete, their visual outputs (from `present`) are NOT visible to the user.
|
|
@@ -6,23 +6,23 @@ This directory contains AI agent definitions generated by `@vpxa/aikit init`.
|
|
|
6
6
|
|
|
7
7
|
| Agent | Purpose | Model | Category |
|
|
8
8
|
|-------|---------|-------|----------|
|
|
9
|
-
| **Orchestrator** | Master conductor that orchestrates the full development lifecycle: Planning → Implementation → Review → Recovery → Commit | Claude Opus 4.6 | orchestration |
|
|
10
|
-
| **Planner** | Autonomous planner that researches codebases and writes comprehensive TDD implementation plans | Claude Opus 4.6 | orchestration |
|
|
11
|
-
| **Implementer** | Persistent implementation agent that writes code following TDD practices until all tasks are complete | GPT-5.4 | implementation |
|
|
12
|
-
| **Frontend** | UI/UX specialist for React, styling, responsive design, and frontend implementation | Gemini 3.1 Pro (Preview) | implementation |
|
|
13
|
-
| **Refactor** | Code refactoring specialist that improves structure, readability, and maintainability | GPT-5.4 | implementation |
|
|
14
|
-
| **Debugger** | Expert debugger that diagnoses issues, traces errors, and provides solutions | Claude Opus 4.6 | diagnostics |
|
|
15
|
-
| **Security** | Security specialist that analyzes code for vulnerabilities and compliance | Claude Opus 4.6 | diagnostics |
|
|
16
|
-
| **Documenter** | Documentation specialist that creates and maintains comprehensive project documentation | GPT-5.4 | documentation |
|
|
17
|
-
| **Explorer** | Rapid codebase exploration to find files, usages, dependencies, and structural context | Gemini 3 Flash (Preview) | exploration |
|
|
18
|
-
| **Researcher-Alpha** | Primary deep research agent — also serves as default Researcher | Claude Opus 4.6 | research |
|
|
19
|
-
| **Researcher-Beta** | Research variant — pragmatic analysis with focus on trade-offs and edge cases | Claude Sonnet 4.6 | research |
|
|
20
|
-
| **Researcher-Gamma** | Research variant — broad pattern matching across domains and technologies | GPT-5.4 | research |
|
|
21
|
-
| **Researcher-Delta** | Research variant — implementation feasibility and performance implications | Gemini 3.1 Pro (Preview) | research |
|
|
22
|
-
| **Code-Reviewer-Alpha** | Primary code reviewer | GPT-5.4 | review |
|
|
23
|
-
| **Code-Reviewer-Beta** | Code reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 | review |
|
|
24
|
-
| **Architect-Reviewer-Alpha** | Primary architecture reviewer | GPT-5.4 | review |
|
|
25
|
-
| **Architect-Reviewer-Beta** | Architecture reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 | review |
|
|
9
|
+
| **Orchestrator** | Master conductor that orchestrates the full development lifecycle: Planning → Implementation → Review → Recovery → Commit | Claude Opus 4.6 (copilot) | orchestration |
|
|
10
|
+
| **Planner** | Autonomous planner that researches codebases and writes comprehensive TDD implementation plans | Claude Opus 4.6 (copilot) | orchestration |
|
|
11
|
+
| **Implementer** | Persistent implementation agent that writes code following TDD practices until all tasks are complete | GPT-5.4 (copilot) | implementation |
|
|
12
|
+
| **Frontend** | UI/UX specialist for React, styling, responsive design, and frontend implementation | Gemini 3.1 Pro (Preview) (copilot) | implementation |
|
|
13
|
+
| **Refactor** | Code refactoring specialist that improves structure, readability, and maintainability | GPT-5.4 (copilot) | implementation |
|
|
14
|
+
| **Debugger** | Expert debugger that diagnoses issues, traces errors, and provides solutions | Claude Opus 4.6 (copilot) | diagnostics |
|
|
15
|
+
| **Security** | Security specialist that analyzes code for vulnerabilities and compliance | Claude Opus 4.6 (copilot) | diagnostics |
|
|
16
|
+
| **Documenter** | Documentation specialist that creates and maintains comprehensive project documentation | GPT-5.4 (copilot) | documentation |
|
|
17
|
+
| **Explorer** | Rapid codebase exploration to find files, usages, dependencies, and structural context | Gemini 3 Flash (Preview) (copilot) | exploration |
|
|
18
|
+
| **Researcher-Alpha** | Primary deep research agent — also serves as default Researcher | Claude Opus 4.6 (copilot) | research |
|
|
19
|
+
| **Researcher-Beta** | Research variant — pragmatic analysis with focus on trade-offs and edge cases | Claude Sonnet 4.6 (copilot) | research |
|
|
20
|
+
| **Researcher-Gamma** | Research variant — broad pattern matching across domains and technologies | GPT-5.4 (copilot) | research |
|
|
21
|
+
| **Researcher-Delta** | Research variant — implementation feasibility and performance implications | Gemini 3.1 Pro (Preview) (copilot) | research |
|
|
22
|
+
| **Code-Reviewer-Alpha** | Primary code reviewer | GPT-5.4 (copilot) | review |
|
|
23
|
+
| **Code-Reviewer-Beta** | Code reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 (copilot) | review |
|
|
24
|
+
| **Architect-Reviewer-Alpha** | Primary architecture reviewer | GPT-5.4 (copilot) | review |
|
|
25
|
+
| **Architect-Reviewer-Beta** | Architecture reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 (copilot) | review |
|
|
26
26
|
|
|
27
27
|
## Multi-Model Pattern
|
|
28
28
|
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Code refactoring specialist that improves structure, readability, and maintainability'
|
|
3
3
|
argument-hint: Code, component, or pattern to refactor
|
|
4
4
|
tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, edit/createFile, edit/editFiles, edit/rename, edit/createDirectory, search/changes, search/codebase, search/usages, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: GPT-5.4 (copilot)
|
|
5
|
+
model: [GPT-5.4 (copilot), GPT-5.3-Codex (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Refactor - The Code Sculptor
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Primary deep research agent — also serves as default Researcher'
|
|
3
3
|
argument-hint: Research question, problem statement, or subsystem to investigate
|
|
4
4
|
tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: Claude Opus 4.6 (copilot)
|
|
5
|
+
model: [Claude Opus 4.6 (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Researcher-Alpha - The Context Gatherer
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Research variant — pragmatic analysis with focus on trade-offs and edge cases'
|
|
3
3
|
argument-hint: Research question, problem statement, or subsystem to investigate
|
|
4
4
|
tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: Claude Sonnet 4.6 (copilot)
|
|
5
|
+
model: [Claude Sonnet 4.6 (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Researcher-Beta - The Context Gatherer
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Research variant — implementation feasibility and performance implications'
|
|
3
3
|
argument-hint: Research question, problem statement, or subsystem to investigate
|
|
4
4
|
tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: Gemini 3.1 Pro (Preview) (copilot)
|
|
5
|
+
model: [Gemini 3.1 Pro (Preview) (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Researcher-Delta - The Context Gatherer
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Research variant — broad pattern matching across domains and technologies'
|
|
3
3
|
argument-hint: Research question, problem statement, or subsystem to investigate
|
|
4
4
|
tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: GPT-5.4 (copilot)
|
|
5
|
+
model: [GPT-5.4 (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Researcher-Gamma - The Context Gatherer
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
description: 'Security specialist that analyzes code for vulnerabilities and compliance'
|
|
3
3
|
argument-hint: Code, feature, or component to security review
|
|
4
4
|
tools: [execute/runInTerminal, read/problems, read/readFile, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
|
|
5
|
-
model: Claude Opus 4.6 (copilot)
|
|
5
|
+
model: [Claude Opus 4.6 (copilot), GPT-5.4 (copilot), Auto (copilot)]
|
|
6
6
|
---
|
|
7
7
|
|
|
8
8
|
# Security - The Vulnerability Hunter
|