@vpxa/aikit 0.1.17 → 0.1.18

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@vpxa/aikit",
3
- "version": "0.1.17",
3
+ "version": "0.1.18",
4
4
  "type": "module",
5
5
  "description": "Local-first AI developer toolkit — knowledge base, code analysis, context management, and developer tools for LLM agents",
6
6
  "license": "MIT",
@@ -1 +1 @@
1
// Removed side of the diff: the 0.1.17 build of the flow-tools module (minified).
// registerFlowTools (local name `d`) registers seven tools on the server object passed as its first
// argument: flow_list, flow_info, flow_start, flow_step, flow_status, flow_read_skill and flow_reset.
// Registry and state files are <stateDir, or <first source path>/.aikit-state>/flows/registry.json and state.json.
// In this build a builtin flow is always resolved to <workspace>/.github/flows/<basename(installPath)>,
// where <workspace> is the first source path or process.cwd(); other flows use installPath as-is.
// Every handler returns one text content item; thrown errors are logged and returned as "Error: <message>".
- import{getToolMeta as e}from"../tool-metadata.js";import{basename as t,join as n,resolve as r}from"node:path";import{z as i}from"zod";import{readFile as a}from"node:fs/promises";import{createLogger as o,serializeError as s}from"../../../core/dist/index.js";const c=o(`flow-tools`);function l(e){return{content:[{type:`text`,text:e}]}}function u(e){return e instanceof Error?e.message:String(e)}function d(o,d){let f=d.sources?.[0]?.path??process.cwd(),p=n(d.stateDir??n(d.sources[0].path,`.aikit-state`),`flows`),m=n(p,`registry.json`),h=n(p,`state.json`);function g(e,n){let i;return i=e.sourceType===`builtin`?r(f,`.github`,`flows`,t(e.installPath),n):r(e.installPath,n),i.replaceAll(`\\`,`/`)}function _(e){return e.sourceType===`builtin`?r(f,`.github`,`flows`,t(e.installPath)).replaceAll(`\\`,`/`):e.installPath.replaceAll(`\\`,`/`)}async function v(){let{FlowRegistryManager:e,FlowStateMachine:t}=await import(`../../../flows/dist/index.js`);return{registry:new e(m),stateMachine:new t(h)}}let y=e(`flow_list`);o.registerTool(`flow_list`,{title:y.title,description:`List all installed flows and their steps`,annotations:y.annotations,inputSchema:{}},async()=>{try{let{registry:e,stateMachine:t}=await v(),n=e.list(),r=t.getStatus(),i={flows:n.map(e=>({name:e.name,version:e.version,source:e.source,sourceType:e.sourceType,format:e.format,steps:e.manifest.steps.map(e=>e.id)})),activeFlow:r.success&&r.data?{flow:r.data.flow,status:r.data.status,currentStep:r.data.currentStep}:null};return l(JSON.stringify(i,null,2))}catch(e){return c.error(`flow_list failed`,s(e)),l(`Error: ${u(e)}`)}});let b=e(`flow_info`);o.registerTool(`flow_info`,{title:b.title,description:`Show detailed information about a specific flow`,annotations:b.annotations,inputSchema:{name:i.string().describe(`Flow name to get info for`)}},async({name:e})=>{try{let{registry:t}=await v(),n=t.get(e);if(!n)return l(`Flow "${e}" not found. 
Use flow_list to see available flows.`);let r={name:n.name,version:n.version,description:n.manifest.description,source:n.source,sourceType:n.sourceType,format:n.format,installPath:_(n),registeredAt:n.registeredAt,updatedAt:n.updatedAt,steps:n.manifest.steps.map(e=>({id:e.id,name:e.name,skill:g(n,e.skill),produces:e.produces,requires:e.requires,description:e.description})),agents:n.manifest.agents,artifactsDir:n.manifest.artifacts_dir,install:n.manifest.install};return l(JSON.stringify(r,null,2))}catch(e){return c.error(`flow_info failed`,s(e)),l(`Error: ${u(e)}`)}});let x=e(`flow_start`);o.registerTool(`flow_start`,{title:x.title,description:`Start a flow. Sets the active flow and positions at the first step.`,annotations:x.annotations,inputSchema:{flow:i.string().describe(`Flow name to start (use flow_list to see options)`)}},async({flow:e})=>{try{let{registry:t,stateMachine:n}=await v(),r=t.get(e);if(!r)return l(`Flow "${e}" not found. Use flow_list to see available flows.`);let i=n.start(r.name,r.manifest);if(!i.success||!i.data)return l(`Cannot start: ${i.error}`);let a=i.data,o=r.manifest.steps.find(e=>e.id===a.currentStep),s={started:!0,flow:a.flow,currentStep:a.currentStep,currentStepSkill:r&&o?g(r,o.skill):null,currentStepDescription:o?.description??null,totalSteps:r.manifest.steps.length,stepSequence:r.manifest.steps.map(e=>e.id),artifactsDir:r.manifest.artifacts_dir};return l(JSON.stringify(s,null,2))}catch(e){return c.error(`flow_start failed`,s(e)),l(`Error: ${u(e)}`)}});let S=e(`flow_step`);o.registerTool(`flow_step`,{title:S.title,description:`Advance the active flow: complete current step and move to next, skip current step, or redo current step.`,annotations:S.annotations,inputSchema:{action:i.enum([`next`,`skip`,`redo`]).describe(`next: mark current step done and advance. skip: skip current step. redo: repeat current step.`)}},async({action:e})=>{try{let{registry:t,stateMachine:n}=await v(),r=n.load();if(!r)return l(`No active flow. 
Use flow_start first.`);let i=t.get(r.flow);if(!i)return l(`Flow "${r.flow}" not found in registry.`);let a=n.step(e,i.manifest);if(!a.success||!a.data)return l(`Cannot ${e}: ${a.error}`);let o=a.data,s=o.currentStep?i.manifest.steps.find(e=>e.id===o.currentStep):null,c={flow:o.flow,status:o.status,action:e,currentStep:o.currentStep,currentStepSkill:i&&s?g(i,s.skill):null,currentStepDescription:s?.description??null,completedSteps:o.completedSteps,skippedSteps:o.skippedSteps,totalSteps:i.manifest.steps.length,remaining:i.manifest.steps.filter(e=>!o.completedSteps.includes(e.id)&&!o.skippedSteps.includes(e.id)&&e.id!==o.currentStep).map(e=>e.id)};return l(JSON.stringify(c,null,2))}catch(e){return c.error(`flow_step failed`,s(e)),l(`Error: ${u(e)}`)}});let C=e(`flow_status`);o.registerTool(`flow_status`,{title:C.title,description:`Show the current flow execution state — which flow is active, current step, completed steps, and artifacts.`,annotations:C.annotations,inputSchema:{}},async()=>{try{let{registry:e,stateMachine:t}=await v(),n=t.getStatus();if(!n.success||!n.data)return l(`No active flow. Use flow_start to begin one, or flow_list to see available flows.`);let r=n.data,i=e.get(r.flow),a=i?.manifest.steps.find(e=>e.id===r.currentStep),o=i&&a?g(i,a.skill):null,s={flow:r.flow,status:r.status,currentStep:r.currentStep,currentStepSkill:o,skillPath:o,currentStepDescription:a?.description??null,completedSteps:r.completedSteps,skippedSteps:r.skippedSteps,artifacts:r.artifacts,startedAt:r.startedAt,updatedAt:r.updatedAt,totalSteps:i?.manifest.steps.length??0,progress:i?`${r.completedSteps.length+r.skippedSteps.length}/${i.manifest.steps.length}`:`unknown`};return l(JSON.stringify(s,null,2))}catch(e){return c.error(`flow_status failed`,s(e)),l(`Error: ${u(e)}`)}});let w=e(`flow_read_skill`);o.registerTool(`flow_read_skill`,{title:w.title===`flow_read_skill`?`Flow Read Skill`:w.title,description:`Read the skill or instruction content for a flow step. 
If step is omitted, reads the current step.`,annotations:w.title===`flow_read_skill`?{readOnlyHint:!0,idempotentHint:!0}:w.annotations,inputSchema:{step:i.string().optional().describe(`Step id or name to read. Defaults to the current step.`)}},async({step:e})=>{try{let{registry:t,stateMachine:n}=await v(),r=n.getStatus();if(!r.success||!r.data)return l(`No active flow. Use flow_start to begin one, or flow_list to see available flows.`);let i=r.data,o=t.get(i.flow);if(!o)return l(`Flow "${i.flow}" not found in registry.`);let s=e??i.currentStep;if(!s)return l(`No current step is available for the active flow.`);let c=o.manifest.steps.find(e=>e.id===s||e.name===s);return l(c?await a(g(o,c.skill),`utf-8`):`Step "${s}" not found in flow "${i.flow}".`)}catch(e){return c.error(`flow_read_skill failed`,s(e)),e instanceof Error&&`code`in e&&e.code===`ENOENT`?l(`Could not read skill file: ${e.message}`):l(`Error: ${u(e)}`)}});let T=e(`flow_reset`);o.registerTool(`flow_reset`,{title:T.title,description:`Reset the active flow, clearing all state. Use to start over or switch to a different flow.`,annotations:T.annotations,inputSchema:{}},async()=>{try{let{stateMachine:e}=await v(),t=e.reset();return t.success?l(`Flow state reset. Use flow_start to begin a new flow.`):l(`Reset failed: ${t.error}`)}catch(e){return c.error(`flow_reset failed`,s(e)),l(`Error: ${u(e)}`)}})}export{d as registerFlowTools};
1
// Flow tools module (0.1.18 build), reformatted from the minified bundle.
// Registers the flow_* tools that list, inspect, start, advance, read and reset flows.
import { getToolMeta } from "../tool-metadata.js";
import { existsSync } from "node:fs";
import { basename, join, resolve } from "node:path";
import { z } from "zod";
import { readFile } from "node:fs/promises";
import { createLogger, serializeError } from "../../../core/dist/index.js";
import { homedir } from "node:os";

const log = createLogger(`flow-tools`);

// Message shared by the tools that need an active flow to do anything useful.
const NO_ACTIVE_FLOW = `No active flow. Use flow_start to begin one, or flow_list to see available flows.`;

/** Wraps plain text in the single-item content envelope every flow tool returns. */
function textResult(text) {
  return { content: [{ type: `text`, text }] };
}

/** Extracts a printable message from any thrown value. */
function errorMessage(thrown) {
  return thrown instanceof Error ? thrown.message : String(thrown);
}

/** Replaces every backslash with "/" so returned paths look the same on all platforms. */
function toPosix(path) {
  return path.replaceAll(`\\`, `/`);
}

/** Logs a failed tool call and converts the thrown value into an "Error: ..." text result. */
function failure(toolName, thrown) {
  log.error(`${toolName} failed`, serializeError(thrown));
  return textResult(`Error: ${errorMessage(thrown)}`);
}

/**
 * Registers the flow tools (flow_list, flow_info, flow_start, flow_step, flow_status,
 * flow_read_skill, flow_reset) on the given server.
 *
 * @param {object} server - Object exposing `registerTool(name, definition, handler)`.
 * @param {object} config - Reads `config.sources[0].path` (workspace root, optional) and
 *   `config.stateDir` (optional override for the state directory).
 * @returns {void}
 */
function registerFlowTools(server, config) {
  const workspaceRoot = config.sources?.[0]?.path ?? process.cwd();
  // Fall back to the already-guarded workspace root. The previous code dereferenced
  // config.sources[0].path directly here and threw a TypeError when no source was configured
  // and stateDir was unset. When a source path exists the result is unchanged.
  const flowsDir = join(config.stateDir ?? join(workspaceRoot, `.aikit-state`), `flows`);
  const registryFile = join(flowsDir, `registry.json`);
  const stateFile = join(flowsDir, `state.json`);

  /**
   * Resolves the directory a flow is installed in. Builtin flows are looked up in the
   * workspace (.github/flows) first, then in the user's home (.copilot/flows). If neither
   * exists the workspace location is still returned. Other flows use their installPath.
   */
  function resolveFlowRoot(entry) {
    if (entry.sourceType !== `builtin`) {
      return toPosix(entry.installPath);
    }
    const flowDirName = basename(entry.installPath);
    const workspaceCopy = resolve(workspaceRoot, `.github`, `flows`, flowDirName);
    if (existsSync(workspaceCopy)) {
      return toPosix(workspaceCopy);
    }
    const userCopy = resolve(homedir(), `.copilot`, `flows`, flowDirName);
    return toPosix(existsSync(userCopy) ? userCopy : workspaceCopy);
  }

  /** Resolves a step's skill file relative to the flow's install directory. */
  function resolveSkillPath(entry, skillFile) {
    return toPosix(resolve(resolveFlowRoot(entry), skillFile));
  }

  /** Loads the flows package on demand and opens the registry and state machine. */
  async function loadFlowServices() {
    const { FlowRegistryManager, FlowStateMachine } = await import(`../../../flows/dist/index.js`);
    return {
      registry: new FlowRegistryManager(registryFile),
      stateMachine: new FlowStateMachine(stateFile),
    };
  }

  const listMeta = getToolMeta(`flow_list`);
  server.registerTool(
    `flow_list`,
    {
      title: listMeta.title,
      description: `List all installed flows and their steps`,
      annotations: listMeta.annotations,
      inputSchema: {},
    },
    async () => {
      try {
        const { registry, stateMachine } = await loadFlowServices();
        const installed = registry.list();
        const status = stateMachine.getStatus();
        const payload = {
          flows: installed.map((flow) => ({
            name: flow.name,
            version: flow.version,
            source: flow.source,
            sourceType: flow.sourceType,
            format: flow.format,
            steps: flow.manifest.steps.map((step) => step.id),
          })),
          activeFlow:
            status.success && status.data
              ? {
                  flow: status.data.flow,
                  status: status.data.status,
                  currentStep: status.data.currentStep,
                }
              : null,
        };
        return textResult(JSON.stringify(payload, null, 2));
      } catch (thrown) {
        return failure(`flow_list`, thrown);
      }
    },
  );

  const infoMeta = getToolMeta(`flow_info`);
  server.registerTool(
    `flow_info`,
    {
      title: infoMeta.title,
      description: `Show detailed information about a specific flow`,
      annotations: infoMeta.annotations,
      inputSchema: { name: z.string().describe(`Flow name to get info for`) },
    },
    async ({ name }) => {
      try {
        const { registry } = await loadFlowServices();
        const entry = registry.get(name);
        if (!entry) {
          // The wrapped source left `return` alone at the end of a line, so automatic
          // semicolon insertion made this branch return undefined instead of the message.
          return textResult(`Flow "${name}" not found. Use flow_list to see available flows.`);
        }
        const payload = {
          name: entry.name,
          version: entry.version,
          description: entry.manifest.description,
          source: entry.source,
          sourceType: entry.sourceType,
          format: entry.format,
          installPath: resolveFlowRoot(entry),
          registeredAt: entry.registeredAt,
          updatedAt: entry.updatedAt,
          steps: entry.manifest.steps.map((step) => ({
            id: step.id,
            name: step.name,
            skill: resolveSkillPath(entry, step.skill),
            produces: step.produces,
            requires: step.requires,
            description: step.description,
          })),
          agents: entry.manifest.agents,
          artifactsDir: entry.manifest.artifacts_dir,
          install: entry.manifest.install,
        };
        return textResult(JSON.stringify(payload, null, 2));
      } catch (thrown) {
        return failure(`flow_info`, thrown);
      }
    },
  );

  const startMeta = getToolMeta(`flow_start`);
  server.registerTool(
    `flow_start`,
    {
      title: startMeta.title,
      description: `Start a flow. Sets the active flow and positions at the first step.`,
      annotations: startMeta.annotations,
      inputSchema: {
        flow: z.string().describe(`Flow name to start (use flow_list to see options)`),
      },
    },
    async ({ flow }) => {
      try {
        const { registry, stateMachine } = await loadFlowServices();
        const entry = registry.get(flow);
        if (!entry) {
          return textResult(`Flow "${flow}" not found. Use flow_list to see available flows.`);
        }
        const started = stateMachine.start(entry.name, entry.manifest);
        if (!started.success || !started.data) {
          return textResult(`Cannot start: ${started.error}`);
        }
        const state = started.data;
        const step = entry.manifest.steps.find((candidate) => candidate.id === state.currentStep);
        const payload = {
          started: true,
          flow: state.flow,
          currentStep: state.currentStep,
          currentStepSkill: step ? resolveSkillPath(entry, step.skill) : null,
          currentStepDescription: step?.description ?? null,
          totalSteps: entry.manifest.steps.length,
          stepSequence: entry.manifest.steps.map((candidate) => candidate.id),
          artifactsDir: entry.manifest.artifacts_dir,
        };
        return textResult(JSON.stringify(payload, null, 2));
      } catch (thrown) {
        return failure(`flow_start`, thrown);
      }
    },
  );

  const stepMeta = getToolMeta(`flow_step`);
  server.registerTool(
    `flow_step`,
    {
      title: stepMeta.title,
      description: `Advance the active flow: complete current step and move to next, skip current step, or redo current step.`,
      annotations: stepMeta.annotations,
      inputSchema: {
        // Single-line text: the wrapped source had injected a newline before "redo:".
        action: z
          .enum([`next`, `skip`, `redo`])
          .describe(
            `next: mark current step done and advance. skip: skip current step. redo: repeat current step.`,
          ),
      },
    },
    async ({ action }) => {
      try {
        const { registry, stateMachine } = await loadFlowServices();
        const active = stateMachine.load();
        if (!active) {
          return textResult(`No active flow. Use flow_start first.`);
        }
        const entry = registry.get(active.flow);
        if (!entry) {
          return textResult(`Flow "${active.flow}" not found in registry.`);
        }
        const moved = stateMachine.step(action, entry.manifest);
        if (!moved.success || !moved.data) {
          return textResult(`Cannot ${action}: ${moved.error}`);
        }
        const state = moved.data;
        const step = state.currentStep
          ? entry.manifest.steps.find((candidate) => candidate.id === state.currentStep)
          : null;
        const payload = {
          flow: state.flow,
          status: state.status,
          action,
          currentStep: state.currentStep,
          currentStepSkill: step ? resolveSkillPath(entry, step.skill) : null,
          currentStepDescription: step?.description ?? null,
          completedSteps: state.completedSteps,
          skippedSteps: state.skippedSteps,
          totalSteps: entry.manifest.steps.length,
          // Steps that are neither done, skipped, nor currently in progress.
          remaining: entry.manifest.steps
            .filter(
              (candidate) =>
                !state.completedSteps.includes(candidate.id) &&
                !state.skippedSteps.includes(candidate.id) &&
                candidate.id !== state.currentStep,
            )
            .map((candidate) => candidate.id),
        };
        return textResult(JSON.stringify(payload, null, 2));
      } catch (thrown) {
        return failure(`flow_step`, thrown);
      }
    },
  );

  const statusMeta = getToolMeta(`flow_status`);
  server.registerTool(
    `flow_status`,
    {
      title: statusMeta.title,
      description: `Show the current flow execution state — which flow is active, current step, completed steps, and artifacts.`,
      annotations: statusMeta.annotations,
      inputSchema: {},
    },
    async () => {
      try {
        const { registry, stateMachine } = await loadFlowServices();
        const status = stateMachine.getStatus();
        if (!status.success || !status.data) {
          return textResult(NO_ACTIVE_FLOW);
        }
        const state = status.data;
        // The flow may have been removed from the registry since it was started,
        // so everything derived from the registry entry is optional here.
        const entry = registry.get(state.flow);
        const step = entry?.manifest.steps.find((candidate) => candidate.id === state.currentStep);
        const skillPath = entry && step ? resolveSkillPath(entry, step.skill) : null;
        const payload = {
          flow: state.flow,
          status: state.status,
          currentStep: state.currentStep,
          currentStepSkill: skillPath,
          skillPath,
          currentStepDescription: step?.description ?? null,
          completedSteps: state.completedSteps,
          skippedSteps: state.skippedSteps,
          artifacts: state.artifacts,
          startedAt: state.startedAt,
          updatedAt: state.updatedAt,
          totalSteps: entry?.manifest.steps.length ?? 0,
          progress: entry
            ? `${state.completedSteps.length + state.skippedSteps.length}/${entry.manifest.steps.length}`
            : `unknown`,
        };
        return textResult(JSON.stringify(payload, null, 2));
      } catch (thrown) {
        return failure(`flow_status`, thrown);
      }
    },
  );

  const readMeta = getToolMeta(`flow_read_skill`);
  // When the metadata lookup only echoes the tool name back as the title, fall back to a
  // readable title and explicit read-only annotations.
  const readMetaIsPlaceholder = readMeta.title === `flow_read_skill`;
  server.registerTool(
    `flow_read_skill`,
    {
      title: readMetaIsPlaceholder ? `Flow Read Skill` : readMeta.title,
      description: `Read the skill or instruction content for a flow step. If step is omitted, reads the current step.`,
      annotations: readMetaIsPlaceholder
        ? { readOnlyHint: true, idempotentHint: true }
        : readMeta.annotations,
      inputSchema: {
        step: z
          .string()
          .optional()
          .describe(`Step id or name to read. Defaults to the current step.`),
      },
    },
    async ({ step }) => {
      try {
        const { registry, stateMachine } = await loadFlowServices();
        const status = stateMachine.getStatus();
        if (!status.success || !status.data) {
          return textResult(NO_ACTIVE_FLOW);
        }
        const state = status.data;
        const entry = registry.get(state.flow);
        if (!entry) {
          return textResult(`Flow "${state.flow}" not found in registry.`);
        }
        const wanted = step ?? state.currentStep;
        if (!wanted) {
          return textResult(`No current step is available for the active flow.`);
        }
        const match = entry.manifest.steps.find(
          (candidate) => candidate.id === wanted || candidate.name === wanted,
        );
        if (!match) {
          return textResult(`Step "${wanted}" not found in flow "${state.flow}".`);
        }
        return textResult(await readFile(resolveSkillPath(entry, match.skill), `utf-8`));
      } catch (thrown) {
        // A missing skill file gets a dedicated message; everything else is a generic error.
        if (thrown instanceof Error && `code` in thrown && thrown.code === `ENOENT`) {
          log.error(`flow_read_skill failed`, serializeError(thrown));
          return textResult(`Could not read skill file: ${thrown.message}`);
        }
        return failure(`flow_read_skill`, thrown);
      }
    },
  );

  const resetMeta = getToolMeta(`flow_reset`);
  server.registerTool(
    `flow_reset`,
    {
      title: resetMeta.title,
      description: `Reset the active flow, clearing all state. Use to start over or switch to a different flow.`,
      annotations: resetMeta.annotations,
      inputSchema: {},
    },
    async () => {
      try {
        const { stateMachine } = await loadFlowServices();
        const outcome = stateMachine.reset();
        return outcome.success
          ? textResult(`Flow state reset. Use flow_start to begin a new flow.`)
          : textResult(`Reset failed: ${outcome.error}`);
      } catch (thrown) {
        return failure(`flow_reset`, thrown);
      }
    },
  );
}

export { registerFlowTools };
@@ -1 +1 @@
1
// Removed side of the diff: the 0.1.17 build of the version-check module (minified).
// Exports:
//   getCurrentVersion   - reads `version` from the package.json three directories above this file; "0.0.0" on failure.
//   checkForUpdates     - fetches the latest @vpxa/aikit metadata from the npm registry (5 s timeout) and logs a
//                         warning when the registry version compares higher; fetch errors are ignored.
//   getUpgradeState     - returns { state, error } for the auto-upgrade run.
//   autoUpgradeScaffold - when the user (~/.copilot) or workspace (.github) scaffold version differs from the
//                         server version, runs `<node> bin/aikit.mjs upgrade` with a 30 s timeout; state starts at
//                         "idle" and moves to "pending", then to "success" or "failed".
- import{existsSync as e,readFileSync as t}from"node:fs";import{dirname as n,resolve as r}from"node:path";import{fileURLToPath as i}from"node:url";import{createLogger as a}from"../../core/dist/index.js";import{execFile as o}from"node:child_process";import{homedir as s}from"node:os";const c=a(`server`);function l(){let e=r(n(i(import.meta.url)),`..`,`..`,`..`,`package.json`);try{return JSON.parse(t(e,`utf-8`)).version??`0.0.0`}catch{return`0.0.0`}}function u(e,t){let n=e.split(`.`).map(Number),r=t.split(`.`).map(Number);for(let e=0;e<3;e++){let t=(n[e]??0)-(r[e]??0);if(t!==0)return t>0?1:-1}return 0}function d(){let e=l();fetch(`https://registry.npmjs.org/@vpxa/aikit/latest`,{signal:AbortSignal.timeout(5e3)}).then(e=>{if(e.ok)return e.json()}).then(t=>{if(!t||typeof t!=`object`)return;let n=t.version;n&&u(e,n)<0&&c.warn(`Update available`,{currentVersion:e,latestVersion:n,updateCommand:`aikit upgrade`})}).catch(()=>{})}function f(){try{let n=r(s(),`.copilot`,`.aikit-scaffold.json`);return e(n)?JSON.parse(t(n,`utf-8`)).version??null:null}catch{return null}}function p(){try{let n=r(process.cwd(),`.github`,`.aikit-scaffold.json`);return e(n)?JSON.parse(t(n,`utf-8`)).version??null:null}catch{return null}}let m=`idle`,h=null;function g(){return{state:m,error:h}}function _(){try{let t=l(),a=f(),s=p();if(!(a!=null&&a!==t)&&!(s!=null&&s!==t)||m===`pending`||m===`success`)return;m=`pending`,h=null,c.info(`Scaffold version mismatch — auto-upgrading`,{serverVersion:t,userScaffoldVersion:a,workspaceScaffoldVersion:s});let u=r(n(i(import.meta.url)),`..`,`..`,`..`,`bin`,`aikit.mjs`);if(!e(u)){m=`failed`,h=`aikit CLI binary not found at ${u}`,c.warn(`Cannot auto-upgrade: aikit CLI binary not found`,{binPath:u});return}o(process.execPath,[u,`upgrade`],{timeout:3e4,windowsHide:!0},(e,t,n)=>{e?(m=`failed`,h=e.message,c.warn(`Auto-upgrade failed`,{error:e.message,stderr:n?.slice(0,500)})):(m=`success`,h=null,c.info(`Auto-upgrade complete`))}).unref()}catch(e){m=`failed`,h=e instanceof 
Error?e.message:String(e),c.warn(`Auto-upgrade check failed`,{error:h})}}export{_ as autoUpgradeScaffold,d as checkForUpdates,l as getCurrentVersion,g as getUpgradeState};
1
// Version-check module (0.1.18 build), reformatted from the minified bundle.
// Reports the installed version, warns about newer registry releases, and re-runs
// `aikit upgrade` when scaffold files were generated by a different version.
import { existsSync, readFileSync } from "node:fs";
import { dirname, resolve } from "node:path";
import { fileURLToPath } from "node:url";
import { createLogger } from "../../core/dist/index.js";
import { homedir } from "node:os";
import { execFile } from "node:child_process";

const log = createLogger(`server`);

/**
 * Reads the package version from the package.json three directories above this file.
 * @returns {string} The declared version, or "0.0.0" when it is missing or unreadable.
 */
function getCurrentVersion() {
  const manifestPath = resolve(
    dirname(fileURLToPath(import.meta.url)),
    `..`,
    `..`,
    `..`,
    `package.json`,
  );
  try {
    const manifest = JSON.parse(readFileSync(manifestPath, `utf-8`));
    return manifest.version ?? `0.0.0`;
  } catch {
    return `0.0.0`;
  }
}

/**
 * Compares the first three dot-separated numeric parts of two version strings.
 * @returns {number} 1 when `left` is higher, -1 when it is not equal and not higher, 0 when equal.
 */
function compareVersions(left, right) {
  const leftParts = left.split(`.`).map(Number);
  const rightParts = right.split(`.`).map(Number);
  for (const index of [0, 1, 2]) {
    const delta = (leftParts[index] ?? 0) - (rightParts[index] ?? 0);
    if (delta !== 0) {
      return delta > 0 ? 1 : -1;
    }
  }
  return 0;
}

/**
 * Fire-and-forget check against the npm registry; logs a warning when a newer version
 * is published. Network and parsing failures are deliberately ignored.
 */
function checkForUpdates() {
  const currentVersion = getCurrentVersion();

  const parseBody = (response) => {
    if (response.ok) {
      return response.json();
    }
  };

  const reportIfNewer = (body) => {
    if (!body || typeof body !== `object`) {
      return;
    }
    const latestVersion = body.version;
    if (latestVersion && compareVersions(currentVersion, latestVersion) < 0) {
      log.warn(`Update available`, {
        currentVersion,
        latestVersion,
        updateCommand: `aikit upgrade`,
      });
    }
  };

  fetch(`https://registry.npmjs.org/@vpxa/aikit/latest`, { signal: AbortSignal.timeout(5e3) })
    .then(parseBody)
    .then(reportIfNewer)
    .catch(() => {});
}

/** Version recorded in ~/.copilot/.aikit-scaffold.json, or null when absent or unreadable. */
function readUserScaffoldVersion() {
  try {
    const markerPath = resolve(homedir(), `.copilot`, `.aikit-scaffold.json`);
    if (!existsSync(markerPath)) {
      return null;
    }
    return JSON.parse(readFileSync(markerPath, `utf-8`)).version ?? null;
  } catch {
    return null;
  }
}

/** Version recorded in <cwd>/.github/.aikit-scaffold.json, or null when absent or unreadable. */
function readWorkspaceScaffoldVersion() {
  try {
    const markerPath = resolve(process.cwd(), `.github`, `.aikit-scaffold.json`);
    if (!existsSync(markerPath)) {
      return null;
    }
    return JSON.parse(readFileSync(markerPath, `utf-8`)).version ?? null;
  } catch {
    return null;
  }
}

// Auto-upgrade progress: "idle" → "pending" → "success" | "failed".
let upgradeState = `idle`;
let upgradeError = null;

/** @returns {{state: string, error: (string|null)}} Snapshot of the auto-upgrade progress. */
function getUpgradeState() {
  return { state: upgradeState, error: upgradeError };
}

/**
 * Starts `aikit upgrade` in a child process when either scaffold marker records a version
 * different from the running server. Does nothing when both markers match or are missing,
 * or when an upgrade is already pending or has succeeded.
 */
function autoUpgradeScaffold() {
  try {
    const serverVersion = getCurrentVersion();
    const userScaffoldVersion = readUserScaffoldVersion();
    const workspaceScaffoldVersion = readWorkspaceScaffoldVersion();

    const userIsStale = userScaffoldVersion != null && userScaffoldVersion !== serverVersion;
    const workspaceIsStale =
      workspaceScaffoldVersion != null && workspaceScaffoldVersion !== serverVersion;
    if (!userIsStale && !workspaceIsStale) {
      return;
    }
    if (upgradeState === `pending` || upgradeState === `success`) {
      return;
    }

    upgradeState = `pending`;
    upgradeError = null;
    log.info(`Scaffold version mismatch — auto-upgrading`, {
      serverVersion,
      userScaffoldVersion,
      workspaceScaffoldVersion,
    });

    const binPath = resolve(
      dirname(fileURLToPath(import.meta.url)),
      `..`,
      `..`,
      `..`,
      `bin`,
      `aikit.mjs`,
    );
    if (!existsSync(binPath)) {
      upgradeState = `failed`;
      upgradeError = `aikit CLI binary not found at ${binPath}`;
      log.warn(`Cannot auto-upgrade: aikit CLI binary not found`, { binPath });
      return;
    }

    const child = execFile(
      process.execPath,
      [binPath, `upgrade`],
      { timeout: 3e4, windowsHide: true },
      (error, _stdout, stderr) => {
        if (error) {
          upgradeState = `failed`;
          upgradeError = error.message;
          log.warn(`Auto-upgrade failed`, {
            error: error.message,
            stderr: stderr?.slice(0, 500),
          });
          return;
        }
        upgradeState = `success`;
        upgradeError = null;
        log.info(`Auto-upgrade complete`);
      },
    );
    // Do not keep the server process alive just for the upgrade child.
    child.unref();
  } catch (thrown) {
    upgradeState = `failed`;
    upgradeError = thrown instanceof Error ? thrown.message : String(thrown);
    log.warn(`Auto-upgrade check failed`, { error: upgradeError });
  }
}

export {
  autoUpgradeScaffold,
  checkForUpdates,
  getCurrentVersion,
  getUpgradeState,
};
@@ -64,8 +64,14 @@ function buildToolsYaml(toolRole) {
64
64
  }
65
65
 
66
66
  // copilotModel(agentName): looks up MODELS[agentName] and returns the model value for that agent.
  // Removed (-) lines: the single model name suffixed with " (copilot)", or 'Claude Opus 4.6 (copilot)'
  // when the agent has no entry.
  // Added (+) lines: 'Auto (copilot)' when the entry is missing or an empty array; the sole element of a
  // one-element array; "[a, b, ...]" (elements joined with ", ") for longer arrays; a non-array entry as-is.
  function copilotModel(agentName) {
67
- const base = MODELS[agentName];
68
- return base ? `${base} (copilot)` : 'Claude Opus 4.6 (copilot)';
67
+ const models = MODELS[agentName];
68
+ if (!models) return 'Auto (copilot)';
69
+ if (Array.isArray(models)) {
70
+ if (models.length === 0) return 'Auto (copilot)';
71
+ if (models.length === 1) return models[0];
72
+ return `[${models.join(', ')}]`;
73
+ }
74
+ return models;
69
75
  }
70
76
 
71
77
  const FLOWS_SECTION = [
@@ -84,13 +90,15 @@ function buildAgentTable() {
84
90
  if (def.variants) {
85
91
  for (const suffix of VARIANT_GROUPS[name] || []) {
86
92
  const fullName = `${name}-${suffix}`;
87
- const model = MODELS[fullName] || 'Unknown';
93
+ const models = MODELS[fullName] || MODELS[name];
94
+ const model = Array.isArray(models) ? models[0] : models || 'Unknown';
88
95
  const varDef = def.variants[suffix] || {};
89
96
  const desc = varDef.description || def.description;
90
97
  rows.push(`| **${fullName}** | ${desc} | ${model} | ${def.category} |`);
91
98
  }
92
99
  } else {
93
- const model = MODELS[name] || 'Unknown';
100
+ const models = MODELS[name];
101
+ const model = Array.isArray(models) ? models[0] : models || 'Unknown';
94
102
  rows.push(`| **${name}** | ${def.description} | ${model} | ${def.category} |`);
95
103
  }
96
104
  }
@@ -40,26 +40,43 @@ ${agentTable}
40
40
  3. After review: \`evidence_map({ action: "gate", task_id })\` → YIELD/HOLD/HARD_BLOCK
41
41
  4. Auto-upgrade tier if unknowns reveal contract/security issues
42
42
 
43
- ## Workflow
43
+ ## Flow-Driven Development
44
44
 
45
- ### Phase 1: Planning
46
- 1. Read onboard artifacts → parse goal → identify affected subsystems → \`forge_classify\`
47
- 2. Research: <5 files direct, 5-15 Explorer→Researcher, >15 multiple parallel
48
- 3. Draft plan: 3-10 phases, agent assignments, TDD steps, dependency graph
49
- 4. Batch independent phases for parallel execution
50
- 5. **🛑 STOP — user approval required**
45
+ Orchestrator uses the flow system for structured development. Flows define the step sequence — Orchestrator adds multi-agent orchestration, quality gates, and review protocols on top.
51
46
 
52
- ### Phase 2: Implementation Cycle
47
+ ### Flow Selection
53
48
 
54
- **🚨 PRE-DISPATCH GATE — complete ALL before ANY \`runSubagent\` call:**
49
+ | Situation | Flow | Steps |
50
+ |-----------|------|-------|
51
+ | Bug fix, small feature, refactoring | \`aikit:basic\` | assess → implement → verify |
52
+ | New feature, major change, multi-file | \`aikit:advanced\` | spec → plan → task → execute → verify |
53
+ | Custom/specialized work | Check \`flow_list\` | Follow flow-specific steps |
55
54
 
56
- 1. \`multi-agents-development\` skill loaded? (Bootstrap step 4 — if not, load NOW)
57
- 2. ✅ Task decomposition table produced? (show user: task → files → agent → parallel batch)
58
- 3. ✅ Independence Check passed per pair? (shared files? shared state? ordering dependency? → must be "No" for parallel)
59
- 4. ✅ Each task ≤ 3 files? (if not, split further)
60
- 5. ✅ Parallel batches identified? (tasks with no dependencies MUST be in same batch)
55
+ **If multiple flows could apply and the user hasn't specified one, ask the user to choose.**
61
56
 
62
- **Decomposition output format** (show this to user before dispatching):
57
+ ### Session Start Flow Check
58
+
59
+ 1. \`flow_status\` — check for active flow
60
+ 2. If active:
61
+ - Note current step name and skill path
62
+ - Read the current step skill with \`flow_read_skill\`
63
+ - Follow its instructions
64
+ - When complete: \`flow_step({ action: 'next' })\`
65
+ 3. If no active flow:
66
+ - \`flow_list\` — check ALL available flows (builtin + custom)
67
+ - Recommend appropriate flow based on task scope
68
+ - \`flow_start({ flow: '<name>' })\` after user confirms
69
+
70
+ ### Orchestrator Protocols (apply during ALL flow steps)
71
+
72
+ **PRE-DISPATCH GATE — complete ALL before ANY \`runSubagent\` call:**
73
+ 1. ✅ \`multi-agents-development\` skill loaded?
74
+ 2. ✅ Task decomposition table produced?
75
+ 3. ✅ Independence Check passed per pair?
76
+ 4. ✅ Each task ≤ 3 files?
77
+ 5. ✅ Parallel batches identified?
78
+
79
+ **Decomposition output format:**
63
80
 
64
81
  \`\`\`
65
82
  Batch 1 (parallel):
@@ -69,23 +86,35 @@ Batch 2 (after batch 1):
69
86
  Task C: [agent] → [file5] — [goal] (depends on A)
70
87
  \`\`\`
71
88
 
72
- **Prompt every subagent with** (use \`multi-agents-development\` skill templates):
73
- 1. **Scope** — exact files to touch + boundary (do NOT touch)
89
+ **Subagent prompt template:**
90
+ 1. **Scope** — exact files + boundary
74
91
  2. **Goal** — acceptance criteria, testable
75
- 3. **Arch Context** — paste actual code snippets from \`compact()\`/\`digest()\`
76
- 4. **Constraints** — patterns, conventions, anti-patterns
92
+ 3. **Arch Context** — code snippets from \`compact()\`/\`digest()\`
93
+ 4. **Constraints** — patterns, conventions
77
94
  5. **FORGE** — tier + evidence requirements
78
95
  6. **Self-Review** — checklist before declaring status
79
96
 
80
- **Subagent status protocol**: \`DONE\` | \`DONE_WITH_CONCERNS\` | \`NEEDS_CONTEXT\` | \`BLOCKED\`
97
+ **Subagent status protocol:** \`DONE\` | \`DONE_WITH_CONCERNS\` | \`NEEDS_CONTEXT\` | \`BLOCKED\`
81
98
 
82
- **Per-batch flow**: Dispatch (parallel) → Spec Review → Code Quality Review (Alpha+Beta parallel) → Arch Review (if boundary changes) → Security (if applicable) → \`evidence_map\` gate → **🛑 STOP — present commit message**
99
+ **Additional Orchestrator requirements during flow execution:**
100
+ - Apply the PRE-DISPATCH GATE before any subagent dispatch, regardless of flow
101
+ - Apply FORGE at classification and verification points; pass tier/evidence expectations into subagents and gate with \`evidence_map\`
102
+ - Enforce delegation rules at all times — Orchestrator never implements code directly
103
+ - Use the subagent prompt template for every dispatch so step-specific flow instructions are grounded in actual code context
83
104
 
84
- ### Phase 3: Completion
85
- 1. Optional: Refactor pass (separate commit)
86
- 2. Documenter for docs updates
87
- 3. \`remember\` all decisions, patterns, gotchas, conventions
88
- 4. \`reindex({})\` + \`produce_knowledge({ path: "." })\`
105
+ **Per-step review cycle:** Dispatch → Code Review (Alpha+Beta) → Arch Review (if boundary changes) → Security (if applicable) → \`evidence_map\` gate → **🛑 STOP — present results**
106
+
107
+ ### Flow MCP Tools
108
+
109
+ | Tool | Purpose |
110
+ |------|---------|
111
+ | \`flow_list\` | List installed flows and active flow |
112
+ | \`flow_info\` | Get detailed flow info including steps |
113
+ | \`flow_start\` | Start a named flow |
114
+ | \`flow_step\` | Advance: next, skip, or redo current step |
115
+ | \`flow_status\` | Check current execution state |
116
+ | \`flow_reset\` | Clear flow state to start over |
117
+ | \`flow_read_skill\` | Read the skill content for the current step |
89
118
 
90
119
  ## Emergency: STOP → ASSESS → CONTAIN → RECOVER → DOCUMENT
91
120
 
@@ -228,6 +257,17 @@ At session start, check for an active flow:
228
257
  5. **Dependency Graph** — For each phase, list dependencies. Group into parallel batches
229
258
  6. **Present** — Show plan with open questions, complexity estimate, parallel batch layout
230
259
 
260
+ ## Flow Integration
261
+
262
+ When activated as part of a flow (e.g., \`aikit:advanced\` plan step or \`aikit:basic\` assess step):
263
+ 1. Check \`flow_status\` for current step context
264
+ 2. Read the step's skill file for specific instructions
265
+ 3. Follow skill instructions while applying Planner methodology
266
+ 4. Produce required artifacts (as specified by the flow step's \`produces\` field)
267
+ 5. When complete, report to Orchestrator (do NOT call \`flow_step\` — let Orchestrator advance)
268
+
269
+ When no flow is active, operate autonomously following normal Planner methodology.
270
+
231
271
  ## Subagent Output Relay
232
272
 
233
273
  When subagents complete, their visual outputs (from \`present\`) are NOT visible to the user.
@@ -11,29 +11,44 @@
11
11
 
12
12
  // MODELS maps an agent name (or an "<Agent>-<Variant>" name) to its model setting.
  // Removed (-) lines hold one bare model name per agent.
  // Added (+) lines hold an array of model names that already carry the " (copilot)" suffix;
  // every array ends with 'Auto (copilot)'.
  // NOTE(review): array order looks like a preference/fallback order — confirm against the consumer.
  export const MODELS = {
13
13
  // ─── Single-role agents ───────────────────────────────────────────────
14
- Orchestrator: 'Claude Opus 4.6',
15
- Planner: 'Claude Opus 4.6',
16
- Implementer: 'GPT-5.4',
17
- Frontend: 'Gemini 3.1 Pro (Preview)',
18
- Debugger: 'Claude Opus 4.6',
19
- Refactor: 'GPT-5.4',
20
- Security: 'Claude Opus 4.6',
21
- Documenter: 'GPT-5.4',
22
- Explorer: 'Gemini 3 Flash (Preview)',
14
+ Orchestrator: ['Claude Opus 4.6 (copilot)', 'GPT-5.4 (copilot)', 'Auto (copilot)'],
15
+ Planner: ['Claude Opus 4.6 (copilot)', 'GPT-5.4 (copilot)', 'Auto (copilot)'],
16
+ Implementer: [
17
+ 'GPT-5.4 (copilot)',
18
+ 'Gemini 3.1 Pro (Preview) (copilot)',
19
+ 'GPT-5.3-Codex (copilot)',
20
+ 'Auto (copilot)',
21
+ ],
22
+ Frontend: [
23
+ 'Gemini 3.1 Pro (Preview) (copilot)',
24
+ 'GPT-5.4 (copilot)',
25
+ 'GPT-5.3-Codex (copilot)',
26
+ 'Auto (copilot)',
27
+ ],
28
+ Debugger: [
29
+ 'Claude Opus 4.6 (copilot)',
30
+ 'GPT-5.4 (copilot)',
31
+ 'GPT-5.3-Codex (copilot)',
32
+ 'Auto (copilot)',
33
+ ],
34
+ Refactor: ['GPT-5.4 (copilot)', 'GPT-5.3-Codex (copilot)', 'Auto (copilot)'],
35
+ Security: ['Claude Opus 4.6 (copilot)', 'GPT-5.4 (copilot)', 'Auto (copilot)'],
36
+ Documenter: ['GPT-5.4 (copilot)', 'Gemini 3.1 Pro (Preview) (copilot)', 'Auto (copilot)'],
37
+ Explorer: ['Gemini 3 Flash (Preview) (copilot)', 'Claude Haiku 4.5 (copilot)', 'Auto (copilot)'],
23
38
 
24
39
  // ─── Researcher variants (4 models for multi-model decision protocol) ────────────
25
- 'Researcher-Alpha': 'Claude Opus 4.6',
26
- 'Researcher-Beta': 'Claude Sonnet 4.6',
27
- 'Researcher-Gamma': 'GPT-5.4',
28
- 'Researcher-Delta': 'Gemini 3.1 Pro (Preview)',
40
+ 'Researcher-Alpha': ['Claude Opus 4.6 (copilot)', 'Auto (copilot)'],
41
+ 'Researcher-Beta': ['Claude Sonnet 4.6 (copilot)', 'Auto (copilot)'],
42
+ 'Researcher-Gamma': ['GPT-5.4 (copilot)', 'Auto (copilot)'],
43
+ 'Researcher-Delta': ['Gemini 3.1 Pro (Preview) (copilot)', 'Auto (copilot)'],
29
44
 
30
45
  // ─── Code-Reviewer variants (2 models for dual review) ───────────────
31
- 'Code-Reviewer-Alpha': 'GPT-5.4',
32
- 'Code-Reviewer-Beta': 'Claude Opus 4.6',
46
+ 'Code-Reviewer-Alpha': ['GPT-5.4 (copilot)', 'Auto (copilot)'],
47
+ 'Code-Reviewer-Beta': ['Claude Opus 4.6 (copilot)', 'Auto (copilot)'],
33
48
 
34
49
  // ─── Architect-Reviewer variants (2 models for dual review) ──────────
35
- 'Architect-Reviewer-Alpha': 'GPT-5.4',
36
- 'Architect-Reviewer-Beta': 'Claude Opus 4.6',
50
+ 'Architect-Reviewer-Alpha': ['GPT-5.4 (copilot)', 'Auto (copilot)'],
51
+ 'Architect-Reviewer-Beta': ['Claude Opus 4.6 (copilot)', 'Auto (copilot)'],
37
52
  };
38
53
 
39
54
  /**
@@ -2,7 +2,7 @@
2
2
  description: 'Primary architecture reviewer'
3
3
  argument-hint: Files, PR, or subsystem to architecture-review
4
4
  tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: GPT-5.4 (copilot)
5
+ model: [GPT-5.4 (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Architect-Reviewer-Alpha - The Structural Guardian
@@ -2,7 +2,7 @@
2
2
  description: 'Architecture reviewer variant — different LLM perspective for dual review'
3
3
  argument-hint: Files, PR, or subsystem to architecture-review
4
4
  tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: Claude Opus 4.6 (copilot)
5
+ model: [Claude Opus 4.6 (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Architect-Reviewer-Beta - The Structural Guardian
@@ -2,7 +2,7 @@
2
2
  description: 'Primary code reviewer'
3
3
  argument-hint: File path, PR, or code to review
4
4
  tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: GPT-5.4 (copilot)
5
+ model: [GPT-5.4 (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Code-Reviewer-Alpha - The Quality Guardian
@@ -2,7 +2,7 @@
2
2
  description: 'Code reviewer variant — different LLM perspective for dual review'
3
3
  argument-hint: File path, PR, or code to review
4
4
  tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: Claude Opus 4.6 (copilot)
5
+ model: [Claude Opus 4.6 (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Code-Reviewer-Beta - The Quality Guardian
@@ -2,7 +2,7 @@
2
2
  description: 'Expert debugger that diagnoses issues, traces errors, and provides solutions'
3
3
  argument-hint: Error message, stack trace, or description of issue
4
4
  tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalSelection, read/terminalLastCommand, agent/runSubagent, edit/createFile, edit/editFiles, search/changes, search/codebase, search/usages, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: Claude Opus 4.6 (copilot)
5
+ model: [Claude Opus 4.6 (copilot), GPT-5.4 (copilot), GPT-5.3-Codex (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Debugger - The Problem Solver
@@ -2,7 +2,7 @@
2
2
  description: 'Documentation specialist that creates and maintains comprehensive project documentation'
3
3
  argument-hint: Component, API, feature, or area to document
4
4
  tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, edit/createFile, edit/editFiles, edit/rename, edit/createDirectory, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: GPT-5.4 (copilot)
5
+ model: [GPT-5.4 (copilot), Gemini 3.1 Pro (Preview) (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Documenter - The Knowledge Keeper
@@ -2,7 +2,7 @@
2
2
  description: 'Rapid codebase exploration to find files, usages, dependencies, and structural context'
3
3
  argument-hint: Find files, usages, and context related to: {topic or goal}
4
4
  tools: [read/problems, read/readFile, search/changes, search/codebase, search/usages, search/fileSearch, search/listDirectory, search/textSearch, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: Gemini 3 Flash (Preview) (copilot)
5
+ model: [Gemini 3 Flash (Preview) (copilot), Claude Haiku 4.5 (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Explorer - The Rapid Scout
@@ -2,7 +2,7 @@
2
2
  description: 'UI/UX specialist for React, styling, responsive design, and frontend implementation'
3
3
  argument-hint: UI component, styling task, or frontend feature
4
4
  tools: [execute/createAndRunTask, execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, edit/createFile, edit/editFiles, edit/rename, edit/createDirectory, search/changes, search/codebase, search/usages, todo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: Gemini 3.1 Pro (Preview) (copilot)
5
+ model: [Gemini 3.1 Pro (Preview) (copilot), GPT-5.4 (copilot), GPT-5.3-Codex (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Frontend - The UI Specialist
@@ -2,7 +2,7 @@
2
2
  description: 'Persistent implementation agent that writes code following TDD practices until all tasks are complete'
3
3
  argument-hint: Implementation task, feature, or phase from plan
4
4
  tools: [execute/createAndRunTask, execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, edit/createFile, edit/editFiles, edit/rename, edit/createDirectory, search/changes, search/codebase, search/usages, todo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: GPT-5.4 (copilot)
5
+ model: [GPT-5.4 (copilot), Gemini 3.1 Pro (Preview) (copilot), GPT-5.3-Codex (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Implementer - The Code Builder
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  description: 'Master conductor that orchestrates the full development lifecycle: Planning → Implementation → Review → Recovery → Commit'
3
3
  tools: [vscode/memory, vscode/runCommand, vscode/switchAgent, execute/killTerminal, execute/createAndRunTask, execute/runInTerminal, read/terminalSelection, read/terminalLastCommand, read/problems, read/readFile, agent/runSubagent, edit/createFile, edit/editFiles, edit/rename, edit/createDirectory, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, todo, search/searchSubagent, search/textSearch, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, vscode/askQuestions, vscode/resolveMemoryFileUri, aikit/*]
4
- model: Claude Opus 4.6 (copilot)
4
+ model: [Claude Opus 4.6 (copilot), GPT-5.4 (copilot), Auto (copilot)]
5
5
  ---
6
6
 
7
7
  # Orchestrator - The Master Conductor
@@ -21,23 +21,23 @@ You orchestrate the full development lifecycle: **planning → implementation
21
21
 
22
22
  | Agent | Purpose | Model | Category |
23
23
  |-------|---------|-------|----------|
24
- | **Orchestrator** | Master conductor that orchestrates the full development lifecycle: Planning → Implementation → Review → Recovery → Commit | Claude Opus 4.6 | orchestration |
25
- | **Planner** | Autonomous planner that researches codebases and writes comprehensive TDD implementation plans | Claude Opus 4.6 | orchestration |
26
- | **Implementer** | Persistent implementation agent that writes code following TDD practices until all tasks are complete | GPT-5.4 | implementation |
27
- | **Frontend** | UI/UX specialist for React, styling, responsive design, and frontend implementation | Gemini 3.1 Pro (Preview) | implementation |
28
- | **Refactor** | Code refactoring specialist that improves structure, readability, and maintainability | GPT-5.4 | implementation |
29
- | **Debugger** | Expert debugger that diagnoses issues, traces errors, and provides solutions | Claude Opus 4.6 | diagnostics |
30
- | **Security** | Security specialist that analyzes code for vulnerabilities and compliance | Claude Opus 4.6 | diagnostics |
31
- | **Documenter** | Documentation specialist that creates and maintains comprehensive project documentation | GPT-5.4 | documentation |
32
- | **Explorer** | Rapid codebase exploration to find files, usages, dependencies, and structural context | Gemini 3 Flash (Preview) | exploration |
33
- | **Researcher-Alpha** | Primary deep research agent — also serves as default Researcher | Claude Opus 4.6 | research |
34
- | **Researcher-Beta** | Research variant — pragmatic analysis with focus on trade-offs and edge cases | Claude Sonnet 4.6 | research |
35
- | **Researcher-Gamma** | Research variant — broad pattern matching across domains and technologies | GPT-5.4 | research |
36
- | **Researcher-Delta** | Research variant — implementation feasibility and performance implications | Gemini 3.1 Pro (Preview) | research |
37
- | **Code-Reviewer-Alpha** | Primary code reviewer | GPT-5.4 | review |
38
- | **Code-Reviewer-Beta** | Code reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 | review |
39
- | **Architect-Reviewer-Alpha** | Primary architecture reviewer | GPT-5.4 | review |
40
- | **Architect-Reviewer-Beta** | Architecture reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 | review |
24
+ | **Orchestrator** | Master conductor that orchestrates the full development lifecycle: Planning → Implementation → Review → Recovery → Commit | Claude Opus 4.6 (copilot) | orchestration |
25
+ | **Planner** | Autonomous planner that researches codebases and writes comprehensive TDD implementation plans | Claude Opus 4.6 (copilot) | orchestration |
26
+ | **Implementer** | Persistent implementation agent that writes code following TDD practices until all tasks are complete | GPT-5.4 (copilot) | implementation |
27
+ | **Frontend** | UI/UX specialist for React, styling, responsive design, and frontend implementation | Gemini 3.1 Pro (Preview) (copilot) | implementation |
28
+ | **Refactor** | Code refactoring specialist that improves structure, readability, and maintainability | GPT-5.4 (copilot) | implementation |
29
+ | **Debugger** | Expert debugger that diagnoses issues, traces errors, and provides solutions | Claude Opus 4.6 (copilot) | diagnostics |
30
+ | **Security** | Security specialist that analyzes code for vulnerabilities and compliance | Claude Opus 4.6 (copilot) | diagnostics |
31
+ | **Documenter** | Documentation specialist that creates and maintains comprehensive project documentation | GPT-5.4 (copilot) | documentation |
32
+ | **Explorer** | Rapid codebase exploration to find files, usages, dependencies, and structural context | Gemini 3 Flash (Preview) (copilot) | exploration |
33
+ | **Researcher-Alpha** | Primary deep research agent — also serves as default Researcher | Claude Opus 4.6 (copilot) | research |
34
+ | **Researcher-Beta** | Research variant — pragmatic analysis with focus on trade-offs and edge cases | Claude Sonnet 4.6 (copilot) | research |
35
+ | **Researcher-Gamma** | Research variant — broad pattern matching across domains and technologies | GPT-5.4 (copilot) | research |
36
+ | **Researcher-Delta** | Research variant — implementation feasibility and performance implications | Gemini 3.1 Pro (Preview) (copilot) | research |
37
+ | **Code-Reviewer-Alpha** | Primary code reviewer | GPT-5.4 (copilot) | review |
38
+ | **Code-Reviewer-Beta** | Code reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 (copilot) | review |
39
+ | **Architect-Reviewer-Alpha** | Primary architecture reviewer | GPT-5.4 (copilot) | review |
40
+ | **Architect-Reviewer-Beta** | Architecture reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 (copilot) | review |
41
41
 
42
42
  **Parallelism**: Read-only agents run in parallel freely. File-modifying agents run in parallel ONLY on completely different files. Max 4 concurrent file-modifying agents.
43
43
 
@@ -57,26 +57,43 @@ You orchestrate the full development lifecycle: **planning → implementation
57
57
  3. After review: `evidence_map({ action: "gate", task_id })` → YIELD/HOLD/HARD_BLOCK
58
58
  4. Auto-upgrade tier if unknowns reveal contract/security issues
59
59
 
60
- ## Workflow
60
+ ## Flow-Driven Development
61
61
 
62
- ### Phase 1: Planning
63
- 1. Read onboard artifacts → parse goal → identify affected subsystems → `forge_classify`
64
- 2. Research: <5 files direct, 5-15 Explorer→Researcher, >15 multiple parallel
65
- 3. Draft plan: 3-10 phases, agent assignments, TDD steps, dependency graph
66
- 4. Batch independent phases for parallel execution
67
- 5. **🛑 STOP — user approval required**
62
+ Orchestrator uses the flow system for structured development. Flows define the step sequence — Orchestrator adds multi-agent orchestration, quality gates, and review protocols on top.
68
63
 
69
- ### Phase 2: Implementation Cycle
64
+ ### Flow Selection
70
65
 
71
- **🚨 PRE-DISPATCH GATE complete ALL before ANY `runSubagent` call:**
66
+ | Situation | Flow | Steps |
67
+ |-----------|------|-------|
68
+ | Bug fix, small feature, refactoring | `aikit:basic` | assess → implement → verify |
69
+ | New feature, major change, multi-file | `aikit:advanced` | spec → plan → task → execute → verify |
70
+ | Custom/specialized work | Check `flow_list` | Follow flow-specific steps |
72
71
 
73
- 1. `multi-agents-development` skill loaded? (Bootstrap step 4 if not, load NOW)
74
- 2. ✅ Task decomposition table produced? (show user: task → files → agent → parallel batch)
75
- 3. ✅ Independence Check passed per pair? (shared files? shared state? ordering dependency? → must be "No" for parallel)
76
- 4. ✅ Each task ≤ 3 files? (if not, split further)
77
- 5. ✅ Parallel batches identified? (tasks with no dependencies MUST be in same batch)
72
+ **If multiple flows could apply and the user hasn't specified one, ask the user to choose.**
78
73
 
79
- **Decomposition output format** (show this to user before dispatching):
74
+ ### Session Start Flow Check
75
+
76
+ 1. `flow_status` — check for active flow
77
+ 2. If active:
78
+ - Note current step name and skill path
79
+ - Read the current step skill with `flow_read_skill`
80
+ - Follow its instructions
81
+ - When complete: `flow_step({ action: 'next' })`
82
+ 3. If no active flow:
83
+ - `flow_list` — check ALL available flows (builtin + custom)
84
+ - Recommend appropriate flow based on task scope
85
+ - `flow_start({ flow: '<name>' })` after user confirms
86
+
87
+ ### Orchestrator Protocols (apply during ALL flow steps)
88
+
89
+ **PRE-DISPATCH GATE — complete ALL before ANY `runSubagent` call:**
90
+ 1. ✅ `multi-agents-development` skill loaded?
91
+ 2. ✅ Task decomposition table produced?
92
+ 3. ✅ Independence Check passed per pair?
93
+ 4. ✅ Each task ≤ 3 files?
94
+ 5. ✅ Parallel batches identified?
95
+
96
+ **Decomposition output format:**
80
97
 
81
98
  ```
82
99
  Batch 1 (parallel):
@@ -86,23 +103,35 @@ Batch 2 (after batch 1):
86
103
  Task C: [agent] → [file5] — [goal] (depends on A)
87
104
  ```
88
105
 
89
- **Prompt every subagent with** (use `multi-agents-development` skill templates):
90
- 1. **Scope** — exact files to touch + boundary (do NOT touch)
106
+ **Subagent prompt template:**
107
+ 1. **Scope** — exact files + boundary
91
108
  2. **Goal** — acceptance criteria, testable
92
- 3. **Arch Context** — paste actual code snippets from `compact()`/`digest()`
93
- 4. **Constraints** — patterns, conventions, anti-patterns
109
+ 3. **Arch Context** — code snippets from `compact()`/`digest()`
110
+ 4. **Constraints** — patterns, conventions
94
111
  5. **FORGE** — tier + evidence requirements
95
112
  6. **Self-Review** — checklist before declaring status
96
113
 
97
- **Subagent status protocol**: `DONE` | `DONE_WITH_CONCERNS` | `NEEDS_CONTEXT` | `BLOCKED`
114
+ **Subagent status protocol:** `DONE` | `DONE_WITH_CONCERNS` | `NEEDS_CONTEXT` | `BLOCKED`
115
+
116
+ **Additional Orchestrator requirements during flow execution:**
117
+ - Apply the PRE-DISPATCH GATE before any subagent dispatch, regardless of flow
118
+ - Apply FORGE at classification and verification points; pass tier/evidence expectations into subagents and gate with `evidence_map`
119
+ - Enforce delegation rules at all times — Orchestrator never implements code directly
120
+ - Use the subagent prompt template for every dispatch so step-specific flow instructions are grounded in actual code context
98
121
 
99
- **Per-batch flow**: Dispatch (parallel) Spec Review → Code Quality Review (Alpha+Beta parallel) → Arch Review (if boundary changes) → Security (if applicable) → `evidence_map` gate → **🛑 STOP — present commit message**
122
+ **Per-step review cycle:** Dispatch → Code Review (Alpha+Beta) → Arch Review (if boundary changes) → Security (if applicable) → `evidence_map` gate → **🛑 STOP — present results**
123
+
124
+ ### Flow MCP Tools
100
125
 
101
- ### Phase 3: Completion
102
- 1. Optional: Refactor pass (separate commit)
103
- 2. Documenter for docs updates
104
- 3. `remember` all decisions, patterns, gotchas, conventions
105
- 4. `reindex({})` + `produce_knowledge({ path: "." })`
126
+ | Tool | Purpose |
127
+ |------|---------|
128
+ | `flow_list` | List installed flows and active flow |
129
+ | `flow_info` | Get detailed flow info including steps |
130
+ | `flow_start` | Start a named flow |
131
+ | `flow_step` | Advance: next, skip, or redo current step |
132
+ | `flow_status` | Check current execution state |
133
+ | `flow_reset` | Clear flow state to start over |
134
+ | `flow_read_skill` | Read the skill content for the current step |
106
135
 
107
136
  ## Emergency: STOP → ASSESS → CONTAIN → RECOVER → DOCUMENT
108
137
 
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  description: 'Autonomous planner that researches codebases and writes comprehensive TDD implementation plans'
3
3
  tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, edit/createFile, edit/editFiles, edit/rename, edit/createDirectory, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, todo, search/searchSubagent, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
4
- model: Claude Opus 4.6 (copilot)
4
+ model: [Claude Opus 4.6 (copilot), GPT-5.4 (copilot), Auto (copilot)]
5
5
  ---
6
6
 
7
7
  # Planner - The Strategic Architect
@@ -38,6 +38,17 @@ You are the **Planner**, autonomous planner that researches codebases and writes
38
38
  5. **Dependency Graph** — For each phase, list dependencies. Group into parallel batches
39
39
  6. **Present** — Show plan with open questions, complexity estimate, parallel batch layout
40
40
 
41
+ ## Flow Integration
42
+
43
+ When activated as part of a flow (e.g., `aikit:advanced` plan step or `aikit:basic` assess step):
44
+ 1. Check `flow_status` for current step context
45
+ 2. Read the step's skill file for specific instructions
46
+ 3. Follow skill instructions while applying Planner methodology
47
+ 4. Produce required artifacts (as specified by the flow step's `produces` field)
48
+ 5. When complete, report to Orchestrator (do NOT call `flow_step` — let Orchestrator advance)
49
+
50
+ When no flow is active, operate autonomously following normal Planner methodology.
51
+
41
52
  ## Subagent Output Relay
42
53
 
43
54
  When subagents complete, their visual outputs (from `present`) are NOT visible to the user.
@@ -6,23 +6,23 @@ This directory contains AI agent definitions generated by `@vpxa/aikit init`.
6
6
 
7
7
  | Agent | Purpose | Model | Category |
8
8
  |-------|---------|-------|----------|
9
- | **Orchestrator** | Master conductor that orchestrates the full development lifecycle: Planning → Implementation → Review → Recovery → Commit | Claude Opus 4.6 | orchestration |
10
- | **Planner** | Autonomous planner that researches codebases and writes comprehensive TDD implementation plans | Claude Opus 4.6 | orchestration |
11
- | **Implementer** | Persistent implementation agent that writes code following TDD practices until all tasks are complete | GPT-5.4 | implementation |
12
- | **Frontend** | UI/UX specialist for React, styling, responsive design, and frontend implementation | Gemini 3.1 Pro (Preview) | implementation |
13
- | **Refactor** | Code refactoring specialist that improves structure, readability, and maintainability | GPT-5.4 | implementation |
14
- | **Debugger** | Expert debugger that diagnoses issues, traces errors, and provides solutions | Claude Opus 4.6 | diagnostics |
15
- | **Security** | Security specialist that analyzes code for vulnerabilities and compliance | Claude Opus 4.6 | diagnostics |
16
- | **Documenter** | Documentation specialist that creates and maintains comprehensive project documentation | GPT-5.4 | documentation |
17
- | **Explorer** | Rapid codebase exploration to find files, usages, dependencies, and structural context | Gemini 3 Flash (Preview) | exploration |
18
- | **Researcher-Alpha** | Primary deep research agent — also serves as default Researcher | Claude Opus 4.6 | research |
19
- | **Researcher-Beta** | Research variant — pragmatic analysis with focus on trade-offs and edge cases | Claude Sonnet 4.6 | research |
20
- | **Researcher-Gamma** | Research variant — broad pattern matching across domains and technologies | GPT-5.4 | research |
21
- | **Researcher-Delta** | Research variant — implementation feasibility and performance implications | Gemini 3.1 Pro (Preview) | research |
22
- | **Code-Reviewer-Alpha** | Primary code reviewer | GPT-5.4 | review |
23
- | **Code-Reviewer-Beta** | Code reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 | review |
24
- | **Architect-Reviewer-Alpha** | Primary architecture reviewer | GPT-5.4 | review |
25
- | **Architect-Reviewer-Beta** | Architecture reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 | review |
9
+ | **Orchestrator** | Master conductor that orchestrates the full development lifecycle: Planning → Implementation → Review → Recovery → Commit | Claude Opus 4.6 (copilot) | orchestration |
10
+ | **Planner** | Autonomous planner that researches codebases and writes comprehensive TDD implementation plans | Claude Opus 4.6 (copilot) | orchestration |
11
+ | **Implementer** | Persistent implementation agent that writes code following TDD practices until all tasks are complete | GPT-5.4 (copilot) | implementation |
12
+ | **Frontend** | UI/UX specialist for React, styling, responsive design, and frontend implementation | Gemini 3.1 Pro (Preview) (copilot) | implementation |
13
+ | **Refactor** | Code refactoring specialist that improves structure, readability, and maintainability | GPT-5.4 (copilot) | implementation |
14
+ | **Debugger** | Expert debugger that diagnoses issues, traces errors, and provides solutions | Claude Opus 4.6 (copilot) | diagnostics |
15
+ | **Security** | Security specialist that analyzes code for vulnerabilities and compliance | Claude Opus 4.6 (copilot) | diagnostics |
16
+ | **Documenter** | Documentation specialist that creates and maintains comprehensive project documentation | GPT-5.4 (copilot) | documentation |
17
+ | **Explorer** | Rapid codebase exploration to find files, usages, dependencies, and structural context | Gemini 3 Flash (Preview) (copilot) | exploration |
18
+ | **Researcher-Alpha** | Primary deep research agent — also serves as default Researcher | Claude Opus 4.6 (copilot) | research |
19
+ | **Researcher-Beta** | Research variant — pragmatic analysis with focus on trade-offs and edge cases | Claude Sonnet 4.6 (copilot) | research |
20
+ | **Researcher-Gamma** | Research variant — broad pattern matching across domains and technologies | GPT-5.4 (copilot) | research |
21
+ | **Researcher-Delta** | Research variant — implementation feasibility and performance implications | Gemini 3.1 Pro (Preview) (copilot) | research |
22
+ | **Code-Reviewer-Alpha** | Primary code reviewer | GPT-5.4 (copilot) | review |
23
+ | **Code-Reviewer-Beta** | Code reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 (copilot) | review |
24
+ | **Architect-Reviewer-Alpha** | Primary architecture reviewer | GPT-5.4 (copilot) | review |
25
+ | **Architect-Reviewer-Beta** | Architecture reviewer variant — different LLM perspective for dual review | Claude Opus 4.6 (copilot) | review |
26
26
 
27
27
  ## Multi-Model Pattern
28
28
 
@@ -2,7 +2,7 @@
2
2
  description: 'Code refactoring specialist that improves structure, readability, and maintainability'
3
3
  argument-hint: Code, component, or pattern to refactor
4
4
  tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, edit/createFile, edit/editFiles, edit/rename, edit/createDirectory, search/changes, search/codebase, search/usages, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: GPT-5.4 (copilot)
5
+ model: [GPT-5.4 (copilot), GPT-5.3-Codex (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Refactor - The Code Sculptor
@@ -2,7 +2,7 @@
2
2
  description: 'Primary deep research agent — also serves as default Researcher'
3
3
  argument-hint: Research question, problem statement, or subsystem to investigate
4
4
  tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: Claude Opus 4.6 (copilot)
5
+ model: [Claude Opus 4.6 (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Researcher-Alpha - The Context Gatherer
@@ -2,7 +2,7 @@
2
2
  description: 'Research variant — pragmatic analysis with focus on trade-offs and edge cases'
3
3
  argument-hint: Research question, problem statement, or subsystem to investigate
4
4
  tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: Claude Sonnet 4.6 (copilot)
5
+ model: [Claude Sonnet 4.6 (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Researcher-Beta - The Context Gatherer
@@ -2,7 +2,7 @@
2
2
  description: 'Research variant — implementation feasibility and performance implications'
3
3
  argument-hint: Research question, problem statement, or subsystem to investigate
4
4
  tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: Gemini 3.1 Pro (Preview) (copilot)
5
+ model: [Gemini 3.1 Pro (Preview) (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Researcher-Delta - The Context Gatherer
@@ -2,7 +2,7 @@
2
2
  description: 'Research variant — broad pattern matching across domains and technologies'
3
3
  argument-hint: Research question, problem statement, or subsystem to investigate
4
4
  tools: [execute/runInTerminal, read/problems, read/readFile, read/terminalLastCommand, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: GPT-5.4 (copilot)
5
+ model: [GPT-5.4 (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Researcher-Gamma - The Context Gatherer
@@ -2,7 +2,7 @@
2
2
  description: 'Security specialist that analyzes code for vulnerabilities and compliance'
3
3
  argument-hint: Code, feature, or component to security review
4
4
  tools: [execute/runInTerminal, read/problems, read/readFile, agent/runSubagent, search/changes, search/codebase, search/usages, web/fetch, web/githubRepo, browser/openBrowserPage, browser/readPage, browser/screenshotPage, browser/navigatePage, browser/clickElement, browser/dragElement, browser/hoverElement, browser/typeInPage, browser/runPlaywrightCode, browser/handleDialog, aikit/*]
5
- model: Claude Opus 4.6 (copilot)
5
+ model: [Claude Opus 4.6 (copilot), GPT-5.4 (copilot), Auto (copilot)]
6
6
  ---
7
7
 
8
8
  # Security - The Vulnerability Hunter