npm - agent-state-machine - Versions diffs - 2.2.1 → 2.3.0 - Mend

agent-state-machine 2.2.1 → 2.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33)

package/bin/cli.js +33 -5
package/lib/file-tree.js +1 -1
package/lib/runtime/agent.js +6 -2
package/lib/runtime/interaction.js +2 -1
package/lib/runtime/prompt.js +37 -1
package/lib/runtime/runtime.js +67 -5
package/lib/setup.js +4 -4
package/package.json +1 -1
package/templates/project-builder/agents/code-fixer.md +50 -0
package/templates/project-builder/agents/code-writer.md +3 -0
package/templates/project-builder/agents/sanity-checker.md +6 -0
package/templates/project-builder/agents/test-planner.md +3 -1
package/templates/project-builder/config.js +4 -4
package/templates/project-builder/scripts/workflow-helpers.js +104 -2
package/templates/project-builder/workflow.js +151 -14
package/templates/starter/config.js +1 -1
package/vercel-server/api/submit/[token].js +0 -11
package/vercel-server/local-server.js +0 -19
package/vercel-server/public/remote/assets/index-BTLc1QSv.js +168 -0
package/vercel-server/public/remote/assets/index-DLa4X08t.css +1 -0
package/vercel-server/public/remote/index.html +2 -2
package/vercel-server/ui/src/App.jsx +53 -18
package/vercel-server/ui/src/components/ChoiceInteraction.jsx +69 -18
package/vercel-server/ui/src/components/ConfirmInteraction.jsx +7 -7
package/vercel-server/ui/src/components/ContentCard.jsx +607 -103
package/vercel-server/ui/src/components/EventsLog.jsx +20 -13
package/vercel-server/ui/src/components/Footer.jsx +9 -4
package/vercel-server/ui/src/components/Header.jsx +12 -3
package/vercel-server/ui/src/components/SendingCard.jsx +33 -0
package/vercel-server/ui/src/components/TextInteraction.jsx +8 -8
package/vercel-server/ui/src/index.css +82 -10
package/vercel-server/public/remote/assets/index-CbgeVnKw.js +0 -148
package/vercel-server/public/remote/assets/index-DHL_iHQW.css +0 -1

package/templates/project-builder/workflow.js CHANGED Viewed

@@ -8,11 +8,12 @@
  * 4. Task lifecycle with optimal agent sequencing
  */
-import { agent, memory, askHuman } from 'agent-state-machine';
+import { agent, memory, askHuman, getCurrentRuntime } from 'agent-state-machine';
 import path from 'path';
 import { fileURLToPath } from 'url';
 import {
   writeMarkdownFile,
+  writeImplementationFiles,
   isApproval,
   renderRoadmapMarkdown,
   renderTasksMarkdown,
@@ -20,7 +21,12 @@ import {
   getTaskStage,
   setTaskStage,
   getTaskData,
-  setTaskData
+  setTaskData,
+  clearPartialTaskData,
+  getQuickFixAttempts,
+  incrementQuickFixAttempts,
+  resetQuickFixAttempts,
+  detectTestFramework
 } from './scripts/workflow-helpers.js';
 import {
   createInteraction,
@@ -34,6 +40,57 @@ const __dirname = path.dirname(__filename);
 const WORKFLOW_DIR = __dirname;
 const STATE_DIR = path.join(WORKFLOW_DIR, 'state');
+// ANSI Colors for console output
+const C = {
+  reset: '\x1b[0m',
+  bold: '\x1b[1m',
+  cyan: '\x1b[36m',
+  green: '\x1b[32m',
+  yellow: '\x1b[33m'
+};
+function applyFixesToImplementation(originalImplementation, fixes) {
+  if (!originalImplementation || !Array.isArray(fixes) || fixes.length === 0) {
+    return originalImplementation;
+  }
+  const updated = { ...originalImplementation };
+  const container = updated.implementation ? { ...updated.implementation } : updated;
+  const files = Array.isArray(container.files) ? [...container.files] : [];
+  for (const fix of fixes) {
+    if (!fix?.path || !fix?.code) {
+      console.warn(`  [Fix] Skipping invalid fix entry: ${JSON.stringify(fix)}`);
+      continue;
+    }
+    if (fix.operation && fix.operation !== 'replace') {
+      console.warn(`  [Fix] Unsupported operation "${fix.operation}" for ${fix.path}`);
+      continue;
+    }
+    const existingIndex = files.findIndex((file) => file.path === fix.path);
+    const nextFile = {
+      ...(existingIndex >= 0 ? files[existingIndex] : {}),
+      path: fix.path,
+      code: fix.code,
+      purpose: fix.purpose || (existingIndex >= 0 ? files[existingIndex].purpose : 'Updated by code-fixer')
+    };
+    if (existingIndex >= 0) {
+      files[existingIndex] = nextFile;
+    } else {
+      files.push(nextFile);
+    }
+  }
+  if (updated.implementation) {
+    updated.implementation = { ...container, files };
+    return updated;
+  }
+  return { ...updated, files };
+}
 // ============================================
 // MAIN WORKFLOW
 // ============================================
@@ -334,6 +391,14 @@ export default async function () {
             });
             setTaskData(i, taskId, 'code', implementation);
           }
+          // Write implementation files to disk
+          const implementation = getTaskData(i, taskId, 'code');
+          if (implementation) {
+            console.log('    > Writing files to disk...');
+            writeImplementationFiles(implementation);
+          }
           setTaskStage(i, taskId, TASK_STAGES.CODE_REVIEW);
           stage = TASK_STAGES.CODE_REVIEW;
         }
@@ -373,10 +438,12 @@ export default async function () {
         // 6. Sanity check generation & execution
         if (stage === TASK_STAGES.SANITY_CHECK) {
+          const testFramework = detectTestFramework();
           const executableChecks = await agent('sanity-checker', {
             task: task,
             implementation: getTaskData(i, taskId, 'code'),
-            testPlan: getTaskData(i, taskId, 'tests')
+            testPlan: getTaskData(i, taskId, 'tests'),
+            testFramework
           });
           setTaskData(i, taskId, 'sanity_checks', executableChecks);
@@ -387,8 +454,8 @@ export default async function () {
           const sanityChoice = createInteraction('choice', `phase-${i + 1}-task-${taskId}-sanity-choice`, {
             prompt: `Sanity checks for "${task.title}":\n\n${checksDisplay}\n\nHow would you like to proceed?`,
             options: [
-              { key: 'manual', label: 'Run checks manually', description: 'You run the commands and confirm results' },
               { key: 'auto', label: 'Run automatically', description: 'Agent executes checks and reports results' },
+              { key: 'manual', label: 'Run checks manually', description: 'You run the commands and confirm results' },
               { key: 'skip', label: 'Skip verification', description: 'Approve without running checks' }
             ],
             allowCustom: true
@@ -402,6 +469,7 @@ export default async function () {
           if (sanityResponse.isCustom) {
             setTaskData(i, taskId, 'feedback', sanityResponse.customText || sanityResponse.raw || sanityRaw);
+            resetQuickFixAttempts(i, taskId);
             setTaskStage(i, taskId, TASK_STAGES.PENDING);
             t--;
             continue;
@@ -423,12 +491,26 @@ export default async function () {
                 .map((r) => `  - Check ${r.id}: ${r.error}`)
                 .join('\n');
+              const quickFixAttempts = getQuickFixAttempts(i, taskId);
+              const runtime = getCurrentRuntime();
+              const maxAttempts = runtime?.workflowConfig?.maxQuickFixAttempts ?? 10;
+              const failOptions = [];
+              if (quickFixAttempts < maxAttempts) {
+                failOptions.push({
+                  key: 'quickfix',
+                  label: 'Quick fix',
+                  description: `Run targeted fixes (attempt ${quickFixAttempts + 1} of ${maxAttempts})`
+                });
+              }
+              failOptions.push(
+                { key: 'partial', label: 'Partial reimplement', description: 'Keep security review and test plan, redo implementation' },
+                { key: 'reimplement', label: 'Full reimplement', description: 'Restart task from scratch' },
+                { key: 'ignore', label: 'Ignore failures and approve anyway' }
+              );
               const failChoice = createInteraction('choice', `phase-${i + 1}-task-${taskId}-sanity-fail`, {
                 prompt: `${results.summary.failed} sanity check(s) failed:\n\n${failedChecks}\n\nHow would you like to proceed?`,
-                options: [
-                  { key: 'reimplement', label: 'Re-implement task with this feedback' },
-                  { key: 'ignore', label: 'Ignore failures and approve anyway' }
-                ],
+                options: failOptions,
                 allowCustom: true
               });
@@ -438,19 +520,71 @@ export default async function () {
               });
               const failResponse = await parseResponse(failChoice, failRaw);
-              if (failResponse.selectedKey === 'reimplement' || failResponse.isCustom) {
+              if (failResponse.isCustom) {
+                const customFeedback = failResponse.customText || failResponse.text || failResponse.raw || failRaw;
+                const combinedFeedback = `${customFeedback}\n\nSanity check failures:\n${failedChecks}`;
+                setTaskData(i, taskId, 'feedback', combinedFeedback);
+                clearPartialTaskData(i, taskId);
+                resetQuickFixAttempts(i, taskId);
+                setTaskStage(i, taskId, TASK_STAGES.PENDING);
+                t--;
+                continue;
+              }
+              if (failResponse.selectedKey === 'quickfix') {
+                console.log('    > Running quick fix...');
+                const fixerResult = await agent('code-fixer', {
+                  task: task,
+                  originalImplementation: getTaskData(i, taskId, 'code'),
+                  sanityCheckResults: {
+                    summary: results.summary,
+                    results: results.results,
+                    checks: executableChecks.checks
+                  },
+                  testPlan: getTaskData(i, taskId, 'tests'),
+                  previousAttempts: quickFixAttempts
+                });
+                const fixes = fixerResult?.fixes || [];
+                const fixFiles = fixes
+                  .filter((fix) => fix?.path && fix?.code && (!fix.operation || fix.operation === 'replace'))
+                  .map((fix) => ({ path: fix.path, code: fix.code }));
+                if (fixFiles.length > 0) {
+                  console.log('    > Applying fixes to disk...');
+                  writeImplementationFiles({ files: fixFiles });
+                }
+                const updatedImplementation = applyFixesToImplementation(getTaskData(i, taskId, 'code'), fixes);
+                setTaskData(i, taskId, 'code', updatedImplementation);
+                incrementQuickFixAttempts(i, taskId);
+                setTaskData(i, taskId, 'sanity_checks', null);
+                setTaskData(i, taskId, 'sanity_results', null);
+                setTaskStage(i, taskId, TASK_STAGES.SANITY_CHECK);
+                t--;
+                continue;
+              }
+              if (failResponse.selectedKey === 'partial') {
+                setTaskData(i, taskId, 'feedback', `Sanity check failures:\n${failedChecks}`);
+                clearPartialTaskData(i, taskId, ['security_pre', 'tests']);
+                resetQuickFixAttempts(i, taskId);
+                setTaskStage(i, taskId, TASK_STAGES.IMPLEMENTING);
+                t--;
+                continue;
+              }
+              if (failResponse.selectedKey === 'reimplement') {
                 setTaskData(i, taskId, 'feedback', `Sanity check failures:\n${failedChecks}`);
-                setTaskData(i, taskId, 'security_pre', null);
-                setTaskData(i, taskId, 'tests', null);
-                setTaskData(i, taskId, 'code', null);
-                setTaskData(i, taskId, 'review', null);
-                setTaskData(i, taskId, 'security_post', null);
+                clearPartialTaskData(i, taskId);
+                resetQuickFixAttempts(i, taskId);
                 setTaskStage(i, taskId, TASK_STAGES.PENDING);
                 t--;
                 continue;
               }
             }
+            resetQuickFixAttempts(i, taskId);
             setTaskStage(i, taskId, TASK_STAGES.COMPLETED);
             stage = TASK_STAGES.COMPLETED;
             task.stage = 'completed';
@@ -458,6 +592,7 @@ export default async function () {
             writeMarkdownFile(STATE_DIR, `phase-${i + 1}-tasks.md`, renderTasksMarkdown(i + 1, phase.title, tasks));
             console.log(`    Task ${t + 1} confirmed complete!\n`);
           } else if (action === 'skip') {
+            resetQuickFixAttempts(i, taskId);
             setTaskStage(i, taskId, TASK_STAGES.COMPLETED);
             stage = TASK_STAGES.COMPLETED;
             task.stage = 'completed';
@@ -489,6 +624,7 @@ export default async function () {
           if (approvalResponse.selectedKey === 'approve' || isApproval(approvalResponse.raw || approvalRaw)) {
             setTaskStage(i, taskId, TASK_STAGES.COMPLETED);
+            resetQuickFixAttempts(i, taskId);
             task.stage = 'completed';
             memory[tasksKey] = tasks;
             writeMarkdownFile(STATE_DIR, `phase-${i + 1}-tasks.md`, renderTasksMarkdown(i + 1, phase.title, tasks));
@@ -505,6 +641,7 @@ export default async function () {
             setTaskData(i, taskId, 'security_post', null);
             setTaskData(i, taskId, 'sanity_checks', null);
             setTaskData(i, taskId, 'sanity_results', null);
+            resetQuickFixAttempts(i, taskId);
             setTaskStage(i, taskId, TASK_STAGES.PENDING);
             t--;

package/templates/starter/config.js CHANGED Viewed

@@ -1,6 +1,6 @@
 export const config = {
   models: {
-    low: "gemini",
+    low: "gemini -m gemini-2.5-flash-lite",
     med: "codex --model gpt-5.2",
     high: "claude -m claude-opus-4-20250514 -p",
   },

package/vercel-server/api/submit/[token].js CHANGED Viewed

@@ -6,7 +6,6 @@
 import {
   getSession,
-  addEvent,
   redis,
   KEYS,
 } from '../../lib/redis.js';
@@ -69,16 +68,6 @@ export default async function handler(req, res) {
     // Set TTL on pending list (24 hours - same as session, allows laptop sleep)
     await redis.expire(pendingKey, 24 * 60 * 60);
-    // Log event to events list (single source of truth for UI)
-    await addEvent(token, {
-      timestamp: new Date().toISOString(),
-      event: 'INTERACTION_SUBMITTED',
-      slug,
-      targetKey: targetKey || `_interaction_${slug}`,
-      answer: responseString.substring(0, 200) + (responseString.length > 200 ? '...' : ''),
-      source: 'remote',
-    });
     return res.status(200).json({ success: true });
   } catch (err) {
     console.error('Error submitting interaction:', err);

package/vercel-server/local-server.js CHANGED Viewed

@@ -342,8 +342,6 @@ async function handleSubmitPost(req, res, token) {
     return sendJson(res, 400, { error: 'Missing slug or response' });
   }
-  const responseString = typeof response === 'string' ? response : JSON.stringify(response);
   // Add to pending interactions for CLI to pick up
   session.pendingInteractions.push({
     slug,
@@ -351,23 +349,6 @@ async function handleSubmitPost(req, res, token) {
     response,
   });
-  // Log to history (include answer preview)
-  const event = {
-    timestamp: new Date().toISOString(),
-    event: 'INTERACTION_SUBMITTED',
-    slug,
-    targetKey: targetKey || `_interaction_${slug}`,
-    answer: responseString.substring(0, 200) + (responseString.length > 200 ? '...' : ''),
-    source: 'remote',
-  };
-  session.history.unshift(event);
-  // Broadcast to browsers
-  broadcastToSession(token, {
-    type: 'event',
-    ...event,
-  });
   return sendJson(res, 200, { success: true });
 }