npm - agent-state-machine - Versions diffs - 2.2.0 → 2.2.1 - Mend

agent-state-machine 2.2.0 → 2.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12) hide show

package/bin/cli.js +48 -0
package/lib/remote/client.js +37 -8
package/package.json +1 -1
package/templates/project-builder/README.md +304 -56
package/templates/project-builder/agents/sanity-runner.js +3 -1
package/templates/starter/README.md +291 -42
package/vercel-server/api/submit/[token].js +2 -2
package/vercel-server/api/ws/cli.js +40 -2
package/vercel-server/local-server.js +32 -3
package/vercel-server/public/remote/assets/{index-BOKpYANC.js → index-CbgeVnKw.js} +28 -28
package/vercel-server/public/remote/index.html +1 -1
package/vercel-server/ui/src/App.jsx +0 -43

package/templates/starter/README.md CHANGED Viewed

@@ -1,62 +1,100 @@
-# __WORKFLOW_NAME__
+# agent-state-machine
-A workflow created with agent-state-machine (native JS format).
+A workflow runner for building **linear, stateful agent workflows** in plain JavaScript.
-## Structure
+You write normal `async/await` code. The runtime handles:
+- **Auto-persisted** `memory` (saved to disk on mutation)
+- **Auto-tracked** `fileTree` (detects file changes made by agents via Git)
+- **Human-in-the-loop** blocking via `askHuman()` or agent-driven interactions
+- Local **JS agents** + **Markdown agents** (LLM-powered)
+- **Agent retries** with history logging for failures
-```
-__WORKFLOW_NAME__/
-├── workflow.js      # Native JS workflow (async/await)
-├── config.js        # Model/API key configuration
-├── agents/          # Custom agents (.js/.mjs/.cjs or .md)
-├── interactions/    # Human-in-the-loop inputs (created at runtime)
-├── state/           # Runtime state (current.json, history.jsonl)
-└── steering/        # Steering configuration
-```
+---
-## Usage
+## Install
-Edit `config.js` to set models and API keys for this workflow.
+You need to install the package **globally** to get the CLI, and **locally** in your project so your workflow can import the library.
-Run the workflow (or resume if interrupted):
-```bash
-state-machine run __WORKFLOW_NAME__
-```
+### Global CLI
+Provides the `state-machine` command.
-Check status:
 ```bash
-state-machine status __WORKFLOW_NAME__
-```
+# npm
+npm i -g agent-state-machine
-View history:
-```bash
-state-machine history __WORKFLOW_NAME__
+# pnpm
+pnpm add -g agent-state-machine
 ```
-View trace logs in browser with live updates:
+### Local Library
+Required so your `workflow.js` can `import { agent, memory, fileTree } from 'agent-state-machine'`.
 ```bash
-state-machine follow __WORKFLOW_NAME__
+# npm
+npm i agent-state-machine
+# pnpm (for monorepos/turbo, install in root)
+pnpm add agent-state-machine -w
 ```
-Reset state (clears memory/state):
+Requirements: Node.js >= 16.
+---
+## CLI
 ```bash
-state-machine reset __WORKFLOW_NAME__
+state-machine --setup <workflow-name>
+state-machine --setup <workflow-name> --template <template-name>
+state-machine run <workflow-name>
+state-machine run <workflow-name> -reset
+state-machine run <workflow-name> -reset-hard
+state-machine -reset <workflow-name>
+state-machine -reset-hard <workflow-name>
+state-machine history <workflow-name> [limit]
 ```
-Hard reset (clears everything: history/interactions/memory):
-```bash
-state-machine reset-hard __WORKFLOW_NAME__
+Templates live in `templates/` and `starter` is used by default.
+Workflows live in:
+```text
+workflows/<name>/
+├── workflow.js        # Native JS workflow (async/await)
+├── config.js          # Model/API key configuration
+├── package.json       # Sets "type": "module" for this workflow folder
+├── agents/            # Custom agents (.js/.mjs/.cjs or .md)
+├── interactions/      # Human-in-the-loop files (auto-created)
+├── state/             # current.json, history.jsonl
+└── steering/          # global.md + config.json
 ```
-## Writing Workflows
+---
-Edit `workflow.js` - write normal async JavaScript:
+## Writing workflows (native JS)
+Edit `config.js` to set models and API keys for the workflow.
 ```js
+/**
+ * project-builder Workflow
+ *
+ * Native JavaScript workflow - write normal async/await code!
+ *
+ * Features:
+ * - memory object auto-persists to disk (use memory guards for idempotency)
+ * - Use standard JS control flow (if, for, etc.)
+ * - Interactive prompts pause and wait for user input
+ */
 import { agent, memory, askHuman, parallel } from 'agent-state-machine';
+import { notify } from './scripts/mac-notification.js';
 export default async function() {
-  console.log('Starting __WORKFLOW_NAME__ workflow...');
+  console.log('Starting project-builder workflow...');
   // Example: Get user input (saved to memory)
   const userLocation = await askHuman('Where do you live?');
@@ -88,31 +126,242 @@ export default async function() {
   // console.log('b: ' + JSON.stringify(b))
   // console.log('c: ' + JSON.stringify(c))
-  notify(['__WORKFLOW_NAME__', userInfo.name || userInfo + ' has been greeted!']);
+  notify(['project-builder', userInfo.name || userInfo + ' has been greeted!']);
   console.log('Workflow completed!');
 }
 ```
-## Creating Agents
+### Resuming workflows
+`state-machine run` restarts your workflow from the top, loading the persisted state.
+If the workflow needs human input, it will **block inline** in the terminal. You can answer in the terminal, edit `interactions/<slug>.md`, or respond in the browser.
+If the process is interrupted, running `state-machine run <workflow-name>` again will continue execution (assuming your workflow uses `memory` to skip completed steps).
+---
+## Core API
+### `agent(name, params?, options?)`
+Runs `workflows/<name>/agents/<agent>.(js|mjs|cjs)` or `<agent>.md`.
+```js
+const out = await agent('review', { file: 'src/app.js' });
+memory.lastReview = out;
+```
+Options:
+- `retry` (number | false): default `2` (3 total attempts). Use `false` to disable retries.
+- `steering` (string | string[]): extra steering files to load from `workflows/<name>/steering/`.
+Context is explicit: only `params` are provided to agents unless you pass additional data.
+### `memory`
+A persisted object for your workflow.
+- Mutations auto-save to `workflows/<name>/state/current.json`.
+- Use it as your "long-lived state" between runs.
+```js
+memory.count = (memory.count || 0) + 1;
+```
+### `fileTree`
+Auto-tracked file changes made by agents.
+- Before each `await agent(...)`, the runtime captures a Git baseline
+- After the agent completes, it detects created/modified/deleted files
+- Changes are stored in `memory.fileTree` and persisted to `current.json`
+```js
+// Files are auto-tracked when agents create them
+await agent('code-writer', { task: 'Create auth module' });
+// Access tracked files
+console.log(memory.fileTree);
+// { "src/auth.js": { status: "created", createdBy: "code-writer", ... } }
+// Pass file context to other agents
+await agent('code-reviewer', { fileTree: memory.fileTree });
+```
+Configuration in `config.js`:
+```js
+export const config = {
+  // ... models and apiKeys ...
+  projectRoot: process.env.PROJECT_ROOT,  // defaults to ../.. from workflow
+  fileTracking: true,                     // enable/disable (default: true)
+  fileTrackingIgnore: ['node_modules/**', '.git/**', 'dist/**'],
+  fileTrackingKeepDeleted: false          // keep deleted files in tree
+};
+```
+### `trackFile(path, options?)` / `untrackFile(path)`
+Manual file tracking utilities:
+```js
+import { trackFile, getFileTree, untrackFile } from 'agent-state-machine';
+trackFile('README.md', { caption: 'Project docs' });
+const tree = getFileTree();
+untrackFile('old-file.js');
+```
+### `askHuman(question, options?)`
+Gets user input.
+- In a TTY, it prompts in the terminal (or via the browser when remote follow is enabled).
+- Otherwise it creates `interactions/<slug>.md` and blocks until you confirm in the terminal (or respond in the browser).
+```js
+const repo = await askHuman('What repo should I work on?', { slug: 'repo' });
+memory.repo = repo;
+```
+### `parallel([...])` / `parallelLimit([...], limit)`
-**JavaScript agent** (`agents/my-agent.js`):
+Run multiple `agent()` calls concurrently:
 ```js
+import { agent, parallel, parallelLimit } from 'agent-state-machine';
+const [a, b] = await parallel([
+  agent('review', { file: 'src/a.js' }),
+  agent('review', { file: 'src/b.js' }),
+]);
+const results = await parallelLimit(
+  ['a.js', 'b.js', 'c.js'].map(f => agent('review', { file: f })),
+  2
+);
+```
+---
+## Agents
+Agents live in `workflows/<workflow>/agents/`.
+### JavaScript agents
+**ESM (`.js` / `.mjs`)**:
+```js
+// workflows/<name>/agents/example.js
 import { llm } from 'agent-state-machine';
 export default async function handler(context) {
-  const response = await llm(context, { model: 'smart', prompt: 'Hello!' });
-  return { greeting: response.text };
+  // context includes:
+  // - params passed to agent(name, params)
+  // - context._steering (global + optional additional steering content)
+  // - context._config (models/apiKeys/workflowDir/projectRoot)
+  // Optionally return _files to annotate tracked files
+  return {
+    ok: true,
+    _files: [{ path: 'src/example.js', caption: 'Example module' }]
+  };
+}
+```
+**CommonJS (`.cjs`)** (only if you prefer CJS):
+```js
+// workflows/<name>/agents/example.cjs
+async function handler(context) {
+  return { ok: true };
 }
+module.exports = handler;
+module.exports.handler = handler;
 ```
-**Markdown agent** (`agents/greeter.md`):
+If you need to request human input from a JS agent, return an `_interaction` payload:
+```js
+return {
+  _interaction: {
+    slug: 'approval',
+    targetKey: 'approval',
+    content: 'Please approve this change (yes/no).'
+  }
+};
+```
+The runtime will block execution and wait for your response in the terminal.
+### Markdown agents (`.md`)
+Markdown agents are LLM-backed prompt templates with optional frontmatter.
+Frontmatter can include `steering` to load additional files from `workflows/<name>/steering/`.
 ```md
 ---
-model: fast
+model: smart
 output: greeting
+steering: tone, product
+---
+Generate a friendly greeting for {{name}}.
+```
+Calling it:
+```js
+const { greeting } = await agent('greeter', { name: 'Sam' });
+memory.greeting = greeting;
+```
 ---
-Generate a greeting for {{name}}.
+## Models & LLM execution
+In your workflow’s `export const config = { models: { ... } }`, each model value can be:
+### CLI command
+```js
+export const config = {
+  models: {
+    smart: "claude -m claude-sonnet-4-20250514 -p"
+  }
+};
 ```
+### API target
+Format: `api:<provider>:<model>`
+```js
+export const config = {
+  models: {
+    smart: "api:openai:gpt-4.1-mini"
+  },
+  apiKeys: {
+    openai: process.env.OPENAI_API_KEY
+  }
+};
+```
+The runtime captures the fully-built prompt in `state/history.jsonl`, viewable in the browser with live updates when running with the `--local` flag or via the remote URL. Remote follow links persist across runs (stored in `config.js`) unless you pass `-n`/`--new` to regenerate.
+---
+## State & persistence
+Native JS workflows persist to:
+- `workflows/<name>/state/current.json` — status, memory (includes fileTree), pending interaction
+- `workflows/<name>/state/history.jsonl` — event log (newest entries first, includes agent retry/failure entries)
+- `workflows/<name>/interactions/*.md` — human input files (when paused)
+## License
+MIT

package/vercel-server/api/submit/[token].js CHANGED Viewed

@@ -66,8 +66,8 @@ export default async function handler(req, res) {
       response,
     }));
-    // Set TTL on pending list
-    await redis.expire(pendingKey, 300); // 5 minutes
+    // Set TTL on pending list (24 hours - same as session, allows laptop sleep)
+    await redis.expire(pendingKey, 24 * 60 * 60);
     // Log event to events list (single source of truth for UI)
     await addEvent(token, {

package/vercel-server/api/ws/cli.js CHANGED Viewed

@@ -21,7 +21,7 @@ import {
 export default async function handler(req, res) {
   // Enable CORS
   res.setHeader('Access-Control-Allow-Origin', '*');
-  res.setHeader('Access-Control-Allow-Methods', 'GET, POST, OPTIONS');
+  res.setHeader('Access-Control-Allow-Methods', 'GET, POST, DELETE, OPTIONS');
   res.setHeader('Access-Control-Allow-Headers', 'Content-Type');
   if (req.method === 'OPTIONS') {
@@ -36,6 +36,10 @@ export default async function handler(req, res) {
     return handleGet(req, res);
   }
+  if (req.method === 'DELETE') {
+    return handleDelete(req, res);
+  }
   return res.status(405).json({ error: 'Method not allowed' });
 }
@@ -161,12 +165,22 @@ async function handleGet(req, res) {
     // Poll every 5 seconds (10 calls per 50s timeout vs 50 calls before)
     while (Date.now() - startTime < timeoutMs) {
-      const pending = await redis.lpop(pendingKey);
+      // Peek at first item without removing (LINDEX 0)
+      // We only remove AFTER CLI confirms receipt via DELETE request
+      const pending = await redis.lindex(pendingKey, 0);
       if (pending) {
         const data = typeof pending === 'object' ? pending : JSON.parse(pending);
+        // Generate a receipt ID so CLI can confirm
+        const receiptId = `${Date.now()}-${Math.random().toString(36).slice(2, 8)}`;
+        // DON'T remove yet - CLI will confirm with DELETE request
+        // This prevents data loss if response doesn't reach CLI
         return res.status(200).json({
           type: 'interaction_response',
+          receiptId,
           ...data,
         });
       }
@@ -182,3 +196,27 @@ async function handleGet(req, res) {
     return res.status(500).json({ error: err.message });
   }
 }
+/**
+ * Handle DELETE requests - CLI confirms receipt of an interaction.
+ * Pops the head of the `<channel>:pending` list, where `<channel>` is the
+ * value returned by `KEYS.interactions(token)`.
+ *
+ * Responses:
+ * - 400 `{ error: 'Missing token parameter' }` when `req.query.token` is falsy
+ * - 200 `{ success: true }` once the pop call resolves; its result is
+ *   discarded, so whether an item was actually removed is not checked
+ * - 500 `{ error: err.message }` when the pop call throws (also logged)
+ *
+ * NOTE(review): nothing from the request other than `token` is read, so the
+ * pop is unconditional - the caller cannot name which item it is confirming.
+ * Presumably the CLI sends exactly one DELETE per item it received; verify
+ * against the client, since a repeated DELETE would pop the next item.
+ *
+ * @param req - incoming request; only `req.query.token` is used
+ * @param res - response object used to send the JSON reply
+ * @returns the value returned by `res.status(...).json(...)`
+ */
+async function handleDelete(req, res) {
+  const { token } = req.query;
+  if (!token) {
+    return res.status(400).json({ error: 'Missing token parameter' });
+  }
+  const channel = KEYS.interactions(token);
+  const pendingKey = `${channel}:pending`;
+  try {
+    // Remove the head of the list; assumed to be the item the CLI just received
+    await redis.lpop(pendingKey);
+    return res.status(200).json({ success: true });
+  } catch (err) {
+    console.error('Error confirming interaction receipt:', err);
+    return res.status(500).json({ error: err.message });
+  }
+}

package/vercel-server/local-server.js CHANGED Viewed

@@ -101,7 +101,7 @@ function sendJson(res, status, data) {
   res.writeHead(status, {
     'Content-Type': 'application/json',
     'Access-Control-Allow-Origin': '*',
-    'Access-Control-Allow-Methods': 'GET, POST, OPTIONS',
+    'Access-Control-Allow-Methods': 'GET, POST, DELETE, OPTIONS',
     'Access-Control-Allow-Headers': 'Content-Type',
   });
   res.end(JSON.stringify(data));
@@ -187,6 +187,7 @@ async function handleCliPost(req, res) {
 /**
  * Handle CLI GET (long-poll for interactions)
+ * Peeks at first item without removing - CLI confirms via DELETE
  */
 async function handleCliGet(req, res, query) {
   const { token, timeout = '30000' } = query;
@@ -207,7 +208,8 @@ async function handleCliGet(req, res, query) {
   const checkInterval = setInterval(() => {
     if (session.pendingInteractions.length > 0) {
       clearInterval(checkInterval);
-      const interaction = session.pendingInteractions.shift();
+      // Peek at first item WITHOUT removing - CLI will confirm via DELETE
+      const interaction = session.pendingInteractions[0];
       return sendJson(res, 200, {
         type: 'interaction_response',
         ...interaction,
@@ -227,6 +229,30 @@ async function handleCliGet(req, res, query) {
   });
 }
+/**
+ * Handle CLI DELETE (confirm receipt of interaction).
+ * Drops the first entry of the session's `pendingInteractions` array, if any.
+ *
+ * Responses (all sent through `sendJson`):
+ * - 400 `{ error: 'Missing token' }` when `query.token` is falsy
+ * - 404 `{ error: 'Session not found' }` when `getSession(token)` is falsy
+ * - 200 `{ success: true }` otherwise, including when the array was empty
+ *
+ * NOTE(review): the removal is by position only; no identifier of the
+ * confirmed interaction is read from the request. Presumably the CLI sends
+ * one DELETE per item it received - verify against the client.
+ *
+ * @param req - incoming request (not read in this function)
+ * @param res - response object handed to `sendJson`
+ * @param query - parsed query parameters; only `token` is used
+ * @returns the value returned by `sendJson`
+ */
+function handleCliDelete(req, res, query) {
+  const { token } = query;
+  if (!token) {
+    return sendJson(res, 400, { error: 'Missing token' });
+  }
+  const session = getSession(token);
+  if (!session) {
+    return sendJson(res, 404, { error: 'Session not found' });
+  }
+  // Remove the head entry; assumed to be the interaction the CLI just received
+  if (session.pendingInteractions.length > 0) {
+    session.pendingInteractions.shift();
+  }
+  return sendJson(res, 200, { success: true });
+}
 /**
  * Handle SSE events endpoint for browsers
  */
@@ -446,7 +472,7 @@ async function handleRequest(req, res) {
   if (req.method === 'OPTIONS') {
     res.writeHead(200, {
       'Access-Control-Allow-Origin': '*',
-      'Access-Control-Allow-Methods': 'GET, POST, OPTIONS',
+      'Access-Control-Allow-Methods': 'GET, POST, DELETE, OPTIONS',
       'Access-Control-Allow-Headers': 'Content-Type',
     });
     return res.end();
@@ -460,6 +486,9 @@ async function handleRequest(req, res) {
     if (req.method === 'GET') {
       return handleCliGet(req, res, query);
     }
+    if (req.method === 'DELETE') {
+      return handleCliDelete(req, res, query);
+    }
   }
   // Route: Session UI