npm - @quintinshaw/pi-dynamic-workflows - Versions diffs - 1.3.0 → 1.5.0 - Mend

@quintinshaw/pi-dynamic-workflows 1.3.0 → 1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (19)

package/README.md +6 -3
package/dist/agent.d.ts +2 -0
package/dist/agent.js +6 -2
package/dist/index.d.ts +3 -1
package/dist/index.js +1 -0
package/dist/run-persistence.d.ts +6 -0
package/dist/workflow-manager.d.ts +8 -2
package/dist/workflow-manager.js +50 -6
package/dist/workflow.d.ts +14 -0
package/dist/workflow.js +46 -2
package/dist/worktree.d.ts +25 -0
package/dist/worktree.js +61 -0
package/package.json +1 -1
package/src/agent.ts +8 -2
package/src/index.ts +3 -0
package/src/run-persistence.ts +2 -0
package/src/workflow-manager.ts +62 -7
package/src/workflow.ts +69 -3
package/src/worktree.ts +76 -0

package/README.md CHANGED Viewed

@@ -99,6 +99,7 @@ return { inventory, summary }
 | `phase` | string | Override the current phase for this agent |
 | `schema` | object | JSON Schema for structured output |
 | `model` | string | Run this agent on a specific model — `provider/modelId` or a bare `modelId` |
+| `isolation` | `"worktree"` | Run this agent in its own throwaway git worktree (parallel edits without conflict) |
 | `timeoutMs` | number | Override the default 5-minute agent timeout |
 Models can also be set per phase via `meta.phases[].model`. Precedence is `opts.model` > phase model > session default; an unknown model logs a warning and falls back to the default.
@@ -133,7 +134,9 @@ Scripts run inside a Node `vm` sandbox. Intentionally unavailable: `Date.now()`,
 - **Structured output** — JSON-Schema-validated subagent results
 - **Real token & cost accounting** — read from each subagent's SDK session (input / output / total / cost), with a character estimate only as fallback when a provider reports no usage; `budget` gates on the real total
 - **Real per-agent / per-phase model routing** — `opts.model` and `meta.phases[].model` actually select the model (resolved against your authed model registry), with graceful fallback
-- **`/workflows` command** — list, inspect, stop, pause, and remove background runs; runs started with `background: true` are reachable from the command
+- **`/workflows` command** — list, inspect, stop, pause, **resume**, and remove background runs; runs started with `background: true` are reachable from the command
+- **Resume** — each agent result is journaled by a deterministic call index; resuming replays the unchanged prefix from cache (no re-run, no tokens) and runs only new or edited calls live
+- **Worktree isolation** — `isolation: "worktree"` runs an agent in its own git worktree on a throwaway branch, so parallel agents can edit the same files without conflict; the worktree is torn down after (results are not auto-merged), and it falls back to a logged no-op outside a git repo
 - **Safety limits** — 1000-agent cap (`maxAgents`), per-agent timeout (`agentTimeoutMs`), recoverable-vs-fatal error classification
 - **Live progress + token/cost display**, `Esc` to abort
 - **Log persistence** to `.pi/workflows/runs/`
@@ -142,9 +145,9 @@ Scripts run inside a Node `vm` sandbox. Intentionally unavailable: `Date.now()`,
 Tracked toward closer parity with Claude Code dynamic workflows:
-- **Resume** — journaled results, replay the unchanged prefix, run the rest live
-- **Worktree isolation** for parallel edits, and **bundled `/deep-research`**
+- **Bundled `/deep-research`** and `/adversarial-review` workflows
 - **Saved workflows** as `/<name>` slash commands
+- **Nested `workflow()`** to compose saved workflows inline
 ## How it works

package/dist/agent.d.ts CHANGED Viewed

@@ -38,6 +38,8 @@ export interface AgentRunOptions<TSchemaDef extends TSchema | undefined = undefi
     model?: string;
     /** Called with the resolved model id once known (for display/telemetry). */
     onModelResolved?: (modelId: string) => void;
+    /** Run this agent in a different working directory (e.g. an isolated worktree). */
+    cwd?: string;
 }
 export type AgentRunResult<TSchemaDef extends TSchema | undefined> = TSchemaDef extends TSchema ? Static<TSchemaDef> : string;
 export declare class WorkflowAgent {

package/dist/agent.js CHANGED Viewed

@@ -39,7 +39,11 @@ export class WorkflowAgent {
     }
     async run(prompt, options = {}) {
         const capture = { called: false, value: undefined };
-        const customTools = [...this.baseTools, ...(options.tools ?? [])];
+        // Per-call cwd (e.g. a worktree) needs coding tools bound to that directory,
+        // since tools capture their cwd at construction and can't be relocated.
+        const runCwd = options.cwd ?? this.cwd;
+        const baseTools = runCwd === this.cwd ? this.baseTools : createCodingTools(runCwd);
+        const customTools = [...baseTools, ...(options.tools ?? [])];
         if (options.schema) {
             customTools.push(createStructuredOutputTool({ schema: options.schema, capture }));
         }
@@ -57,7 +61,7 @@ export class WorkflowAgent {
         }
         const agentDir = getAgentDir();
         const { session } = await createAgentSession({
-            cwd: this.cwd,
+            cwd: runCwd,
             agentDir,
             sessionManager: SessionManager.inMemory(),
             // Use real SettingsManager to inherit user's default provider/model settings.

package/dist/index.d.ts CHANGED Viewed

@@ -18,7 +18,7 @@ export type { PersistedRunState, RunPersistence, RunStatus } from "./run-persist
 export { createRunPersistence, generateRunId } from "./run-persistence.js";
 export type { StructuredOutputCapture, StructuredOutputToolOptions } from "./structured-output.js";
 export { createStructuredOutputTool } from "./structured-output.js";
-export type { AgentOptions, WorkflowMeta, WorkflowMetaPhase, WorkflowRunOptions, WorkflowRunResult, } from "./workflow.js";
+export type { AgentOptions, JournalEntry, WorkflowMeta, WorkflowMetaPhase, WorkflowRunOptions, WorkflowRunResult, } from "./workflow.js";
 export { parseWorkflowScript, runWorkflow } from "./workflow.js";
 export { registerWorkflowCommands } from "./workflow-commands.js";
 export type { ManagedRun, WorkflowManagerOptions } from "./workflow-manager.js";
@@ -27,3 +27,5 @@ export type { SavedWorkflow, WorkflowStorage } from "./workflow-saved.js";
 export { createWorkflowStorage } from "./workflow-saved.js";
 export type { WorkflowToolInput, WorkflowToolOptions } from "./workflow-tool.js";
 export { createWorkflowTool } from "./workflow-tool.js";
+export type { Worktree } from "./worktree.js";
+export { createWorktree, removeWorktree } from "./worktree.js";

package/dist/index.js CHANGED Viewed

@@ -14,3 +14,4 @@ export { registerWorkflowCommands } from "./workflow-commands.js";
 export { WorkflowManager } from "./workflow-manager.js";
 export { createWorkflowStorage } from "./workflow-saved.js";
 export { createWorkflowTool } from "./workflow-tool.js";
+export { createWorktree, removeWorktree } from "./worktree.js";

package/dist/run-persistence.d.ts CHANGED Viewed

@@ -33,6 +33,12 @@ export interface PersistedRunState {
         output: number;
         total: number;
     };
+    /** Cached agent results for resume, keyed by deterministic call index. */
+    journal?: Array<{
+        index: number;
+        hash: string;
+        result: unknown;
+    }>;
 }
 export interface RunPersistence {
     /** Save current run state. */

package/dist/workflow-manager.d.ts CHANGED Viewed

@@ -5,7 +5,7 @@ import { EventEmitter } from "node:events";
 import type { WorkflowSnapshot } from "./display.js";
 import { WorkflowError } from "./errors.js";
 import { type PersistedRunState, type RunPersistence, type RunStatus } from "./run-persistence.js";
-import { type WorkflowRunResult } from "./workflow.js";
+import { type JournalEntry, type WorkflowRunResult } from "./workflow.js";
 export interface ManagedRun {
     runId: string;
     status: RunStatus;
@@ -14,6 +14,11 @@ export interface ManagedRun {
     error?: WorkflowError;
     controller: AbortController;
     startedAt: Date;
+    /** The real script, kept so the run can be resumed. */
+    script: string;
+    args?: unknown;
+    /** Accumulated agent results for resume (deterministic call index -> result). */
+    journal: JournalEntry[];
 }
 export interface WorkflowManagerOptions {
     cwd?: string;
@@ -44,7 +49,8 @@ export declare class WorkflowManager extends EventEmitter {
      */
     pause(runId: string): boolean;
     /**
-     * Resume a paused workflow.
+     * Resume an interrupted run: replay journaled results for the unchanged prefix
+     * and run the rest live. Returns false if there is nothing resumable.
      */
     resume(runId: string): Promise<boolean>;
     /**

package/dist/workflow-manager.js CHANGED Viewed

@@ -40,6 +40,9 @@ export class WorkflowManager extends EventEmitter {
             },
             controller,
             startedAt: new Date(),
+            script,
+            args,
+            journal: [],
         };
         this.runs.set(runId, managed);
         // Persist initial state
@@ -82,17 +85,28 @@ export class WorkflowManager extends EventEmitter {
             },
             controller,
             startedAt: new Date(),
+            script,
+            args,
+            journal: [],
         };
         this.runs.set(runId, managed);
         return this.executeRun(managed, script, args);
     }
-    async executeRun(managed, script, args) {
+    async executeRun(managed, script, args, resumeJournal) {
         try {
             const result = await runWorkflow(script, {
                 cwd: this.cwd,
                 args,
                 signal: managed.controller.signal,
                 concurrency: this.concurrency,
+                resumeJournal,
+                resumeFromRunId: resumeJournal ? managed.runId : undefined,
+                onAgentJournal: (entry) => {
+                    // Append (crash-safe-ish): keep the latest entry per index, then persist.
+                    managed.journal = managed.journal.filter((e) => e.index !== entry.index);
+                    managed.journal.push(entry);
+                    this.persistRun(managed);
+                },
                 onLog: (message) => {
                     managed.snapshot.logs.push(message);
                     this.emit("log", { runId: managed.runId, message });
@@ -152,7 +166,11 @@ export class WorkflowManager extends EventEmitter {
         this.persistence.save({
             runId: managed.runId,
             workflowName: managed.snapshot.name,
-            script: "", // Don't persist script for security
+            // Persist the real script + journal so the run can be resumed. Runs live
+            // under .pi/workflows/runs/ — protect via directory permissions, not blanking.
+            script: managed.script,
+            args: managed.args,
+            journal: managed.journal,
             status: managed.status,
             phases: managed.snapshot.phases,
             currentPhase: managed.snapshot.currentPhase,
@@ -183,15 +201,41 @@ export class WorkflowManager extends EventEmitter {
         return true;
     }
     /**
-     * Resume a paused workflow.
+     * Resume an interrupted run: replay journaled results for the unchanged prefix
+     * and run the rest live. Returns false if there is nothing resumable.
      */
     async resume(runId) {
+        const active = this.runs.get(runId);
+        if (active?.status === "running")
+            return false; // already running
         const persisted = this.persistence.load(runId);
-        if (persisted?.status !== "paused")
+        if (!persisted?.script || persisted.status === "completed")
             return false;
-        // For now, resume creates a fresh run with completed agents' results cached
-        // Full resume would require re-executing the script with cached results
+        const controller = new AbortController();
+        const managed = {
+            runId,
+            status: "running",
+            snapshot: {
+                name: persisted.workflowName,
+                phases: persisted.phases ?? [],
+                logs: persisted.logs ?? [],
+                agents: [],
+                agentCount: 0,
+                runningCount: 0,
+                doneCount: 0,
+                errorCount: 0,
+            },
+            controller,
+            startedAt: new Date(),
+            script: persisted.script,
+            args: persisted.args,
+            journal: persisted.journal ?? [],
+        };
+        this.runs.set(runId, managed);
+        const resumeJournal = new Map((persisted.journal ?? []).map((e) => [e.index, e]));
         this.emit("resumed", { runId });
+        // Run in the background; executeRun records status/errors on the managed run.
+        void this.executeRun(managed, persisted.script, persisted.args, resumeJournal).catch(() => { });
         return true;
     }
     /**

package/dist/workflow.d.ts CHANGED Viewed

@@ -11,6 +11,13 @@ export interface WorkflowMeta {
     whenToUse?: string;
     phases?: WorkflowMetaPhase[];
 }
+/** One cached agent() result, keyed by its deterministic call index. */
+export interface JournalEntry {
+    index: number;
+    /** sha256 of the call's identity (prompt + model + phase + agentType + schema). */
+    hash: string;
+    result: unknown;
+}
 export interface WorkflowRunOptions extends WorkflowAgentOptions {
     args?: unknown;
     agent?: Pick<WorkflowAgent, "run">;
@@ -25,6 +32,12 @@ export interface WorkflowRunOptions extends WorkflowAgentOptions {
     persistLogs?: boolean;
     /** Run ID for persistence. Auto-generated if not provided. */
     runId?: string;
+    /** Resume: cached agent results keyed by deterministic call index. */
+    resumeJournal?: Map<number, JournalEntry>;
+    /** Resume: the run being resumed (informational; enables resume mode). */
+    resumeFromRunId?: string;
+    /** Called after each live agent completes so the caller can persist the journal. */
+    onAgentJournal?: (entry: JournalEntry) => void;
     onLog?: (message: string) => void;
     onPhase?: (title: string) => void;
     onAgentStart?: (event: {
@@ -38,6 +51,7 @@ export interface WorkflowRunOptions extends WorkflowAgentOptions {
         phase?: string;
         result: unknown;
         tokens?: number;
+        worktree?: string;
     }) => void;
     onTokenUsage?: (usage: {
         input: number;

package/dist/workflow.js CHANGED Viewed

@@ -1,3 +1,4 @@
+import { createHash } from "node:crypto";
 import vm from "node:vm";
 import { parse } from "acorn";
 import { WorkflowAgent } from "./agent.js";
@@ -5,6 +6,7 @@ import { DEFAULT_AGENT_TIMEOUT_MS, MAX_AGENTS_PER_RUN, MAX_CONCURRENCY } from ".
 import { WorkflowError, WorkflowErrorCode, wrapError } from "./errors.js";
 import { createWorkflowLogger } from "./logger.js";
 import { parseModelRoutingFromMeta, resolveModelForPhase } from "./model-routing.js";
+import { createWorktree, removeWorktree } from "./worktree.js";
 const DETERMINISM_BLOCKLIST = /\bDate\s*\.\s*now\b|\bMath\s*\.\s*random\b|\bnew\s+Date\s*\(\s*\)/;
 export async function runWorkflow(script, options = {}) {
     const started = Date.now();
@@ -14,6 +16,7 @@ export async function runWorkflow(script, options = {}) {
     const maxAgents = options.maxAgents ?? MAX_AGENTS_PER_RUN;
     const agentTimeoutMs = options.agentTimeoutMs ?? DEFAULT_AGENT_TIMEOUT_MS;
     const runId = options.runId ?? `run-${started.toString(36)}`;
+    const baseCwd = options.cwd ?? process.cwd();
     // Initialize logger
     const logger = createWorkflowLogger({
         runId,
@@ -25,6 +28,7 @@ export async function runWorkflow(script, options = {}) {
         logs: [],
         phases: [],
         agentCount: 0,
+        callSeq: 0,
         spent: 0,
         tokenUsage: { input: 0, output: 0, total: 0, cost: 0 },
     };
@@ -67,11 +71,33 @@ export async function runWorkflow(script, options = {}) {
         const requestedLabel = agentOptions.label?.trim();
         // Precedence: explicit agentOptions.model > phase model (meta.phases[].model).
         const modelSpec = agentOptions.model ?? resolveModelForPhase(assignedPhase, routingConfig);
+        // Deterministic resume key: assigned at lexical call time, before the limiter,
+        // so parallel()/pipeline() fan-out is reproducible for a fixed script.
+        const callIndex = state.callSeq++;
+        const callHash = hashAgentCall(prompt, modelSpec, assignedPhase, agentOptions);
+        // Resume: replay a cached result for an unchanged call (matching hash), without
+        // consuming a concurrency slot, tokens, or a real subagent run.
+        const cached = options.resumeJournal?.get(callIndex);
+        if (cached && cached.hash === callHash) {
+            state.agentCount++;
+            const label = requestedLabel || defaultAgentLabel(assignedPhase, state.agentCount);
+            options.onAgentStart?.({ label, phase: assignedPhase, prompt, model: modelSpec });
+            options.onAgentEnd?.({ label, phase: assignedPhase, result: cached.result, tokens: 0 });
+            return cached.result;
+        }
         return limiter(async () => {
             state.agentCount++;
             const label = requestedLabel || defaultAgentLabel(assignedPhase, state.agentCount);
             const timeout = agentOptions.timeoutMs ?? agentTimeoutMs;
             options.onAgentStart?.({ label, phase: assignedPhase, prompt, model: modelSpec });
+            // Optional per-agent worktree isolation (deterministic name -> stable resume keys).
+            let worktree;
+            if (agentOptions.isolation === "worktree") {
+                worktree = await createWorktree(baseCwd, `${runId}-${callIndex}-${label}`);
+                if (!worktree.isolated)
+                    log(`isolation ignored for "${label}" (${worktree.reason})`);
+            }
+            const runCwd = worktree?.isolated ? worktree.cwd : undefined;
             // Captured from the subagent's real session usage; falls back to an
             // estimate when the provider reports no usage (total === 0).
             let usage;
@@ -95,13 +121,15 @@ export async function runWorkflow(script, options = {}) {
                     signal: options.signal,
                     instructions: buildAgentInstructions(assignedPhase, agentOptions),
                     model: modelSpec,
+                    cwd: runCwd,
                     onUsage: (u) => {
                         usage = u;
                     },
                 }), timeout, `Agent "${label}" timed out after ${timeout}ms`);
                 throwIfAborted();
                 const tokens = recordTokens(result);
-                options.onAgentEnd?.({ label, phase: assignedPhase, result, tokens });
+                options.onAgentJournal?.({ index: callIndex, hash: callHash, result });
+                options.onAgentEnd?.({ label, phase: assignedPhase, result, tokens, worktree: runCwd });
                 return result;
             }
             catch (error) {
@@ -110,13 +138,18 @@ export async function runWorkflow(script, options = {}) {
                 const workflowError = wrapError(error, { agentLabel: label });
                 logger.error(`agent ${label} failed: ${workflowError.message}`);
                 const tokens = recordTokens(null);
-                options.onAgentEnd?.({ label, phase: assignedPhase, result: null, tokens });
+                options.onAgentEnd?.({ label, phase: assignedPhase, result: null, tokens, worktree: runCwd });
                 // Return null for recoverable errors
                 if (workflowError.recoverable) {
                     return null;
                 }
                 throw workflowError;
             }
+            finally {
+                // Always tear down the worktree, even on timeout/abort.
+                if (worktree?.isolated)
+                    await removeWorktree(worktree);
+            }
         });
     };
     const parallel = async (thunks) => {
@@ -348,6 +381,17 @@ function createLimiter(limit) {
 function defaultAgentLabel(phase, index) {
     return phase ? `${phase} agent ${index}` : `agent ${index}`;
 }
+/** Stable identity hash for an agent() call — a cache miss on resume when anything changes. */
+function hashAgentCall(prompt, model, phase, options) {
+    const identity = JSON.stringify({
+        prompt,
+        model: model ?? null,
+        phase: phase ?? null,
+        agentType: options.agentType ?? null,
+        schema: options.schema ?? null,
+    });
+    return createHash("sha256").update(identity).digest("hex");
+}
 function buildAgentInstructions(phase, options) {
     const lines = [];
     if (phase)

package/dist/worktree.d.ts ADDED Viewed

@@ -0,0 +1,25 @@
+/**
+ * Per-agent git worktree isolation. When an agent requests `isolation: "worktree"`,
+ * it runs in a throwaway worktree on its own branch so parallel agents can edit the
+ * same files without conflict. Results are NOT auto-merged — the path is surfaced for
+ * the caller to inspect. Falls back to a logged no-op when isolation isn't possible.
+ */
+export interface Worktree {
+    /** True when a real worktree was created; false means "ran in the shared tree". */
+    isolated: boolean;
+    /** cwd the agent should run in (worktree path when isolated, else the base cwd). */
+    cwd: string;
+    branch?: string;
+    /** Repo root the worktree was added to (for teardown). */
+    repoRoot?: string;
+    /** Why isolation was skipped, when isolated === false. */
+    reason?: string;
+}
+/**
+ * Create an isolated worktree under `<repoRoot>/.pi/worktrees/<name>` on branch
+ * `pi/wf/<name>`. The `name` must be deterministic (derived from runId + call index,
+ * never wall-clock) so resume keys stay stable. Returns a no-op Worktree on any failure.
+ */
+export declare function createWorktree(baseCwd: string, name: string): Promise<Worktree>;
+/** Remove a worktree and its branch. Best-effort; safe to call on a no-op Worktree. */
+export declare function removeWorktree(wt: Worktree): Promise<void>;

package/dist/worktree.js ADDED Viewed

@@ -0,0 +1,61 @@
+/**
+ * Per-agent git worktree isolation. When an agent requests `isolation: "worktree"`,
+ * it runs in a throwaway worktree on its own branch so parallel agents can edit the
+ * same files without conflict. Results are NOT auto-merged — the path is surfaced for
+ * the caller to inspect. Falls back to a logged no-op when isolation isn't possible.
+ */
+import { execFile } from "node:child_process";
+import { join } from "node:path";
+import { promisify } from "node:util";
+const exec = promisify(execFile);
+function slug(name) {
+    return (name
+        .toLowerCase()
+        .replace(/[^a-z0-9]+/g, "-")
+        .replace(/^-+|-+$/g, "")
+        .slice(0, 32) || "agent");
+}
+/**
+ * Create an isolated worktree under `<repoRoot>/.pi/worktrees/<name>` on branch
+ * `pi/wf/<name>`. The `name` must be deterministic (derived from runId + call index,
+ * never wall-clock) so resume keys stay stable. Returns a no-op Worktree on any failure.
+ */
+export async function createWorktree(baseCwd, name) {
+    const id = slug(name);
+    let repoRoot;
+    try {
+        const { stdout } = await exec("git", ["-C", baseCwd, "rev-parse", "--show-toplevel"]);
+        repoRoot = stdout.trim();
+    }
+    catch {
+        return { isolated: false, cwd: baseCwd, reason: "not a git repository" };
+    }
+    const path = join(repoRoot, ".pi", "worktrees", id);
+    const branch = `pi/wf/${id}`;
+    try {
+        await exec("git", ["-C", repoRoot, "worktree", "add", "-b", branch, path, "HEAD"]);
+        return { isolated: true, cwd: path, branch, repoRoot };
+    }
+    catch (error) {
+        return { isolated: false, cwd: baseCwd, reason: error instanceof Error ? error.message : String(error) };
+    }
+}
+/** Remove a worktree and its branch. Best-effort; safe to call on a no-op Worktree. */
+export async function removeWorktree(wt) {
+    if (!wt.isolated || !wt.repoRoot)
+        return;
+    try {
+        await exec("git", ["-C", wt.repoRoot, "worktree", "remove", "--force", wt.cwd]);
+    }
+    catch {
+        // already gone / locked — fall through
+    }
+    if (wt.branch) {
+        try {
+            await exec("git", ["-C", wt.repoRoot, "branch", "-D", wt.branch]);
+        }
+        catch {
+            // branch already deleted
+        }
+    }
+}

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@quintinshaw/pi-dynamic-workflows",
-  "version": "1.3.0",
+  "version": "1.5.0",
   "description": "Claude-Code-style dynamic workflow orchestration for Pi.",
   "type": "module",
   "main": "./dist/index.js",

package/src/agent.ts CHANGED Viewed

@@ -54,6 +54,8 @@ export interface AgentRunOptions<TSchemaDef extends TSchema | undefined = undefi
   model?: string;
   /** Called with the resolved model id once known (for display/telemetry). */
   onModelResolved?: (modelId: string) => void;
+  /** Run this agent in a different working directory (e.g. an isolated worktree). */
+  cwd?: string;
 }
 export type AgentRunResult<TSchemaDef extends TSchema | undefined> = TSchemaDef extends TSchema
@@ -105,7 +107,11 @@ export class WorkflowAgent {
     options: AgentRunOptions<TSchemaDef> = {},
   ): Promise<AgentRunResult<TSchemaDef>> {
     const capture: StructuredOutputCapture<any> = { called: false, value: undefined };
-    const customTools: ToolDefinition[] = [...this.baseTools, ...(options.tools ?? [])];
+    // Per-call cwd (e.g. a worktree) needs coding tools bound to that directory,
+    // since tools capture their cwd at construction and can't be relocated.
+    const runCwd = options.cwd ?? this.cwd;
+    const baseTools = runCwd === this.cwd ? this.baseTools : createCodingTools(runCwd);
+    const customTools: ToolDefinition[] = [...baseTools, ...(options.tools ?? [])];
     if (options.schema) {
       customTools.push(createStructuredOutputTool({ schema: options.schema, capture }) as unknown as ToolDefinition);
@@ -125,7 +131,7 @@ export class WorkflowAgent {
     const agentDir = getAgentDir();
     const { session } = await createAgentSession({
-      cwd: this.cwd,
+      cwd: runCwd,
       agentDir,
       sessionManager: SessionManager.inMemory(),
       // Use real SettingsManager to inherit user's default provider/model settings.

package/src/index.ts CHANGED Viewed

@@ -41,6 +41,7 @@ export type { StructuredOutputCapture, StructuredOutputToolOptions } from "./str
 export { createStructuredOutputTool } from "./structured-output.js";
 export type {
   AgentOptions,
+  JournalEntry,
   WorkflowMeta,
   WorkflowMetaPhase,
   WorkflowRunOptions,
@@ -54,3 +55,5 @@ export type { SavedWorkflow, WorkflowStorage } from "./workflow-saved.js";
 export { createWorkflowStorage } from "./workflow-saved.js";
 export type { WorkflowToolInput, WorkflowToolOptions } from "./workflow-tool.js";
 export { createWorkflowTool } from "./workflow-tool.js";
+export type { Worktree } from "./worktree.js";
+export { createWorktree, removeWorktree } from "./worktree.js";

package/src/run-persistence.ts CHANGED Viewed

@@ -40,6 +40,8 @@ export interface PersistedRunState {
     output: number;
     total: number;
   };
+  /** Cached agent results for resume, keyed by deterministic call index. */
+  journal?: Array<{ index: number; hash: string; result: unknown }>;
 }
 export interface RunPersistence {

package/src/workflow-manager.ts CHANGED Viewed

@@ -12,7 +12,7 @@ import {
   type RunPersistence,
   type RunStatus,
 } from "./run-persistence.js";
-import { parseWorkflowScript, runWorkflow, type WorkflowRunResult } from "./workflow.js";
+import { type JournalEntry, parseWorkflowScript, runWorkflow, type WorkflowRunResult } from "./workflow.js";
 export interface ManagedRun {
   runId: string;
@@ -22,6 +22,11 @@ export interface ManagedRun {
   error?: WorkflowError;
   controller: AbortController;
   startedAt: Date;
+  /** The real script, kept so the run can be resumed. */
+  script: string;
+  args?: unknown;
+  /** Accumulated agent results for resume (deterministic call index -> result). */
+  journal: JournalEntry[];
 }
 export interface WorkflowManagerOptions {
@@ -67,6 +72,9 @@ export class WorkflowManager extends EventEmitter {
       },
       controller,
       startedAt: new Date(),
+      script,
+      args,
+      journal: [],
     };
     this.runs.set(runId, managed);
@@ -115,19 +123,35 @@ export class WorkflowManager extends EventEmitter {
       },
       controller,
       startedAt: new Date(),
+      script,
+      args,
+      journal: [],
     };
     this.runs.set(runId, managed);
     return this.executeRun(managed, script, args);
   }
-  private async executeRun(managed: ManagedRun, script: string, args?: unknown): Promise<WorkflowRunResult> {
+  private async executeRun(
+    managed: ManagedRun,
+    script: string,
+    args?: unknown,
+    resumeJournal?: Map<number, JournalEntry>,
+  ): Promise<WorkflowRunResult> {
     try {
       const result = await runWorkflow(script, {
         cwd: this.cwd,
         args,
         signal: managed.controller.signal,
         concurrency: this.concurrency,
+        resumeJournal,
+        resumeFromRunId: resumeJournal ? managed.runId : undefined,
+        onAgentJournal: (entry) => {
+          // Append (crash-safe-ish): keep the latest entry per index, then persist.
+          managed.journal = managed.journal.filter((e) => e.index !== entry.index);
+          managed.journal.push(entry);
+          this.persistRun(managed);
+        },
         onLog: (message) => {
           managed.snapshot.logs.push(message);
           this.emit("log", { runId: managed.runId, message });
@@ -197,7 +221,11 @@ export class WorkflowManager extends EventEmitter {
     this.persistence.save({
       runId: managed.runId,
       workflowName: managed.snapshot.name,
-      script: "", // Don't persist script for security
+      // Persist the real script + journal so the run can be resumed. Runs live
+      // under .pi/workflows/runs/ — protect via directory permissions, not blanking.
+      script: managed.script,
+      args: managed.args,
+      journal: managed.journal,
       status: managed.status,
       phases: managed.snapshot.phases,
       currentPhase: managed.snapshot.currentPhase,
@@ -230,15 +258,42 @@ export class WorkflowManager extends EventEmitter {
   }
   /**
-   * Resume a paused workflow.
+   * Resume an interrupted run: replay journaled results for the unchanged prefix
+   * and run the rest live. Returns false if there is nothing resumable.
    */
   async resume(runId: string): Promise<boolean> {
+    const active = this.runs.get(runId);
+    if (active?.status === "running") return false; // already running
     const persisted = this.persistence.load(runId);
-    if (persisted?.status !== "paused") return false;
+    if (!persisted?.script || persisted.status === "completed") return false;
+    const controller = new AbortController();
+    const managed: ManagedRun = {
+      runId,
+      status: "running",
+      snapshot: {
+        name: persisted.workflowName,
+        phases: persisted.phases ?? [],
+        logs: persisted.logs ?? [],
+        agents: [],
+        agentCount: 0,
+        runningCount: 0,
+        doneCount: 0,
+        errorCount: 0,
+      },
+      controller,
+      startedAt: new Date(),
+      script: persisted.script,
+      args: persisted.args,
+      journal: persisted.journal ?? [],
+    };
+    this.runs.set(runId, managed);
-    // For now, resume creates a fresh run with completed agents' results cached
-    // Full resume would require re-executing the script with cached results
+    const resumeJournal = new Map((persisted.journal ?? []).map((e) => [e.index, e] as const));
     this.emit("resumed", { runId });
+    // Run in the background; executeRun records status/errors on the managed run.
+    void this.executeRun(managed, persisted.script, persisted.args, resumeJournal).catch(() => {});
     return true;
   }

package/src/workflow.ts CHANGED Viewed

@@ -1,3 +1,4 @@
+import { createHash } from "node:crypto";
 import vm from "node:vm";
 import type { Node } from "acorn";
 import { parse } from "acorn";
@@ -8,6 +9,7 @@ import { DEFAULT_AGENT_TIMEOUT_MS, MAX_AGENTS_PER_RUN, MAX_CONCURRENCY } from ".
 import { WorkflowError, WorkflowErrorCode, wrapError } from "./errors.js";
 import { createWorkflowLogger } from "./logger.js";
 import { parseModelRoutingFromMeta, resolveModelForPhase } from "./model-routing.js";
+import { createWorktree, removeWorktree, type Worktree } from "./worktree.js";
 export interface WorkflowMetaPhase {
   title: string;
@@ -22,6 +24,14 @@ export interface WorkflowMeta {
   phases?: WorkflowMetaPhase[];
 }
+/**
+ * One cached agent() result, keyed by its deterministic call index.
+ * Entries are reported through `onAgentJournal` after a live agent completes and
+ * looked up in `resumeJournal` on resume, where an entry is replayed only when its
+ * `hash` equals the hash of the call being made.
+ */
+export interface JournalEntry {
+  /** Sequence number of the agent() call within the run (taken from the run's `callSeq` counter). */
+  index: number;
+  /** sha256 of the call's identity (prompt + model + phase + agentType + schema). */
+  hash: string;
+  /** The value the agent call resolved with; returned as-is when the entry is replayed. */
+  result: unknown;
+}
 export interface WorkflowRunOptions extends WorkflowAgentOptions {
   args?: unknown;
   agent?: Pick<WorkflowAgent, "run">;
@@ -36,10 +46,16 @@ export interface WorkflowRunOptions extends WorkflowAgentOptions {
   persistLogs?: boolean;
   /** Run ID for persistence. Auto-generated if not provided. */
   runId?: string;
+  /** Resume: cached agent results keyed by deterministic call index. */
+  resumeJournal?: Map<number, JournalEntry>;
+  /** Resume: the run being resumed (informational; enables resume mode). */
+  resumeFromRunId?: string;
+  /** Called after each live agent completes so the caller can persist the journal. */
+  onAgentJournal?: (entry: JournalEntry) => void;
   onLog?: (message: string) => void;
   onPhase?: (title: string) => void;
   onAgentStart?: (event: { label: string; phase?: string; prompt: string; model?: string }) => void;
-  onAgentEnd?: (event: { label: string; phase?: string; result: unknown; tokens?: number }) => void;
+  onAgentEnd?: (event: { label: string; phase?: string; result: unknown; tokens?: number; worktree?: string }) => void;
   onTokenUsage?: (usage: { input: number; output: number; total: number; cost: number }) => void;
 }
@@ -75,6 +91,8 @@ interface RuntimeState {
   logs: string[];
   phases: string[];
   agentCount: number;
+  /** Monotonic, assigned at lexical agent() call time — the stable resume key. */
+  callSeq: number;
   spent: number;
   tokenUsage: {
     input: number;
@@ -99,6 +117,7 @@ export async function runWorkflow<T = unknown>(
   const maxAgents = options.maxAgents ?? MAX_AGENTS_PER_RUN;
   const agentTimeoutMs = options.agentTimeoutMs ?? DEFAULT_AGENT_TIMEOUT_MS;
   const runId = options.runId ?? `run-${started.toString(36)}`;
+  const baseCwd = options.cwd ?? process.cwd();
   // Initialize logger
   const logger = createWorkflowLogger({
@@ -112,6 +131,7 @@ export async function runWorkflow<T = unknown>(
     logs: [],
     phases: [],
     agentCount: 0,
+    callSeq: 0,
     spent: 0,
     tokenUsage: { input: 0, output: 0, total: 0, cost: 0 },
   };
@@ -170,6 +190,22 @@ export async function runWorkflow<T = unknown>(
     // Precedence: explicit agentOptions.model > phase model (meta.phases[].model).
     const modelSpec = agentOptions.model ?? resolveModelForPhase(assignedPhase, routingConfig);
+    // Deterministic resume key: assigned at lexical call time, before the limiter,
+    // so parallel()/pipeline() fan-out is reproducible for a fixed script.
+    const callIndex = state.callSeq++;
+    const callHash = hashAgentCall(prompt, modelSpec, assignedPhase, agentOptions);
+    // Resume: replay a cached result for an unchanged call (matching hash), without
+    // consuming a concurrency slot, tokens, or a real subagent run.
+    const cached = options.resumeJournal?.get(callIndex);
+    if (cached && cached.hash === callHash) {
+      state.agentCount++;
+      const label = requestedLabel || defaultAgentLabel(assignedPhase, state.agentCount);
+      options.onAgentStart?.({ label, phase: assignedPhase, prompt, model: modelSpec });
+      options.onAgentEnd?.({ label, phase: assignedPhase, result: cached.result, tokens: 0 });
+      return cached.result;
+    }
     return limiter(async () => {
       state.agentCount++;
       const label = requestedLabel || defaultAgentLabel(assignedPhase, state.agentCount);
@@ -177,6 +213,14 @@ export async function runWorkflow<T = unknown>(
       options.onAgentStart?.({ label, phase: assignedPhase, prompt, model: modelSpec });
+      // Optional per-agent worktree isolation (deterministic name -> stable resume keys).
+      let worktree: Worktree | undefined;
+      if (agentOptions.isolation === "worktree") {
+        worktree = await createWorktree(baseCwd, `${runId}-${callIndex}-${label}`);
+        if (!worktree.isolated) log(`isolation ignored for "${label}" (${worktree.reason})`);
+      }
+      const runCwd = worktree?.isolated ? worktree.cwd : undefined;
       // Captured from the subagent's real session usage; falls back to an
       // estimate when the provider reports no usage (total === 0).
       let usage: AgentUsage | undefined;
@@ -203,6 +247,7 @@ export async function runWorkflow<T = unknown>(
             signal: options.signal,
             instructions: buildAgentInstructions(assignedPhase, agentOptions),
             model: modelSpec,
+            cwd: runCwd,
             onUsage: (u: AgentUsage) => {
               usage = u;
             },
@@ -214,7 +259,8 @@ export async function runWorkflow<T = unknown>(
         throwIfAborted();
         const tokens = recordTokens(result);
-        options.onAgentEnd?.({ label, phase: assignedPhase, result, tokens });
+        options.onAgentJournal?.({ index: callIndex, hash: callHash, result });
+        options.onAgentEnd?.({ label, phase: assignedPhase, result, tokens, worktree: runCwd });
         return result;
       } catch (error) {
         if (options.signal?.aborted) throw error;
@@ -222,13 +268,16 @@ export async function runWorkflow<T = unknown>(
         const workflowError = wrapError(error, { agentLabel: label });
         logger.error(`agent ${label} failed: ${workflowError.message}`);
         const tokens = recordTokens(null);
-        options.onAgentEnd?.({ label, phase: assignedPhase, result: null, tokens });
+        options.onAgentEnd?.({ label, phase: assignedPhase, result: null, tokens, worktree: runCwd });
         // Return null for recoverable errors
         if (workflowError.recoverable) {
           return null;
         }
         throw workflowError;
+      } finally {
+        // Always tear down the worktree, even on timeout/abort.
+        if (worktree?.isolated) await removeWorktree(worktree);
       }
     });
   };
@@ -481,6 +530,23 @@ function defaultAgentLabel(phase: string | undefined, index: number): string {
   return phase ? `${phase} agent ${index}` : `agent ${index}`;
 }
+/**
+ * Fingerprint an agent() call for resume. The digest covers the prompt, model,
+ * phase, agentType and schema, so changing any of them produces a different hash
+ * and therefore a cache miss.
+ */
+function hashAgentCall(
+  prompt: string,
+  model: string | undefined,
+  phase: string | undefined,
+  options: AgentOptions,
+): string {
+  const { agentType, schema } = options;
+  // Fixed key order, with absent values serialized as null, keeps the JSON form stable.
+  const fields = {
+    prompt,
+    model: model ?? null,
+    phase: phase ?? null,
+    agentType: agentType ?? null,
+    schema: schema ?? null,
+  };
+  const hasher = createHash("sha256");
+  hasher.update(JSON.stringify(fields));
+  return hasher.digest("hex");
+}
 function buildAgentInstructions(phase: string | undefined, options: AgentOptions): string | undefined {
   const lines = [];
   if (phase) lines.push(`Workflow phase: ${phase}`);

package/src/worktree.ts ADDED Viewed

@@ -0,0 +1,76 @@
+/**
+ * Per-agent git worktree isolation. When an agent requests `isolation: "worktree"`,
+ * it runs in a throwaway worktree on its own branch so parallel agents can edit the
+ * same files without conflict. Results are NOT auto-merged — the path is surfaced for
+ * the caller to inspect. Falls back to a logged no-op when isolation isn't possible.
+ */
+import { execFile } from "node:child_process";
+import { createHash } from "node:crypto";
+import { join } from "node:path";
+import { promisify } from "node:util";
+const exec = promisify(execFile);
+/** Outcome of createWorktree(): either a real isolated worktree or a no-op fallback describing why not. */
+export interface Worktree {
+  /** True when a real worktree was created; false means "ran in the shared tree". */
+  isolated: boolean;
+  /** cwd the agent should run in (worktree path when isolated, else the base cwd). */
+  cwd: string;
+  /** Branch created for the worktree (`pi/wf/<id>`); only set when isolated. */
+  branch?: string;
+  /** Repo root the worktree was added to (for teardown). */
+  repoRoot?: string;
+  /** Why isolation was skipped, when isolated === false. */
+  reason?: string;
+}
+/** Longest id slug() will return; keeps worktree directory and branch names short. */
+const MAX_SLUG_LENGTH = 32;
+/**
+ * Normalize an arbitrary name into a lowercase id made of `[a-z0-9]` runs joined by
+ * single dashes, at most MAX_SLUG_LENGTH characters long. Returns "agent" when the
+ * name contains no usable characters.
+ *
+ * Names that fit are returned unchanged after normalization. Longer names keep a
+ * prefix and gain a short sha256 suffix of the full name: plain truncation would
+ * drop the tail (call index and label), so distinct agents sharing a long prefix
+ * would collide on the same worktree path and branch. The result is deterministic
+ * for a given name.
+ */
+function slug(name: string): string {
+  const cleaned = name
+    .toLowerCase()
+    .replace(/[^a-z0-9]+/g, "-")
+    .replace(/^-+|-+$/g, "");
+  if (cleaned.length === 0) return "agent";
+  if (cleaned.length <= MAX_SLUG_LENGTH) return cleaned;
+  const digest = createHash("sha256").update(name).digest("hex").slice(0, 8);
+  // Re-trim after cutting so the prefix never ends in a dash before the suffix is joined.
+  const head = cleaned.slice(0, MAX_SLUG_LENGTH - digest.length - 1).replace(/-+$/, "");
+  return `${head}-${digest}`;
+}
+/**
+ * Add a git worktree at `<repoRoot>/.pi/worktrees/<id>` on a new branch `pi/wf/<id>`
+ * created from HEAD, where `<id>` is the slugged form of `name`. Callers must pass a
+ * deterministic `name` (runId + call index, never wall-clock) so resume keys stay
+ * stable. Never throws: any failure yields a non-isolated Worktree carrying the reason.
+ */
+export async function createWorktree(baseCwd: string, name: string): Promise<Worktree> {
+  // Single shape for every "could not isolate" outcome.
+  const fallback = (reason: string): Worktree => ({ isolated: false, cwd: baseCwd, reason });
+  const id = slug(name);
+  let repoRoot: string;
+  try {
+    const toplevel = await exec("git", ["-C", baseCwd, "rev-parse", "--show-toplevel"]);
+    repoRoot = toplevel.stdout.trim();
+  } catch {
+    return fallback("not a git repository");
+  }
+  const worktreePath = join(repoRoot, ".pi", "worktrees", id);
+  const branch = `pi/wf/${id}`;
+  try {
+    await exec("git", ["-C", repoRoot, "worktree", "add", "-b", branch, worktreePath, "HEAD"]);
+  } catch (error) {
+    return fallback(error instanceof Error ? error.message : String(error));
+  }
+  return { isolated: true, cwd: worktreePath, branch, repoRoot };
+}
+/**
+ * Tear down a worktree created by createWorktree(): force-remove the worktree, then
+ * delete its branch. Each step is best-effort and failures are ignored; a
+ * non-isolated Worktree is a no-op.
+ */
+export async function removeWorktree(wt: Worktree): Promise<void> {
+  const { isolated, repoRoot, branch, cwd } = wt;
+  if (!(isolated && repoRoot)) return;
+  // Run in order: the worktree first, then its branch (when one was recorded).
+  const steps: string[][] = [["worktree", "remove", "--force", cwd]];
+  if (branch) steps.push(["branch", "-D", branch]);
+  for (const step of steps) {
+    try {
+      await exec("git", ["-C", repoRoot, ...step]);
+    } catch {
+      // already gone / locked / branch already deleted — keep going
+    }
+  }
+}