npm - palmier - Versions diffs - 0.5.5 → 0.5.7 - Mend

palmier 0.5.5 → 0.5.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/README.md +1 -1
package/dist/agents/codex.js +1 -2
package/dist/commands/run.d.ts +0 -4
package/dist/commands/run.js +22 -4
package/dist/rpc-handler.js +30 -7
package/dist/spawn-command.js +0 -1
package/package.json +1 -1
package/src/agents/codex.ts +1 -2
package/src/commands/run.ts +23 -3
package/src/rpc-handler.ts +30 -8
package/src/spawn-command.ts +0 -1
package/test/taskrun-messages.test.ts +224 -0

package/README.md CHANGED Viewed

@@ -22,7 +22,7 @@ The serve daemon always runs a local HTTP server. Three access modes are availab
 **Local mode** is always available. The PWA is served at `http://localhost:<port>` and works without pairing or internet. The daemon binds to `127.0.0.1` by default.
-**LAN mode** is enabled during `palmier init`. The daemon binds to `0.0.0.0` instead, making the PWA and API endpoints accessible from the local network at `http://<host-ip>:<port>`. Devices must pair via OTP to access. Push notifications are not available.
+**LAN mode** can be enabled during `palmier init`. The daemon binds to `0.0.0.0` instead, making the PWA and API endpoints accessible from the local network at `http://<host-ip>:<port>`. Devices must pair via OTP to access. Push notifications are not available.
 **Server mode** relays communication through the Palmier cloud server (via [NATS](https://nats.io), a lightweight messaging system). All features including push notifications are available. The PWA is served over HTTPS. Server mode and LAN mode can be active at the same time.

package/dist/agents/codex.js CHANGED Viewed

@@ -12,8 +12,7 @@ export class CodexAgent {
     getTaskRunCommandLine(task, followupPrompt, extraPermissions) {
         const yolo = extraPermissions === "yolo";
         const prompt = followupPrompt ?? (getAgentInstructions(task.frontmatter.id, yolo || !this.supportsPermissions) + "\n\n" + (task.body || task.frontmatter.user_prompt));
-        // Using danger-full-access until workspace-write is fixed: https://github.com/openai/codex/issues/12572
-        const args = ["exec", "--skip-git-repo-check", "--sandbox", "danger-full-access"];
+        const args = ["exec", "--skip-git-repo-check", "--sandbox", yolo ? "danger-full-access" : "workspace-write"];
         if (!yolo) {
             const allPerms = [...(task.frontmatter.permissions ?? []), ...(extraPermissions ?? [])];
             for (const p of allPerms) {

package/dist/commands/run.d.ts CHANGED Viewed

@@ -7,10 +7,6 @@ export declare function stripPalmierMarkers(output: string): string;
  * Execute a task by ID.
  */
 export declare function runCommand(taskId: string): Promise<void>;
-/**
- * Extract report file names from agent output.
- * Looks for lines matching: [PALMIER_REPORT] <filename>
- */
 export declare function parseReportFiles(output: string): string[];
 /**
  * Extract required permissions from agent output.

package/dist/commands/run.js CHANGED Viewed

@@ -70,6 +70,14 @@ async function invokeAgentWithRetries(ctx, invokeTask) {
         }
         writer.end(reportFiles.length > 0 ? reportFiles : undefined);
         await publishHostEvent(ctx.nc, ctx.config.hostId, ctx.taskId, { event_type: "result-updated", run_id: ctx.runId });
+        if (reportFiles.length > 0) {
+            await publishHostEvent(ctx.nc, ctx.config.hostId, ctx.taskId, {
+                event_type: "report-generated",
+                run_id: ctx.runId,
+                name: ctx.task.frontmatter.name,
+                report_files: reportFiles,
+            });
+        }
         // Permission handling — agent requested permissions
         if (requiredPermissions.length > 0) {
             const response = await requestPermission(ctx.config, ctx.task, ctx.taskDir, requiredPermissions);
@@ -77,7 +85,7 @@ async function invokeAgentWithRetries(ctx, invokeTask) {
                 await appendAndNotify(ctx, {
                     role: "user",
                     time: Date.now(),
-                    content: "Denied",
+                    content: "Deny & Abort Task",
                     type: "permission",
                 });
                 return { outcome: "failed" };
@@ -87,7 +95,7 @@ async function invokeAgentWithRetries(ctx, invokeTask) {
             await appendAndNotify(ctx, {
                 role: "user",
                 time: Date.now(),
-                content: response === "granted_all" ? "Granted for all" : "Granted",
+                content: response === "granted_all" ? "Allow Always" : "Allow Once",
                 type: "permission",
             });
             if (response === "granted_all") {
@@ -173,14 +181,19 @@ export async function runCommand(taskId) {
         // If requires_confirmation, notify clients and wait
         if (task.frontmatter.requires_confirmation) {
             const confirmed = await requestConfirmation(config, task, taskDir);
+            const confirmPrompt = `**Task Confirmation**\n\nRun task "${taskName || task.frontmatter.user_prompt}"?`;
+            appendRunMessage(taskDir, runId, { role: "assistant", time: Date.now(), content: confirmPrompt, type: "confirmation" });
+            await publishHostEvent(nc, config.hostId, taskId, { event_type: "result-updated", run_id: runId });
             if (!confirmed) {
                 console.log("Task aborted by user.");
+                appendRunMessage(taskDir, runId, { role: "user", time: Date.now(), content: "Aborted", type: "confirmation" });
                 appendRunMessage(taskDir, runId, { role: "status", time: Date.now(), content: "", type: "aborted" });
                 await publishTaskEvent(nc, config, taskDir, taskId, "aborted", taskName, runId);
                 await cleanup();
                 return;
             }
             console.log("Task confirmed by user.");
+            appendRunMessage(taskDir, runId, { role: "user", time: Date.now(), content: "Confirmed", type: "confirmation" });
             appendRunMessage(taskDir, runId, { role: "status", time: Date.now(), content: "", type: "confirmation" });
             await publishHostEvent(nc, config.hostId, taskId, { event_type: "result-updated", run_id: runId });
         }
@@ -408,6 +421,7 @@ async function requestConfirmation(config, task, taskDir) {
  * Extract report file names from agent output.
  * Looks for lines matching: [PALMIER_REPORT] <filename>
  */
+const ALLOWED_REPORT_EXT = [".md", ".txt", ".png", ".jpg", ".jpeg", ".gif", ".svg", ".webp"];
 export function parseReportFiles(output) {
     const regex = new RegExp(`^\\${TASK_REPORT_PREFIX}\\s+(.+)$`, "gm");
     const files = [];
@@ -415,8 +429,12 @@ export function parseReportFiles(output) {
     while ((match = regex.exec(output)) !== null) {
         const name = match[1].trim();
         // Skip placeholder examples echoed from the prompt (e.g. "<filename>")
-        if (name && !name.startsWith("<"))
-            files.push(name);
+        if (!name || name.startsWith("<"))
+            continue;
+        const ext = name.lastIndexOf(".") >= 0 ? name.slice(name.lastIndexOf(".")).toLowerCase() : "";
+        if (!ALLOWED_REPORT_EXT.includes(ext))
+            continue;
+        files.push(name);
     }
     return files;
 }

package/dist/rpc-handler.js CHANGED Viewed

@@ -37,10 +37,12 @@ function parseResultFrontmatter(raw) {
     const startedMsg = statusMessages.find((m) => m.type === "started");
     const terminalStates = ["finished", "failed", "aborted"];
     const terminalMsg = [...statusMessages].reverse().find((m) => terminalStates.includes(m.type ?? ""));
-    // If last status is "started", determine if it's a task run or follow-up
+    // If last status is "started" (or continuation like "confirmation"/"monitoring"),
+    // determine if it's a task run or follow-up
+    const activeStates = ["started", "monitoring", "confirmation"];
     let runningState;
-    if (lastStatus?.type === "started" || lastStatus?.type === "monitoring") {
-        runningState = terminalMsg ? "followup" : (lastStatus?.type ?? "started");
+    if (activeStates.includes(lastStatus?.type ?? "")) {
+        runningState = terminalMsg ? "followup" : "started";
     }
     else {
         runningState = lastStatus?.type;
@@ -154,6 +156,17 @@ export function createRpcHandler(config, nc) {
                     host_platform: process.platform,
                 };
             }
+            case "task.get": {
+                const params = request.params;
+                const taskDir = getTaskDir(config.projectRoot, params.id);
+                try {
+                    const task = parseTaskFile(taskDir);
+                    return flattenTask(task);
+                }
+                catch {
+                    return { error: "Task not found" };
+                }
+            }
             case "task.create": {
                 const params = request.params;
                 // Only generate a plan for longer prompts that benefit from it
@@ -497,11 +510,14 @@ export function createRpcHandler(config, nc) {
                 if (!params.run_id || !Array.isArray(params.report_files) || params.report_files.length === 0) {
                     return { error: "run_id and report_files are required" };
                 }
+                const ALLOWED_EXT = [".md", ".txt", ".png", ".jpg", ".jpeg", ".gif", ".svg", ".webp"];
+                const IMAGE_EXT = [".png", ".jpg", ".jpeg", ".gif", ".svg", ".webp"];
                 const reports = [];
                 const runDir = path.join(config.projectRoot, "tasks", params.id, params.run_id);
                 for (const file of params.report_files) {
-                    if (!file.endsWith(".md") && !file.endsWith(".txt")) {
-                        reports.push({ file, error: "must end with .md or .txt" });
+                    const ext = path.extname(file).toLowerCase();
+                    if (!ALLOWED_EXT.includes(ext)) {
+                        reports.push({ file, error: `unsupported file type: ${ext}` });
                         continue;
                     }
                     const basename = path.basename(file);
@@ -511,8 +527,15 @@ export function createRpcHandler(config, nc) {
                     }
                     const reportPath = path.join(runDir, basename);
                     try {
-                        const content = fs.readFileSync(reportPath, "utf-8");
-                        reports.push({ file, content });
+                        if (IMAGE_EXT.includes(ext)) {
+                            const buf = fs.readFileSync(reportPath);
+                            const mime = ext === ".svg" ? "image/svg+xml" : `image/${ext.slice(1).replace("jpg", "jpeg")}`;
+                            reports.push({ file, data_url: `data:${mime};base64,${buf.toString("base64")}` });
+                        }
+                        else {
+                            const content = fs.readFileSync(reportPath, "utf-8");
+                            reports.push({ file, content });
+                        }
                     }
                     catch {
                         reports.push({ file, error: "Report file not found" });

package/dist/spawn-command.js CHANGED Viewed

@@ -61,7 +61,6 @@ export function spawnCommand(command, args, opts) {
                 opts.onData(d.toString("utf-8"));
         });
         child.stderr.on("data", (d) => {
-            chunks.push(d);
             process.stderr.write(d);
             if (opts.onData)
                 opts.onData(d.toString("utf-8"));

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "palmier",
-  "version": "0.5.5",
+  "version": "0.5.7",
   "description": "Palmier host CLI - provisions, executes tasks, and serves NATS RPC",
   "license": "Apache-2.0",
   "author": "Hongxu Cai",

package/src/agents/codex.ts CHANGED Viewed

@@ -16,8 +16,7 @@ export class CodexAgent implements AgentTool {
   getTaskRunCommandLine(task: ParsedTask, followupPrompt?: string, extraPermissions?: RequiredPermission[] | "yolo"): CommandLine {
     const yolo = extraPermissions === "yolo";
     const prompt = followupPrompt ?? (getAgentInstructions(task.frontmatter.id, yolo || !this.supportsPermissions) + "\n\n" + (task.body || task.frontmatter.user_prompt));
-    // Using danger-full-access until workspace-write is fixed: https://github.com/openai/codex/issues/12572
-    const args = ["exec", "--skip-git-repo-check", "--sandbox", "danger-full-access"];
+    const args = ["exec", "--skip-git-repo-check", "--sandbox", yolo ? "danger-full-access" : "workspace-write"];
     if (!yolo) {
       const allPerms = [...(task.frontmatter.permissions ?? []), ...(extraPermissions ?? [])];

package/src/commands/run.ts CHANGED Viewed

@@ -106,6 +106,15 @@ async function invokeAgentWithRetries(
     writer.end(reportFiles.length > 0 ? reportFiles : undefined);
     await publishHostEvent(ctx.nc, ctx.config.hostId, ctx.taskId, { event_type: "result-updated", run_id: ctx.runId });
+    if (reportFiles.length > 0) {
+      await publishHostEvent(ctx.nc, ctx.config.hostId, ctx.taskId, {
+        event_type: "report-generated",
+        run_id: ctx.runId,
+        name: ctx.task.frontmatter.name,
+        report_files: reportFiles,
+      });
+    }
     // Permission handling — agent requested permissions
     if (requiredPermissions.length > 0) {
       const response = await requestPermission(ctx.config, ctx.task, ctx.taskDir, requiredPermissions);
@@ -114,7 +123,7 @@ async function invokeAgentWithRetries(
         await appendAndNotify(ctx, {
           role: "user",
           time: Date.now(),
-          content: "Denied",
+          content: "Deny & Abort Task",
           type: "permission",
         });
         return { outcome: "failed" };
@@ -128,7 +137,7 @@ async function invokeAgentWithRetries(
       await appendAndNotify(ctx, {
         role: "user",
         time: Date.now(),
-        content: response === "granted_all" ? "Granted for all" : "Granted",
+        content: response === "granted_all" ? "Allow Always" : "Allow Once",
         type: "permission",
       });
@@ -228,14 +237,20 @@ export async function runCommand(taskId: string): Promise<void> {
     // If requires_confirmation, notify clients and wait
     if (task.frontmatter.requires_confirmation) {
       const confirmed = await requestConfirmation(config, task, taskDir);
+      const confirmPrompt = `**Task Confirmation**\n\nRun task "${taskName || task.frontmatter.user_prompt}"?`;
+      appendRunMessage(taskDir, runId, { role: "assistant", time: Date.now(), content: confirmPrompt, type: "confirmation" });
+      await publishHostEvent(nc, config.hostId, taskId, { event_type: "result-updated", run_id: runId });
       if (!confirmed) {
         console.log("Task aborted by user.");
+        appendRunMessage(taskDir, runId, { role: "user", time: Date.now(), content: "Aborted", type: "confirmation" });
         appendRunMessage(taskDir, runId, { role: "status", time: Date.now(), content: "", type: "aborted" });
         await publishTaskEvent(nc, config, taskDir, taskId, "aborted", taskName, runId);
         await cleanup();
         return;
       }
       console.log("Task confirmed by user.");
+      appendRunMessage(taskDir, runId, { role: "user", time: Date.now(), content: "Confirmed", type: "confirmation" });
       appendRunMessage(taskDir, runId, { role: "status", time: Date.now(), content: "", type: "confirmation" });
       await publishHostEvent(nc, config.hostId, taskId, { event_type: "result-updated", run_id: runId });
     }
@@ -499,6 +514,8 @@ async function requestConfirmation(
  * Extract report file names from agent output.
  * Looks for lines matching: [PALMIER_REPORT] <filename>
  */
+const ALLOWED_REPORT_EXT = [".md", ".txt", ".png", ".jpg", ".jpeg", ".gif", ".svg", ".webp"];
 export function parseReportFiles(output: string): string[] {
   const regex = new RegExp(`^\\${TASK_REPORT_PREFIX}\\s+(.+)$`, "gm");
   const files: string[] = [];
@@ -506,7 +523,10 @@ export function parseReportFiles(output: string): string[] {
   while ((match = regex.exec(output)) !== null) {
     const name = match[1].trim();
     // Skip placeholder examples echoed from the prompt (e.g. "<filename>")
-    if (name && !name.startsWith("<")) files.push(name);
+    if (!name || name.startsWith("<")) continue;
+    const ext = name.lastIndexOf(".") >= 0 ? name.slice(name.lastIndexOf(".")).toLowerCase() : "";
+    if (!ALLOWED_REPORT_EXT.includes(ext)) continue;
+    files.push(name);
   }
   return files;
 }

package/src/rpc-handler.ts CHANGED Viewed

@@ -47,10 +47,12 @@ function parseResultFrontmatter(raw: string): Record<string, unknown> {
   const terminalStates = ["finished", "failed", "aborted"];
   const terminalMsg = [...statusMessages].reverse().find((m: ConversationMessage) => terminalStates.includes(m.type ?? ""));
-  // If last status is "started", determine if it's a task run or follow-up
+  // If last status is "started" (or continuation like "confirmation"/"monitoring"),
+  // determine if it's a task run or follow-up
+  const activeStates = ["started", "monitoring", "confirmation"];
   let runningState: string | undefined;
-  if (lastStatus?.type === "started" || lastStatus?.type === "monitoring") {
-    runningState = terminalMsg ? "followup" : (lastStatus?.type ?? "started");
+  if (activeStates.includes(lastStatus?.type ?? "")) {
+    runningState = terminalMsg ? "followup" : "started";
   } else {
     runningState = lastStatus?.type;
   }
@@ -182,6 +184,17 @@ export function createRpcHandler(config: HostConfig, nc?: NatsConnection) {
         };
       }
+      case "task.get": {
+        const params = request.params as { id: string };
+        const taskDir = getTaskDir(config.projectRoot, params.id);
+        try {
+          const task = parseTaskFile(taskDir);
+          return flattenTask(task);
+        } catch {
+          return { error: "Task not found" };
+        }
+      }
       case "task.create": {
         const params = request.params as {
           user_prompt: string;
@@ -577,11 +590,14 @@ export function createRpcHandler(config: HostConfig, nc?: NatsConnection) {
         if (!params.run_id || !Array.isArray(params.report_files) || params.report_files.length === 0) {
           return { error: "run_id and report_files are required" };
         }
-        const reports: Array<{ file: string; content?: string; error?: string }> = [];
+        const ALLOWED_EXT = [".md", ".txt", ".png", ".jpg", ".jpeg", ".gif", ".svg", ".webp"];
+        const IMAGE_EXT = [".png", ".jpg", ".jpeg", ".gif", ".svg", ".webp"];
+        const reports: Array<{ file: string; content?: string; data_url?: string; error?: string }> = [];
         const runDir = path.join(config.projectRoot, "tasks", params.id, params.run_id);
         for (const file of params.report_files) {
-          if (!file.endsWith(".md") && !file.endsWith(".txt")) {
-            reports.push({ file, error: "must end with .md or .txt" });
+          const ext = path.extname(file).toLowerCase();
+          if (!ALLOWED_EXT.includes(ext)) {
+            reports.push({ file, error: `unsupported file type: ${ext}` });
             continue;
           }
           const basename = path.basename(file);
@@ -591,8 +607,14 @@ export function createRpcHandler(config: HostConfig, nc?: NatsConnection) {
           }
           const reportPath = path.join(runDir, basename);
           try {
-            const content = fs.readFileSync(reportPath, "utf-8");
-            reports.push({ file, content });
+            if (IMAGE_EXT.includes(ext)) {
+              const buf = fs.readFileSync(reportPath);
+              const mime = ext === ".svg" ? "image/svg+xml" : `image/${ext.slice(1).replace("jpg", "jpeg")}`;
+              reports.push({ file, data_url: `data:${mime};base64,${buf.toString("base64")}` });
+            } else {
+              const content = fs.readFileSync(reportPath, "utf-8");
+              reports.push({ file, content });
+            }
           } catch {
             reports.push({ file, error: "Report file not found" });
           }

package/src/spawn-command.ts CHANGED Viewed

@@ -110,7 +110,6 @@ export function spawnCommand(
       if (opts.onData) opts.onData(d.toString("utf-8"));
     });
     child.stderr!.on("data", (d: Buffer) => {
-      chunks.push(d);
       process.stderr.write(d);
       if (opts.onData) opts.onData(d.toString("utf-8"));
     });

package/test/taskrun-messages.test.ts ADDED Viewed

@@ -0,0 +1,224 @@
+import { describe, it, beforeEach } from "node:test";
+import assert from "node:assert/strict";
+import * as fs from "fs";
+import * as os from "os";
+import * as path from "path";
+import {
+  createRunDir,
+  appendRunMessage,
+  readRunMessages,
+  beginStreamingMessage,
+  spliceUserMessage,
+} from "../src/task.js";
+let taskDir: string;
+let runId: string;
+function setup() {
+  taskDir = fs.mkdtempSync(path.join(os.tmpdir(), "palmier-test-"));
+  runId = createRunDir(taskDir, "Test Task", 1000, "claude");
+}
+describe("appendRunMessage + readRunMessages", () => {
+  beforeEach(setup);
+  it("writes and reads a user message", () => {
+    appendRunMessage(taskDir, runId, { role: "user", time: 1001, content: "Hello" });
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs.length, 1);
+    assert.equal(msgs[0].role, "user");
+    assert.equal(msgs[0].content, "Hello");
+    assert.equal(msgs[0].time, 1001);
+  });
+  it("writes and reads an assistant message", () => {
+    appendRunMessage(taskDir, runId, { role: "assistant", time: 1002, content: "Hi there" });
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs.length, 1);
+    assert.equal(msgs[0].role, "assistant");
+    assert.equal(msgs[0].content, "Hi there");
+  });
+  it("writes and reads a status message", () => {
+    appendRunMessage(taskDir, runId, { role: "status", time: 1003, content: "", type: "started" });
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs.length, 1);
+    assert.equal(msgs[0].role, "status");
+    assert.equal(msgs[0].type, "started");
+  });
+  it("preserves message type", () => {
+    appendRunMessage(taskDir, runId, { role: "user", time: 1004, content: "Confirmed", type: "confirmation" });
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs[0].type, "confirmation");
+  });
+  it("preserves attachments", () => {
+    appendRunMessage(taskDir, runId, { role: "assistant", time: 1005, content: "Done", attachments: ["report.md", "chart.png"] });
+    const msgs = readRunMessages(taskDir, runId);
+    assert.deepEqual(msgs[0].attachments, ["report.md", "chart.png"]);
+  });
+  it("reads multiple messages in order", () => {
+    appendRunMessage(taskDir, runId, { role: "status", time: 1000, content: "", type: "started" });
+    appendRunMessage(taskDir, runId, { role: "user", time: 1001, content: "Do something" });
+    appendRunMessage(taskDir, runId, { role: "assistant", time: 1002, content: "Done" });
+    appendRunMessage(taskDir, runId, { role: "status", time: 1003, content: "", type: "finished" });
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs.length, 4);
+    assert.equal(msgs[0].type, "started");
+    assert.equal(msgs[1].role, "user");
+    assert.equal(msgs[2].role, "assistant");
+    assert.equal(msgs[3].type, "finished");
+  });
+});
+describe("confirmation flow", () => {
+  beforeEach(setup);
+  it("records confirmation with assistant prompt, user response, and status", () => {
+    appendRunMessage(taskDir, runId, { role: "status", time: 1000, content: "", type: "started" });
+    appendRunMessage(taskDir, runId, { role: "assistant", time: 1001, content: '**Task Confirmation**\n\nRun task "My Task"?', type: "confirmation" });
+    appendRunMessage(taskDir, runId, { role: "user", time: 1002, content: "Confirmed", type: "confirmation" });
+    appendRunMessage(taskDir, runId, { role: "status", time: 1003, content: "", type: "confirmation" });
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs.length, 4);
+    assert.equal(msgs[1].role, "assistant");
+    assert.ok(msgs[1].content.includes("Task Confirmation"));
+    assert.equal(msgs[2].role, "user");
+    assert.equal(msgs[2].content, "Confirmed");
+    assert.equal(msgs[3].role, "status");
+    assert.equal(msgs[3].type, "confirmation");
+  });
+  it("records aborted confirmation", () => {
+    appendRunMessage(taskDir, runId, { role: "status", time: 1000, content: "", type: "started" });
+    appendRunMessage(taskDir, runId, { role: "assistant", time: 1001, content: '**Task Confirmation**\n\nRun task "My Task"?', type: "confirmation" });
+    appendRunMessage(taskDir, runId, { role: "user", time: 1002, content: "Aborted", type: "confirmation" });
+    appendRunMessage(taskDir, runId, { role: "status", time: 1003, content: "", type: "aborted" });
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs.length, 4);
+    assert.equal(msgs[2].content, "Aborted");
+    assert.equal(msgs[3].type, "aborted");
+  });
+});
+describe("beginStreamingMessage", () => {
+  beforeEach(setup);
+  it("streams chunks and finalizes", () => {
+    const writer = beginStreamingMessage(taskDir, runId, 2000);
+    writer.write("Hello ");
+    writer.write("world");
+    writer.end();
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs.length, 1);
+    assert.equal(msgs[0].role, "assistant");
+    assert.equal(msgs[0].content, "Hello world");
+  });
+  it("attaches report files to the last assistant message", () => {
+    const writer = beginStreamingMessage(taskDir, runId, 2000);
+    writer.write("Generated report.");
+    writer.end(["report.md", "chart.png"]);
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs.length, 1);
+    assert.deepEqual(msgs[0].attachments, ["report.md", "chart.png"]);
+  });
+});
+describe("spliceUserMessage", () => {
+  beforeEach(setup);
+  it("splits assistant stream for user input", () => {
+    const writer = beginStreamingMessage(taskDir, runId, 2000);
+    writer.write("Working on it...");
+    spliceUserMessage(taskDir, runId, { role: "user", time: 2001, content: "my-api-key", type: "input" });
+    writer.write("Continuing with key.");
+    writer.end();
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs.length, 3);
+    assert.equal(msgs[0].role, "assistant");
+    assert.equal(msgs[0].content, "Working on it...");
+    assert.equal(msgs[1].role, "user");
+    assert.equal(msgs[1].content, "my-api-key");
+    assert.equal(msgs[1].type, "input");
+    assert.equal(msgs[2].role, "assistant");
+    assert.equal(msgs[2].content, "Continuing with key.");
+  });
+  it("appends assistant text before splicing", () => {
+    const writer = beginStreamingMessage(taskDir, runId, 2000);
+    writer.write("Processing");
+    spliceUserMessage(
+      taskDir, runId,
+      { role: "user", time: 2001, content: "answer1", type: "input" },
+      "\n\n**What is your key?**",
+    );
+    writer.write("Done.");
+    writer.end();
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs.length, 3);
+    assert.ok(msgs[0].content.includes("What is your key?"));
+    assert.equal(msgs[1].content, "answer1");
+    assert.equal(msgs[2].content, "Done.");
+  });
+  it("attaches reports to last assistant message after splice", () => {
+    const writer = beginStreamingMessage(taskDir, runId, 2000);
+    writer.write("Part 1");
+    spliceUserMessage(taskDir, runId, { role: "user", time: 2001, content: "input", type: "input" });
+    writer.write("Part 2");
+    writer.end(["report.md"]);
+    const msgs = readRunMessages(taskDir, runId);
+    // Attachments should be on the last assistant message (after splice), not the first
+    assert.equal(msgs[0].attachments, undefined);
+    assert.deepEqual(msgs[2].attachments, ["report.md"]);
+  });
+});
+describe("permission flow", () => {
+  beforeEach(setup);
+  it("records permission grant as user message", () => {
+    appendRunMessage(taskDir, runId, { role: "status", time: 1000, content: "", type: "started" });
+    appendRunMessage(taskDir, runId, { role: "user", time: 1001, content: "Do something" });
+    // Simulate agent output with permission request (via streaming)
+    const writer = beginStreamingMessage(taskDir, runId, 1002);
+    writer.write("I need permission.\n\n**Permissions requested:**\n- **Read** Read files\n");
+    writer.end();
+    // Permission granted
+    appendRunMessage(taskDir, runId, { role: "user", time: 1003, content: "Granted", type: "permission" });
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs.length, 4);
+    assert.equal(msgs[3].role, "user");
+    assert.equal(msgs[3].content, "Granted");
+    assert.equal(msgs[3].type, "permission");
+  });
+  it("records permission denial", () => {
+    appendRunMessage(taskDir, runId, { role: "user", time: 1001, content: "Do something" });
+    const writer = beginStreamingMessage(taskDir, runId, 1002);
+    writer.write("Need permission.");
+    writer.end();
+    appendRunMessage(taskDir, runId, { role: "user", time: 1003, content: "Denied", type: "permission" });
+    const msgs = readRunMessages(taskDir, runId);
+    assert.equal(msgs[2].content, "Denied");
+    assert.equal(msgs[2].type, "permission");
+  });
+});