npm - alvin-bot - Versions diffs - 4.18.0 → 4.18.2 - Mend

alvin-bot 4.18.0 → 4.18.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (74) hide show

package/AEC-PLUGINS-SOURCES.md +53 -0
package/CHANGELOG.md +37 -2
package/DESIGN-SKILLS-SOURCES.md +81 -0
package/bin/cli.js +1 -1
package/dist/providers/claude-sdk-provider.js +24 -0
package/package.json +3 -1
package/test/allowed-users-gate.test.ts +0 -98
package/test/alvin-dispatch.test.ts +0 -220
package/test/async-agent-chunk-flow.test.ts +0 -244
package/test/async-agent-parser-staleness.test.ts +0 -412
package/test/async-agent-parser-streamjson.test.ts +0 -273
package/test/async-agent-parser.test.ts +0 -322
package/test/async-agent-watcher.test.ts +0 -229
package/test/background-bypass-integration.test.ts +0 -443
package/test/background-bypass-stress.test.ts +0 -417
package/test/background-bypass.test.ts +0 -127
package/test/browser-webfetch.test.ts +0 -121
package/test/claude-sdk-provider.test.ts +0 -115
package/test/claude-sdk-tool-use-id.test.ts +0 -180
package/test/console-timestamps.test.ts +0 -98
package/test/cron-progress-ticker.test.ts +0 -76
package/test/cron-restart-resilience.test.ts +0 -191
package/test/cron-run-resolver.test.ts +0 -133
package/test/cron-runjobnow-throw.test.ts +0 -100
package/test/debounce.test.ts +0 -60
package/test/delivery-registry.test.ts +0 -71
package/test/exec-guard-metachars.test.ts +0 -110
package/test/file-permissions.test.ts +0 -130
package/test/i18n.test.ts +0 -108
package/test/list-subagents-merged.test.ts +0 -172
package/test/memory-extractor.test.ts +0 -151
package/test/memory-layers.test.ts +0 -169
package/test/memory-sdk-injection.test.ts +0 -146
package/test/memory-stress-restart.test.ts +0 -337
package/test/multi-session-stress.test.ts +0 -255
package/test/platform-session-key.test.ts +0 -69
package/test/process-manager.test.ts +0 -186
package/test/registry.test.ts +0 -201
package/test/session-pending-background.test.ts +0 -59
package/test/session-persistence.test.ts +0 -195
package/test/slack-progress-ticker.test.ts +0 -123
package/test/slack-slash-command.test.ts +0 -61
package/test/slack-test-connection.test.ts +0 -176
package/test/stress-scenarios.test.ts +0 -356
package/test/stuck-timer.test.ts +0 -116
package/test/subagent-delivery-markdown-fallback.test.ts +0 -147
package/test/subagent-delivery-platform-routing.test.ts +0 -232
package/test/subagent-delivery.test.ts +0 -273
package/test/subagent-final-text.test.ts +0 -132
package/test/subagent-stats.test.ts +0 -119
package/test/subagent-toolset-allowlist.test.ts +0 -146
package/test/subagents-commands.test.ts +0 -64
package/test/subagents-config.test.ts +0 -114
package/test/subagents-depth.test.ts +0 -58
package/test/subagents-inheritance.test.ts +0 -67
package/test/subagents-name-resolver.test.ts +0 -122
package/test/subagents-priority-reject.test.ts +0 -88
package/test/subagents-queue.test.ts +0 -127
package/test/subagents-shutdown.test.ts +0 -126
package/test/subagents-toolset.test.ts +0 -71
package/test/sync-task-timeout.test.ts +0 -153
package/test/system-prompt-background-hint.test.ts +0 -65
package/test/telegram-error-filter.test.ts +0 -85
package/test/telegram-workspace-command.test.ts +0 -78
package/test/timing-safe-bearer.test.ts +0 -65
package/test/watchdog-brake.test.ts +0 -157
package/test/watcher-pending-count.test.ts +0 -228
package/test/watcher-zombie-fix.test.ts +0 -252
package/test/web-server-integration.test.ts +0 -189
package/test/web-server-resilience.test.ts +0 -118
package/test/web-server-shutdown.test.ts +0 -117
package/test/whatsapp-auth-resilience.test.ts +0 -96
package/test/workspaces.test.ts +0 -196
package/vitest.config.ts +0 -17

package/test/async-agent-chunk-flow.test.ts DELETED Viewed

@@ -1,244 +0,0 @@
-/**
- * Fix #17 (Stage 2) — when the SDK yields a tool_result chunk with an
- * "Async agent launched successfully" payload, the message handler
- * must register the pending agent with the watcher.
- *
- * This tests the helper `handleToolResultChunk` in isolation —
- * the integration with message.ts is covered by the live e2e test.
- */
-import { describe, it, expect, beforeEach, vi } from "vitest";
-describe("async agent chunk flow (Stage 2)", () => {
-  beforeEach(() => vi.resetModules());
-  it("tool_result with async_launched gets registered with the watcher", async () => {
-    const registered: unknown[] = [];
-    vi.doMock("../src/services/async-agent-watcher.js", () => ({
-      registerPendingAgent: (input: unknown) => registered.push(input),
-      startWatcher: () => {},
-      stopWatcher: () => {},
-      pollOnce: async () => {},
-      listPendingAgents: () => [],
-    }));
-    const { handleToolResultChunk } = await import(
-      "../src/handlers/async-agent-chunk-handler.js"
-    );
-    const chunk = {
-      type: "tool_result" as const,
-      toolUseId: "toolu_1",
-      toolResultContent:
-        "Async agent launched successfully.\n" +
-        "agentId: abc-1 (something)\n" +
-        "output_file: /tmp/out-abc-1.jsonl\n" +
-        "If asked, you can check progress.",
-    };
-    handleToolResultChunk(chunk, {
-      chatId: 42,
-      userId: 99,
-      lastToolUseInput: {
-        description: "SEO audit",
-        prompt: "audit example.com",
-      },
-    });
-    expect(registered).toHaveLength(1);
-    const r = registered[0] as { agentId: string; description: string; outputFile: string };
-    expect(r.agentId).toBe("abc-1");
-    expect(r.description).toBe("SEO audit");
-    expect(r.outputFile).toBe("/tmp/out-abc-1.jsonl");
-  });
-  it("v4.12.3 — passes sessionKey to registerPendingAgent and increments session counter", async () => {
-    const registered: Array<{ sessionKey?: string }> = [];
-    vi.doMock("../src/services/async-agent-watcher.js", () => ({
-      registerPendingAgent: (input: { sessionKey?: string }) =>
-        registered.push(input),
-      startWatcher: () => {},
-      stopWatcher: () => {},
-      pollOnce: async () => {},
-      listPendingAgents: () => [],
-    }));
-    const { getSession } = await import("../src/services/session.js");
-    const session = getSession("v412-chunk-test-session");
-    session.pendingBackgroundCount = 0;
-    const { handleToolResultChunk } = await import(
-      "../src/handlers/async-agent-chunk-handler.js"
-    );
-    handleToolResultChunk(
-      {
-        type: "tool_result",
-        toolUseId: "toolu_sess",
-        toolResultContent:
-          "Async agent launched successfully.\n" +
-          "agentId: ag-sess\n" +
-          "output_file: /tmp/ag-sess.jsonl\n",
-      },
-      {
-        chatId: 10,
-        userId: 20,
-        sessionKey: "v412-chunk-test-session",
-        lastToolUseInput: { description: "SEO", prompt: "do it" },
-      },
-    );
-    expect(registered).toHaveLength(1);
-    expect(registered[0].sessionKey).toBe("v412-chunk-test-session");
-    expect(session.pendingBackgroundCount).toBe(1);
-  });
-  it("v4.12.3 — multiple async launches in same turn stack the counter", async () => {
-    vi.doMock("../src/services/async-agent-watcher.js", () => ({
-      registerPendingAgent: () => {},
-      startWatcher: () => {},
-      stopWatcher: () => {},
-      pollOnce: async () => {},
-      listPendingAgents: () => [],
-    }));
-    const { getSession } = await import("../src/services/session.js");
-    const session = getSession("v412-chunk-stack");
-    session.pendingBackgroundCount = 0;
-    const { handleToolResultChunk } = await import(
-      "../src/handlers/async-agent-chunk-handler.js"
-    );
-    for (let i = 0; i < 3; i++) {
-      handleToolResultChunk(
-        {
-          type: "tool_result",
-          toolUseId: `toolu_${i}`,
-          toolResultContent:
-            `Async agent launched successfully.\n` +
-            `agentId: ag-${i}\n` +
-            `output_file: /tmp/ag-${i}.jsonl\n`,
-        },
-        {
-          chatId: 10,
-          userId: 20,
-          sessionKey: "v412-chunk-stack",
-          lastToolUseInput: { description: `task ${i}`, prompt: "p" },
-        },
-      );
-    }
-    expect(session.pendingBackgroundCount).toBe(3);
-  });
-  it("v4.12.3 — non-async tool_result does not increment the counter", async () => {
-    vi.doMock("../src/services/async-agent-watcher.js", () => ({
-      registerPendingAgent: () => {
-        throw new Error("should not be called");
-      },
-      startWatcher: () => {},
-      stopWatcher: () => {},
-      pollOnce: async () => {},
-      listPendingAgents: () => [],
-    }));
-    const { getSession } = await import("../src/services/session.js");
-    const session = getSession("v412-chunk-nonasync");
-    session.pendingBackgroundCount = 0;
-    const { handleToolResultChunk } = await import(
-      "../src/handlers/async-agent-chunk-handler.js"
-    );
-    handleToolResultChunk(
-      {
-        type: "tool_result",
-        toolUseId: "toolu_read",
-        toolResultContent: "plain read result — no async_launched marker",
-      },
-      {
-        chatId: 1,
-        userId: 1,
-        sessionKey: "v412-chunk-nonasync",
-        lastToolUseInput: { description: "read", prompt: "p" },
-      },
-    );
-    expect(session.pendingBackgroundCount).toBe(0);
-  });
-  it("falls back to a generic description when no toolUseInput is provided", async () => {
-    const registered: unknown[] = [];
-    vi.doMock("../src/services/async-agent-watcher.js", () => ({
-      registerPendingAgent: (input: unknown) => registered.push(input),
-      startWatcher: () => {},
-      stopWatcher: () => {},
-      pollOnce: async () => {},
-      listPendingAgents: () => [],
-    }));
-    const { handleToolResultChunk } = await import(
-      "../src/handlers/async-agent-chunk-handler.js"
-    );
-    handleToolResultChunk(
-      {
-        type: "tool_result",
-        toolUseId: "toolu_2",
-        toolResultContent:
-          "Async agent launched successfully.\n" +
-          "agentId: x\n" +
-          "output_file: /tmp/o\n",
-      },
-      { chatId: 42, userId: 99 },
-    );
-    expect(registered).toHaveLength(1);
-    const r = registered[0] as { description: string };
-    expect(r.description.length).toBeGreaterThan(0);
-  });
-  it("non-async tool_result (e.g. Read) is ignored", async () => {
-    const registered: unknown[] = [];
-    vi.doMock("../src/services/async-agent-watcher.js", () => ({
-      registerPendingAgent: (input: unknown) => registered.push(input),
-      startWatcher: () => {},
-      stopWatcher: () => {},
-      pollOnce: async () => {},
-      listPendingAgents: () => [],
-    }));
-    const { handleToolResultChunk } = await import(
-      "../src/handlers/async-agent-chunk-handler.js"
-    );
-    handleToolResultChunk(
-      {
-        type: "tool_result",
-        toolUseId: "toolu_3",
-        toolResultContent: "file contents here (plain Read result)",
-      },
-      { chatId: 42, userId: 99 },
-    );
-    expect(registered).toHaveLength(0);
-  });
-  it("non-tool_result chunks are ignored without throwing", async () => {
-    vi.doMock("../src/services/async-agent-watcher.js", () => ({
-      registerPendingAgent: () => {
-        throw new Error("should not be called");
-      },
-      startWatcher: () => {},
-      stopWatcher: () => {},
-      pollOnce: async () => {},
-      listPendingAgents: () => [],
-    }));
-    const { handleToolResultChunk } = await import(
-      "../src/handlers/async-agent-chunk-handler.js"
-    );
-    expect(() =>
-      handleToolResultChunk(
-        { type: "text", text: "hi" },
-        { chatId: 42, userId: 99 },
-      ),
-    ).not.toThrow();
-  });
-});

package/test/async-agent-parser-staleness.test.ts DELETED Viewed

@@ -1,412 +0,0 @@
-/**
- * v4.12.4 — parseOutputFileStatus staleness detection.
- *
- * Problem this fixes: when a background sub-agent is interrupted (e.g. by
- * v4.12.3's bypass-abort propagating through the SDK subprocess), its
- * outputFile is left with partial JSONL — real work, real text — but
- * without the `stop_reason: "end_turn"` marker the pre-v4.12.4 parser
- * required for "completed" state.
- *
- * Real-world evidence (2026-04-16):
- *   - Three agents (a03ce829, af61fa6e, ac47c4a2) pending in state file
- *   - Each outputFile has 81-131 lines of REAL work (WebSearch, tool_use,
- *     partial reports like "Here's the summary:\n\n## Critical Bugs")
- *   - Last event is either "[Request interrupted by user for tool use]"
- *     or a mid-streaming assistant text that never got end_turn
- *   - Watcher polls forever, hits 12h giveUpAt, delivers "empty output"
- *   - User sees useless "720m timeout · 0 in / 0 out · (empty output)"
- *     messages hours later, while the actual work is sitting on disk
- *
- * Fix behavior:
- *   - If no end_turn is found, check mtime/size of the file
- *   - If file hasn't been touched for `stalenessMs` (default 5 min) AND
- *     there's usable text content in the tail, mark as "completed"
- *     with the partial output PREFIXED by an "⚠️ interrupted, partial
- *     output" header so the user knows it's not a clean finish
- *   - If file IS fresh or has no text content, stay in "running" state
- *     (normal polling continues)
- *
- * This deliberately biases toward delivering SOMETHING rather than
- * nothing. Worst case: an agent that's still alive but genuinely idle
- * for >5 min gets its partial text delivered early. Best case: dozens
- * of stuck interrupted agents get their real work back to the user.
- */
-import { describe, it, expect, beforeEach, afterEach } from "vitest";
-import fs from "fs";
-import os from "os";
-import { resolve } from "path";
-import { parseOutputFileStatus } from "../src/services/async-agent-parser.js";
-const TMP_BASE = resolve(os.tmpdir(), `alvin-parser-stale-${process.pid}`);
-beforeEach(() => {
-  fs.mkdirSync(TMP_BASE, { recursive: true });
-});
-afterEach(() => {
-  try {
-    fs.rmSync(TMP_BASE, { recursive: true, force: true });
-  } catch {
-    /* ignore */
-  }
-});
-/**
- * Write a JSONL file with a mid-execution interrupted state. No end_turn,
- * but contains real assistant text + tool calls. Last line is the
- * "Request interrupted" marker.
- */
-function writeInterruptedJsonl(name: string): string {
-  const path = resolve(TMP_BASE, name);
-  const lines = [
-    JSON.stringify({
-      type: "user",
-      isSidechain: true,
-      agentId: "x",
-      message: { role: "user", content: "do a report" },
-    }),
-    JSON.stringify({
-      type: "assistant",
-      isSidechain: true,
-      agentId: "x",
-      message: {
-        role: "assistant",
-        content: [{ type: "text", text: "Starting research..." }],
-        stop_reason: "tool_use",
-      },
-    }),
-    JSON.stringify({
-      type: "assistant",
-      isSidechain: true,
-      agentId: "x",
-      message: {
-        role: "assistant",
-        content: [
-          {
-            type: "text",
-            text:
-              "Here's what I found:\n\n## Key Findings\n- Finding A\n- Finding B\n- Finding C",
-          },
-        ],
-        stop_reason: "tool_use",
-      },
-    }),
-    JSON.stringify({
-      type: "user",
-      isSidechain: true,
-      agentId: "x",
-      message: {
-        role: "user",
-        content: [
-          {
-            type: "tool_result",
-            content: "[Request interrupted by user for tool use]",
-          },
-        ],
-      },
-    }),
-  ];
-  fs.writeFileSync(path, lines.join("\n") + "\n", "utf-8");
-  return path;
-}
-/** Set file mtime to N ms in the past. */
-function setStale(path: string, ageMs: number): void {
-  const target = Date.now() - ageMs;
-  fs.utimesSync(path, target / 1000, target / 1000);
-}
-describe("parseOutputFileStatus — staleness detection (v4.12.4)", () => {
-  it("still returns 'completed' when end_turn is present (staleness is a fallback only)", async () => {
-    const path = resolve(TMP_BASE, "complete.jsonl");
-    fs.writeFileSync(
-      path,
-      JSON.stringify({
-        type: "assistant",
-        agentId: "x",
-        message: {
-          content: [{ type: "text", text: "clean end" }],
-          stop_reason: "end_turn",
-        },
-      }) + "\n",
-      "utf-8",
-    );
-    setStale(path, 3600_000); // 1h old
-    const status = await parseOutputFileStatus(path, {
-      stalenessMs: 300_000,
-    });
-    expect(status.state).toBe("completed");
-    if (status.state === "completed") {
-      expect(status.output).toContain("clean end");
-      // No interrupted banner for clean end_turn
-      expect(status.output).not.toMatch(/interrupt/i);
-    }
-  });
-  it("returns 'running' when file is fresh and no end_turn (normal polling)", async () => {
-    const path = writeInterruptedJsonl("fresh-interrupted.jsonl");
-    // File is fresh (just written)
-    const status = await parseOutputFileStatus(path, {
-      stalenessMs: 300_000,
-    });
-    expect(status.state).toBe("running");
-  });
-  it("returns 'completed' (partial) when file is stale AND has text content", async () => {
-    const path = writeInterruptedJsonl("stale-interrupted.jsonl");
-    setStale(path, 600_000); // 10 min old
-    const status = await parseOutputFileStatus(path, {
-      stalenessMs: 300_000, // 5 min threshold
-    });
-    expect(status.state).toBe("completed");
-    if (status.state === "completed") {
-      // Should contain the real report content
-      expect(status.output).toContain("Key Findings");
-      expect(status.output).toContain("Finding A");
-      // Should be prefixed with an interrupted banner so user knows
-      // (German "unterbrochen" / "partielle" OR English "interrupted"/"partial")
-      expect(status.output).toMatch(/interrupt|partial|unterbroch|partiell|⚠️/i);
-    }
-  });
-  it("returns 'running' when file is stale but has NO text content (nothing to deliver)", async () => {
-    // Only tool-use events, no text. Delivery would be useless.
-    const path = resolve(TMP_BASE, "no-text.jsonl");
-    fs.writeFileSync(
-      path,
-      [
-        JSON.stringify({
-          type: "user",
-          agentId: "x",
-          message: { role: "user", content: "go" },
-        }),
-        JSON.stringify({
-          type: "assistant",
-          agentId: "x",
-          message: {
-            content: [
-              { type: "tool_use", name: "Bash", input: { command: "ls" } },
-            ],
-            stop_reason: "tool_use",
-          },
-        }),
-      ].join("\n") + "\n",
-      "utf-8",
-    );
-    setStale(path, 600_000);
-    const status = await parseOutputFileStatus(path, {
-      stalenessMs: 300_000,
-    });
-    expect(status.state).toBe("running");
-  });
-  it("default stalenessMs is applied when not provided (no crashes on legacy callers)", async () => {
-    const path = writeInterruptedJsonl("default-cfg.jsonl");
-    setStale(path, 24 * 3600_000); // 24h old — very stale
-    const status = await parseOutputFileStatus(path);
-    // Whatever the default is, 24h should definitely exceed it
-    expect(status.state).toBe("completed");
-  });
-  it("stalenessMs: 0 disables the staleness fallback entirely", async () => {
-    const path = writeInterruptedJsonl("disabled.jsonl");
-    setStale(path, 24 * 3600_000);
-    const status = await parseOutputFileStatus(path, { stalenessMs: 0 });
-    // With staleness disabled, we're back to strict end_turn requirement
-    expect(status.state).toBe("running");
-  });
-  it("aggregates ALL text blocks from ALL assistant turns when delivering partial", async () => {
-    const path = resolve(TMP_BASE, "multi-turn-interrupted.jsonl");
-    const lines = [
-      { type: "user", agentId: "x", message: { role: "user", content: "go" } },
-      {
-        type: "assistant",
-        agentId: "x",
-        message: {
-          content: [{ type: "text", text: "First thought." }],
-          stop_reason: "tool_use",
-        },
-      },
-      {
-        type: "assistant",
-        agentId: "x",
-        message: {
-          content: [{ type: "text", text: "Second thought." }],
-          stop_reason: "tool_use",
-        },
-      },
-      {
-        type: "assistant",
-        agentId: "x",
-        message: {
-          content: [{ type: "text", text: "Final partial report." }],
-          stop_reason: "tool_use",
-        },
-      },
-    ];
-    fs.writeFileSync(
-      path,
-      lines.map((l) => JSON.stringify(l)).join("\n") + "\n",
-      "utf-8",
-    );
-    setStale(path, 600_000);
-    const status = await parseOutputFileStatus(path, {
-      stalenessMs: 300_000,
-    });
-    expect(status.state).toBe("completed");
-    if (status.state === "completed") {
-      // Should contain text from all three turns (bias toward delivering more)
-      expect(status.output).toContain("First thought");
-      expect(status.output).toContain("Second thought");
-      expect(status.output).toContain("Final partial report");
-    }
-  });
-  it("ignores thinking blocks in partial delivery (user doesn't want Claude's scratchpad)", async () => {
-    const path = resolve(TMP_BASE, "thinking-filter.jsonl");
-    const lines = [
-      {
-        type: "assistant",
-        agentId: "x",
-        message: {
-          content: [
-            { type: "thinking", text: "internal reasoning nobody should see" },
-            { type: "text", text: "Actual output text." },
-          ],
-          stop_reason: "tool_use",
-        },
-      },
-    ];
-    fs.writeFileSync(
-      path,
-      lines.map((l) => JSON.stringify(l)).join("\n") + "\n",
-      "utf-8",
-    );
-    setStale(path, 600_000);
-    const status = await parseOutputFileStatus(path, {
-      stalenessMs: 300_000,
-    });
-    expect(status.state).toBe("completed");
-    if (status.state === "completed") {
-      expect(status.output).toContain("Actual output text");
-      expect(status.output).not.toContain("internal reasoning");
-    }
-  });
-  it("extracts usage tokens from the last assistant event when available", async () => {
-    const path = resolve(TMP_BASE, "tokens-partial.jsonl");
-    const lines = [
-      {
-        type: "assistant",
-        agentId: "x",
-        message: {
-          content: [{ type: "text", text: "partial text" }],
-          stop_reason: "tool_use",
-          usage: { input_tokens: 500, output_tokens: 200 },
-        },
-      },
-    ];
-    fs.writeFileSync(
-      path,
-      lines.map((l) => JSON.stringify(l)).join("\n") + "\n",
-      "utf-8",
-    );
-    setStale(path, 600_000);
-    const status = await parseOutputFileStatus(path, {
-      stalenessMs: 300_000,
-    });
-    expect(status.state).toBe("completed");
-    if (status.state === "completed") {
-      expect(status.tokensUsed).toEqual({ input: 500, output: 200 });
-    }
-  });
-  it("handles file that only has the interruption marker (nothing useful to deliver)", async () => {
-    // Edge case: only interruption, no prior text
-    const path = resolve(TMP_BASE, "only-interrupt.jsonl");
-    const lines = [
-      {
-        type: "user",
-        agentId: "x",
-        message: {
-          role: "user",
-          content: [
-            {
-              type: "tool_result",
-              content: "[Request interrupted by user for tool use]",
-            },
-          ],
-        },
-      },
-    ];
-    fs.writeFileSync(
-      path,
-      lines.map((l) => JSON.stringify(l)).join("\n") + "\n",
-      "utf-8",
-    );
-    setStale(path, 600_000);
-    const status = await parseOutputFileStatus(path, {
-      stalenessMs: 300_000,
-    });
-    // No assistant text content at all → still running (nothing useful)
-    expect(status.state).toBe("running");
-  });
-  it("preserves ordering of text across turns (earlier text first, later text last)", async () => {
-    const path = resolve(TMP_BASE, "order.jsonl");
-    const lines = [
-      {
-        type: "assistant",
-        agentId: "x",
-        message: {
-          content: [{ type: "text", text: "ALPHA" }],
-          stop_reason: "tool_use",
-        },
-      },
-      {
-        type: "user",
-        agentId: "x",
-        message: { content: [{ type: "tool_result", content: "..." }] },
-      },
-      {
-        type: "assistant",
-        agentId: "x",
-        message: {
-          content: [{ type: "text", text: "BETA" }],
-          stop_reason: "tool_use",
-        },
-      },
-      {
-        type: "user",
-        agentId: "x",
-        message: { content: [{ type: "tool_result", content: "..." }] },
-      },
-      {
-        type: "assistant",
-        agentId: "x",
-        message: {
-          content: [{ type: "text", text: "GAMMA" }],
-          stop_reason: "tool_use",
-        },
-      },
-    ];
-    fs.writeFileSync(
-      path,
-      lines.map((l) => JSON.stringify(l)).join("\n") + "\n",
-      "utf-8",
-    );
-    setStale(path, 600_000);
-    const status = await parseOutputFileStatus(path, {
-      stalenessMs: 300_000,
-    });
-    expect(status.state).toBe("completed");
-    if (status.state === "completed") {
-      const alphaIdx = status.output.indexOf("ALPHA");
-      const betaIdx = status.output.indexOf("BETA");
-      const gammaIdx = status.output.indexOf("GAMMA");
-      expect(alphaIdx).toBeGreaterThan(-1);
-      expect(betaIdx).toBeGreaterThan(alphaIdx);
-      expect(gammaIdx).toBeGreaterThan(betaIdx);
-    }
-  });
-});