npm - zeitlich - Versions diffs - 0.2.21 → 0.2.23 - Mend

zeitlich 0.2.21 → 0.2.23

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (129)

package/README.md +303 -105
package/dist/adapters/sandbox/daytona/index.cjs +7 -1
package/dist/adapters/sandbox/daytona/index.cjs.map +1 -1
package/dist/adapters/sandbox/daytona/index.d.cts +3 -1
package/dist/adapters/sandbox/daytona/index.d.ts +3 -1
package/dist/adapters/sandbox/daytona/index.js +7 -1
package/dist/adapters/sandbox/daytona/index.js.map +1 -1
package/dist/adapters/sandbox/daytona/workflow.cjs +33 -0
package/dist/adapters/sandbox/daytona/workflow.cjs.map +1 -0
package/dist/adapters/sandbox/daytona/workflow.d.cts +27 -0
package/dist/adapters/sandbox/daytona/workflow.d.ts +27 -0
package/dist/adapters/sandbox/daytona/workflow.js +31 -0
package/dist/adapters/sandbox/daytona/workflow.js.map +1 -0
package/dist/adapters/sandbox/inmemory/index.cjs +18 -1
package/dist/adapters/sandbox/inmemory/index.cjs.map +1 -1
package/dist/adapters/sandbox/inmemory/index.d.cts +4 -2
package/dist/adapters/sandbox/inmemory/index.d.ts +4 -2
package/dist/adapters/sandbox/inmemory/index.js +18 -1
package/dist/adapters/sandbox/inmemory/index.js.map +1 -1
package/dist/adapters/sandbox/inmemory/workflow.cjs +33 -0
package/dist/adapters/sandbox/inmemory/workflow.cjs.map +1 -0
package/dist/adapters/sandbox/inmemory/workflow.d.cts +25 -0
package/dist/adapters/sandbox/inmemory/workflow.d.ts +25 -0
package/dist/adapters/sandbox/inmemory/workflow.js +31 -0
package/dist/adapters/sandbox/inmemory/workflow.js.map +1 -0
package/dist/adapters/sandbox/virtual/index.cjs +36 -9
package/dist/adapters/sandbox/virtual/index.cjs.map +1 -1
package/dist/adapters/sandbox/virtual/index.d.cts +8 -5
package/dist/adapters/sandbox/virtual/index.d.ts +8 -5
package/dist/adapters/sandbox/virtual/index.js +36 -9
package/dist/adapters/sandbox/virtual/index.js.map +1 -1
package/dist/adapters/sandbox/virtual/workflow.cjs +33 -0
package/dist/adapters/sandbox/virtual/workflow.cjs.map +1 -0
package/dist/adapters/sandbox/virtual/workflow.d.cts +27 -0
package/dist/adapters/sandbox/virtual/workflow.d.ts +27 -0
package/dist/adapters/sandbox/virtual/workflow.js +31 -0
package/dist/adapters/sandbox/virtual/workflow.js.map +1 -0
package/dist/adapters/thread/google-genai/index.cjs +9 -1
package/dist/adapters/thread/google-genai/index.cjs.map +1 -1
package/dist/adapters/thread/google-genai/index.d.cts +31 -19
package/dist/adapters/thread/google-genai/index.d.ts +31 -19
package/dist/adapters/thread/google-genai/index.js +9 -1
package/dist/adapters/thread/google-genai/index.js.map +1 -1
package/dist/adapters/thread/google-genai/workflow.cjs +33 -0
package/dist/adapters/thread/google-genai/workflow.cjs.map +1 -0
package/dist/adapters/thread/google-genai/workflow.d.cts +32 -0
package/dist/adapters/thread/google-genai/workflow.d.ts +32 -0
package/dist/adapters/thread/google-genai/workflow.js +31 -0
package/dist/adapters/thread/google-genai/workflow.js.map +1 -0
package/dist/adapters/thread/langchain/index.cjs +9 -1
package/dist/adapters/thread/langchain/index.cjs.map +1 -1
package/dist/adapters/thread/langchain/index.d.cts +27 -16
package/dist/adapters/thread/langchain/index.d.ts +27 -16
package/dist/adapters/thread/langchain/index.js +9 -1
package/dist/adapters/thread/langchain/index.js.map +1 -1
package/dist/adapters/thread/langchain/workflow.cjs +33 -0
package/dist/adapters/thread/langchain/workflow.cjs.map +1 -0
package/dist/adapters/thread/langchain/workflow.d.cts +32 -0
package/dist/adapters/thread/langchain/workflow.d.ts +32 -0
package/dist/adapters/thread/langchain/workflow.js +31 -0
package/dist/adapters/thread/langchain/workflow.js.map +1 -0
package/dist/index.cjs +282 -90
package/dist/index.cjs.map +1 -1
package/dist/index.d.cts +38 -16
package/dist/index.d.ts +38 -16
package/dist/index.js +281 -87
package/dist/index.js.map +1 -1
package/dist/queries-DModcWRy.d.cts +44 -0
package/dist/queries-byD0jr1Y.d.ts +44 -0
package/dist/{types-BkAYmc96.d.ts → types-B50pBPEV.d.ts} +190 -38
package/dist/{types-YbL7JpEA.d.cts → types-Bll19FZJ.d.cts} +7 -0
package/dist/{types-YbL7JpEA.d.ts → types-Bll19FZJ.d.ts} +7 -0
package/dist/{queries-6Avfh74U.d.ts → types-BuXdFhaZ.d.cts} +7 -48
package/dist/{types-BMRzfELQ.d.cts → types-ChAMwU3q.d.cts} +17 -1
package/dist/{types-BMRzfELQ.d.ts → types-ChAMwU3q.d.ts} +17 -1
package/dist/{types-CES_30qx.d.cts → types-DQW8l7pY.d.cts} +190 -38
package/dist/{queries-CHa2iv_I.d.cts → types-GZ76HZSj.d.ts} +7 -48
package/dist/workflow.cjs +244 -86
package/dist/workflow.cjs.map +1 -1
package/dist/workflow.d.cts +54 -65
package/dist/workflow.d.ts +54 -65
package/dist/workflow.js +243 -83
package/dist/workflow.js.map +1 -1
package/package.json +54 -2
package/src/adapters/sandbox/daytona/filesystem.ts +1 -1
package/src/adapters/sandbox/daytona/index.ts +8 -0
package/src/adapters/sandbox/daytona/proxy.ts +56 -0
package/src/adapters/sandbox/e2b/filesystem.ts +147 -0
package/src/adapters/sandbox/e2b/index.ts +164 -0
package/src/adapters/sandbox/e2b/types.ts +23 -0
package/src/adapters/sandbox/inmemory/index.ts +27 -3
package/src/adapters/sandbox/inmemory/proxy.ts +53 -0
package/src/adapters/sandbox/virtual/filesystem.ts +41 -17
package/src/adapters/sandbox/virtual/provider.ts +9 -1
package/src/adapters/sandbox/virtual/proxy.ts +53 -0
package/src/adapters/sandbox/virtual/types.ts +9 -4
package/src/adapters/thread/google-genai/activities.ts +51 -17
package/src/adapters/thread/google-genai/index.ts +1 -0
package/src/adapters/thread/google-genai/proxy.ts +61 -0
package/src/adapters/thread/langchain/activities.ts +47 -14
package/src/adapters/thread/langchain/index.ts +1 -0
package/src/adapters/thread/langchain/proxy.ts +61 -0
package/src/lib/lifecycle.ts +57 -0
package/src/lib/sandbox/manager.ts +52 -6
package/src/lib/sandbox/sandbox.test.ts +12 -11
package/src/lib/sandbox/types.ts +31 -4
package/src/lib/session/index.ts +4 -5
package/src/lib/session/session-edge-cases.integration.test.ts +491 -66
package/src/lib/session/session.integration.test.ts +92 -80
package/src/lib/session/session.ts +108 -96
package/src/lib/session/types.ts +87 -17
package/src/lib/subagent/define.ts +6 -5
package/src/lib/subagent/handler.ts +148 -16
package/src/lib/subagent/index.ts +4 -0
package/src/lib/subagent/register.ts +10 -3
package/src/lib/subagent/signals.ts +8 -0
package/src/lib/subagent/subagent.integration.test.ts +893 -128
package/src/lib/subagent/tool.ts +2 -2
package/src/lib/subagent/types.ts +84 -21
package/src/lib/subagent/workflow.ts +83 -12
package/src/lib/tool-router/router-edge-cases.integration.test.ts +4 -1
package/src/lib/tool-router/router.integration.test.ts +141 -5
package/src/lib/tool-router/router.ts +13 -3
package/src/lib/tool-router/types.ts +7 -0
package/src/lib/workflow.test.ts +104 -27
package/src/lib/workflow.ts +37 -19
package/src/tools/bash/bash.test.ts +16 -7
package/src/workflow.ts +11 -14
package/tsup.config.ts +6 -0

package/src/lib/session/session-edge-cases.integration.test.ts (changed)

@@ -34,7 +34,11 @@ vi.mock("@temporalio/workflow", () => {
     condition: async (fn: () => boolean) => fn(),
     defineUpdate: (name: string) => ({ __type: "update", name }),
     defineQuery: (name: string) => ({ __type: "query", name }),
+    defineSignal: (name: string) => ({ __type: "signal", name }),
     setHandler: (_def: unknown, _handler: unknown) => {},
+    startChild: async () => ({ result: () => Promise.resolve(null) }),
+    workflowInfo: () => ({ taskQueue: "default-queue" }),
+    getExternalWorkflowHandle: () => ({ signal: async () => {} }),
     uuid4: () =>
       `00000000-0000-0000-0000-${String(++idCounter).padStart(12, "0")}`,
     ApplicationFailure: MockApplicationFailure,
@@ -56,12 +60,11 @@ type TurnScript = {
  * Wraps every method on a ThreadOps object so it also has `.executeWithOptions()`,
  * matching Temporal's `ActivityInterfaceFor<ThreadOps>` shape.
  */
-function toActivityInterface(
-  raw: ThreadOps,
-): ActivityInterfaceFor<ThreadOps> {
+function toActivityInterface(raw: ThreadOps): ActivityInterfaceFor<ThreadOps> {
   const result = {} as Record<string, unknown>;
   for (const [key, fn] of Object.entries(raw)) {
-    const wrapped = (...args: unknown[]) => (fn as (...a: unknown[]) => unknown)(...args);
+    const wrapped = (...args: unknown[]) =>
+      (fn as (...a: unknown[]) => unknown)(...args);
     wrapped.executeWithOptions = (_opts: unknown, args: unknown[]) =>
       (fn as (...a: unknown[]) => unknown)(...args);
     result[key] = wrapped;
@@ -75,14 +78,14 @@ function createMockThreadOps() {
     initializeThread: async (threadId) => {
       log.push({ op: "initializeThread", args: [threadId] });
     },
-    appendHumanMessage: async (threadId, content) => {
-      log.push({ op: "appendHumanMessage", args: [threadId, content] });
+    appendHumanMessage: async (threadId, id, content) => {
+      log.push({ op: "appendHumanMessage", args: [threadId, id, content] });
     },
-    appendToolResult: async (config) => {
-      log.push({ op: "appendToolResult", args: [config] });
+    appendToolResult: async (id, config) => {
+      log.push({ op: "appendToolResult", args: [id, config] });
     },
-    appendSystemMessage: async (threadId, content) => {
-      log.push({ op: "appendSystemMessage", args: [threadId, content] });
+    appendSystemMessage: async (threadId, id, content) => {
+      log.push({ op: "appendSystemMessage", args: [threadId, id, content] });
     },
     forkThread: async (source, target) => {
       log.push({ op: "forkThread", args: [source, target] });
@@ -91,7 +94,9 @@ function createMockThreadOps() {
   return { ops, log };
 }
-function createScriptedRunAgent(turns: TurnScript[]): RunAgentActivity<unknown> {
+function createScriptedRunAgent(
+  turns: TurnScript[]
+): RunAgentActivity<unknown> {
   let call = 0;
   return async () => {
     const turn = turns[call++];
@@ -113,7 +118,7 @@ function createEchoTool() {
     schema: z.object({ text: z.string() }),
     handler: async (
       args: { text: string },
-      _ctx: RouterContext,
+      _ctx: RouterContext
     ): Promise<ToolHandlerResponse<{ echoed: string }>> => ({
       toolResponse: `Echo: ${args.text}`,
       data: { echoed: args.text },
@@ -150,7 +155,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([
         {
           message: "Need user input",
@@ -186,7 +191,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([
         {
           message: "bad calls",
@@ -216,8 +221,11 @@ describe("createSession edge cases", () => {
     const errorResults = log.filter((l) => {
       if (l.op !== "appendToolResult") return false;
-      const config = l.args[0] as ToolResultConfig;
-      return typeof config.content === "string" && config.content.includes("Invalid tool call");
+      const config = l.args[1] as ToolResultConfig;
+      return (
+        typeof config.content === "string" &&
+        config.content.includes("Invalid tool call")
+      );
     });
     expect(errorResults).toHaveLength(2);
   });
@@ -229,7 +237,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([
         {
           message: "no id",
@@ -260,7 +268,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([
         {
           message: "I tried calling a tool",
@@ -298,7 +306,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([
         {
           message: "calling fail",
@@ -328,7 +336,7 @@ describe("createSession edge cases", () => {
   // --- Tool handler throws without recovery ---
-  it("session fails when tool handler throws with no failure hook", async () => {
+  it("session completes when tool handler throws with no failure hook (error suppressed)", async () => {
     const { ops } = createMockThreadOps();
     let endReason: string | undefined;
@@ -343,7 +351,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([
         {
           message: "calling fail",
@@ -364,10 +372,10 @@ describe("createSession edge cases", () => {
       initialState: { systemPrompt: "test" },
     });
-    await expect(session.runSession({ stateManager })).rejects.toThrow(
-      "unrecoverable tool",
-    );
-    expect(endReason).toBe("failed");
+    const result = await session.runSession({ stateManager });
+    expect(result.exitReason).toBe("completed");
+    expect(result.finalMessage).toBe("done");
+    expect(endReason).toBe("completed");
   });
   // --- Metadata passed through to hooks ---
@@ -379,11 +387,9 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       metadata: { env: "test", version: 42 },
-      runAgent: createScriptedRunAgent([
-        { message: "done", toolCalls: [] },
-      ]),
+      runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
       threadOps: ops,
       buildContextMessage: () => "go",
       hooks: {
@@ -422,15 +428,17 @@ describe("createSession edge cases", () => {
         data: null,
         createdAt: new Date().toISOString(),
       }),
+      forkSandbox: async () => "forked-sandbox-id",
+      pauseSandbox: async () => {},
     };
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
       threadOps: ops,
       buildContextMessage: () => "go",
-      sandbox: sandboxOps,
+      sandboxOps,
     });
     const stateManager = createAgentStateManager({
@@ -438,7 +446,7 @@ describe("createSession edge cases", () => {
     });
     await expect(session.runSession({ stateManager })).rejects.toThrow(
-      "sandbox creation failed",
+      "sandbox creation failed"
     );
   });
@@ -462,17 +470,19 @@ describe("createSession edge cases", () => {
         data: null,
         createdAt: new Date().toISOString(),
       }),
+      forkSandbox: async () => "forked-sandbox-id",
+      pauseSandbox: async () => {},
     };
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: async () => {
         throw new Error("LLM crash");
       },
       threadOps: ops,
       buildContextMessage: () => "go",
-      sandbox: sandboxOps,
+      sandboxOps,
     });
     const stateManager = createAgentStateManager({
@@ -480,7 +490,7 @@ describe("createSession edge cases", () => {
     });
     await expect(session.runSession({ stateManager })).rejects.toThrow(
-      "LLM crash",
+      "LLM crash"
     );
     expect(sandboxLog).toContain("create");
@@ -494,7 +504,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([]),
       threadOps: ops,
       buildContextMessage: () => "hi",
@@ -505,7 +515,7 @@ describe("createSession edge cases", () => {
     });
     await expect(session.runSession({ stateManager })).rejects.toThrow(
-      "No system prompt in state",
+      "No system prompt in state"
     );
   });
@@ -527,7 +537,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([
         {
           message: "t1",
@@ -558,15 +568,14 @@ describe("createSession edge cases", () => {
     expect(result.usage.totalOutputTokens).toBe(50);
   });
-  // --- continueThread with no source thread ---
+  // --- Thread fork: new threadId from source ---
-  it("continueThread generates new threadId and forks when source is provided", async () => {
+  it("fork thread mode generates new threadId and forks when source is provided", async () => {
     const { ops, log } = createMockThreadOps();
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "original-thread",
-      continueThread: true,
+      thread: { mode: "fork", threadId: "original-thread" },
       runAgent: createScriptedRunAgent([
         { message: "continued", toolCalls: [] },
       ]),
@@ -597,7 +606,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       maxTurns: 1,
       runAgent: createScriptedRunAgent([
         {
@@ -642,7 +651,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       processToolsInParallel: false,
       runAgent: createScriptedRunAgent([
         {
@@ -675,7 +684,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([
         {
           message: "mixed",
@@ -700,24 +709,27 @@ describe("createSession edge cases", () => {
     const toolResults = log.filter((l) => l.op === "appendToolResult");
     const echoResult = toolResults.find((l) => {
-      const config = l.args[0] as ToolResultConfig;
+      const config = l.args[1] as ToolResultConfig;
       return config.toolName === "Echo";
     });
     expect(echoResult).toBeDefined();
     if (echoResult) {
-      expect((echoResult.args[0] as ToolResultConfig).content).toBe("Echo: valid");
+      expect((echoResult.args[1] as ToolResultConfig).content).toBe(
+        "Echo: valid"
+      );
     }
     const unknownResult = toolResults.find((l) => {
-      const config = l.args[0] as ToolResultConfig;
+      const config = l.args[1] as ToolResultConfig;
       return config.toolName === "Unknown";
     });
     expect(unknownResult).toBeDefined();
     const unknownContent = unknownResult
-      ? (unknownResult.args[0] as ToolResultConfig).content
+      ? (unknownResult.args[1] as ToolResultConfig).content
       : undefined;
     expect(
-      typeof unknownContent === "string" && unknownContent.includes("Invalid tool call"),
+      typeof unknownContent === "string" &&
+        unknownContent.includes("Invalid tool call")
     ).toBe(true);
   });
@@ -728,10 +740,8 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
-      runAgent: createScriptedRunAgent([
-        { message: "done", toolCalls: [] },
-      ]),
+      thread: { mode: "new", threadId: "thread-1" },
+      runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
       threadOps: ops,
       buildContextMessage: () => [
         { type: "text", text: "Hello" },
@@ -749,7 +759,7 @@ describe("createSession edge cases", () => {
     expect(humanOps).toHaveLength(1);
     const humanOp = humanOps[0];
     if (!humanOp) throw new Error("expected human op");
-    const content = humanOp.args[1];
+    const content = humanOp.args[2];
     expect(Array.isArray(content)).toBe(true);
     const firstContent = (content as { type: string }[])[0];
     if (!firstContent) throw new Error("expected content item");
@@ -764,7 +774,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([
         {
           message: "t1",
@@ -813,7 +823,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([
         {
           message: "self",
@@ -834,7 +844,7 @@ describe("createSession edge cases", () => {
     const toolResults = log.filter((l) => {
       if (l.op !== "appendToolResult") return false;
-      const config = l.args[0] as ToolResultConfig;
+      const config = l.args[1] as ToolResultConfig;
       return config.toolName === "SelfAppend";
     });
     expect(toolResults).toHaveLength(0);
@@ -847,7 +857,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([
         {
           message: "calling",
@@ -860,7 +870,10 @@ describe("createSession edge cases", () => {
       buildContextMessage: () => "go",
       hooks: {
         onPreToolUse: async ({ toolCall }) => {
-          if (toolCall.args && (toolCall.args as { text: string }).text === "skip-me") {
+          if (
+            toolCall.args &&
+            (toolCall.args as { text: string }).text === "skip-me"
+          ) {
             return { skip: true };
           }
           return {};
@@ -878,8 +891,10 @@ describe("createSession edge cases", () => {
     expect(toolResults).toHaveLength(1);
     const toolResult = toolResults[0];
     if (!toolResult) throw new Error("expected tool result");
-    const content = (toolResult.args[0] as ToolResultConfig).content;
-    expect(typeof content === "string" && content.includes("Skipped")).toBe(true);
+    const content = (toolResult.args[1] as ToolResultConfig).content;
+    expect(typeof content === "string" && content.includes("Skipped")).toBe(
+      true
+    );
   });
   // --- Sandbox snapshot is not called on normal flow ---
@@ -897,15 +912,17 @@ describe("createSession edge cases", () => {
       createSandbox: async () => ({ sandboxId: "sb-test" }),
       destroySandbox: async () => {},
       snapshotSandbox: snapshotSpy,
+      forkSandbox: async () => "forked-sandbox-id",
+      pauseSandbox: async () => {},
     };
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
       threadOps: ops,
       buildContextMessage: () => "go",
-      sandbox: sandboxOps,
+      sandboxOps,
     });
     const stateManager = createAgentStateManager({
@@ -924,7 +941,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       runAgent: createScriptedRunAgent([
         {
           message: "t1",
@@ -959,7 +976,7 @@ describe("createSession edge cases", () => {
     const session = await createSession({
       agentName: "TestAgent",
-      threadId: "thread-1",
+      thread: { mode: "new", threadId: "thread-1" },
       maxTurns: 0,
       runAgent: createScriptedRunAgent([]),
       threadOps: ops,
@@ -977,4 +994,412 @@ describe("createSession edge cases", () => {
     expect(result.usage.turns).toBe(0);
     expect(result.finalMessage).toBeNull();
   });
+  // --- sandboxId returned from runSession ---
+  it("returns sandboxId from runSession when sandbox is created", async () => {
+    const { ops } = createMockThreadOps();
+    const sandboxOps: SandboxOps = {
+      createSandbox: async () => ({ sandboxId: "sb-created" }),
+      destroySandbox: async () => {},
+      pauseSandbox: async () => {},
+      snapshotSandbox: async () => ({
+        sandboxId: "sb-1",
+        providerId: "test",
+        data: null,
+        createdAt: new Date().toISOString(),
+      }),
+      forkSandbox: async () => "forked-sb",
+    };
+    const session = await createSession({
+      agentName: "TestAgent",
+      thread: { mode: "new", threadId: "thread-1" },
+      runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
+      threadOps: ops,
+      buildContextMessage: () => "go",
+      sandboxOps,
+    });
+    const stateManager = createAgentStateManager({
+      initialState: { systemPrompt: "test" },
+    });
+    const result = await session.runSession({ stateManager });
+    expect((result as { sandboxId?: string }).sandboxId).toBe("sb-created");
+  });
+  it("returns inherited sandboxId from runSession", async () => {
+    const { ops } = createMockThreadOps();
+    const sandboxOps: SandboxOps = {
+      createSandbox: async () => ({ sandboxId: "sb" }),
+      destroySandbox: async () => {},
+      pauseSandbox: async () => {},
+      snapshotSandbox: async () => ({
+        sandboxId: "sb",
+        providerId: "test",
+        data: null,
+        createdAt: new Date().toISOString(),
+      }),
+      forkSandbox: async () => "forked-sb",
+    };
+    const session = await createSession({
+      agentName: "TestAgent",
+      thread: { mode: "new", threadId: "thread-1" },
+      runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
+      threadOps: ops,
+      buildContextMessage: () => "go",
+      sandbox: { mode: "inherit", sandboxId: "inherited-sb" },
+      sandboxOps,
+    });
+    const stateManager = createAgentStateManager({
+      initialState: { systemPrompt: "test" },
+    });
+    const result = await session.runSession({ stateManager });
+    expect((result as { sandboxId?: string }).sandboxId).toBe("inherited-sb");
+  });
+  // --- Inherited sandbox is not destroyed ---
+  it("does not destroy inherited sandbox even when sandboxOps is provided", async () => {
+    const { ops } = createMockThreadOps();
+    const sandboxLog: string[] = [];
+    const sandboxOps: SandboxOps = {
+      createSandbox: async () => {
+        sandboxLog.push("create");
+        return { sandboxId: "new-sb" };
+      },
+      destroySandbox: async (id: string) => {
+        sandboxLog.push(`destroy:${id}`);
+      },
+      pauseSandbox: async (id: string) => {
+        sandboxLog.push(`pause:${id}`);
+      },
+      snapshotSandbox: async () => ({
+        sandboxId: "sb-1",
+        providerId: "test",
+        data: null,
+        createdAt: new Date().toISOString(),
+      }),
+      forkSandbox: async () => "forked-sb",
+    };
+    const session = await createSession({
+      agentName: "TestAgent",
+      thread: { mode: "new", threadId: "thread-1" },
+      runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
+      threadOps: ops,
+      buildContextMessage: () => "go",
+      sandboxOps,
+      sandbox: { mode: "inherit", sandboxId: "inherited-sb" },
+    });
+    const stateManager = createAgentStateManager({
+      initialState: { systemPrompt: "test" },
+    });
+    await session.runSession({ stateManager });
+    expect(sandboxLog).toHaveLength(0);
+  });
+  // --- Sandbox fork ---
+  it("forks sandbox when sandbox init mode is fork", async () => {
+    const { ops } = createMockThreadOps();
+    const sandboxLog: string[] = [];
+    const sandboxOps: SandboxOps = {
+      createSandbox: async () => {
+        sandboxLog.push("create");
+        return { sandboxId: "new-sb" };
+      },
+      destroySandbox: async (id: string) => {
+        sandboxLog.push(`destroy:${id}`);
+      },
+      pauseSandbox: async () => {},
+      snapshotSandbox: async () => ({
+        sandboxId: "sb-1",
+        providerId: "test",
+        data: null,
+        createdAt: new Date().toISOString(),
+      }),
+      forkSandbox: async (id: string) => {
+        sandboxLog.push(`fork:${id}`);
+        return `forked-from-${id}`;
+      },
+    };
+    const session = await createSession({
+      agentName: "TestAgent",
+      thread: { mode: "new", threadId: "thread-1" },
+      runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
+      threadOps: ops,
+      buildContextMessage: () => "go",
+      sandboxOps,
+      sandbox: { mode: "fork", sandboxId: "paused-sb-1" },
+    });
+    const stateManager = createAgentStateManager({
+      initialState: { systemPrompt: "test" },
+    });
+    const result = await session.runSession({ stateManager });
+    expect(sandboxLog).toContain("fork:paused-sb-1");
+    expect(sandboxLog).not.toContain("create");
+    expect((result as { sandboxId?: string }).sandboxId).toBe("forked-from-paused-sb-1");
+    expect(sandboxLog).toContain("destroy:forked-from-paused-sb-1");
+  });
+  // --- Forked sandbox is destroyed on exit ---
+  it("destroys forked sandbox on exit (not inherited)", async () => {
+    const { ops } = createMockThreadOps();
+    const sandboxLog: string[] = [];
+    const sandboxOps: SandboxOps = {
+      createSandbox: async () => ({ sandboxId: "new-sb" }),
+      destroySandbox: async (id: string) => {
+        sandboxLog.push(`destroy:${id}`);
+      },
+      pauseSandbox: async () => {},
+      snapshotSandbox: async () => ({
+        sandboxId: "sb-1",
+        providerId: "test",
+        data: null,
+        createdAt: new Date().toISOString(),
+      }),
+      forkSandbox: async () => "forked-sb",
+    };
+    const session = await createSession({
+      agentName: "TestAgent",
+      thread: { mode: "new", threadId: "thread-1" },
+      runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
+      threadOps: ops,
+      buildContextMessage: () => "go",
+      sandboxOps,
+      sandbox: { mode: "fork", sandboxId: "old-sb" },
+    });
+    const stateManager = createAgentStateManager({
+      initialState: { systemPrompt: "test" },
+    });
+    await session.runSession({ stateManager });
+    expect(sandboxLog).toContain("destroy:forked-sb");
+  });
+  // --- sandboxShutdown "pause": sandbox is paused, not destroyed, on exit ---
+  it("pauses sandbox on exit when sandboxShutdown is pause", async () => {
+    const { ops: threadOps } = createMockThreadOps();
+    // Ordered record of lifecycle calls, formatted as "<action>:<sandboxId>".
+    const lifecycleEvents: string[] = [];
+    const record = (entry: string): void => {
+      lifecycleEvents.push(entry);
+    };
+    const mockSandboxOps: SandboxOps = {
+      createSandbox: async () => ({ sandboxId: "sb-pause-test" }),
+      destroySandbox: async (id: string) => {
+        record(`destroy:${id}`);
+      },
+      pauseSandbox: async (id: string) => {
+        record(`pause:${id}`);
+      },
+      snapshotSandbox: async () => ({
+        sandboxId: "sb-1",
+        providerId: "test",
+        data: null,
+        createdAt: new Date().toISOString(),
+      }),
+      forkSandbox: async () => "forked-sb",
+    };
+    const pausingSession = await createSession({
+      agentName: "TestAgent",
+      thread: { mode: "new", threadId: "thread-1" },
+      runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
+      threadOps,
+      buildContextMessage: () => "go",
+      sandboxOps: mockSandboxOps,
+      sandboxShutdown: "pause",
+    });
+    const stateManager = createAgentStateManager({
+      initialState: { systemPrompt: "test" },
+    });
+    await pausingSession.runSession({ stateManager });
+    // Only a pause may have been recorded for the created sandbox.
+    expect(lifecycleEvents).toContain("pause:sb-pause-test");
+    expect(lifecycleEvents).not.toContain("destroy:sb-pause-test");
+  });
+  // --- sandboxShutdown "pause-until-parent-close": paused on exit, never destroyed ---
+  it("pauses sandbox on exit when sandboxShutdown is pause-until-parent-close", async () => {
+    const { ops: threadOps } = createMockThreadOps();
+    // Lifecycle calls land here as "<action>:<sandboxId>" strings.
+    const seen: string[] = [];
+    const onDestroy = async (id: string) => {
+      seen.push(`destroy:${id}`);
+    };
+    const onPause = async (id: string) => {
+      seen.push(`pause:${id}`);
+    };
+    const mockSandboxOps: SandboxOps = {
+      createSandbox: async () => ({ sandboxId: "sb-parent-close" }),
+      destroySandbox: onDestroy,
+      pauseSandbox: onPause,
+      snapshotSandbox: async () => ({
+        sandboxId: "sb-1",
+        providerId: "test",
+        data: null,
+        createdAt: new Date().toISOString(),
+      }),
+      forkSandbox: async () => "forked-sb",
+    };
+    const childSession = await createSession({
+      agentName: "TestAgent",
+      thread: { mode: "new", threadId: "thread-1" },
+      runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
+      threadOps,
+      buildContextMessage: () => "go",
+      sandboxOps: mockSandboxOps,
+      sandboxShutdown: "pause-until-parent-close",
+    });
+    await childSession.runSession({
+      stateManager: createAgentStateManager({
+        initialState: { systemPrompt: "test" },
+      }),
+    });
+    // On session exit this mode is expected to record a pause and no destroy.
+    expect(seen).toContain("pause:sb-parent-close");
+    expect(seen).not.toContain("destroy:sb-parent-close");
+  });
+  // --- Fork mode requested without sandboxOps: runSession must reject ---
+  it("throws when sandbox fork mode is set without sandboxOps", async () => {
+    const { ops: threadOps } = createMockThreadOps();
+    // No sandboxOps is passed on purpose; only the fork request is supplied.
+    const misconfiguredSession = await createSession({
+      agentName: "TestAgent",
+      thread: { mode: "new", threadId: "thread-1" },
+      runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
+      threadOps,
+      buildContextMessage: () => "go",
+      sandbox: { mode: "fork", sandboxId: "prev-sb" },
+    });
+    const stateManager = createAgentStateManager({
+      initialState: { systemPrompt: "test" },
+    });
+    // createSession itself resolves; the failure surfaces when the run starts.
+    const pendingRun = misconfiguredSession.runSession({ stateManager });
+    await expect(pendingRun).rejects.toThrow(
+      "No sandboxOps provided — cannot fork sandbox"
+    );
+  });
+  // --- Without any sandbox configuration the result carries no sandboxId ---
+  it("does not return sandboxId when no sandbox is configured", async () => {
+    const { ops: threadOps } = createMockThreadOps();
+    // Neither sandboxOps nor a sandbox option is supplied here.
+    const plainSession = await createSession({
+      agentName: "TestAgent",
+      thread: { mode: "new", threadId: "thread-1" },
+      runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
+      threadOps,
+      buildContextMessage: () => "go",
+    });
+    const stateManager = createAgentStateManager({
+      initialState: { systemPrompt: "test" },
+    });
+    const outcome = await plainSession.runSession({ stateManager });
+    // The cast only exposes the optional field so it can be read for the check.
+    const { sandboxId } = outcome as { sandboxId?: string };
+    expect(sandboxId).toBeUndefined();
+  });
+  // --- Thread option omitted: session completes without forking a thread ---
+  it("defaults to new thread without fork when no thread field is provided", async () => {
+    const { ops: threadOps, log: opLog } = createMockThreadOps();
+    // Picks the recorded thread operations that match one op name.
+    const entriesFor = (opName: string) =>
+      opLog.filter((entry) => entry.op === opName);
+    const defaultSession = await createSession({
+      agentName: "TestAgent",
+      runAgent: createScriptedRunAgent([{ message: "done", toolCalls: [] }]),
+      threadOps,
+      buildContextMessage: () => "go",
+    });
+    const stateManager = createAgentStateManager({
+      initialState: { systemPrompt: "test" },
+    });
+    const outcome = await defaultSession.runSession({ stateManager });
+    expect(outcome.exitReason).toBe("completed");
+    // No fork may be logged, and exactly one system message is appended.
+    expect(entriesFor("forkThread")).toHaveLength(0);
+    expect(entriesFor("appendSystemMessage")).toHaveLength(1);
+  });
+  // --- sandboxShutdown "pause" still applies when the agent run throws ---
+  it("pauses sandbox even when session fails if sandboxShutdown is pause", async () => {
+    const { ops: threadOps } = createMockThreadOps();
+    // Lifecycle calls are captured as "<action>:<sandboxId>" strings.
+    const lifecycleEvents: string[] = [];
+    const record = (entry: string): void => {
+      lifecycleEvents.push(entry);
+    };
+    const mockSandboxOps: SandboxOps = {
+      createSandbox: async () => ({ sandboxId: "sb-err" }),
+      destroySandbox: async (id: string) => {
+        record(`destroy:${id}`);
+      },
+      pauseSandbox: async (id: string) => {
+        record(`pause:${id}`);
+      },
+      snapshotSandbox: async () => ({
+        sandboxId: "sb-1",
+        providerId: "test",
+        data: null,
+        createdAt: new Date().toISOString(),
+      }),
+      forkSandbox: async () => "forked-sb",
+    };
+    // Agent stub whose every invocation rejects with "crash".
+    const crashingAgent = async () => {
+      throw new Error("crash");
+    };
+    const failingSession = await createSession({
+      agentName: "TestAgent",
+      thread: { mode: "new", threadId: "thread-1" },
+      runAgent: crashingAgent,
+      threadOps,
+      buildContextMessage: () => "go",
+      sandboxOps: mockSandboxOps,
+      sandboxShutdown: "pause",
+    });
+    const stateManager = createAgentStateManager({
+      initialState: { systemPrompt: "test" },
+    });
+    const pendingRun = failingSession.runSession({ stateManager });
+    await expect(pendingRun).rejects.toThrow("crash");
+    // The error reaches the caller and the sandbox is paused, not destroyed.
+    expect(lifecycleEvents).toContain("pause:sb-err");
+    expect(lifecycleEvents).not.toContain("destroy:sb-err");
+  });
 });