npm - illuma-agents - Versions diffs - 1.0.37 → 1.0.39 - Mend

illuma-agents 1.0.37 → 1.0.39

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (139) hide show

package/dist/cjs/agents/AgentContext.cjs +112 -14
package/dist/cjs/agents/AgentContext.cjs.map +1 -1
package/dist/cjs/common/enum.cjs +5 -1
package/dist/cjs/common/enum.cjs.map +1 -1
package/dist/cjs/graphs/Graph.cjs +148 -8
package/dist/cjs/graphs/Graph.cjs.map +1 -1
package/dist/cjs/graphs/MultiAgentGraph.cjs +277 -11
package/dist/cjs/graphs/MultiAgentGraph.cjs.map +1 -1
package/dist/cjs/llm/bedrock/index.cjs +128 -61
package/dist/cjs/llm/bedrock/index.cjs.map +1 -1
package/dist/cjs/main.cjs +22 -7
package/dist/cjs/main.cjs.map +1 -1
package/dist/cjs/messages/cache.cjs +140 -46
package/dist/cjs/messages/cache.cjs.map +1 -1
package/dist/cjs/messages/core.cjs +1 -1
package/dist/cjs/messages/core.cjs.map +1 -1
package/dist/cjs/messages/tools.cjs +2 -2
package/dist/cjs/messages/tools.cjs.map +1 -1
package/dist/cjs/schemas/validate.cjs +173 -0
package/dist/cjs/schemas/validate.cjs.map +1 -0
package/dist/cjs/stream.cjs +4 -2
package/dist/cjs/stream.cjs.map +1 -1
package/dist/cjs/tools/BrowserTools.cjs.map +1 -1
package/dist/cjs/tools/CodeExecutor.cjs +22 -21
package/dist/cjs/tools/CodeExecutor.cjs.map +1 -1
package/dist/cjs/tools/ProgrammaticToolCalling.cjs +14 -11
package/dist/cjs/tools/ProgrammaticToolCalling.cjs.map +1 -1
package/dist/cjs/tools/ToolNode.cjs +101 -2
package/dist/cjs/tools/ToolNode.cjs.map +1 -1
package/dist/cjs/tools/ToolSearch.cjs +862 -0
package/dist/cjs/tools/ToolSearch.cjs.map +1 -0
package/dist/esm/agents/AgentContext.mjs +112 -14
package/dist/esm/agents/AgentContext.mjs.map +1 -1
package/dist/esm/common/enum.mjs +5 -1
package/dist/esm/common/enum.mjs.map +1 -1
package/dist/esm/graphs/Graph.mjs +149 -9
package/dist/esm/graphs/Graph.mjs.map +1 -1
package/dist/esm/graphs/MultiAgentGraph.mjs +278 -12
package/dist/esm/graphs/MultiAgentGraph.mjs.map +1 -1
package/dist/esm/llm/bedrock/index.mjs +127 -60
package/dist/esm/llm/bedrock/index.mjs.map +1 -1
package/dist/esm/main.mjs +2 -1
package/dist/esm/main.mjs.map +1 -1
package/dist/esm/messages/cache.mjs +140 -46
package/dist/esm/messages/cache.mjs.map +1 -1
package/dist/esm/messages/core.mjs +1 -1
package/dist/esm/messages/core.mjs.map +1 -1
package/dist/esm/messages/tools.mjs +2 -2
package/dist/esm/messages/tools.mjs.map +1 -1
package/dist/esm/schemas/validate.mjs +167 -0
package/dist/esm/schemas/validate.mjs.map +1 -0
package/dist/esm/stream.mjs +4 -2
package/dist/esm/stream.mjs.map +1 -1
package/dist/esm/tools/BrowserTools.mjs.map +1 -1
package/dist/esm/tools/CodeExecutor.mjs +22 -21
package/dist/esm/tools/CodeExecutor.mjs.map +1 -1
package/dist/esm/tools/ProgrammaticToolCalling.mjs +14 -11
package/dist/esm/tools/ProgrammaticToolCalling.mjs.map +1 -1
package/dist/esm/tools/ToolNode.mjs +102 -3
package/dist/esm/tools/ToolNode.mjs.map +1 -1
package/dist/esm/tools/ToolSearch.mjs +827 -0
package/dist/esm/tools/ToolSearch.mjs.map +1 -0
package/dist/types/agents/AgentContext.d.ts +51 -1
package/dist/types/common/enum.d.ts +6 -2
package/dist/types/graphs/Graph.d.ts +12 -0
package/dist/types/graphs/MultiAgentGraph.d.ts +16 -0
package/dist/types/index.d.ts +2 -1
package/dist/types/llm/bedrock/index.d.ts +89 -11
package/dist/types/llm/bedrock/types.d.ts +27 -0
package/dist/types/llm/bedrock/utils/index.d.ts +5 -0
package/dist/types/llm/bedrock/utils/message_inputs.d.ts +31 -0
package/dist/types/llm/bedrock/utils/message_outputs.d.ts +33 -0
package/dist/types/messages/cache.d.ts +4 -1
package/dist/types/schemas/index.d.ts +1 -0
package/dist/types/schemas/validate.d.ts +36 -0
package/dist/types/tools/CodeExecutor.d.ts +0 -3
package/dist/types/tools/ProgrammaticToolCalling.d.ts +0 -3
package/dist/types/tools/ToolNode.d.ts +3 -1
package/dist/types/tools/ToolSearch.d.ts +148 -0
package/dist/types/types/graph.d.ts +71 -0
package/dist/types/types/llm.d.ts +3 -1
package/dist/types/types/tools.d.ts +42 -2
package/package.json +13 -6
package/src/agents/AgentContext.test.ts +312 -0
package/src/agents/AgentContext.ts +144 -16
package/src/common/enum.ts +5 -1
package/src/graphs/Graph.ts +214 -13
package/src/graphs/MultiAgentGraph.ts +350 -13
package/src/index.ts +4 -1
package/src/llm/bedrock/index.ts +221 -99
package/src/llm/bedrock/llm.spec.ts +616 -0
package/src/llm/bedrock/types.ts +51 -0
package/src/llm/bedrock/utils/index.ts +18 -0
package/src/llm/bedrock/utils/message_inputs.ts +563 -0
package/src/llm/bedrock/utils/message_outputs.ts +310 -0
package/src/messages/__tests__/tools.test.ts +21 -21
package/src/messages/cache.test.ts +304 -0
package/src/messages/cache.ts +183 -53
package/src/messages/core.ts +1 -1
package/src/messages/tools.ts +2 -2
package/src/schemas/index.ts +2 -0
package/src/schemas/validate.test.ts +358 -0
package/src/schemas/validate.ts +238 -0
package/src/scripts/caching.ts +27 -19
package/src/scripts/code_exec_files.ts +58 -15
package/src/scripts/code_exec_multi_session.ts +241 -0
package/src/scripts/code_exec_session.ts +282 -0
package/src/scripts/multi-agent-conditional.ts +1 -0
package/src/scripts/multi-agent-supervisor.ts +1 -0
package/src/scripts/programmatic_exec_agent.ts +4 -4
package/src/scripts/test-handoff-preamble.ts +277 -0
package/src/scripts/test-parallel-handoffs.ts +291 -0
package/src/scripts/test-tools-before-handoff.ts +8 -4
package/src/scripts/test_code_api.ts +361 -0
package/src/scripts/thinking-bedrock.ts +159 -0
package/src/scripts/thinking.ts +39 -18
package/src/scripts/{tool_search_regex.ts → tool_search.ts} +5 -5
package/src/scripts/tools.ts +7 -3
package/src/specs/cache.simple.test.ts +396 -0
package/src/stream.ts +4 -2
package/src/tools/BrowserTools.ts +39 -17
package/src/tools/CodeExecutor.ts +26 -23
package/src/tools/ProgrammaticToolCalling.ts +18 -14
package/src/tools/ToolNode.ts +114 -1
package/src/tools/ToolSearch.ts +1041 -0
package/src/tools/__tests__/ProgrammaticToolCalling.test.ts +0 -2
package/src/tools/__tests__/{ToolSearchRegex.integration.test.ts → ToolSearch.integration.test.ts} +6 -6
package/src/tools/__tests__/ToolSearch.test.ts +1003 -0
package/src/types/graph.test.ts +183 -0
package/src/types/graph.ts +73 -0
package/src/types/llm.ts +3 -1
package/src/types/tools.ts +51 -2
package/dist/cjs/tools/ToolSearchRegex.cjs +0 -455
package/dist/cjs/tools/ToolSearchRegex.cjs.map +0 -1
package/dist/esm/tools/ToolSearchRegex.mjs +0 -448
package/dist/esm/tools/ToolSearchRegex.mjs.map +0 -1
package/dist/types/tools/ToolSearchRegex.d.ts +0 -80
package/src/tools/ToolSearchRegex.ts +0 -535
package/src/tools/__tests__/ToolSearchRegex.test.ts +0 -232

package/src/scripts/test-parallel-handoffs.ts ADDED Viewed

@@ -0,0 +1,291 @@
+import { config } from 'dotenv';
+config();
+import { HumanMessage, BaseMessage } from '@langchain/core/messages';
+import type * as t from '@/types';
+import { ChatModelStreamHandler, createContentAggregator } from '@/stream';
+import { ToolEndHandler } from '@/events';
+import { Providers, GraphEvents } from '@/common';
+import { sleep } from '@/utils/run';
+import { Run } from '@/run';
+const conversationHistory: BaseMessage[] = []; // message log: receives the user prompt, is passed as the run input, then gets the run's messages appended
+/**
+ * Test parallel handoffs - where an LLM calls multiple transfer tools simultaneously
+ *
+ * Graph structure:
+ * coordinator -> [researcher, writer] (via parallel handoff tools)
+ *
+ * The coordinator agent has two transfer tools:
+ * - transfer_to_researcher
+ * - transfer_to_writer
+ *
+ * When given a task that needs both, it should call both tools in parallel.
+ *
+ * Chat-model start/end events are timestamped per graph node (milliseconds
+ * since `startTime`). After the run, the researcher and writer windows are
+ * compared: a positive overlap is reported as a successful parallel handoff.
+ *
+ * @throws Rethrows any error raised while creating or streaming the run, after logging it.
+ */
+async function testParallelHandoffs(): Promise<void> {
+  console.log(
+    'Testing Parallel Handoffs (LLM calling multiple transfers)...\n'
+  );
+  const { contentParts, aggregateContent } = createContentAggregator();
+  const agents: t.AgentInputs[] = [
+    {
+      agentId: 'coordinator',
+      provider: Providers.OPENAI,
+      clientOptions: {
+        modelName: 'gpt-4o-mini',
+        apiKey: process.env.OPENAI_API_KEY,
+      },
+      instructions: `You are a COORDINATOR agent. Your job is to delegate tasks to specialized agents.
+You have access to two transfer tools:
+- transfer_to_researcher: For research and fact-finding tasks
+- transfer_to_writer: For content creation and writing tasks
+IMPORTANT: When a task requires BOTH research AND writing, you MUST call BOTH transfer tools SIMULTANEOUSLY in the same response. Do not call them sequentially.
+For example, if asked to "research and write about X", call both transfers at once to enable parallel work.
+When delegating, provide clear instructions to each agent about what they should do.`,
+    },
+    {
+      agentId: 'researcher',
+      provider: Providers.ANTHROPIC,
+      clientOptions: {
+        modelName: 'claude-haiku-4-5',
+        apiKey: process.env.ANTHROPIC_API_KEY,
+      },
+      instructions: `You are a RESEARCHER. When you receive a task:
+1. Provide concise research findings (100-150 words)
+2. Start your response with "📚 RESEARCH FINDINGS:"`,
+    },
+    {
+      agentId: 'writer',
+      provider: Providers.ANTHROPIC,
+      clientOptions: {
+        modelName: 'claude-haiku-4-5',
+        apiKey: process.env.ANTHROPIC_API_KEY,
+      },
+      instructions: `You are a WRITER. When you receive a task:
+1. Provide creative content (100-150 words)
+2. Start your response with "✍️ WRITTEN CONTENT:"`,
+    },
+  ];
+  /**
+   * Create handoff edges from coordinator to both researcher and writer.
+   * These are separate edges so the LLM sees both transfer tools.
+   */
+  const edges: t.GraphEdge[] = [
+    {
+      from: 'coordinator',
+      to: 'researcher',
+      edgeType: 'handoff',
+      description: 'Transfer to researcher for research and fact-finding tasks',
+      prompt: 'Research task instructions',
+    },
+    {
+      from: 'coordinator',
+      to: 'writer',
+      edgeType: 'handoff',
+      description: 'Transfer to writer for content creation and writing tasks',
+      prompt: 'Writing task instructions',
+    },
+  ];
+  /** Track which agents are active and their timing (milliseconds since `startTime`) */
+  const activeAgents = new Set<string>();
+  const agentTimings: Record<string, { start?: number; end?: number }> = {};
+  const startTime = Date.now();
+  /** Extract the graph node name from event metadata; undefined unless it is a non-empty string */
+  const getNodeName = (
+    metadata?: Record<string, unknown>
+  ): string | undefined => {
+    const nodeName = metadata?.langgraph_node;
+    return typeof nodeName === 'string' && nodeName !== ''
+      ? nodeName
+      : undefined;
+  };
+  /** Render an optional millisecond value without producing "undefinedms" / "N/Ams" */
+  const formatMs = (value?: number): string =>
+    value === undefined ? 'N/A' : `${value}ms`;
+  const customHandlers = {
+    [GraphEvents.TOOL_END]: new ToolEndHandler(),
+    [GraphEvents.CHAT_MODEL_END]: {
+      handle: (
+        _event: string,
+        _data: t.StreamEventData,
+        metadata?: Record<string, unknown>
+      ): void => {
+        const nodeName = getNodeName(metadata);
+        if (nodeName === undefined) {
+          return;
+        }
+        const elapsed = Date.now() - startTime;
+        const timing = agentTimings[nodeName] ?? {};
+        /** Last end event wins, so `end` reflects the node's final model call */
+        timing.end = elapsed;
+        agentTimings[nodeName] = timing;
+        activeAgents.delete(nodeName);
+        console.log(`\n⏱️  [${nodeName}] COMPLETED at ${elapsed}ms`);
+      },
+    },
+    [GraphEvents.CHAT_MODEL_START]: {
+      handle: (
+        _event: string,
+        _data: t.StreamEventData,
+        metadata?: Record<string, unknown>
+      ): void => {
+        const nodeName = getNodeName(metadata);
+        if (nodeName === undefined) {
+          return;
+        }
+        const elapsed = Date.now() - startTime;
+        const timing = agentTimings[nodeName] ?? {};
+        /**
+         * Store first start time for parallel overlap calculation.
+         * Compared against undefined so a legitimate 0ms start is not overwritten.
+         */
+        if (timing.start === undefined) {
+          timing.start = elapsed;
+        }
+        agentTimings[nodeName] = timing;
+        activeAgents.add(nodeName);
+        console.log(`\n⏱️  [${nodeName}] STARTED at ${elapsed}ms`);
+        console.log(
+          `   Active agents: ${Array.from(activeAgents).join(', ')}`
+        );
+      },
+    },
+    [GraphEvents.CHAT_MODEL_STREAM]: new ChatModelStreamHandler(),
+    [GraphEvents.ON_RUN_STEP_COMPLETED]: {
+      handle: (
+        event: GraphEvents.ON_RUN_STEP_COMPLETED,
+        data: t.StreamEventData
+      ): void => {
+        aggregateContent({
+          event,
+          data: data as unknown as { result: t.ToolEndEvent },
+        });
+      },
+    },
+    [GraphEvents.ON_RUN_STEP]: {
+      handle: (
+        event: GraphEvents.ON_RUN_STEP,
+        data: t.StreamEventData
+      ): void => {
+        aggregateContent({ event, data: data as t.RunStep });
+      },
+    },
+    [GraphEvents.ON_RUN_STEP_DELTA]: {
+      handle: (
+        event: GraphEvents.ON_RUN_STEP_DELTA,
+        data: t.StreamEventData
+      ): void => {
+        aggregateContent({ event, data: data as t.RunStepDeltaEvent });
+      },
+    },
+    [GraphEvents.ON_MESSAGE_DELTA]: {
+      handle: (
+        event: GraphEvents.ON_MESSAGE_DELTA,
+        data: t.StreamEventData
+      ): void => {
+        aggregateContent({ event, data: data as t.MessageDeltaEvent });
+      },
+    },
+  };
+  const runConfig: t.RunConfig = {
+    runId: `parallel-handoffs-${Date.now()}`,
+    graphConfig: {
+      type: 'multi-agent',
+      agents,
+      edges,
+    },
+    customHandlers,
+    returnContent: true,
+  };
+  try {
+    const run = await Run.create(runConfig);
+    /** Prompt designed to trigger parallel handoffs without confusing language */
+    const userMessage = `Help me with two topics:
+1. The history of the internet
+2. A short poem about technology
+I need information on both topics.`;
+    conversationHistory.push(new HumanMessage(userMessage));
+    console.log('User message:', userMessage);
+    console.log(
+      '\nInvoking multi-agent graph with parallel handoff request...\n'
+    );
+    /** Named `streamConfig` so it does not shadow the dotenv `config` import */
+    const streamConfig = {
+      configurable: {
+        thread_id: 'parallel-handoffs-test-1',
+      },
+      streamMode: 'values',
+      version: 'v2' as const,
+    };
+    const inputs = {
+      messages: conversationHistory,
+    };
+    await run.processStream(inputs, streamConfig);
+    const finalMessages = run.getRunMessages();
+    if (finalMessages) {
+      conversationHistory.push(...finalMessages);
+    }
+    /** Analyze parallel execution */
+    console.log('\n\n========== TIMING SUMMARY ==========');
+    console.log('Available timing keys:', Object.keys(agentTimings));
+    for (const [agent, timing] of Object.entries(agentTimings)) {
+      const duration =
+        timing.start !== undefined && timing.end !== undefined
+          ? timing.end - timing.start
+          : undefined;
+      console.log(
+        `${agent}: started=${formatMs(timing.start)}, ended=${formatMs(timing.end)}, duration=${formatMs(duration)}`
+      );
+    }
+    /** Check if researcher and writer ran in parallel (handle key variations) */
+    const researcherKey = Object.keys(agentTimings).find((k) =>
+      k.includes('researcher')
+    );
+    const writerKey = Object.keys(agentTimings).find((k) =>
+      k.includes('writer')
+    );
+    const researcherTiming = researcherKey
+      ? agentTimings[researcherKey]
+      : undefined;
+    const writerTiming = writerKey ? agentTimings[writerKey] : undefined;
+    if (researcherTiming && writerTiming) {
+      const { start: researcherStart, end: researcherEnd } = researcherTiming;
+      const { start: writerStart, end: writerEnd } = writerTiming;
+      if (
+        researcherStart !== undefined &&
+        researcherEnd !== undefined &&
+        writerStart !== undefined &&
+        writerEnd !== undefined
+      ) {
+        /** Overlap of the two [start, end] windows; positive means they ran concurrently */
+        const overlap =
+          Math.min(researcherEnd, writerEnd) -
+          Math.max(researcherStart, writerStart);
+        if (overlap > 0) {
+          console.log(
+            `\n✅ PARALLEL HANDOFFS SUCCESSFUL: ${overlap}ms overlap between researcher and writer`
+          );
+        } else {
+          console.log(
+            `\n⚠️  SEQUENTIAL EXECUTION: researcher and writer did not overlap`
+          );
+          console.log(
+            `   This may indicate the LLM called transfers sequentially, not in parallel`
+          );
+        }
+      } else {
+        /** Both agents were seen but a start or end event is missing */
+        console.log(
+          '\n⚠️  Incomplete timing data for researcher/writer; cannot determine overlap.'
+        );
+        console.log('   researcher timing:', researcherTiming);
+        console.log('   writer timing:', writerTiming);
+      }
+    } else {
+      console.log(
+        '\n⚠️  Not all agents were invoked. Check if handoffs occurred.'
+      );
+      console.log('   researcher timing:', researcherTiming);
+      console.log('   writer timing:', writerTiming);
+    }
+    console.log('====================================\n');
+    console.log('Final content parts:', contentParts.length, 'parts');
+    console.dir(contentParts, { depth: null });
+    await sleep(3000);
+  } catch (error) {
+    console.error('Error in parallel handoffs test:', error);
+    throw error;
+  }
+}
+/**
+ * Run the script. The function logs its own failure before rethrowing, so the
+ * handler only needs to turn the rejection into a non-zero exit code instead of
+ * leaving a floating promise.
+ */
+testParallelHandoffs().catch(() => {
+  process.exit(1);
+});

package/src/scripts/test-tools-before-handoff.ts CHANGED Viewed

@@ -28,10 +28,14 @@ async function testToolsBeforeHandoff() {
   // Create custom handlers
   const customHandlers = {
-    [GraphEvents.TOOL_END]: new ToolEndHandler(undefined, (name?: string) => {
-      console.log(`\n✅ Tool completed: ${name}`);
-      return true;
-    }),
+    [GraphEvents.TOOL_END]: new ToolEndHandler(
+      undefined,
+      undefined,
+      (name?: string) => {
+        console.log(`\n✅ Tool completed: ${name}`);
+        return true;
+      }
+    ),
     [GraphEvents.CHAT_MODEL_END]: new ModelEndHandler(),
     [GraphEvents.CHAT_MODEL_STREAM]: new ChatModelStreamHandler(),
     [GraphEvents.ON_RUN_STEP]: {

package/src/scripts/test_code_api.ts ADDED Viewed

@@ -0,0 +1,361 @@
+// src/scripts/test_code_api.ts
+/**
+ * Direct test of the Code API to verify session file persistence.
+ * This bypasses the LLM and tests the API directly.
+ *
+ * Run with: npx ts-node -r dotenv/config src/scripts/test_code_api.ts
+ */
+import { config } from 'dotenv';
+config();
+import fetch, { RequestInit } from 'node-fetch';
+import { HttpsProxyAgent } from 'https-proxy-agent';
+const API_KEY = process.env.LIBRECHAT_CODE_API_KEY ?? ''; // sent as the X-API-Key header on every request
+const BASE_URL =
+  process.env.LIBRECHAT_CODE_BASEURL ?? 'https://api.librechat.ai/v1'; // API root; overridable through the environment
+const PROXY = process.env.PROXY; // optional; when set, requests are sent through an HttpsProxyAgent
+if (!API_KEY) { // abort early when no API key is configured
+  console.error('LIBRECHAT_CODE_API_KEY not set');
+  process.exit(1);
+}
+interface FileRef { // file entry as read from exec responses and sent back in the `files` field of later exec requests
+  id: string;
+  name: string;
+  session_id?: string; // may be missing on a response entry; this script then falls back to the response's own session_id
+  /** Lineage tracking - present if file was modified from previous session */
+  modified_from?: {
+    id: string;
+    session_id: string;
+  };
+}
+interface ExecResult { // shape this script assumes for `/exec` responses (applied by cast, not validated at runtime)
+  session_id: string;
+  stdout: string;
+  stderr: string;
+  files?: FileRef[]; // treated as an empty list when omitted
+}
+interface FileInfo { // shape assumed for entries of the `/files/<session>?detail=full` listing (applied by cast, not validated)
+  name: string;
+  metadata: Record<string, string>;
+}
+/**
+ * Sends a JSON request to the Code API and returns the decoded response body.
+ *
+ * Issues a POST when `body` is provided and a GET otherwise, routes the call
+ * through `PROXY` when that is configured, and logs both request and response.
+ *
+ * @param endpoint - Absolute URL to call.
+ * @param body - Optional JSON payload; its presence selects POST.
+ * @returns The parsed JSON response body.
+ * @throws Error carrying the HTTP status when the response is not OK (even if
+ *   the error body is not JSON), or when a successful response is not valid JSON.
+ */
+async function makeRequest(
+  endpoint: string,
+  body?: Record<string, unknown>
+): Promise<unknown> {
+  const method = body ? 'POST' : 'GET';
+  const fetchOptions: RequestInit = {
+    method,
+    headers: {
+      'Content-Type': 'application/json',
+      'User-Agent': 'LibreChat/1.0',
+      'X-API-Key': API_KEY,
+    },
+  };
+  if (body) {
+    fetchOptions.body = JSON.stringify(body);
+  }
+  if (PROXY) {
+    fetchOptions.agent = new HttpsProxyAgent(PROXY);
+  }
+  console.log(`\n>>> ${method} ${endpoint}`);
+  if (body) {
+    console.log('Body:', JSON.stringify(body, null, 2));
+  }
+  const response = await fetch(endpoint, fetchOptions);
+  /**
+   * Read the body as text first: error responses (e.g. from a proxy or gateway)
+   * are not guaranteed to be JSON, and parsing eagerly would hide the HTTP status
+   * behind a JSON syntax error.
+   */
+  const rawBody = await response.text();
+  let result: unknown;
+  let isJson = true;
+  try {
+    result = JSON.parse(rawBody);
+  } catch {
+    isJson = false;
+  }
+  console.log(`<<< Response (${response.status}):`);
+  console.log(isJson ? JSON.stringify(result, null, 2) : rawBody);
+  if (!response.ok) {
+    throw new Error(
+      `HTTP ${response.status}: ${isJson ? JSON.stringify(result) : rawBody}`
+    );
+  }
+  if (!isJson) {
+    /** Callers cast the result to structured types, so a non-JSON success body is an error */
+    throw new Error(
+      `Expected a JSON response from ${endpoint}, received: ${rawBody}`
+    );
+  }
+  return result;
+}
+/**
+ * Exercises the Code API directly (no LLM involved) and logs the outcome of each step:
+ *  1. create a JSON file through `/exec`,
+ *  2. list the session's files with `detail=full` and `detail=normalized`,
+ *  3. read the file back in a new execution, retrying with only `session_id`
+ *     if the file references are not resolved,
+ *  4. modify the file in place and inspect the `modified_from` lineage,
+ *  5. confirm the modification is visible to a subsequent execution.
+ *
+ * Step outcomes are reported via console output only; request failures
+ * propagate from `makeRequest`.
+ */
+async function testCodeAPI(): Promise<void> {
+  console.log('='.repeat(60));
+  console.log('TEST 1: Create a file');
+  console.log('='.repeat(60));
+  const createCode = `
+import json
+config = {
+    "app_name": "TestApp",
+    "version": "1.0.0",
+    "debug": True
+}
+with open("/mnt/data/test_config.json", "w") as f:
+    json.dump(config, f, indent=2)
+with open("/mnt/data/test_config.json", "r") as f:
+    print(f.read())
+`;
+  const result1 = (await makeRequest(`${BASE_URL}/exec`, {
+    lang: 'py',
+    code: createCode,
+  })) as ExecResult;
+  const sessionId = result1.session_id;
+  const files = result1.files ?? [];
+  console.log('\n--- Result Summary ---');
+  console.log('session_id:', sessionId);
+  console.log('files:', files);
+  console.log('stdout:', result1.stdout);
+  console.log('stderr:', result1.stderr);
+  if (!sessionId || files.length === 0) {
+    console.error('\n❌ No session_id or files returned!');
+    return;
+  }
+  // Check if files now include session_id (new API feature)
+  const hasSessionIdInFiles = files.some((f) => f.session_id != null);
+  // Only show the success marker when the check actually passed
+  console.log(
+    `\n${hasSessionIdInFiles ? '✅' : '⚠️ '} Files include session_id:`,
+    hasSessionIdInFiles
+  );
+  console.log('\n' + '='.repeat(60));
+  console.log(
+    'TEST 2: Fetch files IMMEDIATELY (no delay - testing race condition fix)'
+  );
+  console.log('='.repeat(60));
+  const filesResult = (await makeRequest(
+    `${BASE_URL}/files/${sessionId}?detail=full`
+  )) as FileInfo[];
+  console.log('\n--- Files in session (detail=full) ---');
+  for (const file of filesResult) {
+    console.log('File:', file.name);
+    console.log('  metadata:', file.metadata);
+  }
+  if (filesResult.length === 0) {
+    console.log(
+      '\n⚠️  Files endpoint returned empty - race condition may still exist'
+    );
+  } else {
+    console.log('\n✅ Files available immediately!');
+  }
+  // Test new normalized detail level
+  console.log('\n' + '='.repeat(60));
+  console.log('TEST 2b: Fetch files with detail=normalized');
+  console.log('='.repeat(60));
+  const normalizedResult = (await makeRequest(
+    `${BASE_URL}/files/${sessionId}?detail=normalized`
+  )) as FileRef[];
+  console.log('\n--- Files in session (detail=normalized) ---');
+  console.log(JSON.stringify(normalizedResult, null, 2));
+  console.log('\n' + '='.repeat(60));
+  console.log(
+    'TEST 3: Read file IMMEDIATELY using files from original response'
+  );
+  console.log('='.repeat(60));
+  // Use files directly - if API returns session_id, use that; otherwise add it
+  const fileReferences: FileRef[] = files.map((file) => ({
+    session_id: file.session_id ?? sessionId,
+    id: file.id,
+    name: file.name,
+  }));
+  console.log(
+    '\nFile references we will send:',
+    JSON.stringify(fileReferences, null, 2)
+  );
+  const readCode = `
+import json
+with open("/mnt/data/test_config.json", "r") as f:
+    config = json.load(f)
+    print("Read config:")
+    print(json.dumps(config, indent=2))
+    print("Version:", config.get("version"))
+`;
+  const result2 = (await makeRequest(`${BASE_URL}/exec`, {
+    lang: 'py',
+    code: readCode,
+    files: fileReferences,
+  })) as ExecResult;
+  console.log('\n--- Result Summary ---');
+  console.log('stdout:', result2.stdout);
+  console.log('stderr:', result2.stderr);
+  if (result2.stderr && result2.stderr.includes('FileNotFoundError')) {
+    console.log(
+      '\n❌ File not found! The file reference format might be wrong.'
+    );
+    // Try alternative format - just session_id.
+    // Labelled 3b so its output is not confused with TEST 4 (modify) below.
+    console.log('\n' + '='.repeat(60));
+    console.log('TEST 3b: Try with just session_id in request');
+    console.log('='.repeat(60));
+    const fallbackResult = (await makeRequest(`${BASE_URL}/exec`, {
+      lang: 'py',
+      code: readCode,
+      session_id: sessionId,
+    })) as ExecResult;
+    console.log('\n--- Result Summary ---');
+    console.log('stdout:', fallbackResult.stdout);
+    console.log('stderr:', fallbackResult.stderr);
+  } else {
+    console.log('\n✅ File read successfully!');
+  }
+  // ============================================================
+  // TEST 4: MODIFY the file (same filename) - tests editable files
+  // ============================================================
+  console.log('\n' + '='.repeat(60));
+  console.log('TEST 4: MODIFY file in-place (testing editable files feature)');
+  console.log('='.repeat(60));
+  const modifyCode = `
+import json
+# Read the existing file
+with open("/mnt/data/test_config.json", "r") as f:
+    config = json.load(f)
+print("Original config:")
+print(json.dumps(config, indent=2))
+# Modify the config
+config["version"] = "2.0.0"
+config["modified"] = True
+# Write BACK to the SAME filename (should work now!)
+with open("/mnt/data/test_config.json", "w") as f:
+    json.dump(config, f, indent=2)
+# Verify the write
+with open("/mnt/data/test_config.json", "r") as f:
+    updated = json.load(f)
+print("\\nUpdated config:")
+print(json.dumps(updated, indent=2))
+`;
+  const result3 = (await makeRequest(`${BASE_URL}/exec`, {
+    lang: 'py',
+    code: modifyCode,
+    files: fileReferences,
+  })) as ExecResult;
+  console.log('\n--- Result Summary ---');
+  console.log('stdout:', result3.stdout);
+  console.log('stderr:', result3.stderr);
+  console.log('files:', JSON.stringify(result3.files, null, 2));
+  if (result3.stderr && result3.stderr.includes('Permission denied')) {
+    console.log('\n❌ Permission denied - files are still read-only!');
+  } else if (result3.stderr && result3.stderr.includes('Error')) {
+    console.log('\n❌ Error modifying file:', result3.stderr);
+  } else {
+    console.log('\n✅ File modified successfully!');
+    // Check for modified_from lineage
+    const modifiedFile = result3.files?.find(
+      (f) => f.name === 'test_config.json'
+    );
+    if (modifiedFile) {
+      console.log('\n--- Modified File Details ---');
+      console.log('  id:', modifiedFile.id);
+      console.log('  name:', modifiedFile.name);
+      console.log('  session_id:', modifiedFile.session_id);
+      if (modifiedFile.modified_from) {
+        console.log(
+          '  modified_from:',
+          JSON.stringify(modifiedFile.modified_from)
+        );
+        console.log(
+          '\n✅ Lineage tracking working! File shows it was modified from previous session.'
+        );
+      } else {
+        console.log(
+          '\n⚠️  No modified_from field - lineage tracking not present'
+        );
+      }
+    } else {
+      console.log('\n⚠️  Modified file not found in response files array');
+    }
+  }
+  // ============================================================
+  // TEST 5: Verify modification persists in next execution
+  // ============================================================
+  console.log('\n' + '='.repeat(60));
+  console.log(
+    'TEST 5: Verify modified file can be read in subsequent execution'
+  );
+  console.log('='.repeat(60));
+  // Use the new file references from the modify response
+  const newFileRefs: FileRef[] = (result3.files ?? []).map((file) => ({
+    session_id: file.session_id ?? result3.session_id,
+    id: file.id,
+    name: file.name,
+  }));
+  if (newFileRefs.length === 0) {
+    console.log(
+      '\n⚠️  No files returned from modification, skipping verification'
+    );
+  } else {
+    console.log(
+      '\nUsing new file references:',
+      JSON.stringify(newFileRefs, null, 2)
+    );
+    const verifyCode = `
+import json
+with open("/mnt/data/test_config.json", "r") as f:
+    config = json.load(f)
+print("Verified config:")
+print(json.dumps(config, indent=2))
+if config.get("version") == "2.0.0" and config.get("modified") == True:
+    print("\\n✅ Modification persisted correctly!")
+else:
+    print("\\n❌ Modification did NOT persist!")
+`;
+    const result4 = (await makeRequest(`${BASE_URL}/exec`, {
+      lang: 'py',
+      code: verifyCode,
+      files: newFileRefs,
+    })) as ExecResult;
+    console.log('\n--- Result Summary ---');
+    console.log('stdout:', result4.stdout);
+    console.log('stderr:', result4.stderr);
+  }
+}
+testCodeAPI().catch((err) => { // script entry point: log any propagated failure and exit with a non-zero status
+  console.error('Error:', err);
+  process.exit(1);
+});