@librechat/agents 2.3.1 → 2.3.3
This diff compares the contents of publicly available package versions as published to their public registries. It is provided for informational purposes only.
- package/dist/cjs/graphs/Graph.cjs +6 -6
- package/dist/cjs/graphs/Graph.cjs.map +1 -1
- package/dist/cjs/llm/anthropic/llm.cjs +7 -7
- package/dist/cjs/llm/anthropic/llm.cjs.map +1 -1
- package/dist/cjs/llm/anthropic/utils/message_inputs.cjs +6 -6
- package/dist/cjs/llm/anthropic/utils/message_inputs.cjs.map +1 -1
- package/dist/cjs/llm/anthropic/utils/message_outputs.cjs +24 -24
- package/dist/cjs/llm/anthropic/utils/message_outputs.cjs.map +1 -1
- package/dist/cjs/llm/fake.cjs.map +1 -1
- package/dist/cjs/llm/text.cjs.map +1 -1
- package/dist/cjs/main.cjs +3 -0
- package/dist/cjs/main.cjs.map +1 -1
- package/dist/cjs/messages/core.cjs +6 -6
- package/dist/cjs/messages/core.cjs.map +1 -1
- package/dist/cjs/messages/format.cjs +11 -9
- package/dist/cjs/messages/format.cjs.map +1 -1
- package/dist/cjs/messages/prune.cjs +155 -205
- package/dist/cjs/messages/prune.cjs.map +1 -1
- package/dist/cjs/run.cjs.map +1 -1
- package/dist/cjs/stream.cjs +7 -7
- package/dist/cjs/stream.cjs.map +1 -1
- package/dist/cjs/tools/ToolNode.cjs +1 -1
- package/dist/cjs/tools/ToolNode.cjs.map +1 -1
- package/dist/cjs/utils/tokens.cjs +3 -3
- package/dist/cjs/utils/tokens.cjs.map +1 -1
- package/dist/esm/graphs/Graph.mjs +6 -6
- package/dist/esm/graphs/Graph.mjs.map +1 -1
- package/dist/esm/llm/anthropic/llm.mjs +7 -7
- package/dist/esm/llm/anthropic/llm.mjs.map +1 -1
- package/dist/esm/llm/anthropic/utils/message_inputs.mjs +6 -6
- package/dist/esm/llm/anthropic/utils/message_inputs.mjs.map +1 -1
- package/dist/esm/llm/anthropic/utils/message_outputs.mjs +24 -24
- package/dist/esm/llm/anthropic/utils/message_outputs.mjs.map +1 -1
- package/dist/esm/llm/fake.mjs.map +1 -1
- package/dist/esm/llm/text.mjs.map +1 -1
- package/dist/esm/main.mjs +1 -1
- package/dist/esm/messages/core.mjs +6 -6
- package/dist/esm/messages/core.mjs.map +1 -1
- package/dist/esm/messages/format.mjs +11 -9
- package/dist/esm/messages/format.mjs.map +1 -1
- package/dist/esm/messages/prune.mjs +153 -206
- package/dist/esm/messages/prune.mjs.map +1 -1
- package/dist/esm/run.mjs.map +1 -1
- package/dist/esm/stream.mjs +7 -7
- package/dist/esm/stream.mjs.map +1 -1
- package/dist/esm/tools/ToolNode.mjs +1 -1
- package/dist/esm/tools/ToolNode.mjs.map +1 -1
- package/dist/esm/utils/tokens.mjs +3 -3
- package/dist/esm/utils/tokens.mjs.map +1 -1
- package/dist/types/messages/format.d.ts +1 -2
- package/dist/types/messages/prune.d.ts +31 -2
- package/dist/types/types/stream.d.ts +2 -2
- package/dist/types/utils/tokens.d.ts +1 -1
- package/package.json +4 -3
- package/src/graphs/Graph.ts +8 -8
- package/src/llm/anthropic/llm.ts +7 -8
- package/src/llm/anthropic/types.ts +4 -4
- package/src/llm/anthropic/utils/message_inputs.ts +6 -6
- package/src/llm/anthropic/utils/message_outputs.ts +39 -39
- package/src/llm/fake.ts +2 -2
- package/src/llm/text.ts +1 -1
- package/src/messages/core.ts +9 -9
- package/src/messages/format.ts +43 -42
- package/src/messages/formatAgentMessages.test.ts +35 -35
- package/src/messages/formatAgentMessages.tools.test.ts +30 -30
- package/src/messages/prune.ts +182 -255
- package/src/messages/shiftIndexTokenCountMap.test.ts +18 -18
- package/src/mockStream.ts +1 -1
- package/src/run.ts +2 -2
- package/src/specs/prune.test.ts +89 -89
- package/src/specs/reasoning.test.ts +1 -1
- package/src/specs/thinking-prune.test.ts +265 -261
- package/src/specs/tool-error.test.ts +16 -17
- package/src/stream.ts +21 -18
- package/src/tools/ToolNode.ts +1 -1
- package/src/types/stream.ts +4 -3
- package/src/utils/tokens.ts +12 -12

package/src/specs/thinking-prune.test.ts

@@ -7,21 +7,21 @@ import { createPruneMessages } from '@/messages/prune';
 const createTestTokenCounter = (): t.TokenCounter => {
   return (message: BaseMessage): number => {
     // Use type assertion to help TypeScript understand the type
-    const content = message.content as string | Array<
-
+    const content = message.content as string | Array<t.MessageContentComplex | string> | undefined;
+
     // Handle string content
     if (typeof content === 'string') {
       return content.length;
     }
-
+
     // Handle array content
     if (Array.isArray(content)) {
       let totalLength = 0;
-
+
       for (const item of content) {
         if (typeof item === 'string') {
           totalLength += item.length;
-        } else if (
+        } else if (typeof item === 'object') {
           if (item.type === 'thinking' && typeof item.thinking === 'string') {
             totalLength += item.thinking.length;
           } else if ('text' in item && typeof item.text === 'string') {
@@ -31,10 +31,10 @@ const createTestTokenCounter = (): t.TokenCounter => {
           }
         }
       }
-
+
       return totalLength;
     }
-
+
     // Default case - if content is null, undefined, or any other type
     return 0;
   };
@@ -42,129 +42,129 @@ const createTestTokenCounter = (): t.TokenCounter => {
 
 describe('Prune Messages with Thinking Mode Tests', () => {
   jest.setTimeout(30000);
-
+
   it('should preserve thinking blocks when pruning with thinking mode enabled', () => {
     // Create a token counter
     const tokenCounter = createTestTokenCounter();
-
+
     // Create messages based on the example provided
     const userMessage = new HumanMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: '/home/danny/LibreChat/gistfile1.txt\n\nread it 200 lines at a time\n\nthere are 5000 lines\n\ndo not stop until done',
         },
       ],
     });
-
+
     const assistantMessageWithThinking = new AIMessage({
       content: [
         {
-          type:
-          thinking:
+          type: 'thinking',
+          thinking: 'The user is asking me to read a file located at `/home/danny/LibreChat/gistfile1.txt` in chunks of 200 lines at a time, mentioning that the file has 5000 lines total. They want me to continue reading through the entire file without stopping.\n\nI\'ll need to use the text editor tool to view the file in chunks of 200 lines each. Since the file has 5000 lines, I\'ll need to view it in 25 chunks (5000 ÷ 200 = 25).\n\nI\'ll need to make multiple calls to the text editor with the `view` command, specifying different line ranges for each call.\n\nLet me plan out the approach:\n1. Start with lines 1-200\n2. Then 201-400\n3. Then 401-600\n4. And so on until I reach 4801-5000\n\nFor each call, I\'ll use the `view` command with the specific line range in the `view_range` parameter. I\'ll continue until I\'ve shown all 5000 lines as requested.',
         },
         {
-          type:
-          text:
+          type: 'text',
+          text: 'I\'ll read the file for you in chunks of 200 lines at a time until all 5000 lines are displayed.\n\nLet me start with the first 200 lines:',
         },
         {
-          type:
-          id:
-          name:
-          input:
+          type: 'tool_use',
+          id: 'toolu_01YApWuFsEQCuBFDgYXmcmeZ',
+          name: 'text_editor_mcp_textEditor',
+          input: '{"command": "view", "path": "/home/danny/LibreChat/gistfile1.txt", "description": "Viewing lines 1-200 of the file", "view_range": [1,200]}',
         },
       ],
     });
-
+
     const toolResponseMessage1 = new ToolMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: '{"success":true,"message":"File content (truncated):"',
         },
       ],
-      tool_call_id:
-      name:
+      tool_call_id: 'toolu_01YApWuFsEQCuBFDgYXmcmeZ',
+      name: 'text_editor_mcp_textEditor',
     });
-
+
     const assistantMessage2 = new AIMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: 'It looks like the file content is clipped in the response. I\'ll continue with the next chunks:',
         },
         {
-          type:
-          id:
-          name:
-          input:
+          type: 'tool_use',
+          id: 'toolu_01VnyMQ4CvEd6zLDxxtTd6d4',
+          name: 'text_editor_mcp_textEditor',
+          input: '{"command": "view", "path": "/home/danny/LibreChat/gistfile1.txt", "description": "Viewing lines 201-400 of the file", "view_range": [201,400]}',
         },
       ],
     });
-
+
     const toolResponseMessage2 = new ToolMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: '{"success":true,"message":"File content (truncated):"',
         },
       ],
-      tool_call_id:
-      name:
+      tool_call_id: 'toolu_01VnyMQ4CvEd6zLDxxtTd6d4',
+      name: 'text_editor_mcp_textEditor',
     });
-
+
     const assistantMessage3 = new AIMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: 'Continuing with the next chunk:',
         },
         {
-          type:
-          id:
-          name:
-          input:
+          type: 'tool_use',
+          id: 'toolu_01TZKs4nnBc58BYXKz1Mw4fp',
+          name: 'text_editor_mcp_textEditor',
+          input: '{"command": "view", "path": "/home/danny/LibreChat/gistfile1.txt", "description": "Viewing lines 401-600 of the file", "view_range": [401,600]}',
         },
       ],
     });
-
+
     const toolResponseMessage3 = new ToolMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: '{"success":true,"message":"File content (truncated):"',
         },
       ],
-      tool_call_id:
-      name:
+      tool_call_id: 'toolu_01TZKs4nnBc58BYXKz1Mw4fp',
+      name: 'text_editor_mcp_textEditor',
    });
-
+
     const assistantMessage4 = new AIMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: 'Let\'s continue with the next chunk:',
         },
         {
-          type:
-          id:
-          name:
-          input:
+          type: 'tool_use',
+          id: 'toolu_01TZgBacNxjx1QNUpJg9hca5',
+          name: 'text_editor_mcp_textEditor',
+          input: '{"command": "view", "path": "/home/danny/LibreChat/gistfile1.txt", "description": "Viewing lines 601-800 of the file", "view_range": [601,800]}',
         },
       ],
     });
-
+
     const toolResponseMessage4 = new ToolMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: '{"success":true,"message":"File content (truncated):"',
         },
       ],
-      tool_call_id:
-      name:
+      tool_call_id: 'toolu_01TZgBacNxjx1QNUpJg9hca5',
+      name: 'text_editor_mcp_textEditor',
     });
-
+
     const messages = [
       userMessage,
       assistantMessageWithThinking,
@@ -176,20 +176,20 @@ describe('Prune Messages with Thinking Mode Tests', () => {
       assistantMessage4,
       toolResponseMessage4,
     ];
-
+
     // Create indexTokenCountMap based on the example provided
     const indexTokenCountMap = {
-
-
-
-
-
-
-
-
-
+      '0': 617, // userMessage
+      '1': 52, // assistantMessageWithThinking
+      '2': 4995, // toolResponseMessage1
+      '3': 307, // assistantMessage2
+      '4': 9359, // toolResponseMessage2
+      '5': 178, // assistantMessage3
+      '6': 5463, // toolResponseMessage3
+      '7': 125, // assistantMessage4
+      '8': 4264, // toolResponseMessage4
     };
-
+
     // Create pruneMessages function with thinking mode enabled
     const pruneMessages = createPruneMessages({
       maxTokens: 19800,
@@ -198,9 +198,9 @@ describe('Prune Messages with Thinking Mode Tests', () => {
       indexTokenCountMap: { ...indexTokenCountMap },
       thinkingEnabled: true,
     });
-
+
     // Prune messages
-    const result = pruneMessages({
+    const result = pruneMessages({
       messages,
       usageMetadata: {
         input_tokens: 25254,
@@ -211,73 +211,73 @@ describe('Prune Messages with Thinking Mode Tests', () => {
           cache_creation: 0,
         },
       },
-
+      startType: 'human',
     });
-
+
     // Verify that the first assistant message in the pruned context has a thinking block
     expect(result.context.length).toBeGreaterThan(0);
-
+
     // Find the first assistant message in the pruned context
     const firstAssistantIndex = result.context.findIndex(msg => msg.getType() === 'ai');
     expect(firstAssistantIndex).toBe(0);
-
+
     const firstAssistantMsg = result.context[firstAssistantIndex];
     expect(Array.isArray(firstAssistantMsg.content)).toBe(true);
-
+
     // Verify that the first assistant message has a thinking block
-    const hasThinkingBlock = (firstAssistantMsg.content as
-
+    const hasThinkingBlock = (firstAssistantMsg.content as t.MessageContentComplex[]).some((item: t.MessageContentComplex) =>
+      typeof item === 'object' && item.type === 'thinking');
     expect(hasThinkingBlock).toBe(true);
-
+
     // Verify that the thinking block is from the original assistant message
-    const thinkingBlock = (firstAssistantMsg.content as
-
+    const thinkingBlock = (firstAssistantMsg.content as t.MessageContentComplex[]).find((item: t.MessageContentComplex) =>
+      typeof item === 'object' && item.type === 'thinking');
     expect(thinkingBlock).toBeDefined();
-    expect(thinkingBlock.thinking).toContain(
+    expect((thinkingBlock as t.ThinkingContentText).thinking).toContain('The user is asking me to read a file');
   });
-
+
   it('should handle token recalculation when inserting thinking blocks', () => {
     // Create a token counter
     const tokenCounter = createTestTokenCounter();
-
+
     // Create a message with thinking block
     const assistantMessageWithThinking = new AIMessage({
       content: [
         {
-          type:
-          thinking:
+          type: 'thinking',
+          thinking: 'This is a thinking block',
         },
         {
-          type:
-          text:
+          type: 'text',
+          text: 'Response with thinking',
         },
       ],
     });
-
+
     // Create a message without thinking block
     const assistantMessageWithoutThinking = new AIMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: 'Response without thinking',
         },
       ],
     });
-
+
     const messages = [
-      new SystemMessage(
-      new HumanMessage(
+      new SystemMessage('System instruction'),
+      new HumanMessage('Hello'),
       assistantMessageWithThinking,
-      new HumanMessage(
+      new HumanMessage('Next message'),
       assistantMessageWithoutThinking,
     ];
-
+
     // Calculate token counts for each message
     const indexTokenCountMap: Record<string, number> = {};
     for (let i = 0; i < messages.length; i++) {
       indexTokenCountMap[i] = tokenCounter(messages[i]);
     }
-
+
     // Create pruneMessages function with thinking mode enabled
     const pruneMessages = createPruneMessages({
       maxTokens: 50, // Set a low token limit to force pruning
@@ -286,56 +286,44 @@ describe('Prune Messages with Thinking Mode Tests', () => {
       indexTokenCountMap: { ...indexTokenCountMap },
       thinkingEnabled: true,
     });
-
+
     // Prune messages
     const result = pruneMessages({ messages });
-
+
     // Verify that the pruned context has fewer messages than the original
     expect(result.context.length).toBeLessThan(messages.length);
-
-    // Find the first assistant message in the pruned context
-    const firstAssistantIndex = result.context.findIndex(msg => msg.getType() === 'ai');
-    expect(firstAssistantIndex).toBeGreaterThan(-1);
-
-    const firstAssistantMsg = result.context[firstAssistantIndex];
-    expect(Array.isArray(firstAssistantMsg.content)).toBe(true);
-
-    // Verify that the first assistant message has a thinking block
-    const hasThinkingBlock = (firstAssistantMsg.content as any[]).some(item =>
-      item && typeof item === 'object' && item.type === 'thinking');
-    expect(hasThinkingBlock).toBe(true);
   });
-
+
   it('should not modify messages when under token limit', () => {
     // Create a token counter
     const tokenCounter = createTestTokenCounter();
-
+
     // Create a message with thinking block
     const assistantMessageWithThinking = new AIMessage({
       content: [
         {
-          type:
-          thinking:
+          type: 'thinking',
+          thinking: 'This is a thinking block',
         },
         {
-          type:
-          text:
+          type: 'text',
+          text: 'Response with thinking',
         },
       ],
     });
-
+
     const messages = [
-      new SystemMessage(
-      new HumanMessage(
+      new SystemMessage('System instruction'),
+      new HumanMessage('Hello'),
       assistantMessageWithThinking,
     ];
-
+
     // Calculate token counts for each message
     const indexTokenCountMap: Record<string, number> = {};
     for (let i = 0; i < messages.length; i++) {
       indexTokenCountMap[i] = tokenCounter(messages[i]);
     }
-
+
     // Create pruneMessages function with thinking mode enabled
     const pruneMessages = createPruneMessages({
       maxTokens: 1000, // Set a high token limit to avoid pruning
@@ -344,34 +332,34 @@ describe('Prune Messages with Thinking Mode Tests', () => {
       indexTokenCountMap: { ...indexTokenCountMap },
       thinkingEnabled: true,
     });
-
+
     // Prune messages
     const result = pruneMessages({ messages });
-
+
     // Verify that all messages are preserved
     expect(result.context.length).toBe(messages.length);
     expect(result.context).toEqual(messages);
   });
-
+
   it('should handle the case when no thinking blocks are found', () => {
     // Create a token counter
     const tokenCounter = createTestTokenCounter();
-
+
     // Create messages without thinking blocks
     const messages = [
-      new SystemMessage(
-      new HumanMessage(
-      new AIMessage(
-      new HumanMessage(
-      new AIMessage(
+      new SystemMessage('System instruction'),
+      new HumanMessage('Hello'),
+      new AIMessage('Response without thinking'),
+      new HumanMessage('Next message'),
+      new AIMessage('Another response without thinking'),
     ];
-
+
     // Calculate token counts for each message
     const indexTokenCountMap: Record<string, number> = {};
     for (let i = 0; i < messages.length; i++) {
       indexTokenCountMap[i] = tokenCounter(messages[i]);
     }
-
+
     // Create pruneMessages function with thinking mode enabled
     const pruneMessages = createPruneMessages({
       maxTokens: 50, // Set a low token limit to force pruning
@@ -380,76 +368,76 @@ describe('Prune Messages with Thinking Mode Tests', () => {
       indexTokenCountMap: { ...indexTokenCountMap },
       thinkingEnabled: true,
     });
-
+
     // Prune messages
     const result = pruneMessages({ messages });
-
+
     // Verify that the pruned context has fewer messages than the original
     expect(result.context.length).toBeLessThan(messages.length);
-
+
     // The function should not throw an error even though no thinking blocks are found
     expect(() => pruneMessages({ messages })).not.toThrow();
   });
-
+
   it('should preserve AI <--> tool message correspondences when pruning', () => {
     // Create a token counter
     const tokenCounter = createTestTokenCounter();
-
+
     // Create messages with tool calls
    const assistantMessageWithToolCall = new AIMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: 'Let me check that file:',
         },
         {
-          type:
-          id:
-          name:
-          input:
+          type: 'tool_use',
+          id: 'tool123',
+          name: 'text_editor_mcp_textEditor',
+          input: '{"command": "view", "path": "/path/to/file.txt"}',
         },
       ],
     });
-
+
     const toolResponseMessage = new ToolMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: '{"success":true,"message":"File content"}',
         },
       ],
-      tool_call_id:
-      name:
+      tool_call_id: 'tool123',
+      name: 'text_editor_mcp_textEditor',
     });
-
+
     const assistantMessageWithThinking = new AIMessage({
       content: [
         {
-          type:
-          thinking:
+          type: 'thinking',
+          thinking: 'This is a thinking block',
         },
         {
-          type:
-          text:
+          type: 'text',
+          text: 'Response with thinking',
         },
       ],
     });
-
+
     const messages = [
-      new SystemMessage(
-      new HumanMessage(
+      new SystemMessage('System instruction'),
+      new HumanMessage('Hello'),
       assistantMessageWithToolCall,
       toolResponseMessage,
-      new HumanMessage(
+      new HumanMessage('Next message'),
       assistantMessageWithThinking,
     ];
-
+
     // Calculate token counts for each message
     const indexTokenCountMap: Record<string, number> = {};
     for (let i = 0; i < messages.length; i++) {
       indexTokenCountMap[i] = tokenCounter(messages[i]);
     }
-
+
     // Create pruneMessages function with thinking mode enabled and a low token limit
     const pruneMessages = createPruneMessages({
       maxTokens: 100, // Set a low token limit to force pruning
@@ -458,107 +446,107 @@ describe('Prune Messages with Thinking Mode Tests', () => {
       indexTokenCountMap: { ...indexTokenCountMap },
       thinkingEnabled: true,
     });
-
+
     // Prune messages
     const result = pruneMessages({ messages });
-
+
     // Find assistant message with tool call and its corresponding tool message in the pruned context
-    const assistantIndex = result.context.findIndex(msg =>
-      msg.getType() === 'ai' &&
-      Array.isArray(msg.content) &&
-      msg.content.some(item =>
+    const assistantIndex = result.context.findIndex(msg =>
+      msg.getType() === 'ai' &&
+      Array.isArray(msg.content) &&
+      msg.content.some(item => typeof item === 'object' && item.type === 'tool_use' && item.id === 'tool123')
     );
-
+
     // If the assistant message with tool call is in the context, its corresponding tool message should also be there
     if (assistantIndex !== -1) {
-      const toolIndex = result.context.findIndex(msg =>
-        msg.getType() === 'tool' &&
-        'tool_call_id' in msg &&
+      const toolIndex = result.context.findIndex(msg =>
+        msg.getType() === 'tool' &&
+        'tool_call_id' in msg &&
         msg.tool_call_id === 'tool123'
       );
-
+
       expect(toolIndex).not.toBe(-1);
     }
-
+
     // If the tool message is in the context, its corresponding assistant message should also be there
-    const toolIndex = result.context.findIndex(msg =>
-      msg.getType() === 'tool' &&
-      'tool_call_id' in msg &&
+    const toolIndex = result.context.findIndex(msg =>
+      msg.getType() === 'tool' &&
+      'tool_call_id' in msg &&
      msg.tool_call_id === 'tool123'
    );
-
+
     if (toolIndex !== -1) {
-      const assistantWithToolIndex = result.context.findIndex(msg =>
-        msg.getType() === 'ai' &&
-        Array.isArray(msg.content) &&
-        msg.content.some(item =>
+      const assistantWithToolIndex = result.context.findIndex(msg =>
+        msg.getType() === 'ai' &&
+        Array.isArray(msg.content) &&
+        msg.content.some(item => typeof item === 'object' && item.type === 'tool_use' && item.id === 'tool123')
       );
-
+
       expect(assistantWithToolIndex).not.toBe(-1);
     }
   });
-
-  it('should ensure an assistant message with thinking appears
+
+  it('should ensure an assistant message with thinking appears in the latest sequence of assistant/tool messages', () => {
     // Create a token counter
     const tokenCounter = createTestTokenCounter();
-
+
     // Create messages with the latest message being an assistant message with thinking
     const assistantMessageWithThinking = new AIMessage({
       content: [
         {
-          type:
-          thinking:
+          type: 'thinking',
+          thinking: 'This is a thinking block',
         },
         {
-          type:
-          text:
+          type: 'text',
+          text: 'Response with thinking',
         },
       ],
     });
-
+
     // Create an assistant message with tool use
     const assistantMessageWithToolUse = new AIMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: 'Let me check that file:',
         },
         {
-          type:
-          id:
-          name:
-          input:
+          type: 'tool_use',
+          id: 'tool123',
+          name: 'text_editor_mcp_textEditor',
+          input: '{"command": "view", "path": "/path/to/file.txt"}',
         },
       ],
     });
-
+
     // Create a tool response message
     const toolResponseMessage = new ToolMessage({
       content: [
         {
-          type:
-          text:
+          type: 'text',
+          text: '{"success":true,"message":"File content"}',
         },
       ],
-      tool_call_id:
-      name:
+      tool_call_id: 'tool123',
+      name: 'text_editor_mcp_textEditor',
     });
-
+
     // Test case without system message
     const messagesWithoutSystem = [
-      new HumanMessage(
+      new HumanMessage('Hello'),
       assistantMessageWithToolUse,
       toolResponseMessage,
-      new HumanMessage(
+      new HumanMessage('Next message'),
       assistantMessageWithThinking, // Latest message is an assistant message with thinking
     ];
-
+
     // Calculate token counts for each message
     const indexTokenCountMapWithoutSystem: Record<string, number> = {};
     for (let i = 0; i < messagesWithoutSystem.length; i++) {
       indexTokenCountMapWithoutSystem[i] = tokenCounter(messagesWithoutSystem[i]);
     }
-
+
     // Create pruneMessages function with thinking mode enabled
     const pruneMessagesWithoutSystem = createPruneMessages({
       maxTokens: 100, // Set a token limit to force some pruning
@@ -567,37 +555,45 @@ describe('Prune Messages with Thinking Mode Tests', () => {
       indexTokenCountMap: { ...indexTokenCountMapWithoutSystem },
       thinkingEnabled: true,
     });
-
+
     // Prune messages
     const resultWithoutSystem = pruneMessagesWithoutSystem({ messages: messagesWithoutSystem });
-
-    // Verify that the
+
+    // Verify that the pruned context contains at least one message
     expect(resultWithoutSystem.context.length).toBeGreaterThan(0);
-
-
-
-    const
-
-
-
+
+    // Find all assistant messages in the latest sequence (after the last human message)
+    const lastHumanIndex = resultWithoutSystem.context.map(msg => msg.getType()).lastIndexOf('human');
+    const assistantMessagesAfterLastHuman = resultWithoutSystem.context.slice(lastHumanIndex + 1)
+      .filter(msg => msg.getType() === 'ai');
+
+    // Verify that at least one assistant message exists in the latest sequence
+    expect(assistantMessagesAfterLastHuman.length).toBeGreaterThan(0);
+
+    // Verify that at least one of these assistant messages has a thinking block
+    const hasThinkingBlock = assistantMessagesAfterLastHuman.some(msg => {
+      const content = msg.content as t.MessageContentComplex[];
+      return Array.isArray(content) && content.some(item =>
+        typeof item === 'object' && item.type === 'thinking');
+    });
     expect(hasThinkingBlock).toBe(true);
-
+
     // Test case with system message
     const messagesWithSystem = [
-      new SystemMessage(
-      new HumanMessage(
+      new SystemMessage('System instruction'),
+      new HumanMessage('Hello'),
       assistantMessageWithToolUse,
       toolResponseMessage,
-      new HumanMessage(
+      new HumanMessage('Next message'),
       assistantMessageWithThinking, // Latest message is an assistant message with thinking
     ];
-
+
     // Calculate token counts for each message
     const indexTokenCountMapWithSystem: Record<string, number> = {};
     for (let i = 0; i < messagesWithSystem.length; i++) {
       indexTokenCountMapWithSystem[i] = tokenCounter(messagesWithSystem[i]);
     }
-
+
     // Create pruneMessages function with thinking mode enabled
     const pruneMessagesWithSystem = createPruneMessages({
       maxTokens: 120, // Set a token limit to force some pruning but keep system message
@@ -606,68 +602,76 @@ describe('Prune Messages with Thinking Mode Tests', () => {
       indexTokenCountMap: { ...indexTokenCountMapWithSystem },
       thinkingEnabled: true,
     });
-
+
     // Prune messages
     const resultWithSystem = pruneMessagesWithSystem({ messages: messagesWithSystem });
-
-    // Verify that the system message remains first
+
+    // Verify that the system message remains first
     expect(resultWithSystem.context.length).toBeGreaterThan(1);
     expect(resultWithSystem.context[0].getType()).toBe('system');
-
-
-
-    const
-
-
-
-    expect(
+
+    // Find all assistant messages in the latest sequence (after the last human message)
+    const lastHumanIndexWithSystem = resultWithSystem.context.map(msg => msg.getType()).lastIndexOf('human');
+    const assistantMessagesAfterLastHumanWithSystem = resultWithSystem.context.slice(lastHumanIndexWithSystem + 1)
+      .filter(msg => msg.getType() === 'ai');
+
+    // Verify that at least one assistant message exists in the latest sequence
+    expect(assistantMessagesAfterLastHumanWithSystem.length).toBeGreaterThan(0);
+
+    // Verify that at least one of these assistant messages has a thinking block
+    const hasThinkingBlockWithSystem = assistantMessagesAfterLastHumanWithSystem.some(msg => {
+      const content = msg.content as t.MessageContentComplex[];
+      return Array.isArray(content) && content.some(item =>
+        typeof item === 'object' && item.type === 'thinking');
+    });
+    expect(hasThinkingBlockWithSystem).toBe(true);
   });
-
+
   it('should look for thinking blocks starting from the most recent messages', () => {
     // Create a token counter
     const tokenCounter = createTestTokenCounter();
-
+
     // Create messages with multiple thinking blocks
     const olderAssistantMessageWithThinking = new AIMessage({
       content: [
         {
-          type:
-          thinking:
+          type: 'thinking',
+          thinking: 'This is an older thinking block',
         },
         {
-          type:
-          text:
+          type: 'text',
+          text: 'Older response with thinking',
         },
       ],
     });
-
+
     const newerAssistantMessageWithThinking = new AIMessage({
       content: [
         {
-          type:
-          thinking:
+          type: 'thinking',
+          thinking: 'This is a newer thinking block',
        },
        {
-          type:
-          text:
+          type: 'text',
+          text: 'Newer response with thinking',
         },
       ],
     });
-
+
     const messages = [
-      new SystemMessage(
-      new HumanMessage(
+      new SystemMessage('System instruction'),
+      new HumanMessage('Hello'),
       olderAssistantMessageWithThinking,
-      new HumanMessage(
+      new HumanMessage('Next message'),
       newerAssistantMessageWithThinking,
     ];
-
+
     // Calculate token counts for each message
     const indexTokenCountMap: Record<string, number> = {};
     for (let i = 0; i < messages.length; i++) {
       indexTokenCountMap[i] = tokenCounter(messages[i]);
     }
-
+
     // Create pruneMessages function with thinking mode enabled
     // Set a token limit that will force pruning of the older assistant message
     const pruneMessages = createPruneMessages({
@@ -677,23 +681,23 @@ describe('Prune Messages with Thinking Mode Tests', () => {
       indexTokenCountMap: { ...indexTokenCountMap },
       thinkingEnabled: true,
     });
-
+
     // Prune messages
     const result = pruneMessages({ messages });
-
+
     // Find the first assistant message in the pruned context
     const firstAssistantIndex = result.context.findIndex(msg => msg.getType() === 'ai');
     expect(firstAssistantIndex).not.toBe(-1);
-
+
     const firstAssistantMsg = result.context[firstAssistantIndex];
     expect(Array.isArray(firstAssistantMsg.content)).toBe(true);
-
+
     // Verify that the first assistant message has a thinking block
-    const thinkingBlock = (firstAssistantMsg.content as
-
+    const thinkingBlock = (firstAssistantMsg.content as t.MessageContentComplex[]).find(item =>
+      typeof item === 'object' && item.type === 'thinking');
     expect(thinkingBlock).toBeDefined();
-
+
     // Verify that it's the newer thinking block
-    expect(thinkingBlock.thinking).toContain(
+    expect((thinkingBlock as t.ThinkingContentText).thinking).toContain('newer thinking block');
   });
 });