npm - @librechat/agents - Versions diffs - 3.1.97 → 3.1.99 - Mend

@librechat/agents 3.1.97 → 3.1.99

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (49)

package/dist/cjs/graphs/Graph.cjs +6 -0
package/dist/cjs/graphs/Graph.cjs.map +1 -1
package/dist/cjs/langfuseToolOutputTracing.cjs +16 -5
package/dist/cjs/langfuseToolOutputTracing.cjs.map +1 -1
package/dist/cjs/llm/bedrock/index.cjs +10 -0
package/dist/cjs/llm/bedrock/index.cjs.map +1 -1
package/dist/cjs/llm/bedrock/toolCache.cjs +125 -0
package/dist/cjs/llm/bedrock/toolCache.cjs.map +1 -0
package/dist/cjs/messages/cache.cjs +17 -9
package/dist/cjs/messages/cache.cjs.map +1 -1
package/dist/cjs/messages/prune.cjs +45 -8
package/dist/cjs/messages/prune.cjs.map +1 -1
package/dist/cjs/tools/ToolNode.cjs +6 -1
package/dist/cjs/tools/ToolNode.cjs.map +1 -1
package/dist/esm/graphs/Graph.mjs +6 -0
package/dist/esm/graphs/Graph.mjs.map +1 -1
package/dist/esm/langfuseToolOutputTracing.mjs +16 -5
package/dist/esm/langfuseToolOutputTracing.mjs.map +1 -1
package/dist/esm/llm/bedrock/index.mjs +10 -0
package/dist/esm/llm/bedrock/index.mjs.map +1 -1
package/dist/esm/llm/bedrock/toolCache.mjs +122 -0
package/dist/esm/llm/bedrock/toolCache.mjs.map +1 -0
package/dist/esm/messages/cache.mjs +17 -9
package/dist/esm/messages/cache.mjs.map +1 -1
package/dist/esm/messages/prune.mjs +45 -8
package/dist/esm/messages/prune.mjs.map +1 -1
package/dist/esm/tools/ToolNode.mjs +6 -1
package/dist/esm/tools/ToolNode.mjs.map +1 -1
package/dist/types/llm/bedrock/index.d.ts +16 -0
package/dist/types/llm/bedrock/toolCache.d.ts +4 -0
package/dist/types/messages/cache.d.ts +2 -2
package/dist/types/types/llm.d.ts +2 -2
package/package.json +1 -1
package/src/agents/__tests__/AgentContext.anthropic.live.test.ts +332 -0
package/src/agents/__tests__/AgentContext.bedrock.live.test.ts +504 -0
package/src/graphs/Graph.ts +14 -0
package/src/langfuseToolOutputTracing.ts +26 -7
package/src/llm/bedrock/index.ts +32 -1
package/src/llm/bedrock/llm.spec.ts +154 -1
package/src/llm/bedrock/toolCache.test.ts +131 -0
package/src/llm/bedrock/toolCache.ts +191 -0
package/src/messages/cache.test.ts +97 -38
package/src/messages/cache.ts +18 -10
package/src/messages/prune.ts +55 -17
package/src/specs/langfuse-tool-output-tracing.test.ts +28 -0
package/src/specs/prune.test.ts +193 -0
package/src/tools/ToolNode.ts +7 -1
package/src/tools/__tests__/ToolNode.langfuse.test.ts +6 -0
package/src/types/llm.ts +2 -2

package/src/messages/cache.test.ts CHANGED Viewed

@@ -287,23 +287,28 @@ type TestMsg = {
 };
 describe('addBedrockCacheControl (Bedrock cache checkpoints)', () => {
-  it('returns input when not enough messages', () => {
+  it('returns empty input unchanged and caches a single user message', () => {
     const empty: TestMsg[] = [];
     expect(addBedrockCacheControl(empty)).toEqual(empty);
     const single: TestMsg[] = [{ role: 'user', content: 'only' }];
-    expect(addBedrockCacheControl(single)).toEqual(single);
+    expect(addBedrockCacheControl(single)[0].content).toEqual([
+      { type: ContentTypes.TEXT, text: 'only' },
+      { cachePoint: { type: 'default' } },
+    ]);
   });
-  it('wraps string content and appends separate cachePoint block', () => {
+  it('wraps latest user string content and appends separate cachePoint block', () => {
     const messages: TestMsg[] = [
       { role: 'user', content: 'Hello' },
       { role: 'assistant', content: [{ type: ContentTypes.TEXT, text: 'Hi' }] },
     ];
     const result = addBedrockCacheControl(messages);
-    const last = result[1].content as MessageContentComplex[];
-    expect(Array.isArray(last)).toBe(true);
-    expect(last[0]).toEqual({ type: ContentTypes.TEXT, text: 'Hi' });
-    expect(last[1]).toEqual({ cachePoint: { type: 'default' } });
+    const user = result[0].content as MessageContentComplex[];
+    const assistant = result[1].content as MessageContentComplex[];
+    expect(Array.isArray(user)).toBe(true);
+    expect(user[0]).toEqual({ type: ContentTypes.TEXT, text: 'Hello' });
+    expect(user[1]).toEqual({ cachePoint: { type: 'default' } });
+    expect(assistant).toEqual([{ type: ContentTypes.TEXT, text: 'Hi' }]);
   });
   it('inserts cachePoint after the last text when multiple text blocks exist', () => {
@@ -345,20 +350,21 @@ describe('addBedrockCacheControl (Bedrock cache checkpoints)', () => {
     expect(second[0]).toEqual({ type: ContentTypes.TEXT, text: 'Reply A' });
     expect(second[1]).toEqual({ type: ContentTypes.TEXT, text: 'Reply B' });
-    expect(second[2]).toEqual({ cachePoint: { type: 'default' } });
+    expect(second).toHaveLength(2);
   });
-  it('skips adding cachePoint when content is an empty array', () => {
+  it('skips empty arrays and caches the latest non-empty user message', () => {
     const messages: TestMsg[] = [
       { role: 'user', content: [] },
       { role: 'assistant', content: [] },
-      { role: 'user', content: 'ignored because only last two are modified' },
+      { role: 'user', content: 'latest cacheable user message' },
     ];
     const result = addBedrockCacheControl(messages);
     const first = result[0].content as MessageContentComplex[];
     const second = result[1].content as MessageContentComplex[];
+    const third = result[2].content as MessageContentComplex[];
     expect(Array.isArray(first)).toBe(true);
     expect(first.length).toBe(0);
@@ -366,39 +372,51 @@ describe('addBedrockCacheControl (Bedrock cache checkpoints)', () => {
     expect(Array.isArray(second)).toBe(true);
     expect(second.length).toBe(0);
     expect(second[0]).not.toEqual({ cachePoint: { type: 'default' } });
+    expect(third).toEqual([
+      { type: ContentTypes.TEXT, text: 'latest cacheable user message' },
+      { cachePoint: { type: 'default' } },
+    ]);
   });
-  it('skips adding cachePoint when content is an empty string', () => {
+  it('skips empty strings and caches the latest non-empty user message', () => {
     const messages: TestMsg[] = [
       { role: 'user', content: '' },
       { role: 'assistant', content: '' },
-      { role: 'user', content: 'ignored because only last two are modified' },
+      { role: 'user', content: 'latest cacheable user message' },
     ];
     const result = addBedrockCacheControl(messages);
     expect(result[0].content).toBe('');
     expect(result[1].content).toBe('');
+    expect(result[2].content).toEqual([
+      { type: ContentTypes.TEXT, text: 'latest cacheable user message' },
+      { cachePoint: { type: 'default' } },
+    ]);
   });
   /** (I don't think this will ever occur in actual use, but it's the only branch left uncovered, so I'm covering it.) */
-  it('skips messages with non-string, non-array content and still modifies the previous to reach two edits', () => {
+  it('skips messages with non-string, non-array content', () => {
     const messages: TestMsg[] = [
       {
         role: 'user',
-        content: [{ type: ContentTypes.TEXT, text: 'Will be modified' }],
+        content: [{ type: ContentTypes.TEXT, text: 'Older user message' }],
       },
       { role: 'assistant', content: undefined },
       {
         role: 'user',
-        content: [{ type: ContentTypes.TEXT, text: 'Also modified' }],
+        content: [{ type: ContentTypes.TEXT, text: 'Latest user message' }],
       },
     ];
     const result = addBedrockCacheControl(messages);
     const last = result[2].content as MessageContentComplex[];
-    expect(last[0]).toEqual({ type: ContentTypes.TEXT, text: 'Also modified' });
+    expect(last[0]).toEqual({
+      type: ContentTypes.TEXT,
+      text: 'Latest user message',
+    });
     expect(last[1]).toEqual({ cachePoint: { type: 'default' } });
     expect(result[1].content).toBeUndefined();
@@ -406,7 +424,7 @@ describe('addBedrockCacheControl (Bedrock cache checkpoints)', () => {
     const first = result[0].content as MessageContentComplex[];
     expect(first[0]).toEqual({
       type: ContentTypes.TEXT,
-      text: 'Will be modified',
+      text: 'Older user message',
     });
     expect(first[1]).toEqual({ cachePoint: { type: 'default' } });
   });
@@ -511,7 +529,7 @@ describe('addBedrockCacheControl (Bedrock cache checkpoints)', () => {
     expect(systemContent[2]).toHaveProperty('cache_control');
   });
-  it('skips serialized system messages while adding cache points to non-system turns', () => {
+  it('skips serialized system messages while adding a cache point to the latest user turn', () => {
     const messages: TestMsg[] = [
       {
         role: 'system',
@@ -575,7 +593,7 @@ describe('addBedrockCacheControl (Bedrock cache checkpoints)', () => {
       type: ContentTypes.TEXT,
       text: 'Sure! The capital of France is Paris.',
     });
-    expect(assistant[1]).toEqual({ cachePoint: { type: 'default' } });
+    expect(assistant).toHaveLength(1);
   });
   it('is idempotent - calling multiple times does not add duplicate cache points', () => {
@@ -601,12 +619,11 @@ describe('addBedrockCacheControl (Bedrock cache checkpoints)', () => {
     });
     expect(firstContent[1]).toEqual({ cachePoint: { type: 'default' } });
-    expect(secondContent.length).toBe(2);
+    expect(secondContent.length).toBe(1);
     expect(secondContent[0]).toEqual({
       type: ContentTypes.TEXT,
       text: 'First response',
     });
-    expect(secondContent[1]).toEqual({ cachePoint: { type: 'default' } });
     const result2 = addBedrockCacheControl(result1);
     const firstContentAfter = result2[0].content as MessageContentComplex[];
@@ -619,15 +636,14 @@ describe('addBedrockCacheControl (Bedrock cache checkpoints)', () => {
     });
     expect(firstContentAfter[1]).toEqual({ cachePoint: { type: 'default' } });
-    expect(secondContentAfter.length).toBe(2);
+    expect(secondContentAfter.length).toBe(1);
     expect(secondContentAfter[0]).toEqual({
       type: ContentTypes.TEXT,
       text: 'First response',
     });
-    expect(secondContentAfter[1]).toEqual({ cachePoint: { type: 'default' } });
   });
-  it('skips messages that already have cache points in multi-agent scenarios', () => {
+  it('strips stale cache points and caches the latest user messages in multi-agent scenarios', () => {
     const messages: TestMsg[] = [
       {
         role: 'user',
@@ -647,9 +663,17 @@ describe('addBedrockCacheControl (Bedrock cache checkpoints)', () => {
     ];
     const result = addBedrockCacheControl(messages);
+    const firstContent = result[0].content as MessageContentComplex[];
     const lastContent = result[2].content as MessageContentComplex[];
     const secondLastContent = result[1].content as MessageContentComplex[];
+    expect(firstContent.length).toBe(2);
+    expect(firstContent[0]).toEqual({
+      type: ContentTypes.TEXT,
+      text: 'Hello',
+    });
+    expect(firstContent[1]).toEqual({ cachePoint: { type: 'default' } });
     expect(lastContent.length).toBe(2);
     expect(lastContent[0]).toEqual({
       type: ContentTypes.TEXT,
@@ -657,12 +681,11 @@ describe('addBedrockCacheControl (Bedrock cache checkpoints)', () => {
     });
     expect(lastContent[1]).toEqual({ cachePoint: { type: 'default' } });
-    expect(secondLastContent.length).toBe(2);
+    expect(secondLastContent.length).toBe(1);
     expect(secondLastContent[0]).toEqual({
       type: ContentTypes.TEXT,
       text: 'Response from agent 1',
     });
-    expect(secondLastContent[1]).toEqual({ cachePoint: { type: 'default' } });
   });
   it('skips cachePoint on AI messages with only whitespace text and reasoning (tool-call scenario)', () => {
@@ -705,6 +728,42 @@ describe('addBedrockCacheControl (Bedrock cache checkpoints)', () => {
       cachePoint: { type: 'default' },
     });
   });
+  it('keeps cachePoint on the stable user boundary through tool loops', () => {
+    const messages: BaseMessage[] = [
+      new HumanMessage('Use the stable prompt context.'),
+      new AIMessage({
+        content: 'I will call the first tool.',
+        tool_calls: [{ id: 'call_1', name: 'lookup', args: { step: 1 } }],
+      }),
+      new ToolMessage({
+        content: 'volatile tool result 1',
+        tool_call_id: 'call_1',
+      }),
+      new AIMessage({
+        content: 'I will call the second tool.',
+        tool_calls: [{ id: 'call_2', name: 'lookup', args: { step: 2 } }],
+      }),
+      new ToolMessage({
+        content: 'volatile tool result 2',
+        tool_call_id: 'call_2',
+      }),
+    ];
+    const result = addBedrockCacheControl(messages);
+    const userContent = result[0].content as MessageContentComplex[];
+    expect(userContent[userContent.length - 1]).toEqual({
+      cachePoint: { type: 'default' },
+    });
+    for (const message of result.slice(1)) {
+      const content = message.content;
+      expect(
+        Array.isArray(content) && content.some((block) => 'cachePoint' in block)
+      ).toBe(false);
+    }
+  });
 });
 describe('stripAnthropicCacheControl', () => {
@@ -947,7 +1006,7 @@ describe('Multi-agent provider interoperability', () => {
     expect('cache_control' in secondContent[0]).toBe(false);
     expect(firstContent.some((b) => 'cachePoint' in b)).toBe(true);
-    expect(secondContent.some((b) => 'cachePoint' in b)).toBe(true);
+    expect(secondContent.some((b) => 'cachePoint' in b)).toBe(false);
   });
   it('strips Bedrock cache using separate function (backwards compat)', () => {
@@ -1142,7 +1201,7 @@ describe('Immutability - addBedrockCacheControl does not mutate original message
     expect(typeof originalMessages[1].content).toBe('string');
     expect(Array.isArray(result[0].content)).toBe(true);
-    expect(Array.isArray(result[1].content)).toBe(true);
+    expect(result[1].content).toBe('Hi there');
   });
   it('should not mutate original messages when adding cache points to array content', () => {
@@ -1178,9 +1237,9 @@ describe('Immutability - addBedrockCacheControl does not mutate original message
     const resultFirstContent = result[0].content as MessageContentComplex[];
     const resultSecondContent = result[1].content as MessageContentComplex[];
     expect(resultFirstContent.length).toBe(originalFirstContentLength + 1);
-    expect(resultSecondContent.length).toBe(originalSecondContentLength + 1);
+    expect(resultSecondContent.length).toBe(originalSecondContentLength);
     expect(resultFirstContent.some((b) => 'cachePoint' in b)).toBe(true);
-    expect(resultSecondContent.some((b) => 'cachePoint' in b)).toBe(true);
+    expect(resultSecondContent.some((b) => 'cachePoint' in b)).toBe(false);
   });
   it('should not mutate original messages when stripping existing cache control', () => {
@@ -1339,13 +1398,13 @@ describe('Multi-turn cache cleanup', () => {
     const lastContent = result[3].content as MessageContentComplex[];
     const secondLastContent = result[2].content as MessageContentComplex[];
-    expect(lastContent.some((b) => 'cachePoint' in b)).toBe(true);
+    expect(lastContent.some((b) => 'cachePoint' in b)).toBe(false);
     expect(secondLastContent.some((b) => 'cachePoint' in b)).toBe(true);
     const firstContent = result[0].content as MessageContentComplex[];
     const secondContent = result[1].content as MessageContentComplex[];
-    expect(firstContent.some((b) => 'cachePoint' in b)).toBe(false);
+    expect(firstContent.some((b) => 'cachePoint' in b)).toBe(true);
     expect(secondContent.some((b) => 'cachePoint' in b)).toBe(false);
   });
@@ -1561,14 +1620,14 @@ describe('OpenRouter prompt caching (reuses addCacheControl)', () => {
     const lastUser = converted[2];
     expect(Array.isArray(firstUser.content)).toBe(true);
-    expect(
-      (firstUser.content as CacheControlBlock[])[0]
-    ).toHaveProperty('cache_control');
+    expect((firstUser.content as CacheControlBlock[])[0]).toHaveProperty(
+      'cache_control'
+    );
     expect(Array.isArray(lastUser.content)).toBe(true);
-    expect(
-      (lastUser.content as CacheControlBlock[])[0]
-    ).toHaveProperty('cache_control');
+    expect((lastUser.content as CacheControlBlock[])[0]).toHaveProperty(
+      'cache_control'
+    );
   });
   it('strips Bedrock cache before applying OpenRouter/Anthropic cache', () => {

package/src/messages/cache.ts CHANGED Viewed

@@ -470,11 +470,11 @@ export function stripBedrockCacheControl<T extends MessageWithContent>(
 }
 /**
- * Adds Bedrock Converse API cache points to the last two messages.
+ * Adds Bedrock Converse API cache points to the latest two user messages.
  * Inserts `{ cachePoint: { type: 'default' } }` as a separate content block
  * immediately after the last text block in each targeted message.
  * Strips ALL existing cache control (both Bedrock and Anthropic formats) from all messages,
- * then adds fresh cache points to the last 2 messages in a single backward pass.
+ * then adds fresh cache points to the latest two non-tool user messages in a single backward pass.
  * This ensures we don't accumulate stale cache points across multiple turns.
  * Returns a new array - only clones messages that require modification.
  * @param messages - The array of message objects.
@@ -483,12 +483,12 @@ export function stripBedrockCacheControl<T extends MessageWithContent>(
 export function addBedrockCacheControl<
   T extends MessageWithContent & { getType?: () => string; role?: string },
 >(messages: T[]): T[] {
-  if (!Array.isArray(messages) || messages.length < 2) {
+  if (!Array.isArray(messages) || messages.length === 0) {
     return messages;
   }
   const updatedMessages: T[] = [...messages];
-  let messagesModified = 0;
+  let cachePointsAdded = 0;
   for (let i = updatedMessages.length - 1; i >= 0; i--) {
     const originalMessage = updatedMessages[i];
@@ -510,21 +510,27 @@ export function addBedrockCacheControl<
     }
     const isToolMessage = messageType === 'tool' || messageRole === 'tool';
+    const isUserMessage = messageType === 'human' || messageRole === 'user';
     const content = originalMessage.content;
+    const hasSerializationProps =
+      'lc_kwargs' in originalMessage ||
+      'lc_serializable' in originalMessage ||
+      'lc_namespace' in originalMessage;
     const hasArrayContent = Array.isArray(content);
     const isEmptyString = typeof content === 'string' && content === '';
     const needsCacheAdd =
-      messagesModified < 2 &&
+      cachePointsAdded < 2 &&
+      isUserMessage &&
       !isToolMessage &&
       !isEmptyString &&
       (typeof content === 'string' || hasArrayContent);
-    if (!needsCacheAdd && !hasArrayContent) {
+    if (!needsCacheAdd && !hasArrayContent && !hasSerializationProps) {
       continue;
     }
-    let workingContent: MessageContentComplex[];
-    let modified = false;
+    let workingContent: string | MessageContentComplex[];
+    let modified = hasSerializationProps;
     if (hasArrayContent) {
       // Single pass: clone blocks, strip cache markers, find last
@@ -563,14 +569,16 @@ export function addBedrockCacheControl<
         workingContent.splice(lastNonEmptyTextIndex + 1, 0, {
           cachePoint: { type: 'default' },
         } as MessageContentComplex);
-        messagesModified++;
+        cachePointsAdded++;
       }
     } else if (typeof content === 'string' && needsCacheAdd) {
       workingContent = [
         { type: ContentTypes.TEXT, text: content },
         { cachePoint: { type: 'default' } } as MessageContentComplex,
       ];
-      messagesModified++;
+      cachePointsAdded++;
+    } else if (typeof content === 'string' && hasSerializationProps) {
+      workingContent = content;
     } else {
       continue;
     }

package/src/messages/prune.ts CHANGED Viewed

@@ -563,7 +563,7 @@ function addThinkingBlock(
       },
     ];
   /** Edge case, the message already has the thinking block */
-  if (content[0].type === thinkingBlock.type) {
+  if (content[0]?.type === thinkingBlock.type) {
     return message;
   }
   content.unshift(thinkingBlock);
@@ -608,6 +608,33 @@ export type PruningResult = {
   thinkingStartIndex?: number;
 };
+/**
+ * Locates a reasoning block in assistant content. Reasoning blocks carry
+ * provider-specific `type` tags: Anthropic emits `thinking`, while Bedrock and
+ * OpenAI-compatible reasoning providers (DeepSeek-R1, DashScope/Qwen-thinking)
+ * emit `reasoning_content`. DeepSeek/Qwen route through the `THINKING` default
+ * even though their blocks are `reasoning_content` and aren't normalized
+ * upstream, so for the `THINKING` case we also accept `reasoning_content` — this
+ * is what fixes issue #191.
+ *
+ * The broadening is intentionally one-directional. A Bedrock run
+ * (`REASONING_CONTENT`) must NOT match an Anthropic `thinking` block: the
+ * Bedrock input converter rejects `thinking` blocks outright
+ * (`src/llm/bedrock/utils/message_inputs.ts`), so reattaching one to a
+ * surviving message would make the request fail before it is sent.
+ */
+function findReasoningBlock(
+  content: MessageContentComplex[],
+  reasoningType: ContentTypes
+): ThinkingContentText | ReasoningContentText | undefined {
+  return content.find(
+    (part) =>
+      part.type === reasoningType ||
+      (reasoningType === ContentTypes.THINKING &&
+        part.type === ContentTypes.REASONING_CONTENT)
+  ) as ThinkingContentText | ReasoningContentText | undefined;
+}
 /**
  * Processes an array of messages and returns a context of messages that fit within a specified token limit.
  * It iterates over the messages from newest to oldest, adding them to the context until the token limit is reached.
@@ -670,9 +697,7 @@ export function getMessagesWithinTokenLimit({
   if (_thinkingStartIndex > -1) {
     const thinkingMessageContent = messages[_thinkingStartIndex]?.content;
     if (Array.isArray(thinkingMessageContent)) {
-      thinkingBlock = thinkingMessageContent.find(
-        (content) => content.type === reasoningType
-      ) as ThinkingContentText | undefined;
+      thinkingBlock = findReasoningBlock(thinkingMessageContent, reasoningType);
     }
   }
@@ -705,9 +730,10 @@ export function getMessagesWithinTokenLimit({
         messageType === 'ai' &&
         Array.isArray(poppedMessage.content)
       ) {
-        thinkingBlock = poppedMessage.content.find(
-          (content) => content.type === reasoningType
-        ) as ThinkingContentText | undefined;
+        thinkingBlock = findReasoningBlock(
+          poppedMessage.content,
+          reasoningType
+        );
         thinkingStartIndex = thinkingBlock != null ? currentIndex : -1;
       }
       /**
@@ -811,16 +837,28 @@ export function getMessagesWithinTokenLimit({
     return result;
   }
-  if (thinkingEndIndex > -1 && thinkingStartIndex < 0) {
-    throw new Error(
-      'The payload is malformed. There is a thinking sequence but no "AI" messages with thinking blocks.'
-    );
-  }
-  if (!thinkingBlock) {
-    throw new Error(
-      'The payload is malformed. There is a thinking sequence but no thinking block found.'
-    );
+  /**
+   * A trailing reasoning sequence was detected but its block could not be
+   * located in the surviving context. Rather than throw — which permanently
+   * bricks the conversation, re-firing on every retry of the same thread (see
+   * issue #191) — return the partially-pruned context and let the provider
+   * surface a real, recoverable error if the payload is genuinely malformed.
+   * Strict providers (Anthropic) reject it cleanly; lenient ones (DeepSeek,
+   * Qwen) proceed. The pruner cannot know which applies, so it must not be the
+   * one to make the failure fatal.
+   */
+  if ((thinkingEndIndex > -1 && thinkingStartIndex < 0) || !thinkingBlock) {
+    /**
+     * No block was located, so any `thinkingStartIndex` set above came from a
+     * stale carried-over index pointing at a block-less message. Drop it:
+     * `createPruneMessages` persists the returned index as
+     * `runThinkingStartIndex`, and a stale value would suppress the trailing
+     * scan (`thinkingStartIndex < 0`) on later turns, causing a real reasoning
+     * block to be missed and never reattached.
+     */
+    delete result.thinkingStartIndex;
+    result.context = context.reverse() as BaseMessage[];
+    return result;
   }
   let assistantIndex = -1;

package/src/specs/langfuse-tool-output-tracing.test.ts CHANGED Viewed

@@ -180,6 +180,34 @@ describe('Langfuse tool output tracing redaction', () => {
     ).toBe(false);
   });
+  it('classifies LangGraph tool-node spans as Langfuse tool observations', () => {
+    const span = createSpan('tool_batch', {
+      [LangfuseOtelSpanAttributes.OBSERVATION_TYPE]: 'span',
+      [`${LangfuseOtelSpanAttributes.OBSERVATION_METADATA}.langgraph_node`]:
+        'tools=agent_1',
+    });
+    redactLangfuseSpanToolOutputs(span, createConfig());
+    expect(span.attributes[LangfuseOtelSpanAttributes.OBSERVATION_TYPE]).toBe(
+      'tool'
+    );
+  });
+  it('does not reclassify non-tool LangGraph spans', () => {
+    const span = createSpan('agent=agent_1', {
+      [LangfuseOtelSpanAttributes.OBSERVATION_TYPE]: 'span',
+      [`${LangfuseOtelSpanAttributes.OBSERVATION_METADATA}.langgraph_node`]:
+        'agent=agent_1',
+    });
+    redactLangfuseSpanToolOutputs(span, createConfig());
+    expect(span.attributes[LangfuseOtelSpanAttributes.OBSERVATION_TYPE]).toBe(
+      'span'
+    );
+  });
   it('redacts raw tool observation output when tool output tracing is disabled', () => {
     const span = createSpan('execute_sql', {
       [LangfuseOtelSpanAttributes.OBSERVATION_TYPE]: 'tool',