npm - @librechat/agents - Versions diffs - 3.2.34 → 3.2.36 - Mend

@librechat/agents 3.2.34 → 3.2.36

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (128) hide show

package/dist/cjs/agents/AgentContext.cjs +119 -9
package/dist/cjs/agents/AgentContext.cjs.map +1 -1
package/dist/cjs/agents/projection.cjs +25 -0
package/dist/cjs/agents/projection.cjs.map +1 -0
package/dist/cjs/common/enum.cjs +13 -0
package/dist/cjs/common/enum.cjs.map +1 -1
package/dist/cjs/graphs/Graph.cjs +106 -3
package/dist/cjs/graphs/Graph.cjs.map +1 -1
package/dist/cjs/llm/anthropic/utils/message_inputs.cjs +26 -4
package/dist/cjs/llm/anthropic/utils/message_inputs.cjs.map +1 -1
package/dist/cjs/llm/bedrock/utils/message_inputs.cjs +20 -0
package/dist/cjs/llm/bedrock/utils/message_inputs.cjs.map +1 -1
package/dist/cjs/llm/invoke.cjs +49 -8
package/dist/cjs/llm/invoke.cjs.map +1 -1
package/dist/cjs/main.cjs +7 -0
package/dist/cjs/messages/budget.cjs +23 -0
package/dist/cjs/messages/budget.cjs.map +1 -0
package/dist/cjs/messages/cache.cjs +1 -0
package/dist/cjs/messages/cache.cjs.map +1 -1
package/dist/cjs/messages/content.cjs +12 -14
package/dist/cjs/messages/content.cjs.map +1 -1
package/dist/cjs/messages/index.cjs +1 -0
package/dist/cjs/messages/prune.cjs +31 -13
package/dist/cjs/messages/prune.cjs.map +1 -1
package/dist/cjs/run.cjs +7 -2
package/dist/cjs/run.cjs.map +1 -1
package/dist/cjs/summarization/node.cjs +12 -1
package/dist/cjs/summarization/node.cjs.map +1 -1
package/dist/cjs/tools/search/format.cjs +91 -2
package/dist/cjs/tools/search/format.cjs.map +1 -1
package/dist/cjs/tools/search/tool.cjs +4 -3
package/dist/cjs/tools/search/tool.cjs.map +1 -1
package/dist/cjs/tools/subagent/SubagentExecutor.cjs +138 -2
package/dist/cjs/tools/subagent/SubagentExecutor.cjs.map +1 -1
package/dist/cjs/utils/tokens.cjs +30 -0
package/dist/cjs/utils/tokens.cjs.map +1 -1
package/dist/esm/agents/AgentContext.mjs +121 -11
package/dist/esm/agents/AgentContext.mjs.map +1 -1
package/dist/esm/agents/projection.mjs +25 -0
package/dist/esm/agents/projection.mjs.map +1 -0
package/dist/esm/common/enum.mjs +13 -0
package/dist/esm/common/enum.mjs.map +1 -1
package/dist/esm/graphs/Graph.mjs +107 -4
package/dist/esm/graphs/Graph.mjs.map +1 -1
package/dist/esm/llm/anthropic/utils/message_inputs.mjs +26 -4
package/dist/esm/llm/anthropic/utils/message_inputs.mjs.map +1 -1
package/dist/esm/llm/bedrock/utils/message_inputs.mjs +20 -0
package/dist/esm/llm/bedrock/utils/message_inputs.mjs.map +1 -1
package/dist/esm/llm/invoke.mjs +49 -8
package/dist/esm/llm/invoke.mjs.map +1 -1
package/dist/esm/main.mjs +6 -4
package/dist/esm/messages/budget.mjs +23 -0
package/dist/esm/messages/budget.mjs.map +1 -0
package/dist/esm/messages/cache.mjs +1 -1
package/dist/esm/messages/cache.mjs.map +1 -1
package/dist/esm/messages/content.mjs +12 -15
package/dist/esm/messages/content.mjs.map +1 -1
package/dist/esm/messages/index.mjs +1 -0
package/dist/esm/messages/prune.mjs +31 -13
package/dist/esm/messages/prune.mjs.map +1 -1
package/dist/esm/run.mjs +7 -2
package/dist/esm/run.mjs.map +1 -1
package/dist/esm/summarization/node.mjs +12 -1
package/dist/esm/summarization/node.mjs.map +1 -1
package/dist/esm/tools/search/format.mjs +91 -2
package/dist/esm/tools/search/format.mjs.map +1 -1
package/dist/esm/tools/search/tool.mjs +4 -3
package/dist/esm/tools/search/tool.mjs.map +1 -1
package/dist/esm/tools/subagent/SubagentExecutor.mjs +138 -2
package/dist/esm/tools/subagent/SubagentExecutor.mjs.map +1 -1
package/dist/esm/utils/tokens.mjs +30 -1
package/dist/esm/utils/tokens.mjs.map +1 -1
package/dist/types/agents/AgentContext.d.ts +37 -4
package/dist/types/agents/projection.d.ts +26 -0
package/dist/types/common/enum.d.ts +13 -0
package/dist/types/graphs/Graph.d.ts +8 -1
package/dist/types/index.d.ts +1 -0
package/dist/types/llm/invoke.d.ts +1 -1
package/dist/types/messages/budget.d.ts +11 -0
package/dist/types/messages/cache.d.ts +7 -0
package/dist/types/messages/content.d.ts +5 -0
package/dist/types/messages/index.d.ts +1 -0
package/dist/types/messages/prune.d.ts +4 -0
package/dist/types/run.d.ts +1 -0
package/dist/types/tools/search/format.d.ts +4 -1
package/dist/types/tools/search/types.d.ts +7 -0
package/dist/types/tools/subagent/SubagentExecutor.d.ts +11 -1
package/dist/types/types/graph.d.ts +89 -3
package/dist/types/types/run.d.ts +13 -0
package/dist/types/utils/tokens.d.ts +7 -0
package/package.json +1 -1
package/src/agents/AgentContext.ts +172 -8
package/src/agents/__tests__/AgentContext.test.ts +235 -2
package/src/agents/__tests__/projection.test.ts +73 -0
package/src/agents/projection.ts +46 -0
package/src/common/enum.ts +13 -0
package/src/graphs/Graph.ts +168 -0
package/src/index.ts +3 -0
package/src/llm/anthropic/utils/cross-provider-reasoning.test.ts +317 -0
package/src/llm/anthropic/utils/message_inputs.ts +78 -16
package/src/llm/bedrock/utils/cross-provider-reasoning.test.ts +131 -0
package/src/llm/bedrock/utils/message_inputs.ts +35 -0
package/src/llm/invoke.test.ts +79 -1
package/src/llm/invoke.ts +58 -4
package/src/messages/budget.ts +32 -0
package/src/messages/cache.ts +1 -1
package/src/messages/content.ts +24 -32
package/src/messages/index.ts +1 -0
package/src/messages/prune.ts +39 -2
package/src/run.ts +5 -0
package/src/scripts/subagent-usage-sink.ts +176 -0
package/src/specs/context-accuracy.live.test.ts +409 -0
package/src/specs/context-usage-event.test.ts +117 -0
package/src/specs/context-usage.live.test.ts +297 -0
package/src/specs/prune.test.ts +51 -1
package/src/specs/subagent.test.ts +124 -1
package/src/summarization/__tests__/node.test.ts +60 -1
package/src/summarization/node.ts +20 -1
package/src/tools/__tests__/SubagentExecutor.test.ts +443 -1
package/src/tools/search/format.test.ts +242 -0
package/src/tools/search/format.ts +122 -5
package/src/tools/search/tool.ts +5 -1
package/src/tools/search/types.ts +7 -0
package/src/tools/subagent/SubagentExecutor.ts +221 -3
package/src/types/graph.ts +94 -1
package/src/types/run.ts +13 -0
package/src/utils/__tests__/apportion.test.ts +32 -0
package/src/utils/tokens.ts +33 -0

package/src/tools/__tests__/SubagentExecutor.test.ts CHANGED Viewed

@@ -4,7 +4,9 @@ import type { BaseMessage } from '@langchain/core/messages';
 import type {
   AgentInputs,
   ResolvedSubagentConfig,
+  StandardGraphInput,
   SubagentUpdateEvent,
+  SubagentUsageEvent,
   ToolExecuteBatchRequest,
   ToolExecuteResult,
 } from '@/types';
@@ -17,7 +19,7 @@ import {
   summarizeEvent,
 } from '../subagent';
 import { sanitizeForwardedSubagentUpdateData } from '../subagent/SubagentExecutor';
-import { Providers, GraphEvents, StepTypes } from '@/common';
+import { Constants, Providers, GraphEvents, StepTypes } from '@/common';
 import { AgentContext } from '@/agents/AgentContext';
 import { HookRegistry } from '@/hooks/HookRegistry';
 import { HandlerRegistry } from '@/events';
@@ -456,6 +458,446 @@ describe('SubagentExecutor', () => {
     expect(observedLangfuse).toBe(langfuse);
   });
+  describe('usage sink', () => {
+    /**
+     * Callback-handler methods these tests invoke by hand on the handler
+     * found in the options passed to the stubbed `workflow.invoke`.
+     */
+    type CapturedCallbackHandler = {
+      handleChatModelStart?: (
+        llm: unknown,
+        messages: unknown,
+        runId: string,
+        parentRunId?: string,
+        extraParams?: Record<string, unknown>,
+        tags?: string[],
+        metadata?: Record<string, unknown>
+      ) => unknown;
+      handleLLMEnd?: (output: unknown, runId: string) => unknown;
+      handleLLMError?: (err: unknown, runId: string) => unknown;
+    };
+    /** The slice of the `workflow.invoke` options the stub inspects. */
+    type CapturedInvokeOptions = { callbacks?: CapturedCallbackHandler[] };
+    /** Script that replays model-call callbacks against the captured handler. */
+    type DriveCallbacks = (
+      handler: CapturedCallbackHandler
+    ) => void | Promise<void>;
+    /**
+     * Stub factory that records the `StandardGraphInput` the executor
+     * builds and the options passed to `workflow.invoke`, so tests can
+     * drive the attached usage-capture callback directly (the stubbed
+     * invoke never makes real model calls, so callbacks would otherwise
+     * never fire).
+     *
+     * @param driveDuringInvoke Optional script run inside the stubbed
+     *   `invoke` against the first callback that defines `handleLLMEnd`.
+     * @returns The factory plus getters for the captured input and options.
+     */
+    function makeCapturingGraphFactory(driveDuringInvoke?: {
+      drive: DriveCallbacks;
+    }): {
+      factory: (input: StandardGraphInput) => StandardGraph;
+      getInput: () => StandardGraphInput | undefined;
+      getInvokeOptions: () => CapturedInvokeOptions | undefined;
+    } {
+      let capturedInput: StandardGraphInput | undefined;
+      let capturedOptions: CapturedInvokeOptions | undefined;
+      /** Stand-in for `workflow.invoke`: record options, replay the script, finish. */
+      const stubbedInvoke = async (
+        _input: unknown,
+        options: CapturedInvokeOptions
+      ): Promise<{ messages: AIMessage[] }> => {
+        capturedOptions = options;
+        const usageHandler = options.callbacks?.find(
+          (cb) => cb.handleLLMEnd != null
+        );
+        if (driveDuringInvoke && usageHandler) {
+          await driveDuringInvoke.drive(usageHandler);
+        }
+        return { messages: [new AIMessage('child done')] };
+      };
+      const factory = (input: StandardGraphInput): StandardGraph => {
+        capturedInput = input;
+        return {
+          /** Every workflow gets its own mock wrapping the same stub. */
+          createWorkflow: (): { invoke: jest.Mock } => ({
+            invoke: jest.fn().mockImplementation(stubbedInvoke),
+          }),
+          clearHeavyState: jest.fn(),
+        } as unknown as StandardGraph;
+      };
+      return {
+        factory,
+        getInput: () => capturedInput,
+        getInvokeOptions: () => capturedOptions,
+      };
+    }
+    /** One generation choice; `usage_metadata` is attached only when `usage` is given. */
+    const makeChoice = (
+      usage: Record<string, number> | undefined
+    ): unknown => ({
+      text: 'ok',
+      message: new AIMessage({
+        content: 'ok',
+        ...(usage
+          ? {
+            usage_metadata: usage as unknown as AIMessage['usage_metadata'],
+          }
+          : {}),
+      }),
+    });
+    /** `handleLLMEnd` payload holding a single generation group with one choice. */
+    const makeLLMEndOutput = (
+      usage: Record<string, number> | undefined
+    ): unknown => ({
+      generations: [[makeChoice(usage)]],
+    });
+    /** Sink that appends every event it receives to `bucket`. */
+    const collectInto =
+      (bucket: SubagentUsageEvent[]) =>
+        (event: SubagentUsageEvent): void => {
+          bucket.push(event);
+        };
+    /** Issues the request shared by every test in this suite. */
+    const runResearcher = (
+      executor: ReturnType<typeof createExecutor>
+    ): ReturnType<ReturnType<typeof createExecutor>['execute']> =>
+      executor.execute({
+        description: 'Research this topic',
+        subagentType: 'researcher',
+      });
+    /** Fires `handleChatModelStart` for `runId`, passing only per-call metadata. */
+    const startModelCall = (
+      handler: CapturedCallbackHandler,
+      runId: string,
+      metadata: Record<string, unknown>
+    ): unknown =>
+      handler.handleChatModelStart?.(
+        {},
+        [[]],
+        runId,
+        undefined,
+        undefined,
+        undefined,
+        metadata
+      );
+    /** Fires `handleLLMEnd` for `runId` with a single-choice payload. */
+    const endModelCall = (
+      handler: CapturedCallbackHandler,
+      runId: string,
+      usage: Record<string, number> | undefined
+    ): unknown => handler.handleLLMEnd?.(makeLLMEndOutput(usage), runId);
+    /**
+     * Runs the shared request with a collecting sink while `drive` replays
+     * callbacks inside the stubbed invoke.
+     *
+     * @returns Every usage event the sink received, in arrival order.
+     */
+    const collectUsageEvents = async (
+      drive: DriveCallbacks
+    ): Promise<SubagentUsageEvent[]> => {
+      const events: SubagentUsageEvent[] = [];
+      const { factory } = makeCapturingGraphFactory({ drive });
+      const executor = createExecutor({
+        usageSink: collectInto(events),
+        createChildGraph: factory,
+      });
+      await runResearcher(executor);
+      return events;
+    };
+    it('forwards a wrapped sink into the child graph input that rewrites runId to the root run', async () => {
+      const events: SubagentUsageEvent[] = [];
+      const { factory, getInput } = makeCapturingGraphFactory();
+      const executor = createExecutor({
+        usageSink: collectInto(events),
+        createChildGraph: factory,
+      });
+      await runResearcher(executor);
+      const forwarded = getInput()?.subagentUsageSink;
+      expect(typeof forwarded).toBe('function');
+      /**
+       * Simulate a NESTED child's emission: its executor stamps `runId`
+       * with its own parent (an intermediate `*_sub_*` id). The wrapper
+       * must rewrite it to THIS executor's parent run so the host always
+       * sees root-run attribution, while the emitting child's identity
+       * (`subagentRunId`) is preserved.
+       */
+      forwarded?.({
+        usage: { input_tokens: 1, output_tokens: 1, total_tokens: 2 },
+        model: 'gpt-4o-mini',
+        provider: Providers.OPENAI,
+        subagentType: 'nested-grandchild',
+        subagentRunId: 'test-run_sub_a_sub_b',
+        subagentAgentId: 'grandchild',
+        runId: 'test-run_sub_a',
+      });
+      expect(events).toHaveLength(1);
+      const [event] = events;
+      expect(event.runId).toBe('test-run');
+      expect(event.subagentRunId).toBe('test-run_sub_a_sub_b');
+      expect(event.subagentType).toBe('nested-grandchild');
+    });
+    it('does not attach a capture callback when no sink is provided', async () => {
+      const { factory, getInvokeOptions } = makeCapturingGraphFactory();
+      const executor = createExecutor({ createChildGraph: factory });
+      await runResearcher(executor);
+      expect(getInvokeOptions()?.callbacks).toEqual([]);
+    });
+    it('emits tagged usage events with per-call ls_model_name', async () => {
+      const events = await collectUsageEvents(async (handler) => {
+        await startModelCall(handler, 'call-1', {
+          ls_model_name: 'gpt-4o-mini-2024-07-18',
+        });
+        await endModelCall(handler, 'call-1', {
+          input_tokens: 11,
+          output_tokens: 7,
+          total_tokens: 18,
+        });
+      });
+      expect(events).toHaveLength(1);
+      const [event] = events;
+      expect(event.usage).toEqual({
+        input_tokens: 11,
+        output_tokens: 7,
+        total_tokens: 18,
+      });
+      expect(event.model).toBe('gpt-4o-mini-2024-07-18');
+      expect(event.provider).toBe(Providers.OPENAI);
+      expect(event.subagentType).toBe('researcher');
+      expect(event.subagentAgentId).toBe('child-agent');
+      expect(event.subagentRunId).toContain('test-run_sub_');
+      expect(event.runId).toBe('test-run');
+    });
+    it('falls back to the configured model when a call has no ls_model_name', async () => {
+      const events = await collectUsageEvents(async (handler) => {
+        await endModelCall(handler, 'call-1', {
+          input_tokens: 3,
+          output_tokens: 2,
+          total_tokens: 5,
+        });
+      });
+      expect(events).toHaveLength(1);
+      /** `makeChildInputs` configures `clientOptions.modelName`. */
+      expect(events[0].model).toBe('gpt-4o-mini');
+    });
+    it('emits one event per generation group when a call has multiple completions (n > 1)', async () => {
+      const usage = { input_tokens: 10, output_tokens: 4, total_tokens: 14 };
+      const events = await collectUsageEvents(async (handler) => {
+        /**
+         * One provider request with two choices — both carry the same
+         * request-level usage. Emitting per choice would double-bill.
+         */
+        await handler.handleLLMEnd?.(
+          { generations: [[makeChoice(usage), makeChoice(usage)]] },
+          'call-1'
+        );
+        /** Batched prompts: two groups = two requests = two events. */
+        await handler.handleLLMEnd?.(
+          { generations: [[makeChoice(usage)], [makeChoice(usage)]] },
+          'call-2'
+        );
+      });
+      expect(events).toHaveLength(3);
+    });
+    it('prefers INVOKED_PROVIDER/INVOKED_MODEL metadata for fallback-served calls', async () => {
+      const events = await collectUsageEvents(async (handler) => {
+        /**
+         * Mirror a fallback-served call: `attemptInvoke` stamps the
+         * serving provider, `tryFallbackProviders` stamps the fallback's
+         * configured model, and the provider reports no `ls_model_name`.
+         */
+        await startModelCall(handler, 'call-1', {
+          [Constants.INVOKED_PROVIDER]: Providers.ANTHROPIC,
+          [Constants.INVOKED_MODEL]: 'claude-fallback-1',
+        });
+        await endModelCall(handler, 'call-1', {
+          input_tokens: 5,
+          output_tokens: 3,
+          total_tokens: 8,
+        });
+      });
+      expect(events).toHaveLength(1);
+      /** Not the configured primary (openAI / gpt-4o-mini). */
+      expect(events[0].provider).toBe(Providers.ANTHROPIC);
+      expect(events[0].model).toBe('claude-fallback-1');
+    });
+    it('prefers provider-reported ls_model_name over INVOKED_MODEL', async () => {
+      const events = await collectUsageEvents(async (handler) => {
+        await startModelCall(handler, 'call-1', {
+          ls_model_name: 'claude-fallback-1-20260101',
+          [Constants.INVOKED_PROVIDER]: Providers.ANTHROPIC,
+          [Constants.INVOKED_MODEL]: 'claude-fallback-1',
+        });
+        await endModelCall(handler, 'call-1', {
+          input_tokens: 5,
+          output_tokens: 3,
+          total_tokens: 8,
+        });
+      });
+      /**
+       * Guard the index below: without it a run that emits nothing fails
+       * with a TypeError instead of a readable assertion, and a duplicate
+       * emission would pass unnoticed.
+       */
+      expect(events).toHaveLength(1);
+      expect(events[0].model).toBe('claude-fallback-1-20260101');
+    });
+    it('skips model calls that report no usage_metadata', async () => {
+      const events = await collectUsageEvents(async (handler) => {
+        await endModelCall(handler, 'call-1', undefined);
+      });
+      expect(events).toEqual([]);
+    });
+    it('swallows sink errors without breaking the child run', async () => {
+      const { factory } = makeCapturingGraphFactory({
+        drive: async (handler) => {
+          await endModelCall(handler, 'call-1', {
+            input_tokens: 1,
+            output_tokens: 1,
+            total_tokens: 2,
+          });
+        },
+      });
+      const executor = createExecutor({
+        usageSink: () => {
+          throw new Error('host sink exploded');
+        },
+        createChildGraph: factory,
+      });
+      const result = await runResearcher(executor);
+      expect(result.content).toBe('child done');
+    });
+    it('awaits async sinks and swallows their rejections', async () => {
+      const settled: string[] = [];
+      const { factory } = makeCapturingGraphFactory({
+        drive: async (handler) => {
+          await endModelCall(handler, 'call-1', {
+            input_tokens: 1,
+            output_tokens: 1,
+            total_tokens: 2,
+          });
+          await endModelCall(handler, 'call-2', {
+            input_tokens: 2,
+            output_tokens: 2,
+            total_tokens: 4,
+          });
+          /**
+           * Both sink dispatches must have settled by the time
+           * `handleLLMEnd` resolves — a dropped promise would leave
+           * `recorded` missing here and surface the second call's
+           * rejection as unhandled.
+           */
+          settled.push('drive-done');
+        },
+      });
+      const executor = createExecutor({
+        usageSink: async (event) => {
+          /** Real 5 ms delay so an un-awaited sink would finish after `drive`. */
+          await new Promise((resolve) => setTimeout(resolve, 5));
+          if (event.usage.input_tokens === 2) {
+            throw new Error('async host sink rejected');
+          }
+          settled.push('recorded');
+        },
+        createChildGraph: factory,
+      });
+      const result = await runResearcher(executor);
+      expect(result.content).toBe('child done');
+      expect(settled).toEqual(['recorded', 'drive-done']);
+    });
+  });
   it('returns error message when child graph throws', async () => {
     const executor = createExecutor({
       createChildGraph: makeThrowingGraphFactory(

package/src/tools/search/format.test.ts ADDED Viewed

@@ -0,0 +1,242 @@
+import type * as t from './types';
+import { formatResultsForLLM, resolveMaxLLMOutputChars } from './format';
+/** Builds an organic search hit whose title and snippet are derived from `link`. */
+const makeOrganic = (
+  link: string,
+  highlights: t.Highlight[]
+): t.ProcessedOrganic => {
+  const title = `Title for ${link}`;
+  const snippet = `Snippet for ${link}`;
+  return { link, title, snippet, highlights };
+};
+/** Builds a highlight with the given text; `score` defaults to 0.9. */
+const highlight = (text: string, score = 0.9): t.Highlight => {
+  return { text, score };
+};
+/** Builds a `link`-type used-reference entry pointing at `url`. */
+const reference = (url: string, originalIndex = 0): t.UsedReferences[number] => {
+  const target = { originalUrl: url, title: 'Ref', text: 'ref' };
+  return { type: 'link', originalIndex, reference: target };
+};
+/** Counts the `### Highlight <digits>` headings present in `output`. */
+const countHighlightBlocks = (output: string): number => {
+  const headings = output.match(/### Highlight \d+/g);
+  return headings == null ? 0 : headings.length;
+};
+/** Substring the tests look for to detect the omitted-highlights notice. */
+const OMISSION_MARKER = 'omitted to fit the context budget';
+describe('resolveMaxLLMOutputChars', () => {
+  /** Environment variable the resolver is expected to consult. */
+  const ENV_KEY = 'SEARCH_MAX_LLM_OUTPUT_CHARS';
+  /** Value the tests expect when neither config nor env supplies a limit. */
+  const BUILT_IN_DEFAULT = 50000;
+  /** Value present when the suite was defined; put back after every test. */
+  const savedValue = process.env[ENV_KEY];
+  afterEach(() => {
+    if (savedValue != null) {
+      process.env[ENV_KEY] = savedValue;
+      return;
+    }
+    delete process.env[ENV_KEY];
+  });
+  test('falls back to the 50,000 char default when nothing is configured', () => {
+    delete process.env[ENV_KEY];
+    /** No argument, zero, and a negative value all yield the default. */
+    expect(resolveMaxLLMOutputChars()).toBe(BUILT_IN_DEFAULT);
+    expect(resolveMaxLLMOutputChars(0)).toBe(BUILT_IN_DEFAULT);
+    expect(resolveMaxLLMOutputChars(-100)).toBe(BUILT_IN_DEFAULT);
+  });
+  test('honors the SEARCH_MAX_LLM_OUTPUT_CHARS env var', () => {
+    process.env[ENV_KEY] = '777';
+    expect(resolveMaxLLMOutputChars()).toBe(777);
+    expect(resolveMaxLLMOutputChars(0)).toBe(777);
+  });
+  test('an explicit positive config value wins over env and default', () => {
+    process.env[ENV_KEY] = '777';
+    expect(resolveMaxLLMOutputChars(1234)).toBe(1234);
+  });
+  test('ignores a non-numeric env var', () => {
+    process.env[ENV_KEY] = 'not-a-number';
+    expect(resolveMaxLLMOutputChars()).toBe(BUILT_IN_DEFAULT);
+  });
+});
+describe('formatResultsForLLM highlight budget', () => {
+  /** Text the tests expect on a highlight that was cut at the budget boundary. */
+  const TRUNCATED = '…[truncated]';
+  /** Opening of the notice the tests expect when exactly one highlight is left out. */
+  const ONE_OMITTED =
+    '_[1 additional highlight omitted to fit the context budget';
+  /** Budget large enough that every fixture in this suite fits. */
+  const ROOMY_BUDGET = 50000;
+  /** `count` copies of `char`. */
+  const fill = (char: string, count: number): string => char.repeat(count);
+  /** Formats `results` under `budget`; the first argument is always 0 in this suite. */
+  const format = (
+    results: t.SearchResultData,
+    budget: number
+  ): ReturnType<typeof formatResultsForLLM> =>
+    formatResultsForLLM(0, results, budget);
+  /** A single organic hit on https://a.com carrying `highlights`. */
+  const singleSite = (highlights: t.Highlight[]): t.SearchResultData => ({
+    organic: [makeOrganic('https://a.com', highlights)],
+  });
+  /** Two organic hits, each with one 100-character highlight (A then B). */
+  const twoSites = (): t.SearchResultData => ({
+    organic: [
+      makeOrganic('https://a.com', [highlight(fill('A', 100))]),
+      makeOrganic('https://b.com', [highlight(fill('B', 100))]),
+    ],
+  });
+  /** A highlight with `refs` assigned to its `references` field. */
+  const citing = (
+    text: string,
+    refs: NonNullable<t.Highlight['references']>
+  ): t.Highlight => {
+    const cited = highlight(text);
+    cited.references = refs;
+    return cited;
+  };
+  test('keeps whole highlights in relevance order until the budget is hit', () => {
+    const { output } = format(twoSites(), 100);
+    expect(output).toContain(fill('A', 100));
+    expect(output).not.toContain(fill('B', 100));
+    expect(countHighlightBlocks(output)).toBe(1);
+    expect(output).toContain(ONE_OMITTED);
+  });
+  test('truncates the boundary highlight when meaningful room remains', () => {
+    const { output } = format(singleSite([highlight(fill('A', 1000))]), 500);
+    expect(output).toContain(TRUNCATED);
+    /** Exactly 500 characters of the highlight survive — no more. */
+    expect(output).toContain(fill('A', 500));
+    expect(output).not.toContain(fill('A', 501));
+    expect(output).toContain(ONE_OMITTED);
+  });
+  test('drops the boundary highlight entirely when too little room remains', () => {
+    const { output } = format(twoSites(), 150);
+    expect(output).toContain(fill('A', 100));
+    expect(output).not.toContain(TRUNCATED);
+    /** Not even a single `B` may leak through. */
+    expect(output).not.toContain('B');
+    expect(countHighlightBlocks(output)).toBe(1);
+  });
+  test('always keeps snippets, titles, and URLs even when all highlights are dropped', () => {
+    const { output } = format(singleSite([highlight(fill('A', 100))]), 10);
+    expect(output).toContain('URL: https://a.com');
+    expect(output).toContain('Summary: Snippet for https://a.com');
+    expect(output).toContain('"Title for https://a.com"');
+    expect(countHighlightBlocks(output)).toBe(0);
+    expect(output).toContain(ONE_OMITTED);
+  });
+  test('emits no omission marker when every highlight fits the budget', () => {
+    const { output } = format(twoSites(), ROOMY_BUDGET);
+    expect(output).toContain(fill('A', 100));
+    expect(output).toContain(fill('B', 100));
+    expect(countHighlightBlocks(output)).toBe(2);
+    expect(output).not.toContain(OMISSION_MARKER);
+  });
+  test('drops references with no surviving marker when truncating', () => {
+    const cited = citing(fill('A', 1000), [
+      reference('https://cited.example'),
+    ]);
+    const { output, references } = format(singleSite([cited]), 500);
+    expect(output).toContain(TRUNCATED);
+    expect(output).not.toContain('Core References');
+    expect(output).not.toContain('https://cited.example');
+    expect(references).toHaveLength(0);
+  });
+  test('keeps references whose marker survives truncation and drops the rest', () => {
+    /** `(link#1)` sits before the cut, `(link#2)` after it. */
+    const cited = citing(`(link#1) ${fill('A', 1000)} (link#2)`, [
+      reference('https://one.example', 0),
+      reference('https://two.example', 1),
+    ]);
+    const { output, references } = format(singleSite([cited]), 500);
+    expect(output).toContain(TRUNCATED);
+    expect(output).toContain('https://one.example');
+    expect(output).not.toContain('https://two.example');
+    expect(references).toHaveLength(1);
+    expect(references[0].link).toBe('https://one.example');
+  });
+  test('stops at the boundary highlight — no lower-ranked highlight slips in', () => {
+    const ranked = [
+      highlight(fill('A', 100), 0.9),
+      highlight(fill('B', 300), 0.8),
+      highlight(fill('C', 10), 0.7),
+    ];
+    const { output } = format(singleSite(ranked), 150);
+    expect(output).toContain(fill('A', 100));
+    expect(output).not.toContain(fill('B', 300));
+    expect(output).not.toContain(fill('C', 10));
+    expect(output).not.toContain(TRUNCATED);
+    expect(countHighlightBlocks(output)).toBe(1);
+  });
+  test('keeps references on a whole highlight that fits the budget', () => {
+    const cited = citing(fill('A', 100), [
+      reference('https://cited.example'),
+    ]);
+    const { output, references } = format(singleSite([cited]), ROOMY_BUDGET);
+    expect(output).toContain('Core References');
+    expect(references).toHaveLength(1);
+    expect(references[0].link).toBe('https://cited.example');
+  });
+  test('skips blank highlights instead of charging them against the budget', () => {
+    const mixed = [highlight('   \n\t  '), highlight(fill('A', 100))];
+    const { output } = format(singleSite(mixed), 100);
+    expect(output).toContain(fill('A', 100));
+    expect(output).not.toContain(TRUNCATED);
+    expect(countHighlightBlocks(output)).toBe(1);
+    expect(output).not.toContain(OMISSION_MARKER);
+  });
+  test('spends the budget across organic results before news results', () => {
+    const results: t.SearchResultData = {
+      ...singleSite([highlight(fill('A', 100))]),
+      topStories: [
+        {
+          link: 'https://news.com',
+          title: 'Story',
+          highlights: [highlight(fill('N', 100))],
+        },
+      ],
+    };
+    const { output } = format(results, 100);
+    expect(output).toContain(fill('A', 100));
+    expect(output).not.toContain(fill('N', 100));
+    expect(output).toContain(ONE_OMITTED);
+  });
+});