npm - @illuma-ai/agents - Versions diffs - 1.5.1 → 2.1.1 - Mend

@illuma-ai/agents 1.5.1 → 2.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (319)

package/README.md +0 -62
package/dist/cjs/agents/AgentContext.cjs +160 -259
package/dist/cjs/agents/AgentContext.cjs.map +1 -1
package/dist/cjs/common/enum.cjs +12 -12
package/dist/cjs/common/enum.cjs.map +1 -1
package/dist/cjs/graphs/Graph.cjs +30 -13
package/dist/cjs/graphs/Graph.cjs.map +1 -1
package/dist/cjs/graphs/MultiAgentGraph.cjs +1 -1
package/dist/cjs/graphs/MultiAgentGraph.cjs.map +1 -1
package/dist/cjs/graphs/phases/memoryFlushPhase.cjs +1 -1
package/dist/cjs/graphs/phases/memoryFlushPhase.cjs.map +1 -1
package/dist/cjs/hooks/HookRegistry.cjs +1 -1
package/dist/cjs/hooks/HookRegistry.cjs.map +1 -1
package/dist/cjs/hooks/matchers.cjs +2 -2
package/dist/cjs/hooks/matchers.cjs.map +1 -1
package/dist/cjs/hooks/types.cjs +1 -1
package/dist/cjs/hooks/types.cjs.map +1 -1
package/dist/cjs/llm/anthropic/utils/message_inputs.cjs +1 -5
package/dist/cjs/llm/anthropic/utils/message_inputs.cjs.map +1 -1
package/dist/cjs/llm/bedrock/index.cjs +33 -61
package/dist/cjs/llm/bedrock/index.cjs.map +1 -1
package/dist/cjs/llm/openai/index.cjs +1 -1
package/dist/cjs/llm/openai/index.cjs.map +1 -1
package/dist/cjs/llm/openai/utils/index.cjs +10 -27
package/dist/cjs/llm/openai/utils/index.cjs.map +1 -1
package/dist/cjs/main.cjs +3 -84
package/dist/cjs/main.cjs.map +1 -1
package/dist/cjs/memory/citations.cjs +4 -4
package/dist/cjs/memory/citations.cjs.map +1 -1
package/dist/cjs/memory/constants.cjs +17 -17
package/dist/cjs/memory/constants.cjs.map +1 -1
package/dist/cjs/memory/mmr.cjs +1 -1
package/dist/cjs/memory/mmr.cjs.map +1 -1
package/dist/cjs/memory/paths.cjs +1 -1
package/dist/cjs/memory/paths.cjs.map +1 -1
package/dist/cjs/memory/recallTracking.cjs +3 -3
package/dist/cjs/memory/recallTracking.cjs.map +1 -1
package/dist/cjs/memory/temporalDecay.cjs +2 -2
package/dist/cjs/memory/temporalDecay.cjs.map +1 -1
package/dist/cjs/messages/cache.cjs +0 -89
package/dist/cjs/messages/cache.cjs.map +1 -1
package/dist/cjs/messages/format.cjs +13 -71
package/dist/cjs/messages/format.cjs.map +1 -1
package/dist/cjs/tools/BashExecutor.cjs +11 -21
package/dist/cjs/tools/BashExecutor.cjs.map +1 -1
package/dist/cjs/tools/CodeExecutor.cjs +13 -41
package/dist/cjs/tools/CodeExecutor.cjs.map +1 -1
package/dist/cjs/tools/ProgrammaticToolCalling.cjs +11 -16
package/dist/cjs/tools/ProgrammaticToolCalling.cjs.map +1 -1
package/dist/cjs/tools/ToolNode.cjs +78 -13
package/dist/cjs/tools/ToolNode.cjs.map +1 -1
package/dist/cjs/tools/memory/memoryAppendTool.cjs +1 -1
package/dist/cjs/tools/memory/memoryAppendTool.cjs.map +1 -1
package/dist/cjs/tools/memory/memoryGetTool.cjs +2 -2
package/dist/cjs/tools/memory/memoryGetTool.cjs.map +1 -1
package/dist/cjs/tools/memory/memorySearchTool.cjs +3 -3
package/dist/cjs/tools/memory/memorySearchTool.cjs.map +1 -1
package/dist/cjs/tools/memory/shared.cjs +1 -1
package/dist/cjs/tools/memory/shared.cjs.map +1 -1
package/dist/cjs/tools/search/search.cjs +3 -11
package/dist/cjs/tools/search/search.cjs.map +1 -1
package/dist/cjs/tools/search/tool.cjs +4 -28
package/dist/cjs/tools/search/tool.cjs.map +1 -1
package/dist/cjs/tools/search/utils.cjs +3 -10
package/dist/cjs/tools/search/utils.cjs.map +1 -1
package/dist/cjs/tools/subagent/SubagentExecutor.cjs +48 -0
package/dist/cjs/tools/subagent/SubagentExecutor.cjs.map +1 -1
package/dist/cjs/types/graph.cjs.map +1 -1
package/dist/esm/agents/AgentContext.mjs +160 -259
package/dist/esm/agents/AgentContext.mjs.map +1 -1
package/dist/esm/common/enum.mjs +12 -12
package/dist/esm/common/enum.mjs.map +1 -1
package/dist/esm/graphs/Graph.mjs +30 -13
package/dist/esm/graphs/Graph.mjs.map +1 -1
package/dist/esm/graphs/MultiAgentGraph.mjs +1 -1
package/dist/esm/graphs/MultiAgentGraph.mjs.map +1 -1
package/dist/esm/graphs/phases/memoryFlushPhase.mjs +1 -1
package/dist/esm/graphs/phases/memoryFlushPhase.mjs.map +1 -1
package/dist/esm/hooks/HookRegistry.mjs +1 -1
package/dist/esm/hooks/HookRegistry.mjs.map +1 -1
package/dist/esm/hooks/matchers.mjs +2 -2
package/dist/esm/hooks/matchers.mjs.map +1 -1
package/dist/esm/hooks/types.mjs +1 -1
package/dist/esm/hooks/types.mjs.map +1 -1
package/dist/esm/llm/anthropic/utils/message_inputs.mjs +1 -5
package/dist/esm/llm/anthropic/utils/message_inputs.mjs.map +1 -1
package/dist/esm/llm/bedrock/index.mjs +34 -61
package/dist/esm/llm/bedrock/index.mjs.map +1 -1
package/dist/esm/llm/openai/index.mjs +1 -1
package/dist/esm/llm/openai/index.mjs.map +1 -1
package/dist/esm/llm/openai/utils/index.mjs +10 -27
package/dist/esm/llm/openai/utils/index.mjs.map +1 -1
package/dist/esm/main.mjs +1 -5
package/dist/esm/main.mjs.map +1 -1
package/dist/esm/memory/citations.mjs +4 -4
package/dist/esm/memory/citations.mjs.map +1 -1
package/dist/esm/memory/constants.mjs +17 -17
package/dist/esm/memory/constants.mjs.map +1 -1
package/dist/esm/memory/mmr.mjs +1 -1
package/dist/esm/memory/mmr.mjs.map +1 -1
package/dist/esm/memory/paths.mjs +1 -1
package/dist/esm/memory/paths.mjs.map +1 -1
package/dist/esm/memory/recallTracking.mjs +3 -3
package/dist/esm/memory/recallTracking.mjs.map +1 -1
package/dist/esm/memory/temporalDecay.mjs +2 -2
package/dist/esm/memory/temporalDecay.mjs.map +1 -1
package/dist/esm/messages/cache.mjs +0 -89
package/dist/esm/messages/cache.mjs.map +1 -1
package/dist/esm/messages/format.mjs +13 -71
package/dist/esm/messages/format.mjs.map +1 -1
package/dist/esm/tools/BashExecutor.mjs +12 -22
package/dist/esm/tools/BashExecutor.mjs.map +1 -1
package/dist/esm/tools/CodeExecutor.mjs +14 -41
package/dist/esm/tools/CodeExecutor.mjs.map +1 -1
package/dist/esm/tools/ProgrammaticToolCalling.mjs +12 -17
package/dist/esm/tools/ProgrammaticToolCalling.mjs.map +1 -1
package/dist/esm/tools/ToolNode.mjs +78 -13
package/dist/esm/tools/ToolNode.mjs.map +1 -1
package/dist/esm/tools/memory/memoryAppendTool.mjs +1 -1
package/dist/esm/tools/memory/memoryAppendTool.mjs.map +1 -1
package/dist/esm/tools/memory/memoryGetTool.mjs +2 -2
package/dist/esm/tools/memory/memoryGetTool.mjs.map +1 -1
package/dist/esm/tools/memory/memorySearchTool.mjs +3 -3
package/dist/esm/tools/memory/memorySearchTool.mjs.map +1 -1
package/dist/esm/tools/memory/shared.mjs +1 -1
package/dist/esm/tools/memory/shared.mjs.map +1 -1
package/dist/esm/tools/search/search.mjs +3 -11
package/dist/esm/tools/search/search.mjs.map +1 -1
package/dist/esm/tools/search/tool.mjs +4 -28
package/dist/esm/tools/search/tool.mjs.map +1 -1
package/dist/esm/tools/search/utils.mjs +3 -10
package/dist/esm/tools/search/utils.mjs.map +1 -1
package/dist/esm/tools/subagent/SubagentExecutor.mjs +48 -0
package/dist/esm/tools/subagent/SubagentExecutor.mjs.map +1 -1
package/dist/esm/types/graph.mjs.map +1 -1
package/dist/types/agents/AgentContext.d.ts +25 -95
package/dist/types/common/enum.d.ts +12 -12
package/dist/types/graphs/Graph.d.ts +2 -2
package/dist/types/graphs/phases/memoryFlushPhase.d.ts +2 -2
package/dist/types/hooks/HookRegistry.d.ts +1 -1
package/dist/types/hooks/matchers.d.ts +2 -2
package/dist/types/hooks/types.d.ts +1 -1
package/dist/types/index.d.ts +0 -1
package/dist/types/llm/bedrock/index.d.ts +1 -54
package/dist/types/llm/openai/index.d.ts +1 -1
package/dist/types/memory/citations.d.ts +4 -4
package/dist/types/memory/constants.d.ts +17 -17
package/dist/types/memory/mmr.d.ts +3 -3
package/dist/types/memory/paths.d.ts +1 -1
package/dist/types/memory/temporalDecay.d.ts +2 -2
package/dist/types/memory/types.d.ts +3 -3
package/dist/types/messages/format.d.ts +2 -5
package/dist/types/tools/CodeExecutor.d.ts +0 -6
package/dist/types/tools/ToolNode.d.ts +3 -3
package/dist/types/tools/memory/shared.d.ts +1 -1
package/dist/types/tools/search/test.d.ts +1 -0
package/dist/types/tools/search/types.d.ts +5 -99
package/dist/types/tools/search/utils.d.ts +2 -2
package/dist/types/tools/subagent/SubagentExecutor.d.ts +29 -0
package/dist/types/types/graph.d.ts +30 -34
package/dist/types/types/index.d.ts +0 -1
package/dist/types/types/messages.d.ts +1 -1
package/dist/types/types/run.d.ts +1 -3
package/dist/types/types/tools.d.ts +5 -14
package/package.json +1 -61
package/src/agents/AgentContext.test.ts +176 -0
package/src/agents/AgentContext.ts +179 -305
package/src/agents/__tests__/AgentContext.test.ts +0 -632
package/src/common/__tests__/enum.test.ts +1 -1
package/src/common/enum.ts +12 -12
package/src/graphs/Graph.ts +32 -13
package/src/graphs/MultiAgentGraph.ts +1 -1
package/src/graphs/gapFeatures.test.ts +1 -1
package/src/graphs/phases/__tests__/memoryFlushPhase.test.ts +1 -1
package/src/graphs/phases/memoryFlushPhase.ts +2 -2
package/src/hooks/HookRegistry.ts +1 -1
package/src/hooks/index.ts +1 -1
package/src/hooks/matchers.ts +2 -2
package/src/hooks/types.ts +1 -1
package/src/index.ts +0 -6
package/src/llm/anthropic/utils/message_inputs.ts +1 -10
package/src/llm/bedrock/__tests__/bedrock-caching.test.ts +18 -166
package/src/llm/bedrock/index.ts +41 -116
package/src/llm/openai/index.ts +2 -2
package/src/llm/openai/utils/index.ts +14 -31
package/src/memory/citations.ts +4 -4
package/src/memory/constants.ts +17 -17
package/src/memory/mmr.ts +3 -3
package/src/memory/paths.ts +1 -1
package/src/memory/recallTracking.ts +3 -3
package/src/memory/temporalDecay.ts +2 -2
package/src/memory/types.ts +3 -3
package/src/messages/cache.test.ts +24 -62
package/src/messages/cache.ts +0 -112
package/src/messages/ensureThinkingBlock.test.ts +1 -1
package/src/messages/format.ts +13 -92
package/src/messages/formatAgentMessages.test.ts +1 -1
package/src/scripts/subagent-configurable-inheritance.ts +263 -0
package/src/scripts/subagent-event-driven-debug.ts +2 -2
package/src/specs/anthropic.simple.test.ts +0 -61
package/src/specs/prune.orphans.test.ts +1 -1
package/src/tools/BashExecutor.ts +13 -37
package/src/tools/CodeExecutor.ts +14 -59
package/src/tools/ProgrammaticToolCalling.ts +14 -29
package/src/tools/ToolNode.ts +75 -14
package/src/tools/__tests__/CodeExecutor.test.ts +3 -3
package/src/tools/__tests__/ProgrammaticToolCalling.test.ts +0 -60
package/src/tools/__tests__/SubagentExecutor.test.ts +157 -0
package/src/tools/memory/memoryAppendTool.ts +1 -1
package/src/tools/memory/memoryGetTool.ts +2 -2
package/src/tools/memory/memorySearchTool.ts +3 -3
package/src/tools/memory/shared.ts +1 -1
package/src/tools/search/output.md +2775 -0
package/src/tools/search/search.ts +2 -12
package/src/tools/search/test.html +884 -0
package/src/tools/search/test.md +643 -0
package/src/tools/search/test.ts +159 -0
package/src/tools/search/tool.ts +2 -36
package/src/tools/search/types.ts +8 -133
package/src/tools/search/utils.ts +5 -13
package/src/tools/subagent/SubagentExecutor.ts +78 -0
package/src/types/graph.ts +27 -34
package/src/types/index.ts +0 -1
package/src/types/messages.ts +1 -1
package/src/types/run.ts +1 -3
package/src/types/tools.ts +5 -14
package/dist/cjs/langchain/google-common.cjs +0 -3
package/dist/cjs/langchain/google-common.cjs.map +0 -1
package/dist/cjs/langchain/index.cjs +0 -86
package/dist/cjs/langchain/index.cjs.map +0 -1
package/dist/cjs/langchain/language_models/chat_models.cjs +0 -3
package/dist/cjs/langchain/language_models/chat_models.cjs.map +0 -1
package/dist/cjs/langchain/messages/tool.cjs +0 -3
package/dist/cjs/langchain/messages/tool.cjs.map +0 -1
package/dist/cjs/langchain/messages.cjs +0 -51
package/dist/cjs/langchain/messages.cjs.map +0 -1
package/dist/cjs/langchain/openai.cjs +0 -3
package/dist/cjs/langchain/openai.cjs.map +0 -1
package/dist/cjs/langchain/prompts.cjs +0 -11
package/dist/cjs/langchain/prompts.cjs.map +0 -1
package/dist/cjs/langchain/runnables.cjs +0 -19
package/dist/cjs/langchain/runnables.cjs.map +0 -1
package/dist/cjs/langchain/tools.cjs +0 -23
package/dist/cjs/langchain/tools.cjs.map +0 -1
package/dist/cjs/langchain/utils/env.cjs +0 -11
package/dist/cjs/langchain/utils/env.cjs.map +0 -1
package/dist/cjs/llm/bedrock/cacheSupport.cjs +0 -55
package/dist/cjs/llm/bedrock/cacheSupport.cjs.map +0 -1
package/dist/cjs/tools/search/tavily-scraper.cjs +0 -189
package/dist/cjs/tools/search/tavily-scraper.cjs.map +0 -1
package/dist/cjs/tools/search/tavily-search.cjs +0 -372
package/dist/cjs/tools/search/tavily-search.cjs.map +0 -1
package/dist/cjs/types/agent-cache.cjs +0 -54
package/dist/cjs/types/agent-cache.cjs.map +0 -1
package/dist/esm/langchain/google-common.mjs +0 -2
package/dist/esm/langchain/google-common.mjs.map +0 -1
package/dist/esm/langchain/index.mjs +0 -5
package/dist/esm/langchain/index.mjs.map +0 -1
package/dist/esm/langchain/language_models/chat_models.mjs +0 -2
package/dist/esm/langchain/language_models/chat_models.mjs.map +0 -1
package/dist/esm/langchain/messages/tool.mjs +0 -2
package/dist/esm/langchain/messages/tool.mjs.map +0 -1
package/dist/esm/langchain/messages.mjs +0 -2
package/dist/esm/langchain/messages.mjs.map +0 -1
package/dist/esm/langchain/openai.mjs +0 -2
package/dist/esm/langchain/openai.mjs.map +0 -1
package/dist/esm/langchain/prompts.mjs +0 -2
package/dist/esm/langchain/prompts.mjs.map +0 -1
package/dist/esm/langchain/runnables.mjs +0 -2
package/dist/esm/langchain/runnables.mjs.map +0 -1
package/dist/esm/langchain/tools.mjs +0 -2
package/dist/esm/langchain/tools.mjs.map +0 -1
package/dist/esm/langchain/utils/env.mjs +0 -2
package/dist/esm/langchain/utils/env.mjs.map +0 -1
package/dist/esm/llm/bedrock/cacheSupport.mjs +0 -52
package/dist/esm/llm/bedrock/cacheSupport.mjs.map +0 -1
package/dist/esm/tools/search/tavily-scraper.mjs +0 -186
package/dist/esm/tools/search/tavily-scraper.mjs.map +0 -1
package/dist/esm/tools/search/tavily-search.mjs +0 -370
package/dist/esm/tools/search/tavily-search.mjs.map +0 -1
package/dist/esm/types/agent-cache.mjs +0 -52
package/dist/esm/types/agent-cache.mjs.map +0 -1
package/dist/types/langchain/google-common.d.ts +0 -1
package/dist/types/langchain/index.d.ts +0 -8
package/dist/types/langchain/language_models/chat_models.d.ts +0 -1
package/dist/types/langchain/messages/tool.d.ts +0 -1
package/dist/types/langchain/messages.d.ts +0 -2
package/dist/types/langchain/openai.d.ts +0 -1
package/dist/types/langchain/prompts.d.ts +0 -1
package/dist/types/langchain/runnables.d.ts +0 -2
package/dist/types/langchain/tools.d.ts +0 -2
package/dist/types/langchain/utils/env.d.ts +0 -1
package/dist/types/llm/bedrock/cacheSupport.d.ts +0 -35
package/dist/types/tools/search/tavily-scraper.d.ts +0 -19
package/dist/types/tools/search/tavily-search.d.ts +0 -4
package/dist/types/tools/subagent/types.d.ts +0 -84
package/dist/types/types/agent-cache.d.ts +0 -71
package/src/agents/__tests__/AgentContext.cacheTtl.live.test.ts +0 -259
package/src/agents/__tests__/AgentContext.crossAgentTier1.live.test.ts +0 -266
package/src/agents/__tests__/AgentContext.crossUserCache.live.test.ts +0 -342
package/src/langchain/google-common.ts +0 -1
package/src/langchain/index.ts +0 -8
package/src/langchain/language_models/chat_models.ts +0 -1
package/src/langchain/messages/tool.ts +0 -5
package/src/langchain/messages.ts +0 -21
package/src/langchain/openai.ts +0 -1
package/src/langchain/prompts.ts +0 -1
package/src/langchain/runnables.ts +0 -7
package/src/langchain/tools.ts +0 -8
package/src/langchain/utils/env.ts +0 -1
package/src/llm/anthropic/utils/server-tool-inputs.test.ts +0 -436
package/src/llm/bedrock/cacheSupport.test.ts +0 -99
package/src/llm/bedrock/cacheSupport.ts +0 -53
package/src/tools/search/tavily-scraper.ts +0 -235
package/src/tools/search/tavily-search.ts +0 -424
package/src/tools/search/tavily.test.ts +0 -965
package/src/tools/subagent/types.test.ts +0 -70
package/src/tools/subagent/types.ts +0 -115
package/src/types/agent-cache.ts +0 -74

package/src/agents/AgentContext.ts CHANGED

@@ -12,8 +12,6 @@ import type * as t from '@/types';
 import type { createPruneMessages } from '@/messages';
 import { createSchemaOnlyTools } from '@/tools/schema';
 import { ContentTypes, Providers } from '@/common';
-import { MAX_SYSTEM_CACHE_BLOCKS } from '@/types/agent-cache';
-import { isBedrockCacheSupported } from '@/llm/bedrock/cacheSupport';
 import { toJsonSchema } from '@/utils/schema';
 /**
@@ -39,9 +37,7 @@ export class AgentContext {
       toolEnd,
       toolRegistry,
       toolDefinitions,
-      system_cache_blocks,
       instructions,
-      instructions_cache_ttl,
       additional_instructions,
       streamBuffer,
       maxContextTokens,
@@ -56,6 +52,8 @@ export class AgentContext {
       persistedSummary,
       summarizationConfig,
       fileManifest,
+      system_cache_blocks,
+      instructions_cache_ttl,
     } = agentConfig;
     // Normalize structured output: support both camelCase and snake_case inputs
@@ -89,9 +87,7 @@ export class AgentContext {
       toolMap,
       toolRegistry,
       toolDefinitions,
-      systemCacheBlocks: system_cache_blocks,
       instructions,
-      instructionsCacheTtl: instructions_cache_ttl,
       additionalInstructions: additional_instructions,
       reasoningKey,
       toolEnd,
@@ -105,10 +101,12 @@ export class AgentContext {
       persistedSummary,
       summarizationConfig,
       fileManifest,
+      systemCacheBlocks: system_cache_blocks,
+      instructionsCacheTtl: instructions_cache_ttl,
     });
     /**
-     * Track subagent inputs on the context. `_sourceInputs`
+     * Track upstream-aligned subagent inputs on the context. `_sourceInputs`
      * preserves the original AgentInputs so SubagentExecutor can self-spawn
      * (`SubagentConfig.self === true`) without separate config; the other
      * two flow straight from agentConfig.
@@ -189,18 +187,9 @@ export class AgentContext {
   toolDefinitions?: t.LCTool[];
   /** Set of tool names discovered via tool search (to be loaded) */
   discoveredToolNames: Set<string> = new Set();
-  /**
-   * Cacheable system content blocks emitted before `instructions`. Each
-   * gets its own cache marker (cachePoint on Bedrock, cache_control on
-   * Anthropic). Earlier entries = wider cache key (best for cross-tenant
-   * sharing). See `src/types/agent-cache.ts`.
-   */
-  systemCacheBlocks?: t.SystemCacheBlock[];
-  /** Stable/cacheable instructions for this agent (gets trailing marker). */
+  /** Instructions for this agent */
   instructions?: string;
-  /** TTL for the trailing instructions cache marker. Defaults to '5m'. */
-  instructionsCacheTtl?: t.AgentCacheTTL;
-  /** Dynamic system tail (per-user / per-message — never cached). */
+  /** Additional instructions for this agent */
   additionalInstructions?: string;
   /**
    * Dynamic context that changes per-request (e.g., current time, user info).
@@ -279,6 +268,15 @@ export class AgentContext {
   summarizationConfig?: t.SummarizationConfig;
   /** Lightweight file manifest for file-aware compaction (IDs and names only, no content) */
   fileManifest?: t.FileManifestEntry[];
+  /**
+   * Workspace-shared system-message tiers. When set, each entry becomes a
+   * separate text block in the SystemMessage with its own cachePoint /
+   * cache_control marker, BEFORE the per-agent `instructions` block.
+   * See {@link t.AgentInputs.system_cache_blocks} for full semantics.
+   */
+  systemCacheBlocks?: Array<{ text: string; ttl?: '5m' | '1h' }>;
+  /** TTL hint for the per-agent instructions cache marker. Defaults to '5m'. */
+  instructionsCacheTtl?: '5m' | '1h';
   /** Original AgentInputs used to create this context — used for self-spawn subagent resolution. */
   _sourceInputs?: t.AgentInputs;
   /** Subagent configurations for hierarchical delegation. */
@@ -299,9 +297,7 @@ export class AgentContext {
     toolMap,
     toolRegistry,
     toolDefinitions,
-    systemCacheBlocks,
     instructions,
-    instructionsCacheTtl,
     additionalInstructions,
     dynamicContext,
     reasoningKey,
@@ -314,6 +310,8 @@ export class AgentContext {
     persistedSummary,
     summarizationConfig,
     fileManifest,
+    systemCacheBlocks,
+    instructionsCacheTtl,
   }: {
     agentId: string;
     name?: string;
@@ -327,9 +325,7 @@ export class AgentContext {
     toolMap?: t.ToolMap;
     toolRegistry?: t.LCToolRegistry;
     toolDefinitions?: t.LCTool[];
-    systemCacheBlocks?: t.SystemCacheBlock[];
     instructions?: string;
-    instructionsCacheTtl?: t.AgentCacheTTL;
     additionalInstructions?: string;
     dynamicContext?: string;
     reasoningKey?: 'reasoning_content' | 'reasoning';
@@ -344,6 +340,8 @@ export class AgentContext {
     persistedSummary?: string;
     summarizationConfig?: t.SummarizationConfig;
     fileManifest?: t.FileManifestEntry[];
+    systemCacheBlocks?: Array<{ text: string; ttl?: '5m' | '1h' }>;
+    instructionsCacheTtl?: '5m' | '1h';
   }) {
     this.agentId = agentId;
     this.name = name;
@@ -357,20 +355,7 @@ export class AgentContext {
     this.toolMap = toolMap;
     this.toolRegistry = toolRegistry;
     this.toolDefinitions = toolDefinitions;
-    if (
-      systemCacheBlocks &&
-      systemCacheBlocks.length > MAX_SYSTEM_CACHE_BLOCKS
-    ) {
-      throw new Error(
-        `system_cache_blocks supports at most ${MAX_SYSTEM_CACHE_BLOCKS} entries ` +
-          `(received ${systemCacheBlocks.length}); excess entries would exceed ` +
-          `Bedrock's 4-cachePoint per-request budget once the tools array and ` +
-          `trailing 'instructions' marker are counted. See src/types/agent-cache.ts.`,
-      );
-    }
-    this.systemCacheBlocks = systemCacheBlocks;
     this.instructions = instructions;
-    this.instructionsCacheTtl = instructionsCacheTtl;
     this.additionalInstructions = additionalInstructions;
     this.dynamicContext = dynamicContext;
     this.structuredOutput = structuredOutput;
@@ -378,6 +363,12 @@ export class AgentContext {
     this.persistedSummary = persistedSummary;
     this.summarizationConfig = summarizationConfig;
     this.fileManifest = fileManifest;
+    if (systemCacheBlocks && systemCacheBlocks.length > 0) {
+      this.systemCacheBlocks = systemCacheBlocks;
+    }
+    if (instructionsCacheTtl) {
+      this.instructionsCacheTtl = instructionsCacheTtl;
+    }
     if (reasoningKey) {
       this.reasoningKey = reasoningKey;
     }
@@ -605,11 +596,8 @@ export class AgentContext {
     }
     // Stale or first access - rebuild
-    this.cachedSystemRunnable = this.buildSystemRunnable({
-      systemCacheBlocks: this.systemCacheBlocks ?? [],
-      stableInstructions: this.buildStableInstructionsString(),
-      dynamicInstructions: this.buildDynamicInstructionsString(),
-    });
+    const instructionsString = this.buildInstructionsString();
+    this.cachedSystemRunnable = this.buildSystemRunnable(instructionsString);
     this.systemRunnableStale = false;
     return this.cachedSystemRunnable;
   }
@@ -620,27 +608,17 @@ export class AgentContext {
    */
   initializeSystemRunnable(): void {
     if (this.systemRunnableStale || this.cachedSystemRunnable === undefined) {
-      this.cachedSystemRunnable = this.buildSystemRunnable({
-        systemCacheBlocks: this.systemCacheBlocks ?? [],
-        stableInstructions: this.buildStableInstructionsString(),
-        dynamicInstructions: this.buildDynamicInstructionsString(),
-      });
+      const instructionsString = this.buildInstructionsString();
+      this.cachedSystemRunnable = this.buildSystemRunnable(instructionsString);
       this.systemRunnableStale = false;
     }
   }
   /**
-   * Builds the cacheable instructions string (without creating SystemMessage).
-   * Includes agent identity preamble, the agent's static instructions, and
-   * programmatic-only tool documentation. This is the part of the system
-   * message that stays byte-stable across turns and across users for the
-   * same agent — the prompt cache prefix.
-   *
-   * Per-user/per-message dynamic context belongs in
-   * `buildDynamicInstructionsString()` so it does not invalidate the cache
-   * marker. (See `feedback_cache_stability_invariant` for the rule.)
+   * Builds the raw instructions string (without creating SystemMessage).
+   * Includes agent identity preamble and handoff context when available.
    */
-  private buildStableInstructionsString(): string {
+  private buildInstructionsString(): string {
     const parts: string[] = [];
     /** Build agent identity and handoff context preamble */
@@ -654,27 +632,7 @@ export class AgentContext {
       parts.push(this.instructions);
     }
-    /** Add programmatic tools documentation */
-    const programmaticToolsDoc = this.buildProgrammaticOnlyToolsInstructions();
-    if (programmaticToolsDoc) {
-      parts.push(programmaticToolsDoc);
-    }
-    return parts.join('\n\n');
-  }
-  /**
-   * Builds the dynamic system-tail string (without creating SystemMessage).
-   * Keep this out of prompt-cache-marked content so volatile per-call
-   * context does not invalidate the stable prefix.
-   *
-   * `additional_instructions` is treated as dynamic (per-user/per-message
-   * memory, runtime context, etc.) and intentionally excluded from the
-   * cacheable prefix.
-   */
-  private buildDynamicInstructionsString(): string {
-    const parts: string[] = [];
+    /** Add additional instructions */
     if (
       this.additionalInstructions != null &&
       this.additionalInstructions !== ''
@@ -682,6 +640,12 @@ export class AgentContext {
       parts.push(this.additionalInstructions);
     }
+    /** Add programmatic tools documentation */
+    const programmaticToolsDoc = this.buildProgrammaticOnlyToolsInstructions();
+    if (programmaticToolsDoc) {
+      parts.push(programmaticToolsDoc);
+    }
     return parts.join('\n\n');
   }
@@ -737,168 +701,121 @@ export class AgentContext {
   }
   /**
-   * True when Anthropic prompt caching is enabled for this agent.
-   * Used by `buildSystemRunnable` to decide whether to emit a cache_control
-   * marker on the stable instructions prefix.
-   */
-  private hasAnthropicPromptCache(): boolean {
-    if (this.provider !== Providers.ANTHROPIC) {
-      return false;
-    }
-    const anthropicOptions = this.clientOptions as
-      | t.AnthropicClientOptions
-      | undefined;
-    return anthropicOptions?.promptCache === true;
-  }
-  /**
-   * True when Bedrock prompt caching is enabled for this agent AND the
-   * configured model supports `cachePoint` blocks. Only Claude (and Nova)
-   * models on Bedrock honour cachePoint — Llama / Titan reject it.
-   *
-   * Used by `buildSystemRunnable` to inline a `cachePoint` block right
-   * after the stable system text so the system prefix is cached at the
-   * AWS account level (cross-user, cross-conversation).
+   * Build system runnable from pre-built instructions string.
+   * Only called when content has actually changed.
    */
-  private hasBedrockPromptCache(): boolean {
-    if (this.provider !== Providers.BEDROCK) {
-      return false;
-    }
-    const bedrockOptions = this.clientOptions as
-      | (t.BedrockAnthropicClientOptions & {
-          model?: string;
-          bedrockCacheModelPatterns?: readonly RegExp[];
-        })
-      | undefined;
-    if (bedrockOptions?.promptCache !== true) {
-      return false;
-    }
-    /* Allowlist-based check (see src/llm/bedrock/cacheSupport.ts). The
-     * `bedrockCacheModelPatterns` clientOption lets consumers add new
-     * model patterns without forking the library — useful when AWS adds
-     * a new family before the next library release. */
-    return isBedrockCacheSupported(
-      bedrockOptions.model,
-      bedrockOptions.bedrockCacheModelPatterns,
-    );
-  }
-  /**
-   * Build system runnable from cacheable blocks + the trailing
-   * `instructions` block + optional dynamic tail.
-   *
-   *   ┌──────────────────────────────────────────┐
-   *   │ system_cache_blocks[0].text              │ ← consumer-defined block 0
-   *   ├──── cache marker (TTL = blocks[0].ttl) ──┤
-   *   │ system_cache_blocks[1].text              │ ← consumer-defined block 1
-   *   ├──── cache marker (TTL = blocks[1].ttl) ──┤
-   *   │ instructions                             │ ← per-agent stable
-   *   ├──── cache marker (TTL = instructionsCacheTtl) ┤
-   *   │ additional_instructions                  │ ← dynamic (uncached)
-   *   └──────────────────────────────────────────┘
-   *
-   * If `system_cache_blocks` is empty, behavior reduces to the 2-tier
-   * (instructions + dynamic) path used by simpler consumers.
-   *
-   * Provider-specific cache marker:
-   *   - Anthropic: `cache_control: { type: 'ephemeral', ttl?: '1h'|'5m' }` on
-   *     each cacheable text block. Up to 4 cache breakpoints per workspace.
-   *   - Bedrock (Claude/Nova): a `{ cachePoint: { type: 'default', ttl?: '1h'|'5m' } }`
-   *     block inserted after each cacheable section. Up to 4 cachePoints per
-   *     request, of which the tools array can consume up to 2.
-   *
-   * Cache key composition: every byte from message start to a given cache
-   * marker forms that marker's cache key. Earlier blocks = wider cache key
-   * = more cross-tenant share. Place the most stable content first.
-   */
-  private buildSystemRunnable({
-    systemCacheBlocks,
-    stableInstructions,
-    dynamicInstructions,
-  }: {
-    systemCacheBlocks: t.SystemCacheBlock[];
-    stableInstructions: string;
-    dynamicInstructions: string;
-  }):
+  private buildSystemRunnable(
+    instructionsString: string
+  ):
     | Runnable<
         BaseMessage[],
         (BaseMessage | SystemMessage)[],
         RunnableConfig<Record<string, unknown>>
       >
     | undefined {
-    const hasAnyCacheBlocks = systemCacheBlocks.length > 0;
-    if (!hasAnyCacheBlocks && !stableInstructions && !dynamicInstructions) {
+    if (!instructionsString) {
       // Remove previous tokens if we had a system message before
       this.instructionTokens -= this.systemMessageTokens;
       this.systemMessageTokens = 0;
       return undefined;
     }
-    const useAnthropicCache = this.hasAnthropicPromptCache();
-    const useBedrockCache = this.hasBedrockPromptCache();
-    const instructionsTtl: t.AgentCacheTTL = this.instructionsCacheTtl ?? '5m';
+    let finalInstructions: string | BaseMessageFields = instructionsString;
-    let finalInstructions: string | BaseMessageFields;
-    if (useAnthropicCache) {
-      type AnthropicTextBlock = {
-        type: 'text';
-        text: string;
-        cache_control?: { type: 'ephemeral'; ttl?: t.AgentCacheTTL };
-      };
-      const content: AnthropicTextBlock[] = [];
-      // Emit each system_cache_blocks entry with its own cache_control.
-      for (const block of systemCacheBlocks) {
-        if (!block.text) continue;
-        content.push({
-          type: 'text',
-          text: block.text,
-          cache_control: { type: 'ephemeral', ttl: block.ttl ?? '5m' },
-        });
-      }
-      // Trailing stable instructions block (also cacheable).
-      if (stableInstructions) {
-        content.push({
-          type: 'text',
-          text: stableInstructions,
-          cache_control: { type: 'ephemeral', ttl: instructionsTtl },
-        });
-      }
-      if (dynamicInstructions) {
-        // Dynamic tail: NO cache_control so it doesn't shift the cache prefix.
-        content.push({ type: 'text', text: dynamicInstructions });
-      }
-      finalInstructions = { content } as BaseMessageFields;
-    } else if (useBedrockCache && (hasAnyCacheBlocks || stableInstructions)) {
-      type BedrockBlock =
-        | { type: 'text'; text: string }
-        | { cachePoint: { type: 'default'; ttl?: t.AgentCacheTTL } };
-      const content: BedrockBlock[] = [];
-      // Emit each system_cache_blocks entry as text + cachePoint pair.
-      for (const block of systemCacheBlocks) {
-        if (!block.text) continue;
-        content.push({ type: 'text', text: block.text });
-        content.push({
-          cachePoint: { type: 'default', ttl: block.ttl ?? '5m' },
-        });
-      }
-      if (stableInstructions) {
-        content.push({ type: 'text', text: stableInstructions });
-        content.push({
-          cachePoint: { type: 'default', ttl: instructionsTtl },
-        });
-      }
-      if (dynamicInstructions) {
-        content.push({ type: 'text', text: dynamicInstructions });
+    /**
+     * Tiered system-message assembly. When `systemCacheBlocks` is set, build
+     * a multi-block SystemMessage with one cache breakpoint after tier 1:
+     *
+     *   [tier1_block_1]...[tier1_block_N][tier1_cachePoint]
+     *   [instructions]    (no cache marker of its own)
+     *
+     * Forward-prefix-hash means agents in the same workspace whose tier-1
+     * bytes are identical share the platform cache entry; only the per-agent
+     * `instructions` block invalidates per-agent.
+     *
+     * - Bedrock: emit one `cachePoint: { type: 'default' }` block after the
+     *   last tier-1 text (handled by `convertSystemMessageToConverseMessage`).
+     * - Anthropic: set `cache_control: { type: 'ephemeral' }` on the last
+     *   tier-1 text block only. (TTL hints are dropped — the SDK currently
+     *   only supports `'ephemeral'`. Bedrock cachePoint has no TTL knob.)
+     */
+    const hasTieredCache =
+      Array.isArray(this.systemCacheBlocks) &&
+      this.systemCacheBlocks.length > 0;
+    const isBedrock = this.provider === Providers.BEDROCK;
+    const isAnthropic = this.provider === Providers.ANTHROPIC;
+    const anthropicCacheEnabled =
+      isAnthropic &&
+      (this.clientOptions as t.AnthropicClientOptions | undefined)
+        ?.promptCache === true;
+    /**
+     * Bedrock cachePoint is Claude-only — Nova/Llama/Titan reject it.
+     * Mirrors the model check in `IllumaBedrockConverse.invocationParams`
+     * (src/llm/bedrock/index.ts:186-189).
+     */
+    const bedrockCacheEnabled =
+      isBedrock &&
+      (() => {
+        const opts = this.clientOptions as
+          | (t.BedrockAnthropicClientOptions & { model?: string })
+          | undefined;
+        const modelId = (opts?.model ?? '').toLowerCase();
+        const isClaudeModel =
+          modelId.includes('claude') || modelId.includes('anthropic');
+        return opts?.promptCache === true && isClaudeModel;
+      })();
+    if (hasTieredCache && (bedrockCacheEnabled || anthropicCacheEnabled)) {
+      /**
+       * Anthropic / Bedrock cap cache breakpoints at 4 per request. The
+       * lib already emits one for tools and up to two for messages, so we
+       * have at most 1 left for the system block. We spend it on Tier 1
+       * (the workspace-shared bytes) — per-agent Tier 2 caching is still
+       * achieved implicitly via the tools breakpoint that follows, since
+       * cache lookups are forward-prefix-hash.
+       *
+       * Tier 1 may itself be emitted as multiple text blocks (one per
+       * `systemCacheBlocks` entry); only the LAST gets the cache marker,
+       * the rest are plain text inside the same cached prefix.
+       */
+      const contentBlocks: Array<Record<string, unknown>> = [];
+      const tier1Blocks = this.systemCacheBlocks!.filter((b) => b?.text);
+      tier1Blocks.forEach((block, idx) => {
+        const isLast = idx === tier1Blocks.length - 1;
+        if (bedrockCacheEnabled) {
+          contentBlocks.push({ type: 'text', text: block.text });
+          if (isLast) {
+            contentBlocks.push({ cachePoint: { type: 'default' } });
+          }
+        } else if (isLast) {
+          contentBlocks.push({
+            type: 'text',
+            text: block.text,
+            cache_control: { type: 'ephemeral' },
+          });
+        } else {
+          contentBlocks.push({ type: 'text', text: block.text });
+        }
+      });
+      if (instructionsString) {
+        // No cache marker on the trailing per-agent block — tools'
+        // breakpoint covers it.
+        contentBlocks.push({ type: 'text', text: instructionsString });
       }
-      finalInstructions = { content } as unknown as BaseMessageFields;
-    } else {
-      finalInstructions = [
-        ...systemCacheBlocks.map((b) => b.text),
-        stableInstructions,
-        dynamicInstructions,
-      ]
-        .filter((part) => part !== '')
-        .join('\n\n');
+      finalInstructions = {
+        content: contentBlocks as unknown as BaseMessageFields['content'],
+      };
+    } else if (anthropicCacheEnabled) {
+      // Legacy single-block Anthropic caching (preserved for back-compat).
+      finalInstructions = {
+        content: [
+          {
+            type: 'text',
+            text: instructionsString,
+            cache_control: { type: 'ephemeral' },
+          },
+        ],
+      };
     }
     const systemMessage = new SystemMessage(finalInstructions);
@@ -974,49 +891,6 @@ export class AgentContext {
     }
   }
-  /** Active tool definitions for token accounting (excludes deferred-and-undiscovered entries
-   * and definitions whose `allowed_callers` exclude `'direct'`). Mirrors the gate
-   * `getEventDrivenToolsForBinding` applies so accounting and binding stay aligned. */
-  private getActiveToolDefinitions(): t.LCTool[] {
-    if (!this.toolDefinitions) {
-      return [];
-    }
-    return this.toolDefinitions.filter((def) => {
-      const allowedCallers = def.allowed_callers ?? ['direct'];
-      if (!allowedCallers.includes('direct')) {
-        return false;
-      }
-      return (
-        def.defer_loading !== true || this.discoveredToolNames.has(def.name)
-      );
-    });
-  }
-  /**
-   * Single source of truth for "which entries of `this.tools` should be
-   * treated as actually bound". Callers:
-   *   - `getToolsForBinding` (non-event-driven branch)
-   *   - `getEventDrivenToolsForBinding` (appends instance tools alongside
-   *     schema-only definitions)
-   *   - `calculateInstructionTokens` (counts schema bytes for accounting)
-   *
-   * In event-driven mode (`toolDefinitions` present) instance tools are
-   * appended unfiltered; outside event-driven mode they pass through
-   * `filterToolsForBinding`. Centralizing the decision here prevents the
-   * accounting/binding paths from drifting apart, which was the root
-   * cause of the original miscount (Fixes #121).
-   */
-  private getEffectiveInstanceTools(): t.GraphTools | undefined {
-    if (!this.tools) {
-      return undefined;
-    }
-    const isEventDriven = (this.toolDefinitions?.length ?? 0) > 0;
-    if (isEventDriven || !this.toolRegistry) {
-      return this.tools;
-    }
-    return this.filterToolsForBinding(this.tools);
-  }
   /**
    * Calculate tool tokens and add to instruction tokens
    * Note: System message tokens are calculated during systemRunnable creation
@@ -1034,17 +908,9 @@ export class AgentContext {
     // Reset per-tool breakdown
     this.toolsDetail = [];
-    /* Use `getEffectiveInstanceTools()` so accounting reflects exactly the
-     * subset that `getToolsForBinding` would emit — preventing the
-     * worst-case-ceiling miscount that triggered spurious `empty_messages`
-     * preflight rejections at low `maxContextTokens`. Deferred and
-     * non-`'direct'` `toolDefinitions` are excluded by
-     * `getActiveToolDefinitions()` below. */
-    const effectiveInstanceTools = this.getEffectiveInstanceTools();
     // Count tokens for bound tools (StructuredTool instances with .schema)
-    if (effectiveInstanceTools && effectiveInstanceTools.length > 0) {
-      for (const tool of effectiveInstanceTools) {
+    if (this.tools && this.tools.length > 0) {
+      for (const tool of this.tools) {
         const genericTool = tool as Record<string, unknown>;
         if (
           genericTool.schema != null &&
@@ -1073,27 +939,25 @@ export class AgentContext {
     // Count tokens for tool definitions (MCP / event-driven tools).
     // These are sent to the provider API as tool schemas alongside bound tools.
     // Both can be populated simultaneously (graph tools + MCP tools).
-    // Use `getActiveToolDefinitions()` so programmatic-only definitions
-    // (e.g. `allowed_callers: ['code_execution']`) and deferred-and-
-    // -undiscovered ones don't inflate `toolSchemaTokens` while never
-    // being bound to the model.
-    for (const def of this.getActiveToolDefinitions()) {
-      if (countedToolNames.has(def.name)) {
-        continue; // Already counted via this.tools
+    if (this.toolDefinitions && this.toolDefinitions.length > 0) {
+      for (const def of this.toolDefinitions) {
+        if (countedToolNames.has(def.name)) {
+          continue; // Already counted via this.tools
+        }
+        const schema = {
+          name: def.name,
+          description: def.description ?? '',
+          parameters: def.parameters ?? {},
+        };
+        const defTokens = tokenCounter(
+          new SystemMessage(JSON.stringify(schema))
+        );
+        this.toolsDetail.push({
+          name: def.name || 'unknown',
+          tokens: defTokens,
+        });
+        toolTokens += defTokens;
       }
-      const schema = {
-        name: def.name,
-        description: def.description ?? '',
-        parameters: def.parameters ?? {},
-      };
-      const defTokens = tokenCounter(
-        new SystemMessage(JSON.stringify(schema))
-      );
-      this.toolsDetail.push({
-        name: def.name || 'unknown',
-        tokens: defTokens,
-      });
-      toolTokens += defTokens;
     }
     // Store total tool tokens for breakdown reporting
@@ -1264,7 +1128,10 @@ export class AgentContext {
     }
     /** Traditional mode: filter actual tool instances */
-    const filtered = this.getEffectiveInstanceTools();
+    const filtered =
+      !this.tools || !this.toolRegistry
+        ? this.tools
+        : this.filterToolsForBinding(this.tools);
     if (this.graphTools && this.graphTools.length > 0) {
       return [...(filtered ?? []), ...this.graphTools];
@@ -1279,11 +1146,21 @@ export class AgentContext {
       return this.graphTools ?? [];
     }
-    /* Reuse `getActiveToolDefinitions()` so the binding gate matches the
-     * accounting filter exactly (single source of truth). */
-    const schemaTools = createSchemaOnlyTools(
-      this.getActiveToolDefinitions()
-    ) as t.GraphTools;
+    const defsToInclude = this.toolDefinitions.filter((def) => {
+      const allowedCallers = def.allowed_callers ?? ['direct'];
+      if (!allowedCallers.includes('direct')) {
+        return false;
+      }
+      if (
+        def.defer_loading === true &&
+        !this.discoveredToolNames.has(def.name)
+      ) {
+        return false;
+      }
+      return true;
+    });
+    const schemaTools = createSchemaOnlyTools(defsToInclude) as t.GraphTools;
     const allTools = [...schemaTools];
@@ -1291,9 +1168,6 @@ export class AgentContext {
       allTools.push(...this.graphTools);
     }
-    /* In event-driven mode, instance tools are appended UNFILTERED (matching
-     * `getEffectiveInstanceTools()`'s event-driven branch). Deferred /
-     * non-direct logic is represented in `toolDefinitions`, not here. */
     if (this.tools && this.tools.length > 0) {
       allTools.push(...this.tools);
     }