npm - @animus-labs/cortex - Versions diffs - 0.2.0 - Mend

@animus-labs/cortex 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (293) hide show

package/LICENSE +21 -0
package/README.md +73 -0
package/dist/budget-guard.d.ts +75 -0
package/dist/budget-guard.d.ts.map +1 -0
package/dist/budget-guard.js +142 -0
package/dist/budget-guard.js.map +1 -0
package/dist/compaction/compaction.d.ts +99 -0
package/dist/compaction/compaction.d.ts.map +1 -0
package/dist/compaction/compaction.js +302 -0
package/dist/compaction/compaction.js.map +1 -0
package/dist/compaction/failsafe.d.ts +57 -0
package/dist/compaction/failsafe.d.ts.map +1 -0
package/dist/compaction/failsafe.js +135 -0
package/dist/compaction/failsafe.js.map +1 -0
package/dist/compaction/index.d.ts +381 -0
package/dist/compaction/index.d.ts.map +1 -0
package/dist/compaction/index.js +979 -0
package/dist/compaction/index.js.map +1 -0
package/dist/compaction/microcompaction.d.ts +219 -0
package/dist/compaction/microcompaction.d.ts.map +1 -0
package/dist/compaction/microcompaction.js +536 -0
package/dist/compaction/microcompaction.js.map +1 -0
package/dist/compaction/observational/buffering.d.ts +225 -0
package/dist/compaction/observational/buffering.d.ts.map +1 -0
package/dist/compaction/observational/buffering.js +354 -0
package/dist/compaction/observational/buffering.js.map +1 -0
package/dist/compaction/observational/constants.d.ts +70 -0
package/dist/compaction/observational/constants.d.ts.map +1 -0
package/dist/compaction/observational/constants.js +507 -0
package/dist/compaction/observational/constants.js.map +1 -0
package/dist/compaction/observational/index.d.ts +219 -0
package/dist/compaction/observational/index.d.ts.map +1 -0
package/dist/compaction/observational/index.js +641 -0
package/dist/compaction/observational/index.js.map +1 -0
package/dist/compaction/observational/observer.d.ts +97 -0
package/dist/compaction/observational/observer.d.ts.map +1 -0
package/dist/compaction/observational/observer.js +424 -0
package/dist/compaction/observational/observer.js.map +1 -0
package/dist/compaction/observational/recall-tool.d.ts +27 -0
package/dist/compaction/observational/recall-tool.d.ts.map +1 -0
package/dist/compaction/observational/recall-tool.js +93 -0
package/dist/compaction/observational/recall-tool.js.map +1 -0
package/dist/compaction/observational/reflector.d.ts +94 -0
package/dist/compaction/observational/reflector.d.ts.map +1 -0
package/dist/compaction/observational/reflector.js +167 -0
package/dist/compaction/observational/reflector.js.map +1 -0
package/dist/compaction/observational/types.d.ts +271 -0
package/dist/compaction/observational/types.d.ts.map +1 -0
package/dist/compaction/observational/types.js +15 -0
package/dist/compaction/observational/types.js.map +1 -0
package/dist/context-manager.d.ts +134 -0
package/dist/context-manager.d.ts.map +1 -0
package/dist/context-manager.js +170 -0
package/dist/context-manager.js.map +1 -0
package/dist/cortex-agent.d.ts +1020 -0
package/dist/cortex-agent.d.ts.map +1 -0
package/dist/cortex-agent.js +3589 -0
package/dist/cortex-agent.js.map +1 -0
package/dist/error-classifier.d.ts +48 -0
package/dist/error-classifier.d.ts.map +1 -0
package/dist/error-classifier.js +152 -0
package/dist/error-classifier.js.map +1 -0
package/dist/event-bridge.d.ts +166 -0
package/dist/event-bridge.d.ts.map +1 -0
package/dist/event-bridge.js +381 -0
package/dist/event-bridge.js.map +1 -0
package/dist/index.d.ts +55 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +57 -0
package/dist/index.js.map +1 -0
package/dist/mcp-client.d.ts +119 -0
package/dist/mcp-client.d.ts.map +1 -0
package/dist/mcp-client.js +474 -0
package/dist/mcp-client.js.map +1 -0
package/dist/model-wrapper.d.ts +58 -0
package/dist/model-wrapper.d.ts.map +1 -0
package/dist/model-wrapper.js +86 -0
package/dist/model-wrapper.js.map +1 -0
package/dist/noop-logger.d.ts +4 -0
package/dist/noop-logger.d.ts.map +1 -0
package/dist/noop-logger.js +8 -0
package/dist/noop-logger.js.map +1 -0
package/dist/prompt-diagnostics.d.ts +47 -0
package/dist/prompt-diagnostics.d.ts.map +1 -0
package/dist/prompt-diagnostics.js +230 -0
package/dist/prompt-diagnostics.js.map +1 -0
package/dist/provider-manager.d.ts +224 -0
package/dist/provider-manager.d.ts.map +1 -0
package/dist/provider-manager.js +563 -0
package/dist/provider-manager.js.map +1 -0
package/dist/provider-registry.d.ts +115 -0
package/dist/provider-registry.d.ts.map +1 -0
package/dist/provider-registry.js +305 -0
package/dist/provider-registry.js.map +1 -0
package/dist/schema-converter.d.ts +20 -0
package/dist/schema-converter.d.ts.map +1 -0
package/dist/schema-converter.js +48 -0
package/dist/schema-converter.js.map +1 -0
package/dist/skill-preprocessor.d.ts +46 -0
package/dist/skill-preprocessor.d.ts.map +1 -0
package/dist/skill-preprocessor.js +237 -0
package/dist/skill-preprocessor.js.map +1 -0
package/dist/skill-registry.d.ts +107 -0
package/dist/skill-registry.d.ts.map +1 -0
package/dist/skill-registry.js +330 -0
package/dist/skill-registry.js.map +1 -0
package/dist/skill-tool.d.ts +54 -0
package/dist/skill-tool.d.ts.map +1 -0
package/dist/skill-tool.js +88 -0
package/dist/skill-tool.js.map +1 -0
package/dist/sub-agent-manager.d.ts +90 -0
package/dist/sub-agent-manager.d.ts.map +1 -0
package/dist/sub-agent-manager.js +192 -0
package/dist/sub-agent-manager.js.map +1 -0
package/dist/token-estimator.d.ts +23 -0
package/dist/token-estimator.d.ts.map +1 -0
package/dist/token-estimator.js +27 -0
package/dist/token-estimator.js.map +1 -0
package/dist/tool-contract.d.ts +68 -0
package/dist/tool-contract.d.ts.map +1 -0
package/dist/tool-contract.js +35 -0
package/dist/tool-contract.js.map +1 -0
package/dist/tool-result-persistence.d.ts +89 -0
package/dist/tool-result-persistence.d.ts.map +1 -0
package/dist/tool-result-persistence.js +152 -0
package/dist/tool-result-persistence.js.map +1 -0
package/dist/tools/bash/index.d.ts +71 -0
package/dist/tools/bash/index.d.ts.map +1 -0
package/dist/tools/bash/index.js +485 -0
package/dist/tools/bash/index.js.map +1 -0
package/dist/tools/bash/interactive.d.ts +47 -0
package/dist/tools/bash/interactive.d.ts.map +1 -0
package/dist/tools/bash/interactive.js +262 -0
package/dist/tools/bash/interactive.js.map +1 -0
package/dist/tools/bash/safety.d.ts +149 -0
package/dist/tools/bash/safety.d.ts.map +1 -0
package/dist/tools/bash/safety.js +1116 -0
package/dist/tools/bash/safety.js.map +1 -0
package/dist/tools/edit.d.ts +57 -0
package/dist/tools/edit.d.ts.map +1 -0
package/dist/tools/edit.js +310 -0
package/dist/tools/edit.js.map +1 -0
package/dist/tools/glob.d.ts +34 -0
package/dist/tools/glob.d.ts.map +1 -0
package/dist/tools/glob.js +268 -0
package/dist/tools/glob.js.map +1 -0
package/dist/tools/grep.d.ts +53 -0
package/dist/tools/grep.d.ts.map +1 -0
package/dist/tools/grep.js +673 -0
package/dist/tools/grep.js.map +1 -0
package/dist/tools/index.d.ts +62 -0
package/dist/tools/index.d.ts.map +1 -0
package/dist/tools/index.js +52 -0
package/dist/tools/index.js.map +1 -0
package/dist/tools/read.d.ts +43 -0
package/dist/tools/read.d.ts.map +1 -0
package/dist/tools/read.js +459 -0
package/dist/tools/read.js.map +1 -0
package/dist/tools/runtime.d.ts +62 -0
package/dist/tools/runtime.d.ts.map +1 -0
package/dist/tools/runtime.js +116 -0
package/dist/tools/runtime.js.map +1 -0
package/dist/tools/shared/cwd-tracker.d.ts +32 -0
package/dist/tools/shared/cwd-tracker.d.ts.map +1 -0
package/dist/tools/shared/cwd-tracker.js +44 -0
package/dist/tools/shared/cwd-tracker.js.map +1 -0
package/dist/tools/shared/edit-history.d.ts +55 -0
package/dist/tools/shared/edit-history.d.ts.map +1 -0
package/dist/tools/shared/edit-history.js +72 -0
package/dist/tools/shared/edit-history.js.map +1 -0
package/dist/tools/shared/edit-matcher.d.ts +83 -0
package/dist/tools/shared/edit-matcher.d.ts.map +1 -0
package/dist/tools/shared/edit-matcher.js +359 -0
package/dist/tools/shared/edit-matcher.js.map +1 -0
package/dist/tools/shared/file-mutation-lock.d.ts +22 -0
package/dist/tools/shared/file-mutation-lock.d.ts.map +1 -0
package/dist/tools/shared/file-mutation-lock.js +35 -0
package/dist/tools/shared/file-mutation-lock.js.map +1 -0
package/dist/tools/shared/gitignore.d.ts +17 -0
package/dist/tools/shared/gitignore.d.ts.map +1 -0
package/dist/tools/shared/gitignore.js +59 -0
package/dist/tools/shared/gitignore.js.map +1 -0
package/dist/tools/shared/pdf-extractor.d.ts +96 -0
package/dist/tools/shared/pdf-extractor.d.ts.map +1 -0
package/dist/tools/shared/pdf-extractor.js +196 -0
package/dist/tools/shared/pdf-extractor.js.map +1 -0
package/dist/tools/shared/read-registry.d.ts +66 -0
package/dist/tools/shared/read-registry.d.ts.map +1 -0
package/dist/tools/shared/read-registry.js +65 -0
package/dist/tools/shared/read-registry.js.map +1 -0
package/dist/tools/shared/safe-env.d.ts +18 -0
package/dist/tools/shared/safe-env.d.ts.map +1 -0
package/dist/tools/shared/safe-env.js +70 -0
package/dist/tools/shared/safe-env.js.map +1 -0
package/dist/tools/sub-agent.d.ts +91 -0
package/dist/tools/sub-agent.d.ts.map +1 -0
package/dist/tools/sub-agent.js +89 -0
package/dist/tools/sub-agent.js.map +1 -0
package/dist/tools/task-output.d.ts +38 -0
package/dist/tools/task-output.d.ts.map +1 -0
package/dist/tools/task-output.js +186 -0
package/dist/tools/task-output.js.map +1 -0
package/dist/tools/tool-search/index.d.ts +40 -0
package/dist/tools/tool-search/index.d.ts.map +1 -0
package/dist/tools/tool-search/index.js +110 -0
package/dist/tools/tool-search/index.js.map +1 -0
package/dist/tools/tool-search/registry.d.ts +82 -0
package/dist/tools/tool-search/registry.d.ts.map +1 -0
package/dist/tools/tool-search/registry.js +238 -0
package/dist/tools/tool-search/registry.js.map +1 -0
package/dist/tools/undo-edit.d.ts +51 -0
package/dist/tools/undo-edit.d.ts.map +1 -0
package/dist/tools/undo-edit.js +231 -0
package/dist/tools/undo-edit.js.map +1 -0
package/dist/tools/web-fetch/cache.d.ts +49 -0
package/dist/tools/web-fetch/cache.d.ts.map +1 -0
package/dist/tools/web-fetch/cache.js +89 -0
package/dist/tools/web-fetch/cache.js.map +1 -0
package/dist/tools/web-fetch/index.d.ts +53 -0
package/dist/tools/web-fetch/index.d.ts.map +1 -0
package/dist/tools/web-fetch/index.js +513 -0
package/dist/tools/web-fetch/index.js.map +1 -0
package/dist/tools/write.d.ts +59 -0
package/dist/tools/write.d.ts.map +1 -0
package/dist/tools/write.js +316 -0
package/dist/tools/write.js.map +1 -0
package/dist/types.d.ts +881 -0
package/dist/types.d.ts.map +1 -0
package/dist/types.js +16 -0
package/dist/types.js.map +1 -0
package/dist/working-tags.d.ts +44 -0
package/dist/working-tags.d.ts.map +1 -0
package/dist/working-tags.js +103 -0
package/dist/working-tags.js.map +1 -0
package/package.json +87 -0
package/src/budget-guard.ts +170 -0
package/src/compaction/compaction.ts +386 -0
package/src/compaction/failsafe.ts +185 -0
package/src/compaction/index.ts +1199 -0
package/src/compaction/microcompaction.ts +709 -0
package/src/compaction/observational/buffering.ts +430 -0
package/src/compaction/observational/constants.ts +532 -0
package/src/compaction/observational/index.ts +837 -0
package/src/compaction/observational/observer.ts +510 -0
package/src/compaction/observational/recall-tool.ts +130 -0
package/src/compaction/observational/reflector.ts +221 -0
package/src/compaction/observational/types.ts +343 -0
package/src/context-manager.ts +237 -0
package/src/cortex-agent.ts +4297 -0
package/src/error-classifier.ts +199 -0
package/src/event-bridge.ts +508 -0
package/src/index.ts +292 -0
package/src/mcp-client.ts +582 -0
package/src/model-wrapper.ts +128 -0
package/src/noop-logger.ts +9 -0
package/src/prompt-diagnostics.ts +296 -0
package/src/provider-manager.ts +823 -0
package/src/provider-registry.ts +386 -0
package/src/schema-converter.ts +51 -0
package/src/skill-preprocessor.ts +314 -0
package/src/skill-registry.ts +378 -0
package/src/skill-tool.ts +130 -0
package/src/sub-agent-manager.ts +236 -0
package/src/token-estimator.ts +26 -0
package/src/tool-contract.ts +113 -0
package/src/tool-result-persistence.ts +197 -0
package/src/tools/bash/index.ts +633 -0
package/src/tools/bash/interactive.ts +302 -0
package/src/tools/bash/safety.ts +1297 -0
package/src/tools/edit.ts +422 -0
package/src/tools/glob.ts +330 -0
package/src/tools/grep.ts +819 -0
package/src/tools/index.ts +110 -0
package/src/tools/read.ts +580 -0
package/src/tools/runtime.ts +173 -0
package/src/tools/shared/cwd-tracker.ts +50 -0
package/src/tools/shared/edit-history.ts +96 -0
package/src/tools/shared/edit-matcher.ts +457 -0
package/src/tools/shared/file-mutation-lock.ts +40 -0
package/src/tools/shared/gitignore.ts +61 -0
package/src/tools/shared/pdf-extractor.ts +290 -0
package/src/tools/shared/read-registry.ts +93 -0
package/src/tools/shared/safe-env.ts +82 -0
package/src/tools/sub-agent.ts +171 -0
package/src/tools/task-output.ts +236 -0
package/src/tools/tool-search/index.ts +167 -0
package/src/tools/tool-search/registry.ts +278 -0
package/src/tools/undo-edit.ts +314 -0
package/src/tools/web-fetch/cache.ts +112 -0
package/src/tools/web-fetch/index.ts +604 -0
package/src/tools/write.ts +385 -0
package/src/types.ts +1057 -0
package/src/working-tags.ts +118 -0

package/src/compaction/compaction.ts ADDED Viewed

@@ -0,0 +1,386 @@
+/**
+ * Layer 2: Conversation Summarization.
+ *
+ * Replaces older conversation history with an LLM-generated summary
+ * while preserving a tail of recent turns. Uses the primary model
+ * for summarization quality (the conversation history is structurally
+ * complex with interleaved tool calls and multi-turn reasoning).
+ *
+ * Fires at 70% of context window (configurable). Emits lifecycle
+ * events (onBeforeCompaction, onPostCompaction) for consumer
+ * coordination (e.g., observational memory flush).
+ *
+ * References:
+ *   - compaction-strategy.md (Layer 2: Conversation Summarization)
+ *   - phase-5-compaction.md (5.3)
+ */
+import type { AgentMessage } from '../context-manager.js';
+import type { CompactionConfig, CompactionResult, CompactionTarget } from '../types.js';
+import { estimateTokens } from '../token-estimator.js';
+import { extractTextContent, isToolUseMessage, isToolResultMessage } from './microcompaction.js';
+// ---------------------------------------------------------------------------
+// Defaults
+// ---------------------------------------------------------------------------
+/**
+ * Baseline Layer 2 settings: summarization is considered once usage reaches
+ * 70% of the context window, and the six most recent history entries are
+ * kept verbatim.
+ */
+export const COMPACTION_DEFAULTS: CompactionConfig = {
+  threshold: 0.7,
+  preserveRecentTurns: 6,
+};
+// ---------------------------------------------------------------------------
+// Summarization prompt (default system prompt for the summarizer; runCompaction uses it unless config.customPrompt is set)
+// ---------------------------------------------------------------------------
+const DEFAULT_SUMMARIZATION_PROMPT = `Your task is to create a detailed summary of the conversation so far. This summary will replace the conversation history, so it must capture everything needed to continue work without losing context. A small tail of the most recent turns is preserved separately and does not need to be repeated.
+Before writing your summary, analyze the conversation inside <analysis> tags. Walk through the conversation chronologically and note:
+- Each user request and how it was addressed
+- Key decisions and their rationale
+- Tool calls made, what they returned, and any errors
+- User feedback or corrections (especially when you were told to do something differently)
+- What was being worked on most recently
+The <analysis> block is a private scratchpad. Keep it concise (a line or two per point). Save all detail for the <summary> block.
+Then write your summary inside <summary> tags with the following sections:
+1. Primary Request and Intent
+   Capture all user requests and intents in detail. Preserve the user's exact words for directives, preferences, and constraints.
+2. Key Technical Concepts
+   List all important technical concepts, technologies, and frameworks discussed.
+3. Files and Code Sections
+   Enumerate specific files and code sections examined, modified, or created. Include file paths and relevant code snippets. For each file, summarize why it was read or edited and what changed.
+4. Tool Call Outcomes
+   What tools were called, what they found, and what failed. Include specific file paths, function names, URLs, error messages, and return values. Pay special attention to tool results that informed later decisions.
+5. Errors and Fixes
+   List all errors encountered and how they were resolved. Include specific user feedback received, especially corrections or redirections.
+6. All User Messages
+   List ALL user messages that are not tool results. These are critical for understanding the user's feedback and changing intent. Preserve the user's exact words.
+7. Problem Solving
+   Document problems solved and any ongoing troubleshooting efforts.
+8. Pending Tasks
+   Outline any pending tasks that have been explicitly requested but not yet completed.
+9. Current Work
+   Describe precisely what was being worked on immediately before this summary. Include file names, code snippets, and the specific state of the work. This section is the most important for seamless continuation.
+10. Key Decisions (Cumulative)
+    If a previous compaction summary exists in the conversation, carry forward its Key Decisions section and append any new decisions from this cycle. This section grows across compactions to prevent progressive loss of important decisions.
+11. Optional Next Step
+    List the next step related to the most recent work, but ONLY if it is directly in line with the user's most recent explicit request. If the last task was concluded, do not suggest tangential work. Include direct quotes from the conversation showing exactly what task was in progress.
+When preserving details, extract and retain exact values rather than paraphrasing:
+- File paths, directory names, and line numbers
+- URLs, API endpoints, and query parameters
+- Function names, class names, variable names
+- IDs, hashes, version numbers, and configuration values
+- Error messages and status codes
+- Specific quantities, dates, and thresholds
+Be thorough. Err on the side of including information that would prevent duplicate work or repeated mistakes.`;
+// ---------------------------------------------------------------------------
+// Summary extraction
+// ---------------------------------------------------------------------------
+/**
+ * Extract the <summary> content from the LLM's compaction output.
+ *
+ * The prompt asks for <analysis> (scratchpad) then <summary> (the actual
+ * summary). Resolution order:
+ * 1. A closed <summary>...</summary> element with non-blank content: return
+ *    that content, trimmed.
+ * 2. An opening <summary> tag with no closing tag at all (for example when
+ *    generation was cut off): return whatever follows the tag, trimmed.
+ * 3. Otherwise: return the output with every <analysis> block removed, or
+ *    the trimmed raw output if nothing is left after stripping (the model
+ *    may have skipped the tags but still produced useful content).
+ *
+ * A <summary> element whose content is empty or whitespace-only is handled
+ * by rule 3, so it never yields an empty string while the rest of the
+ * output still contains text.
+ *
+ * @param raw - The raw completion text returned by the summarizer
+ * @returns The best available summary text; empty only when `raw` is blank
+ */
+export function extractSummaryContent(raw: string): string {
+  const closed = /<summary>([\s\S]*?)<\/summary>/.exec(raw);
+  const closedBody = closed?.[1]?.trim();
+  if (closedBody) {
+    return closedBody;
+  }
+  // From here on the scratchpad is never part of the answer unless it is
+  // the only text available (last-resort return below).
+  const withoutAnalysis = raw.replace(/<analysis>[\s\S]*?<\/analysis>/g, '').trim();
+  if (!closed) {
+    // No closed element exists, so any opening tag belongs to a summary
+    // that was never terminated; keep the partial text after it.
+    const openTag = '<summary>';
+    const openAt = withoutAnalysis.indexOf(openTag);
+    if (openAt !== -1) {
+      const partial = withoutAnalysis.slice(openAt + openTag.length).trim();
+      if (partial) {
+        return partial;
+      }
+    }
+  }
+  return withoutAnalysis || raw.trim();
+}
+// ---------------------------------------------------------------------------
+// Summarization
+// ---------------------------------------------------------------------------
+/**
+ * Split the conversation into the span that will be summarized and the
+ * recent tail that is carried over untouched.
+ *
+ * @param history - The full conversation history (post-slot region)
+ * @param preserveRecentTurns - Number of trailing history entries to keep verbatim
+ * @returns `[target, preserved]`; `target` is empty (and `preserved` is the
+ *   input array itself) when there is nothing to summarize
+ */
+export function partitionHistory(
+  history: AgentMessage[],
+  preserveRecentTurns: number,
+): [AgentMessage[], AgentMessage[]] {
+  const total = history.length;
+  if (total <= preserveRecentTurns) {
+    return [[], history];
+  }
+  const nominalCut = total - preserveRecentTurns;
+  // A tool_result (user) must not be separated from the tool_use (assistant)
+  // right before it. When the nominal cut would fall between the two, pull
+  // the cut back by one so the whole pair lands in the preserved tail.
+  const cutIsInsideHistory = nominalCut > 0 && nominalCut < total;
+  const cutSplitsToolPair =
+    cutIsInsideHistory &&
+    isToolResultMessage(history[nominalCut]!) &&
+    isToolUseMessage(history[nominalCut - 1]!);
+  const cut = cutSplitsToolPair ? nominalCut - 1 : nominalCut;
+  // The adjustment can consume the only message left in the target.
+  if (cut <= 0) {
+    return [[], history];
+  }
+  return [history.slice(0, cut), history.slice(cut)];
+}
+/**
+ * Build the compaction summary message, wrapping the summary in
+ * <compaction-summary> XML tags.
+ *
+ * The `generated` attribute (ISO 8601) and the message's numeric
+ * `timestamp` field are derived from a single clock reading, so they always
+ * describe the same instant.
+ *
+ * @param summary - The LLM-generated summary text
+ * @param turnsCompacted - Number of turns that were summarized
+ * @returns A user-role message containing the tagged summary
+ */
+export function buildSummaryMessage(
+  summary: string,
+  turnsCompacted: number,
+): AgentMessage {
+  // Read the clock once; two separate reads can straddle a millisecond tick
+  // and leave the attribute and the field out of sync.
+  const now = new Date();
+  const content = `<compaction-summary generated="${now.toISOString()}" turns-summarized="${turnsCompacted}">\n${summary}\n</compaction-summary>`;
+  return { role: 'user', content, timestamp: now.getTime() };
+}
+/**
+ * Render conversation turns as the text block handed to the summarizer.
+ * Each turn becomes a "[Turn N] role:" header followed by its extracted
+ * text; turns are separated by a horizontal-rule line.
+ */
+export function formatTurnsForSummarization(turns: AgentMessage[]): string {
+  // Turns are rendered in full, with no per-turn truncation: the target is
+  // already bounded by partitionHistory (everything minus the preserved
+  // tail), and the summarizer needs the complete content for high-quality
+  // compression. See compaction-strategy.md Layer 2.
+  const renderTurn = (turn: AgentMessage, position: number): string => {
+    const body = extractTextContent(turn);
+    return `[Turn ${position + 1}] ${turn.role}:\n${body}`;
+  };
+  const rendered = turns.map(renderTurn);
+  return rendered.join('\n\n---\n\n');
+}
+/**
+ * Signature of the LLM call used to produce the summary: it receives a
+ * system prompt plus a message list and resolves to the completion text.
+ * Matches the signature of CortexAgent.directComplete().
+ */
+export type CompleteFn = (context: {
+  systemPrompt: string;
+  messages: Array<unknown>;
+}) => Promise<string>;
+/**
+ * Consumer hook run before summarization starts. runCompaction awaits each
+ * registered handler in order before calling the LLM.
+ */
+export type BeforeCompactionHandler = (target: CompactionTarget) => Promise<void>;
+/**
+ * Consumer hook run after the new history has been built. It is called
+ * synchronously and receives the compaction metrics.
+ */
+export type PostCompactionHandler = (result: CompactionResult) => void;
+/**
+ * Consumer hook notified when the summarization call fails.
+ */
+export type CompactionErrorHandler = (error: Error) => void;
+/**
+ * Run Layer 2 conversation summarization.
+ *
+ * Steps:
+ * 1. Partition history into target and preserved tail
+ * 2. Emit onBeforeCompaction (each handler awaited in order)
+ * 3. Generate summary via LLM
+ * 4. Build new history: [summary message] + [preserved tail]
+ * 5. Emit onPostCompaction
+ *
+ * The input array is left untouched; the returned history is a new array
+ * that reuses the preserved message objects.
+ *
+ * onCompactionError handlers are notified when the LLM call fails or when
+ * the model returns an empty summary. Exceptions thrown by
+ * onCompactionError or onPostCompaction handlers are swallowed; a rejection
+ * from an onBeforeCompaction handler propagates to the caller unchanged.
+ *
+ * @param history - Current conversation history (post-slot region)
+ * @param config - Compaction configuration
+ * @param complete - LLM completion function
+ * @param handlers - Consumer lifecycle handlers
+ * @param actualContextTokens - Actual full-context token count; see the
+ *   parameter comment below
+ * @returns The new conversation history and compaction result
+ * @throws Error when there is not enough history to compact, when the LLM
+ *   call fails (non-Error rejections are wrapped in an Error), or when the
+ *   extracted summary is empty
+ */
+export async function runCompaction(
+  history: AgentMessage[],
+  config: CompactionConfig,
+  complete: CompleteFn,
+  handlers: {
+    onBeforeCompaction?: BeforeCompactionHandler[];
+    onPostCompaction?: PostCompactionHandler[];
+    onCompactionError?: CompactionErrorHandler[];
+  } = {},
+  /** Actual full-context token count (includes system prompt, slots, tools). When provided, used as tokensBefore instead of text-only heuristic. */
+  actualContextTokens?: number,
+): Promise<{ newHistory: AgentMessage[]; result: CompactionResult }> {
+  const [target, preserved] = partitionHistory(history, config.preserveRecentTurns);
+  if (target.length === 0) {
+    // Nothing to compact; not enough history
+    throw new Error('Not enough conversation history to compact');
+  }
+  // Notify every onCompactionError handler. A handler that throws must not
+  // mask the original failure, so its exception is deliberately dropped.
+  const reportFailure = (failure: Error): void => {
+    for (const handler of handlers.onCompactionError ?? []) {
+      try {
+        handler(failure);
+      } catch {
+        // Swallow handler errors
+      }
+    }
+  };
+  // Compute text-only heuristic for history content.
+  const historyTextTokens = estimateTokens(
+    history.map(m => extractTextContent(m)).join('\n'),
+  );
+  // Use actual full-context token count when provided (includes system prompt,
+  // slots, tool definitions); fall back to text-only heuristic for backward compat.
+  const tokensBefore = actualContextTokens ?? historyTextTokens;
+  // Overhead = system prompt + slots + tool definitions (everything except history text).
+  // Used to compute tokensAfter on the same basis as tokensBefore.
+  const overhead = actualContextTokens ? Math.max(0, actualContextTokens - historyTextTokens) : 0;
+  // Build compaction target info for the event
+  const targetInfo: CompactionTarget = {
+    turnsToCompact: target.length,
+    estimatedTokens: estimateTokens(
+      target.map(m => extractTextContent(m)).join('\n'),
+    ),
+  };
+  // Emit onBeforeCompaction (awaited one at a time so consumers can finish
+  // their own work before the history is replaced)
+  for (const handler of handlers.onBeforeCompaction ?? []) {
+    await handler(targetInfo);
+  }
+  // Generate summary via LLM
+  const prompt = config.customPrompt ?? DEFAULT_SUMMARIZATION_PROMPT;
+  const turnsText = formatTurnsForSummarization(target);
+  let summary: string;
+  try {
+    summary = await complete({
+      systemPrompt: prompt,
+      messages: [
+        {
+          role: 'user',
+          content: `Here are the conversation turns to summarize:\n\n${turnsText}`,
+        },
+      ],
+    });
+  } catch (err) {
+    const error = err instanceof Error ? err : new Error(String(err));
+    reportFailure(error);
+    throw error;
+  }
+  // Extract summary content from <summary> tags, stripping <analysis>
+  const parsedSummary = extractSummaryContent(summary);
+  // An empty summary would replace the whole compaction target with nothing,
+  // silently discarding that part of the conversation. Treat it as a failed
+  // compaction so the caller keeps the original history.
+  if (parsedSummary.length === 0) {
+    const error = new Error('Compaction produced an empty summary');
+    reportFailure(error);
+    throw error;
+  }
+  // Build new history
+  const summaryMessage = buildSummaryMessage(parsedSummary, target.length);
+  const newHistory = [summaryMessage, ...preserved];
+  // Calculate result metrics. Include the same overhead (system prompt, slots,
+  // tool definitions) so tokensBefore and tokensAfter are on the same basis.
+  const newHistoryTextTokens = estimateTokens(
+    newHistory.map(m => extractTextContent(m)).join('\n'),
+  );
+  const tokensAfter = overhead + newHistoryTextTokens;
+  const summaryTokens = estimateTokens(parsedSummary);
+  // The oldest preserved turn's index in the original history.
+  // target.length is the split point: all turns before it were compacted.
+  const oldestPreservedIndex = target.length;
+  // Attempt to find a timestamp in the preserved messages; null if not found.
+  const oldestPreservedTimestamp = findOldestTimestamp(preserved);
+  const result: CompactionResult = {
+    tokensBefore,
+    tokensAfter,
+    turnsCompacted: target.length,
+    turnsPreserved: preserved.length,
+    summaryTokens,
+    oldestPreservedTimestamp,
+    oldestPreservedIndex,
+    summary: parsedSummary,
+  };
+  // Emit onPostCompaction. The compaction has already succeeded at this
+  // point, so a misbehaving observer must not turn it into a failure.
+  for (const handler of handlers.onPostCompaction ?? []) {
+    try {
+      handler(result);
+    } catch {
+      // Swallow handler errors
+    }
+  }
+  return { newHistory, result };
+}
+/**
+ * Best-effort lookup of a timestamp for the preserved messages.
+ *
+ * Walks the messages in order and returns the first ISO-8601-looking
+ * date-time (YYYY-MM-DDTHH:MM:SS) found in their extracted text. This is a
+ * heuristic only; consumers should prefer `oldestPreservedIndex` from
+ * CompactionResult and resolve the timestamp through their own database.
+ *
+ * @returns The matched date-time text, or null when no message contains one
+ */
+function findOldestTimestamp(messages: AgentMessage[]): string | null {
+  const isoPattern = /\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}/;
+  for (const candidate of messages) {
+    const hit = extractTextContent(candidate).match(isoPattern);
+    if (hit) {
+      return hit[0];
+    }
+  }
+  // Deliberately null rather than Date.now(): the caller can then tell that
+  // nothing was found and fall back to oldestPreservedIndex for
+  // database-level resolution.
+  return null;
+}
+/**
+ * Decide whether compaction should trigger: true when the used fraction of
+ * the context window has reached `threshold`. A non-positive context window
+ * never triggers.
+ */
+export function shouldCompact(
+  currentTokens: number,
+  contextWindow: number,
+  threshold: number,
+): boolean {
+  const windowIsUsable = contextWindow > 0;
+  return windowIsUsable && currentTokens / contextWindow >= threshold;
+}

package/src/compaction/failsafe.ts ADDED Viewed

@@ -0,0 +1,185 @@
+/**
+ * Layer 3: Emergency Truncation (Failsafe).
+ *
+ * Last-resort truncation when Layer 2 fails or context is still too large.
+ * Drops the oldest conversation turns purely mechanically (no LLM call).
+ * Preserves structural integrity: tool_use/tool_result pairs are dropped together.
+ *
+ * Triggers at 90% of context window (configurable), or reactively when
+ * the API returns a context overflow error.
+ *
+ * This layer also serves as a mid-loop safety valve: it fires inside
+ * transformContext during the agentic loop when estimated token count
+ * exceeds 90%. Mid-loop truncation does NOT emit onBeforeCompaction
+ * (no observational memory processing mid-loop).
+ *
+ * References:
+ *   - compaction-strategy.md (Layer 3: Emergency Truncation)
+ *   - phase-5-compaction.md (5.4)
+ */
+import type { AgentMessage } from '../context-manager.js';
+import type { FailsafeConfig } from '../types.js';
+import { estimateTokens } from '../token-estimator.js';
+import { isToolResultMessage, isToolUseMessage, extractTextContent } from './microcompaction.js';
+// ---------------------------------------------------------------------------
+// Defaults
+// ---------------------------------------------------------------------------
+/** Default Layer 3 trigger: 90% of the context window. */
+export const FAILSAFE_DEFAULTS: FailsafeConfig = { threshold: 0.9 };
+/**
+ * Number of trailing history entries emergency truncation never drops.
+ * Deliberately smaller than the Layer 2 tail because this layer is a last
+ * resort.
+ */
+const FAILSAFE_PRESERVE_TURNS = 3;
+// ---------------------------------------------------------------------------
+// Truncation
+// ---------------------------------------------------------------------------
+/**
+ * Result of an emergency truncation operation, as returned by emergencyTruncate.
+ */
+export interface FailsafeTruncationResult {
+  /** The truncated conversation history: the input messages that were not dropped, in their original order. */
+  newHistory: AgentMessage[];
+  /** Number of messages removed from the input history. */
+  turnsRemoved: number;
+  /** Estimated tokens after truncation; the figure includes the slot token estimate passed to emergencyTruncate. */
+  tokensAfter: number;
+}
+/**
+ * Locate tool_use / tool_result pairs in the conversation history.
+ *
+ * A tool_use message immediately followed by a tool_result message forms a
+ * pair that must be dropped as a unit. The returned map has an entry for
+ * both indices of every pair, each pointing at the same
+ * `[useIndex, resultIndex]` array. Indices that are not part of a pair have
+ * no entry.
+ */
+function findStructuralPairs(history: AgentMessage[]): Map<number, number[]> {
+  const pairs = new Map<number, number[]>();
+  for (const [useIdx, message] of history.entries()) {
+    if (!isToolUseMessage(message)) {
+      continue;
+    }
+    // Only the directly following message can be the matching tool_result.
+    const resultIdx = useIdx + 1;
+    if (resultIdx >= history.length) {
+      continue;
+    }
+    if (!isToolResultMessage(history[resultIdx]!)) {
+      continue;
+    }
+    const linked = [useIdx, resultIdx];
+    pairs.set(useIdx, linked);
+    pairs.set(resultIdx, linked);
+  }
+  return pairs;
+}
+/**
+ * Mechanically shrink the conversation history (no LLM call).
+ *
+ * Messages are dropped oldest-first, with tool_use/tool_result pairs removed
+ * as a unit, until the running token estimate is no longer above
+ * `contextWindow * threshold` or only the protected tail is left. The last
+ * FAILSAFE_PRESERVE_TURNS entries are never dropped, and a pair that reaches
+ * into that tail is kept whole.
+ *
+ * @param history - Conversation history (post-slot region)
+ * @param contextWindow - Total context window size in tokens
+ * @param slotTokens - Estimated tokens used by slots
+ * @param threshold - Usage ratio threshold (default 0.90)
+ * @returns The surviving history, the number of messages removed, and the
+ *   running token estimate (slot tokens included) after removal
+ */
+export function emergencyTruncate(
+  history: AgentMessage[],
+  contextWindow: number,
+  slotTokens: number,
+  threshold: number = FAILSAFE_DEFAULTS.threshold,
+): FailsafeTruncationResult {
+  if (history.length === 0) {
+    return { newHistory: [], turnsRemoved: 0, tokensAfter: slotTokens };
+  }
+  const budget = contextWindow * threshold;
+  const pairs = findStructuralPairs(history);
+  const removed = new Set<number>();
+  // Start from the estimate for the whole history plus the slots, then
+  // subtract each dropped message's own estimate as we go.
+  const joinedText = history.map(m => extractTextContent(m)).join('\n');
+  let remaining = slotTokens + estimateTokens(joinedText);
+  // First index of the protected tail; nothing at or after it may be dropped.
+  const tailStart = Math.max(0, history.length - FAILSAFE_PRESERVE_TURNS);
+  for (let cursor = 0; cursor < tailStart && remaining > budget; cursor++) {
+    // Already removed as the second half of an earlier pair.
+    if (removed.has(cursor)) {
+      continue;
+    }
+    // Everything that has to go together with this message.
+    const group = pairs.get(cursor) ?? [cursor];
+    // A pair straddling the tail boundary stays intact in the history.
+    if (group.some(idx => idx >= tailStart)) {
+      continue;
+    }
+    for (const idx of group) {
+      remaining -= estimateTokens(extractTextContent(history[idx]!));
+      removed.add(idx);
+    }
+  }
+  const newHistory = history.filter((_, idx) => !removed.has(idx));
+  return {
+    newHistory,
+    turnsRemoved: removed.size,
+    tokensAfter: remaining,
+  };
+}
+/**
+ * Decide whether emergency truncation should fire: true when the used
+ * fraction of the context window has reached `threshold`, which defaults to
+ * FAILSAFE_DEFAULTS.threshold. A non-positive context window never fires.
+ */
+export function shouldTruncate(
+  currentTokens: number,
+  contextWindow: number,
+  threshold: number = FAILSAFE_DEFAULTS.threshold,
+): boolean {
+  const windowIsUsable = contextWindow > 0;
+  return windowIsUsable && currentTokens / contextWindow >= threshold;
+}
+/**
+ * Tell whether an error looks like a context-overflow failure.
+ *
+ * The error message is lower-cased and checked for any of a fixed list of
+ * substrings that match common API error patterns from various providers.
+ */
+export function isContextOverflow(error: Error): boolean {
+  const haystack = error.message.toLowerCase();
+  const overflowMarkers = [
+    'context_length_exceeded',
+    'context window',
+    'maximum context length',
+    'token limit',
+    'too many tokens',
+    'request too large',
+    'prompt is too long',
+    'input too long',
+  ];
+  return overflowMarkers.some(marker => haystack.includes(marker));
+}