npm - @digitalforgestudios/openclaw-sulcus - Versions diffs - 5.4.0 → 6.1.0 - Mend

@digitalforgestudios/openclaw-sulcus 5.4.0 → 6.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6) hide show

package/index.ts CHANGED Viewed

@@ -1,44 +1,205 @@
+// @ts-nocheck
 import { resolve } from "node:path";
-import { existsSync, mkdirSync } from "node:fs";
+import { existsSync, mkdirSync, readFileSync, writeFileSync } from "node:fs";
 import * as https from "node:https";
 import * as http from "node:http";
 import { URL } from "node:url";
 import { Type } from "@sinclair/typebox";
-// ─── STATIC AWARENESS ───────────────────────────────────────────────────────
+// --- SESSION SCOPE (Task 30) -------------------------------------------------------
+// Each plugin instance gets a unique session ID at init time.
+// Session memories are stored under `session:<id>` namespace prefix and
+// auto-purged on agent_end so they never outlive the conversation.
-function buildStaticAwareness(backendMode: string, namespace: string): string {
-  return `## Persistent Memory (Sulcus)
-You have Sulcus — a persistent, reactive, thermodynamic memory system with reactive triggers.
-Memories survive across sessions. They have heat (0.0–1.0) that decays over time.
+/**
+ * Build a session identifier of the form `<timestamp>-<random>`, both base-36.
+ *
+ * The random suffix is always exactly six characters: `Math.random().toString(36)`
+ * can produce fewer than six fractional digits (0.5 renders as "0.i"), so the
+ * slice is right-padded with zeros to keep the ID shape stable.
+ * `Math.random` is not cryptographically secure; do not treat the ID as a secret.
+ *
+ * @returns A new identifier such as `lx3k9f2a-4hq0zt`.
+ */
+function generateSessionId(): string {
+  const ts = Date.now().toString(36);
+  const rand = Math.random().toString(36).slice(2, 8).padEnd(6, "0");
+  return `${ts}-${rand}`;
+}
+// Module-scope session ID — reset on gateway restart (which is the right behavior).
+// Each plugin load gets fresh ephemeral context.
+const CURRENT_SESSION_ID = generateSessionId();
+// Track IDs of session-scoped memories so we can purge them on agent_end.
+// Using a Set so dedup is free and lookup is O(1).
+const sessionMemoryIds = new Set<string>();
+// --- SULCUS.TOML CONFIG LAYER (Task 69) ------------------------------------
+// Optional `~/.sulcus/sulcus.toml` config file. Provides file-based defaults
+// that are merged with the plugin UI config (which wins on conflict).
+// Precedence: pluginConfig (OpenClaw UI) > sulcus.toml > built-in defaults.
+//
+// Supported types: string, number, boolean, inline arrays of strings.
+// Supports [sections] which map to nested objects (e.g. [guardrails.outputGuard]).
+// Lines starting with # are comments.
+/** Flat key-value result from TOML parse — nested keys joined with dots. */
+type TomlFlat = Record<string, string | number | boolean | string[]>;
+/**
+ * Remove a trailing `# comment` from a TOML line, ignoring `#` characters that
+ * sit inside single- or double-quoted strings.
+ * If a quote is never closed (e.g. a bare `don't`), fall back to cutting at the
+ * first `#`, so unquoted values keep working.
+ */
+function stripTomlComment(text: string): string {
+  let quote = "";
+  for (let i = 0; i < text.length; i++) {
+    const ch = text[i];
+    if (quote) {
+      if (ch === "\\" && quote === '"') i++; // skip the escaped character in a basic string
+      else if (ch === quote) quote = "";
+    } else if (ch === '"' || ch === "'") {
+      quote = ch;
+    } else if (ch === "#") {
+      return text.slice(0, i).trimEnd();
+    }
+  }
+  return quote ? text.replace(/\s*#.*$/, "") : text;
+}
+/** Split the inside of an inline array on commas that are not inside quotes. */
+function splitTomlArray(inner: string): string[] {
+  const items: string[] = [];
+  let quote = "";
+  let item = "";
+  for (const ch of inner) {
+    if (ch === "," && !quote) {
+      items.push(item);
+      item = "";
+      continue;
+    }
+    if (quote) {
+      if (ch === quote) quote = "";
+    } else if (ch === '"' || ch === "'") {
+      quote = ch;
+    }
+    item += ch;
+  }
+  items.push(item);
+  return items;
+}
+/**
+ * Minimal TOML parser for sulcus.toml.
+ * Supports: scalar string/number/boolean values, inline string arrays,
+ * [section] and [section.subsection] headers, # comments (full-line and trailing).
+ * Does NOT support multi-line strings, inline tables, or date types.
+ *
+ * Comments are stripped with quote awareness, so `color = "#fff"` keeps its value
+ * and `[section] # note` is still recognised as a header. Lines with an empty key
+ * or an empty value (`key =`) are skipped instead of being stored as `0`.
+ *
+ * @param raw  Full text of the TOML file.
+ * @returns Flat map whose keys are `section.key` (or just `key` outside any section).
+ */
+function parseSulcusToml(raw: string): TomlFlat {
+  const result: TomlFlat = {};
+  let section = "";
+  for (const rawLine of raw.split("\n")) {
+    // Strip comments before classifying the line so headers may carry a trailing note.
+    const line = stripTomlComment(rawLine.trim());
+    if (!line) continue;
+    // Section header: [section] or [section.sub]
+    if (line.startsWith("[") && line.endsWith("]")) {
+      section = line.slice(1, -1).trim();
+      continue;
+    }
+    // Key = value
+    const eqIdx = line.indexOf("=");
+    if (eqIdx === -1) continue;
+    const rawKey = line.slice(0, eqIdx).trim();
+    const value = line.slice(eqIdx + 1).trim();
+    // Invalid TOML; skipping also avoids Number("") === 0 turning `key =` into 0.
+    if (!rawKey || !value) continue;
+    let parsed: string | number | boolean | string[];
+    if (value === "true" || value === "false") {
+      parsed = value === "true";
+    } else if (value.startsWith("[") && value.endsWith("]")) {
+      // Inline array of strings: ["a", "b"] or ['a', 'b']
+      parsed = splitTomlArray(value.slice(1, -1))
+        .map(s => s.trim().replace(/^["']|["']$/g, ""))
+        .filter(Boolean);
+    } else if (
+      value.length >= 2 &&
+      ((value.startsWith('"') && value.endsWith('"')) ||
+        (value.startsWith("'") && value.endsWith("'")))
+    ) {
+      parsed = value.slice(1, -1);
+    } else {
+      // Bare token: a number if it parses as one, otherwise kept as a string.
+      const num = Number(value);
+      parsed = Number.isNaN(num) ? value : num;
+    }
+    result[section ? `${section}.${rawKey}` : rawKey] = parsed;
+  }
+  return result;
+}
+/**
+ * Expand dotted keys into nested objects.
+ * "guardrails.outputGuard.enabled" → { guardrails: { outputGuard: { enabled: … } } }
+ *
+ * Keys with a `__proto__` segment are dropped: reading `cur["__proto__"]` yields
+ * `Object.prototype`, so descending into it would let a config file write
+ * properties onto every object in the process.
+ * An intermediate segment that already holds a scalar or an array is replaced
+ * by a fresh object so the deeper key can be stored.
+ *
+ * @param flat  Flat map with dot-joined keys.
+ * @returns A new nested object; `flat` is not modified.
+ */
+function expandTomlKeys(flat: TomlFlat): Record<string, unknown> {
+  const out: Record<string, unknown> = {};
+  for (const [key, value] of Object.entries(flat)) {
+    const parts = key.split(".");
+    if (parts.includes("__proto__")) continue;
+    const leaf = parts.pop() as string;
+    let cur = out;
+    for (const part of parts) {
+      const next = cur[part];
+      if (typeof next !== "object" || next === null || Array.isArray(next)) {
+        cur[part] = {};
+      }
+      cur = cur[part] as Record<string, unknown>;
+    }
+    cur[leaf] = value;
+  }
+  return out;
+}
-**Connection:** Backend: ${backendMode} | Namespace: ${namespace}
+/**
+ * Load and parse sulcus.toml from disk.
+ * Returns an empty object if the file doesn't exist or can't be read or parsed.
+ *
+ * @param configPath  Override path; defaults to `<home>/.sulcus/sulcus.toml`, where
+ *                    `<home>` is `$HOME`, else `%USERPROFILE%` (Windows).
+ * @param logger      Optional logger: `info` on a successful load, `warn` on failure.
+ * @returns Nested config object (dotted keys expanded), or `{}`.
+ */
+function loadSulcusToml(
+  configPath?: string,
+  logger?: { warn: (s: string) => void; info: (s: string) => void }
+): Record<string, unknown> {
+  // A literal "~" is never expanded by the OS, so it is only the last resort.
+  const home = process.env.HOME || process.env.USERPROFILE || "~";
+  const tomlPath = configPath ?? resolve(home, ".sulcus/sulcus.toml");
+  if (!existsSync(tomlPath)) {
+    return {};
+  }
+  try {
+    const flat = parseSulcusToml(readFileSync(tomlPath, "utf8"));
+    const expanded = expandTomlKeys(flat);
+    logger?.info(`sulcus: loaded sulcus.toml (${Object.keys(flat).length} keys) from ${tomlPath}`);
+    return expanded;
+  } catch (err: unknown) {
+    // Anything can be thrown; only Error instances have a usable message.
+    const reason = err instanceof Error ? err.message : String(err);
+    logger?.warn(`sulcus: failed to parse sulcus.toml at ${tomlPath}: ${reason}`);
+    return {};
+  }
+}
-**Your memory tools:**
-- \`memory_store\` — Save important information (preferences, facts, procedures, decisions, lessons)
-  Parameters: content, memory_type (episodic|semantic|preference|procedural|fact)
-- \`memory_recall\` — Search memories semantically. Use before answering about past work, decisions, or people.
-  Parameters: query, limit
+/**
+ * Deep-merge two config objects.
+ * `override` wins on scalar conflicts; nested plain objects are merged recursively;
+ * arrays are replaced wholesale, never concatenated.
+ * Used to merge sulcus.toml (base) with pluginConfig (override).
+ *
+ * Two kinds of override entries are ignored:
+ *  - `undefined` values: an unset option must not erase a value supplied by `base`;
+ *  - an own `__proto__` key (possible after `JSON.parse`): assigning it would
+ *    replace the result's prototype instead of storing a setting.
+ *
+ * @param base      Lower-precedence config.
+ * @param override  Higher-precedence config.
+ * @returns A new object; neither input is mutated.
+ */
+function mergeConfig(
+  base: Record<string, unknown>,
+  override: Record<string, unknown>
+): Record<string, unknown> {
+  const isPlainObject = (v: unknown): v is Record<string, unknown> =>
+    v !== null && typeof v === "object" && !Array.isArray(v);
+  const result: Record<string, unknown> = { ...base };
+  for (const [key, val] of Object.entries(override)) {
+    if (key === "__proto__" || val === undefined) continue;
+    // Only own properties count as "existing"; inherited ones are not config.
+    const existing = Object.prototype.hasOwnProperty.call(result, key) ? result[key] : undefined;
+    result[key] =
+      isPlainObject(val) && isPlainObject(existing)
+        ? mergeConfig(existing, val) // both sides are objects — recurse
+        : val; // scalar, array or null — override wins
+  }
+  return result;
+}
-**When to store:** User states a preference, important decision made, correction given, lesson learned, anything worth surviving this session.
-**When to search:** Questions about prior work/decisions, context seems incomplete, user references past conversations.
+// --- STATIC AWARENESS -------------------------------------------------------
+// Task 12: XML-structured injection — static awareness uses the same
+// <sulcus_context> envelope as the dynamic recall path for LLM consistency.
-**Memory types:** episodic (events, fast decay) · semantic (knowledge, slow) · preference (opinions, slower) · procedural (how-tos, slowest) · fact (data, slow)`;
+/**
+ * Build the static awareness banner wrapped in a `<sulcus_context>` envelope.
+ *
+ * @param backendMode  Backend label written to the `backend` attribute.
+ * @param namespace    Namespace written to the `namespace` attribute.
+ * @returns The three-line envelope text.
+ */
+function buildStaticAwareness(backendMode: string, namespace: string): string {
+  // Minimal awareness — tool schemas handle parameter docs.
+  // One sentence: you have memory, it's thermodynamic, it's automatic.
+  // Attribute values are escaped so a value containing `"`, `<`, `>` or `&`
+  // cannot terminate the attribute or the opening tag early.
+  const attr = (value: string): string =>
+    String(value)
+      .replace(/&/g, "&amp;")
+      .replace(/"/g, "&quot;")
+      .replace(/</g, "&lt;")
+      .replace(/>/g, "&gt;");
+  return `<sulcus_context backend="${attr(backendMode)}" namespace="${attr(namespace)}">
+You have Sulcus — persistent, thermodynamic memory. Memories survive across sessions with heat (0.0\u20131.0) that decays over time. Context is injected automatically each turn.
+</sulcus_context>`;
 }
 let STATIC_AWARENESS = buildStaticAwareness("local", "default");
-const FALLBACK_AWARENESS = `<sulcus_context token_budget="500">
-  <cheatsheet>
-    You have Sulcus — persistent memory with reactive triggers.
-    STORE:    memory_store (content, memory_type)
-    FIND:     memory_recall (query, limit)
-    TYPES:    episodic (fast fade), semantic (slow), preference, procedural (slowest), fact
-    Context build failed this turn — use memory_recall to search manually.
-  </cheatsheet>
+// Fallback when recall fails — same minimal awareness, plus a hint to search manually.
+const FALLBACK_AWARENESS = `<sulcus_context token_budget="4000">
+You have Sulcus — persistent memory. Context build failed this turn. Use memory_recall to search manually.
 </sulcus_context>`;
-// ─── HOOKS CONFIG TYPES ──────────────────────────────────────────────────────
+// --- HOOKS CONFIG TYPES ------------------------------------------------------
 interface HookConfig {
   action: string;
@@ -69,6 +230,12 @@ interface HookHandlerCtx {
   storeLibPath?: string;
   vectorsLibPath?: string;
   wasmDir?: string;
+  boostOnRecall?: boolean;
+  profileFrequency?: number;
+  /** Task 66: configurable token budget for recall context injection. Default: 4000. */
+  tokenBudget?: number;
+  /** Task 102: model context window size in tokens. Default: 200000. */
+  contextWindowSize?: number;
 }
 interface PluginLogger {
@@ -80,7 +247,324 @@ interface PluginLogger {
 type HookHandler = (event: Record<string, unknown>, config: HookConfig, ctx: HookHandlerCtx) => Promise<unknown>;
-// ─── HOOK HANDLERS ───────────────────────────────────────────────────────────
+// --- GUARDRAILS (Task 54) --------------------------------------------------
+// Memory-aware output guard. Intercepts agent output before delivery.
+// Two hooks: llm_output (fast pre-analysis, regex only) + message_sending (enforcement).
+// All disabled by default — opt-in via guardrails.outputGuard.enabled in plugin config.
+interface PiiPattern {
+  name: string;  // identifier compared against the active pattern names, e.g. "email"
+  regex: RegExp; // detector; scanForPii builds a fresh RegExp from its source before matching
+}
+interface PiiSpan {
+  start: number;       // offset of the match in the scanned text
+  end: number;         // offset just past the match (exclusive)
+  type: string;        // name of the pattern that produced the match
+  redactionId: string; // random id embedded in the [REDACTED-<id>] marker
+}
+interface SulcusGuardFlags {
+  piiDetected: boolean;
+  piiSpans: PiiSpan[];
+  suspectedPreferenceViolation: boolean;
+  suspectedViolationReason?: string;
+  scanTimeMs: number; // presumably the scan duration in milliseconds — confirm at the producing hook
+}
+interface OutputGuardConfig {
+  enabled: boolean; // parseOutputGuardConfig default: false
+  pii: {
+    enabled: boolean;    // default: false
+    reversible: boolean; // default: true
+    storageKey: string;  // default: "~/.openclaw/sulcus-redaction-key.json"
+    patterns: string[];  // names of built-in patterns to run; default: all five built-ins
+    customPatterns: Array<{ name: string; regex: string; replacement?: string }>; // default: []
+    onViolation: "redact" | "replace" | "block"; // default: "redact"
+  };
+  preferenceViolation: {
+    enabled: boolean; // default: true
+    onViolation: "replace" | "warn" | "block"; // default: "replace"
+    replacementMessage: string; // default: a fixed "I stopped myself" notice
+  };
+  failMode: "fail-open" | "fail-closed"; // default: "fail-open"
+  auditTrail: boolean; // default: true
+}
+interface ToolGuardConfig {
+  enabled: boolean; // parseToolGuardConfig default: false
+  sensitiveTools: string[]; // default: exec, write, edit, delete, message
+  requireApprovalThreshold: "info" | "warning" | "critical"; // default: "warning"
+  allowlist: string[]; // default: []
+  blocklist: string[]; // default: []
+  objectiveCheck: boolean; // default: true
+  failMode: "fail-open" | "fail-closed"; // default: "fail-open"
+  auditTrail: boolean; // default: true
+}
+// Built-in PII patterns (GDPR-neutral, common formats). Each regex carries only the global flag; limits of individual detectors are noted per entry.
+const BUILTIN_PII_PATTERNS: PiiPattern[] = [
+  { name: "email",       regex: /\b[A-Za-z0-9._%+\-]+@[A-Za-z0-9.\-]+\.[A-Za-z]{2,}\b/g },
+  { name: "phone",       regex: /(?:\+?\d[\s.\-]?)?(?:\(?\d{3}\)?[\s.\-]?)\d{3}[\s.\-]?\d{4}\b/g }, // 10 digits with an optional single leading digit; no leading word boundary
+  { name: "ssn",         regex: /\b\d{3}[\s\-]\d{2}[\s\-]\d{4}\b/g }, // requires a space or dash between groups
+  { name: "credit_card", regex: /\b(?:4\d{12}(?:\d{3})?|5[1-5]\d{14}|3[47]\d{13}|6011\d{12}|3(?:0[0-5]|[68]\d)\d{11})\b/g }, // contiguous digits only — numbers written with spaces or dashes are not matched
+  { name: "ip_address",  regex: /\b(?:\d{1,3}\.){3}\d{1,3}\b/g }, // octets are not range-checked, so "999.1.1.1" and dotted versions like "1.2.3.4" match too
+];
+// Module-scope negative preference cache to avoid hammering Sulcus on every message
+interface NegPrefCache {
+  prefs: string[];
+  cachedAt: number;
+  namespace: string;
+}
+let negPrefCache: NegPrefCache | null = null;
+const NEG_PREF_CACHE_TTL_MS = 5 * 60 * 1000; // 5 minutes
+// Module-scope llm_output flag relay (flags produced by llm_output, consumed by message_sending).
+// A single slot holding only the most recent flags — not keyed per turn or per run, since OpenClaw doesn't expose a stable runId.
+let lastGuardFlags: SulcusGuardFlags | null = null;
+// --- INSPECT BUFFER (Task 56) ------------------------------------------------
+// Module-scope debug window for memory_inspect tool.
+// Captures last recall injection + guardrail events across both hook and SDK paths.
+// Intentionally never reset — it survives topic shifts so the agent can review the last N events.
+interface InspectRecallSnapshot {
+  capturedAt: number;          // Date.now() when injection happened
+  path: "hook" | "sdk";        // which recall path produced this
+  turn: number;                // turn number within the session
+  query: string;               // query used for recall (first 200 chars)
+  fromCache: boolean;          // true = HookRecallCache hit, false = fresh API call
+  itemsInjected: number;       // total items injected (profile + recall combined)
+  recallItems: Array<{         // recall items (not profile items)
+    id: string;
+    content_preview: string;   // first 80 chars
+    memory_type: string;
+    heat: number;
+    score: number | null;      // server fused_score if available
+    stale: boolean;            // age > 30 days
+    source: "semantic" | "graph" | "unknown";
+  }>;
+  profileItems: number;        // number of profile items injected
+  staleCount: number;          // items flagged as stale
+  graphHopCount: number;       // items from graph expansion
+  tokensBudget: number;
+  tokensUsed: number;
+}
+interface InspectGuardrailEvent {
+  capturedAt: number;
+  guard: "output" | "tool";
+  eventType: string;           // e.g. "pii_redacted", "preference_violation", "tool_blocked", "tool_allowed"
+  action: string;              // e.g. "redact", "block", "allow", "warn"
+  details: string;
+  toolName?: string;           // for tool guard events
+  severity?: string;           // for tool guard events
+}
+interface InspectBuffer {
+  lastRecall: InspectRecallSnapshot | null;  // null until a recall snapshot is captured
+  guardrailEvents: InspectGuardrailEvent[];  // ring buffer, last 10
+}
+const inspectBuffer: InspectBuffer = {
+  lastRecall: null,
+  guardrailEvents: [],
+};
+const INSPECT_GUARDRAIL_MAX = 10; // cap enforced by pushGuardrailEvent (oldest event is dropped first)
+// --- GUARDRAIL STATUS SNAPSHOT (Task 57) ------------------------------------
+// Set during init after parsing both guard configs. Read by guardrail_status tool.
+interface GuardrailStatusSnapshot {
+  outputGuard: { // same fields as OutputGuardConfig, minus storageKey, customPatterns and replacementMessage
+    enabled: boolean;
+    pii: { enabled: boolean; patterns: string[]; onViolation: string; reversible: boolean };
+    preferenceViolation: { enabled: boolean; onViolation: string };
+    failMode: string;
+    auditTrail: boolean;
+  };
+  toolGuard: { // same fields as ToolGuardConfig, with the enum-typed fields widened to string
+    enabled: boolean;
+    sensitiveTools: string[];
+    allowlist: string[];
+    blocklist: string[];
+    objectiveCheck: boolean;
+    requireApprovalThreshold: string;
+    failMode: string;
+    auditTrail: boolean;
+  };
+  negPrefCount: () => number; // a getter, not a stored value — presumably reads negPrefCache live; confirm where the snapshot is built
+  negPrefCachedAt: () => number | null; // a getter as well — presumably null while nothing is cached; confirm at the init site
+}
+let guardrailStatus: GuardrailStatusSnapshot | null = null; // null until assigned (the assignment is outside this view)
+/**
+ * Append a guardrail event to the inspect buffer and, once the buffer holds
+ * more than INSPECT_GUARDRAIL_MAX entries, evict the oldest one.
+ */
+function pushGuardrailEvent(evt: InspectGuardrailEvent): void {
+  const events = inspectBuffer.guardrailEvents;
+  const overflowed = events.push(evt) > INSPECT_GUARDRAIL_MAX;
+  if (overflowed) {
+    events.shift();
+  }
+}
+/**
+ * Find every PII match in `content`.
+ *
+ * @param content         Text to scan.
+ * @param activePatterns  Names of built-in patterns to run.
+ * @param customPatterns  Extra patterns given as regex source strings; entries
+ *                        whose source does not compile are ignored.
+ * @returns Non-empty match spans sorted by start offset, each with a fresh redactionId.
+ */
+function scanForPii(content: string, activePatterns: string[], customPatterns: Array<{ name: string; regex: string }>): PiiSpan[] {
+  const spans: PiiSpan[] = [];
+  // filter() returns a new array, so the pushes below never touch the built-in list.
+  const patterns = BUILTIN_PII_PATTERNS.filter(p => activePatterns.includes(p.name));
+  // Add custom patterns
+  for (const cp of customPatterns) {
+    try { patterns.push({ name: cp.name, regex: new RegExp(cp.regex, "g") }); } catch { /* ignore bad regex */ }
+  }
+  for (const pat of patterns) {
+    // Work on a clone so the shared regex's lastIndex is never touched; keep its
+    // other flags (e.g. "i") and make sure "g" is present for the exec loop.
+    const flags = pat.regex.flags.includes("g") ? pat.regex.flags : `${pat.regex.flags}g`;
+    const re = new RegExp(pat.regex.source, flags);
+    let m: RegExpExecArray | null;
+    while ((m = re.exec(content)) !== null) {
+      if (m[0].length === 0) {
+        // exec() does not advance past an empty match; without this bump a
+        // pattern such as "z*" would spin forever on the same index.
+        re.lastIndex++;
+        continue;
+      }
+      const redactionId = `${Date.now().toString(36)}-${Math.random().toString(36).slice(2, 8)}`;
+      spans.push({ start: m.index, end: m.index + m[0].length, type: pat.name, redactionId });
+    }
+  }
+  // Sort by start position for left-to-right replacement
+  spans.sort((a, b) => a.start - b.start);
+  return spans;
+}
+/**
+ * Replace each span of `content` with a `[REDACTED-<redactionId>]` marker.
+ *
+ * Spans may overlap (two patterns can match the same text). A span that lies
+ * entirely inside text already redacted is skipped, and the cursor never moves
+ * backwards — otherwise the tail of the outer match would be copied back into
+ * the output in clear text.
+ *
+ * @param content  Original text.
+ * @param spans    Match spans; they are ordered internally, the input array is not mutated.
+ * @returns The text with every covered range replaced by a marker.
+ */
+function redactSpans(content: string, spans: PiiSpan[]): string {
+  // Earliest start first; on ties the longer span wins so it absorbs the shorter one.
+  const ordered = [...spans].sort((a, b) => a.start - b.start || b.end - a.end);
+  let result = "";
+  let cursor = 0;
+  for (const span of ordered) {
+    // Nothing new to hide: empty span, or fully covered by an earlier marker.
+    if (span.end <= span.start || span.end <= cursor) continue;
+    if (span.start > cursor) result += content.slice(cursor, span.start);
+    result += `[REDACTED-${span.redactionId}]`;
+    cursor = span.end;
+  }
+  result += content.slice(cursor);
+  return result;
+}
+/**
+ * Persist the original text behind each redaction marker so redaction can be reversed.
+ *
+ * Best effort: every failure is swallowed so output delivery is never blocked.
+ * SECURITY NOTE: originals are written as PLAIN JSON — there is no encryption yet.
+ * The file is created with mode 0o600, which is its only protection.
+ *
+ * @param spans       Spans whose original text should be stored, keyed by redactionId.
+ * @param content     The unredacted text the spans index into.
+ * @param storageKey  Path of the JSON store; a leading `~` is expanded to the home directory.
+ * @param namespace   Namespace recorded with each entry.
+ */
+function storeRedactionKey(spans: PiiSpan[], content: string, storageKey: string, namespace: string): void {
+  if (spans.length === 0) return; // nothing to record — avoid creating or rewriting the file
+  try {
+    const home = process.env.HOME || process.env.USERPROFILE || "~";
+    // Expand only a leading "~"; a tilde elsewhere in the path is a literal character.
+    const keyPath = storageKey.replace(/^~(?=$|[\\/])/, () => home);
+    let store: Record<string, unknown> = {};
+    if (existsSync(keyPath)) {
+      try {
+        const loaded: unknown = JSON.parse(readFileSync(keyPath, "utf-8"));
+        // Accept only a JSON object; anything else (array, null, scalar) starts a fresh store.
+        if (loaded !== null && typeof loaded === "object" && !Array.isArray(loaded)) {
+          store = loaded as Record<string, unknown>;
+        }
+      } catch { store = {}; }
+    }
+    if (!store.version) store.version = 1;
+    // A store with a version but no usable `entries` used to throw below and save nothing.
+    if (store.entries === null || typeof store.entries !== "object" || Array.isArray(store.entries)) {
+      store.entries = {};
+    }
+    const entries = store.entries as Record<string, unknown>;
+    for (const span of spans) {
+      entries[span.redactionId] = {
+        original: content.slice(span.start, span.end),
+        type: span.type,
+        redactedAt: new Date().toISOString(),
+        namespace,
+      };
+    }
+    // resolve(path, "..") yields the parent directory with either path separator.
+    const dir = resolve(keyPath, "..");
+    if (!existsSync(dir)) mkdirSync(dir, { recursive: true });
+    writeFileSync(keyPath, JSON.stringify(store, null, 2), { mode: 0o600 });
+  } catch { /* best effort — don't break output delivery */ }
+}
+/**
+ * Read `guardrails.outputGuard` from the plugin config and fill in a default
+ * for every option that is missing (null or undefined).
+ * Values are taken as-is; nothing is validated against the declared unions.
+ */
+function parseOutputGuardConfig(pluginConfig: Record<string, unknown>): OutputGuardConfig {
+  type Dict = Record<string, unknown>;
+  // Child section of `parent`, or an empty object when absent.
+  const child = (parent: Dict | undefined, key: string): Dict =>
+    (parent?.[key] as Dict | undefined) ?? {};
+  // Option value, or `fallback` when the option is null/undefined.
+  const read = <T>(src: Dict, key: string, fallback: T): T =>
+    (src?.[key] as T | undefined) ?? fallback;
+
+  const guard = child(child(pluginConfig, "guardrails"), "outputGuard");
+  const piiCfg = child(guard, "pii");
+  const prefCfg = child(guard, "preferenceViolation");
+
+  return {
+    enabled: read<boolean>(guard, "enabled", false),
+    pii: {
+      enabled: read<boolean>(piiCfg, "enabled", false),
+      reversible: read<boolean>(piiCfg, "reversible", true),
+      storageKey: read<string>(piiCfg, "storageKey", "~/.openclaw/sulcus-redaction-key.json"),
+      patterns: read<string[]>(piiCfg, "patterns", ["email", "phone", "ssn", "credit_card", "ip_address"]),
+      customPatterns: read<Array<{ name: string; regex: string }>>(piiCfg, "customPatterns", []),
+      onViolation: read<"redact" | "replace" | "block">(piiCfg, "onViolation", "redact"),
+    },
+    preferenceViolation: {
+      enabled: read<boolean>(prefCfg, "enabled", true),
+      onViolation: read<"replace" | "warn" | "block">(prefCfg, "onViolation", "replace"),
+      replacementMessage: read<string>(prefCfg, "replacementMessage", "⚠️ I stopped myself — this output would violate a preference you've stored with me."),
+    },
+    failMode: read<"fail-open" | "fail-closed">(guard, "failMode", "fail-open"),
+    auditTrail: read<boolean>(guard, "auditTrail", true),
+  };
+}
+/**
+ * Read `guardrails.toolGuard` from the plugin config and fill in a default
+ * for every option that is missing (null or undefined).
+ * Values are taken as-is; nothing is validated against the declared unions.
+ */
+function parseToolGuardConfig(pluginConfig: Record<string, unknown>): ToolGuardConfig {
+  type Dict = Record<string, unknown>;
+  const guardrails = (pluginConfig?.guardrails as Dict | undefined) ?? {};
+  const toolGuard = (guardrails?.toolGuard as Dict | undefined) ?? {};
+  // Option value, or `fallback` when the option is null/undefined.
+  const read = <T>(key: string, fallback: T): T =>
+    (toolGuard?.[key] as T | undefined) ?? fallback;
+
+  const enabled = read<boolean>("enabled", false);
+  const sensitiveTools = read<string[]>("sensitiveTools", ["exec", "write", "edit", "delete", "message"]);
+  const requireApprovalThreshold = read<"info" | "warning" | "critical">("requireApprovalThreshold", "warning");
+  const allowlist = read<string[]>("allowlist", []);
+  const blocklist = read<string[]>("blocklist", []);
+  const objectiveCheck = read<boolean>("objectiveCheck", true);
+  const failMode = read<"fail-open" | "fail-closed">("failMode", "fail-open");
+  const auditTrail = read<boolean>("auditTrail", true);
+
+  return {
+    enabled,
+    sensitiveTools,
+    requireApprovalThreshold,
+    allowlist,
+    blocklist,
+    objectiveCheck,
+    failMode,
+    auditTrail,
+  };
+}
+// --- HOOK RECALL CACHE (Task 14 parity for hook path) ----------------------
+// Per-namespace topic-shift cache for the auto_recall hook.
+// Mirrors the SDK recall handler cache so hooks avoid redundant API calls
+// when the conversation topic is stable across consecutive turns.
+interface HookRecallCache {
+  results: Record<string, unknown>[]; // cached recall results (untyped records)
+  topicTokens: Set<string>;           // presumably tokens of the prompt that filled the cache, compared by Jaccard overlap — confirm in auto_recall
+  cachedAt: number;                   // presumably Date.now() at fill time, checked against HOOK_CACHE_TTL_MS — confirm in auto_recall
+}
+const hookRecallCacheMap = new Map<string, HookRecallCache>(); // one entry per namespace, per the section comment
+const HOOK_CACHE_TTL_MS = 5 * 60 * 1000; // 5 minutes
+const HOOK_TOPIC_SHIFT_THRESHOLD = 0.25;  // Jaccard overlap below this = topic shift
+// --- RECALL QUALITY METRICS (Task 32) --------------------------------------
+// Module-scope counters — written by both SDK and hook recall paths.
+// Exposed via memory_status so the agent can inspect recall health.
+// Resets on gateway restart (session-scoped is intentional).
+interface RecallQualityMetrics {
+  freshRecalls: number;       // turns where API was called (topic shifted)
+  cacheHits: number;          // turns where cached results were served
+  totalItemsServed: number;   // cumulative recall items injected
+  zeroResultTurns: number;    // turns where recall returned nothing
+  graphHopContrib: number;    // total graph-hop items folded in
+  graphHopTurns: number;      // turns with at least one graph-hop item
+  scoreSum: number;           // sum of avg heat per fresh recall (for avg relevance)
+  scoreTurns: number;         // fresh recall turns that had items (for avg relevance)
+}
+const recallQM: RecallQualityMetrics = {
+  freshRecalls: 0,
+  cacheHits: 0,
+  totalItemsServed: 0,
+  zeroResultTurns: 0,
+  graphHopContrib: 0,
+  graphHopTurns: 0,
+  scoreSum: 0,
+  scoreTurns: 0,
+};
+// --- COMPACTION REBUILD FLAG (Task 70) --------------------------------------
+// Set to true when before_compaction fires. Cleared after the first
+// post-compaction before_prompt_build injects a rich Sulcus context rebuild.
+// This is per-session (module scope); each gateway restart resets it correctly.
+let wasJustCompacted = false;
+// Token budget for post-compaction context rebuild. Configured via
+// contextRebuild.tokenBudget (default 4000, max 10000).
+let REBUILD_TOKEN_BUDGET = 4000;
+// --- HOOK PROFILE STATE (Task 31) --------------------------------------------
+// Per-namespace profile cache for the auto_recall hook.
+// Mirrors the SDK recall handler: inject full profile on turn 1 + every N turns,
+// serve cached profile on stable turns to reduce token waste.
+interface HookProfileState {
+  turnCount: number; // turns counted for this namespace; drives the "turn 1 + every N turns" profile injection
+  cache: { preferences: Record<string, unknown>[]; facts: Record<string, unknown>[]; cachedAt: number } | null; // last fetched profile (prefs + facts), or null before the first fetch
+}
+const hookProfileStateMap = new Map<string, HookProfileState>(); // keyed by namespace (auto_recall looks entries up by ctx.namespace)
+// --- HOOK HANDLERS -----------------------------------------------------------
 const hookHandlers: Record<string, HookHandler> = {
   inject_awareness: async (_event, _config, _ctx) => {
@@ -88,28 +572,363 @@ const hookHandlers: Record<string, HookHandler> = {
   },
   auto_recall: async (event, config, ctx) => {
+    // Task 22: Unified recall pipeline — same XML formatting, budget enforcement,
+    // diversity filter, and conflict surfacing as the SDK recall path.
+    // Task 14 parity: topic-shift detection + per-namespace cache for hook path.
+    // Task 31: Profile injection frequency — full profile on turn 1 + every N turns.
     const { sulcusMem, namespace, logger } = ctx;
     if (!sulcusMem) return;
     const agentLabel = (event?.agentId as string) ?? "(unknown)";
     logger.info(`sulcus: auto_recall hook triggered for agent ${agentLabel}`);
-    const prompt = typeof event?.prompt === "string" ? event.prompt : "";
-    if (!prompt) return;
+    const rawPrompt = typeof event?.prompt === "string" ? event.prompt : "";
+    if (!rawPrompt) return;
+    // Strip OpenClaw metadata noise before using as search query
+    const prompt = sanitizeRecallQuery(rawPrompt);
+    if (!prompt || prompt.length < 3) return;
+    // Task 62: Use focused last-user-turn for recall query; full prompt for topic-shift
+    const recallQuery = extractLastUserTurn(rawPrompt);
     try {
       const limit = (config.limit as number) ?? 5;
-      logger.debug?.(`sulcus: searching context for prompt: ${prompt.substring(0, 50)}... (namespace: ${namespace})`);
-      const res = await sulcusMem.search_memory(prompt, limit, namespace);
-      const results = res?.results ?? [];
-      if (!results || results.length === 0) {
+      // -- Task 31: Profile injection frequency ------------------------------
+      // Track per-namespace turn count + profile cache. Inject full profile
+      // (prefs + facts) on turn 1 and every profileFrequency turns; serve
+      // cache on stable turns to avoid redundant API calls.
+      const profileFreq = ctx.profileFrequency ?? 10;
+      let hookProfileState = hookProfileStateMap.get(namespace);
+      if (!hookProfileState) {
+        hookProfileState = { turnCount: 0, cache: null };
+        hookProfileStateMap.set(namespace, hookProfileState);
+      }
+      hookProfileState.turnCount++;
+      const hookTurn = hookProfileState.turnCount;
+      const includeProfile = hookTurn === 1 || hookTurn % profileFreq === 0;
+      // -- Task 101: Adaptive scaling — reduce recall footprint as conversation grows
+      const hookScale = applyAdaptiveScaling(hookTurn, limit, ctx.tokenBudget ?? 4000);
+      // -- Task 102: Context-window-aware throttling (hook path) — same logic as SDK
+      const hookContextWindow = ctx.contextWindowSize ?? 200000;
+      const hookThrottled = applyContextWindowThrottle(rawPrompt.length, hookContextWindow, hookScale, logger);
+      if (hookThrottled.selfMuted) {
+        logger.warn(`sulcus: hook path self-muted — context ${((rawPrompt.length / 4 / hookContextWindow) * 100).toFixed(0)}% full`);
+        return;
+      }
+      const hookEffectiveLimit = hookThrottled.effectiveMax;
+      const hookEffectiveTokenBudget = hookThrottled.effectiveTokenBudget;
+      if (hookTurn > 5) logger.debug?.(`sulcus: adaptive scaling (hook turn ${hookTurn}) — limit=${hookEffectiveLimit}, budget=${hookEffectiveTokenBudget}`);
+      // -- end Task 31 + 102 --------------------------------------------------
+      // -- Topic-shift detection (Task 14 parity) ----------------------------
+      const cacheKey = namespace;
+      const currentTokens = extractTopicTokens(prompt);
+      const existingCache = hookRecallCacheMap.get(cacheKey);
+      const cacheExpired = existingCache !== undefined && (Date.now() - existingCache.cachedAt) > HOOK_CACHE_TTL_MS;
+      const overlap = existingCache !== undefined ? topicOverlap(currentTokens, existingCache.topicTokens) : 0;
+      const topicShifted = existingCache === undefined || cacheExpired || overlap < HOOK_TOPIC_SHIFT_THRESHOLD;
+      let vectorResults: Record<string, unknown>[];
+      if (!topicShifted && existingCache !== undefined) {
+        vectorResults = existingCache.results;
+        recallQM.cacheHits++;  // Task 32: module-scope QM
+        logger.info(`sulcus: auto_recall hook — topic stable (overlap=${overlap.toFixed(2)}), serving cached recall`);
+      } else {
+        if (existingCache !== undefined) {
+          logger.info(`sulcus: auto_recall hook — TOPIC SHIFT detected (overlap=${overlap.toFixed(2)}), fresh recall`);
+        }
+        logger.debug?.(`sulcus: searching context for prompt (focused: ${recallQuery.substring(0, 50)}...) (namespace: ${namespace})`);
+        // Task 62: Use focused last-user-turn query for better relevance
+        // Task 101: Use adaptive limit instead of raw config limit
+        const res = await sulcusMem.search_memory(recallQuery, hookEffectiveLimit, namespace);
+        vectorResults = res?.results ?? [];
+        recallQM.freshRecalls++;  // Task 32: module-scope QM
+        // Update cache with fresh results
+        hookRecallCacheMap.set(cacheKey, { results: vectorResults, topicTokens: currentTokens, cachedAt: Date.now() });
+      }
+      // -- end topic-shift detection -----------------------------------------
+      if (!vectorResults || vectorResults.length === 0) {
+        recallQM.zeroResultTurns++;  // Task 32: module-scope QM
         return { prependSystemContext: FALLBACK_AWARENESS };
       }
-      const items = results.map((r: Record<string, unknown>) => {
-        const heat = ((r.current_heat as number) ?? (r.score as number) ?? 0).toFixed(2);
-        const mtype = (r.memory_type as string) ?? "unknown";
-        const label = (r.label as string) ?? (r.pointer_summary as string) ?? "";
-        return `    <memory id="${r.id}" heat="${heat}" type="${mtype}">${label}</memory>`;
-      }).join("\n");
-      const context = `<sulcus_context token_budget="500" namespace="${namespace}">\n${items}\n</sulcus_context>`;
-      logger.info(`sulcus: injecting ${results.length} recalled memories (${context.length} chars)`);
+      // -- Task 35: Query expansion for thin recall --------------------------
+      // When vector search returns < THIN_RECALL_THRESHOLD results, use the
+      // entity knowledge graph to find synonym terms and directly-connected
+      // memories, then do a second vector search with the expanded query.
+      let hookExpanded = vectorResults;
+      if (topicShifted && vectorResults.length < THIN_RECALL_THRESHOLD && sulcusMem instanceof SulcusCloudClient) {
+        try {
+          // Task 62: use focused recallQuery for entity expansion too
+          const { extraMemories, expandedQuery } = await expandQueryWithEntities(
+            sulcusMem, recallQuery, namespace, logger
+          );
+          // Merge extra memories from entity graph (dedup by ID)
+          const seenExpandIds = new Set(vectorResults.map((r) => r.id as string));
+          const newExtras = extraMemories.filter((m) => !seenExpandIds.has(m.id as string));
+          if (newExtras.length > 0) {
+            hookExpanded = [...vectorResults, ...newExtras];
+            logger.info(`sulcus: auto_recall thin-recall expansion added ${newExtras.length} entity-graph memory/memories`);
+          }
+          // If still thin, do second vector search with expanded query
+          if (hookExpanded.length < THIN_RECALL_THRESHOLD && expandedQuery !== recallQuery) {
+            try {
+              const expandedRes = await sulcusMem.search_memory(expandedQuery, hookEffectiveLimit, namespace);
+              const expandedVec = expandedRes?.results ?? [];
+              const expandedSeenIds = new Set(hookExpanded.map((r) => r.id as string));
+              const newVecExtras = expandedVec.filter((r) => !expandedSeenIds.has(r.id as string));
+              if (newVecExtras.length > 0) {
+                hookExpanded = [...hookExpanded, ...newVecExtras];
+                logger.info(`sulcus: auto_recall expanded query search added ${newVecExtras.length} result(s)`);
+              }
+            } catch {
+              // expanded search failed — keep what we have
+            }
+          }
+        } catch {
+          // expansion failed — proceed with original results
+        }
+      }
+      const vectorResults_expanded = hookExpanded;
+      // -- end Task 35 -------------------------------------------------------
+      // -- Graph-hop expansion (Task 13) — parity with SDK recall path ------
+      // Seed from top-2 vector hits, fetch AGE neighbours, fold in warm nodes.
+      let rawResults = vectorResults_expanded;
+      if (sulcusMem instanceof SulcusCloudClient) {
+        const seedIds = vectorResults_expanded.slice(0, 2).map((r) => r.id as string).filter(Boolean);
+        if (seedIds.length > 0) {
+          try {
+            const neighborFetches = await Promise.allSettled(
+              seedIds.map((id) => (sulcusMem as SulcusCloudClient).graph_neighbors(id, 6))
+            );
+            const seenIds = new Set(vectorResults_expanded.map((r) => r.id as string));
+            const graphExtras: Record<string, unknown>[] = [];
+            for (const result of neighborFetches) {
+              if (result.status !== "fulfilled") continue;
+              for (const node of result.value) {
+                const nodeId = node.id as string;
+                if (!nodeId || seenIds.has(nodeId)) continue;
+                const heat = (node.current_heat as number) ?? 0;
+                if (heat < 0.2) continue; // skip cold ephemeral noise
+                seenIds.add(nodeId);
+                graphExtras.push({ ...node, _source: "graph" });
+              }
+            }
+            if (graphExtras.length > 0) {
+              graphExtras.sort((a, b) => ((b.current_heat as number) ?? 0) - ((a.current_heat as number) ?? 0));
+              const hopCount = Math.min(graphExtras.length, 4);
+              rawResults = [...vectorResults_expanded, ...graphExtras.slice(0, hopCount)];
+              recallQM.graphHopContrib += hopCount;  // Task 32: graph-hop metrics
+              recallQM.graphHopTurns++;               // Task 32: graph-hop metrics
+              logger.info(`sulcus: auto_recall graph-hop added ${hopCount} neighbour(s)`);
+            }
+          } catch {
+            // graph expansion failed — fall back to vector results only
+          }
+        }
+      }
+      // -- end graph-hop -----------------------------------------------------
+      // -- Budget constants (mirror SDK recall) ------------------------------
+      // Task 66: configurable tokenBudget, Task 101: adaptive scaling reduces it
+      const TOKEN_BUDGET = hookEffectiveTokenBudget;
+      const FIXED_OVERHEAD = 80;
+      // -- Task 31: Profile fetch (frequency-gated) ------------------------------
+      // Fetch prefs + facts on turn 1 and every profileFreq turns.
+      // Serve cached profile on all other turns to save API calls + tokens.
+      let profilePreferences: Record<string, unknown>[] = [];
+      let profileFacts: Record<string, unknown>[] = [];
+      if (includeProfile) {
+        try {
+          const [prefRes, factRes] = await Promise.all([
+            sulcusMem.search_memory("user preference", Math.min(hookEffectiveLimit, 5), namespace),
+            sulcusMem.search_memory("fact data knowledge", Math.min(hookEffectiveLimit, 5), namespace),
+          ]);
+          profilePreferences = (prefRes?.results ?? []).filter((r) => r.memory_type === "preference");
+          profileFacts = (factRes?.results ?? []).filter((r) => r.memory_type === "fact");
+          hookProfileState!.cache = { preferences: profilePreferences, facts: profileFacts, cachedAt: Date.now() };
+          logger.info(`sulcus: auto_recall profile refreshed (turn ${hookTurn}, prefs=${profilePreferences.length}, facts=${profileFacts.length})`);
+        } catch {
+          // profile fetch failed — continue without
+        }
+      } else if (hookProfileState!.cache) {
+        profilePreferences = hookProfileState!.cache.preferences;
+        profileFacts = hookProfileState!.cache.facts;
+      }
+      // -- end Task 31 profile fetch ------------------------------------------
+      // Dedup profile IDs from recall results so profile items don't double-appear
+      const profileIdSet = new Set([
+        ...profilePreferences.map((r) => r.id as string),
+        ...profileFacts.map((r) => r.id as string),
+      ]);
+      // -- Diversity filter (Task 20) ---------------------------------------------
+      const preDiversity = rawResults
+        .filter((r) => !profileIdSet.has(r.id as string)) // exclude profile items from recall
+        .map((r) => ({
+          ...r,
+          label: ((r.label ?? r.pointer_summary ?? r.id ?? "") as string),
+          // Fix 2: prefer server fused_score over raw heat for ranking (Task 58)
+          _heat: (r.score as number) ?? (r.current_heat as number) ?? 0,
+        }));
+      preDiversity.sort((a, b) => b._heat - a._heat);
+      const diverseResults = diversityFilter(preDiversity, hookEffectiveLimit);
+      const droppedCount = preDiversity.length - diverseResults.length;
+      if (droppedCount > 0) logger.info(`sulcus: auto_recall diversity filter dropped ${droppedCount} near-duplicate(s)`);
+      // -- Budget split: ~30% profile / ~70% recall (mirrors SDK path) -----------
+      const profileBudgetTokens = Math.floor((TOKEN_BUDGET - FIXED_OVERHEAD) * 0.3);
+      const recallBudgetTokens = TOKEN_BUDGET - FIXED_OVERHEAD - profileBudgetTokens;
+      // Profile items sorted by heat desc
+      const profileItemsSorted = [...profilePreferences, ...profileFacts].map((r) => ({
+        ...r,
+        label: ((r.label ?? r.pointer_summary ?? r.id ?? "") as string)
+          .replace(/&/g, "&amp;").replace(/</g, "&lt;").replace(/>/g, "&gt;"),
+        _heat: (r.score as number) ?? (r.current_heat as number) ?? 0,
+      })).sort((a, b) => b._heat - a._heat);
+      const budgetedProfile = enforceContextBudget(profileItemsSorted, TOKEN_BUDGET, FIXED_OVERHEAD + recallBudgetTokens);
+      // -- XML-escape labels ----------------------------------------------------
+      const escapedResults = diverseResults.map((r) => ({
+        ...r,
+        label: r.label.replace(/&/g, "&amp;").replace(/</g, "&lt;").replace(/>/g, "&gt;"),
+      }));
+      // -- Task 80: Temporal supersession (hook path) ----------------------------
+      // Mark older conflicting memories as superseded (score penalty + flag).
+      // Must run BEFORE budget enforcement so penalized items fall below the cut.
+      const hookSupersededCount = markSuperseded(escapedResults);
+      if (hookSupersededCount > 0) logger.info(`sulcus: temporal supersession (hook) marked ${hookSupersededCount} memory/memories as superseded`);
+      // -- Budget enforcement (Task 18) ---------------------------------------------
+      // Re-sort after supersession penalties so budget cuts superseded items first
+      escapedResults.sort((a, b) => b._heat - a._heat);
+      const budgeted = enforceContextBudget(escapedResults, TOKEN_BUDGET, FIXED_OVERHEAD + profileBudgetTokens);
+      // -- Task 79: Temporal re-ranking (hook path) ----------------------------
+      const hookTemporalDetected = isTemporalQuery(recallQuery);
+      const orderedBudgeted = hookTemporalDetected ? temporalRerank(budgeted) : budgeted;
+      if (hookTemporalDetected) logger.info(`sulcus: temporal query detected (hook) — re-ranking ${orderedBudgeted.length} results chronologically`);
+      // -- Flat recall list — superseded items get demoted with attribute ---------
+      const recallElements: string[] = [];
+      for (const r of orderedBudgeted) {
+        const heat = r._heat as number;
+        const heatStr = heat.toFixed(2);
+        const mtype = (r.memory_type as string) ?? "episodic";
+        const updatedAt = r.updated_at as string | undefined;
+        const ageStr = updatedAt ? formatRelativeTime(updatedAt) : "unknown";
+        const staleAttr = isStaleMemory(updatedAt) ? ` stale="true"` : "";
+        // Task 80: superseded memories get a marker so the LLM treats them as historical
+        const supersededAttr = r._superseded ? ` superseded="true"` : "";
+        recallElements.push(`  <memory type="${mtype}" heat="${heatStr}" age="${ageStr}"${staleAttr}${supersededAttr}>${r.label}</memory>`);
+      }
+      // -- Assemble context XML ------------------------------------------------
+      const sections: string[] = [];
+      // Profile section (Task 31) — inject before recall so agent sees identity context first
+      if (budgetedProfile.length > 0) {
+        const profileElements: string[] = [];
+        for (const r of budgetedProfile) {
+          const mtype = (r.memory_type as string) ?? "preference";
+          const heat = (r._heat as number).toFixed(2);
+          profileElements.push(`  <item type="${mtype}" heat="${heat}">${r.label}</item>`);
+        }
+        sections.push(`<profile>\n${profileElements.join("\n")}\n</profile>`);
+      }
+      if (recallElements.length > 0) {
+        const recallOrderAttr = hookTemporalDetected ? ` order="chronological"` : "";
+        sections.push(`<recall${recallOrderAttr}>\n${recallElements.join("\n")}\n</recall>`);
+      }
+      if (sections.length === 0) return { prependSystemContext: FALLBACK_AWARENESS };
+      const guidance = "Background context from long-term memory. Use it silently to inform your understanding — only reference it when the conversation naturally calls for it.";
+      const contextParts = [
+        `<guidance>${guidance}</guidance>`,
+        ...sections,
+      ];
+      const context = `<sulcus_context token_budget="${TOKEN_BUDGET}" namespace="${namespace}" turn="${hookTurn}">\n${contextParts.join("\n")}\n</sulcus_context>`;
+      const estimatedTokens = estimateTokens(context);
+      // Task 32: track items served + avg relevance score in module-scope QM
+      recallQM.totalItemsServed += budgeted.length;
+      if (budgeted.length === 0) recallQM.zeroResultTurns++;
+      if (budgeted.length > 0 && topicShifted) {
+        const hookAvgScore = budgeted.reduce((s, r) => s + ((r._heat as number) ?? 0), 0) / budgeted.length;
+        recallQM.scoreSum += hookAvgScore;
+        recallQM.scoreTurns++;
+      }
+      logger.info(`sulcus: auto_recall injecting context (${context.length} chars, ~${estimatedTokens}/${TOKEN_BUDGET} tokens, turn ${hookTurn}, profile: ${budgetedProfile.length}, recall: ${budgeted.length})`);
+      // Task 56: write to inspect buffer for memory_inspect tool (hook path)
+      {
+        const staleHookItems = budgeted.filter((r) => (r as Record<string, unknown>).stale === true || (r as Record<string, unknown>)._stale === true);
+        const graphHookItems = budgeted.filter((r) => (r as Record<string, unknown>)._source === "graph");
+        inspectBuffer.lastRecall = {
+          capturedAt: Date.now(),
+          path: "hook",
+          turn: hookTurn,
+          query: prompt.substring(0, 200),
+          fromCache: !topicShifted,
+          itemsInjected: budgetedProfile.length + budgeted.length,
+          recallItems: budgeted.map((r) => ({
+            id: (r.id as string) ?? "",
+            content_preview: ((r.content ?? r.text ?? "") as string).substring(0, 80),
+            memory_type: (r.memory_type ?? r.type ?? "unknown") as string,
+            heat: (r.current_heat ?? r._heat ?? 0) as number,
+            score: (r.score as number | null) ?? null,
+            stale: !!(r.stale ?? r._stale),
+            source: ((r._source as string) === "graph" ? "graph" : "semantic") as "semantic" | "graph" | "unknown",
+          })),
+          profileItems: budgetedProfile.length,
+          staleCount: staleHookItems.length,
+          graphHopCount: graphHookItems.length,
+          tokensBudget: TOKEN_BUDGET,
+          tokensUsed: estimatedTokens,
+        };
+      }
+      // Spaced repetition: boost heat for recalled memories (fire-and-forget)
+      if (ctx.boostOnRecall !== false && sulcusMem instanceof SulcusCloudClient) {
+        boostRecalledMemories(sulcusMem, budgeted, logger).catch(() => {});
+      }
+      // -- Task 27: SIRU recall logging (hook path parity with SDK Task 23) --
+      // Post recall session metadata to SIRU on fresh recalls so the server
+      // can learn which memories were most useful. Skipped on cache-hit turns
+      // (topicShifted === false) to avoid duplicate logging for stable topics.
+      if (topicShifted && sulcusMem instanceof SulcusCloudClient) {
+        const recallIds = budgeted.map((r) => (r.id as string) ?? "").filter(Boolean);
+        const recallScores = budgeted.map((r) => (r._heat as number) ?? 0);
+        const recallSources = budgeted.map((r) =>
+          (r._source as string) === "graph" ? "graph" : "semantic"
+        );
+        const entityHints = Array.from(currentTokens).slice(0, 10);
+        const semanticCount = recallSources.filter((s) => s === "semantic").length;
+        const graphCount = recallSources.filter((s) => s === "graph").length;
+        sulcusMem.recall_log({
+          namespace,
+          agent_id: namespace,
+          query_text: recallQuery.substring(0, 500),  // Task 62: focused query
+          memory_ids: recallIds,
+          memory_scores: recallScores,
+          memory_sources: recallSources,
+          token_budget: TOKEN_BUDGET,
+          tokens_used: estimatedTokens,
+          candidates_total: rawResults.length,
+          candidates_selected: recallIds.length,
+          semantic_count: semanticCount,
+          hot_count: graphCount,
+          entity_count: entityHints.length,
+          entity_hints: entityHints,
+        }).catch(() => {}); // never block context injection
+        logger.debug?.("sulcus: auto_recall SIRU log posted (hook path)");
+      }
+      // -- end Task 27 -------------------------------------------------------
       return { prependSystemContext: context };
     } catch (e) {
       logger.warn(`sulcus: context build failed: ${e} — injecting fallback awareness`);
@@ -165,9 +984,18 @@ const hookHandlers: Record<string, HookHandler> = {
           return;
         }
-        const res = await sulcusMem.add_memory(userMessage, memoryType);
+        const hints = buildExtractionHints(memoryType, ctx.namespace, "user_capture", userMessage.substring(0, 200));
+        const res = await sulcusMem.add_memory(userMessage, memoryType, hints);
         const typeConf = ((siuResult?.type_confidence as number) ?? 0).toFixed(3);
-        logger.info(`sulcus: sivu_auto_capture — stored [${memoryType}] (id: ${res?.id ?? "?"}, sivu_conf: ${storeConf.toFixed(3)}, sicu_conf: ${typeConf}, model: ${modelVersion}): "${userMessage.substring(0, 60)}..."`);
+        logger.info(`sulcus: sivu_auto_capture — stored [${memoryType}] (id: ${res?.id ?? "?"}, sivu_conf: ${storeConf.toFixed(3)}, sicu_conf: ${typeConf}, model: ${modelVersion}, hints: ${hints ? "yes" : "no"}): "${userMessage.substring(0, 60)}..."`);
+        // -- Task 21: Correction detection (SIVU path) -----------------------
+        if (isCorrectionMessage(userMessage)) {
+          const boosted = await boostRelatedMemories(sulcusMem, userMessage, ctx.namespace, 0.85, 3, logger);
+          if (boosted > 0) {
+            logger.info(`sulcus: sivu_auto_capture — correction detected, heat-boosted ${boosted} related memor${boosted === 1 ? "y" : "ies"}`);
+          }
+        }
         return;
       } catch (e: unknown) {
         const msg = e instanceof Error ? e.message : String(e);
@@ -177,8 +1005,17 @@ const hookHandlers: Record<string, HookHandler> = {
     }
     try {
-      const res = await sulcusMem.add_memory(userMessage, "episodic");
+      const fallbackHints = buildExtractionHints("episodic", ctx.namespace, "user_capture", userMessage.substring(0, 200));
+      const res = await sulcusMem.add_memory(userMessage, "episodic", fallbackHints);
       logger.info(`sulcus: sivu_auto_capture — fallback stored [episodic] (id: ${res?.id ?? "?"}): "${userMessage.substring(0, 60)}..."`);
+      // -- Task 21: Correction detection (fallback path) -------------------
+      if (isCorrectionMessage(userMessage) && sulcusMem instanceof SulcusCloudClient) {
+        const boosted = await boostRelatedMemories(sulcusMem, userMessage, ctx.namespace, 0.85, 3, logger);
+        if (boosted > 0) {
+          logger.info(`sulcus: sivu_auto_capture — correction detected, heat-boosted ${boosted} related memor${boosted === 1 ? "y" : "ies"}`);
+        }
+      }
     } catch (e: unknown) {
       const msg = e instanceof Error ? e.message : String(e);
       logger.warn(`sulcus: sivu_auto_capture — fallback store failed: ${msg}`);
@@ -219,7 +1056,8 @@ const hookHandlers: Record<string, HookHandler> = {
     const memoryContent = `Tool '${toolName}' failed: ${truncated}`;
     try {
-      const res = await sulcusMem.add_memory(memoryContent, "episodic");
+      const errorHints = buildExtractionHints("episodic", ctx.namespace, "tool_error", memoryContent.substring(0, 200));
+      const res = await sulcusMem.add_memory(memoryContent, "episodic", errorHints);
       // Boost heat so error memories persist longer — failures are high-value learnings
       if (res?.id && sulcusMem instanceof SulcusCloudClient) {
         await sulcusMem.request("PATCH", `/api/v1/agent/memory/${res.id}`, {
@@ -240,6 +1078,10 @@ const hookHandlers: Record<string, HookHandler> = {
     const messages = Array.isArray(event?.messages) ? event.messages as Record<string, unknown>[] : [];
     if (messages.length === 0) return;
+    // --- Task 70: Set rebuild flag so next before_prompt_build does full context rebuild ---
+    wasJustCompacted = true;
+    logger.info("sulcus: pre_compaction_capture — rebuild flag SET (next turn will inject full Sulcus context)");
     const firstUser = messages.find((m) => m.role === "user" || m.type === "human");
     const lastAssistant = [...messages].reverse().find((m) => m.role === "assistant" || m.type === "ai");
@@ -255,8 +1097,55 @@ const hookHandlers: Record<string, HookHandler> = {
         ? (lastAssistant.text as string).substring(0, 200)
         : "(none)";
+    // --- Task 70: Extract richer multi-part knowledge from session ---
+    // 1. Files modified (write/edit tool calls)
     const filesModified: string[] = [];
+    // 2. Commands run (exec tool calls)
+    const commandsRun: string[] = [];
+    // 3. Decisions made (assistant messages containing decision markers)
+    const decisions: string[] = [];
+    // 4. Errors encountered
+    const errors: string[] = [];
+    // 5. All user intents (short user messages for multi-query rebuild)
+    const userIntents: string[] = [];
+    const DECISION_MARKERS = ["decided", "will use", "going to", "plan is", "the fix", "conclusion", "recommend", "approach"];
+    const ERROR_MARKERS = ["error:", "failed:", "exception", "traceback", "panicked", "stack trace"];
     for (const msg of messages) {
+      const role = (msg.role ?? msg.type) as string | undefined;
+      const rawContent = typeof msg.content === "string" ? msg.content
+        : typeof msg.text === "string" ? msg.text : "";
+      // Extract user intents (first 150 chars of each user message)
+      if ((role === "user" || role === "human") && rawContent.length > 10) {
+        userIntents.push(rawContent.substring(0, 150));
+      }
+      // Extract decisions from assistant messages
+      if ((role === "assistant" || role === "ai") && rawContent.length > 20) {
+        const lc = rawContent.toLowerCase();
+        if (DECISION_MARKERS.some((m) => lc.includes(m))) {
+          // Extract the sentence containing the decision marker
+          const sentences = rawContent.split(/[.!?\n]/).filter((s) => s.trim().length > 10);
+          for (const s of sentences) {
+            if (DECISION_MARKERS.some((m) => s.toLowerCase().includes(m)) && !decisions.includes(s.trim())) {
+              decisions.push(s.trim().substring(0, 200));
+              if (decisions.length >= 5) break;
+            }
+          }
+        }
+        // Extract errors
+        const lcContent = rawContent.toLowerCase();
+        if (ERROR_MARKERS.some((m) => lcContent.includes(m))) {
+          const errorLine = rawContent.split("\n").find((l) => ERROR_MARKERS.some((m) => l.toLowerCase().includes(m)));
+          if (errorLine && !errors.includes(errorLine.trim())) {
+            errors.push(errorLine.trim().substring(0, 150));
+          }
+        }
+      }
+      // Extract tool calls
       const toolCalls = Array.isArray(msg.tool_calls) ? msg.tool_calls as Record<string, unknown>[] : [];
       for (const tc of toolCalls) {
         const name = (tc.name ?? tc.function) as string | undefined;
@@ -265,15 +1154,24 @@ const hookHandlers: Record<string, HookHandler> = {
           const fp = input?.file_path ?? input?.path;
           if (fp && typeof fp === "string" && !filesModified.includes(fp)) filesModified.push(fp);
         }
+        if (name === "Bash" || name === "bash" || name === "exec" || name === "shell") {
+          const input = (tc.input ?? tc.arguments ?? {}) as Record<string, unknown>;
+          const cmd = input?.command ?? input?.cmd;
+          if (cmd && typeof cmd === "string" && commandsRun.length < 5) {
+            commandsRun.push(cmd.substring(0, 100));
+          }
+        }
       }
     }
+    // --- Build primary summary memory ---
     const summaryParts = [
       `Session compaction — ${messages.length} messages`,
       `First user message: ${firstUserText}`,
       `Last assistant message: ${lastAssistantText}`,
     ];
     if (filesModified.length > 0) summaryParts.push(`Files modified: ${filesModified.join(", ")}`);
+    if (commandsRun.length > 0) summaryParts.push(`Commands run: ${commandsRun.join(" | ")}`);
     const summary = summaryParts.join("\n");
     if (!shouldCapture(summary)) {
@@ -281,17 +1179,156 @@ const hookHandlers: Record<string, HookHandler> = {
       return;
     }
-    try {
-      const res = await sulcusMem.add_memory(summary, "episodic");
-      logger.info(`sulcus: pre_compaction_capture — stored session summary (id: ${res?.id ?? "?"})`);
-    } catch (e: unknown) {
-      const msg = e instanceof Error ? e.message : String(e);
-      logger.debug?.(`sulcus: pre_compaction_capture — store failed: ${msg}`);
+    const storePromises: Promise<unknown>[] = [];
+    // Store primary session summary
+    const compactionHints = buildExtractionHints("episodic", ctx.namespace, "compaction", summary.substring(0, 200));
+    storePromises.push(
+      sulcusMem.add_memory(summary, "episodic", compactionHints)
+        .then((res) => logger.info(`sulcus: pre_compaction_capture — stored session summary (id: ${res?.id ?? "?"})`)
+        ).catch((e: unknown) => logger.debug?.(`sulcus: pre_compaction_capture — summary store failed: ${e instanceof Error ? e.message : String(e)}`))
+    );
+    // --- Task 70: Store decisions as semantic memories for long-term value ---
+    if (decisions.length > 0) {
+      const decisionText = `Session decisions: ${decisions.join(" | ")}`;
+      const decisionHints = buildExtractionHints("semantic", ctx.namespace, "compaction", decisionText.substring(0, 200));
+      storePromises.push(
+        sulcusMem.add_memory(decisionText, "semantic", decisionHints)
+          .then((res) => logger.info(`sulcus: pre_compaction_capture — stored decisions (id: ${res?.id ?? "?"})`)
+          ).catch((e: unknown) => logger.debug?.(`sulcus: pre_compaction_capture — decisions store failed: ${e instanceof Error ? e.message : String(e)}`))
+      );
+    }
+    // --- Task 70: Store user intents for multi-query rebuild ---
+    // Store the middle of the session's user intents as a searchable procedural memory.
+    // This lets the post-compaction rebuild find relevant session context.
+    if (userIntents.length > 2) {
+      const midIntents = userIntents.slice(Math.floor(userIntents.length / 4), Math.floor(3 * userIntents.length / 4)).slice(0, 3);
+      const intentsText = `Session user intents: ${midIntents.join(" | ")}`;
+      if (shouldCapture(intentsText)) {
+        const intentHints = buildExtractionHints("episodic", ctx.namespace, "compaction", intentsText.substring(0, 200));
+        storePromises.push(
+          sulcusMem.add_memory(intentsText, "episodic", intentHints)
+            .then((res) => logger.info(`sulcus: pre_compaction_capture — stored intents (id: ${res?.id ?? "?"})`)
+            ).catch((e: unknown) => logger.debug?.(`sulcus: pre_compaction_capture — intents store failed: ${e instanceof Error ? e.message : String(e)}`))
+        );
+      }
     }
+    // Fire all stores in parallel (non-blocking from OpenClaw's perspective)
+    await Promise.allSettled(storePromises);
+    logger.info(`sulcus: pre_compaction_capture — stored ${storePromises.length} memory/memories from ${messages.length}-message session`);
   },
 };
-// ─── CLOUD HTTP CLIENT ───────────────────────────────────────────────────────
+// --- EXTRACTION HINTS -------------------------------------------------------
+/**
+ * Caller-supplied hints for SILU entity extraction + classification.
+ * Mirrors the server-side ExtractionHints struct (entity_extraction.rs).
+ * These are injected as a preamble into the SILU system prompt to guide
+ * extraction without overriding the LLM's judgment.
+ *
+ * Every field is optional. `buildExtractionHints` derives these objects and
+ * `SulcusCloudClient.add_memory` forwards them in the request body under the
+ * `extraction_hints` key.
+ */
+export interface ExtractionHints {
+  /** Entity types the caller expects (e.g. ["person", "tool", "project"]). */
+  entity_types?: string[];
+  /** Free-form domain focus areas (e.g. ["infrastructure", "memory systems"]). */
+  focus_areas?: string[];
+  /** Entity types to suppress if irrelevant (e.g. ["location"]). */
+  suppress_types?: string[];
+  /** Soft suggestion for memory type — SILU may override if content clearly differs. */
+  expected_type?: string;
+  /** Free-form context note injected verbatim (max 500 chars server-side). */
+  context_note?: string;
+}
+/**
+ * Derive ExtractionHints from available context signals.
+ * Called at store time to guide SILU toward better entity extraction + classification.
+ *
+ * Signals are applied in this order: the explicit memory type, the namespace
+ * (mapped to a domain), the hook event type, and finally keyword heuristics on
+ * the content snippet. The keyword heuristics only fill `expected_type` when
+ * no explicit non-episodic memory type was supplied.
+ *
+ * @param memoryType  - The memory type being stored (episodic|semantic|etc.)
+ * @param namespace   - Agent namespace (provides domain context)
+ * @param eventType   - Hook event type (e.g. "sivu_auto_capture", "tool_error", "compaction")
+ * @param contentSnippet - First 200 chars of content for heuristic detection
+ * @returns The derived hints, or `undefined` when no signal produced anything.
+ */
+function buildExtractionHints(
+  memoryType: string | null | undefined,
+  namespace: string,
+  eventType: string,
+  contentSnippet: string
+): ExtractionHints | undefined {
+  const hints: ExtractionHints = {};
+  // Append entity types while keeping the list free of duplicates: the namespace
+  // mapping and the event-type signal can both contribute the same type.
+  const addEntityTypes = (...types: string[]): void => {
+    hints.entity_types = [...new Set([...(hints.entity_types ?? []), ...types])];
+  };
+  // -- Expected type from known memory_type --
+  // "episodic" is not forwarded as a hint; only other explicit types are.
+  if (memoryType && memoryType !== "episodic") {
+    hints.expected_type = memoryType;
+  }
+  // -- Domain focus from namespace --
+  // Namespace is typically the agent id — map known agents to domains.
+  // Tolerate a missing namespace at runtime instead of throwing.
+  const ns = (namespace ?? "").toLowerCase();
+  if (ns.includes("sulcus") || ns.includes("memory")) {
+    hints.focus_areas = ["memory systems", "AI infrastructure", "sulcus"];
+    hints.entity_types = ["tool", "concept", "project", "model"];
+  } else if (ns.includes("daedalus") || ns.includes("forge") || ns.includes("workshop")) {
+    hints.focus_areas = ["infrastructure", "devops", "software engineering", "AI agents"];
+    hints.entity_types = ["tool", "project", "person", "organization"];
+  } else if (ns.includes("icarus") || ns.includes("booker")) {
+    hints.focus_areas = ["product development", "business logic"];
+    hints.entity_types = ["tool", "project", "person"];
+  }
+  // -- Event-type signals --
+  if (eventType === "tool_error") {
+    hints.context_note = "This is a tool failure memory — focus on tool names, error patterns, and failure causes.";
+    addEntityTypes("tool");
+    hints.suppress_types = ["location"];
+  } else if (eventType === "compaction") {
+    hints.context_note = "This is a session summary from context compaction — extract key decisions, files modified, and tasks completed.";
+    addEntityTypes("project", "tool");
+  } else if (eventType === "user_capture") {
+    // User conversational content — don't over-suppress anything
+    if (!hints.context_note) {
+      hints.context_note = "This was captured from a user message during an agent session.";
+    }
+  }
+  // -- Content heuristics --
+  // Only the first matching keyword family is considered, and it never
+  // overrides an expected_type that was already set above.
+  const lower = (contentSnippet ?? "").toLowerCase();
+  if (lower.includes("prefer") || lower.includes("always") || lower.includes("never") || lower.includes("want")) {
+    if (!hints.expected_type) hints.expected_type = "preference";
+  } else if (lower.includes("step") || lower.includes("command") || lower.includes("run ") || lower.includes("deploy")) {
+    if (!hints.expected_type) hints.expected_type = "procedural";
+  } else if (lower.includes("is defined as") || lower.includes("means") || lower.includes("concept") || lower.includes("architecture")) {
+    if (!hints.expected_type) hints.expected_type = "semantic";
+  }
+  // Return undefined if nothing useful was derived (avoid sending empty hints)
+  const hasContent =
+    (hints.entity_types?.length ?? 0) > 0 ||
+    (hints.focus_areas?.length ?? 0) > 0 ||
+    (hints.suppress_types?.length ?? 0) > 0 ||
+    hints.expected_type != null ||
+    hints.context_note != null;
+  return hasContent ? hints : undefined;
+}
+// --- CLOUD HTTP CLIENT -------------------------------------------------------
+// Task 29: Typed HTTP error. Besides the message it exposes the HTTP status
+// code (0 is used by the client for network-level failures) and, when the
+// server sent one on a 429, the Retry-After delay in milliseconds so the retry
+// loop can honour server-specified backoff.
+class SulcusHttpError extends Error {
+  /** HTTP status of the failed response. */
+  public readonly statusCode: number;
+  /** Server-requested wait before retrying, in milliseconds (if any). */
+  public readonly retryAfterMs?: number;
+  constructor(message: string, statusCode: number, retryAfterMs?: number) {
+    super(message);
+    this.statusCode = statusCode;
+    this.retryAfterMs = retryAfterMs;
+    this.name = "SulcusHttpError";
+  }
+}
 class SulcusCloudClient {
   private serverUrl: string;
@@ -302,20 +1339,19 @@ class SulcusCloudClient {
     this.apiKey = apiKey;
   }
-  request(method: string, path: string, body?: unknown): Promise<unknown> {
-    return new Promise((resolveP, rejectP) => {
-      let parsedUrl: URL;
-      try {
-        parsedUrl = new URL(this.serverUrl + path);
-      } catch (e: unknown) {
-        const msg = e instanceof Error ? e.message : String(e);
-        return rejectP(new Error(`SulcusCloudClient: invalid URL ${this.serverUrl}${path}: ${msg}`));
-      }
+  // -- Task 28: Transient retry with exponential backoff ---------------------
+  // Retries on 429/502/503/504 and network errors — up to RETRY_MAX attempts in total.
+  // Backoff between attempts: 400ms → 800ms (jitter ±20%), unless a 429 response
+  // supplies a Retry-After delay. Non-retryable errors (4xx except 429,
+  // 5xx ≠ 502/503/504) are surfaced immediately.
+  private static readonly RETRY_MAX = 3;
+  private static readonly RETRY_BASE_MS = 400;
+  private static readonly RETRY_JITTER = 0.2; // ±20%
+  private _rawRequest(method: string, path: string, bodyStr: string | undefined, parsedUrl: URL): Promise<unknown> {
+    return new Promise((resolveP, rejectP) => {
       const isHttps = parsedUrl.protocol === "https:";
       const transport = isHttps ? https : http;
-      const bodyStr = body !== undefined ? JSON.stringify(body) : undefined;
       const headers: Record<string, string> = {
         "Authorization": `Bearer ${this.apiKey}`,
         "Accept": "application/json",
@@ -339,7 +1375,23 @@ class SulcusCloudClient {
         res.on("end", () => {
           const raw = Buffer.concat(chunks).toString("utf-8");
           if (!res.statusCode || res.statusCode >= 400) {
-            return rejectP(new Error(`SulcusCloudClient: HTTP ${res.statusCode} for ${method} ${path}: ${raw.substring(0, 200)}`));
+            // Task 29: Parse Retry-After header on 429 — prefer server-specified delay
+            let retryAfterMs: number | undefined;
+            if (res.statusCode === 429) {
+              const ra = res.headers["retry-after"];
+              if (ra) {
+                const raNum = Number(ra);
+                // RFC 7231: value is either seconds or an HTTP-date
+                retryAfterMs = isNaN(raNum)
+                  ? Math.max(0, new Date(ra).getTime() - Date.now())
+                  : raNum * 1000;
+              }
+            }
+            return rejectP(new SulcusHttpError(
+              `SulcusCloudClient: HTTP ${res.statusCode} for ${method} ${path}: ${raw.substring(0, 200)}`,
+              res.statusCode,
+              retryAfterMs,
+            ));
           }
           if (!raw || raw.trim() === "") return resolveP(null);
           try {
@@ -350,12 +1402,55 @@ class SulcusCloudClient {
         });
       });
-      req.on("error", (e: Error) => rejectP(new Error(`SulcusCloudClient: network error for ${method} ${path}: ${e.message}`)));
+      req.on("error", (e: Error) => rejectP(new SulcusHttpError(`SulcusCloudClient: network error for ${method} ${path}: ${e.message}`, 0)));
       if (bodyStr !== undefined) req.write(bodyStr);
       req.end();
     });
   }
+  /**
+   * Issue a request against the configured server, retrying transient failures.
+   *
+   * Retryable failures are network errors (statusCode 0) and HTTP 429/502/503/504;
+   * at most RETRY_MAX attempts are made. A positive Retry-After delay carried by
+   * the error takes precedence over the exponential schedule (RETRY_BASE_MS
+   * doubled per attempt, ± RETRY_JITTER).
+   *
+   * @param method - HTTP verb
+   * @param path   - path (and query string) appended to the server URL
+   * @param body   - optional payload; JSON-serialised unless undefined
+   * @returns whatever `_rawRequest` resolves with; rejects with the last error
+   *          once attempts are exhausted or the error is not retryable
+   */
+  request(method: string, path: string, body?: unknown): Promise<unknown> {
+    let target: URL;
+    try {
+      target = new URL(this.serverUrl + path);
+    } catch (cause: unknown) {
+      const reason = cause instanceof Error ? cause.message : String(cause);
+      return Promise.reject(new Error(`SulcusCloudClient: invalid URL ${this.serverUrl}${path}: ${reason}`));
+    }
+    const payload = body === undefined ? undefined : JSON.stringify(body);
+    // 0 = network error, 429 = rate limited (Task 29), 502/503/504 = transient gateway errors
+    const retryableStatuses = new Set<number>([0, 429, 502, 503, 504]);
+    const pause = (ms: number): Promise<void> => new Promise<void>((wake) => setTimeout(wake, ms));
+    const run = async (): Promise<unknown> => {
+      for (let tries = 1; ; tries++) {
+        try {
+          return await this._rawRequest(method, path, payload, target);
+        } catch (failure: unknown) {
+          const err = failure as SulcusHttpError;
+          if (tries >= SulcusCloudClient.RETRY_MAX || !retryableStatuses.has(err.statusCode)) {
+            throw failure;
+          }
+          let waitMs: number;
+          if (err.retryAfterMs !== undefined && err.retryAfterMs > 0) {
+            // Task 29: the server told us how long to back off — honour it
+            waitMs = err.retryAfterMs;
+          } else {
+            // Exponential backoff with jitter
+            const base = SulcusCloudClient.RETRY_BASE_MS * 2 ** (tries - 1);
+            const spread = base * SulcusCloudClient.RETRY_JITTER * (Math.random() * 2 - 1);
+            waitMs = Math.round(base + spread);
+          }
+          await pause(waitMs);
+        }
+      }
+    };
+    return run();
+  }
+  // -- end Task 28 --------------------------------------------------------------
   async search_memory(query: string, limit?: number, namespace?: string): Promise<{ results: Record<string, unknown>[] }> {
     const body: Record<string, unknown> = { query };
     if (limit !== undefined) body.limit = limit;
@@ -365,9 +1460,11 @@ class SulcusCloudClient {
     return { results };
   }
-  async add_memory(content: string, memoryType?: string | null): Promise<{ id: string; [key: string]: unknown }> {
+  /**
+   * Store a new memory node via POST /api/v1/agent/nodes.
+   *
+   * @param content    - memory text, sent as the `label` field
+   * @param memoryType - sent as `memory_type` when truthy
+   * @param hints      - sent as `extraction_hints` when provided
+   * @returns the server response, or `{ id: "unknown" }` when the response is null/undefined
+   */
+  async add_memory(content: string, memoryType?: string | null, hints?: ExtractionHints): Promise<{ id: string; [key: string]: unknown }> {
     const body: Record<string, unknown> = { label: content };
     if (memoryType) body.memory_type = memoryType;
+    // Phase 2: SILU prompt injection — pass extraction hints to guide entity extraction + classification
+    if (hints) body.extraction_hints = hints;
     const res = await this.request("POST", "/api/v1/agent/nodes", body) as Record<string, unknown> | null;
     return (res ?? { id: "unknown" }) as { id: string; [key: string]: unknown };
   }
@@ -431,6 +1528,39 @@ class SulcusCloudClient {
     }
   }
+  /**
+   * Fetch a single memory node by id.
+   *
+   * @param id - node id; URL-encoded before being placed in the path
+   * @returns the node as returned by the server, or null when the server
+   *          answers 404 (or with an empty body)
+   * @throws any request failure other than an HTTP 404
+   */
+  async get_memory(id: string): Promise<Record<string, unknown> | null> {
+    try {
+      return await this.request("GET", `/api/v1/agent/nodes/${encodeURIComponent(id)}`) as Record<string, unknown> | null;
+    } catch (e: unknown) {
+      // Decide on the typed status code, not on the message text: the message
+      // embeds the request path and part of the response body, so a substring
+      // test for "404" would also match an id or payload containing those digits
+      // and silently turn e.g. a 500 into "not found".
+      if (e instanceof SulcusHttpError && e.statusCode === 404) return null;
+      throw e;
+    }
+  }
+  /**
+   * List memory nodes via GET /api/v1/agent/nodes with optional filters.
+   *
+   * `page`, `page_size` and `pinned` are sent whenever they are not undefined;
+   * the string filters are sent only when truthy. The response may be a bare
+   * array or an object carrying the list under `items`, `nodes` or `results`.
+   *
+   * @returns the items plus whatever paging metadata the server supplied
+   */
+  async list_memories(opts: { page?: number; page_size?: number; memory_type?: string; namespace?: string; pinned?: boolean; sort_by?: string; sort_order?: string } = {}): Promise<{ items: Record<string, unknown>[]; total?: number; page?: number; page_size?: number }> {
+    // Ordered (name, value) pairs; an undefined value means "omit this parameter".
+    const candidates: Array<[string, string | undefined]> = [
+      ["page", opts.page !== undefined ? String(opts.page) : undefined],
+      ["page_size", opts.page_size !== undefined ? String(opts.page_size) : undefined],
+      ["memory_type", opts.memory_type || undefined],
+      ["namespace", opts.namespace || undefined],
+      ["pinned", opts.pinned !== undefined ? String(opts.pinned) : undefined],
+      ["sort_by", opts.sort_by || undefined],
+      ["sort_order", opts.sort_order || undefined],
+    ];
+    const query = new URLSearchParams();
+    for (const [key, value] of candidates) {
+      if (value !== undefined) query.set(key, value);
+    }
+    const encoded = query.toString();
+    const suffix = encoded ? `?${encoded}` : "";
+    const reply = await this.request("GET", `/api/v1/agent/nodes${suffix}`) as Record<string, unknown> | unknown[] | null;
+    if (Array.isArray(reply)) {
+      return { items: reply as Record<string, unknown>[], total: reply.length };
+    }
+    const envelope = (reply ?? {}) as Record<string, unknown>;
+    return {
+      items: (envelope.items ?? envelope.nodes ?? envelope.results ?? []) as Record<string, unknown>[],
+      total: envelope.total as number | undefined,
+      page: envelope.page as number | undefined,
+      page_size: envelope.page_size as number | undefined,
+    };
+  }
+  /**
+   * Apply a partial update to a memory node via PATCH /api/v1/agent/memory/:id.
+   *
+   * @param id      - node id; URL-encoded before being placed in the path
+   * @param updates - fields to change, sent as the request body
+   * @returns the response of the underlying request
+   */
+  async update_memory(id: string, updates: { content?: string; label?: string; memory_type?: string; is_pinned?: boolean; current_heat?: number }): Promise<Record<string, unknown> | null> {
+    const target = `/api/v1/agent/memory/${encodeURIComponent(id)}`;
+    return (await this.request("PATCH", target, updates)) as Record<string, unknown> | null;
+  }
   async probe(): Promise<boolean> {
     try {
       await this.search_memory("probe", 1);
@@ -439,36 +1569,118 @@ class SulcusCloudClient {
       return false;
     }
   }
-}
-// ─── NATIVE LIB LOADER ──────────────────────────────────────────────────────
-class NativeLibLoader {
-  // eslint-disable-next-line @typescript-eslint/no-explicit-any
-  private koffi: unknown = null;
-  private storeLib: unknown = null;
-  private vectorsLib: unknown = null;
-  private vectorsHandle: unknown = null;
-  // eslint-disable-next-line @typescript-eslint/no-explicit-any
-  private fn_store_init: any = null;
-  private fn_store_query: any = null;
-  private fn_store_free: any = null;
-  private fn_vectors_create: any = null;
-  private fn_vectors_text: any = null;
-  private fn_vectors_free: any = null;
-  public loaded = false;
-  public error: string | null = null;
-  constructor(private storeLibPath: string, private vectorsLibPath: string) {}
-  init(logger: PluginLogger): void {
+  /**
+   * Fetch graph neighbours for a memory node via AGE Cypher.
+   * Returns [] gracefully if the endpoint is unavailable (server too old).
+   *
+   * @param nodeId - id of the node whose neighbours are requested; URL-encoded into the path
+   * @param limit  - sent as the `limit` query parameter (default 6)
+   * @returns the first present of the response's `neighbors`, `nodes` or `results`
+   *          fields (or the response itself when it is an array); [] when the
+   *          response is empty or the request fails
+   */
+  async graph_neighbors(nodeId: string, limit = 6): Promise<Record<string, unknown>[]> {
     try {
-      // eslint-disable-next-line @typescript-eslint/no-require-imports
-      this.koffi = require("koffi");
+      const res = await this.request("GET", `/api/v1/agent/graph/neighbors/${encodeURIComponent(nodeId)}?limit=${limit}`) as Record<string, unknown> | null;
+      if (!res) return [];
+      const nodes = (res.neighbors ?? res.nodes ?? res.results ?? (Array.isArray(res) ? res : [])) as Record<string, unknown>[];
+      return nodes;
     } catch (e: unknown) {
-      this.error = `koffi not available: ${e instanceof Error ? e.message : e}`;
-      logger.warn(`sulcus: ${this.error}`);
+      const msg = e instanceof Error ? e.message : String(e);
+      // 404 = server too old, no graph endpoint — degrade gracefully
+      // NOTE(review): the fall-through below returns [] as well, so every
+      // failure (not only 404) currently degrades to an empty list.
+      if (msg.includes("404") || msg.includes("HTTP 404")) return [];
+      return [];
+    }
+  }
+  /**
+   * Task 23: SIRU recall logging — post a recall session to the server for training data.
+   * Fire-and-forget: called after each fresh recall, never blocks context injection.
+   * Server stores this in recall_sessions table for SIRU adaptive scoring.
+   *
+   * @param payload - recall session record, sent unchanged as the body of
+   *                  POST /api/v1/agent/recall-log
+   * @returns resolves once the request has settled; never rejects, because
+   *          any failure of the request is swallowed
+   */
+  async recall_log(payload: {
+    namespace: string;
+    agent_id: string;
+    query_text: string;
+    memory_ids: string[];
+    memory_scores: number[];
+    memory_sources: string[];
+    token_budget: number;
+    tokens_used: number;
+    candidates_total: number;
+    candidates_selected: number;
+    semantic_count: number;
+    hot_count: number;
+    entity_count: number;
+    entity_hints: string[];
+  }): Promise<void> {
+    try {
+      await this.request("POST", "/api/v1/agent/recall-log", payload);
+    } catch {
+      // Logging failure must never interrupt recall — silently drop
+    }
+  }
+  /**
+   * Task 35: Entity-context lookup for query expansion.
+   * Asks POST /api/v1/agent/entity-context for graph-connected memories and
+   * sibling entities of the given entity names.
+   *
+   * @param entityNames - entity names to look up, sent as `entity_names`
+   * @param namespace   - included in the request only when truthy
+   * @param limit       - sent as `limit` (default 3)
+   * @returns the response's `entities` list; [] when the response is empty,
+   *          has no `entities`, or the request fails
+   */
+  async entity_context(entityNames: string[], namespace?: string, limit = 3): Promise<EntityContextEntry[]> {
+    try {
+      const payload: Record<string, unknown> = {
+        entity_names: entityNames,
+        limit,
+        ...(namespace ? { namespace } : {}),
+      };
+      const reply = await this.request("POST", "/api/v1/agent/entity-context", payload) as Record<string, unknown> | null;
+      const entities = reply ? (reply.entities as EntityContextEntry[]) : undefined;
+      return entities ?? [];
+    } catch {
+      // Endpoint unavailable or request failed — behave as "no context"
+      return [];
+    }
+  }
+  /**
+   * Task 34: Batch heat-boost — single round-trip to POST /api/v1/agent/boost-batch.
+   * Accepts an array of { id, heat } boost items.
+   *
+   * @param boosts - items to boost, sent as `{ boosts }`
+   * @returns true if the server accepted the batch; false if the endpoint is
+   *          not yet deployed (HTTP 404), in which case the caller falls back
+   *          to individual PATCH requests
+   * @throws any other request failure (5xx, network), so the caller can handle it
+   */
+  async boost_batch(boosts: Array<{ id: string; heat: number }>): Promise<boolean> {
+    try {
+      await this.request("POST", "/api/v1/agent/boost-batch", { boosts });
+      return true;
+    } catch (e: unknown) {
+      // 404 means endpoint not deployed yet — caller will fall back to individual PATCHes.
+      // Check the typed status code rather than searching the message for "404":
+      // the message includes part of the response body, which could contain
+      // those digits on an unrelated failure.
+      if (e instanceof SulcusHttpError && e.statusCode === 404) return false;
+      // Other errors (5xx, network) — propagate so caller can handle
+      throw e;
+    }
+  }
+}
+// --- NATIVE LIB LOADER ------------------------------------------------------
+class NativeLibLoader {
+  // eslint-disable-next-line @typescript-eslint/no-explicit-any
+  private koffi: unknown = null;
+  private storeLib: unknown = null;
+  private vectorsLib: unknown = null;
+  private vectorsHandle: unknown = null;
+  // eslint-disable-next-line @typescript-eslint/no-explicit-any
+  private fn_store_init: any = null;
+  private fn_store_query: any = null;
+  private fn_store_free: any = null;
+  private fn_vectors_create: any = null;
+  private fn_vectors_text: any = null;
+  private fn_vectors_free: any = null;
+  public loaded = false;
+  public error: string | null = null;
+  constructor(private storeLibPath: string, private vectorsLibPath: string) {}
+  init(logger: PluginLogger): void {
+    try {
+      // eslint-disable-next-line @typescript-eslint/no-require-imports
+      this.koffi = require("koffi");
+    } catch (e: unknown) {
+      this.error = `koffi not available: ${e instanceof Error ? e.message : e}`;
+      logger.warn(`sulcus: ${this.error}`);
       return;
     }
@@ -555,7 +1767,7 @@ class NativeLibLoader {
   }
 }
-// ─── PRE-SEND FILTER ─────────────────────────────────────────────────────────
+// --- PRE-SEND FILTER ---------------------------------------------------------
 const JUNK_PATTERNS: RegExp[] = [
   /^(HEARTBEAT_OK|NO_REPLY|NOOP)$/i,
@@ -569,7 +1781,11 @@ const JUNK_PATTERNS: RegExp[] = [
   /^UNTRUSTED (channel|Discord)/i,
   /^<<<EXTERNAL_UNTRUSTED_CONTENT/i,
   /^Runtime:/i,
-  /tool_call|function_call|<function_calls>/i,
+  // Match raw function-call blobs only — NOT prose that mentions tool/function concepts.
+  // e.g. raw JSON {"tool_calls":[...]} or <function_calls><invoke> XML sequences.
+  // Avoids false-positives on architectural content like "the tool call returns..."
+  /^\{"tool_calls":/i,
+  /^<function_calls>\s*<invoke/i,
   /\[Inter-session message\]\s*sourceSession=/i,
   /<<<BEGIN_UNTRUSTED_CHILD_RESULT>>>/,
   /<<<END_UNTRUSTED_CHILD_RESULT>>>/,
@@ -592,7 +1808,7 @@ function isJunkMemory(text: string): boolean {
   return false;
 }
-// ─── CAPTURE DEDUP ───────────────────────────────────────────────────────────
+// --- CAPTURE DEDUP -----------------------------------------------------------
 const captureDedup = new Map<string, number>();
 const DEDUP_WINDOW_MS = 5 * 60 * 1000; // 5 minutes
@@ -608,7 +1824,7 @@ function shouldCapture(content: string): boolean {
   return true;
 }
-// ─── HOOKS CONFIG LOADER ─────────────────────────────────────────────────────
+// --- HOOKS CONFIG LOADER -----------------------------------------------------
 function loadHooksConfig(apiConfig: Record<string, unknown>): HooksConfig {
   const defaultsPath = resolve(__dirname, "hooks.defaults.json");
@@ -630,11 +1846,16 @@ function loadHooksConfig(apiConfig: Record<string, unknown>): HooksConfig {
         memory_recall: { enabled: true },
         memory_store: { enabled: true },
         memory_status: { enabled: true },
+        memory_profile: { enabled: true },
         consolidate: { enabled: false },
         export_markdown: { enabled: false },
         import_markdown: { enabled: false },
         evaluate_triggers: { enabled: false },
+        memory_inspect: { enabled: true },
+        guardrail_status: { enabled: true },
         __sulcus_workflow__: { enabled: true },
+        session_store: { enabled: true },
+        session_recall: { enabled: true },
       },
     };
   }
@@ -668,7 +1889,7 @@ function loadHooksConfig(apiConfig: Record<string, unknown>): HooksConfig {
   return { version: defaults.version, hooks: mergedHooks, tools: mergedTools };
 }
-// ─── RELATIVE TIME FORMATTER ─────────────────────────────────────────────────
+// --- RELATIVE TIME FORMATTER -------------------------------------------------
 function formatRelativeTime(isoTimestamp: string): string {
   try {
@@ -690,7 +1911,767 @@ function formatRelativeTime(isoTimestamp: string): string {
   }
 }
-// ─── SDK RECALL HANDLER (for before_prompt_build with prependContext) ──────────
+// --- MEMORY AGE WARNING (Task 33) ----------------------------------------------
+// A memory counts as stale once its updated_at timestamp lies more than 30 days
+// in the past. Used to emit stale="true" on <memory> elements so the agent can
+// weigh recency.
+const STALE_THRESHOLD_MS = 30 * 24 * 60 * 60 * 1000; // 30 days in ms
+/**
+ * @param isoTimestamp - timestamp string of the memory's last update
+ * @returns true when the timestamp is older than STALE_THRESHOLD_MS; false for
+ *          a missing, empty or unparseable timestamp
+ */
+function isStaleMemory(isoTimestamp: string | undefined): boolean {
+  if (!isoTimestamp) return false;
+  try {
+    const updatedAtMs = new Date(isoTimestamp).getTime();
+    // An unparseable timestamp yields NaN, and any comparison with NaN is false.
+    return updatedAtMs < Date.now() - STALE_THRESHOLD_MS;
+  } catch {
+    return false;
+  }
+}
+// --- CORRECTION DETECTION + HEAT-BOOST (Task 21) ----------------------------------
+/**
+ * Phrases that strongly suggest the user is correcting or updating a prior
+ * belief. All entries are lower-case and are matched as substrings of the
+ * lower-cased message.
+ */
+const CORRECTION_MARKERS: string[] = [
+  "actually,", "actually ", "that's wrong", "thats wrong",
+  "that is wrong", "correction:", "no, it", "no it's", "not quite",
+  "update:", "i meant", "i mean", "i was wrong", "was incorrect",
+  "is incorrect", "please update", "forget that", "ignore that",
+  "disregard", "instead,", "rather,", "not that,", "fix:",
+];
+/**
+ * @param text - full message text
+ * @returns true when the message contains at least one correction marker
+ *          (case-insensitive)
+ */
+function isCorrectionMessage(text: string): boolean {
+  const haystack = text.toLowerCase();
+  for (const marker of CORRECTION_MARKERS) {
+    if (haystack.includes(marker)) return true;
+  }
+  return false;
+}
+// --- ASSISTANT OUTPUT CAPTURE HELPERS (Task 67) ------------------------------
+// Patterns for generic acknowledgments — filler not worth storing as memories.
+// The first four match the whole (trimmed) text; the last matches a leading verb.
+const GENERIC_ACK_PATTERNS: RegExp[] = [
+  /^(ok|okay|sure|got it|will do|understood|noted|done|sounds good|great|perfect|no problem|no worries|absolutely|certainly|of course|copy that|roger|on it|right away|working on it|let me|i'll|i will)[\.!,]?$/i,
+  /^(yes|yeah|yep|yup|nope|no|nah)[\.!]?$/i,
+  /^(thanks|thank you|thx|ty)[\.!]?$/i,
+  /^(one moment|just a moment|give me a (second|moment|sec))[\.!,]?$/i,
+  /^(looking into|checking|fetching|retrieving|processing|analyzing)\b/i,
+];
+/**
+ * Decide whether an assistant output is a generic acknowledgment
+ * (a short filler response not worth capturing as a memory).
+ *
+ * @param text - assistant output; surrounding whitespace is ignored
+ * @returns true when the trimmed text is at most 250 characters long and
+ *          matches one of GENERIC_ACK_PATTERNS
+ */
+function isGenericAck(text: string): boolean {
+  const candidate = text.trim();
+  // Long responses are never pure acks
+  if (candidate.length > 250) return false;
+  for (const pattern of GENERIC_ACK_PATTERNS) {
+    if (pattern.test(candidate)) return true;
+  }
+  return false;
+}
+/** Maximum characters of assistant output to store directly. Longer → summarized. */
+const ASSISTANT_CAPTURE_MAX_DIRECT = 1500;
+/**
+ * Condense a long assistant response into a compact summary for storage.
+ *
+ * Paragraphs (separated by blank lines, longer than 20 characters after
+ * trimming) are selected as follows: the first one (context), interior ones
+ * containing a decision/recommendation marker (until three paragraphs are
+ * held), and the last one (conclusion) unless it equals the first. The
+ * selection is joined with " [...] " and cut to ASSISTANT_CAPTURE_MAX_DIRECT.
+ *
+ * @param text      - full assistant output
+ * @param namespace - namespace written into the summary prefix
+ * @returns the prefixed summary; when no paragraph qualifies, the first
+ *          ASSISTANT_CAPTURE_MAX_DIRECT characters of `text` without a prefix
+ */
+function summarizeForCapture(text: string, namespace: string): string {
+  const DECISION_MARKERS = [
+    "decided", "recommend", "conclusion", "therefore", "result:", "outcome:",
+    "solution:", "answer:", "key point", "important:", "note:", "summary:",
+    "in summary", "to summarize", "bottom line", "takeaway",
+  ];
+  const paragraphs: string[] = [];
+  for (const chunk of text.split(/\n{2,}/)) {
+    const cleaned = chunk.trim();
+    if (cleaned.length > 20) paragraphs.push(cleaned);
+  }
+  if (paragraphs.length === 0) {
+    return text.substring(0, ASSISTANT_CAPTURE_MAX_DIRECT);
+  }
+  // The first paragraph sets the context and is always kept.
+  const selected: string[] = [paragraphs[0]];
+  // Interior paragraphs qualify only when they mention a decision marker.
+  for (const candidate of paragraphs.slice(1, -1)) {
+    if (selected.length >= 3) break;
+    const lowered = candidate.toLowerCase();
+    if (DECISION_MARKERS.some((marker) => lowered.includes(marker))) {
+      selected.push(candidate);
+    }
+  }
+  // The last paragraph carries the conclusion; skip it when it repeats the first.
+  const closing = paragraphs[paragraphs.length - 1];
+  if (closing && closing !== selected[0]) {
+    selected.push(closing);
+  }
+  const condensed = selected.join(" [...] ").substring(0, ASSISTANT_CAPTURE_MAX_DIRECT);
+  return `[assistant summary, ns=${namespace}] ${condensed}`;
+}
+/**
+ * Heat-boost memories semantically related to a correction message.
+ * Searches for up to `limit` related memories and PATCHes each with
+ * elevated heat so they surface strongly and decay slowly.
+ * Best-effort — individual PATCH failures are silently skipped, and a failed
+ * search results in no boosts at all.
+ *
+ * @param sulcusMem - client used for the search and the PATCH requests
+ * @param query     - text to search related memories for
+ * @param namespace - namespace passed to the search
+ * @param boostHeat - value written to each memory's `current_heat`
+ * @param limit     - maximum number of search results to boost
+ * @param logger    - plugin logger (currently unused by this function)
+ * @returns the number of memories whose PATCH succeeded
+ */
+async function boostRelatedMemories(
+  sulcusMem: SulcusCloudClient,
+  query: string,
+  namespace: string,
+  boostHeat: number,
+  limit: number,
+  logger: PluginLogger,
+): Promise<number> {
+  let boosted = 0;
+  try {
+    const res = await sulcusMem.search_memory(query, limit, namespace);
+    const results = res?.results ?? [];
+    await Promise.allSettled(
+      results.map(async (node) => {
+        const nodeId = node.id as string;
+        if (!nodeId) return;
+        try {
+          // Encode the id like the other PATCH call sites do, so an id with
+          // reserved characters cannot alter the request path.
+          await sulcusMem.request("PATCH", `/api/v1/agent/memory/${encodeURIComponent(nodeId)}`, { current_heat: boostHeat });
+          boosted++;
+        } catch {
+          // best-effort
+        }
+      })
+    );
+  } catch {
+    // search failed — no boost possible
+  }
+  return boosted;
+}
+// --- SPACED REPETITION: BOOST ON RECALL -----------------------------------------
+/**
+ * Task 27: Heat-graduated spaced-repetition boost for recalled memories.
+ *
+ * When a memory surfaces in context, its heat is nudged upward so frequently
+ * accessed knowledge persists longer. The result is capped at 0.95 to avoid
+ * pinning memories that should eventually decay. Flat-delta boosts waste PATCH
+ * calls on already-hot nodes and under-reinforce cooling memories, so the
+ * delta is graduated:
+ *
+ *   heat in [0.10, 0.40) → delta 0.12  (cold: needs a real nudge to stay alive)
+ *   heat in [0.40, 0.65) → delta 0.08  (warm: moderate reinforcement)
+ *   heat in [0.65, 0.85) → delta 0.05  (hot: small top-up only)
+ *   heat in [0.85, 1.00] → skip        (already near cap — no wasted PATCH)
+ *   heat below 0.10      → skip        (nearly dead — allowed to decay)
+ *
+ * Memories without an id, or whose heat is missing or not a finite number,
+ * are skipped. Best-effort — request failures are silently swallowed.
+ *
+ * @param sulcusMem - client used for the batch request and fallback PATCHes
+ * @param memories  - recalled memories (only `id` and `current_heat` are read)
+ * @param logger    - receives an info line describing what was boosted
+ */
+async function boostRecalledMemories(
+  sulcusMem: SulcusCloudClient,
+  memories: Array<{ id?: unknown; current_heat?: unknown }>,
+  logger: PluginLogger,
+): Promise<void> {
+  const BOOST_CAP = 0.95;
+  const MIN_HEAT_FOR_BOOST = 0.10; // skip nearly-dead nodes — they should decay
+  const SKIP_ABOVE = 0.85;         // already near cap — no PATCH needed
+  /** Returns heat-graduated boost delta, or 0 if node should be skipped. */
+  function boostDelta(heat: number): number {
+    if (heat < MIN_HEAT_FOR_BOOST || heat >= SKIP_ABOVE) return 0;
+    if (heat < 0.40) return 0.12;
+    if (heat < 0.65) return 0.08;
+    return 0.05;
+  }
+  /**
+   * Normalises an untyped heat value. Anything that is not a finite number
+   * (missing, NaN, non-numeric) becomes 0 and is therefore skipped; without
+   * this, NaN would pass the range checks and be sent as the new heat.
+   */
+  function toHeat(raw: unknown): number {
+    const n = typeof raw === "number" ? raw : typeof raw === "string" ? Number(raw) : NaN;
+    return Number.isFinite(n) ? n : 0;
+  }
+  const toBoost = memories
+    .map((m) => ({ id: m.id as string | undefined, heat: toHeat(m.current_heat) }))
+    .filter((m) => m.id && boostDelta(m.heat) > 0);
+  if (toBoost.length === 0) return;
+  // -- Task 34: Batch heat-boost — single round-trip when server supports it --
+  // Try POST /api/v1/agent/boost-batch first (server >= 2.11.0).
+  // Falls back to N individual PATCHes if the endpoint returns 404.
+  const batchItems = toBoost.map(({ id, heat }) => ({
+    id: id!,
+    heat: parseFloat(Math.min(BOOST_CAP, heat + boostDelta(heat)).toFixed(3)),
+  }));
+  let usedBatch = false;
+  try {
+    usedBatch = await sulcusMem.boost_batch(batchItems);
+  } catch {
+    // network error or 5xx — fall through to individual PATCHes
+  }
+  if (usedBatch) {
+    const totalDeltaBatch = toBoost.reduce((acc, { heat }) => acc + boostDelta(heat), 0);
+    const avgDelta = (totalDeltaBatch / toBoost.length).toFixed(3);
+    logger.info(`sulcus: boost-on-recall — batch boost for ${toBoost.length} memor${toBoost.length === 1 ? "y" : "ies"} (avg Δ${avgDelta}, 1 round-trip)`);
+    return;
+  }
+  // Fallback: individual PATCHes (server < 2.11.0 or batch endpoint unavailable)
+  let boosted = 0;
+  let totalDelta = 0;
+  await Promise.allSettled(
+    toBoost.map(async ({ id, heat }) => {
+      const delta = boostDelta(heat);
+      const newHeat = Math.min(BOOST_CAP, heat + delta);
+      try {
+        await sulcusMem.request("PATCH", `/api/v1/agent/memory/${encodeURIComponent(id!)}`, {
+          current_heat: parseFloat(newHeat.toFixed(3)),
+        });
+        boosted++;
+        totalDelta += delta;
+      } catch {
+        // best-effort — server may be busy or node already decayed
+      }
+    })
+  );
+  if (boosted > 0) {
+    const avgDelta = (totalDelta / boosted).toFixed(3);
+    logger.info(`sulcus: boost-on-recall — individual boost for ${boosted}/${toBoost.length} memor${boosted === 1 ? "y" : "ies"} (avg Δ${avgDelta}, ${toBoost.length} round-trips)`);
+  }
+}
+// --- CONTEXT BUDGET ENFORCEMENT (Task 18) ---------------------------------------
+/**
+ * Cheap token-count approximation used for context-budget enforcement.
+ * Assumes roughly four characters per token (deliberately conservative for
+ * XML-heavy content) and rounds up, so any non-empty text costs at least one token.
+ *
+ * @param text - Text whose size should be estimated.
+ * @returns Estimated token count (0 for the empty string).
+ */
+function estimateTokens(text: string): number {
+  const charCount = text.length;
+  return Math.ceil(charCount / 4);
+}
+/**
+ * Truncate a memory label to fit within a character budget.
+ * Appends an ellipsis ("…") if truncated and prefers to cut at a word boundary
+ * when one lies in the last 40% of the budget; otherwise it hard-cuts.
+ * Three characters are reserved for the ellipsis, so the result never exceeds
+ * `maxChars` — including very small budgets, where only "…" is returned, and
+ * non-positive budgets, where the result is the empty string.
+ *
+ * @param label    - Text to shorten.
+ * @param maxChars - Maximum length of the returned string.
+ * @returns `label` unchanged when it already fits, otherwise a shortened copy.
+ */
+function truncateLabel(label: string, maxChars: number): string {
+  if (label.length <= maxChars) return label;
+  if (maxChars <= 0) return "";
+  // Clamp at 0: a negative end index would make slice() count from the END of
+  // the string and return nearly the whole label for budgets below 3.
+  const keep = Math.max(0, maxChars - 3);
+  const cut = label.lastIndexOf(" ", keep);
+  const boundary = cut > maxChars * 0.6 ? cut : keep;
+  return label.slice(0, boundary) + "…";
+}
+// --- ADAPTIVE SCALING (Task 101) -----------------------------------------------
+// Reduces recall budget and result count as conversation grows.
+// Early turns get full context; later turns shrink to leave room for actual work.
+// This prevents Sulcus from consuming an ever-larger share of the context window
+// in long conversations, which was causing compaction/summarization triggers.
+/** Effective recall limits for one turn after scaling/throttling has been applied. */
+interface AdaptiveScale {
+  /** Scaled result-count limit. */
+  effectiveMax: number;
+  /** Scaled token budget for the recall block. */
+  effectiveTokenBudget: number;
+  /** True when context utilization is so high that injection should be skipped entirely. */
+  selfMuted: boolean;
+}
+/**
+ * Turn-count based scaling of the recall footprint:
+ *
+ *   turns 1–5   → 100% of the configured limits
+ *   turns 6–15  → 80%
+ *   turns 16–30 → 60%
+ *   turns 31+   → 40%
+ *
+ * Results are floored and then clamped to a minimum of 2 results and 500
+ * tokens. This function never self-mutes.
+ *
+ * @param turnCount   - Current turn number within the conversation.
+ * @param maxResults  - Configured maximum number of recall results.
+ * @param tokenBudget - Configured token budget for the recall block.
+ */
+function applyAdaptiveScaling(turnCount: number, maxResults: number, tokenBudget: number): AdaptiveScale {
+  const factor =
+    turnCount > 30 ? 0.4 :
+    turnCount > 15 ? 0.6 :
+    turnCount > 5 ? 0.8 :
+    1.0;
+  const scaledMax = Math.floor(maxResults * factor);
+  const scaledBudget = Math.floor(tokenBudget * factor);
+  return {
+    effectiveMax: Math.max(2, scaledMax),
+    effectiveTokenBudget: Math.max(500, scaledBudget),
+    selfMuted: false,
+  };
+}
+/**
+ * Task 102: Context-window-aware throttling.
+ * Measures the actual prompt size (event.prompt) against the model's context window
+ * and applies aggressive throttling when utilization is high.
+ *
+ * This is the REAL defense against context crashes — turn-based scaling is a heuristic,
+ * but prompt size measurement is ground truth. A few turns with large tool outputs
+ * (e.g. file reads, verbose exec results) can fill the window fast regardless of turn count.
+ *
+ * Thresholds (utilization = ceil(promptChars / 4) / contextWindowTokens):
+ *   <=70%:  no additional throttling (turn-based scaling is sufficient)
+ *   70-85%: 50% of the token budget (floor 300), 60% of the result count (floor 2)
+ *   85-93%: 20% of the token budget (floor 200), at most 2 results
+ *   >93%:   self-mute — return nothing, let the model breathe
+ *
+ * Throttling only ever tightens: the floors above never lift a value beyond
+ * what the incoming `scale` already allowed, and an already-muted scale stays muted.
+ * A non-positive or non-finite `contextWindowTokens` makes utilization
+ * meaningless, so `scale` is returned unchanged in that case.
+ *
+ * @param promptChars         - Length of the current prompt in characters.
+ * @param contextWindowTokens - Model context window size in tokens.
+ * @param scale               - Limits produced by turn-based scaling.
+ * @param logger              - Optional logger; each throttle level logs one line.
+ * @returns The (possibly tightened) limits. The same `scale` object is returned when nothing changes.
+ */
+function applyContextWindowThrottle(
+  promptChars: number,
+  contextWindowTokens: number,
+  scale: AdaptiveScale,
+  logger?: PluginLogger,
+): AdaptiveScale {
+  // Guard: dividing by 0/NaN would yield Infinity (silent permanent self-mute) or NaN.
+  if (!Number.isFinite(contextWindowTokens) || contextWindowTokens <= 0) return scale;
+  // Estimate tokens from chars (~4 chars per token for English + code mixed content)
+  const estimatedTokens = Math.ceil(promptChars / 4);
+  const utilization = estimatedTokens / contextWindowTokens;
+  if (utilization > 0.93) {
+    // DANGER ZONE: self-mute entirely. Every token counts.
+    logger?.warn?.(`sulcus: context window ${(utilization * 100).toFixed(0)}% full (~${estimatedTokens} tokens / ${contextWindowTokens}) — SELF-MUTING recall injection`);
+    return { effectiveMax: 0, effectiveTokenBudget: 0, selfMuted: true };
+  }
+  if (utilization > 0.85) {
+    // HIGH: minimal injection — just enough for continuity
+    logger?.info?.(`sulcus: context window ${(utilization * 100).toFixed(0)}% full — aggressive throttle (20% budget, max 2 results)`);
+    return {
+      effectiveMax: Math.min(2, scale.effectiveMax),
+      effectiveTokenBudget: Math.min(
+        scale.effectiveTokenBudget,
+        Math.max(200, Math.floor(scale.effectiveTokenBudget * 0.2)),
+      ),
+      selfMuted: scale.selfMuted,
+    };
+  }
+  if (utilization > 0.70) {
+    // MODERATE: reduce footprint
+    logger?.debug?.(`sulcus: context window ${(utilization * 100).toFixed(0)}% full — moderate throttle (50% budget)`);
+    return {
+      effectiveMax: Math.min(
+        scale.effectiveMax,
+        Math.max(2, Math.floor(scale.effectiveMax * 0.6)),
+      ),
+      effectiveTokenBudget: Math.min(
+        scale.effectiveTokenBudget,
+        Math.max(300, Math.floor(scale.effectiveTokenBudget * 0.5)),
+      ),
+      selfMuted: scale.selfMuted,
+    };
+  }
+  // <=70%: no additional throttling
+  return scale;
+}
+/**
+ * Trim a heat-sorted list of memory items so the recall block stays within
+ * `tokenBudget` (estimated) tokens. Items are taken in order; the first item
+ * that does not fit ends the selection, so the result is always a prefix of
+ * the input. Labels longer than the per-item cap are shortened first.
+ *
+ * Per-item cap: 40% of the remaining budget (in characters), never more than
+ * 250 chars (Task 101: keeps verbose pointer_summaries from consuming the
+ * context window). Each item is charged its estimated label tokens plus 8
+ * tokens of XML tag overhead.
+ *
+ * @param items        - Memory records with normalized `label` field, sorted by heat desc
+ * @param tokenBudget  - Max tokens for the entire recall block
+ * @param overhead     - Fixed overhead tokens already allocated elsewhere
+ * @returns New array of shallow copies (with possibly truncated labels); the input is not modified.
+ */
+function enforceContextBudget(
+  items: Array<{ label: string; [k: string]: unknown }>,
+  tokenBudget: number,
+  overhead: number
+): Array<{ label: string; [k: string]: unknown }> {
+  const kept: Array<{ label: string; [k: string]: unknown }> = [];
+  const available = tokenBudget - overhead;
+  if (available <= 0) return kept;
+  const MAX_LABEL_CHARS = 250;
+  const XML_TAG_OVERHEAD_TOKENS = 8;
+  const budgetShareChars = Math.floor((available * 4) * 0.4);
+  const labelCap = Math.min(MAX_LABEL_CHARS, budgetShareChars);
+  let spent = 0;
+  for (let idx = 0; idx < items.length; idx++) {
+    const entry = items[idx];
+    const label = truncateLabel(entry.label, labelCap);
+    const cost = estimateTokens(label) + XML_TAG_OVERHEAD_TOKENS;
+    if (spent + cost > available) break;
+    spent += cost;
+    kept.push({ ...entry, label });
+  }
+  return kept;
+}
+// --- DIVERSITY FILTER (Task 20) -----------------------------------------------
+/**
+ * Similarity-penalised diversity filter — prevents the context window from
+ * being filled with near-duplicate memories about the same thing.
+ *
+ * Algorithm (MMR-lite):
+ *   1. Start with the first item (callers pass items sorted by heat desc, so
+ *      this is the highest-heat item).
+ *   2. For each remaining candidate, compute its max similarity
+ *      (topicTokenOverlap) to any already-selected item.
+ *   3. Score = heat * (1 - LAMBDA * maxSim)  where LAMBDA controls how
+ *      strongly we penalise similarity (0 = pure heat, 1 = pure diversity).
+ *   4. Take the highest-scoring candidate out of the pool. Keep it unless its
+ *      max similarity reaches DIVERSITY_SIM_THRESHOLD, in which case it is
+ *      dropped as a near-duplicate. Repeat until `limit` items are selected
+ *      or the pool is empty.
+ *
+ * This keeps the top result trustworthy (highest heat wins) while diversifying
+ * the rest. The result never contains more than `limit` items; a non-positive
+ * `limit` yields an empty array.
+ *
+ * @param items - Candidates with a `label` and a numeric `_heat`, best first.
+ * @param limit - Maximum number of items to return.
+ * @returns The selected items. When `items` has at most one element and
+ *          `limit` is positive, the input array itself is returned.
+ */
+const DIVERSITY_LAMBDA = 0.55; // penalty weight for similarity
+const DIVERSITY_SIM_THRESHOLD = 0.65; // above this → considered near-duplicate
+function diversityFilter(
+  items: Array<{ label: string; _heat: number; [k: string]: unknown }>,
+  limit: number
+): typeof items {
+  // Respect the cap even when it is zero (e.g. a fully throttled turn).
+  if (limit <= 0) return [];
+  if (items.length <= 1) return items;
+  // Always seed with the top-heat item
+  const selected: typeof items = [items[0]];
+  const remaining = items.slice(1);
+  while (selected.length < limit && remaining.length > 0) {
+    let bestIdx = 0;
+    let bestScore = -Infinity;
+    // Max similarity of each candidate to the current selection, kept so the
+    // near-duplicate check below does not have to recompute it.
+    const sims: number[] = [];
+    for (let i = 0; i < remaining.length; i++) {
+      const candidate = remaining[i];
+      let maxSim = 0;
+      for (const sel of selected) {
+        const sim = topicTokenOverlap(candidate.label, sel.label);
+        if (sim > maxSim) maxSim = sim;
+      }
+      sims.push(maxSim);
+      // MMR score: balance heat vs novelty
+      const score = candidate._heat * (1 - DIVERSITY_LAMBDA * maxSim);
+      if (score > bestScore) {
+        bestScore = score;
+        bestIdx = i;
+      }
+    }
+    // The candidate always leaves the pool (this is what guarantees the loop
+    // terminates); it only joins the selection if it is not a near-duplicate.
+    const [chosen] = remaining.splice(bestIdx, 1);
+    if (sims[bestIdx] < DIVERSITY_SIM_THRESHOLD) {
+      selected.push(chosen);
+    }
+  }
+  return selected;
+}
+// --- CONFLICT DETECTION (Task 19) ----------------------------------------------
+/**
+ * Negation/correction helpers. They were written for the Task 19 lightweight
+ * conflict detector, which found pairs of memories that share significant
+ * topic overlap but where one contains negation/correction language that may
+ * contradict the other, OR where both address the same concept but one is
+ * substantially newer (stale vs updated).
+ *
+ * That detector returned pairs as { older, newer } with a reason string,
+ * capped at 3 conflict pairs to stay within token budget. It has since been
+ * replaced by Task 80 temporal supersession (markSuperseded), which reuses
+ * the helpers below.
+ */
+// Lower-case substrings that signal a memory is correcting or negating an
+// earlier statement. Matching is plain substring search, so "not " (with the
+// trailing space) avoids hits inside words such as "notable".
+const NEGATION_MARKERS = [
+  "not ", "no longer", "never", "removed", "deprecated", "disabled",
+  "changed", "replaced", "fixed", "incorrect", "wrong", "actually",
+  "correction", "mistake", "was wrong", "instead", "update:",
+];
+/**
+ * Case-insensitive check for correction/negation language.
+ *
+ * @param text - Memory label or other free text.
+ * @returns True when `text` contains at least one entry of NEGATION_MARKERS.
+ */
+function hasNegationMarker(text: string): boolean {
+  const haystack = text.toLowerCase();
+  for (const marker of NEGATION_MARKERS) {
+    if (haystack.includes(marker)) return true;
+  }
+  return false;
+}
+/**
+ * Topic similarity of two raw strings: tokenizes both with
+ * extractTopicTokens and scores the resulting token sets with topicOverlap.
+ */
+function topicTokenOverlap(a: string, b: string): number {
+  return topicOverlap(extractTopicTokens(a), extractTopicTokens(b));
+}
+/**
+ * Parse a timestamp string into epoch milliseconds.
+ *
+ * @param iso - Date string (ISO 8601 expected); may be undefined or empty.
+ * @returns Milliseconds since the Unix epoch, or 0 when `iso` is missing or
+ *          cannot be parsed. Callers treat 0 as "no timestamp".
+ */
+function parseISOMs(iso: string | undefined): number {
+  if (!iso) return 0;
+  // An unparseable date does not throw — getTime() returns NaN — so the
+  // failure case has to be detected explicitly.
+  const ms = new Date(iso).getTime();
+  return Number.isNaN(ms) ? 0 : ms;
+}
+// -- Task 79: Temporal query detection ------------------------------------------
+// Flags user queries that ask about events in time order ("when did",
+// "what happened yesterday", "sequence of events", ...) so that recall results
+// can be re-sorted chronologically instead of by relevance/heat.
+// Entries are lower-case substrings; "chronolog" is a stem that covers
+// "chronology", "chronological", etc.
+const TEMPORAL_KEYWORDS = [
+  "yesterday", "today", "last week", "this week", "last month", "this month",
+  "days ago", "hours ago", "weeks ago", "months ago",
+  "last monday", "last tuesday", "last wednesday", "last thursday",
+  "last friday", "last saturday", "last sunday",
+  "recently", "timeline", "chronolog", "sequence of", "in order",
+  "what order", "time order", "when did", "when was", "since when",
+  "how long ago", "first thing", "before that", "after that",
+];
+/**
+ * Case-insensitive substring test against TEMPORAL_KEYWORDS.
+ *
+ * @param query - Raw user query.
+ * @returns True when the query contains at least one temporal keyword.
+ */
+function isTemporalQuery(query: string): boolean {
+  const normalized = query.toLowerCase();
+  for (const keyword of TEMPORAL_KEYWORDS) {
+    if (normalized.includes(keyword)) return true;
+  }
+  return false;
+}
+/**
+ * Re-sort recall results chronologically (oldest → newest) for temporal queries.
+ *
+ * If fewer than half of the items carry an `updated_at`, chronological
+ * ordering would be meaningless (too many unknowns) and the input array is
+ * returned as-is. Otherwise a new, sorted array is returned and the input is
+ * left untouched. Items whose timestamp is missing or unparseable are treated
+ * as time 0 and therefore come first; items with equal timestamps keep their
+ * original relative order.
+ *
+ * @param items - Recall results, each optionally carrying an `updated_at` date string.
+ * @returns Items in ascending `updated_at` order, or `items` itself when not re-ranked.
+ */
+function temporalRerank<T extends { updated_at?: string; [k: string]: unknown }>(items: T[]): T[] {
+  const withTimestamp = items.filter((r) => r.updated_at);
+  // Only re-rank if at least half the results have timestamps — otherwise
+  // chronological ordering would be meaningless (too many unknowns).
+  if (withTimestamp.length < items.length / 2) return items;
+  // Resolve each sort key once. A non-finite key (e.g. NaN from a malformed
+  // date) would make the comparator return NaN and leave the order up to the
+  // engine, so it is normalised to 0 here.
+  const keyed = items.map((item) => {
+    const ms = parseISOMs(item.updated_at);
+    return { item, ms: Number.isFinite(ms) ? ms : 0 };
+  });
+  keyed.sort((a, b) => a.ms - b.ms); // ascending = oldest first (chronological)
+  return keyed.map((entry) => entry.item);
+}
+// -- end Task 79 ----------------------------------------------------------------
+// Task 35: entity-context response entry.
+// Shape of one entity as read by expandQueryWithEntities — presumably one
+// element of what client.entity_context() resolves to (confirm against the client).
+interface EntityContextEntry {
+  // Entity name.
+  name: string;
+  // Entity category; the set of allowed values is not visible here (TODO confirm).
+  type: string;
+  // Memories attached to this entity. expandQueryWithEntities turns each one
+  // into an extra recall record, using pointer_summary as the label and
+  // current_heat as the heat.
+  related_memories: Array<{ id: string; pointer_summary: string; memory_type: string; current_heat: number }>;
+  // Entities connected to this one. expandQueryWithEntities uses their names as
+  // synonym terms for query expansion; `relationship` is not read there.
+  connections: Array<{ name: string; relationship: string }>;
+}
+// -- Task 80: Temporal supersession (replaces Task 19 conflict detection) -----
+// When two memories share significant topic overlap AND one is newer (by time
+// or by containing correction/negation language), the newer one is the truth.
+// The older one is historical context that should rank below.
+//
+// Instead of a separate <conflicts> block, we:
+//   1. Detect superseded items via topic overlap + time/negation
+//   2. Mark them with _superseded = true
+//   3. Apply a 50% score penalty so they fall below the budget cut line
+//   4. Tag them with superseded="true" in the XML
+//   5. The newer memory keeps its natural (prominent) position
+//
+// This aligns with transformer attention: prominent/later context items have
+// stronger influence on generation. Newer memory = primary, older = footnote.
+const SUPERSESSION_SCORE_PENALTY = 0.5; // 50% penalty on superseded item scores
+const SUPERSESSION_MIN_OVERLAP = 0.35;  // minimum topic overlap to compare
+const SUPERSESSION_STALENESS_GAP_MS = 7 * 24 * 60 * 60 * 1000; // 7 days
+/**
+ * Scan items for supersession. For every pair whose labels overlap by at
+ * least SUPERSESSION_MIN_OVERLAP, one item may be marked as superseded:
+ *
+ *   - Negation: if exactly one of the two contains correction/negation
+ *     language, the other (non-corrective) item is superseded.
+ *   - Staleness: otherwise, if both have a timestamp and they are more than
+ *     SUPERSESSION_STALENESS_GAP_MS apart, the older item is superseded.
+ *
+ * A superseded item gets `_superseded = true` and its `_heat` multiplied by
+ * SUPERSESSION_SCORE_PENALTY — exactly once, no matter how many newer items
+ * it overlaps with. Mutates items in-place.
+ *
+ * @param items - Candidate memories; `label`, `_heat` and `updated_at` are read.
+ * @returns Number of distinct items that were marked as superseded.
+ */
+function markSuperseded<T extends { label: string; _heat: number; updated_at?: string; _superseded?: boolean; [k: string]: unknown }>(
+  items: T[]
+): number {
+  let supersededCount = 0;
+  const alreadySuperseded = new Set<number>();
+  for (let i = 0; i < items.length; i++) {
+    if (alreadySuperseded.has(i)) continue;
+    for (let j = i + 1; j < items.length; j++) {
+      if (alreadySuperseded.has(j)) continue;
+      const a = items[i];
+      const b = items[j];
+      const overlap = topicTokenOverlap(a.label, b.label);
+      if (overlap < SUPERSESSION_MIN_OVERLAP) continue;
+      // Determine which is newer
+      const aNeg = hasNegationMarker(a.label);
+      const bNeg = hasNegationMarker(b.label);
+      const aMs = parseISOMs(a.updated_at);
+      const bMs = parseISOMs(b.updated_at);
+      let olderIdx: number | null = null;
+      // Negation supersession: the corrective memory supersedes the original
+      if (aNeg !== bNeg) {
+        olderIdx = aNeg ? j : i; // non-negation item is the older/superseded one
+      }
+      // Staleness supersession: significantly newer timestamp wins
+      else if (aMs > 0 && bMs > 0 && Math.abs(aMs - bMs) > SUPERSESSION_STALENESS_GAP_MS) {
+        olderIdx = aMs < bMs ? i : j;
+      }
+      // Item i may already have been superseded earlier in this inner loop;
+      // without this check it would be penalised and counted again for every
+      // further newer item it overlaps with.
+      if (olderIdx !== null && !alreadySuperseded.has(olderIdx)) {
+        items[olderIdx]._superseded = true;
+        items[olderIdx]._heat *= SUPERSESSION_SCORE_PENALTY;
+        alreadySuperseded.add(olderIdx);
+        supersededCount++;
+      }
+    }
+  }
+  return supersededCount;
+}
+// -- end Task 80 -----------------------------------------------------------------
+// Legacy shim: detectConflicts is no longer used internally. It is kept only
+// so that external code still referencing it keeps working, and it always
+// reports "no conflicts" regardless of input.
+function detectConflicts(
+  _items: Array<{ label: string; memory_type?: string; updated_at?: string; [k: string]: unknown }>
+): Array<{ olderLabel: string; newerLabel: string; reason: string }> {
+  const noConflicts: Array<{ olderLabel: string; newerLabel: string; reason: string }> = [];
+  return noConflicts;
+}
+// --- SDK RECALL HANDLER (for before_prompt_build with prependContext) ----------
+// Topic-shift detection constants (Task 14)
+// NOTE(review): the code that compares against these two values is outside
+// this section — presumably the recall cache in the SDK recall handler; confirm there.
+const TOPIC_SHIFT_THRESHOLD = 0.25; // topic-token overlap below this = topic shift
+const TOPIC_CACHE_TTL_MS = 5 * 60 * 1000; // 5 minutes hard TTL
+// Common English function words that carry no topic signal. extractTopicTokens
+// drops them (after lower-casing) before token sets are compared. All entries
+// must be lower-case for that lookup to match.
+const STOPWORDS = new Set([
+  "a", "an", "the", "and", "or", "but", "in", "on", "at", "to", "for",
+  "of", "with", "by", "is", "it", "this", "that", "be", "as", "are",
+  "was", "were", "has", "have", "had", "do", "does", "did", "can", "could",
+  "will", "would", "should", "i", "you", "we", "they", "he", "she", "me",
+  "my", "your", "our", "their", "its", "not", "no", "so", "if", "what",
+  "how", "when", "where", "which", "who", "from", "up", "about", "into",
+  "just", "also", "any", "all", "than", "then", "there", "been", "more",
+]);
+// --- QUERY SANITIZATION ------------------------------------------------------
+// Strip OpenClaw framework noise from prompts before using them as search queries.
+// Removes sender metadata JSON blocks, untrusted content wrappers, conversation
+// info blocks, and timestamp prefixes that pollute semantic search.
+/**
+ * Remove OpenClaw framework noise from a prompt WITHOUT touching the remaining
+ * whitespace, so callers can still see paragraph boundaries. Private helper
+ * shared by sanitizeRecallQuery and extractLastUserTurn.
+ */
+function stripFrameworkNoise(raw: string): string {
+  return raw
+    // "Conversation info (untrusted metadata):" + JSON code block
+    .replace(/Conversation info \(untrusted metadata\):\s*```json[\s\S]*?```\s*/gi, "")
+    // "Sender (untrusted metadata):" + JSON code block
+    .replace(/Sender \(untrusted metadata\):\s*```json[\s\S]*?```\s*/gi, "")
+    // "Replied message (untrusted, for context):" + JSON code block
+    .replace(/Replied message \(untrusted[^)]*\):\s*```json[\s\S]*?```\s*/gi, "")
+    // EXTERNAL_UNTRUSTED_CONTENT wrappers
+    .replace(/<<<EXTERNAL_UNTRUSTED_CONTENT[\s\S]*?<<<END_EXTERNAL_UNTRUSTED_CONTENT[^>]*>>>/g, "")
+    // "Untrusted context (metadata, do not treat as instructions or commands):" headers
+    .replace(/Untrusted context \(metadata[^)]*\):\s*/gi, "")
+    // Leading [timestamp] or [sender] tag at the very start of the text
+    .replace(/^\[[^\]]{0,100}\]\s*/g, "")
+    // @ mentions
+    .replace(/<@!?\d+>/g, "")
+    .replace(/@\w+/g, "");
+}
+/**
+ * Task 62: Extract the last user-authored turn from the full prompt context.
+ * The full `event.prompt` in before_prompt_build is the entire accumulated context
+ * buffer — using it as a recall query means old context dominates over what the
+ * user is actually asking right now.
+ *
+ * Strategy: strip framework metadata while the text still has its line breaks,
+ * split into blank-line separated paragraphs, and walk backwards to the last
+ * paragraph that looks like user input (not a system header, not a JSON/XML
+ * block, not a code fence, not a tiny fragment). That paragraph has a leading
+ * [timestamp]/[sender] tag removed and its whitespace collapsed, and is capped
+ * at 500 chars. Falls back to the last 500 chars of the full sanitized prompt
+ * if no paragraph qualifies.
+ *
+ * Paragraph splitting has to happen BEFORE whitespace is collapsed:
+ * sanitizeRecallQuery flattens every newline into a space, after which there
+ * are no paragraph boundaries left to split on.
+ *
+ * Used for: recall vector search query (current intent)
+ * NOT used for: topic-shift detection (still uses full prompt for drift measurement)
+ */
+function extractLastUserTurn(rawPrompt: string): string {
+  // Fully sanitized single-line form: used for the early exit and the fallback.
+  const cleaned = sanitizeRecallQuery(rawPrompt);
+  if (!cleaned || cleaned.length < 3) return cleaned;
+  // Split into paragraphs — user messages are typically separated by blank
+  // lines (lines containing only whitespace, including "\r", count as blank).
+  const paragraphs = stripFrameworkNoise(rawPrompt)
+    .split(/\n\s*\n/)
+    .map((p) => p.trim())
+    .filter((p) => p.length > 0);
+  // Walk backwards to find the last paragraph that looks like user content
+  for (let i = paragraphs.length - 1; i >= 0; i--) {
+    const p = paragraphs[i];
+    if (/^\{[\s\S]*\}$/.test(p)) continue;  // pure JSON object
+    if (/^<[a-zA-Z]/.test(p) && /<\/[a-zA-Z]/.test(p)) continue;  // pure XML block
+    if (/^(you are|your task|system:|assistant:|\[system\])/i.test(p)) continue;  // system/role headers
+    if (/^\s*```/.test(p)) continue;  // code block
+    // Role checks above run first so that a "[system]" header is not mistaken
+    // for a sender tag and stripped into a usable-looking paragraph.
+    const flat = p
+      .replace(/^\[[^\]]{0,100}\]\s*/, "")
+      .replace(/\s+/g, " ")
+      .trim();
+    if (flat.length < 10) continue;  // too short to be meaningful
+    // Found a usable paragraph — take up to 500 chars
+    return flat.substring(0, 500);
+  }
+  // Fallback: last 500 chars of the full cleaned prompt
+  return cleaned.substring(Math.max(0, cleaned.length - 500));
+}
+/**
+ * Strip OpenClaw framework noise (untrusted-metadata JSON blocks, untrusted
+ * content wrappers, a leading [timestamp]/[sender] tag, @ mentions) from a
+ * prompt and collapse all whitespace to single spaces, producing a one-line
+ * string suitable as a search query.
+ *
+ * @param raw - Prompt text as received from the framework.
+ * @returns The cleaned text, or `raw` unchanged when cleaning would leave nothing.
+ */
+function sanitizeRecallQuery(raw: string): string {
+  const cleaned = stripFrameworkNoise(raw).replace(/\s+/g, " ").trim();
+  return cleaned || raw;
+}
+/**
+ * Turn free text into a set of topic tokens for overlap comparison.
+ *
+ * The text is lower-cased, every character that is not a letter, combining
+ * mark, digit or whitespace is replaced by a space, and the result is split on
+ * whitespace. Tokens of one or two characters and STOPWORDS are dropped. Only
+ * the first 40 surviving tokens (counted before de-duplication) are kept.
+ *
+ * Letters and digits are matched with Unicode property escapes so that
+ * non-ASCII words stay intact ("café" remains one token instead of being cut
+ * down to "caf"); pure-ASCII input tokenizes exactly as before.
+ *
+ * @param text - Any free text (query, label, prompt).
+ * @returns Set of distinct topic tokens, in first-seen order.
+ */
+function extractTopicTokens(text: string): Set<string> {
+  const tokens = text
+    .toLowerCase()
+    .replace(/[^\p{L}\p{M}\p{N}\s]/gu, " ")
+    .split(/\s+/)
+    .filter((t) => t.length > 2 && !STOPWORDS.has(t));
+  return new Set(tokens.slice(0, 40));
+}
+/**
+ * Overlap score of two token sets: the number of shared tokens divided by the
+ * size of the LARGER set. (This is not strict Jaccard, which would divide by
+ * the size of the union.) Ranges from 0 (disjoint) to 1 (identical sets).
+ *
+ * @returns 0 when either set is empty.
+ */
+function topicOverlap(a: Set<string>, b: Set<string>): number {
+  const sizeA = a.size;
+  const sizeB = b.size;
+  if (sizeA === 0 || sizeB === 0) return 0;
+  const sharedCount = Array.from(a).filter((token) => b.has(token)).length;
+  return sharedCount / Math.max(sizeA, sizeB);
+}
+/**
+ * Task 35: Query expansion for thin recall.
+ * Intended for the case where vector search returned fewer than
+ * THIN_RECALL_THRESHOLD results (the caller decides when to invoke it).
+ * Looks up the first five topic tokens of the query via the client's
+ * entity-context call and harvests two things from the returned entities:
+ *
+ * - extraMemories: one record per distinct related memory (first occurrence
+ *   wins), tagged with `_source: "entity_expansion"`
+ * - expandedQuery: the original query with up to 5 distinct connected-entity
+ *   names (longer than 2 chars) appended as synonym terms
+ *
+ * When the query has no topic tokens or no entities come back, the original
+ * query is returned with no extra memories and nothing is logged. Errors from
+ * the client call are not caught here.
+ */
+async function expandQueryWithEntities(
+  client: SulcusCloudClient,
+  originalQuery: string,
+  namespace: string | undefined,
+  logger: PluginLogger,
+): Promise<{ extraMemories: Record<string, unknown>[]; expandedQuery: string }> {
+  const seedTerms = [...extractTopicTokens(originalQuery)].slice(0, 5);
+  if (seedTerms.length === 0) {
+    return { extraMemories: [], expandedQuery: originalQuery };
+  }
+  const entities = await client.entity_context(seedTerms, namespace, 3);
+  if (entities.length === 0) {
+    return { extraMemories: [], expandedQuery: originalQuery };
+  }
+  // Both collections keep first-seen order; the Set/Map also de-duplicate.
+  const synonyms = new Set<string>();
+  const memoriesById = new Map<string, Record<string, unknown>>();
+  for (const entity of entities) {
+    // Connected entity names double as synonym expansion terms
+    for (const conn of entity.connections) {
+      if (conn.name && conn.name.length > 2) synonyms.add(conn.name);
+    }
+    // Memories hanging directly off the entity
+    for (const mem of entity.related_memories) {
+      if (!mem.id || memoriesById.has(mem.id)) continue;
+      memoriesById.set(mem.id, {
+        id: mem.id,
+        label: mem.pointer_summary,
+        pointer_summary: mem.pointer_summary,
+        memory_type: mem.memory_type,
+        current_heat: mem.current_heat,
+        _heat: mem.current_heat,
+        _source: "entity_expansion",
+      });
+    }
+  }
+  const extraMemories = [...memoriesById.values()];
+  // Expanded query: original terms + up to 5 unique synonym terms
+  const uniqueSynonyms = [...synonyms].slice(0, 5);
+  let expandedQuery = originalQuery;
+  if (uniqueSynonyms.length > 0) {
+    expandedQuery = `${originalQuery} ${uniqueSynonyms.join(" ")}`;
+  }
+  logger.info(`sulcus: query expansion found ${entities.length} entity/entities, ${extraMemories.length} extra memories, ${uniqueSynonyms.length} synonym(s)`);
+  return { extraMemories, expandedQuery };
+}
+/** Minimum vector results before triggering query expansion (Task 35). */
+const THIN_RECALL_THRESHOLD = 3;
+// Recall results held between turns by the SDK recall handler.
+// NOTE(review): the code that reads and writes this cache is outside this
+// section; the field notes below are inferred from names and the topic-shift
+// constants — confirm against the handler.
+interface RecallCache {
+  // Cached recall records.
+  results: Record<string, unknown>[];
+  // Presumably the topic tokens of the prompt that produced `results`.
+  topicTokens: Set<string>;
+  // Presumably the epoch-ms time the cache was filled (cf. TOPIC_CACHE_TTL_MS).
+  cachedAt: number;
+}
 interface ProfileCache {
   preferences: Record<string, unknown>[];
@@ -703,29 +2684,263 @@ function buildSdkRecallHandler(
   namespace: string,
   maxResults: number,
   profileFrequency: number,
-  logger: PluginLogger
+  logger: PluginLogger,
+  boostOnRecall: boolean = true,
+  /** Task 66: configurable token budget for recall context injection. */
+  tokenBudget: number = 4000,
+  /** Task 70: enable post-compaction context rebuild. Default true. */
+  contextRebuild: boolean = true,
+  /** Task 102: model context window size in tokens. Used for utilization-based throttling. */
+  contextWindowSize: number = 200000,
 ) {
   let turnCount = 0;
   let profileCache: ProfileCache | null = null;
+  let recallCache: RecallCache | null = null;
+  // -- Task 26: Recall quality metrics (session-scoped) ---------------------
+  let qm_freshRecalls = 0;     // turns where we hit the API (topic shifted)
+  let qm_cacheHits = 0;        // turns where we served cached results
+  let qm_totalItemsServed = 0; // cumulative recall items injected into context
+  let qm_totalFails = 0;       // turns where recall returned nothing
+  const QM_LOG_INTERVAL = 10;  // log a quality summary every N turns
+  // -- end Task 26 ------------------------------------------------------------
   return async (event: Record<string, unknown>, _ctx: unknown): Promise<{ prependContext: string } | undefined> => {
-    const prompt = typeof event?.prompt === "string" ? event.prompt : "";
-    if (!prompt || prompt.length < 5) return undefined;
+    const rawPrompt = typeof event?.prompt === "string" ? event.prompt : "";
+    if (!rawPrompt || rawPrompt.length < 5) return undefined;
+    // Strip OpenClaw metadata noise before using as search query
+    const prompt = sanitizeRecallQuery(rawPrompt);
+    if (!prompt || prompt.length < 3) return undefined;
+    // Task 62: Use focused last-user-turn for recall query; full prompt for topic-shift detection
+    const recallQuery = extractLastUserTurn(rawPrompt);
     turnCount++;
+    // -- Task 101: Adaptive scaling — reduce recall footprint as conversation grows
+    const sdkScale = applyAdaptiveScaling(turnCount, maxResults, tokenBudget);
+    // -- Task 102: Context-window-aware throttling — measure ACTUAL prompt size
+    // This is the real defense against context crashes. Turn-based scaling is a heuristic;
+    // prompt size measurement is ground truth. A few turns with large tool outputs can
+    // fill the window fast regardless of turn count.
+    const throttled = applyContextWindowThrottle(rawPrompt.length, contextWindowSize, sdkScale, logger);
+    if (throttled.selfMuted) {
+      // Context window is critically full. Skip recall and profile injection — let the model breathe.
+      // Return only a one-line marker comment reporting how full the context is.
+      return { prependContext: `<!-- sulcus: self-muted, context ${((rawPrompt.length / 4 / contextWindowSize) * 100).toFixed(0)}% full -->` };
+    }
+    const effectiveMax = throttled.effectiveMax;
+    const effectiveTokenBudget = throttled.effectiveTokenBudget;
+    if (turnCount > 5) logger.debug?.(`sulcus: adaptive scaling (sdk turn ${turnCount}) — limit=${effectiveMax}, budget=${effectiveTokenBudget}`);
+    // -- end Task 101 + 102 -----------------------------------------------------
     const includeProfile = turnCount === 1 || turnCount % profileFrequency === 0;
+    // -- Task 70: Post-compaction context rebuild --------------------------------------
+    // When before_compaction fired, the context window was degraded (150k→20k tokens).
+    // On the very next turn, skip topic-shift cache, use an expanded token budget,
+    // and fire multiple parallel queries to rebuild a rich Sulcus context from scratch.
+    if (wasJustCompacted && contextRebuild) {
+      wasJustCompacted = false; // clear flag — rebuild happens exactly once per compaction
+      logger.info(`sulcus: POST-COMPACTION REBUILD — injecting full Sulcus context (budget: ${REBUILD_TOKEN_BUDGET} tokens)`);
+      try {
+        // Multi-query recall: focused current turn + broader prompt coverage
+        const rebuildQueries = [recallQuery];
+        const promptHead = prompt.substring(0, 150).trim();
+        if (promptHead.length > 10 && promptHead !== recallQuery) rebuildQueries.push(promptHead);
+        const rebuildLimit = Math.min(30, maxResults * 3);
+        const rawParallel = await Promise.allSettled(
+          rebuildQueries.map((q) => sulcusMem.search_memory(q, rebuildLimit, namespace))
+        );
+        const seenRebuildIds = new Set<string>();
+        const rebuildResults: Record<string, unknown>[] = [];
+        for (const r of rawParallel) {
+          if (r.status === "fulfilled") {
+            const items = (r.value?.results ?? []) as Record<string, unknown>[];
+            for (const item of items) {
+              const id = item.id as string;
+              if (!seenRebuildIds.has(id)) { seenRebuildIds.add(id); rebuildResults.push(item); }
+            }
+          }
+        }
+        // Sort by score desc, apply diversity filter (higher threshold — allow more overlap post-compaction)
+        const sorted = rebuildResults.sort((a, b) => ((b.score ?? 0) as number) - ((a.score ?? 0) as number));
+        const diverse = diversityFilter(sorted, 0.9);
+        // Bust the recall cache so next turn re-evaluates fresh
+        recallCache = null;
+        if (diverse.length > 0) {
+          const staleThresholdMs = 30 * 24 * 60 * 60 * 1000;
+          const nowMs = Date.now();
+          const memXml = diverse.map((m) => {
+            const id = m.id as string ?? "?";
+            const content = typeof m.content === "string" ? m.content : JSON.stringify(m.content ?? "");
+            const heat = typeof m.current_heat === "number" ? m.current_heat.toFixed(3) : "?";
+            const score = typeof m.score === "number" ? m.score.toFixed(3) : "?";
+            const mtype = typeof m.memory_type === "string" ? m.memory_type : "unknown";
+            const created = typeof m.created_at === "string" ? m.created_at : null;
+            const stale = created !== null && (nowMs - new Date(created).getTime()) > staleThresholdMs;
+            return `  <memory id="${id}" type="${mtype}" heat="${heat}" score="${score}"${stale ? " age=\"stale\"" : ""}>${escapeXml(content)}</memory>`;
+          }).join("\n");
+          const rebuildXml = [
+            `<sulcus_context mode="post_compaction_rebuild" memories="${diverse.length}" budget="${REBUILD_TOKEN_BUDGET}">`,
+            `  <!-- Context rebuilt from Sulcus after session compaction. Use this to restore working knowledge. -->`,
+            `  <memories count="${diverse.length}">`,
+            memXml,
+            `  </memories>`,
+            `  <session turn="${turnCount}" mode="compaction_rebuild" />`,
+            `</sulcus_context>`,
+          ].join("\n");
+          const budgetedRebuild = enforceContextBudget(rebuildXml, REBUILD_TOKEN_BUDGET);
+          if (boostOnRecall) {
+            boostRecalledMemories(sulcusMem, diverse, namespace, logger).catch(() => {/* non-critical */});
+          }
+          recallQM.freshRecalls++;
+          recallQM.totalItemsServed += diverse.length;
+          logger.info(`sulcus: post-compaction rebuild injected ${diverse.length} memories (~${Math.round(budgetedRebuild.length / 4)} tokens)`);
+          return { prependContext: budgetedRebuild };
+        }
+      } catch (e: unknown) {
+        logger.warn(`sulcus: post-compaction rebuild failed: ${e instanceof Error ? e.message : String(e)} — falling back to normal recall`);
+        // Fall through to normal recall path on error
+      }
+    }
+    // -- end Task 70 --------------------------------------------------------------------
+    // -- Topic-shift detection (Task 14) ---------------------------------------
+    const currentTokens = extractTopicTokens(prompt);
+    const cacheExpired = recallCache !== null && (Date.now() - recallCache.cachedAt) > TOPIC_CACHE_TTL_MS;
+    const overlap = recallCache !== null ? topicOverlap(currentTokens, recallCache.topicTokens) : 0;
+    const topicShifted = recallCache === null || cacheExpired || overlap < TOPIC_SHIFT_THRESHOLD;
+    let searchResults: Record<string, unknown>[] = [];
+    if (!topicShifted && recallCache !== null) {
+      // Topic stable — reuse cached recall results, skip API call
+      searchResults = recallCache.results;
+      qm_cacheHits++; // Task 26: count cache-hit turns
+      recallQM.cacheHits++;  // Task 32: module-scope QM
+      logger.info(`sulcus: topic stable (overlap=${overlap.toFixed(2)}) — serving cached recall (turn ${turnCount})`);
+    } else {
+      if (recallCache !== null) {
+        logger.info(`sulcus: TOPIC SHIFT detected (overlap=${overlap.toFixed(2)}) — fresh recall (turn ${turnCount})`);
+      }
     try {
-      const searchRes = await sulcusMem.search_memory(prompt, maxResults, namespace);
-      const searchResults = searchRes?.results ?? [];
+      // Task 62: Use focused recallQuery instead of full accumulated prompt
+      // Task 101: Use adaptive limit instead of raw config maxResults
+      const searchRes = await sulcusMem.search_memory(recallQuery, effectiveMax, namespace);
+      const vectorResults = searchRes?.results ?? [];
+      // -- Task 35: Query expansion for thin recall (SDK path) ---------------
+      let sdkExpanded = vectorResults;
+      if (vectorResults.length < THIN_RECALL_THRESHOLD) {
+        try {
+          // Task 62: use focused recallQuery for entity expansion
+          const { extraMemories: sdkExtraMem, expandedQuery: sdkExpandedQ } = await expandQueryWithEntities(
+            sulcusMem, recallQuery, namespace, logger
+          );
+          const sdkSeenIds = new Set(vectorResults.map((r) => r.id as string));
+          const sdkNewExtras = sdkExtraMem.filter((m) => !sdkSeenIds.has(m.id as string));
+          if (sdkNewExtras.length > 0) {
+            sdkExpanded = [...vectorResults, ...sdkNewExtras];
+            logger.info(`sulcus: sdk thin-recall expansion added ${sdkNewExtras.length} entity-graph memory/memories`);
+          }
+          if (sdkExpanded.length < THIN_RECALL_THRESHOLD && sdkExpandedQ !== recallQuery) {
+            try {
+              const sdkExpandedRes = await sulcusMem.search_memory(sdkExpandedQ, effectiveMax, namespace);
+              const sdkExpandedVec = sdkExpandedRes?.results ?? [];
+              const sdkExpandedSeen = new Set(sdkExpanded.map((r) => r.id as string));
+              const sdkExpandedNew = sdkExpandedVec.filter((r) => !sdkExpandedSeen.has(r.id as string));
+              if (sdkExpandedNew.length > 0) {
+                sdkExpanded = [...sdkExpanded, ...sdkExpandedNew];
+                logger.info(`sulcus: sdk expanded query search added ${sdkExpandedNew.length} result(s)`);
+              }
+            } catch {
+              // expanded search failed — keep what we have
+            }
+          }
+        } catch {
+          // expansion failed — proceed with original results
+        }
+      }
+      // -- end Task 35 (SDK path) -----------------------------------------
+      // -- Graph-hop expansion (Task 13) ---------------------------------------------
+      // Seed from top-2 expanded results, fetch AGE neighbors in parallel (awaited; individual fetch failures are skipped).
+      // Fold in Memory-type neighbors (heat >= 0.2), dedup against existing results, append at most 4 extras.
+      searchResults = sdkExpanded;
+      const seedIds = sdkExpanded.slice(0, 2).map((r) => r.id as string).filter(Boolean);
+      if (seedIds.length > 0) {
+        try {
+          const neighborFetches = await Promise.allSettled(
+            seedIds.map((id) => sulcusMem.graph_neighbors(id, 6))
+          );
+          const seenIds = new Set(sdkExpanded.map((r) => r.id as string));
+          const graphExtras: Record<string, unknown>[] = [];
+          for (const result of neighborFetches) {
+            if (result.status !== "fulfilled") continue;
+            for (const node of result.value) {
+              const nodeId = node.id as string;
+              if (!nodeId || seenIds.has(nodeId)) continue;
+              const heat = (node.current_heat as number) ?? 0;
+              // Only include meaningful nodes — skip cold ephemeral noise
+              if (heat < 0.2) continue;
+              seenIds.add(nodeId);
+              graphExtras.push(node);
+            }
+          }
+          if (graphExtras.length > 0) {
+            // Sort graph extras by heat desc, cap at 4
+            graphExtras.sort((a, b) => ((b.current_heat as number) ?? 0) - ((a.current_heat as number) ?? 0));
+            // Tag graph-hop results with source so context formatter can annotate them
+            const taggedExtras = graphExtras.slice(0, 4).map((r) => ({ ...r, _source: "graph" }));
+            const sdkHopCount = taggedExtras.length;
+            searchResults = [...sdkExpanded, ...taggedExtras];
+            recallQM.graphHopContrib += sdkHopCount;  // Task 32: module-scope QM
+            recallQM.graphHopTurns++;                   // Task 32: module-scope QM
+            logger.info(`sulcus: graph-hop added ${sdkHopCount} neighbours (seeds: ${seedIds.length})`);
+          }
+        } catch {
+          // graph expansion failed — fall back to vector results only
+        }
+      }
+      // -- end graph-hop ------------------------------------------------------
+      // Update recall cache (fresh fetch path)
+      qm_freshRecalls++; // Task 26: count fresh-recall turns
+      recallQM.freshRecalls++;  // Task 32: module-scope QM
+      recallCache = { results: searchResults, topicTokens: currentTokens, cachedAt: Date.now() };
+    } catch (freshErr) {
+      // fresh recall failed — fall back to cache if available
+      if (recallCache !== null) {
+        logger.warn(`sulcus: fresh recall failed (${freshErr}), using stale cache`);
+        searchResults = recallCache.results;
+      } else {
+        throw freshErr; // no cache to fall back to — let outer catch handle
+      }
+    }
+    } // end topic-shift branch
+    try { // processing, scoring, budget enforcement, XML assembly
       let preferences: Record<string, unknown>[] = [];
       let facts: Record<string, unknown>[] = [];
       if (includeProfile) {
         try {
-          const prefRes = await sulcusMem.search_memory("user preference", Math.min(maxResults, 5), namespace);
-          const factRes = await sulcusMem.search_memory("fact data knowledge", Math.min(maxResults, 5), namespace);
+          const prefRes = await sulcusMem.search_memory("user preference", Math.min(effectiveMax, 5), namespace);
+          const factRes = await sulcusMem.search_memory("fact data knowledge", Math.min(effectiveMax, 5), namespace);
           preferences = (prefRes?.results ?? []).filter((r) => r.memory_type === "preference");
           facts = (factRes?.results ?? []).filter((r) => r.memory_type === "fact");
           profileCache = { preferences, facts, cachedAt: Date.now() };
@@ -743,51 +2958,272 @@ function buildSdkRecallHandler(
       ]);
       const dedupedSearch = searchResults.filter((r) => !profileIds.has(r.id as string));
+      // -- Task 20: Recall diversity filter --------------------------------------
+      // Before budget enforcement: apply MMR-lite diversity filter to recall results.
+      // Penalises near-duplicate memories (same topic, different phrasings) so the
+      // context window surfaces genuinely distinct information.
+      // Pre-normalise labels for topic extraction (no XML escaping yet — that is applied later, before budget enforcement).
+      const preDiversityItems = dedupedSearch.map((r) => ({
+        ...r,
+        label: ((r.label ?? r.pointer_summary ?? r.id ?? "") as string),
+        // Fix 2: prefer server fused_score over raw heat for ranking (Task 58)
+        _heat: (r.score as number) ?? (r.current_heat as number) ?? 0,
+      }));
+      // Sort score-desc first so diversity filter seeds on best item
+      preDiversityItems.sort((a, b) => b._heat - a._heat);
+      const diverseSearch = diversityFilter(preDiversityItems, effectiveMax);
+      const droppedByDiversity = preDiversityItems.length - diverseSearch.length;
+      if (droppedByDiversity > 0) {
+        logger.info(`sulcus: diversity filter dropped ${droppedByDiversity} near-duplicate(s)`);
+      }
+      // -- end Task 20 ------------------------------------------------------
+      // -- Task 18: Context budget enforcement ------------------------------------
+      // -- Category-priority ranking (Mem0 parity) --------------------------
+      // Rank by memory type priority (durable types first), then by heat within tier.
+      // Procedural and preference memories are high-priority (identity/config equivalent).
+      // This ensures persistent knowledge surfaces before transient observations.
+      const TYPE_PRIORITY: Record<string, number> = {
+        procedural: 0, // how-tos = highest priority
+        preference: 1, // user preferences = identity
+        fact: 2,       // stable data
+        semantic: 3,   // domain knowledge
+        episodic: 4,   // events = lowest priority
+      };
+      diverseSearch.sort((a, b) => {
+        const typeA = (a.memory_type as string) ?? "episodic";
+        const typeB = (b.memory_type as string) ?? "episodic";
+        const prioA = TYPE_PRIORITY[typeA] ?? 5;
+        const prioB = TYPE_PRIORITY[typeB] ?? 5;
+        if (prioA !== prioB) return prioA - prioB;
+        return (b._heat as number) - (a._heat as number); // heat desc within tier
+      });
+      // -- end category-priority ranking -------------------------------------
+      // Profile items are sorted by heat desc so the highest-value ones always fit first;
+      // recall items keep the category-priority order established above.
+      // Task 66: token budget is configurable (default 4000). ~80 for fixed overhead.
+      // Remaining split ~30% profile / ~70% recall.
+      // Task 101: Use adaptive token budget instead of raw config value
+      const TOKEN_BUDGET = effectiveTokenBudget;
+      const FIXED_OVERHEAD = 80;
+      const profileBudgetTokens = Math.floor((TOKEN_BUDGET - FIXED_OVERHEAD) * 0.3);
+      const recallBudgetTokens = TOKEN_BUDGET - FIXED_OVERHEAD - profileBudgetTokens;
+      // Normalize + XML-escape labels up front, attach _heat for sorting
+      const profileItemsSorted = [...preferences, ...facts]
+        .map((r) => ({
+          ...r,
+          label: ((r.label ?? r.pointer_summary ?? r.id ?? "") as string)
+            .replace(/&/g, "&amp;").replace(/</g, "&lt;").replace(/>/g, "&gt;"),
+          _heat: (r.current_heat as number) ?? 0,
+        }))
+        .sort((a, b) => b._heat - a._heat);
+      // Task 20: use diversity-filtered items (already ordered by category priority, then score, by the sort above)
+      const recallItemsSorted = diverseSearch
+        .map((r) => ({
+          ...r,
+          label: ((r.label ?? r.pointer_summary ?? r.id ?? "") as string)
+            .replace(/&/g, "&amp;").replace(/</g, "&lt;").replace(/>/g, "&gt;"),
+          _heat: (r.score as number) ?? (r.current_heat as number) ?? 0,
+        }));
+      // -- Task 80: Temporal supersession (SDK path) ------------------------------
+      // Mark older conflicting memories as superseded BEFORE budget enforcement
+      // so the penalty pushes them below the cut line.
+      const sdkSupersededCount = markSuperseded(recallItemsSorted);
+      if (sdkSupersededCount > 0) {
+        logger.info(`sulcus: temporal supersession (sdk) marked ${sdkSupersededCount} memory/memories as superseded`);
+        // Re-sort after penalties so budget cuts superseded items first
+        recallItemsSorted.sort((a, b) => b._heat - a._heat);
+      }
+      const budgetedProfile = enforceContextBudget(profileItemsSorted, TOKEN_BUDGET, FIXED_OVERHEAD + recallBudgetTokens);
+      let budgetedRecall = enforceContextBudget(recallItemsSorted, TOKEN_BUDGET, FIXED_OVERHEAD + profileBudgetTokens);
+      // -- end Task 18 -----------------------------------------------------------
+      // -- Task 79: Temporal re-ranking (SDK path) ---------------------------------
+      const sdkTemporalDetected = isTemporalQuery(recallQuery);
+      if (sdkTemporalDetected) {
+        budgetedRecall = temporalRerank(budgetedRecall);
+        logger.info(`sulcus: temporal query detected (sdk) — re-ranking ${budgetedRecall.length} results chronologically`);
+      }
+      // -- end Task 79 (SDK) -------------------------------------------------------
       const sections: string[] = [];
-      if (includeProfile && (preferences.length > 0 || facts.length > 0)) {
-        const profileLines: string[] = [];
-        for (const r of preferences) {
-          const label = (r.label ?? r.pointer_summary ?? r.id ?? "") as string;
-          profileLines.push(`- [preference] ${label}`);
+      // Task 18: use budgetedProfile (heat-sorted, budget-trimmed, labels already normalized)
+      if (includeProfile && budgetedProfile.length > 0) {
+        const profileElements: string[] = [];
+        for (const r of budgetedProfile) {
+          const mtype = (r.memory_type as string) === "fact" ? "fact" : "preference";
+          const heat = (r._heat as number).toFixed(2);
+          profileElements.push(`  <item type="${mtype}" heat="${heat}">${r.label}</item>`);
         }
-        for (const r of facts) {
-          const label = (r.label ?? r.pointer_summary ?? r.id ?? "") as string;
-          profileLines.push(`- [fact] ${label}`);
-        }
-        if (profileLines.length > 0) {
-          sections.push(`## User Profile (from preferences + facts)\n${profileLines.join("\n")}`);
+        if (profileElements.length > 0) {
+          sections.push(`<profile>\n${profileElements.join("\n")}\n</profile>`);
         }
       }
-      if (dedupedSearch.length > 0) {
-        const memLines = dedupedSearch.slice(0, maxResults).map((r) => {
-          const heat = ((r.current_heat as number) ?? (r.score as number) ?? 0);
-          const pct = `[${Math.round(heat * 100)}%]`;
+      if (budgetedRecall.length > 0) {
+        // -- Task 12: Structured context formatting ----------------------------
+        // Emit each recall item as a <memory> element so the LLM receives a uniform,
+        // machine-readable list. Each element carries type, heat, and age attributes.
+        // Task 18: iterate over budgetedRecall instead of raw dedupedSearch —
+        //   already heat-sorted, budget-trimmed, labels normalized.
+        // Flat recall list — no group wrappers, no source/relevance attributes.
+        // Items already sorted by category-priority (procedural > preference > fact > semantic > episodic)
+        // then by heat within tier. Type is an attribute on each memory element.
+        // Task 79: when temporal, items are re-sorted chronologically (oldest first).
+        const recallElements: string[] = [];
+        for (const r of budgetedRecall) {
+          const heat = r._heat as number;
+          const heatStr = heat.toFixed(2);
+          const mtype = (r.memory_type as string) ?? "episodic";
           const updatedAt = r.updated_at as string | undefined;
-          const timeStr = updatedAt ? `[${formatRelativeTime(updatedAt)}]` : "";
-          const label = (r.label ?? r.pointer_summary ?? r.id ?? "") as string;
-          return `- ${pct} ${timeStr} ${label}`.trim();
-        });
-        sections.push(`## Relevant Memories (with relevance %)\n${memLines.join("\n")}`);
+          const ageStr = updatedAt ? formatRelativeTime(updatedAt) : "unknown";
+          const staleAttr = isStaleMemory(updatedAt) ? ` stale="true"` : "";
+          // Task 80: superseded memories get a marker so the LLM treats them as historical
+          const supersededAttr = r._superseded ? ` superseded="true"` : "";
+          // label already normalized + escaped + budget-truncated by enforceContextBudget
+          recallElements.push(`  <memory type="${mtype}" heat="${heatStr}" age="${ageStr}"${staleAttr}${supersededAttr}>${r.label}</memory>`);
+        }
+        if (recallElements.length > 0) {
+          // Task 79: annotate recall block with ordering hint for the LLM
+          const sdkRecallOrderAttr = sdkTemporalDetected ? ` order="chronological"` : "";
+          sections.push(`<recall${sdkRecallOrderAttr}>\n${recallElements.join("\n")}\n</recall>`);
+        }
+        // -- end Task 12 / Task 18 / Task 79 -----------------------------------------
       }
+      // Task 19 (conflict detection) replaced by Task 80 (temporal supersession).
+      // Superseded items are already marked inline with superseded="true" attribute.
+      // No separate <conflicts> block needed — the transformer sees position + markup.
       if (sections.length === 0) return undefined;
-      const intro =
-        "The following is background context from long-term memory. Use it silently to inform your understanding — only reference it when the conversation naturally calls for it.";
-      const context = `<sulcus_context token_budget="500" namespace="${namespace}">\n${intro}\n\n${sections.join("\n\n")}\n</sulcus_context>`;
+      const guidance = "Background context from long-term memory. Use it silently to inform your understanding — only reference it when the conversation naturally calls for it.";
+      const recallMode = !topicShifted ? "cached" : "fresh";
+      const contextParts: string[] = [
+        `<session turn="${turnCount}" mode="${recallMode}" />`,
+        `<guidance>${guidance}</guidance>`,
+      ];
+      contextParts.push(...sections);
+      const context = `<sulcus_context token_budget="${TOKEN_BUDGET}" namespace="${namespace}">\n${contextParts.join("\n")}\n</sulcus_context>`;
+      // Task 18: log budget utilisation
+      const estimatedTokens = estimateTokens(context);
+      logger.info(`sulcus: SDK recall injecting context (${context.length} chars, ~${estimatedTokens}/${TOKEN_BUDGET} tokens, turn ${turnCount}, profile: ${budgetedProfile.length}, recall: ${budgetedRecall.length})`);
+      // -- Task 26: Recall quality metrics ----------------------------------------
+      qm_totalItemsServed += budgetedRecall.length;
+      if (budgetedRecall.length === 0) qm_totalFails++;
+      // Task 32: write to module-scope QM for memory_status exposure
+      recallQM.totalItemsServed += budgetedRecall.length;
+      if (budgetedRecall.length === 0) recallQM.zeroResultTurns++;
+      if (budgetedRecall.length > 0 && topicShifted) {
+        const sdkAvgScore = budgetedRecall.reduce((s, r) => s + ((r._heat as number) ?? 0), 0) / budgetedRecall.length;
+        recallQM.scoreSum += sdkAvgScore;
+        recallQM.scoreTurns++;
+      }
+      // Emit a periodic quality summary every QM_LOG_INTERVAL turns
+      if (turnCount % QM_LOG_INTERVAL === 0) {
+        const qm_totalRecallTurns = qm_freshRecalls + qm_cacheHits;
+        const qm_cacheHitRate = qm_totalRecallTurns > 0
+          ? ((qm_cacheHits / qm_totalRecallTurns) * 100).toFixed(1)
+          : "0.0";
+        const qm_avgItems = qm_totalRecallTurns > 0
+          ? (qm_totalItemsServed / qm_totalRecallTurns).toFixed(1)
+          : "0.0";
+        logger.info(
+          `sulcus: [quality-metrics turn=${turnCount}] ` +
+          `fresh=${qm_freshRecalls} cached=${qm_cacheHits} ` +
+          `cache_hit_rate=${qm_cacheHitRate}% ` +
+          `avg_items_served=${qm_avgItems} ` +
+          `zero_result_turns=${qm_totalFails}`
+        );
+      }
+      // -- end Task 26 ------------------------------------------------------------
+      // Task 56: write to inspect buffer for memory_inspect tool (SDK path)
+      {
+        const staleSDKItems = budgetedRecall.filter((r) => (r as Record<string, unknown>).stale === true || (r as Record<string, unknown>)._stale === true);
+        const graphSDKItems = budgetedRecall.filter((r) => (r as Record<string, unknown>)._source === "graph");
+        inspectBuffer.lastRecall = {
+          capturedAt: Date.now(),
+          path: "sdk",
+          turn: turnCount,
+          query: prompt.substring(0, 200),
+          fromCache: !topicShifted,
+          itemsInjected: budgetedProfile.length + budgetedRecall.length,
+          recallItems: budgetedRecall.map((r) => ({
+            id: (r.id as string) ?? "",
+            content_preview: ((r.content ?? r.text ?? "") as string).substring(0, 80),
+            memory_type: (r.memory_type ?? r.type ?? "unknown") as string,
+            heat: (r.current_heat ?? r._heat ?? 0) as number,
+            score: (r.score as number | null) ?? null,
+            stale: !!(r.stale ?? r._stale),
+            source: ((r._source as string) === "graph" ? "graph" : "semantic") as "semantic" | "graph" | "unknown",
+          })),
+          profileItems: budgetedProfile.length,
+          staleCount: staleSDKItems.length,
+          graphHopCount: graphSDKItems.length,
+          tokensBudget: TOKEN_BUDGET,
+          tokensUsed: estimatedTokens,
+        };
+      }
+      // Spaced repetition: boost heat for recalled memories (fire-and-forget, non-blocking)
+      if (boostOnRecall && budgetedRecall.length > 0) {
+        boostRecalledMemories(sulcusMem, budgetedRecall, logger).catch(() => {});
+      }
+      // -- Task 23: SIRU recall logging (fire-and-forget, only on fresh recall) ----
+      // Post recall session metadata to the server so SIRU can learn which memories
+      // were most useful. Skipped on cache-hit turns (topicShifted === false) to avoid
+      // logging identical sessions when the topic is stable.
+      if (topicShifted && sulcusMem instanceof SulcusCloudClient) {
+        const recallIds = budgetedRecall.map((r) => (r.id as string) ?? "").filter(Boolean);
+        const recallScores = budgetedRecall.map((r) => (r._heat as number) ?? 0);
+        const recallSources = budgetedRecall.map((r) =>
+          (r._source as string) === "graph" ? "graph" : "semantic"
+        );
+        // Extract entity hints from prompt (reuse topic tokens as lightweight entity proxy)
+        const entityHints = Array.from(currentTokens).slice(0, 10);
+        // Source breakdown counts
+        const semanticCount = recallSources.filter((s) => s === "semantic").length;
+        const graphCount = recallSources.filter((s) => s === "graph").length;
+        sulcusMem.recall_log({
+          namespace,
+          agent_id: namespace,
+          query_text: prompt.substring(0, 500),
+          memory_ids: recallIds,
+          memory_scores: recallScores,
+          memory_sources: recallSources,
+          token_budget: TOKEN_BUDGET,
+          tokens_used: estimatedTokens,
+          candidates_total: searchResults.length,
+          candidates_selected: recallIds.length,
+          semantic_count: semanticCount,
+          hot_count: graphCount,
+          entity_count: entityHints.length,
+          entity_hints: entityHints,
+        }).catch(() => {}); // never block context injection
+        logger.debug?.("sulcus: SIRU recall log posted");
+      }
+      // -- end Task 23 -----------------------------------------------------------
-      logger.info(`sulcus: SDK recall injecting context (${context.length} chars, turn ${turnCount})`);
       return { prependContext: context };
     } catch (err) {
+      qm_totalFails++; // Task 26: count hard-fail turns
+      recallQM.zeroResultTurns++;  // Task 32: module-scope QM
       logger.warn(`sulcus: SDK recall failed: ${err}`);
       return undefined;
     }
   };
 }
-// ─── MEMORY RUNTIME BUILDER ───────────────────────────────────────────────────
+// --- MEMORY RUNTIME BUILDER ---------------------------------------------------
 function buildMemoryRuntime(sulcusMem: SulcusCloudClient, backendMode: string) {
   const searchManager = {
@@ -819,29 +3255,25 @@ function buildMemoryRuntime(sulcusMem: SulcusCloudClient, backendMode: string) {
   };
 }
-// ─── PROMPT SECTION BUILDER ───────────────────────────────────────────────────
+// --- PROMPT SECTION BUILDER ---------------------------------------------------
 function buildPromptSection(params: { availableTools: Set<string> }): string[] {
   const hasRecall = params.availableTools.has("memory_recall");
   const hasStore = params.availableTools.has("memory_store");
   if (!hasRecall && !hasStore) return [];
+  // Behavioral nudge only — tool schemas already document parameters.
+  // Goal: tell the agent WHEN to use memory, not HOW (tool defs handle that).
   const lines: string[] = [
     "## Memory (Sulcus)",
     "",
     "You have persistent thermodynamic memory powered by Sulcus.",
     "Relevant memories are automatically injected at the start of each conversation.",
-    "",
   ];
   if (hasRecall) lines.push("- Use `memory_recall` to search prior conversations, preferences, and facts.");
   if (hasStore) lines.push("- Use `memory_store` to save information the user asks you to remember.");
-  if (params.availableTools.has("memory_delete")) lines.push("- Use `memory_delete` to remove incorrect or stale memories.");
   if (params.availableTools.has("memory_status")) lines.push("- Use `memory_status` to check backend connection and hot nodes.");
-  if (params.availableTools.has("consolidate")) lines.push("- Use `consolidate` to prune cold memories below a heat threshold.");
-  if (params.availableTools.has("export_markdown")) lines.push("- Use `export_markdown` to export all memories as Markdown.");
-  if (params.availableTools.has("import_markdown")) lines.push("- Use `import_markdown` to import memories from a Markdown document.");
-  if (params.availableTools.has("evaluate_triggers")) lines.push("- Use `evaluate_triggers` to evaluate reactive memory triggers.");
   lines.push("");
   lines.push("Memory types: episodic (events, fast decay), semantic (knowledge, slow), preference (opinions, slower), procedural (how-tos, slowest), fact (data, slow)");
@@ -849,7 +3281,7 @@ function buildPromptSection(params: { availableTools: Set<string> }): string[] {
   return lines;
 }
-// ─── TOOL DEFINITIONS ────────────────────────────────────────────────────────
+// --- TOOL DEFINITIONS --------------------------------------------------------
 interface ToolDeps {
   sulcusMem: SulcusCloudClient | null;
@@ -920,7 +3352,9 @@ const toolDefinitions: Record<string, ToolDefinition> = {
         }
         if (!isAvailable || !sulcusMem) throw new Error(`Sulcus unavailable: ${nativeLoader.error || "not loaded"}`);
         const mtype = (params.memory_type as string | undefined) || "episodic";
-        const res = await sulcusMem.add_memory(content, mtype);
+        // Phase 2: SILU prompt injection — derive hints from memory type + namespace for manual stores
+        const storeHints = buildExtractionHints(mtype, namespace, "user_capture", content.substring(0, 200));
+        const res = await sulcusMem.add_memory(content, mtype, storeHints);
         const nodeId = res?.id ?? "unknown";
         let trainResult: string | null = null;
         if (params.train === true) {
@@ -963,8 +3397,66 @@ const toolDefinitions: Record<string, ToolDefinition> = {
           ]);
           const nodeList = hotNodes?.nodes ?? [];
           const si = statusInfo as Record<string, unknown> | null;
+          // Task 32: compute recall quality metrics for exposure
+          const qm_totalTurns = recallQM.freshRecalls + recallQM.cacheHits;
+          const qm_cacheHitRate = qm_totalTurns > 0 ? parseFloat(((recallQM.cacheHits / qm_totalTurns) * 100).toFixed(1)) : null;
+          const qm_avgRelevance = recallQM.scoreTurns > 0 ? parseFloat((recallQM.scoreSum / recallQM.scoreTurns).toFixed(3)) : null;
+          const qm_graphHopRate = qm_totalTurns > 0 ? parseFloat(((recallQM.graphHopTurns / qm_totalTurns) * 100).toFixed(1)) : null;
+          const qm_avgItemsServed = qm_totalTurns > 0 ? parseFloat((recallQM.totalItemsServed / qm_totalTurns).toFixed(1)) : null;
+          const recallQuality = {
+            total_turns: qm_totalTurns,
+            fresh_recalls: recallQM.freshRecalls,
+            cache_hits: recallQM.cacheHits,
+            cache_hit_rate_pct: qm_cacheHitRate,
+            avg_relevance_score: qm_avgRelevance,
+            avg_items_served: qm_avgItemsServed,
+            zero_result_turns: recallQM.zeroResultTurns,
+            graph_hop_turns: recallQM.graphHopTurns,
+            graph_hop_contrib_total: recallQM.graphHopContrib,
+            graph_hop_rate_pct: qm_graphHopRate,
+          };
+          // Task 58: last_injection block — snapshot of what was actually injected last turn
+          let lastInjection: Record<string, unknown> | null = null;
+          const lr = inspectBuffer.lastRecall;
+          if (lr) {
+            const recallHeats = lr.recallItems.map((i) => i.heat);
+            const avgHeat = recallHeats.length > 0
+              ? parseFloat((recallHeats.reduce((s, h) => s + h, 0) / recallHeats.length).toFixed(3))
+              : null;
+            const typeSet = new Set(lr.recallItems.map((i) => i.memory_type));
+            const typeCoveragePct = lr.recallItems.length > 0
+              ? parseFloat(((typeSet.size / 5) * 100).toFixed(1))  // 5 = total memory types
+              : null;
+            const stalePct = lr.recallItems.length > 0
+              ? parseFloat(((lr.staleCount / lr.recallItems.length) * 100).toFixed(1))
+              : null;
+            const ageMs = Date.now() - lr.capturedAt;
+            lastInjection = {
+              captured_ms_ago: ageMs,
+              turn: lr.turn,
+              path: lr.path,
+              from_cache: lr.fromCache,
+              query_preview: lr.query.slice(0, 100),
+              items_injected: lr.itemsInjected,
+              recall_items: lr.recallItems.length,
+              profile_items: lr.profileItems,
+              stale_count: lr.staleCount,
+              stale_pct: stalePct,
+              graph_hop_count: lr.graphHopCount,
+              avg_heat_injected: avgHeat,
+              type_coverage_pct: typeCoveragePct,
+              types_present: Array.from(typeSet),
+              token_budget: lr.tokensBudget,
+              tokens_used: lr.tokensUsed,
+              budget_utilization_pct: lr.tokensBudget > 0
+                ? parseFloat(((lr.tokensUsed / lr.tokensBudget) * 100).toFixed(1))
+                : null,
+            };
+          }
           return {
-            content: [{ type: "text", text: JSON.stringify({ status: "ok", backend: backendMode, namespace, ...(si?.capabilities ? { capabilities: si.capabilities } : {}), ...(si?.stats ? { stats: si.stats } : {}), hot_node_count: nodeList.length, hot_nodes: nodeList }, null, 2) }],
+            content: [{ type: "text", text: JSON.stringify({ status: "ok", backend: backendMode, namespace, ...(si?.capabilities ? { capabilities: si.capabilities } : {}), ...(si?.stats ? { stats: si.stats } : {}), hot_node_count: nodeList.length, hot_nodes: nodeList, recall_quality: recallQuality, last_injection: lastInjection }, null, 2) }],
             details: { status: "ok", backend: backendMode, namespace, count: nodeList.length },
           };
         } catch (e: unknown) {
@@ -1063,9 +3555,234 @@ const toolDefinitions: Record<string, ToolDefinition> = {
       },
   },
+  // memory_get — fetch a single memory node by UUID.
+  // Only works against the cloud client; throws when Sulcus is unavailable or the backend is not cloud.
+  // A missing node is reported as a normal text result with `details.found === false`, not as an error.
+  memory_get: {
+    schema: {
+      name: "memory_get",
+      label: "Get Memory",
+      description: "Fetch a specific memory by its UUID. Returns full memory details including content, type, heat, graph edges, and metadata.",
+      parameters: Type.Object({
+        id: Type.String({ description: "Memory node UUID." }),
+      }),
+    },
+    options: { name: "memory_get" },
+    makeExecute: ({ sulcusMem: client, backendMode, namespace, nativeLoader, isAvailable }) =>
+      async (_id, params) => {
+        // Guard 1: the backend must be loaded and reachable.
+        const ready = isAvailable && client;
+        if (!ready) {
+          throw new Error(`Sulcus unavailable: ${nativeLoader.error || "not loaded"}`);
+        }
+        // Guard 2: get_memory is only called on the cloud client.
+        const isCloud = client instanceof SulcusCloudClient;
+        if (!isCloud) {
+          throw new Error("memory_get requires cloud backend");
+        }
+        const targetId = params.id as string;
+        const memory = await client.get_memory(targetId);
+        if (memory) {
+          // Found: pretty-print the node and echo it (plus backend info) in details.
+          return {
+            content: [{ type: "text", text: JSON.stringify(memory, null, 2) }],
+            details: { ...memory, backend: backendMode, namespace },
+          };
+        }
+        // Falsy response is treated as "no such memory".
+        return {
+          content: [{ type: "text", text: `Memory ${targetId} not found.` }],
+          details: { found: false, id: targetId },
+        };
+      },
+  },
+  // memory_list — paginated browse of stored memories (cloud backend only).
+  // Parameters: page (1-indexed), page_size (1-100), optional memory_type / pinned filters,
+  // sort_by (default "current_heat") and sort_order (default "desc").
+  // Returns a one-line summary followed by the page's items as pretty-printed JSON.
+  // Throws when Sulcus is unavailable or the backend is not the cloud client.
+  memory_list: {
+    schema: {
+      name: "memory_list",
+      label: "List Memories",
+      description: "Browse memories with optional filters. Returns paginated results sorted by heat (hottest first). Use this to explore what Sulcus knows without a search query.",
+      parameters: Type.Object({
+        page: Type.Optional(Type.Number({ default: 1, description: "Page number (1-indexed)." })),
+        page_size: Type.Optional(Type.Number({ default: 20, description: "Results per page (1-100).", minimum: 1, maximum: 100 })),
+        memory_type: Type.Optional(Type.Union([
+          Type.Literal("episodic"), Type.Literal("semantic"), Type.Literal("preference"),
+          Type.Literal("procedural"), Type.Literal("fact"),
+        ], { description: "Filter by memory type." })),
+        pinned: Type.Optional(Type.Boolean({ description: "Filter by pinned status." })),
+        sort_by: Type.Optional(Type.Union([
+          Type.Literal("current_heat"), Type.Literal("created_at"), Type.Literal("updated_at"),
+        ], { description: "Sort field (default: current_heat)." })),
+        sort_order: Type.Optional(Type.Union([
+          Type.Literal("asc"), Type.Literal("desc"),
+        ], { description: "Sort order (default: desc)." })),
+      }),
+    },
+    options: { name: "memory_list" },
+    makeExecute: ({ sulcusMem, backendMode, namespace, nativeLoader, isAvailable }) =>
+      async (_id, params) => {
+        if (!isAvailable || !sulcusMem) throw new Error(`Sulcus unavailable: ${nativeLoader.error || "not loaded"}`);
+        if (!(sulcusMem instanceof SulcusCloudClient)) throw new Error("memory_list requires cloud backend");
+        // Sanitize pagination before it reaches the API: the page is 1-indexed, so 0, negative,
+        // fractional and non-numeric values fall back to a valid whole page number.
+        const rawPage = Number(params.page ?? 1);
+        const page = Number.isFinite(rawPage) ? Math.max(1, Math.floor(rawPage)) : 1;
+        // Math.min/Math.max propagate NaN, so check finiteness first and fall back to the default of 20.
+        const rawPageSize = Number(params.page_size ?? 20);
+        const pageSize = Number.isFinite(rawPageSize)
+          ? Math.min(100, Math.max(1, Math.floor(rawPageSize)))
+          : 20;
+        const res = await sulcusMem.list_memories({
+          page,
+          page_size: pageSize,
+          memory_type: params.memory_type as string | undefined,
+          pinned: params.pinned as boolean | undefined,
+          sort_by: (params.sort_by as string | undefined) ?? "current_heat",
+          sort_order: (params.sort_order as string | undefined) ?? "desc",
+          namespace,
+        });
+        // Tolerate an empty/odd response instead of crashing on `res.items.length`.
+        const items = Array.isArray(res?.items) ? res.items : [];
+        const total = res?.total;
+        const summary = `Page ${page} — ${items.length} memories${total !== undefined ? ` (${total} total)` : ""}`;
+        return {
+          content: [{ type: "text", text: summary + "\n" + JSON.stringify(items, null, 2) }],
+          details: { page, page_size: pageSize, count: items.length, total, backend: backendMode, namespace },
+        };
+      },
+  },
+  // memory_update — patch selected fields of an existing memory node (cloud backend only).
+  // Tool parameters are translated to backend field names before the update call:
+  // content -> label, heat -> current_heat; memory_type and is_pinned pass through unchanged.
+  // When no updatable field is supplied, a hint is returned and no request is made.
+  memory_update: {
+    schema: {
+      name: "memory_update",
+      label: "Update Memory",
+      description: "Update fields on an existing memory in-place. Preserves graph edges and history. More surgical than delete+re-store.",
+      parameters: Type.Object({
+        id: Type.String({ description: "Memory node UUID to update." }),
+        content: Type.Optional(Type.String({ description: "New content text (replaces existing)." })),
+        memory_type: Type.Optional(Type.Union([
+          Type.Literal("episodic"), Type.Literal("semantic"), Type.Literal("preference"),
+          Type.Literal("procedural"), Type.Literal("fact"),
+        ], { description: "New memory type classification." })),
+        is_pinned: Type.Optional(Type.Boolean({ description: "Pin (prevent decay) or unpin." })),
+        heat: Type.Optional(Type.Number({ description: "Set heat directly (0.0-1.0).", minimum: 0, maximum: 1 })),
+      }),
+    },
+    options: { name: "memory_update" },
+    makeExecute: ({ sulcusMem: client, backendMode, namespace, nativeLoader, isAvailable, logger }) =>
+      async (_id, params) => {
+        if (!(isAvailable && client)) {
+          throw new Error(`Sulcus unavailable: ${nativeLoader.error || "not loaded"}`);
+        }
+        if (!(client instanceof SulcusCloudClient)) {
+          throw new Error("memory_update requires cloud backend");
+        }
+        const targetId = params.id as string;
+        // Ordered [tool parameter, backend field] pairs; the order fixes the field order in the report.
+        const fieldMap: [string, string][] = [
+          ["content", "label"],
+          ["memory_type", "memory_type"],
+          ["is_pinned", "is_pinned"],
+          ["heat", "current_heat"],
+        ];
+        const patch: Record<string, unknown> = {};
+        for (const [paramKey, backendKey] of fieldMap) {
+          const value = params[paramKey];
+          if (value !== undefined) patch[backendKey] = value;
+        }
+        const changed = Object.keys(patch);
+        if (changed.length === 0) {
+          return { content: [{ type: "text", text: "No fields to update. Provide at least one of: content, memory_type, is_pinned, heat." }] };
+        }
+        const outcome = await client.update_memory(targetId, patch as any);
+        const fieldList = changed.join(", ");
+        logger.info(`sulcus: memory_update — updated ${targetId} (fields: ${fieldList})`);
+        return {
+          content: [{ type: "text", text: `Updated memory ${targetId} (fields: ${fieldList}). Backend: ${backendMode}, namespace: ${namespace}` }],
+          details: { id: targetId, updated_fields: changed, result: outcome as Record<string, unknown>, backend: backendMode, namespace },
+        };
+      },
+  },
+  // memory_profile — builds a markdown report of memory health from four backend calls:
+  // status, hot nodes, and two searches (for preferences and facts).
+  // Parameter: limit (1-50, default 10) caps the hot-node list and the size of both searches.
+  // Never throws: when the backend is unavailable or a step fails, a text message is returned instead.
+  memory_profile: {
+    schema: {
+      name: "memory_profile",
+      label: "Memory Profile",
+      description: "Show a rich snapshot of this agent's memory health: type distribution, heat curve, top hot nodes, top preferences/facts, and graph stats. Call this to understand what Sulcus knows and how active the memory is.",
+      parameters: Type.Object({
+        limit: Type.Optional(Type.Number({ description: "Max hot nodes to surface (default 10).", minimum: 1, maximum: 50 })),
+      }),
+    },
+    options: { name: "memory_profile" },
+    makeExecute: ({ sulcusMem, backendMode, namespace, isAvailable }) =>
+      async (_id, params) => {
+        // Unlike the other tools, an unavailable backend yields a plain message rather than an exception.
+        if (!isAvailable || !sulcusMem) {
+          return { content: [{ type: "text", text: `Memory profile unavailable — backend: ${backendMode}, namespace: ${namespace}` }] };
+        }
+        // Clamp the requested limit into [1, 50]; defaults to 10 when omitted.
+        const hotLimit = Math.min(50, Math.max(1, (params?.limit as number | undefined) ?? 10));
+        try {
+          // allSettled: a failure in one call only empties its own section of the report.
+          // NOTE(review): sulcusMem is cast to SulcusCloudClient without an instanceof check — confirm
+          // non-cloud backends expose request/list_hot_nodes/search_memory, otherwise the catch below fires.
+          const [statusRes, hotRes, prefRes, factRes] = await Promise.allSettled([
+            (sulcusMem as SulcusCloudClient).request("GET", "/api/v1/agent/memory/status").catch(() => null),
+            (sulcusMem as SulcusCloudClient).list_hot_nodes(hotLimit),
+            // The literal words "preference" / "fact" are used as the search query text;
+            // presumably this biases results toward those types — results are type-filtered below.
+            (sulcusMem as SulcusCloudClient).search_memory("preference", hotLimit),
+            (sulcusMem as SulcusCloudClient).search_memory("fact", hotLimit),
+          ]);
+          // Unwrap each settled result, falling back to null / empty list on rejection or missing field.
+          const status = (statusRes.status === "fulfilled" ? statusRes.value : null) as Record<string, unknown> | null;
+          const hotNodes = (hotRes.status === "fulfilled" ? hotRes.value?.nodes : []) ?? [];
+          const preferences = (prefRes.status === "fulfilled" ? prefRes.value?.results : []) ?? [];
+          const facts = (factRes.status === "fulfilled" ? factRes.value?.results : []) ?? [];
+          // Keep only results whose memory_type (or legacy `type`) matches, capped at 5 each.
+          const prefItems = (preferences as Record<string, unknown>[]).filter(
+            (r) => (r.memory_type ?? r.type) === "preference"
+          ).slice(0, 5);
+          const factItems = (facts as Record<string, unknown>[]).filter(
+            (r) => (r.memory_type ?? r.type) === "fact"
+          ).slice(0, 5);
+          const stats = status?.stats as Record<string, unknown> | undefined;
+          const caps = status?.capabilities as Record<string, unknown> | undefined;
+          // Assemble the markdown report line by line; sections with no data are omitted.
+          const lines: string[] = [];
+          lines.push(`## 🧠 Sulcus Memory Profile`);
+          lines.push(`**Namespace:** ${namespace} | **Backend:** ${backendMode}`);
+          lines.push("");
+          if (stats) {
+            // Missing counters render as "?" rather than failing.
+            const total = (stats.total_nodes ?? stats.total ?? "?") as string | number;
+            const hot = (stats.hot_nodes ?? "?") as string | number;
+            const cold = (stats.cold_nodes ?? "?") as string | number;
+            // average_heat is multiplied by 100 and shown as a percentage with one decimal.
+            const avgHeat = typeof stats.average_heat === "number" ? (stats.average_heat * 100).toFixed(1) + "%" : "?";
+            lines.push(`### Memory Stats`);
+            lines.push(`- **Total nodes:** ${total}`);
+            lines.push(`- **Hot / Cold:** ${hot} hot / ${cold} cold`);
+            lines.push(`- **Average heat:** ${avgHeat}`);
+            if (stats.memory_types && Array.isArray(stats.memory_types)) {
+              // Per-type counts, largest first. Note: sort() reorders stats.memory_types in place.
+              const types = (stats.memory_types as { type: string; count: number }[])
+                .sort((a, b) => b.count - a.count)
+                .map((t) => `${t.type}: ${t.count}`)
+                .join(" | ");
+              lines.push(`- **By type:** ${types}`);
+            }
+            lines.push("");
+          }
+          if (caps) {
+            // List only capability flags whose value is strictly `true`.
+            const enabled = Object.entries(caps)
+              .filter(([, v]) => v === true)
+              .map(([k]) => k)
+              .join(", ");
+            if (enabled) lines.push(`**Active capabilities:** ${enabled}\n`);
+          }
+          if (hotNodes.length > 0) {
+            lines.push(`### 🔥 Top Hot Nodes (${hotNodes.length})`);
+            for (const n of (hotNodes as Record<string, unknown>[]).slice(0, hotLimit)) {
+              const heat = typeof n.current_heat === "number" ? (n.current_heat * 100).toFixed(0) + "%" : "?";
+              const mtype = (n.memory_type ?? n.type ?? "?") as string;
+              // First available of summary/label/content, truncated to 80 characters.
+              const label = ((n.summary ?? n.label ?? n.content ?? "") as string).slice(0, 80);
+              lines.push(`- [${heat} ${mtype}] ${label}`);
+            }
+            lines.push("");
+          }
+          if (prefItems.length > 0) {
+            lines.push(`### 📌 Active Preferences`);
+            for (const p of prefItems) {
+              const heat = typeof p.current_heat === "number" ? (p.current_heat * 100).toFixed(0) + "%" : "?";
+              // Preference/fact labels get a slightly longer 100-character preview.
+              const label = ((p.summary ?? p.label ?? p.content ?? "") as string).slice(0, 100);
+              lines.push(`- [${heat}] ${label}`);
+            }
+            lines.push("");
+          }
+          if (factItems.length > 0) {
+            lines.push(`### 📚 Active Facts`);
+            for (const f of factItems) {
+              const heat = typeof f.current_heat === "number" ? (f.current_heat * 100).toFixed(0) + "%" : "?";
+              const label = ((f.summary ?? f.label ?? f.content ?? "") as string).slice(0, 100);
+              lines.push(`- [${heat}] ${label}`);
+            }
+            lines.push("");
+          }
+          const summary = lines.join("\n");
+          return {
+            content: [{ type: "text", text: summary }],
+            details: { backend: backendMode, namespace, hot_count: hotNodes.length, pref_count: prefItems.length, fact_count: factItems.length },
+          };
+        } catch (e: unknown) {
+          // Any unexpected failure is reported as text so the tool call itself still succeeds.
+          return { content: [{ type: "text", text: `Memory profile error: ${e instanceof Error ? e.message : String(e)}` }] };
+        }
+      },
+  },
   siu_label: {
     schema: {
       name: "siu_label",
       label: "SIU Label",
       description: "Classify text using SIU v2 — returns SIVU store/reject decision and SICU memory type classification.",
       parameters: Type.Object({
@@ -1162,6 +3879,271 @@ const toolDefinitions: Record<string, ToolDefinition> = {
       },
   },
+  // session_store — scratch-pad write scoped to the current conversation.
+  // The memory is written through the regular add_memory path; session scoping is achieved by
+  // recording the returned node id in `sessionMemoryIds`, which session_recall filters on and
+  // which is used to purge session memories at agent_end.
+  // Parameters: content (required), memory_type (default "episodic").
+  // Throws when Sulcus is unavailable; junk-looking content is rejected with `details.filtered`.
+  session_store: {
+    schema: {
+      name: "session_store",
+      label: "Session Store",
+      description: "Store ephemeral context for the current conversation only. Automatically purged when the session ends. Use this for short-term scratch-pad notes, intermediate reasoning, or context that's only relevant to this exchange.",
+      parameters: Type.Object({
+        content: Type.String({ description: "Content to store for this session." }),
+        memory_type: Type.Optional(Type.Union([
+          Type.Literal("episodic"), Type.Literal("semantic"), Type.Literal("preference"),
+          Type.Literal("procedural"), Type.Literal("fact"),
+        ], { description: "Memory type classification. Default: episodic" })),
+      }),
+    },
+    options: { name: "session_store" },
+    makeExecute: ({ sulcusMem, backendMode, namespace, nativeLoader, isAvailable, logger }) =>
+      async (_id, params) => {
+        if (!isAvailable || !sulcusMem) throw new Error(`Sulcus unavailable: ${nativeLoader.error || "not loaded"}`);
+        const content = params.content as string;
+        if (isJunkMemory(content)) {
+          return { content: [{ type: "text", text: "Filtered: content looks like system noise." }], details: { filtered: true } };
+        }
+        const mtype = (params.memory_type as string | undefined) || "episodic";
+        // Session label reported back in `details.namespace`. It is informational only: the write
+        // below does not pass it to the backend, so isolation depends on the tracked id set.
+        const sessionNs = `session:${CURRENT_SESSION_ID}`;
+        const hints = buildExtractionHints(mtype, namespace, "user_capture", content.substring(0, 200));
+        const res = await sulcusMem.add_memory(content, mtype, hints);
+        const nodeId = res?.id ?? "unknown";
+        // Only a real backend id can be recalled or purged later; the "unknown" placeholder must
+        // never enter sessionMemoryIds, or session_recall would report phantom memories and the
+        // end-of-session purge would be handed a bogus id.
+        const tracked = nodeId !== "unknown";
+        if (tracked) {
+          if (sulcusMem instanceof SulcusCloudClient) {
+            // Best-effort heat boost so the note surfaces immediately; failure here is non-fatal.
+            await (sulcusMem as SulcusCloudClient).request("PATCH", `/api/v1/agent/memory/${nodeId}`, {
+              current_heat: 0.95,
+            }).catch(() => {});
+          }
+          sessionMemoryIds.add(nodeId);
+          logger.info(`sulcus: session_store — stored [${mtype}] for session ${CURRENT_SESSION_ID} (id: ${nodeId})`);
+        } else {
+          logger.warn(`sulcus: session_store — backend returned no id for session ${CURRENT_SESSION_ID}; memory is not tracked for purge`);
+        }
+        const text = tracked
+          ? `Stored session memory [${mtype}] (id: ${nodeId}) — will be purged at session end.`
+          : `Stored session memory [${mtype}] (id: ${nodeId}) — backend returned no id, so it cannot be recalled with session_recall or purged at session end.`;
+        return {
+          content: [{ type: "text", text }],
+          details: { id: nodeId, memory_type: mtype, session_id: CURRENT_SESSION_ID, backend: backendMode, namespace: sessionNs, tracked },
+        };
+      },
+  },
+  // session_recall — search restricted to memories written by session_store in this session.
+  // Runs an ordinary search in the main namespace, over-fetching 3x the requested limit, then
+  // keeps only hits whose id is in `sessionMemoryIds`. Short-circuits when nothing was stored yet.
+  session_recall: {
+    schema: {
+      name: "session_recall",
+      label: "Session Recall",
+      description: "Search ephemeral context stored in the current conversation with session_store. Returns only memories from this session — nothing from prior sessions.",
+      parameters: Type.Object({
+        query: Type.String({ description: "Search query string." }),
+        limit: Type.Optional(Type.Number({ default: 5, description: "Maximum results (1-10)." })),
+      }),
+    },
+    options: { name: "session_recall" },
+    makeExecute: ({ sulcusMem: client, backendMode, namespace, nativeLoader, isAvailable }) =>
+      async (_id, params) => {
+        if (!(isAvailable && client)) {
+          throw new Error(`Sulcus unavailable: ${nativeLoader.error || "not loaded"}`);
+        }
+        const nothingStored = sessionMemoryIds.size === 0;
+        if (nothingStored) {
+          return {
+            content: [{ type: "text", text: "No session memories stored yet. Use session_store to add ephemeral context." }],
+            details: { results: [], session_id: CURRENT_SESSION_ID },
+          };
+        }
+        // Requested limit clamped to 1..10 (default 5).
+        const requested = (params.limit as number | undefined) ?? 5;
+        const maxHits = Math.min(10, Math.max(1, requested));
+        // Over-fetch so enough candidates remain after discarding non-session hits.
+        const response = await client.search_memory(params.query as string, maxHits * 3, namespace);
+        const candidates = response?.results ?? [];
+        const ownedBySession = candidates.filter((hit) => sessionMemoryIds.has(hit.id as string));
+        const hits = ownedBySession.slice(0, maxHits);
+        return {
+          content: [{ type: "text", text: JSON.stringify(hits, null, 2) }],
+          details: { results: hits as unknown as Record<string, unknown>[], session_id: CURRENT_SESSION_ID, session_count: sessionMemoryIds.size, backend: backendMode },
+        };
+      },
+  },
+  // memory_inspect — read-only debug view over `inspectBuffer`.
+  // Reports the last recall injection snapshot (or a "no_recall_yet" placeholder) and every
+  // recorded guardrail event, newest first. Takes no parameters and makes no backend calls.
+  memory_inspect: {
+    schema: {
+      name: "memory_inspect",
+      label: "Memory Inspect",
+      description: "Debug window into what Sulcus is actually doing. Shows what was injected in the last recall, what the output/tool guard scanned, what was blocked and why, and the last N guardrail events. Use this to verify Sulcus is working correctly.",
+      parameters: Type.Object({}),
+    },
+    options: { name: "memory_inspect" },
+    makeExecute: (_deps: ToolDeps) =>
+      async (_id: string, _params: Record<string, unknown>) => {
+        // Single timestamp so every "ago" value in the report is relative to the same instant.
+        const now = Date.now();
+        // Format last recall snapshot
+        const recall = inspectBuffer.lastRecall;
+        const recallSection: Record<string, unknown> = recall
+          ? {
+              captured_ago_s: Math.round((now - recall.capturedAt) / 1000),
+              path: recall.path,
+              turn: recall.turn,
+              query_preview: recall.query,
+              from_cache: recall.fromCache,
+              items_injected: recall.itemsInjected,
+              profile_items: recall.profileItems,
+              recall_item_count: recall.recallItems.length,
+              stale_items: recall.staleCount,
+              graph_hop_items: recall.graphHopCount,
+              tokens_used: recall.tokensUsed,
+              tokens_budget: recall.tokensBudget,
+              // Per-item view; heat and score are rendered as fixed-precision strings.
+              recall_items: recall.recallItems.map((r) => ({
+                id: r.id,
+                preview: r.content_preview,
+                type: r.memory_type,
+                heat: r.heat.toFixed(3),
+                score: r.score !== null ? r.score.toFixed(4) : null,
+                stale: r.stale,
+                source: r.source,
+              })),
+            }
+          : { status: "no_recall_yet", note: "No recall injection has occurred this session yet." };
+        // Format guardrail events (most recent first); slice() copies so the buffer is not reversed in place.
+        const events = inspectBuffer.guardrailEvents
+          .slice()
+          .reverse()
+          .map((e) => ({
+            ago_s: Math.round((now - e.capturedAt) / 1000),
+            guard: e.guard,
+            event: e.eventType,
+            action: e.action,
+            details: e.details,
+            // Optional fields are only emitted when set.
+            ...(e.toolName ? { tool: e.toolName } : {}),
+            ...(e.severity ? { severity: e.severity } : {}),
+          }));
+        const result = {
+          last_recall: recallSection,
+          guardrail_events: events.length > 0 ? events : [{ status: "none", note: "No guardrail events this session." }],
+          guardrail_event_count: inspectBuffer.guardrailEvents.length,
+        };
+        const lines: string[] = [
+          // "\u{1F50D}" is the magnifying-glass emoji. The previous "\U0001f50d" was a Python-style
+          // escape; JavaScript treats "\U" as a plain "U", so the heading rendered "U0001f50d".
+          "## \u{1F50D} Sulcus Inspect",
+          "",
+          "### Last Recall Injection",
+          "```json",
+          JSON.stringify(recallSection, null, 2),
+          "```",
+          "",
+          "### Guardrail Events (most recent first)",
+          "```json",
+          JSON.stringify(events.length > 0 ? events : [{ status: "none" }], null, 2),
+          "```",
+        ];
+        return {
+          content: [{ type: "text", text: lines.join("\n") }],
+          details: result as unknown as Record<string, unknown>,
+        };
+      },
+  },
+  // guardrail_status — read-only report of the current guardrail configuration.
+  // Reads the module-level `guardrailStatus` (output guard, tool guard, negative-preference cache
+  // accessors) and the five most recent blocking/flagging events from `inspectBuffer`.
+  // Takes no parameters. Returns a "not_initialized" result while `guardrailStatus` is unset.
+  guardrail_status: {
+    schema: {
+      name: "guardrail_status",
+      label: "Guardrail Status",
+      description: "Returns current guardrail configuration: outputGuard enabled/disabled, which rules are active (PII/preferences/custom), last 5 blocked events with reasons, preference keywords cached, negative prefs count. Use this to verify the guard is working and what it's watching.",
+      parameters: Type.Object({}),
+    },
+    options: { name: "guardrail_status" },
+    makeExecute: (_deps: ToolDeps) =>
+      async (_id: string, _params: Record<string, unknown>) => {
+        // Single timestamp so all "ago" values are relative to the same instant.
+        const now = Date.now();
+        if (!guardrailStatus) {
+          return {
+            content: [{ type: "text", text: "## 🛡️ Guardrail Status\n\nPlugin not fully initialized yet. Try again after the first turn." }],
+            details: { status: "not_initialized" },
+          };
+        }
+        const gs = guardrailStatus;
+        // Negative-preference cache: entry count and age in seconds (null when no cache timestamp).
+        const negCount = gs.negPrefCount();
+        const negCachedAt = gs.negPrefCachedAt();
+        const negCacheAge = negCachedAt ? Math.round((now - negCachedAt) / 1000) : null;
+        // Last 5 blocked/flagged guardrail events, newest first. An event qualifies when its action is
+        // block/redact/replace/warn or its event type mentions "violation" or "blocked".
+        const blockedEvents = inspectBuffer.guardrailEvents
+          .slice()
+          .reverse()
+          .filter((e) => e.action === "block" || e.action === "redact" || e.action === "replace" || e.action === "warn" || e.eventType.includes("violation") || e.eventType.includes("blocked"))
+          .slice(0, 5)
+          .map((e) => ({
+            ago_s: Math.round((now - e.capturedAt) / 1000),
+            guard: e.guard,
+            event: e.eventType,
+            action: e.action,
+            details: e.details,
+            ...(e.toolName ? { tool: e.toolName } : {}),
+            ...(e.severity ? { severity: e.severity } : {}),
+          }));
+        // Structured (snake_case) copy of the configuration, returned in `details`.
+        const result = {
+          output_guard: {
+            enabled: gs.outputGuard.enabled,
+            pii: gs.outputGuard.pii,
+            preference_violation: gs.outputGuard.preferenceViolation,
+            fail_mode: gs.outputGuard.failMode,
+            audit_trail: gs.outputGuard.auditTrail,
+          },
+          tool_guard: {
+            enabled: gs.toolGuard.enabled,
+            sensitive_tools: gs.toolGuard.sensitiveTools,
+            allowlist: gs.toolGuard.allowlist,
+            blocklist: gs.toolGuard.blocklist,
+            objective_check: gs.toolGuard.objectiveCheck,
+            require_approval_threshold: gs.toolGuard.requireApprovalThreshold,
+            fail_mode: gs.toolGuard.failMode,
+            audit_trail: gs.toolGuard.auditTrail,
+          },
+          neg_pref_cache: {
+            count: negCount,
+            cached_age_s: negCacheAge,
+            note: negCount === 0 ? "No negative preferences cached (cache empty or not yet loaded)" : `${negCount} negative preference(s) cached`,
+          },
+          recent_blocked_events: blockedEvents.length > 0 ? blockedEvents : [{ status: "none", note: "No blocks/violations this session" }],
+        };
+        // One-line human-readable status per guard; the disabled variant names the config key to flip.
+        const ogStatus = gs.outputGuard.enabled
+          ? `✅ enabled (PII: ${gs.outputGuard.pii.enabled ? "on" : "off"}, prefViolation: ${gs.outputGuard.preferenceViolation.enabled ? "on" : "off"})`
+          : `❌ disabled (set guardrails.outputGuard.enabled=true to activate)`;
+        const tgStatus = gs.toolGuard.enabled
+          ? `✅ enabled (objectiveCheck: ${gs.toolGuard.objectiveCheck ? "on" : "off"}, threshold: ${gs.toolGuard.requireApprovalThreshold})`
+          : `❌ disabled (set guardrails.toolGuard.enabled=true to activate)`;
+        // Markdown report; per-guard detail bullets are only included while that guard is enabled.
+        const lines: string[] = [
+          "## 🛡️ Guardrail Status",
+          "",
+          `**Output Guard:** ${ogStatus}`,
+          ...(gs.outputGuard.enabled ? [
+            `  - PII patterns: ${gs.outputGuard.pii.patterns.join(", ")}`,
+            `  - PII action: ${gs.outputGuard.pii.onViolation} (reversible: ${gs.outputGuard.pii.reversible})`,
+            `  - Preference violation action: ${gs.outputGuard.preferenceViolation.onViolation}`,
+            `  - Fail mode: ${gs.outputGuard.failMode}`,
+          ] : []),
+          "",
+          `**Tool Guard:** ${tgStatus}`,
+          ...(gs.toolGuard.enabled ? [
+            `  - Sensitive tools: ${gs.toolGuard.sensitiveTools.join(", ")}`,
+            `  - Allowlist: ${gs.toolGuard.allowlist.length > 0 ? gs.toolGuard.allowlist.join(", ") : "(none)"}`,
+            `  - Blocklist: ${gs.toolGuard.blocklist.length > 0 ? gs.toolGuard.blocklist.join(", ") : "(none)"}`,
+            `  - Approval threshold: ${gs.toolGuard.requireApprovalThreshold}`,
+            `  - Fail mode: ${gs.toolGuard.failMode}`,
+          ] : []),
+          "",
+          `**Negative Pref Cache:** ${negCount} prefs cached${negCacheAge !== null ? `, ${negCacheAge}s ago` : ""}`,
+          "",
+          `**Recent Blocks (last 5):**`,
+          "```json",
+          JSON.stringify(blockedEvents.length > 0 ? blockedEvents : [{ status: "none" }], null, 2),
+          "```",
+        ];
+        return {
+          content: [{ type: "text", text: lines.join("\n") }],
+          details: result as unknown as Record<string, unknown>,
+        };
+      },
+  },
   __sulcus_workflow__: {
     schema: {
       name: "__sulcus_workflow__",
@@ -1187,7 +4169,7 @@ const toolDefinitions: Record<string, ToolDefinition> = {
   },
 };
-// ─── FIRST-INSTALL HISTORY IMPORT ────────────────────────────────────────────
+// --- FIRST-INSTALL HISTORY IMPORT --------------------------------------------
 async function importOpenClawHistory(sulcusMem: SulcusCloudClient, logger: PluginLogger): Promise<void> {
   // eslint-disable-next-line @typescript-eslint/no-require-imports
@@ -1254,7 +4236,7 @@ async function importOpenClawHistory(sulcusMem: SulcusCloudClient, logger: Plugi
   } catch (_e) { /* best-effort */ }
 }
-// ─── PLUGIN ──────────────────────────────────────────────────────────────────
+// --- PLUGIN ------------------------------------------------------------------
 const sulcusPlugin = {
   id: "openclaw-sulcus",
@@ -1264,9 +4246,17 @@ const sulcusPlugin = {
   register(api: Record<string, unknown>) {
     const logger = api.logger as PluginLogger;
-    const pluginConfig = (api.pluginConfig ?? {}) as Record<string, unknown>;
+    const rawPluginConfig = (api.pluginConfig ?? {}) as Record<string, unknown>;
+    // -- Task 69: Load sulcus.toml config layer --
+    // sulcus.toml provides file-based defaults. Plugin UI config wins on conflict.
+    // Precedence: pluginConfig (OpenClaw UI) > sulcus.toml > built-in defaults.
+    const tomlConfigPath = rawPluginConfig?.configFile as string | undefined;
+    const tomlConfig = loadSulcusToml(tomlConfigPath, logger);
+    // Merge: toml is the base, pluginConfig overrides. Deep merge for nested objects.
+    const pluginConfig = mergeConfig(tomlConfig, rawPluginConfig);
-    // ── Configuration ──
+    // -- Configuration --
     const libDir = pluginConfig?.libDir
       ? resolve(pluginConfig.libDir as string)
       : resolve(process.env.HOME || "~", ".sulcus/lib");
@@ -1307,11 +4297,26 @@ const sulcusPlugin = {
     const autoCapture: boolean = (pluginConfig?.autoCapture as boolean | undefined) ?? false;
     const maxRecallResults: number = Math.min(20, Math.max(1, (pluginConfig?.maxRecallResults as number | undefined) ?? 5));
     const profileFrequency: number = Math.min(500, Math.max(1, (pluginConfig?.profileFrequency as number | undefined) ?? 10));
-    // ── Load hooks config ──
+    // Task 66: configurable recall token budget. Final value is clamped to [100, 8000]; default 4000.
+    // Task 101: maxRecallChars, when set to a non-zero value, takes precedence over tokenBudget (converted at ~4 chars/token).
+    const rawMaxRecallChars = pluginConfig?.maxRecallChars as number | undefined;
+    const tokenBudgetFromChars = rawMaxRecallChars ? Math.floor(rawMaxRecallChars / 4) : undefined; // 0/undefined => fall through to tokenBudget
+    const tokenBudget: number = Math.min(8000, Math.max(100, tokenBudgetFromChars ?? (pluginConfig?.tokenBudget as number | undefined) ?? 4000));
+    // Task 102: Context window size for utilization-based throttling. Floor of 8000, default 200000, no upper bound.
+    const contextWindowSize: number = Math.max(8000, (pluginConfig?.contextWindowSize as number | undefined) ?? 200000);
+    const boostOnRecallEnabled: boolean = (pluginConfig?.boostOnRecall as boolean | undefined) ?? true; // on unless explicitly configured
+    // Task 67: assistant output capture (off unless captureFromAssistant is set)
+    const captureFromAssistant: boolean = (pluginConfig?.captureFromAssistant as boolean | undefined) ?? false;
+    // Task 70: Context rebuild config. Only an explicit contextRebuild.enabled=false disables it here; NOTE(review): any autoRecall/cloud gating happens elsewhere — confirm.
+    const contextRebuildEnabled: boolean = (pluginConfig?.contextRebuild as Record<string, unknown> | undefined)?.enabled !== false;
+    const contextRebuildBudget: number = Math.min(10000, Math.max(500, (
+      (pluginConfig?.contextRebuild as Record<string, unknown> | undefined)?.tokenBudget as number | undefined
+    ) ?? 4000)); // clamped to [500, 10000]; default 4000
+    // -- Load hooks config --
     const hooksConfig = loadHooksConfig(pluginConfig);
-    // ── Backend init ──
+    // -- Backend init --
     let sulcusMem: SulcusCloudClient | null = null;
     let backendMode = "unavailable";
@@ -1358,9 +4363,13 @@ const sulcusPlugin = {
     // Update static awareness with runtime info
     STATIC_AWARENESS = buildStaticAwareness(backendMode, namespace);
-    // ── Startup summary ──
+    // Task 70: Wire contextRebuild budget to module-scope variable so rebuild
+    // handler (inside buildSdkRecallHandler closure) picks up configured value.
+    REBUILD_TOKEN_BUDGET = contextRebuildBudget;
+    // -- Startup summary --
     if (isAvailable) {
-      logger.info(`sulcus: ready ✅ (backend: ${backendMode}, namespace: ${namespace}, autoRecall: ${autoRecall}, autoCapture: ${autoCapture})`);
+      logger.info(`sulcus: ready ✅ (backend: ${backendMode}, namespace: ${namespace}, autoRecall: ${autoRecall}, autoCapture: ${autoCapture}, captureFromAssistant: ${captureFromAssistant}, contextRebuild: ${contextRebuildEnabled})`);
     } else {
       // Give clear, actionable guidance instead of cryptic error chains
       const hints: string[] = [];
@@ -1380,12 +4389,12 @@ const sulcusPlugin = {
       logger.warn(`sulcus: not ready — ${hints.join(". ")}`);
     }
-    // ── SIU v2 request helper ──
+    // -- SIU v2 request helper --
     const siuRequestFn = isCloudBackend && sulcusMem
       ? (method: string, path: string, body?: unknown) => (sulcusMem as SulcusCloudClient).request(method, path, body)
       : null;
-    // ── Shared deps ──
+    // -- Shared deps --
     const toolDeps: ToolDeps = {
       sulcusMem,
       backendMode,
@@ -1408,11 +4417,15 @@ const sulcusPlugin = {
       storeLibPath,
       vectorsLibPath,
       wasmDir,
+      boostOnRecall: boostOnRecallEnabled,
+      profileFrequency,
+      tokenBudget,
+      contextWindowSize,
     };
-    // ─────────────────────────────────────────────────────────────────────────
+    // -------------------------------------------------------------------------
     // SDK INTEGRATIONS (v4.0.0)
-    // ─────────────────────────────────────────────────────────────────────────
+    // -------------------------------------------------------------------------
     // 1. registerMemoryRuntime — Sulcus becomes the OpenClaw memory backend
     if (isCloudBackend && sulcusMem && typeof (api.registerMemoryRuntime as unknown) === "function") {
@@ -1490,7 +4503,11 @@ const sulcusPlugin = {
           namespace,
           maxRecallResults,
           profileFrequency,
-          logger
+          logger,
+          boostOnRecallEnabled,
+          tokenBudget,
+          contextRebuildEnabled,
+          contextWindowSize,
         );
         const apiOn = api.on as (event: string, handler: unknown) => void;
         apiOn("before_prompt_build", async (event: Record<string, unknown>, ctx: unknown) => {
@@ -1557,7 +4574,10 @@ const sulcusPlugin = {
       const agentEndCaptureConfig: HookConfig = {
         action: "sivu_auto_capture",
         enabled: true,
-        min_store_confidence: 0.5,
+        // Task 25: Lowered from 0.5 → 0.4 — SIVU gate was too aggressive,
+        // rejecting real architectural/technical content that scored in the
+        // 0.4–0.5 range. 0.4 is still well above noise threshold (< 0.2).
+        min_store_confidence: 0.4,
         fallback_on_error: true,
       };
       const apiOn = api.on as (event: string, handler: unknown) => void;
@@ -1572,9 +4592,635 @@ const sulcusPlugin = {
       logger.info("sulcus: registered auto-capture (agent_end)");
     }
-    // ─────────────────────────────────────────────────────────────────────────
+    // -------------------------------------------------------------------------
+    // SESSION MEMORY AUTO-PURGE (Task 30)
+    // When agent_end fires, delete all session-scoped memories so they don't
+    // persist beyond the conversation. Fire-and-forget — purge failure is silent.
+    // -------------------------------------------------------------------------
+    if (isAvailable && sulcusMem instanceof SulcusCloudClient) {
+      // Registers an agent_end handler that deletes every memory ID tracked in
+      // sessionMemoryIds. Deletion is fire-and-forget: the handler does not wait
+      // for the requests, and individual failures only show up in the summary count.
+      const sessionPurgeApiOn = api.on as (event: string, handler: unknown) => void;
+      sessionPurgeApiOn("agent_end", async () => {
+        if (sessionMemoryIds.size === 0) return;
+        // Snapshot and clear before any async work so a later agent_end does not
+        // re-submit the same IDs while these deletes are still in flight.
+        const ids = Array.from(sessionMemoryIds);
+        sessionMemoryIds.clear();
+        const noun = `session memor${ids.length === 1 ? "y" : "ies"}`;
+        logger.info(`sulcus: session_purge — purging ${ids.length} ${noun} (session: ${CURRENT_SESSION_ID})`);
+        // Do NOT attach a per-promise .catch here: that would turn every rejection
+        // into a fulfilled result and make the purged count always read N/N.
+        // allSettled itself never rejects, and the async wrapper also converts a
+        // synchronous throw from delete_memory into a rejected result.
+        void Promise.allSettled(
+          ids.map(async (id) => {
+            await (sulcusMem as SulcusCloudClient).delete_memory(id, false);
+          })
+        ).then((results) => {
+          const deleted = results.filter((r) => r.status === "fulfilled").length;
+          logger.info(`sulcus: session_purge — purged ${deleted}/${ids.length} ${noun}`);
+        }).catch(() => { /* logging must never surface as an unhandled rejection */ });
+      });
+      logger.info(`sulcus: registered session_purge (agent_end) for session ${CURRENT_SESSION_ID}`);
+    }
+    // -------------------------------------------------------------------------
+    // DREAM AUTO-TRIGGER (Phase 4)
+    // Cheap local gates → expensive API call → fire-and-forget consolidation.
+    // Gate cascade: session counter → time gap → memory count → lock → execute.
+    // -------------------------------------------------------------------------
+    const dreamEnabled = (pluginConfig?.dreamAutoTrigger as boolean) !== false; // default: true
+    // Gate 1 computes `count % interval`; an interval of 0 or a non-number would make
+    // that NaN and silently disable dreaming, so coerce to a positive integer (default 10).
+    const rawDreamSessionInterval = Number(pluginConfig?.dreamSessionInterval ?? 10);
+    const dreamSessionInterval = Number.isFinite(rawDreamSessionInterval)
+      ? Math.max(1, Math.floor(rawDreamSessionInterval))
+      : 10;
+    const dreamMinGapMs = ((pluginConfig?.dreamMinGapHours as number) ?? 24) * 3600_000;
+    const dreamMinMemories = (pluginConfig?.dreamMinMemories as number) ?? 50;
+    const dreamMinHeat = (pluginConfig?.dreamConsolidateMinHeat as number) ?? 0.1;
+    // Directory holding dream-state.json and dream.lock (cross-session persistence).
+    const dreamStateDir = resolve(__dirname, ".sulcus-state");
+    // Creating the directory can fail (e.g. a read-only install location). That must
+    // not abort register(), so report it and skip dream registration instead of throwing.
+    const ensureDreamStateDir = (): boolean => {
+      try {
+        if (!existsSync(dreamStateDir)) mkdirSync(dreamStateDir, { recursive: true });
+        return true;
+      } catch (e: unknown) {
+        logger.warn(`sulcus/dream: auto-trigger disabled — cannot create state dir ${dreamStateDir}: ${e instanceof Error ? e.message : e}`);
+        return false;
+      }
+    };
+    if (dreamEnabled && isAvailable && sulcusMem instanceof SulcusCloudClient && ensureDreamStateDir()) {
+      const dreamStateFile = resolve(dreamStateDir, "dream-state.json");
+      const dreamLockFile = resolve(dreamStateDir, "dream.lock");
+      // In-memory session counter (resets on gateway restart, which is fine)
+      let dreamSessionCount = 0;
+      // Read persisted state; a missing or corrupted file is treated as "never dreamed".
+      function readDreamState(): { lastDreamMs: number; lastSessionCount: number } {
+        try {
+          if (existsSync(dreamStateFile)) {
+            const raw = readFileSync(dreamStateFile, "utf-8");
+            const parsed = JSON.parse(raw);
+            return {
+              lastDreamMs: typeof parsed.lastDreamMs === "number" ? parsed.lastDreamMs : 0,
+              lastSessionCount: typeof parsed.lastSessionCount === "number" ? parsed.lastSessionCount : 0,
+            };
+          }
+        } catch { /* corrupted state = treat as fresh */ }
+        return { lastDreamMs: 0, lastSessionCount: 0 };
+      }
+      // Persist state; write failures are ignored (best effort).
+      function writeDreamState(state: { lastDreamMs: number; lastSessionCount: number }): void {
+        try { writeFileSync(dreamStateFile, JSON.stringify(state)); } catch { /* best effort */ }
+      }
+      // Simple file lock (not bulletproof, but prevents obvious races).
+      // Returns true when the lock was claimed, false when a lock younger than
+      // 10 minutes exists or the lock file could not be written.
+      function acquireDreamLock(): boolean {
+        try {
+          if (existsSync(dreamLockFile)) {
+            // An unreadable or corrupt lock file counts as stale (ts = 0). Otherwise a
+            // half-written lock would fail to parse on every attempt and block dreaming forever.
+            let lockTs = 0;
+            try {
+              const parsedLock = JSON.parse(readFileSync(dreamLockFile, "utf-8"));
+              if (typeof parsedLock?.ts === "number") lockTs = parsedLock.ts;
+            } catch { /* corrupt lock = stale */ }
+            if (Date.now() - lockTs < 600_000) return false; // Lock held < 10 min = still running
+            // Stale lock — claim it
+          }
+          writeFileSync(dreamLockFile, JSON.stringify({ ts: Date.now(), pid: process.pid }));
+          return true;
+        } catch { return false; }
+      }
+      // Remove the lock file; failures are ignored and the lock then expires via the 10-minute staleness rule.
+      function releaseDreamLock(): void {
+        try { if (existsSync(dreamLockFile)) require("node:fs").unlinkSync(dreamLockFile); } catch { /* best effort */ }
+      }
+      const dreamApiOn = api.on as (event: string, handler: unknown) => void;
+      // Count sessions on session_start (cheap — just increment)
+      dreamApiOn("session_start", async () => {
+        dreamSessionCount++;
+      });
+      // Register on agent_end to check dream gates
+      dreamApiOn("agent_end", async () => {
+        // Gate 1 (free): Session counter — only check every N sessions
+        if (dreamSessionCount % dreamSessionInterval !== 0) return;
+        if (dreamSessionCount === 0) return; // No session_start seen yet
+        // Gate 2 (free): Time gap — minimum hours since last dream
+        const state = readDreamState();
+        const elapsed = Date.now() - state.lastDreamMs;
+        if (elapsed < dreamMinGapMs) {
+          logger.info(`sulcus/dream: gate 2 skip — ${Math.round(elapsed / 3600_000)}h since last dream (need ${Math.round(dreamMinGapMs / 3600_000)}h)`);
+          return;
+        }
+        // Gate 3 (cheap API): Memory count — only consolidate if enough memories exist
+        try {
+          const statusResp = await (sulcusMem as SulcusCloudClient).request("GET", "/api/v1/agent/memory/status") as Record<string, unknown> | null;
+          const stats = statusResp?.stats as Record<string, unknown> | undefined;
+          const totalMemories = typeof stats?.total_memories === "number" ? stats.total_memories as number : 0;
+          if (totalMemories < dreamMinMemories) {
+            logger.info(`sulcus/dream: gate 3 skip — ${totalMemories} memories (need ${dreamMinMemories})`);
+            return;
+          }
+          logger.info(`sulcus/dream: gates passed — ${totalMemories} memories, ${Math.round(elapsed / 3600_000)}h since last dream`);
+        } catch (e: unknown) {
+          logger.warn(`sulcus/dream: gate 3 error — ${e instanceof Error ? e.message : e}`);
+          return;
+        }
+        // Gate 4 (lock): Prevent concurrent consolidation
+        if (!acquireDreamLock()) {
+          logger.info("sulcus/dream: lock held — another consolidation in progress");
+          return;
+        }
+        // Execute: Fire-and-forget consolidation. State is only advanced on success,
+        // so a failed run is retried the next time the gates pass.
+        logger.info(`sulcus/dream: triggering consolidation (minHeat=${dreamMinHeat})`);
+        (sulcusMem as SulcusCloudClient).consolidate(dreamMinHeat)
+          .then((result: unknown) => {
+            writeDreamState({ lastDreamMs: Date.now(), lastSessionCount: dreamSessionCount });
+            logger.info(`sulcus/dream: consolidation complete — ${JSON.stringify(result)}`);
+          })
+          .catch((e: unknown) => {
+            logger.warn(`sulcus/dream: consolidation failed — ${e instanceof Error ? e.message : e}`);
+          })
+          .finally(() => {
+            releaseDreamLock();
+          });
+      });
+      logger.info(`sulcus: dream auto-trigger enabled (every ${dreamSessionInterval} sessions, ${Math.round(dreamMinGapMs / 3600_000)}h gap, min ${dreamMinMemories} memories)`);
+    }
+    // -------------------------------------------------------------------------
+    // GUARDRAIL HOOK REGISTRATION (Task 54 — outputGuard)
+    // llm_output: fast pre-analysis (regex only, <5ms target)
+    // message_sending: enforcement (may do async Sulcus recall for pref check)
+    // -------------------------------------------------------------------------
+    const outputGuardCfg = parseOutputGuardConfig(pluginConfig);
+    if (outputGuardCfg.enabled) {
+      // -- Hook 1: llm_output — scan only; the result is parked in lastGuardFlags for message_sending to enforce --
+      const llmOutputApiOn = api.on as (event: string, handler: unknown) => void;
+      llmOutputApiOn("llm_output", async (event: Record<string, unknown>) => {
+        const t0 = Date.now();
+        try {
+          const content = (event?.content ?? event?.text ?? "") as string;
+          if (!content) { lastGuardFlags = null; return undefined; } // empty output: drop any previously stored flags
+          // Fast PII scan via scanForPii (comment in original: regex only — no API calls)
+          let piiSpans: PiiSpan[] = [];
+          if (outputGuardCfg.pii.enabled) {
+            piiSpans = scanForPii(content, outputGuardCfg.pii.patterns, outputGuardCfg.pii.customPatterns);
+          }
+          // Preference heuristic: case-insensitive substring match of each cached pref; skipped when no cache exists for this namespace
+          let suspectedPrefViolation = false;
+          let suspectedReason: string | undefined;
+          if (outputGuardCfg.preferenceViolation.enabled && negPrefCache && negPrefCache.namespace === namespace) {
+            const lowerContent = content.toLowerCase();
+            for (const pref of negPrefCache.prefs) {
+              if (lowerContent.includes(pref.toLowerCase())) {
+                suspectedPrefViolation = true;
+                suspectedReason = `Content contains term matching stored negative preference: "${pref.slice(0, 50)}"`;
+                break; // first match is enough
+              }
+            }
+          }
+          const flags: SulcusGuardFlags = {
+            piiDetected: piiSpans.length > 0,
+            piiSpans,
+            suspectedPreferenceViolation: suspectedPrefViolation,
+            suspectedViolationReason: suspectedReason,
+            scanTimeMs: Date.now() - t0,
+          };
+          lastGuardFlags = flags; // shared variable declared outside this block; read and cleared by the message_sending hook
+          logger.debug?.(`sulcus/output-guard: llm_output scan complete (${flags.scanTimeMs}ms, pii=${flags.piiDetected}, prefViolation=${flags.suspectedPreferenceViolation})`);
+          return undefined; // no modification at this stage — enforcement is in message_sending
+        } catch (err) {
+          logger.warn(`sulcus/output-guard: llm_output threw: ${err}`);
+          lastGuardFlags = null;
+          return outputGuardCfg.failMode === "fail-closed" ? { content: "⚠️ Output guardrail error — message blocked (fail-closed mode)." } : undefined;
+        }
+      });
+      // -- Hook 2: message_sending — enforcement; returns { content } when the message was rewritten, undefined otherwise --
+      const msgSendingApiOn = api.on as (event: string, handler: unknown) => void;
+      msgSendingApiOn("message_sending", async (event: Record<string, unknown>) => {
+        try {
+          const content = (event?.content ?? event?.text ?? event?.message ?? "") as string;
+          if (!content) return undefined;
+          // Consume flags from llm_output; if none are stored, run a PII-only scan here (the preference flag then stays false)
+          const flags: SulcusGuardFlags = lastGuardFlags ?? (() => {
+            const t0 = Date.now();
+            const piiSpans = outputGuardCfg.pii.enabled
+              ? scanForPii(content, outputGuardCfg.pii.patterns, outputGuardCfg.pii.customPatterns)
+              : [];
+            return {
+              piiDetected: piiSpans.length > 0,
+              piiSpans,
+              suspectedPreferenceViolation: false,
+              scanTimeMs: Date.now() - t0,
+            };
+          })();
+          lastGuardFlags = null; // consume flags — one-shot per turn
+          let modified = false;
+          let finalContent = content;
+          const auditEvents: Array<{ eventType: string; action: string; details: string }> = [];
+          // -- PII enforcement: NOTE(review) spans may come from the llm_output text — confirm it always equals this event's content --
+          if (outputGuardCfg.pii.enabled && flags.piiDetected) {
+            switch (outputGuardCfg.pii.onViolation) {
+              case "redact": {
+                // Store redaction key (from the unredacted content) before redacting, if reversible
+                if (outputGuardCfg.pii.reversible) {
+                  storeRedactionKey(flags.piiSpans, content, outputGuardCfg.pii.storageKey, namespace);
+                }
+                finalContent = redactSpans(finalContent, flags.piiSpans);
+                modified = true;
+                auditEvents.push({ eventType: "pii_redacted", action: "redact", details: `${flags.piiSpans.length} span(s) redacted (types: ${[...new Set(flags.piiSpans.map(s => s.type))].join(", ")})` });
+                logger.info(`sulcus/output-guard: redacted ${flags.piiSpans.length} PII span(s)`);
+                break;
+              }
+              case "replace":
+              case "block": {
+                // Never silent cancel — always explain (Dooley's directive); "replace" and "block" behave identically here
+                finalContent = `⚠️ This message contained personal information (${[...new Set(flags.piiSpans.map(s => s.type))].join(", ")}) and was blocked by the output guard. Please rephrase without including identifiable data.`;
+                modified = true;
+                auditEvents.push({ eventType: "pii_blocked", action: outputGuardCfg.pii.onViolation, details: `${flags.piiSpans.length} span(s) blocked` });
+                logger.info(`sulcus/output-guard: blocked message containing PII (${outputGuardCfg.pii.onViolation})`);
+                break;
+              }
+            }
+          }
+          // -- Preference violation enforcement (async — Sulcus recall); runs only when llm_output flagged a suspicion and the backend is the cloud client --
+          if (outputGuardCfg.preferenceViolation.enabled && flags.suspectedPreferenceViolation && sulcusMem instanceof SulcusCloudClient) {
+            try {
+              // Refresh negative pref cache if missing, stale, or for another namespace. NOTE(review): llm_output only flags when a cache already exists — confirm something else seeds it
+              const now = Date.now();
+              if (!negPrefCache || negPrefCache.namespace !== namespace || (now - negPrefCache.cachedAt) > NEG_PREF_CACHE_TTL_MS) {
+                const prefRes = await sulcusMem.search_memory("negative preference dislike avoid", 10, namespace);
+                const prefMemories = prefRes?.results ?? [];
+                // Keep untyped or "preference" memories; use label (else content), lowercased, longer than 3 chars
+                const prefTexts = prefMemories
+                  .filter((m) => {
+                    const mtype = m.memory_type as string | undefined;
+                    return !mtype || mtype === "preference";
+                  })
+                  .map((m) => ((m.label ?? m.content ?? "") as string).toLowerCase())
+                  .filter((t) => t.length > 3);
+                negPrefCache = { prefs: prefTexts, cachedAt: now, namespace };
+              }
+              // Confirm violation against the (possibly refreshed) cache; checked against finalContent, i.e. after any PII rewrite above
+              const lowerFinal = finalContent.toLowerCase();
+              let confirmedViolation = false;
+              let violatedPref = "";
+              for (const pref of negPrefCache.prefs) {
+                if (lowerFinal.includes(pref.toLowerCase().slice(0, 30))) { // only the first 30 chars of each pref are matched here
+                  confirmedViolation = true;
+                  violatedPref = pref.slice(0, 80);
+                  break;
+                }
+              }
+              if (confirmedViolation) {
+                const replacement = outputGuardCfg.preferenceViolation.replacementMessage;
+                switch (outputGuardCfg.preferenceViolation.onViolation) {
+                  case "replace":
+                  case "block":
+                    finalContent = replacement;
+                    modified = true;
+                    auditEvents.push({ eventType: "preference_violation", action: outputGuardCfg.preferenceViolation.onViolation, details: `Violated preference: "${violatedPref}"` });
+                    logger.info(`sulcus/output-guard: preference violation — replaced message (pref: "${violatedPref.slice(0, 50)}")`);
+                    break;
+                  case "warn":
+                    finalContent = `⚠️ Note: This response may conflict with your stored preferences.
${finalContent}`;
+                    modified = true;
+                    auditEvents.push({ eventType: "preference_violation", action: "warn", details: `Possible conflict with preference: "${violatedPref}"` });
+                    break;
+                }
+              }
+            } catch (prefErr) {
+              logger.warn(`sulcus/output-guard: preference check failed: ${prefErr}`);
+              if (outputGuardCfg.failMode === "fail-closed") { // fail-open keeps whatever finalContent already holds
+                finalContent = "⚠️ Output guardrail check failed — message blocked (fail-closed mode).";
+                modified = true;
+              }
+            }
+          }
+          // -- Audit trail + inspect buffer (Task 56); note the fail-closed branch above records no audit event --
+          if (auditEvents.length > 0) {
+            // Always push to the inspect buffer via pushGuardrailEvent (regardless of auditTrail config)
+            for (const evt of auditEvents) {
+              pushGuardrailEvent({
+                capturedAt: Date.now(),
+                guard: "output",
+                eventType: evt.eventType,
+                action: evt.action,
+                details: evt.details,
+              });
+            }
+            // Persist to Sulcus only when auditTrail is enabled; stores are not awaited
+            if (outputGuardCfg.auditTrail && sulcusMem instanceof SulcusCloudClient) {
+              for (const evt of auditEvents) {
+                sulcusMem.store({
+                  content: `[output_guard] ${evt.eventType}: ${evt.details}. Action: ${evt.action}. Timestamp: ${new Date().toISOString()}.`,
+                  memory_type: "episodic",
+                  metadata: { _source: "output_guard", eventType: evt.eventType, action: evt.action, namespace },
+                } as any).catch(() => { /* best effort audit — failures are dropped */ });
+              }
+            }
+          }
+          if (modified) {
+            return { content: finalContent };
+          }
+          return undefined;
+        } catch (err) {
+          logger.warn(`sulcus/output-guard: message_sending threw: ${err}`);
+          return outputGuardCfg.failMode === "fail-closed" ? { content: "⚠️ Output guardrail error — message blocked (fail-closed mode)." } : undefined;
+        }
+      });
+      logger.info(`sulcus/output-guard: registered (pii=${outputGuardCfg.pii.enabled}, prefViolation=${outputGuardCfg.preferenceViolation.enabled}, failMode=${outputGuardCfg.failMode})`);
+    } else {
+      logger.info("sulcus/output-guard: disabled (set guardrails.outputGuard.enabled=true to activate)");
+    }
+    // -------------------------------------------------------------------------
+    // ASSISTANT OUTPUT CAPTURE (Task 67 — llm_output hook)
+    // Captures assistant responses as memories via SIVU quality gate.
+    // Filters generic acks; compresses long responses before storing.
+    // Config: captureFromAssistant=true (disabled by default).
+    // -------------------------------------------------------------------------
+    if (captureFromAssistant && isAvailable && sulcusMem) {
+      const assistantCaptureApiOn = api.on as (event: string, handler: unknown) => void;
+      assistantCaptureApiOn("llm_output", async (event: Record<string, unknown>) => {
+        try {
+          const content = (event?.content ?? event?.text ?? "") as string;
+          if (!content || typeof content !== "string") return undefined;
+          // Skip generic acknowledgments as judged by isGenericAck ("ok", "sure", "got it", etc.)
+          if (isGenericAck(content)) {
+            logger.debug?.("sulcus: assistant_capture — skipping generic ack");
+            return undefined;
+          }
+          // Skip content rejected by isJunkMemory (system blobs, patterns we never want)
+          if (isJunkMemory(content)) {
+            logger.debug?.(`sulcus: assistant_capture — skipping junk: "${content.substring(0, 50)}..."`);
+            return undefined;
+          }
+          // Build capture text: responses longer than ASSISTANT_CAPTURE_MAX_DIRECT go through summarizeForCapture
+          const captureText = content.length > ASSISTANT_CAPTURE_MAX_DIRECT
+            ? summarizeForCapture(content, namespace)
+            : content;
+          // Dedup check (on the text that would actually be stored)
+          if (!shouldCapture(captureText)) {
+            logger.debug?.("sulcus: assistant_capture — dedup skip");
+            return undefined;
+          }
+          // SIVU quality gate + store; nothing is stored for non-cloud backends
+          if (sulcusMem instanceof SulcusCloudClient) {
+            try {
+              const siuResult = await sulcusMem.request("POST", "/api/v2/siu/label", { text: captureText }) as Record<string, unknown>;
+              const storeConf = (siuResult?.store_confidence as number) ?? 0;
+              const shouldStore = siuResult?.store === true && storeConf >= 0.4; // threshold is hard-coded here
+              if (!shouldStore) {
+                logger.debug?.(`sulcus: assistant_capture — SIVU rejected (conf: ${storeConf.toFixed(3)}): "${captureText.substring(0, 60)}..."`);
+                return undefined;
+              }
+              const memoryType = (siuResult?.memory_type as string) ?? "episodic";
+              const hints = buildExtractionHints(memoryType, namespace, "assistant_capture", captureText.substring(0, 200));
+              const res = await sulcusMem.add_memory(captureText, memoryType, hints);
+              logger.info(`sulcus: assistant_capture — stored [${memoryType}] (id: ${res?.id ?? "?"}, conf: ${storeConf.toFixed(3)}): "${captureText.substring(0, 60)}..."`);
+            } catch (e: unknown) {
+              const msg = e instanceof Error ? e.message : String(e);
+              logger.warn(`sulcus: assistant_capture — SIVU error: ${msg}`);
+              // fallback: store as episodic without quality gate; also reached when add_memory above threw, so a failed store is retried once
+              try {
+                const hints = buildExtractionHints("episodic", namespace, "assistant_capture", captureText.substring(0, 200));
+                const res = await sulcusMem.add_memory(captureText, "episodic", hints);
+                logger.info(`sulcus: assistant_capture — fallback stored [episodic] (id: ${res?.id ?? "?"}): "${captureText.substring(0, 60)}..."`);
+              } catch (fe: unknown) {
+                logger.warn(`sulcus: assistant_capture — fallback failed: ${fe instanceof Error ? fe.message : fe}`);
+              }
+            }
+          }
+          return undefined; // never modify output — capture only
+        } catch (err) {
+          logger.warn("sulcus: assistant_capture — hook threw: " + err);
+          return undefined; // capture errors never alter or block the output
+        }
+      });
+      logger.info("sulcus: registered assistant_capture (llm_output hook, captureFromAssistant=true)");
+    } else if (!captureFromAssistant) {
+      logger.debug?.("sulcus: assistant_capture disabled (set captureFromAssistant=true to activate)");
+    }
+    // -------------------------------------------------------------------------
+    // TOOL GUARD HOOK REGISTRATION (Task 55 — before_tool_call)
+    // Evaluates tool calls against memory + allowlists before execution
+    // -------------------------------------------------------------------------
+    const toolGuardCfg = parseToolGuardConfig(pluginConfig);
+    // Task 57: populate the shared guardrailStatus snapshot (for the guardrail_status tool) from both parsed guard configs
+    guardrailStatus = {
+      outputGuard: {
+        enabled: outputGuardCfg.enabled,
+        pii: {
+          enabled: outputGuardCfg.pii.enabled,
+          patterns: outputGuardCfg.pii.patterns, // same array instance as the config, not a copy
+          onViolation: outputGuardCfg.pii.onViolation,
+          reversible: outputGuardCfg.pii.reversible,
+        },
+        preferenceViolation: {
+          enabled: outputGuardCfg.preferenceViolation.enabled,
+          onViolation: outputGuardCfg.preferenceViolation.onViolation,
+        },
+        failMode: outputGuardCfg.failMode,
+        auditTrail: outputGuardCfg.auditTrail,
+      },
+      toolGuard: {
+        enabled: toolGuardCfg.enabled,
+        sensitiveTools: toolGuardCfg.sensitiveTools, // arrays below are shared by reference with toolGuardCfg
+        allowlist: toolGuardCfg.allowlist,
+        blocklist: toolGuardCfg.blocklist,
+        objectiveCheck: toolGuardCfg.objectiveCheck,
+        requireApprovalThreshold: toolGuardCfg.requireApprovalThreshold,
+        failMode: toolGuardCfg.failMode,
+        auditTrail: toolGuardCfg.auditTrail,
+      },
+      negPrefCount: () => negPrefCache?.prefs.length ?? 0, // read at call time, so it reflects the current cache; 0 when no cache
+      negPrefCachedAt: () => negPrefCache?.cachedAt ?? null, // read at call time; null when no cache
+    };
+    // Tool guard: when enabled, register a before_tool_call handler that decides
+    // whether a tool call is allowed, blocked, or needs approval.
+    //
+    // Decision order inside the handler:
+    //   1. no usable tool name in the event -> allow (logged as a warning)
+    //   2. tool is on the allowlist         -> allow (checked before the blocklist,
+    //      so a tool listed in both is allowed)
+    //   3. tool is on the blocklist         -> block
+    //   4. tool is not in sensitiveTools    -> allow without evaluation
+    //   5. sensitive tool                   -> compute a severity and require approval
+    //      when it reaches requireApprovalThreshold, otherwise allow
+    // An unexpected throw is resolved by failMode: "fail-closed" blocks, any other
+    // value allows.
+    if (toolGuardCfg.enabled) {
+      const toolGuardApiOn = api.on as (event: string, handler: unknown) => void;
+      // Numeric ranks used to compare a computed severity with the configured threshold.
+      const severityLevels = { "info": 0, "warning": 1, "critical": 2 };
+      // Build a block result. `reason` is the key this handler has always returned;
+      // `blockReason` is added alongside it.
+      // NOTE(review): OpenClaw's typed hook result appears to read `blockReason` — confirm against the host SDK.
+      const blocked = (reason: string) => ({ block: true, reason, blockReason: reason });
+      // Best-effort audit write, only when auditTrail is on and the cloud client is in use.
+      // The entry is built lazily so nothing is serialized when auditing is off, and
+      // write failures are deliberately ignored so auditing never affects the decision.
+      const recordAudit = (buildEntry: () => string): void => {
+        if (toolGuardCfg.auditTrail && sulcusMem instanceof SulcusCloudClient) {
+          sulcusMem.add_memory(
+            buildEntry(),
+            "episodic",
+            { _source: "tool_guard" } as any
+          ).catch(() => {});
+        }
+      };
+      toolGuardApiOn("before_tool_call", async (event: Record<string, unknown>) => {
+        try {
+          // Accept several field names for the tool name. `toolName` is consulted last so
+          // events that already carried one of the other keys resolve exactly as before.
+          // NOTE(review): OpenClaw's typed event appears to expose `toolName`/`params` — confirm against the host SDK.
+          const rawName = event?.name ?? event?.function ?? event?.tool_name ?? event?.toolName;
+          // A non-string name is treated like a missing one rather than reaching string methods below.
+          const toolName = typeof rawName === "string" ? rawName : "";
+          const toolArgs = (event?.arguments ?? event?.input ?? event?.params ?? {}) as Record<string, unknown>;
+          if (!toolName) {
+            logger.warn("sulcus/tool-guard: no tool name in event — allowing by default");
+            return { allow: true };
+          }
+          // -- Allowlist check (immediate pass) ------------------------------
+          if (toolGuardCfg.allowlist.length > 0 && toolGuardCfg.allowlist.includes(toolName)) {
+            // Task 56: push to inspect buffer
+            pushGuardrailEvent({ capturedAt: Date.now(), guard: "tool", eventType: "tool_allowed", action: "allow", details: `Allowlisted tool: ${toolName}`, toolName, severity: "info" });
+            recordAudit(() => `[tool_guard] ${toolName}: allowed (allowlist). Args: ${JSON.stringify(toolArgs).slice(0, 200)}`);
+            return { allow: true };
+          }
+          // -- Blocklist check (immediate block) -----------------------------
+          if (toolGuardCfg.blocklist.length > 0 && toolGuardCfg.blocklist.includes(toolName)) {
+            const reason = `Tool '${toolName}' is on the blocklist and cannot be used.`;
+            // Task 56: push to inspect buffer
+            pushGuardrailEvent({ capturedAt: Date.now(), guard: "tool", eventType: "tool_blocked", action: "block", details: `Blocklisted tool: ${toolName}`, toolName, severity: "critical" });
+            recordAudit(() => `[tool_guard] ${toolName}: blocked (blocklist). Reason: ${reason}`);
+            logger.info(`sulcus/tool-guard: blocked tool '${toolName}' (blocklist)`);
+            return blocked(reason);
+          }
+          // -- Sensitivity check ---------------------------------------------
+          if (!toolGuardCfg.sensitiveTools.includes(toolName)) {
+            // Non-sensitive tools pass without evaluation
+            return { allow: true };
+          }
+          // -- Objective alignment check (for sensitive tools) ---------------
+          let severity: "info" | "warning" | "critical" = "info";
+          let reason = "";
+          if (toolGuardCfg.objectiveCheck && sulcusMem instanceof SulcusCloudClient) {
+            try {
+              // Search for relevant objectives and preferences
+              const objectiveRes = await sulcusMem.search_memory(`objective goal preference ${toolName}`, 5, namespace);
+              const objectives = objectiveRes?.results ?? [];
+              const toolLower = toolName.toLowerCase();
+              let hasConflict = false;
+              let conflictingObjective = "";
+              // Keyword heuristic: a memory conflicts when it contains a prohibition word
+              // AND mentions either the tool name or a word associated with that tool.
+              for (const obj of objectives) {
+                const text = (obj.label ?? obj.content ?? "") as string;
+                const content = text.toLowerCase();
+                const isProhibition = content.includes("never") || content.includes("don't") || content.includes("avoid");
+                if (!isProhibition) continue;
+                const mentionsTool = content.includes(toolLower) ||
+                  (toolName === "exec" && (content.includes("command") || content.includes("execute"))) ||
+                  (toolName === "write" && content.includes("file")) ||
+                  (toolName === "edit" && content.includes("modify")) ||
+                  (toolName === "delete" && content.includes("remove"));
+                if (mentionsTool) {
+                  hasConflict = true;
+                  conflictingObjective = text;
+                  break;
+                }
+              }
+              if (hasConflict) {
+                severity = "critical";
+                reason = `This tool call conflicts with stored preference: "${conflictingObjective.slice(0, 100)}"`;
+              } else if (objectives.length === 0) {
+                // No relevant memories found — low risk
+                severity = "info";
+                reason = "No relevant objectives found in memory — proceeding with caution.";
+              } else {
+                // Has relevant memories but no clear conflict
+                severity = "warning";
+                reason = "Tool call is sensitive but appears aligned with stored objectives.";
+              }
+            } catch (objErr) {
+              logger.warn(`sulcus/tool-guard: objective check failed: ${objErr}`);
+              if (toolGuardCfg.failMode === "fail-closed") {
+                return blocked("Tool guard objective check failed (fail-closed mode).");
+              }
+              // fail-open: allow with info severity
+              severity = "info";
+              reason = "Objective check failed — allowing with reduced confidence.";
+            }
+          } else {
+            // No objective check configured — default to warning for sensitive tools
+            severity = "warning";
+            reason = `Tool '${toolName}' is marked as sensitive. Please verify this action is intended.`;
+          }
+          // -- Severity threshold evaluation ---------------------------------
+          const needsApproval = severityLevels[severity] >= severityLevels[toolGuardCfg.requireApprovalThreshold];
+          const decision = needsApproval ? "require_approval" : "allow";
+          // -- Audit trail + inspect buffer (Task 56) -----------------------
+          // Always push to inspect buffer
+          pushGuardrailEvent({
+            capturedAt: Date.now(),
+            guard: "tool",
+            eventType: needsApproval ? "tool_require_approval" : "tool_allowed",
+            action: decision,
+            details: reason.slice(0, 200),
+            toolName,
+            severity,
+          });
+          recordAudit(() => `[tool_guard] ${toolName}: ${decision}. Severity: ${severity}. Reason: ${reason}. Args: ${JSON.stringify(toolArgs).slice(0, 200)}`);
+          if (needsApproval) {
+            logger.info(`sulcus/tool-guard: requiring approval for '${toolName}' (severity: ${severity}, threshold: ${toolGuardCfg.requireApprovalThreshold})`);
+            return {
+              requireApproval: true,
+              severity,
+              reason: `${reason}\n\nTool: ${toolName}\nArguments: ${JSON.stringify(toolArgs, null, 2)}`,
+            };
+          }
+          logger.debug?.(`sulcus/tool-guard: allowing '${toolName}' (severity: ${severity} below threshold: ${toolGuardCfg.requireApprovalThreshold})`);
+          return { allow: true };
+        } catch (err) {
+          logger.warn(`sulcus/tool-guard: before_tool_call threw: ${err}`);
+          if (toolGuardCfg.failMode === "fail-closed") {
+            return blocked("Tool guard error — blocked (fail-closed mode).");
+          }
+          // fail-open: allow on error
+          return { allow: true };
+        }
+      });
+      logger.info(`sulcus/tool-guard: registered (sensitiveTools=${toolGuardCfg.sensitiveTools.length}, objectiveCheck=${toolGuardCfg.objectiveCheck}, threshold=${toolGuardCfg.requireApprovalThreshold}, failMode=${toolGuardCfg.failMode})`);
+    } else {
+      logger.info("sulcus/tool-guard: disabled (set guardrails.toolGuard.enabled=true to activate)");
+    }
+    // -------------------------------------------------------------------------
     // LEGACY HOOK REGISTRATION (config-driven, backward compat)
-    // ─────────────────────────────────────────────────────────────────────────
+    // -------------------------------------------------------------------------
     for (const [hookName, hookConfig] of Object.entries(hooksConfig.hooks)) {
       if (!hookConfig.enabled) continue;
@@ -1602,9 +5248,9 @@ const sulcusPlugin = {
       }
     }
-    // ─────────────────────────────────────────────────────────────────────────
+    // -------------------------------------------------------------------------
     // TOOL REGISTRATION
-    // ─────────────────────────────────────────────────────────────────────────
+    // -------------------------------------------------------------------------
     for (const [toolName, toolConfig] of Object.entries(hooksConfig.tools)) {
       if (!toolConfig.enabled) continue;
@@ -1623,6 +5269,264 @@ const sulcusPlugin = {
       }
     }
+    // -------------------------------------------------------------------------
+    // CLI REGISTRATION (Phase 3: `openclaw sulcus <subcommand>`)
+    // -------------------------------------------------------------------------
+    const registerCli = api.registerCli as ((registrar: (ctx: { program: any; config: any; logger: any }) => void, opts?: any) => void) | undefined;
+    if (typeof registerCli === "function") {
+      registerCli((ctx: { program: any; config: any; logger: any }) => {
+        const sulcusCmd = ctx.program.command("sulcus").description("Sulcus memory management");
+        // --- openclaw sulcus status ---
+        // Prints connection state and effective config; when connected it also fetches
+        // the server status and the number of hot nodes. `--json` switches every branch
+        // (unavailable, connected, error) to machine-readable output.
+        sulcusCmd.command("status")
+          .description("Check Sulcus connection, config, and memory stats")
+          .option("--json", "Machine-readable JSON output")
+          .action(async (opts: { json?: boolean }) => {
+            if (!isAvailable || !sulcusMem) {
+              const out = { status: "unavailable", backend: backendMode, namespace, error: "Backend not connected" };
+              if (opts.json) { console.log(JSON.stringify(out, null, 2)); } else {
+                console.log(`Status: unavailable`);
+                console.log(`Backend: ${backendMode}`);
+                console.log(`Namespace: ${namespace}`);
+                if (serverUrl) console.log(`Server: ${serverUrl}`);
+                console.log(`\nRun \`openclaw sulcus init\` to configure.`);
+              }
+              return;
+            }
+            try {
+              const client = sulcusMem as SulcusCloudClient;
+              const status = await client.request("GET", "/api/v1/agent/memory/status") as Record<string, unknown> | null;
+              const hot = await client.list_hot_nodes(5);
+              // An absent response or node list counts as zero instead of throwing.
+              const hotCount = (hot?.nodes || []).length;
+              const out = {
+                status: "connected",
+                backend: backendMode,
+                namespace,
+                server: serverUrl,
+                autoRecall,
+                autoCapture,
+                ...(status?.stats ? { stats: status.stats } : {}),
+                ...(status?.capabilities ? { capabilities: status.capabilities } : {}),
+                hot_nodes: hotCount,
+              };
+              if (opts.json) { console.log(JSON.stringify(out, null, 2)); } else {
+                console.log(`Status: connected \u2705`);
+                console.log(`Backend: ${backendMode}`);
+                console.log(`Namespace: ${namespace}`);
+                console.log(`Server: ${serverUrl}`);
+                console.log(`Auto-recall: ${autoRecall}`);
+                console.log(`Auto-capture: ${autoCapture}`);
+                const stats = status?.stats as Record<string, unknown> | undefined;
+                if (stats?.total_memories !== undefined) console.log(`Memories: ${stats.total_memories}`);
+                // Only format the heat when it really is a number; a null or string value
+                // would otherwise throw on toFixed and cut the report short.
+                if (typeof stats?.average_heat === "number") console.log(`Average heat: ${stats.average_heat.toFixed(3)}`);
+                console.log(`Hot nodes: ${hotCount}`);
+              }
+            } catch (e: unknown) {
+              const msg = e instanceof Error ? e.message : String(e);
+              if (opts.json) { console.log(JSON.stringify({ status: "error", error: msg })); }
+              else { console.error(`Error: ${msg}`); }
+            }
+          });
+        // --- openclaw sulcus search ---
+        // Searches memories in the plugin's namespace. Prints a "[heat type] label" line
+        // and the id for each hit, or the raw result array with --json.
+        sulcusCmd.command("search <query>")
+          .description("Search memories")
+          .option("-n, --limit <n>", "Max results", "10")
+          .option("--json", "Machine-readable JSON output")
+          .action(async (query: string, opts: { limit: string; json?: boolean }) => {
+            if (!isAvailable || !sulcusMem) { console.error("Sulcus not connected."); return; }
+            // Reject a non-numeric or non-positive --limit up front; an unchecked
+            // parseInt would pass NaN on to the backend.
+            const limit = Number.parseInt(opts.limit, 10);
+            if (!Number.isInteger(limit) || limit < 1) { console.error(`Invalid --limit value: ${opts.limit}`); return; }
+            try {
+              const res = await sulcusMem.search_memory(query, limit, namespace);
+              const results = res?.results ?? [];
+              if (opts.json) { console.log(JSON.stringify(results, null, 2)); return; }
+              if (results.length === 0) { console.log("No results."); return; }
+              for (const r of results) {
+                // Heat is shown as a whole-number percentage, "?" when it is not numeric.
+                const heat = typeof r.current_heat === "number" ? (r.current_heat * 100).toFixed(0) + "%" : "?";
+                const mtype = (r.memory_type ?? "?") as string;
+                const label = ((r.label ?? r.content ?? "") as string).slice(0, 120);
+                console.log(`[${heat} ${mtype}] ${label}`);
+                console.log(`  id: ${r.id}`);
+              }
+              console.log(`\n${results.length} result(s)`);
+            } catch (e: unknown) { console.error(`Error: ${e instanceof Error ? e.message : e}`); }
+          });
+        // --- openclaw sulcus add ---
+        // Stores <content> as a memory of the requested type (option default: "semantic").
+        sulcusCmd.command("add <content>")
+          .description("Store a memory")
+          .option("-t, --type <type>", "Memory type", "semantic")
+          .option("--json", "Machine-readable JSON output")
+          .action(async (content: string, opts: { type: string; json?: boolean }) => {
+            if (!(isAvailable && sulcusMem)) {
+              console.error("Sulcus not connected.");
+              return;
+            }
+            try {
+              const memoryType = opts.type;
+              // Hints are built from the type, the namespace, the "cli_add" origin tag
+              // and the first 200 characters of the content.
+              const preview = content.substring(0, 200);
+              const hints = buildExtractionHints(memoryType, namespace, "cli_add", preview);
+              const stored = await sulcusMem.add_memory(content, memoryType, hints);
+              if (opts.json) {
+                console.log(JSON.stringify(stored, null, 2));
+                return;
+              }
+              console.log(`Stored [${memoryType}] memory (id: ${stored?.id ?? "?"})`);
+            } catch (e: unknown) {
+              const detail = e instanceof Error ? e.message : e;
+              console.error(`Error: ${detail}`);
+            }
+          });
+        // --- openclaw sulcus get ---
+        // Fetches one memory by id. Requires the cloud client; prints id, type, heat,
+        // pinned flag and up to 500 characters of content, or the raw record with --json.
+        sulcusCmd.command("get <id>")
+          .description("Fetch a memory by ID")
+          .option("--json", "Machine-readable JSON output")
+          .action(async (id: string, opts: { json?: boolean }) => {
+            if (!(isAvailable && sulcusMem instanceof SulcusCloudClient)) {
+              console.error("Sulcus not connected.");
+              return;
+            }
+            try {
+              const memory = await sulcusMem.get_memory(id);
+              if (!memory) {
+                console.log(`Memory ${id} not found.`);
+                return;
+              }
+              if (opts.json) {
+                console.log(JSON.stringify(memory, null, 2));
+                return;
+              }
+              // Heat is shown as a whole-number percentage, "?" when it is not numeric.
+              let heat = "?";
+              if (typeof memory.current_heat === "number") {
+                heat = ((memory.current_heat as number) * 100).toFixed(0) + "%";
+              }
+              const body = ((memory.label ?? memory.content ?? "") as string).slice(0, 500);
+              console.log(`ID: ${memory.id}`);
+              console.log(`Type: ${memory.memory_type ?? "?"}`);
+              console.log(`Heat: ${heat}`);
+              console.log(`Pinned: ${memory.is_pinned ?? false}`);
+              console.log(`Content: ${body}`);
+            } catch (e: unknown) {
+              const detail = e instanceof Error ? e.message : e;
+              console.error(`Error: ${detail}`);
+            }
+          });
+        // --- openclaw sulcus list ---
+        // Lists memories in the plugin's namespace, sorted descending by the chosen field.
+        // Requires the cloud client. Optional filters: memory type and pinned-only.
+        sulcusCmd.command("list")
+          .description("List memories")
+          .option("-n, --limit <n>", "Max results", "20")
+          .option("-t, --type <type>", "Filter by memory type")
+          .option("--pinned", "Only pinned memories")
+          .option("--sort <field>", "Sort by: current_heat, created_at, updated_at", "current_heat")
+          .option("--json", "Machine-readable JSON output")
+          .action(async (opts: { limit: string; type?: string; pinned?: boolean; sort: string; json?: boolean }) => {
+            if (!isAvailable || !(sulcusMem instanceof SulcusCloudClient)) { console.error("Sulcus not connected."); return; }
+            // Reject a non-numeric or non-positive --limit up front; an unchecked
+            // parseInt would send NaN as the page size.
+            const pageSize = Number.parseInt(opts.limit, 10);
+            if (!Number.isInteger(pageSize) || pageSize < 1) { console.error(`Invalid --limit value: ${opts.limit}`); return; }
+            try {
+              const res = await sulcusMem.list_memories({
+                page_size: pageSize,
+                memory_type: opts.type,
+                pinned: opts.pinned,
+                sort_by: opts.sort,
+                sort_order: "desc",
+                namespace,
+              });
+              if (opts.json) { console.log(JSON.stringify(res, null, 2)); return; }
+              if (res.items.length === 0) { console.log("No memories."); return; }
+              for (const r of res.items) {
+                // Heat is shown as a whole-number percentage, "?" when it is not numeric.
+                const heat = typeof r.current_heat === "number" ? ((r.current_heat as number) * 100).toFixed(0) + "%" : "?";
+                const mtype = (r.memory_type ?? "?") as string;
+                const label = ((r.label ?? r.content ?? "") as string).slice(0, 100);
+                console.log(`[${heat} ${mtype}] ${label}`);
+                console.log(`  id: ${r.id}`);
+              }
+              console.log(`\n${res.items.length} shown${res.total ? ` of ${res.total}` : ""}`);
+            } catch (e: unknown) { console.error(`Error: ${e instanceof Error ? e.message : e}`); }
+          });
+        // --- openclaw sulcus update ---
+        // Patches a memory by id. Requires the cloud client. Only the options that were
+        // supplied are sent: content (stored as `label`), type, pinned flag and heat.
+        sulcusCmd.command("update <id>")
+          .description("Update a memory")
+          .option("-c, --content <text>", "New content")
+          .option("-t, --type <type>", "New memory type")
+          .option("--pin", "Pin the memory")
+          .option("--unpin", "Unpin the memory")
+          .option("--heat <value>", "Set heat (0.0-1.0)")
+          .option("--json", "Machine-readable JSON output")
+          .action(async (id: string, opts: { content?: string; type?: string; pin?: boolean; unpin?: boolean; heat?: string; json?: boolean }) => {
+            if (!isAvailable || !(sulcusMem instanceof SulcusCloudClient)) { console.error("Sulcus not connected."); return; }
+            // --pin and --unpin contradict each other; refuse rather than silently unpinning.
+            if (opts.pin && opts.unpin) { console.error("Use either --pin or --unpin, not both."); return; }
+            const updates: Record<string, unknown> = {};
+            if (opts.content) updates.label = opts.content;
+            if (opts.type) updates.memory_type = opts.type;
+            if (opts.pin) updates.is_pinned = true;
+            if (opts.unpin) updates.is_pinned = false;
+            if (opts.heat !== undefined) {
+              // Enforce the documented 0.0-1.0 range; NaN would otherwise serialize as null.
+              const heat = Number.parseFloat(opts.heat);
+              if (!Number.isFinite(heat) || heat < 0 || heat > 1) {
+                console.error(`Invalid --heat value: ${opts.heat} (expected 0.0-1.0)`);
+                return;
+              }
+              updates.current_heat = heat;
+            }
+            if (Object.keys(updates).length === 0) { console.error("No fields to update."); return; }
+            try {
+              const res = await sulcusMem.update_memory(id, updates as any);
+              if (opts.json) { console.log(JSON.stringify(res, null, 2)); }
+              else { console.log(`Updated memory ${id} (${Object.keys(updates).join(", ")})`); }
+            } catch (e: unknown) { console.error(`Error: ${e instanceof Error ? e.message : e}`); }
+          });
+        // --- openclaw sulcus delete ---
+        // Deletes a memory by id. The train flag passed to the backend is true unless
+        // the parsed options carry train === false (the --no-train switch).
+        sulcusCmd.command("delete <id>")
+          .description("Delete a memory")
+          .option("--no-train", "Don't train SIVU to reject similar")
+          .option("--json", "Machine-readable JSON output")
+          .action(async (id: string, opts: { train?: boolean; json?: boolean }) => {
+            if (!(isAvailable && sulcusMem)) {
+              console.error("Sulcus not connected.");
+              return;
+            }
+            try {
+              const shouldTrain = opts.train !== false;
+              await sulcusMem.delete_memory(id, shouldTrain);
+              if (opts.json) {
+                console.log(JSON.stringify({ deleted: id, trained: shouldTrain }));
+                return;
+              }
+              const suffix = shouldTrain ? " (trained SIVU)" : "";
+              console.log(`Deleted memory ${id}${suffix}`);
+            } catch (e: unknown) {
+              const detail = e instanceof Error ? e.message : e;
+              console.error(`Error: ${detail}`);
+            }
+          });
+        // --- openclaw sulcus export ---
+        // Writes the backend's Markdown export to stdout.
+        sulcusCmd.command("export")
+          .description("Export all memories as Markdown")
+          .action(async () => {
+            if (!(isAvailable && sulcusMem)) {
+              console.error("Sulcus not connected.");
+              return;
+            }
+            try {
+              console.log(await sulcusMem.export_markdown());
+            } catch (e: unknown) {
+              const detail = e instanceof Error ? e.message : e;
+              console.error(`Error: ${detail}`);
+            }
+          });
+        // --- openclaw sulcus import ---
+        // Reads <file> as UTF-8 text, hands it to the backend's Markdown import and
+        // prints the returned result as JSON. Read and import errors are reported on stderr.
+        sulcusCmd.command("import <file>")
+          .description("Import memories from a Markdown file")
+          .action(async (file: string) => {
+            if (!isAvailable || !sulcusMem) { console.error("Sulcus not connected."); return; }
+            try {
+              // Uses the readFileSync already imported from "node:fs" at the top of the file;
+              // a local require() is not defined when the module is loaded as native ESM.
+              const text = readFileSync(file, "utf-8");
+              const res = await sulcusMem.import_markdown(text);
+              console.log(JSON.stringify(res, null, 2));
+            } catch (e: unknown) { console.error(`Error: ${e instanceof Error ? e.message : e}`); }
+          });
+        // --- openclaw sulcus consolidate ---
+        // Asks the backend to consolidate memories using the given heat threshold
+        // (option default "0.1") and prints the backend's response.
+        sulcusCmd.command("consolidate")
+          .description("Run dream/consolidation on cold memories")
+          .option("--min-heat <value>", "Heat threshold (0.0-1.0)", "0.1")
+          .option("--json", "Machine-readable JSON output")
+          .action(async (opts: { minHeat: string; json?: boolean }) => {
+            if (!isAvailable || !sulcusMem) { console.error("Sulcus not connected."); return; }
+            // Enforce the documented 0.0-1.0 range; an unchecked parseFloat would pass NaN through.
+            const minHeat = Number.parseFloat(opts.minHeat);
+            if (!Number.isFinite(minHeat) || minHeat < 0 || minHeat > 1) {
+              console.error(`Invalid --min-heat value: ${opts.minHeat} (expected 0.0-1.0)`);
+              return;
+            }
+            try {
+              const res = await sulcusMem.consolidate(minHeat);
+              if (opts.json) { console.log(JSON.stringify(res, null, 2)); }
+              else { console.log("Consolidation complete."); console.log(JSON.stringify(res, null, 2)); }
+            } catch (e: unknown) { console.error(`Error: ${e instanceof Error ? e.message : e}`); }
+          });
+        // --- openclaw sulcus hot ---
+        // Prints the hottest memories as "[heat] label" lines, or the raw node array with --json.
+        sulcusCmd.command("hot")
+          .description("Show hottest memories")
+          .option("-n, --limit <n>", "Max results", "10")
+          .option("--json", "Machine-readable JSON output")
+          .action(async (opts: { limit: string; json?: boolean }) => {
+            if (!isAvailable || !sulcusMem) { console.error("Sulcus not connected."); return; }
+            // Reject a non-numeric or non-positive --limit up front; an unchecked
+            // parseInt would pass NaN on to the backend.
+            const limit = Number.parseInt(opts.limit, 10);
+            if (!Number.isInteger(limit) || limit < 1) { console.error(`Invalid --limit value: ${opts.limit}`); return; }
+            try {
+              const res = await sulcusMem.list_hot_nodes(limit);
+              const nodes = res?.nodes ?? [];
+              if (opts.json) { console.log(JSON.stringify(nodes, null, 2)); return; }
+              if (nodes.length === 0) { console.log("No hot nodes."); return; }
+              for (const n of nodes) {
+                // Heat is shown as a whole-number percentage, "?" when it is not numeric.
+                const heat = typeof n.current_heat === "number" ? ((n.current_heat as number) * 100).toFixed(0) + "%" : "?";
+                const label = ((n.label ?? n.pointer_summary ?? "") as string).slice(0, 100);
+                console.log(`[${heat}] ${label}`);
+              }
+            } catch (e: unknown) { console.error(`Error: ${e instanceof Error ? e.message : e}`); }
+          });
+        logger.info("sulcus: registered CLI commands (openclaw sulcus <cmd>)");
+      }, {
+        commands: ["sulcus"],
+        descriptors: [{
+          name: "sulcus",
+          description: "Sulcus memory management \u2014 status, search, add, get, list, update, delete, export, import, consolidate, hot",
+          hasSubcommands: true,
+        }],
+      });
+    } else {
+      logger.info("sulcus: registerCli not available \u2014 CLI commands skipped");
+    }
     // Fire-and-forget first-install history import
     if (isAvailable && sulcusMem instanceof SulcusCloudClient) {
       importOpenClawHistory(sulcusMem, logger).catch((e: unknown) => {