npm - @shadowforge0/aquifer-memory - Versions diffs - 1.2.1 → 1.5.8 - Mend

@shadowforge0/aquifer-memory 1.2.1 → 1.5.8

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (43)

package/README.md +8 -9
package/consumers/cli.js +11 -1
package/consumers/default/index.js +17 -4
package/consumers/mcp.js +21 -0
package/consumers/miranda/index.js +15 -4
package/consumers/miranda/profile.json +145 -0
package/consumers/miranda/recall-format.js +5 -3
package/consumers/miranda/render-daily-md.js +186 -0
package/consumers/shared/config.js +8 -0
package/consumers/shared/factory.js +2 -1
package/consumers/shared/llm.js +1 -1
package/consumers/shared/recall-format.js +21 -1
package/core/aquifer.js +693 -87
package/core/artifacts.js +174 -0
package/core/bundles.js +400 -0
package/core/consolidation.js +340 -0
package/core/decisions.js +164 -0
package/core/entity-state.js +483 -0
package/core/errors.js +97 -0
package/core/handoff.js +153 -0
package/core/insights.js +499 -0
package/core/mcp-manifest.js +131 -0
package/core/narratives.js +212 -0
package/core/profiles.js +171 -0
package/core/state.js +163 -0
package/core/storage.js +82 -5
package/core/timeline.js +152 -0
package/index.js +14 -0
package/package.json +1 -1
package/pipeline/extract-state-changes.js +205 -0
package/schema/001-base.sql +186 -16
package/schema/002-entities.sql +35 -1
package/schema/004-completion.sql +391 -0
package/schema/005-entity-state-history.sql +87 -0
package/schema/006-insights.sql +138 -0
package/scripts/diagnose-fts-zh.js +37 -4
package/scripts/drop-entity-state-history.sql +17 -0
package/scripts/drop-insights.sql +12 -0
package/scripts/extract-insights-from-recent-sessions.js +315 -0
package/scripts/find-dburl-hints.js +29 -0
package/scripts/queries.json +45 -0
package/scripts/retro-recall-bench.js +409 -0
package/scripts/sample-bench-queries.sql +75 -0

package/core/aquifer.js CHANGED

@@ -42,15 +42,45 @@ function loadSql(filename, schema) {
 // ---------------------------------------------------------------------------
 function buildRerankDocument(row, maxChars) {
-  let text = (row.summary_text || row.summary_snippet || '').replace(/\s+/g, ' ').trim();
+  // Prefer structured_summary fields when available — title/overview carry
+  // more signal than summary_text for short Chinese recaps, and topics /
+  // decisions / open_loops give the cross-encoder substantive content.
+  // Fall back to summary_text / matched_turn_text when structured is absent.
+  const ss = row.structured_summary || null;
+  const parts = [];
+  if (ss) {
+    if (ss.title) parts.push(String(ss.title).trim());
+    if (ss.overview) parts.push(String(ss.overview).trim());
+    if (Array.isArray(ss.topics)) {
+      const topics = ss.topics
+        .map(t => typeof t === 'string' ? t : (t && t.name ? `${t.name}${t.summary ? ': ' + t.summary : ''}` : ''))
+        .filter(Boolean).join(' / ');
+      if (topics) parts.push(topics);
+    }
+    if (Array.isArray(ss.decisions)) {
+      const decisions = ss.decisions
+        .map(d => typeof d === 'string' ? d : (d && d.decision ? d.decision : ''))
+        .filter(Boolean).join(' / ');
+      if (decisions) parts.push(`Decisions: ${decisions}`);
+    }
+    if (Array.isArray(ss.open_loops)) {
+      const loops = ss.open_loops
+        .map(l => typeof l === 'string' ? l : (l && l.item ? l.item : ''))
+        .filter(Boolean).join(' / ');
+      if (loops) parts.push(`Open loops: ${loops}`);
+    }
+  }
+  if (!parts.length) {
+    const bare = (row.summary_text || row.summary_snippet || '').trim();
+    if (bare) parts.push(bare);
+  }
   const turn = (row.matched_turn_text || '').replace(/\s+/g, ' ').trim();
-  if (!text) {
-    text = turn;
-  } else if (turn && !text.includes(turn)) {
-    text = `${text}\n\nMatched turn:\n${turn}`;
+  if (turn) {
+    const joined = parts.join(' \n ');
+    if (!joined.includes(turn)) parts.push(`Matched turn: ${turn}`);
   }
+  let text = parts.join('\n\n').replace(/[ \t]+/g, ' ').trim();
   if (text.length > maxChars) text = text.slice(0, maxChars);
   return text;
 }
@@ -92,6 +122,48 @@ function resolveEmbedFn(embedConfig, env) {
 // createAquifer
 // ---------------------------------------------------------------------------
+// Decide whether to invoke the optional reranker on this recall call.
+// Returns `{ apply: boolean, reason: string }`. Pure function — no side effects.
+function shouldAutoRerank({ query, mode, ranked, hasEntities, autoTrigger }) {
+  if (!autoTrigger.enabled) return { apply: false, reason: 'auto_disabled' };
+  if (hasEntities && autoTrigger.alwaysWhenEntities) {
+    return { apply: true, reason: 'entities_present' };
+  }
+  const len = ranked.length;
+  if (len < autoTrigger.minResults) return { apply: false, reason: 'too_few_results' };
+  if (len > autoTrigger.maxResults) return { apply: false, reason: 'too_many_results' };
+  const q = String(query || '').trim();
+  const tokenCount = q.split(/\s+/).filter(Boolean).length;
+  if (q.length < autoTrigger.minQueryChars && tokenCount < autoTrigger.minQueryTokens) {
+    return { apply: false, reason: 'query_too_short' };
+  }
+  // FTS-only path: rerank when results are wide enough that semantic narrowing
+  // is valuable. Cohere-style cross-encoders excel at re-ranking keyword hits.
+  if (mode === 'fts') {
+    if (len > autoTrigger.ftsMinResults) return { apply: true, reason: 'fts_wide_shortlist' };
+    return { apply: false, reason: 'fts_shortlist_too_narrow' };
+  }
+  if (!autoTrigger.modes.includes(mode)) {
+    return { apply: false, reason: 'mode_not_in_autotrigger_modes' };
+  }
+  // Hybrid: if top-1 and top-2 are close, signals are mixed enough to benefit.
+  if (len >= 2) {
+    const s0 = ranked[0]?._score ?? 0;
+    const s1 = ranked[1]?._score ?? 0;
+    if (s0 - s1 <= autoTrigger.maxTopScoreGap) {
+      return { apply: true, reason: 'top_score_gap_close' };
+    }
+  }
+  return { apply: false, reason: 'top_score_gap_wide' };
+}
 function createAquifer(config = {}) {
   // v1.2.0: db falls back to DATABASE_URL / AQUIFER_DB_URL env so hosts can
   // call createAquifer() with zero args for install-and-go.
@@ -176,6 +248,24 @@ function createAquifer(config = {}) {
   const defaultRerankTopK = rerankConfig ? Math.max(1, rerankConfig.topK || 20) : 0;
   const rerankMaxChars = rerankConfig ? Math.max(200, rerankConfig.maxChars || 1600) : 0;
+  // Auto-trigger gate for rerank: when reranker is configured but caller didn't
+  // explicitly pass opts.rerank, decide per-call whether the cost is worth it.
+  // Defaults aim for "rerank when shortlist is dense enough to benefit, query
+  // is non-trivial, and either signals are mixed (hybrid) or FTS returned a
+  // wide candidate set worth narrowing semantically."
+  const autoTriggerCfg = (rerankConfig && rerankConfig.autoTrigger) || {};
+  const autoTrigger = {
+    enabled: autoTriggerCfg.enabled !== false,  // default true when reranker exists
+    modes: autoTriggerCfg.modes || ['hybrid'],
+    minQueryChars: autoTriggerCfg.minQueryChars ?? 6,
+    minQueryTokens: autoTriggerCfg.minQueryTokens ?? 2,
+    minResults: autoTriggerCfg.minResults ?? 2,
+    maxResults: autoTriggerCfg.maxResults ?? 12,
+    maxTopScoreGap: autoTriggerCfg.maxTopScoreGap ?? 0.08,
+    alwaysWhenEntities: autoTriggerCfg.alwaysWhenEntities !== false,  // default true
+    ftsMinResults: autoTriggerCfg.ftsMinResults ?? 5,  // FTS-only mode triggers when results > this
+  };
   // Source registry (in-memory)
   const sources = new Map();
@@ -183,57 +273,104 @@ function createAquifer(config = {}) {
   let migrated = false;
   let migratePromise = null;
-  async function ensureMigrated() {
-    if (migrated) return;
-    if (migratePromise) return migratePromise;
-    migratePromise = aquifer.migrate().finally(() => { migratePromise = null; });
-    return migratePromise;
+  // FTS tsconfig — auto-detected during migrate(). 'zhcfg' if zhparser is
+  // installed (better Chinese segmentation), otherwise 'simple' (legacy).
+  // Override via config.ftsConfig if you need to force one or the other.
+  let ftsConfig = config.ftsConfig || null;
+  // State-change extraction (Q3): off by default. When enabled, enrich() runs
+  // an extra LLM call to capture temporal state transitions on whitelisted
+  // entities. See pipeline/extract-state-changes.js + core/entity-state.js.
+  const stateChangesCfg = config.stateChanges || {};
+  const stateChangesEnabled = stateChangesCfg.enabled === true;
+  const stateChangesWhitelist = new Set(
+    (Array.isArray(stateChangesCfg.whitelist) ? stateChangesCfg.whitelist : [])
+      .map(s => String(s).toLowerCase())
+  );
+  const stateChangesPromptFn = stateChangesCfg.promptFn || null;
+  const stateChangesConfThreshold = Number.isFinite(stateChangesCfg.confidenceThreshold)
+    ? stateChangesCfg.confidenceThreshold : 0.7;
+  const stateChangesTimeoutMs = Number.isFinite(stateChangesCfg.timeoutMs)
+    ? stateChangesCfg.timeoutMs : 10000;
+  const stateChangesMaxOutputTokens = Number.isFinite(stateChangesCfg.maxOutputTokens)
+    ? stateChangesCfg.maxOutputTokens : 600;
+  const migrationsCfg = config.migrations || {};
+  const migrationsMode = (() => {
+    const raw = migrationsCfg.mode;
+    if (raw === 'apply' || raw === 'check' || raw === 'off') return raw;
+    if (raw === undefined || raw === null) return 'apply';
+    throw new Error(`config.migrations.mode must be 'apply' | 'check' | 'off' (got ${JSON.stringify(raw)})`);
+  })();
+  const migrationLockTimeoutMs = Number.isFinite(migrationsCfg.lockTimeoutMs)
+    ? Math.max(0, migrationsCfg.lockTimeoutMs) : 30000;
+  const migrationStartupTimeoutMs = Number.isFinite(migrationsCfg.startupTimeoutMs)
+    ? Math.max(0, migrationsCfg.startupTimeoutMs) : 60000;
+  const migrationOnEvent = typeof migrationsCfg.onEvent === 'function' ? migrationsCfg.onEvent : null;
+  function emitMigrationEvent(name, payload) {
+    if (!migrationOnEvent) return;
+    try { migrationOnEvent({ name, schema, ...payload }); } catch (err) {
+      console.warn(`[aquifer] migrations.onEvent handler threw: ${err.message}`);
+    }
   }
-  // --- Helper: embed search on summaries ---
-  async function embeddingSearchSummaries(queryVec, opts) {
-    const { agentIds, source, dateFrom, dateTo, limit = 20 } = opts;
-    const where = [`s.tenant_id = $1`];
-    const params = [tenantId];
-    params.push(`[${queryVec.join(',')}]`);
-    const vecPos = params.length;
-    if (dateFrom) {
-      params.push(dateFrom);
-      where.push(`($${params.length}::date IS NULL OR s.started_at::date >= $${params.length}::date)`);
-    }
-    if (dateTo) {
-      params.push(dateTo);
-      where.push(`($${params.length}::date IS NULL OR s.started_at::date <= $${params.length}::date)`);
-    }
-    if (agentIds && agentIds.length > 0) {
-      params.push(agentIds);
-      where.push(`s.agent_id = ANY($${params.length})`);
-    }
-    if (source) {
-      params.push(source);
-      where.push(`s.source = $${params.length}`);
-    }
+  // Expected migration set — used for lazy plan introspection. `always: true`
+  // runs every migrate(); others are gated by feature flags. Signature tables
+  // let listPendingMigrations() probe pg_tables without executing DDL.
+  const MIGRATION_PLAN = [
+    { id: '001-base',                file: '001-base.sql',                always: true, signature: 'sessions' },
+    { id: '002-entities',            file: '002-entities.sql',            gate: 'entities', signature: 'entities' },
+    { id: '003-trust-feedback',      file: '003-trust-feedback.sql',      always: true, signature: 'session_feedback' },
+    { id: '004-facts',               file: '004-facts.sql',               gate: 'facts', signature: 'facts' },
+    { id: '004-completion',          file: '004-completion.sql',          always: true, signature: 'narratives' },
+    { id: '005-entity-state-history',file: '005-entity-state-history.sql',gate: 'entities', signature: 'entity_state_history' },
+    { id: '006-insights',            file: '006-insights.sql',            always: true, signature: 'insights' },
+  ];
+  function requiredMigrations() {
+    return MIGRATION_PLAN
+      .filter(m => m.always
+        || (m.gate === 'entities' && entitiesEnabled)
+        || (m.gate === 'facts' && factsEnabled))
+      .map(m => m.id);
+  }
-    params.push(limit);
-    const result = await pool.query(
-      `SELECT
-        s.id, s.session_id, s.agent_id, s.source, s.started_at, s.last_message_at,
-        ss.summary_text, ss.structured_summary, ss.access_count, ss.last_accessed_at,
-        ss.trust_score,
-        (ss.embedding <=> $${vecPos}::vector) AS distance
-      FROM ${qi(schema)}.session_summaries ss
-      JOIN ${qi(schema)}.sessions s ON s.id = ss.session_row_id
-      WHERE ss.embedding IS NOT NULL
-        AND ${where.join(' AND ')}
-      ORDER BY distance ASC
-      LIMIT $${params.length}`,
-      params
+  async function readAppliedMigrations(queryRunner) {
+    const required = MIGRATION_PLAN.filter(m => m.always
+      || (m.gate === 'entities' && entitiesEnabled)
+      || (m.gate === 'facts' && factsEnabled));
+    const signatures = required.map(m => m.signature);
+    if (signatures.length === 0) return [];
+    const r = await queryRunner.query(
+      `SELECT tablename FROM pg_tables
+         WHERE schemaname = $1 AND tablename = ANY($2::text[])`,
+      [schema, signatures]
     );
+    const present = new Set(r.rows.map(row => row.tablename));
+    return required.filter(m => present.has(m.signature)).map(m => m.id);
+  }
+  async function buildMigrationPlan(queryRunner) {
+    const required = requiredMigrations();
+    const applied = await readAppliedMigrations(queryRunner);
+    const appliedSet = new Set(applied);
+    const pending = required.filter(id => !appliedSet.has(id));
+    return { required, applied, pending };
+  }
-    return result.rows;
+  async function ensureMigrated() {
+    if (migrated) return;
+    if (migratePromise) return migratePromise;
+    if (migrationsMode === 'off') { migrated = true; return; }
+    if (migrationsMode === 'check') {
+      // Lazy compare only — don't execute DDL implicitly.
+      const plan = await buildMigrationPlan(pool).catch(() => null);
+      if (plan && plan.pending.length === 0) migrated = true;
+      return;
+    }
+    migratePromise = aquifer.migrate().finally(() => { migratePromise = null; });
+    return migratePromise;
   }
   // =========================================================================
@@ -243,38 +380,329 @@ function createAquifer(config = {}) {
   const aquifer = {
     // --- lifecycle ---
+    async ensureMigrated() {
+      return ensureMigrated();
+    },
     async migrate() {
+      const t0 = Date.now();
       // Advisory lock prevents concurrent migrations across processes.
       // Lock key is derived from schema name to allow parallel migration
       // of different schemas in the same database.
       const lockKey = Buffer.from(`aquifer:${schema}`).reduce((h, b) => (h * 31 + b) & 0x7fffffff, 0);
-      await pool.query('SELECT pg_advisory_lock($1)', [lockKey]);
+      emitMigrationEvent('init_started', { mode: migrationsMode });
+      // Run all migration DDL on a single checked-out client so we can
+      // capture RAISE NOTICE/WARNING emitted by the DO blocks. node-postgres
+      // swallows notices on pool.query(); attaching a 'notice' listener to a
+      // held client surfaces them. Fall back to pool.query() when the caller
+      // passed a bare mock (no connect/release) — tests using minimal pool
+      // stubs still exercise the migration shape, just without notice capture.
+      const supportsCheckout = typeof pool.connect === 'function';
+      const client = supportsCheckout ? await pool.connect() : pool;
+      const releasesClient = supportsCheckout && typeof client.release === 'function';
+      const notices = [];
+      const onNotice = (n) => {
+        notices.push({ severity: n.severity || 'NOTICE', message: n.message || String(n) });
+      };
+      const hasEvents = typeof client.on === 'function' && typeof client.off === 'function';
+      if (hasEvents) client.on('notice', onNotice);
+      const ddlExecuted = [];
+      let lockAcquired = false;
       try {
-        // 1. Run base DDL
-        const baseSql = loadSql('001-base.sql', schema);
-        await pool.query(baseSql);
-        // 2. If entities enabled, run entity DDL
-        if (entitiesEnabled) {
-          const entitySql = loadSql('002-entities.sql', schema);
-          await pool.query(entitySql);
+        // Plan probe before lock: lets consumers see pending list and lets
+        // us emit an accurate check_completed event even when the DDL is a
+        // no-op on an already-migrated schema.
+        const planBefore = await buildMigrationPlan(client).catch(() => null);
+        emitMigrationEvent('check_completed', {
+          required: planBefore ? planBefore.required : requiredMigrations(),
+          applied:  planBefore ? planBefore.applied  : [],
+          pending:  planBefore ? planBefore.pending  : requiredMigrations(),
+        });
+        // Try-lock with poll + timeout. Replaces the old blocking
+        // pg_advisory_lock() which could hang indefinitely if another
+        // process crashed holding the lock. Defensive against mock pools:
+        // only poll when PG explicitly returns ok=false; a missing/empty
+        // response (test mocks that don't model pg_try_advisory_lock) is
+        // treated as acquired so suite doesn't hang on the deadline.
+        const lockDeadline = Date.now() + migrationLockTimeoutMs;
+        const pollMs = 250;
+        while (true) {
+          const r = await client.query('SELECT pg_try_advisory_lock($1) AS ok', [lockKey]);
+          const row = r && r.rows ? r.rows[0] : null;
+          if (row && row.ok === false) {
+            if (Date.now() >= lockDeadline) break;
+            await new Promise(res => setTimeout(res, pollMs));
+            continue;
+          }
+          lockAcquired = true;
+          break;
         }
+        if (!lockAcquired) {
+          const err = new Error(`aquifer: failed to acquire migration advisory lock within ${migrationLockTimeoutMs}ms for schema "${schema}"`);
+          err.code = 'AQ_MIGRATION_LOCK_TIMEOUT';
+          err.failedAt = 'acquire_lock';
+          throw err;
+        }
+        emitMigrationEvent('apply_started', {
+          pending: planBefore ? planBefore.pending : requiredMigrations(),
+        });
-        // 3. Trust + feedback (always, not gated by entities)
-        const trustSql = loadSql('003-trust-feedback.sql', schema);
-        await pool.query(trustSql);
+        try {
+          // 1. Run base DDL
+          const baseSql = loadSql('001-base.sql', schema);
+          await client.query(baseSql); ddlExecuted.push('001-base');
+          // 2. If entities enabled, run entity DDL
+          if (entitiesEnabled) {
+            const entitySql = loadSql('002-entities.sql', schema);
+            await client.query(entitySql); ddlExecuted.push('002-entities');
+          }
-        // 4. Facts / consolidation (opt-in)
-        if (factsEnabled) {
-          const factsSql = loadSql('004-facts.sql', schema);
-          await pool.query(factsSql);
+          // 3. Trust + feedback (always, not gated by entities)
+          const trustSql = loadSql('003-trust-feedback.sql', schema);
+          await client.query(trustSql); ddlExecuted.push('003-trust-feedback');
+          // 4. Facts / consolidation (opt-in)
+          if (factsEnabled) {
+            const factsSql = loadSql('004-facts.sql', schema);
+            await client.query(factsSql); ddlExecuted.push('004-facts');
+          }
+          // 5. Completion foundation (always, additive): narratives,
+          // consumer_profiles, sessions.consolidation_phases. Pure additive DDL
+          // with IF NOT EXISTS guards — safe on every migrate() call.
+          const completionSql = loadSql('004-completion.sql', schema);
+          await client.query(completionSql); ddlExecuted.push('004-completion');
+          // 6. Entity state history (always, gated by entitiesEnabled because
+          // it FK-references entities). Drop-clean — see scripts/drop-entity-state-history.sql.
+          if (entitiesEnabled) {
+            const stateHistorySql = loadSql('005-entity-state-history.sql', schema);
+            await client.query(stateHistorySql); ddlExecuted.push('005-entity-state-history');
+          }
+          // 7. Insights (always, additive). No FK from anywhere into this table —
+          // safe to DROP CASCADE. See scripts/drop-insights.sql.
+          const insightsSql = loadSql('006-insights.sql', schema);
+          await client.query(insightsSql); ddlExecuted.push('006-insights');
+          migrated = true;
+        } finally {
+          await client.query('SELECT pg_advisory_unlock($1)', [lockKey]).catch((err) => {
+            console.warn(`[aquifer] failed to release migration advisory lock for schema "${schema}": ${err.message}`);
+          });
         }
+      } catch (err) {
+        err.notices = Array.isArray(err.notices) ? err.notices : notices.slice();
+        err.failedAt = err.failedAt || 'apply_ddl';
+        emitMigrationEvent('apply_failed', {
+          error: { code: err.code || null, message: err.message },
+          failedAt: err.failedAt,
+          notices: err.notices,
+          durationMs: Date.now() - t0,
+        });
+        throw err;
+      } finally {
+        if (hasEvents) client.off('notice', onNotice);
+        if (releasesClient) client.release();
+      }
-        migrated = true;
+      // Surface captured migration notices that operators need to see:
+      //   - any WARNING/ERROR (zhcfg rebuild warnings, HNSW OOM, etc.)
+      //   - aquifer-authored NOTICE messages ('[aquifer] ...' prefix in the
+      //     migration DO blocks; these announce extension-install fallback,
+      //     HNSW deferral, and other operational decisions)
+      // Filtered out: PG's own "relation already exists, skipping" and
+      // similar idempotent-DDL chatter that floods a re-run.
+      for (const n of notices) {
+        const sev = (n.severity || 'NOTICE').toUpperCase();
+        const msg = n.message || '';
+        const line = `[aquifer] migration ${sev.toLowerCase()}: ${msg}`;
+        if (sev === 'WARNING' || sev === 'ERROR') {
+          console.warn(line);
+        } else if (sev === 'NOTICE' && msg.startsWith('[aquifer]')) {
+          process.stderr.write(line + '\n');
+        }
+      }
+      // Auto-detect FTS tsconfig if not forced by config. Restrict to the
+      // public namespace — same restriction the trigger function uses — so a
+      // same-named config in another schema doesn't fool the detection.
+      if (!ftsConfig) {
+        try {
+          const r = await pool.query(
+            `SELECT 1 FROM pg_ts_config
+               WHERE cfgname = 'zhcfg' AND cfgnamespace = 'public'::regnamespace
+               LIMIT 1`);
+          ftsConfig = r.rowCount > 0 ? 'zhcfg' : 'simple';
+        } catch {
+          ftsConfig = 'simple';
+        }
+      }
+      // Post-flight: surface which Chinese FTS backend the migration actually
+      // landed on, and warm the backend's tokenizer so the first live query
+      // doesn't pay cold-start cost unpredictably. RAISE NOTICE/WARNING from
+      // the migration DO blocks are swallowed by node-postgres unless a
+      // notice handler is attached, so without this operators can't tell if
+      // pg_jieba silently failed to install and FTS is degraded to 'simple'.
+      //
+      // pg_jieba first-backend load is ~60MB RAM + 0.5-1s to mmap the dict.
+      // Warming once inside migrate() amortizes that on the backend that runs
+      // migration; other pool backends still pay it on first use, but the
+      // timing surfaces the cost so operators who see unexpected latency
+      // know where to look.
+      try {
+        const f = await pool.query(`
+          SELECT
+            EXISTS(SELECT 1 FROM pg_extension WHERE extname='pg_jieba')   AS have_jieba,
+            EXISTS(SELECT 1 FROM pg_extension WHERE extname='zhparser')   AS have_zhparser,
+            (SELECT p.prsname FROM pg_ts_config c
+               JOIN pg_ts_parser p ON c.cfgparser = p.oid
+               WHERE c.cfgname='zhcfg' AND c.cfgnamespace='public'::regnamespace
+               LIMIT 1)                                                    AS zhcfg_parser
+        `);
+        const row = f.rows[0] || {};
+        const backend = row.zhcfg_parser
+          ? `zhcfg(parser=${row.zhcfg_parser})`
+          : `simple (no zhcfg in public namespace)`;
+        let warmupMs = null;
+        if (row.zhcfg_parser) {
+          const t0 = Date.now();
+          await pool.query(`SELECT to_tsvector('zhcfg', $1)`, ['warmup 記憶系統 aquifer'])
+            .catch(() => {});
+          warmupMs = Date.now() - t0;
+        }
+        const warmupNote = warmupMs !== null ? ` warmup=${warmupMs}ms` : '';
+        process.stderr.write(
+          `[aquifer] FTS post-flight: backend=${backend} ` +
+          `jieba=${row.have_jieba} zhparser=${row.have_zhparser} ` +
+          `selected=${ftsConfig}${warmupNote}\n`
+        );
+        if (warmupMs !== null && warmupMs > 500) {
+          process.stderr.write(
+            `[aquifer] Note: first FTS call paid ~${warmupMs}ms for tokenizer init ` +
+            `(dictionary mmap). Subsequent calls on the same backend are cached.\n`
+          );
+        }
+      } catch (err) {
+        console.warn(`[aquifer] FTS post-flight check failed: ${err.message}`);
+      }
+      const durationMs = Date.now() - t0;
+      emitMigrationEvent('apply_succeeded', {
+        ddlExecuted,
+        durationMs,
+        notices: notices.slice(),
+      });
+      return { ok: true, durationMs, notices: notices.slice(), ddlExecuted };
+    },
+    async listPendingMigrations() {
+      const plan = await buildMigrationPlan(pool);
+      return { ...plan, lastRunAt: null };
+    },
+    async getMigrationStatus() {
+      return this.listPendingMigrations();
+    },
+    async init() {
+      const t0 = Date.now();
+      const mode = migrationsMode;
+      let deadlineTimer = null;
+      const startupDeadline = migrationStartupTimeoutMs > 0
+        ? new Promise((_, reject) => {
+            deadlineTimer = setTimeout(() => {
+              const err = new Error(`aquifer: init() exceeded startupTimeoutMs=${migrationStartupTimeoutMs}ms`);
+              err.code = 'AQ_MIGRATION_STARTUP_TIMEOUT';
+              reject(err);
+            }, migrationStartupTimeoutMs);
+            if (typeof deadlineTimer.unref === 'function') deadlineTimer.unref();
+          })
+        : null;
+      const withDeadline = (p) => startupDeadline ? Promise.race([p, startupDeadline]) : p;
+      const clearDeadline = () => { if (deadlineTimer) { clearTimeout(deadlineTimer); deadlineTimer = null; } };
+      try {
+        let plan;
+        try {
+          plan = await withDeadline(buildMigrationPlan(pool));
+        } catch (err) {
+          const durationMs = Date.now() - t0;
+          emitMigrationEvent('apply_failed', {
+            error: { code: err.code || null, message: err.message },
+            failedAt: 'plan_probe',
+            notices: [],
+            durationMs,
+          });
+          return {
+            ready: false,
+            memoryMode: 'off',
+            migrationMode: mode,
+            pendingMigrations: [],
+            appliedMigrations: [],
+            error: { code: err.code || 'AQ_MIGRATION_PROBE_FAILED', message: err.message },
+            durationMs,
+          };
+        }
+        if (mode === 'off') {
+          return {
+            ready: true, memoryMode: 'rw', migrationMode: mode,
+            pendingMigrations: plan.pending, appliedMigrations: plan.applied,
+            error: null, durationMs: Date.now() - t0,
+          };
+        }
+        if (mode === 'check') {
+          const ready = plan.pending.length === 0;
+          if (ready) migrated = true;
+          return {
+            ready, memoryMode: ready ? 'rw' : 'ro', migrationMode: mode,
+            pendingMigrations: plan.pending, appliedMigrations: plan.applied,
+            error: null, durationMs: Date.now() - t0,
+          };
+        }
+        // mode === 'apply'
+        if (plan.pending.length === 0) {
+          migrated = true;
+          return {
+            ready: true, memoryMode: 'rw', migrationMode: mode,
+            pendingMigrations: [], appliedMigrations: plan.applied,
+            error: null, durationMs: Date.now() - t0,
+          };
+        }
+        try {
+          const result = await withDeadline(this.migrate());
+          const planAfter = await buildMigrationPlan(pool).catch(() => null);
+          return {
+            ready: true, memoryMode: 'rw', migrationMode: mode,
+            pendingMigrations: planAfter ? planAfter.pending : [],
+            appliedMigrations: planAfter ? planAfter.applied : plan.required,
+            error: null, durationMs: result.durationMs || (Date.now() - t0),
+          };
+        } catch (err) {
+          return {
+            ready: false, memoryMode: 'ro', migrationMode: mode,
+            pendingMigrations: plan.pending, appliedMigrations: plan.applied,
+            error: { code: err.code || 'AQ_MIGRATION_FAILED', message: err.message },
+            durationMs: Date.now() - t0,
+          };
+        }
       } finally {
-        await pool.query('SELECT pg_advisory_unlock($1)', [lockKey]).catch((err) => {
-          console.warn(`[aquifer] failed to release migration advisory lock for schema "${schema}": ${err.message}`);
-        });
+        clearDeadline();
       }
     },
@@ -498,6 +926,34 @@ function createAquifer(config = {}) {
         } catch (e) { warnings.push(`entity extraction failed: ${e.message}`); }
       }
+      // 4d. State-change extraction (Q3) — only if enabled, entities available,
+      // and at least one parsed entity matches whitelist. Returns changes with
+      // entity_name (not id); resolution happens in tx after entity upsert.
+      let parsedStateChanges = [];
+      if (stateChangesEnabled && entitiesEnabled && !skipEntities && parsedEntities.length > 0 && llmFn) {
+        const scopedEntities = stateChangesWhitelist.size === 0
+          ? parsedEntities  // empty whitelist == all parsed entities in scope
+          : parsedEntities.filter(e => stateChangesWhitelist.has(String(e.name).toLowerCase()));
+        if (scopedEntities.length > 0) {
+          try {
+            const { extractStateChanges } = require('../pipeline/extract-state-changes');
+            const result = await extractStateChanges(normalized, {
+              llmFn,
+              promptFn: stateChangesPromptFn,
+              entities: scopedEntities.map(e => ({ name: e.name, aliases: e.aliases || [] })),
+              sessionStartedAt: session.started_at ? new Date(session.started_at).toISOString() : null,
+              evidenceSessionId: sessionId,
+              confidenceThreshold: stateChangesConfThreshold,
+              timeoutMs: stateChangesTimeoutMs,
+              maxOutputTokens: stateChangesMaxOutputTokens,
+              logger: { warn: (m) => warnings.push(`state-change: ${m}`) },
+            });
+            parsedStateChanges = result.changes || [];
+            for (const w of (result.warnings || [])) warnings.push(`state-change: ${w}`);
+          } catch (e) { warnings.push(`state-change extraction failed: ${e.message}`); }
+        }
+      }
       // 5. Now open transaction — only DB writes, no external calls
       const client = await pool.connect();
       let turnsEmbedded = 0;
@@ -589,6 +1045,49 @@ function createAquifer(config = {}) {
           }
           entitiesFound = entityIds.length;
+          // 5d. Apply state changes (Q3) inside SAVEPOINT so a CONFLICT or
+          // CHECK violation can't poison the parent transaction.
+          if (parsedStateChanges.length > 0) {
+            // Build name→id map from upserted entities (parsedEntities aligned
+            // with entityIds by index).
+            const nameToId = new Map();
+            for (let i = 0; i < parsedEntities.length && i < entityIds.length; i++) {
+              const ent = parsedEntities[i];
+              if (!ent || entityIds[i] === null || entityIds[i] === undefined) continue;
+              nameToId.set(String(ent.name).toLowerCase(), entityIds[i]);
+              for (const a of (ent.aliases || [])) {
+                if (typeof a === 'string') nameToId.set(a.toLowerCase(), entityIds[i]);
+              }
+            }
+            const resolved = [];
+            for (const ch of parsedStateChanges) {
+              const id = nameToId.get(String(ch.entityName || '').toLowerCase());
+              if (id === null || id === undefined) continue;
+              const { entityName: _drop, ...rest } = ch;
+              void _drop;
+              resolved.push({ ...rest, entityId: id, sessionRowId: session.id });
+            }
+            if (resolved.length > 0) {
+              try {
+                await client.query('SAVEPOINT state_changes');
+                const r = await aquifer.entityState.applyChanges(client, {
+                  agentId,
+                  sessionRowId: session.id,
+                  changes: resolved,
+                });
+                if (!r.ok) {
+                  warnings.push(`state-change apply failed: ${r.error.code} ${r.error.message}`);
+                  await client.query('ROLLBACK TO SAVEPOINT state_changes');
+                } else {
+                  await client.query('RELEASE SAVEPOINT state_changes');
+                }
+              } catch (e) {
+                warnings.push(`state-change savepoint error: ${e.message}`);
+                try { await client.query('ROLLBACK TO SAVEPOINT state_changes'); } catch { /* ignore */ }
+              }
+            }
+          }
         }
         // 8. Mark status + commit (M5: use 'partial' if warnings)
@@ -666,7 +1165,13 @@ function createAquifer(config = {}) {
     // --- read path ---
     async recall(query, opts = {}) {
-      if (!query) return [];
+      // Contract (aligned across core / manifest / consumer tools): query must
+      // be a non-empty string. Empty strings previously short-circuited to []
+      // silently — that masks caller bugs. Callers wanting "recent sessions"
+      // should use a dedicated API, not pass empty to recall().
+      if (typeof query !== 'string' || query.trim().length === 0) {
+        throw new Error('aquifer.recall(query): query must be a non-empty string');
+      }
       const VALID_MODES = ['fts', 'hybrid', 'vector'];
       const mode = opts.mode !== undefined ? opts.mode : 'hybrid';
@@ -718,8 +1223,12 @@ function createAquifer(config = {}) {
       await ensureMigrated();
-      const rerankEnabled = !!reranker && opts.rerank !== false;
-      const rerankTopK = rerankEnabled ? Math.max(limit, opts.rerankTopK || defaultRerankTopK) : limit;
+      // rerank gating: provider must be configured + caller didn't disable.
+      // Whether to actually invoke is decided after hybridRank, since the
+      // shortlist is needed for the auto-trigger heuristics.
+      const rerankProviderReady = !!reranker && opts.rerank !== false;
+      const rerankForced = opts.rerank === true;
+      const rerankTopK = rerankProviderReady ? Math.max(limit, opts.rerankTopK || defaultRerankTopK) : limit;
       const fetchLimit = rerankTopK * 4;
       // 1. Embed query (only needed for hybrid/vector modes)
@@ -763,14 +1272,24 @@ function createAquifer(config = {}) {
             entityScoreBySession.set(row.session_id, 1.0);
           }
         } else {
-          // 'any' mode with explicit entities: use resolved IDs for boost
+          // 'any' mode with explicit entities: use resolved IDs for boost.
+          // Filter by tenant_id + agentIds to prevent cross-tenant / cross-agent
+          // boost pollution (session_id is caller-supplied and not globally unique).
+          const esParams = [entityIds, tenantId];
+          let esAgentClause = '';
+          if (resolvedAgentIds && resolvedAgentIds.length > 0) {
+            esParams.push(resolvedAgentIds);
+            esAgentClause = `AND s.agent_id = ANY($${esParams.length})`;
+          }
           const esResult = await pool.query(
             `SELECT es.session_row_id, s.session_id, COUNT(*) AS entity_count
             FROM ${qi(schema)}.entity_sessions es
             JOIN ${qi(schema)}.sessions s ON s.id = es.session_row_id
             WHERE es.entity_id = ANY($1)
+              AND s.tenant_id = $2
+              ${esAgentClause}
             GROUP BY es.session_row_id, s.session_id`,
-            [entityIds]
+            esParams
           );
           const maxCount = Math.max(1, ...esResult.rows.map(r => parseInt(r.entity_count)));
@@ -787,13 +1306,21 @@ function createAquifer(config = {}) {
           if (matchedEntities.length > 0) {
             const entityIds = matchedEntities.map(e => e.id);
+            const esParams = [entityIds, tenantId];
+            let esAgentClause = '';
+            if (resolvedAgentIds && resolvedAgentIds.length > 0) {
+              esParams.push(resolvedAgentIds);
+              esAgentClause = `AND s.agent_id = ANY($${esParams.length})`;
+            }
             const esResult = await pool.query(
               `SELECT es.session_row_id, s.session_id, COUNT(*) AS entity_count
               FROM ${qi(schema)}.entity_sessions es
               JOIN ${qi(schema)}.sessions s ON s.id = es.session_row_id
               WHERE es.entity_id = ANY($1)
+                AND s.tenant_id = $2
+                ${esAgentClause}
               GROUP BY es.session_row_id, s.session_id`,
-              [entityIds]
+              esParams
             );
             const maxCount = Math.max(1, ...esResult.rows.map(r => parseInt(r.entity_count)));
@@ -808,23 +1335,25 @@ function createAquifer(config = {}) {
       const runFts = mode === 'fts' || mode === 'hybrid';
       const runVector = mode === 'vector' || mode === 'hybrid';
-      const [ftsRows, embRows, turnResult] = await Promise.all([
+      const [ftsRows, embResult, turnResult] = await Promise.all([
         runFts
           ? storage.searchSessions(pool, query, {
               schema, tenantId, agentIds: resolvedAgentIds, source, dateFrom, dateTo, limit: fetchLimit,
+              ftsConfig,
             }).catch((err) => {
               recordSearchError('fts', err);
               return [];
             })
           : Promise.resolve([]),
         runVector
-          ? embeddingSearchSummaries(queryVec, {
+          ? storage.searchSummaryEmbeddings(pool, {
+              schema, tenantId, queryVec,
               agentIds: resolvedAgentIds, source, dateFrom, dateTo, limit: fetchLimit,
             }).catch((err) => {
               recordSearchError('summary-vector', err);
-              return [];
+              return { rows: [] };
             })
-          : Promise.resolve([]),
+          : Promise.resolve({ rows: [] }),
         runVector
           ? storage.searchTurnEmbeddings(pool, {
               schema, tenantId, queryVec, dateFrom, dateTo, agentIds: resolvedAgentIds, source, limit: fetchLimit,
@@ -835,6 +1364,7 @@ function createAquifer(config = {}) {
           : Promise.resolve({ rows: [] }),
       ]);
+      const embRows = embResult.rows || [];
       const turnRows = turnResult.rows || [];
       // 3b. Apply candidate filter (entityMode 'all')
@@ -902,9 +1432,35 @@ function createAquifer(config = {}) {
         },
       );
-      // 6b. Rerank (optional)
+      // 6b. Rerank (optional, with auto-trigger gate)
       let finalRanked = ranked;
-      if (rerankEnabled && ranked.length > 1) {
+      let rerankDecision = { apply: false, reason: 'provider_not_ready' };
+      if (rerankProviderReady && ranked.length > 1) {
+        if (rerankForced) {
+          rerankDecision = { apply: true, reason: 'forced' };
+        } else {
+          // hasEntities = either caller passed entities explicitly OR the
+          // query-derived path found matching entities (non-empty boost map).
+          // shouldAutoRerank names the condition "entities present"; honour both.
+          rerankDecision = shouldAutoRerank({
+            query,
+            mode,
+            ranked,
+            hasEntities: (explicitEntities && explicitEntities.length > 0)
+              || entityScoreBySession.size > 0,
+            autoTrigger,
+          });
+        }
+      } else if (!rerankProviderReady) {
+        rerankDecision = {
+          apply: false,
+          reason: !reranker ? 'no_provider_configured' : 'caller_disabled',
+        };
+      } else {
+        rerankDecision = { apply: false, reason: 'shortlist_too_short' };
+      }
+      if (rerankDecision.apply) {
         try {
           const docs = ranked.map(r => buildRerankDocument(r, rerankMaxChars));
           const rerankResult = await reranker.rerank(query, docs, { topN: ranked.length });
@@ -914,6 +1470,7 @@ function createAquifer(config = {}) {
             ...r,
             _hybridScore: r._score,
             _rerankScore: scoreMap.has(i) ? scoreMap.get(i) : null,
+            _rerankReason: rerankDecision.reason,
           }));
           finalRanked.sort((a, b) => {
@@ -926,10 +1483,15 @@ function createAquifer(config = {}) {
         } catch (rerankErr) {
           // Fallback: use original hybrid-rank order, flag in debug
           if (process.env.AQUIFER_DEBUG) console.error('[aquifer] rerank error:', rerankErr.message);
-          finalRanked = ranked.slice(0, limit).map(r => ({ ...r, _rerankFallback: true }));
+          finalRanked = ranked.slice(0, limit).map(r => ({
+            ...r,
+            _rerankFallback: true,
+            _rerankReason: rerankDecision.reason,
+            _rerankErrorMessage: rerankErr.message,
+          }));
         }
       } else {
-        finalRanked = ranked.slice(0, limit);
+        finalRanked = ranked.slice(0, limit).map(r => ({ ...r, _rerankReason: rerankDecision.reason }));
       }
       // 7. Record access
@@ -966,6 +1528,9 @@ function createAquifer(config = {}) {
           hybridScore: r._hybridScore ?? r._score,
           rerankScore: r._rerankScore ?? null,
           rerankFallback: r._rerankFallback || false,
+          rerankApplied: rerankDecision.apply,
+          rerankReason: r._rerankReason || rerankDecision.reason,
+          rerankErrorMessage: r._rerankErrorMessage || null,
           searchErrors: searchErrors.slice(),
         },
       }));
@@ -1233,6 +1798,47 @@ function createAquifer(config = {}) {
     },
   };
+  // Completion-capability surfaces (P2). All methods return AqResult envelope;
+  // DDL materialised in schema/004-completion.sql (migrated unconditionally,
+  // additive only). See core/errors.js for envelope shape.
+  const { createNarratives } = require('./narratives');
+  const { createTimeline } = require('./timeline');
+  const { createState } = require('./state');
+  const { createHandoff } = require('./handoff');
+  const { createProfiles } = require('./profiles');
+  const { createDecisions } = require('./decisions');
+  const { createArtifacts } = require('./artifacts');
+  const { createConsolidation } = require('./consolidation');
+  const { createBundles } = require('./bundles');
+  const { createEntityState } = require('./entity-state');
+  const { createInsights } = require('./insights');
+  const qSchema = qi(schema);
+  aquifer.narratives = createNarratives({ pool, schema: qSchema, defaultTenantId: tenantId });
+  aquifer.timeline = createTimeline({ pool, schema: qSchema, defaultTenantId: tenantId });
+  aquifer.state = createState({ pool, schema: qSchema, defaultTenantId: tenantId });
+  aquifer.handoff = createHandoff({ pool, schema: qSchema, defaultTenantId: tenantId });
+  aquifer.profiles = createProfiles({ pool, schema: qSchema, defaultTenantId: tenantId });
+  aquifer.decisions = createDecisions({ pool, schema: qSchema, defaultTenantId: tenantId });
+  aquifer.artifacts = createArtifacts({ pool, schema: qSchema, defaultTenantId: tenantId });
+  aquifer.consolidation = createConsolidation({ pool, schema: qSchema, defaultTenantId: tenantId });
+  aquifer.bundles = createBundles({ pool, schema: qSchema, defaultTenantId: tenantId });
+  // entityState materialises in schema/005-entity-state-history.sql, gated on
+  // entitiesEnabled (it FK-references entities). Drop-clean — see
+  // scripts/drop-entity-state-history.sql.
+  aquifer.entityState = createEntityState({ pool, schema: qSchema, defaultTenantId: tenantId });
+  // insights materialises in schema/006-insights.sql. No FK from elsewhere
+  // into this table; DROP CASCADE is clean. See scripts/drop-insights.sql.
+  // Recall ranking weights configurable via config.insights.recallWeights.
+  aquifer.insights = createInsights({
+    pool,
+    schema: qSchema,
+    defaultTenantId: tenantId,
+    embedFn,
+    recallWeights: (config.insights && config.insights.recallWeights) || null,
+    recencyWindowDays: config.insights && Number.isFinite(config.insights.recencyWindowDays)
+      ? config.insights.recencyWindowDays : undefined,
+  });
   return aquifer;
 }
@@ -1291,4 +1897,4 @@ function formatBootstrapText(data, maxChars) {
 // Exports
 // ---------------------------------------------------------------------------
-module.exports = { createAquifer, formatBootstrapText };
+module.exports = { createAquifer, formatBootstrapText, shouldAutoRerank };