npm - claude-mem-lite - Versions diffs - 3.7.0 → 3.8.0 - Mend

claude-mem-lite 3.7.0 → 3.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18)

package/.claude-plugin/marketplace.json +1 -1
package/.claude-plugin/plugin.json +1 -1
package/README.md +3 -1
package/README.zh-CN.md +1 -1
package/hook-update.mjs +102 -2
package/hook.mjs +403 -373
package/install.mjs +666 -629
package/lib/doctor-benchmark.mjs +4 -4
package/lib/release-digest.mjs +106 -0
package/lib/search-core.mjs +272 -16
package/mem-cli.mjs +55 -174
package/package.json +3 -2
package/schema.mjs +7 -1
package/scripts/setup.sh +2 -0
package/search-engine.mjs +1 -1
package/{server-internals.mjs → search-scoring.mjs} +6 -2
package/server.mjs +72 -293
package/source-files.mjs +5 -1

package/mem-cli.mjs CHANGED Viewed

@@ -8,8 +8,8 @@ import { truncate, typeIcon, inferProject, scrubSecrets } from './utils.mjs';
 import { resolveProject } from './project-utils.mjs';
 import { TIER_CASE_SQL, tierSqlParams } from './tier.mjs';
 import { _resetVocabCache } from './tfidf.mjs';
-import { autoBoostIfNeeded, reRankWithContext, markSuperseded } from './server-internals.mjs';
-import { searchObservationsHybrid, countSearchTotal, attachBodyTokens } from './search-engine.mjs';
+import { autoBoostIfNeeded, reRankWithContext, markSuperseded } from './search-scoring.mjs';
+import { searchObservationsHybrid } from './search-engine.mjs';
 import { deepSearch, resolveDeepMode, shouldEscalateToDeep, autoDeepLlmReady } from './deep-search.mjs';
 import { ensureRegistryDb, upsertResource } from './registry.mjs';
 import { searchResources } from './registry-retriever.mjs';
@@ -37,7 +37,7 @@ import { saveObservation } from './lib/save-observation.mjs';
 import { rebuildObservationDerived } from './lib/observation-write.mjs';
 import { recallByFile } from './lib/recall-core.mjs';
 import { resolveAnchorToken, formatAnchorError, resolveQueryAnchor, fetchRecentTimeline, fetchTimelineWindow } from './lib/timeline-core.mjs';
-import { buildSearchFtsQuery, parseDateBounds, computePerSourceWindow, effectiveObsFtsQuery, searchSessionsFts, searchPromptsFts, normalizeCrossSourceScores, applyUserSort, applyTierFilter } from './lib/search-core.mjs';
+import { buildSearchFtsQuery, parseDateBounds, coreRunSearchPipeline } from './lib/search-core.mjs';
 import { AUTO_MERGE_THRESHOLD } from './lib/dedup-constants.mjs';
 import { countRecentHookErrors } from './lib/hook-telemetry.mjs';
 import { computeCitationFunnelTrend } from './lib/citation-tracker.mjs';
@@ -156,116 +156,51 @@ async function cmdSearch(db, args, { llm } = {}) {
     ? 'observations'
     : (source || ((type || tier || minImportance || branch) ? 'observations' : null));
-  // Cross-source mode: each source needs more candidates than the final limit
-  // so the post-merge sort has room to pick the best from each (shared sizing
-  // with mem_search — without this, obs gets systematically squeezed out by
-  // sessions). Over-fetch from offset 0; --offset applies ONCE at the final
-  // slice below (see computePerSourceWindow for the #8217/#8638 rationale).
-  const isCrossSourceMode = !effectiveSource;
-  const { perSourceLimit, perSourceOffset } = computePerSourceWindow(limit, offset);
-  const results = [];
-  // Tracks whether AND returned 0 and OR recovered non-empty. Mirrors server.mjs
-  // ctx.orFallbackFired so the header can surface a "(relaxed AND→OR)" hint.
-  let orFallbackFired = false;
-  let deepVariants = null;
-  let isReranked = false;
-  let isDeep = deepMode === 'deep';
-  // Search observations — shared engine with server.mjs (#8198/#8212 paired-path fix)
-  if (!effectiveSource || effectiveSource === 'observations') {
-    const obsCtx = {
-      ftsQuery,
-      args: {
-        project: project || null,
-        obs_type: type || null,
-        importance: minImportance || null,
-        branch: branch || null,
-        include_noise: includeNoise,
-      },
-      epochFrom: dateFrom,
-      epochTo: dateTo,
-      perSourceLimit,
-      perSourceOffset,
-      currentProject: project ? null : inferProject(),
-      limit,
-      orFallbackFired: false,
-    };
-    const runDeep = async ({ auto = false } = {}) => {
-      const ds = await deepSearch(db, {
-        query,
-        project: project || null,
-        type: type || null,
-        importance: minImportance || null,
-        branch: branch || null,
-        includeNoise,
-        epochFrom: dateFrom,
-        epochTo: dateTo,
-        limit: perSourceLimit,
-        currentProject: project ? null : inferProject(),
-      }, llm ? { llm, rerank: rerank && !auto } : { auto, rerank: rerank && !auto });
-      deepVariants = ds.variants;
-      isReranked = ds.reranked;
-      if (deepVariants.length > 1) {
-        process.stderr.write(`[mem] Deep search: rewrote into ${deepVariants.length} query variants, RRF-fused\n`);
-      } else {
-        process.stderr.write('[mem] Deep search: rewrite returned no usable variants; used original query only\n');
-      }
-      if (rerank && !auto) {
-        process.stderr.write(ds.reranked
-          ? '[mem] Deep search: LLM-reranked the fused top-20\n'
-          : '[mem] Deep search: rerank produced no usable order; kept fused order\n');
-      }
-      return ds.results;
-    };
-    let obsResults;
-    if (deepMode === 'deep') {
-      obsResults = await runDeep();
-    } else {
-      obsResults = searchObservationsHybrid(db, obsCtx);
-      if (obsCtx.orFallbackFired) orFallbackFired = true;
-      if (deepMode === 'auto' && autoDeepLlmReady(process.env, llm) && shouldEscalateToDeep(obsResults, obsCtx, { db, project: project || null })) {
-        process.stderr.write(`[mem] auto-escalated to deep search (weak results: ${obsResults.length} hits)\n`);
-        obsResults = await runDeep({ auto: true });
-        isDeep = true;
-      }
-    }
-    for (const r of obsResults) results.push({ ...r, _source: 'obs', score: r.score ?? 0 });
-    // Tier post-filter — applied to ALL obs results from the engine.
-    if (tier) {
-      const filtered = applyTierFilter(db, results, { tier, sourceKey: '_source', currentProject: project || inferProject() });
-      results.length = 0;
-      results.push(...filtered);
-    }
-  }
-  // Search sessions (shared engine with MCP mem_search — lib/search-core.mjs)
-  if ((!effectiveSource || effectiveSource === 'sessions') && !isDeep) {
-    try {
-      const sessRows = searchSessionsFts(db, {
-        ftsQuery, project, projectBoost: project ? null : inferProject(),
-        epochFrom: dateFrom, epochTo: dateTo, perSourceLimit, perSourceOffset,
-      });
-      for (const r of sessRows) results.push({ ...r, _source: 'session' });
-    } catch { /* session FTS may not exist in older DBs */ }
-  }
-  // Search prompts (shared engine incl. CJK precision gate + LIKE fallback)
-  if ((!effectiveSource || effectiveSource === 'prompts') && !isDeep) {
-    try {
-      const promptRows = searchPromptsFts(db, {
-        query, ftsQuery, project,
-        epochFrom: dateFrom, epochTo: dateTo, perSourceLimit, perSourceOffset,
-      });
-      for (const r of promptRows) results.push({ ...r, _source: 'prompt' });
-    } catch { /* prompt FTS may not exist in older DBs */ }
-  }
-  if (results.length === 0) {
+  const res = await coreRunSearchPipeline(
+    {
+      db, currentProject: project ? null : inferProject(), env: process.env,
+      searchObservationsHybrid, deepSearch, shouldEscalateToDeep, autoDeepLlmReady,
+      reRankWithContext, markSuperseded, llm,
+    },
+    {
+      query, ftsQuery, effectiveSource, deepMode, rerank,
+      limit, offset, project: project || null, obsType: type, importance: minImportance,
+      branch, includeNoise, epochFrom: dateFrom, epochTo: dateTo, sort, tier,
+      // ── CLI surface policy ──
+      obsTypeFallback: false,            // #8217 removed list-by-type fallback from the CLI
+      crossSourceEpochSortNoFts: false,  // CLI never reaches cross-source with empty ftsQuery (fails earlier)
+      rerankPolicy: 'cli',               // re-rank/supersede on any obs; re-sort gated on cross-source
+      rerankProject: project || inferProject(),
+      recentListingNoFts: false,
+      tolerateMissingFts: true,          // pre-FTS legacy DBs: swallow session/prompt FTS errors
+      tierPosition: 'early',             // tier filter inside the obs block (before sessions/prompts)
+      tierProject: project || inferProject(),
+    }
+  );
+  const isDeep = res.isDeep;
+  const orFallbackFired = res.orFallbackFired;
+  const deepVariants = res.variants;
+  const paged = res.page;
+  const total = res.total;
+  // Deep / escalation observability on stderr — reconstructed from core signals.
+  // The CLI emitted these inline in runDeep; same strings, same order (escalation →
+  // variants → rerank). rerank is only ever true on explicit --deep (never auto).
+  if (res.escalated) process.stderr.write(`[mem] auto-escalated to deep search (weak results: ${res.escalatedObsCount} hits)\n`);
+  if (isDeep && deepVariants) {
+    process.stderr.write(deepVariants.length > 1
+      ? `[mem] Deep search: rewrote into ${deepVariants.length} query variants, RRF-fused\n`
+      : '[mem] Deep search: rewrite returned no usable variants; used original query only\n');
+  }
+  if (rerank) {
+    process.stderr.write(res.reranked
+      ? '[mem] Deep search: LLM-reranked the fused top-20\n'
+      : '[mem] Deep search: rerank produced no usable order; kept fused order\n');
+  }
+  // "nothing matched" (no offset) vs "this page is empty" (with offset) — the two
+  // CLI messages. preFinalizeCount is the pre-pagination population (post-tier).
+  if (res.preFinalizeCount === 0) {
     if (jsonOutput) {
       out(JSON.stringify({ query, total: 0, returned: 0, offset, limit, deep: isDeep, variants: isDeep ? deepVariants : undefined, results: [] }));
     } else {
@@ -274,60 +209,6 @@ async function cmdSearch(db, args, { llm } = {}) {
     return;
   }
-  // Cross-source score normalization (shared with mem_search).
-  // ftsQuery gate prevents normalization when scores are all 0 (no-FTS path).
-  const isCrossSource = isCrossSourceMode;
-  if (isCrossSource && results.length > 0 && ftsQuery) {
-    normalizeCrossSourceScores(results, '_source');
-    results.sort((a, b) => (a.score ?? 0) - (b.score ?? 0));
-  }
-  // Context re-ranking + superseded marking (aligned with MCP mem_search)
-  const obsResults = results.filter(r => r._source === 'obs');
-  if (obsResults.length > 0) {
-    // reRankWithContext/markSuperseded expect source='obs' — alias _source for compatibility
-    for (const r of obsResults) r.source = 'obs';
-    // Explicit LLM rerank order is final — skip file-context re-rank when reranked
-    // (paired-path with mem_search; markSuperseded still runs for stale-tagging).
-    if (!isReranked) reRankWithContext(db, obsResults, project || inferProject());
-    markSuperseded(obsResults);
-    if (isCrossSource) results.sort((a, b) => (a.score ?? 0) - (b.score ?? 0));
-  }
-  // Apply user-requested sort (after relevance scoring; shared with mem_search)
-  applyUserSort(results, sort);
-  // Trim to limit with offset. The engine always received perSourceOffset=0 and
-  // over-fetched (see above), so the merged+reranked `results` start at row 0 and
-  // the offset is applied exactly ONCE here — for every mode.
-  //
-  // `total` must be the TRUE population, independent of --limit/--offset (else the
-  // over-fetched candidate count grew with the page and broke the "N of M" /
-  // pagination contract). countSearchTotal mirrors each source's MATCH+filters;
-  // clamp to >= results.length so it never understates the rows actually shown
-  // (vector/concept augmentation can add obs rows beyond the FTS count).
-  // For --deep the population is the fused variant result set: deepSearch already
-  // returned all fused rows (capped at perSourceLimit) and they are the only rows
-  // in `results` (deep is obs-only). countSearchTotal would instead count the
-  // ORIGINAL query's FTS matches — wrong, and ~0 on the vocabulary-mismatch
-  // queries deep exists for, which falsely shrinks the "N of M" total (F1).
-  const total = isDeep
-    ? results.length
-    : Math.max(countSearchTotal(db, {
-      effectiveSource,
-      ftsQuery,
-      obsFtsQuery: effectiveObsFtsQuery(ftsQuery, orFallbackFired),
-      args: { project: project || null, obs_type: type || null, importance: minImportance || null, branch: branch || null },
-      project: project || null,
-      epochFrom: dateFrom,
-      epochTo: dateTo,
-      includeNoise,
-    }), results.length);
-  const paged = results.slice(offset, offset + limit);
-  // Enrich the final page with the ~Nt fetch-cost hint (paired with MCP mem_search; #8654 both
-  // source keys handled). Batch-fetches heavy obs fields by id — no-op on an empty page.
-  attachBodyTokens(db, paged);
   if (paged.length === 0) {
     if (jsonOutput) {
       out(JSON.stringify({ query, total, returned: 0, offset, limit, deep: isDeep, variants: isDeep ? deepVariants : undefined, results: [] }));
@@ -337,24 +218,24 @@ async function cmdSearch(db, args, { llm } = {}) {
     return;
   }
-  // paired-path with server.mjs formatSearchOutput (#8198): "N of M" total when paged < total.
+  // "N of M" total when paged < total (paired-path with server.mjs formatSearchOutput, #8198).
   const showTime = sort === 'time';
-  const hasMixed = paged.some(r => r._source === 'session' || r._source === 'prompt');
+  const hasMixed = paged.some(r => r.source === 'session' || r.source === 'prompt');
   // Suppressed when --or was explicit — user already asked for OR, no "fallback" there.
   const fallbackHint = orFallbackFired && !useOr ? ' (relaxed AND→OR)' : '';
   if (jsonOutput) {
     const items = paged.map(r => {
       const base = {
-        source: r._source,
+        source: r.source,
         id: r.id,
         created_at: r.created_at,
         score: r.score ?? null,
       };
-      if (r._source === 'session') {
+      if (r.source === 'session') {
         return { ...base, request: r.request || null, completed: r.completed || null, project: r.project || null };
       }
-      if (r._source === 'prompt') {
+      if (r.source === 'prompt') {
         return { ...base, prompt_text: r.prompt_text || null };
       }
       return {
@@ -392,10 +273,10 @@ async function cmdSearch(db, args, { llm } = {}) {
   const tok = r => (r.bodyTokens ? ` ~${r.bodyTokens}t` : '');
   for (const r of paged) {
     const timeStr = showTime && r.created_at_epoch ? ` (${relativeTime(r.created_at_epoch)})` : '';
-    if (r._source === 'session') {
+    if (r.source === 'session') {
       const date = fmtDateShort(r.created_at);
       out(`S#${r.id} 📋 ${date}${timeStr} ${truncate(r.request || r.completed || '(no summary)', 80)}${tok(r)}`);
-    } else if (r._source === 'prompt') {
+    } else if (r.source === 'prompt') {
       const date = fmtDateShort(r.created_at);
       out(`P#${r.id} 💬 ${date}${timeStr} ${truncate(r.prompt_text || '(empty)', 80)}${tok(r)}`);
     } else {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "claude-mem-lite",
-  "version": "3.7.0",
+  "version": "3.8.0",
   "description": "Persistent long-term memory for Claude Code via MCP — captures coding decisions, bugfixes, and context across sessions. Hybrid FTS5 + TF-IDF search with episode batching. Single SQLite DB, no external services. A lighter, lower-cost alternative to claude-mem (episode batching + a smaller model; cost savings are an internal estimate, not a measured benchmark).",
   "type": "module",
   "packageManager": "npm@10.9.2",
@@ -28,7 +28,7 @@
     "cli-path.mjs",
     "mem-cli.mjs",
     "server.mjs",
-    "server-internals.mjs",
+    "search-scoring.mjs",
     "search-engine.mjs",
     "deep-search.mjs",
     "rerank.mjs",
@@ -73,6 +73,7 @@
     "lib/binding-probe.mjs",
     "lib/proc-lock.mjs",
     "lib/atomic-write.mjs",
+    "lib/release-digest.mjs",
     "lib/mem-override.mjs",
     "lib/save-observation.mjs",
     "lib/observation-write.mjs",

package/schema.mjs CHANGED Viewed

@@ -894,7 +894,13 @@ export function ensureDb() {
   db.pragma('foreign_keys = OFF'); // Enabled after dedup migration
   try {
-    return initSchema(db);
+    const ready = initSchema(db);
+    // P1-5: sentinel-gated data cleanups must run on EVERY open (schema.mjs:766).
+    // They were extracted out of initSchema into runDeferredCleanups but never
+    // wired into a production opener — without this call they ran nowhere but
+    // tests, silently halting orphan/normalize hygiene. Best-effort: never throws.
+    runDeferredCleanups(ready);
+    return ready;
   } catch (e) {
     try { db.close(); } catch {}
     throw e;

package/scripts/setup.sh CHANGED Viewed

@@ -86,6 +86,7 @@ mark_deps_broken() {
   # having to re-derive them. Delegate JSON serialization to node so embedded
   # quotes / shell metachars in $ROOT or $reason can't produce an invalid file
   # (bash `printf '"..%s.."'` cannot escape arbitrary strings safely; v2.79.1 fix).
+  # shellcheck disable=SC2016  # node script single-quoted on purpose; vars passed via env (MARK_*), not shell expansion
   MARK_REASON="$reason" MARK_ROOT="$ROOT" MARK_FLAG="$DEPS_FLAG" node -e '
     const fs = require("fs");
     const reason = process.env.MARK_REASON || "unknown";
@@ -141,6 +142,7 @@ fi
 #    versions; same shape as the .deps-broken self-heal pattern.
 MCP_MIGRATION="$DATA_DIR/runtime/.mcp-dedup-v2.78"
 if [[ -n "${CLAUDE_PLUGIN_ROOT:-}" && ! -f "$MCP_MIGRATION" ]]; then
+  # shellcheck disable=SC2016  # node script single-quoted on purpose; CLAUDE_JSON passed via env, not shell expansion
   CLAUDE_JSON="$HOME/.claude.json" node -e '
     const fs = require("fs");
     let changed = false;

package/search-engine.mjs CHANGED Viewed

@@ -12,7 +12,7 @@ import {
   relaxFtsQueryToOr, debugLog, debugCatch, estimateTokens,
 } from './utils.mjs';
 import { getVocabulary, computeVector, vectorSearch, rrfMerge } from './tfidf.mjs';
-import { extractPRFTerms, expandQueryByConcepts } from './server-internals.mjs';
+import { extractPRFTerms, expandQueryByConcepts } from './search-scoring.mjs';
 // Scoring expressions — full adds project boost + access bonus; simple is for
 // expansion paths where boost would over-amplify already-loose matches.

package/{server-internals.mjs → search-scoring.mjs} RENAMED Viewed

@@ -1,5 +1,9 @@
-// claude-mem-lite server internal functions
-// Extracted from server.mjs for testability (server.mjs has top-level side effects)
+// claude-mem-lite shared search-scoring / ranking helpers: re-ranking, supersede
+// marking, PRF term extraction, concept-expansion — plus the MCP instructions
+// builder and idle-cleanup/access-boost side helpers. Used by the MCP server,
+// the CLI (mem-cli), and search-engine; originally extracted from server.mjs for
+// testability (server.mjs has top-level side effects), hence the former
+// "server-internals" name — renamed in audit P3 since it is not server-only.
 import { debugCatch, COMPRESSED_AUTO, COMPRESSED_PENDING_PURGE, OBS_BM25 } from './utils.mjs';
 import { BASE_STOP_WORDS } from './stop-words.mjs';