claude-mem-lite 2.3.1 → 2.3.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/server.mjs CHANGED
@@ -4,12 +4,15 @@
4
4
 
5
5
  import { McpServer } from '@modelcontextprotocol/sdk/server/mcp.js';
6
6
  import { StdioServerTransport } from '@modelcontextprotocol/sdk/server/stdio.js';
7
- import { jaccardSimilarity, truncate, typeIcon, sanitizeFtsQuery, relaxFtsQueryToOr, inferProject, computeMinHash, scrubSecrets, fmtDate, isoWeekKey, debugLog, debugCatch } from './utils.mjs';
8
- import { ensureDb, DB_PATH, DB_DIR } from './schema.mjs';
7
+ import { jaccardSimilarity, truncate, typeIcon, sanitizeFtsQuery, relaxFtsQueryToOr, inferProject, computeMinHash, estimateJaccardFromMinHash, scrubSecrets, fmtDate, isoWeekKey, debugLog, debugCatch, COMPRESSED_AUTO, COMPRESSED_PENDING_PURGE } from './utils.mjs';
8
+ import { ensureDb, DB_PATH, REGISTRY_DB_PATH } from './schema.mjs';
9
9
  import { reRankWithContext, markSuperseded, extractPRFTerms, expandQueryByConcepts } from './server-internals.mjs';
10
10
  import { memSearchSchema, memTimelineSchema, memGetSchema, memDeleteSchema, memSaveSchema, memStatsSchema, memCompressSchema, memMaintainSchema, memRegistrySchema } from './tool-schemas.mjs';
11
11
  import { ensureRegistryDb, upsertResource } from './registry.mjs';
12
- import { join } from 'path';
12
+ import { createRequire } from 'module';
13
+
14
+ const require = createRequire(import.meta.url);
15
+ const { version: PKG_VERSION } = require('./package.json');
13
16
 
14
17
  // ─── Database ───────────────────────────────────────────────────────────────
15
18
 
@@ -38,7 +41,6 @@ db.pragma('busy_timeout = 5000');
38
41
 
39
42
  // ─── Registry Database (lazy-loaded on first mem_registry call) ─────────────
40
43
 
41
- const REGISTRY_DB_PATH = join(DB_DIR, 'resource-registry.db');
42
44
  let registryDb = null;
43
45
 
44
46
  function getRegistryDb() {
@@ -79,7 +81,7 @@ const RECENCY_HALF_LIFE_MS = 1209600000; // 14 days in milliseconds
79
81
  // ─── MCP Server ─────────────────────────────────────────────────────────────
80
82
 
81
83
  const server = new McpServer(
82
- { name: 'claude-mem-lite', version: '2.2.2' },
84
+ { name: 'claude-mem-lite', version: PKG_VERSION },
83
85
  {
84
86
  instructions: [
85
87
  'Proactively search memory to leverage past experience. This is your long-term memory across sessions.',
@@ -119,6 +121,69 @@ function safeHandler(fn) {
119
121
 
120
122
  // ─── Tool: mem_search — helper functions ────────────────────────────────────
121
123
 
124
+ // Score expression variants for FTS5 queries (see Scoring Model Constants above)
125
+ const FULL_SCORE = `${OBS_BM25}
126
+ * (1.0 + EXP(-0.693 * (? - o.created_at_epoch) / ${RECENCY_HALF_LIFE_MS}.0))
127
+ * (CASE WHEN ? IS NOT NULL AND o.project = ? THEN 2.0 ELSE 1.0 END)
128
+ * (0.5 + 0.5 * COALESCE(o.importance, 1))
129
+ * (1.0 + 0.1 * LN(1 + COALESCE(o.access_count, 0)))`;
130
+
131
+ const SIMPLE_SCORE = `${OBS_BM25}
132
+ * (1.0 + EXP(-0.693 * (? - o.created_at_epoch) / ${RECENCY_HALF_LIFE_MS}.0))
133
+ * (0.5 + 0.5 * COALESCE(o.importance, 1))`;
134
+
135
+ /**
136
+ * Build an FTS5 observation search query.
137
+ * @param {'full'|'simple'} scoring - full includes project boost + access bonus
138
+ * @param {object} opts - { multiplier, withSnippet, withOffset }
139
+ */
140
+ function buildObsFtsQuery(scoring, { multiplier, withSnippet, withOffset } = {}) {
141
+ const scoreExpr = scoring === 'full' ? FULL_SCORE : SIMPLE_SCORE;
142
+ const mult = multiplier ? ` * ${multiplier}` : '';
143
+ return `
144
+ SELECT o.id, o.type, o.title, o.subtitle, o.project, o.created_at, o.importance,
145
+ o.files_modified,
146
+ ${withSnippet ? "snippet(observations_fts, 2, '»', '«', '…', 10) as match_snippet," : ''}
147
+ ${scoreExpr}${mult} as score
148
+ FROM observations_fts
149
+ JOIN observations o ON observations_fts.rowid = o.id
150
+ WHERE observations_fts MATCH ?
151
+ AND COALESCE(o.compressed_into, 0) = 0
152
+ AND (? IS NULL OR o.project = ?)
153
+ AND (? IS NULL OR o.type = ?)
154
+ AND (? IS NULL OR o.created_at_epoch >= ?)
155
+ AND (? IS NULL OR o.created_at_epoch <= ?)
156
+ AND (? IS NULL OR COALESCE(o.importance, 1) >= ?)
157
+ ORDER BY score
158
+ LIMIT ?${withOffset ? ' OFFSET ?' : ''}`;
159
+ }
160
+
161
+ /** Build params array for an FTS5 observation query. */
162
+ function buildObsFtsParams({ now, projectBoost, ftsQuery, args, epochFrom, epochTo, limit, offset }) {
163
+ const params = [now];
164
+ if (projectBoost !== undefined) params.push(projectBoost, projectBoost); // full scoring only
165
+ params.push(
166
+ ftsQuery,
167
+ args.project ?? null, args.project ?? null,
168
+ args.obs_type ?? null, args.obs_type ?? null,
169
+ epochFrom, epochFrom,
170
+ epochTo, epochTo,
171
+ args.importance ?? null, args.importance ?? null,
172
+ limit,
173
+ );
174
+ if (offset !== undefined) params.push(offset);
175
+ return params;
176
+ }
177
+
178
+ /** Map a raw FTS5 row to a result object. */
179
+ function ftsRowToResult(r, { scoreMultiplier, snippet } = {}) {
180
+ return {
181
+ source: 'obs', id: r.id, type: r.type, title: r.title, subtitle: r.subtitle,
182
+ project: r.project, date: r.created_at, score: scoreMultiplier ? r.score * scoreMultiplier : r.score,
183
+ files_modified: r.files_modified, importance: r.importance, snippet: snippet ? (r.match_snippet || '') : '',
184
+ };
185
+ }
186
+
122
187
  function searchObservations(ctx) {
123
188
  const { ftsQuery, args, epochFrom, epochTo, perSourceLimit, perSourceOffset, currentProject, limit } = ctx;
124
189
  const results = [];
@@ -126,81 +191,19 @@ function searchObservations(ctx) {
126
191
  if (ftsQuery) {
127
192
  const now = Date.now();
128
193
  const projectBoost = args.project ? null : currentProject;
129
- const rows = db.prepare(`
130
- SELECT o.id, o.type, o.title, o.subtitle, o.project, o.created_at, o.importance,
131
- o.files_modified,
132
- snippet(observations_fts, 2, '»', '«', '…', 10) as match_snippet,
133
- ${OBS_BM25}
134
- * (1.0 + EXP(-0.693 * (? - o.created_at_epoch) / ${RECENCY_HALF_LIFE_MS}.0))
135
- * (CASE WHEN ? IS NOT NULL AND o.project = ? THEN 2.0 ELSE 1.0 END)
136
- * (0.5 + 0.5 * COALESCE(o.importance, 1))
137
- * (1.0 + 0.1 * LN(1 + COALESCE(o.access_count, 0))) as score
138
- FROM observations_fts
139
- JOIN observations o ON observations_fts.rowid = o.id
140
- WHERE observations_fts MATCH ?
141
- AND COALESCE(o.compressed_into, 0) = 0
142
- AND (? IS NULL OR o.project = ?)
143
- AND (? IS NULL OR o.type = ?)
144
- AND (? IS NULL OR o.created_at_epoch >= ?)
145
- AND (? IS NULL OR o.created_at_epoch <= ?)
146
- AND (? IS NULL OR COALESCE(o.importance, 1) >= ?)
147
- ORDER BY score
148
- LIMIT ? OFFSET ?
149
- `).all(
150
- now,
151
- projectBoost, projectBoost,
152
- ftsQuery,
153
- args.project ?? null, args.project ?? null,
154
- args.obs_type ?? null, args.obs_type ?? null,
155
- epochFrom, epochFrom,
156
- epochTo, epochTo,
157
- args.importance ?? null, args.importance ?? null,
158
- perSourceLimit, perSourceOffset
159
- );
160
- for (const r of rows) {
161
- results.push({ source: 'obs', id: r.id, type: r.type, title: r.title, subtitle: r.subtitle, project: r.project, date: r.created_at, score: r.score, files_modified: r.files_modified, importance: r.importance, snippet: r.match_snippet || '' });
162
- }
194
+
195
+ const rows = db.prepare(buildObsFtsQuery('full', { withSnippet: true, withOffset: true }))
196
+ .all(...buildObsFtsParams({ now, projectBoost, ftsQuery, args, epochFrom, epochTo, limit: perSourceLimit, offset: perSourceOffset }));
197
+ for (const r of rows) results.push(ftsRowToResult(r, { snippet: true }));
163
198
 
164
199
  // OR fallback: when AND query returns 0 results, retry with OR semantics
165
200
  if (rows.length === 0) {
166
201
  const orQuery = relaxFtsQueryToOr(ftsQuery);
167
202
  if (orQuery) {
168
203
  try {
169
- const orRows = db.prepare(`
170
- SELECT o.id, o.type, o.title, o.subtitle, o.project, o.created_at, o.importance,
171
- o.files_modified,
172
- snippet(observations_fts, 2, '»', '«', '…', 10) as match_snippet,
173
- ${OBS_BM25}
174
- * (1.0 + EXP(-0.693 * (? - o.created_at_epoch) / ${RECENCY_HALF_LIFE_MS}.0))
175
- * (CASE WHEN ? IS NOT NULL AND o.project = ? THEN 2.0 ELSE 1.0 END)
176
- * (0.5 + 0.5 * COALESCE(o.importance, 1))
177
- * (1.0 + 0.1 * LN(1 + COALESCE(o.access_count, 0)))
178
- * 0.8 as score
179
- FROM observations_fts
180
- JOIN observations o ON observations_fts.rowid = o.id
181
- WHERE observations_fts MATCH ?
182
- AND COALESCE(o.compressed_into, 0) = 0
183
- AND (? IS NULL OR o.project = ?)
184
- AND (? IS NULL OR o.type = ?)
185
- AND (? IS NULL OR o.created_at_epoch >= ?)
186
- AND (? IS NULL OR o.created_at_epoch <= ?)
187
- AND (? IS NULL OR COALESCE(o.importance, 1) >= ?)
188
- ORDER BY score
189
- LIMIT ? OFFSET ?
190
- `).all(
191
- now,
192
- projectBoost, projectBoost,
193
- orQuery,
194
- args.project ?? null, args.project ?? null,
195
- args.obs_type ?? null, args.obs_type ?? null,
196
- epochFrom, epochFrom,
197
- epochTo, epochTo,
198
- args.importance ?? null, args.importance ?? null,
199
- perSourceLimit, perSourceOffset
200
- );
201
- for (const r of orRows) {
202
- results.push({ source: 'obs', id: r.id, type: r.type, title: r.title, subtitle: r.subtitle, project: r.project, date: r.created_at, score: r.score, files_modified: r.files_modified, importance: r.importance, snippet: r.match_snippet || '' });
203
- }
204
+ const orRows = db.prepare(buildObsFtsQuery('full', { multiplier: 0.8, withSnippet: true, withOffset: true }))
205
+ .all(...buildObsFtsParams({ now, projectBoost, ftsQuery: orQuery, args, epochFrom, epochTo, limit: perSourceLimit, offset: perSourceOffset }));
206
+ for (const r of orRows) results.push(ftsRowToResult(r, { snippet: true }));
204
207
  } catch (e) { debugCatch(e, 'searchObservations-or-fallback'); }
205
208
  }
206
209
  }
@@ -242,36 +245,12 @@ function expandObsByConceptCo(ctx, now, existingIds, results) {
242
245
  if (expanded.length === 0) return;
243
246
  const expansionFts = expanded.map(c => `"${c.replace(/"/g, '""')}"`).join(' OR ');
244
247
  try {
245
- const expRows = db.prepare(`
246
- SELECT o.id, o.type, o.title, o.subtitle, o.project, o.created_at, o.importance,
247
- o.files_modified,
248
- ${OBS_BM25}
249
- * (1.0 + EXP(-0.693 * (? - o.created_at_epoch) / ${RECENCY_HALF_LIFE_MS}.0))
250
- * (0.5 + 0.5 * COALESCE(o.importance, 1)) as score
251
- FROM observations_fts
252
- JOIN observations o ON observations_fts.rowid = o.id
253
- WHERE observations_fts MATCH ?
254
- AND COALESCE(o.compressed_into, 0) = 0
255
- AND (? IS NULL OR o.project = ?)
256
- AND (? IS NULL OR o.type = ?)
257
- AND (? IS NULL OR o.created_at_epoch >= ?)
258
- AND (? IS NULL OR o.created_at_epoch <= ?)
259
- AND (? IS NULL OR COALESCE(o.importance, 1) >= ?)
260
- ORDER BY score
261
- LIMIT ?
262
- `).all(
263
- now, expansionFts,
264
- args.project ?? null, args.project ?? null,
265
- args.obs_type ?? null, args.obs_type ?? null,
266
- epochFrom, epochFrom,
267
- epochTo, epochTo,
268
- args.importance ?? null, args.importance ?? null,
269
- limit
270
- );
248
+ const expRows = db.prepare(buildObsFtsQuery('simple'))
249
+ .all(...buildObsFtsParams({ now, ftsQuery: expansionFts, args, epochFrom, epochTo, limit }));
271
250
  for (const r of expRows) {
272
251
  if (!existingIds.has(r.id)) {
273
252
  existingIds.add(r.id);
274
- results.push({ source: 'obs', id: r.id, type: r.type, title: r.title, subtitle: r.subtitle, project: r.project, date: r.created_at, score: r.score * 0.7, files_modified: r.files_modified, importance: r.importance, snippet: '' });
253
+ results.push(ftsRowToResult(r, { scoreMultiplier: 0.7 }));
275
254
  }
276
255
  }
277
256
  } catch (e) { debugLog('WARN', 'mem_search', `concept expansion error: ${e.message}`); }
@@ -292,36 +271,12 @@ function expandObsByPRF(ctx, now, primaryCount, existingIds, results) {
292
271
  if (prfTerms.length === 0) return;
293
272
  const prfFts = prfTerms.map(t => `"${t.replace(/"/g, '""')}"`).join(' OR ');
294
273
  try {
295
- const prfRows = db.prepare(`
296
- SELECT o.id, o.type, o.title, o.subtitle, o.project, o.created_at, o.importance,
297
- o.files_modified,
298
- ${OBS_BM25}
299
- * (1.0 + EXP(-0.693 * (? - o.created_at_epoch) / ${RECENCY_HALF_LIFE_MS}.0))
300
- * (0.5 + 0.5 * COALESCE(o.importance, 1)) as score
301
- FROM observations_fts
302
- JOIN observations o ON observations_fts.rowid = o.id
303
- WHERE observations_fts MATCH ?
304
- AND COALESCE(o.compressed_into, 0) = 0
305
- AND (? IS NULL OR o.project = ?)
306
- AND (? IS NULL OR o.type = ?)
307
- AND (? IS NULL OR o.created_at_epoch >= ?)
308
- AND (? IS NULL OR o.created_at_epoch <= ?)
309
- AND (? IS NULL OR COALESCE(o.importance, 1) >= ?)
310
- ORDER BY score
311
- LIMIT ?
312
- `).all(
313
- now, prfFts,
314
- args.project ?? null, args.project ?? null,
315
- args.obs_type ?? null, args.obs_type ?? null,
316
- epochFrom, epochFrom,
317
- epochTo, epochTo,
318
- args.importance ?? null, args.importance ?? null,
319
- limit
320
- );
274
+ const prfRows = db.prepare(buildObsFtsQuery('simple'))
275
+ .all(...buildObsFtsParams({ now, ftsQuery: prfFts, args, epochFrom, epochTo, limit }));
321
276
  for (const r of prfRows) {
322
277
  if (!existingIds.has(r.id)) {
323
278
  existingIds.add(r.id);
324
- results.push({ source: 'obs', id: r.id, type: r.type, title: r.title, subtitle: r.subtitle, project: r.project, date: r.created_at, score: r.score * 0.6, files_modified: r.files_modified, importance: r.importance, snippet: '' });
279
+ results.push(ftsRowToResult(r, { scoreMultiplier: 0.6 }));
325
280
  }
326
281
  }
327
282
  } catch (e) { debugLog('WARN', 'mem_search', `PRF expansion error: ${e.message}`); }
@@ -1016,7 +971,7 @@ server.registerTool(
1016
971
  const baseParams = project ? [project] : [];
1017
972
 
1018
973
  if (action === 'scan') {
1019
- // 1. Find near-duplicate titles (pre-compute word sets, then O(n²) Jaccard)
974
+ // 1. Find near-duplicate titles (MinHash pre-filter, then exact Jaccard on candidates)
1020
975
  const recent = db.prepare(`
1021
976
  SELECT id, title, project, importance, access_count, created_at_epoch
1022
977
  FROM observations
@@ -1025,13 +980,17 @@ server.registerTool(
1025
980
  LIMIT ${SCAN_LIMIT}
1026
981
  `).all(...baseParams);
1027
982
 
1028
- const wordSets = recent.map(r => new Set((r.title || '').toLowerCase().split(/\s+/).filter(w => w.length > 2)));
983
+ const titles = recent.map(r => (r.title || '').trim());
984
+ const minhashes = titles.map(t => t ? computeMinHash(t) : null);
985
+ const MINHASH_PRE_THRESHOLD = 0.5; // loose pre-filter to catch candidates
1029
986
  const duplicates = [];
1030
987
  for (let i = 0; i < recent.length && duplicates.length < DUPLICATE_LIMIT; i++) {
1031
- if (wordSets[i].size === 0) continue;
988
+ if (!titles[i] || !minhashes[i]) continue;
1032
989
  for (let j = i + 1; j < recent.length; j++) {
1033
- if (wordSets[j].size === 0) continue;
1034
- const sim = jaccardSimilarity(wordSets[i], wordSets[j]);
990
+ if (!titles[j] || !minhashes[j]) continue;
991
+ // Fast MinHash estimate to skip obvious non-matches
992
+ if (estimateJaccardFromMinHash(minhashes[i], minhashes[j]) < MINHASH_PRE_THRESHOLD) continue;
993
+ const sim = jaccardSimilarity(titles[i], titles[j]);
1035
994
  if (sim > SIMILARITY_THRESHOLD) {
1036
995
  duplicates.push({
1037
996
  a: { id: recent[i].id, title: recent[i].title, importance: recent[i].importance },
@@ -1058,6 +1017,11 @@ server.registerTool(
1058
1017
  WHERE COALESCE(compressed_into, 0) = 0 ${projectFilter}
1059
1018
  `).get(staleAge, ...baseParams);
1060
1019
 
1020
+ // Count pending-purge items (marked by idle cleanup)
1021
+ const pendingPurge = db.prepare(`
1022
+ SELECT COUNT(*) as count FROM observations WHERE compressed_into = ${COMPRESSED_PENDING_PURGE} ${projectFilter}
1023
+ `).get(...baseParams);
1024
+
1061
1025
  const lines = [
1062
1026
  `Memory maintenance scan:`,
1063
1027
  ` Total active observations: ${stats.total}`,
@@ -1065,6 +1029,7 @@ server.registerTool(
1065
1029
  ` Stale (>30d, imp=1, no access): ${stats.stale}`,
1066
1030
  ` Broken (no title/narrative): ${stats.broken}`,
1067
1031
  ` Boostable (accessed>3, imp<3): ${stats.boostable}`,
1032
+ ` Pending purge (idle-marked): ${pendingPurge.count}`,
1068
1033
  ];
1069
1034
  if (duplicates.length > 0) {
1070
1035
  lines.push('', 'Top duplicates:');
@@ -1079,40 +1044,53 @@ server.registerTool(
1079
1044
  const ops = args.operations || [];
1080
1045
  const results = [];
1081
1046
  const staleAge = Date.now() - STALE_AGE_MS;
1047
+ const OP_ROW_CAP = 1000; // safety cap per operation
1082
1048
 
1083
1049
  db.transaction(() => {
1084
1050
  if (ops.includes('cleanup')) {
1085
1051
  const deleted = db.prepare(`
1086
1052
  DELETE FROM observations
1087
- WHERE COALESCE(compressed_into, 0) = 0
1088
- AND (title IS NULL OR title = '')
1089
- AND (narrative IS NULL OR narrative = '')
1090
- ${projectFilter}
1053
+ WHERE id IN (
1054
+ SELECT id FROM observations
1055
+ WHERE COALESCE(compressed_into, 0) = 0
1056
+ AND (title IS NULL OR title = '')
1057
+ AND (narrative IS NULL OR narrative = '')
1058
+ ${projectFilter}
1059
+ LIMIT ${OP_ROW_CAP}
1060
+ )
1091
1061
  `).run(...baseParams);
1092
- results.push(`Cleaned up ${deleted.changes} broken observations`);
1062
+ results.push(`Cleaned up ${deleted.changes} broken observations` + (deleted.changes >= OP_ROW_CAP ? ' (cap reached, re-run for more)' : ''));
1093
1063
  }
1094
1064
 
1095
1065
  if (ops.includes('decay')) {
1096
1066
  const decayed = db.prepare(`
1097
1067
  UPDATE observations SET importance = MAX(1, COALESCE(importance, 1) - 1)
1098
- WHERE COALESCE(compressed_into, 0) = 0
1099
- AND COALESCE(importance, 1) > 1
1100
- AND COALESCE(access_count, 0) = 0
1101
- AND created_at_epoch < ?
1102
- ${projectFilter}
1068
+ WHERE id IN (
1069
+ SELECT id FROM observations
1070
+ WHERE COALESCE(compressed_into, 0) = 0
1071
+ AND COALESCE(importance, 1) > 1
1072
+ AND COALESCE(access_count, 0) = 0
1073
+ AND created_at_epoch < ?
1074
+ ${projectFilter}
1075
+ LIMIT ${OP_ROW_CAP}
1076
+ )
1103
1077
  `).run(staleAge, ...baseParams);
1104
- results.push(`Decayed ${decayed.changes} stale observations`);
1078
+ results.push(`Decayed ${decayed.changes} stale observations` + (decayed.changes >= OP_ROW_CAP ? ' (cap reached, re-run for more)' : ''));
1105
1079
  }
1106
1080
 
1107
1081
  if (ops.includes('boost')) {
1108
1082
  const boosted = db.prepare(`
1109
1083
  UPDATE observations SET importance = MIN(3, COALESCE(importance, 1) + 1)
1110
- WHERE COALESCE(compressed_into, 0) = 0
1111
- AND COALESCE(access_count, 0) > 3
1112
- AND COALESCE(importance, 1) < 3
1113
- ${projectFilter}
1084
+ WHERE id IN (
1085
+ SELECT id FROM observations
1086
+ WHERE COALESCE(compressed_into, 0) = 0
1087
+ AND COALESCE(access_count, 0) > 3
1088
+ AND COALESCE(importance, 1) < 3
1089
+ ${projectFilter}
1090
+ LIMIT ${OP_ROW_CAP}
1091
+ )
1114
1092
  `).run(...baseParams);
1115
- results.push(`Boosted ${boosted.changes} frequently-accessed observations`);
1093
+ results.push(`Boosted ${boosted.changes} frequently-accessed observations` + (boosted.changes >= OP_ROW_CAP ? ' (cap reached, re-run for more)' : ''));
1116
1094
  }
1117
1095
 
1118
1096
  if (ops.includes('dedup') && args.merge_ids) {
@@ -1126,6 +1104,22 @@ server.registerTool(
1126
1104
  }
1127
1105
  results.push(`Merged ${totalMerged} duplicate observations`);
1128
1106
  }
1107
+
1108
+ if (ops.includes('purge_stale')) {
1109
+ // Delete observations previously marked as pending-purge by idle cleanup.
1110
+ // Requires user confirmation via /mem:update or /mem:mem.
1111
+ const retainDays = args.retain_days ?? 30;
1112
+ const retainCutoff = Date.now() - retainDays * 86400000;
1113
+ const purged = db.prepare(`
1114
+ DELETE FROM observations
1115
+ WHERE id IN (
1116
+ SELECT id FROM observations
1117
+ WHERE compressed_into = ${COMPRESSED_PENDING_PURGE} AND created_at_epoch < ? ${projectFilter}
1118
+ LIMIT ${OP_ROW_CAP}
1119
+ )
1120
+ `).run(retainCutoff, ...baseParams);
1121
+ results.push(`Purged ${purged.changes} stale observations (retained last ${retainDays} days)` + (purged.changes >= OP_ROW_CAP ? ' (cap reached, re-run for more)' : ''));
1122
+ }
1129
1123
  })();
1130
1124
 
1131
1125
  // FTS5 optimize (outside transaction)
@@ -1258,23 +1252,23 @@ const idleTimer = setInterval(() => {
1258
1252
  const thirtyDaysAgo = Date.now() - 30 * 86400000;
1259
1253
 
1260
1254
  db.transaction(() => {
1261
- // Delete old low-quality observations (importance<=1, never accessed, 30+ days).
1255
+ // Mark old low-quality observations as pending-purge (importance<=1, never accessed, 30+ days).
1256
+ // Actual deletion only happens when user confirms via mem_maintain execute purge_stale.
1262
1257
  // NOTE: no project filter — MCP server is global, operates across all projects.
1263
- // This is intentionally broader than hook.mjs auto-compress (which scopes to current project).
1264
- const deleted = db.prepare(`
1265
- DELETE FROM observations
1258
+ const marked = db.prepare(`
1259
+ UPDATE observations SET compressed_into = ${COMPRESSED_PENDING_PURGE}
1266
1260
  WHERE importance <= 1 AND COALESCE(access_count, 0) = 0
1267
1261
  AND created_at_epoch < ? AND COALESCE(compressed_into, 0) = 0
1268
1262
  `).run(thirtyDaysAgo);
1269
- if (deleted.changes > 0) {
1270
- debugLog('INFO', 'idle-cleanup', `Deleted ${deleted.changes} stale low-quality observations`);
1263
+ if (marked.changes > 0) {
1264
+ debugLog('INFO', 'idle-cleanup', `Marked ${marked.changes} stale observations as pending-purge`);
1271
1265
  }
1272
1266
 
1273
- // Mark old importance=1 as compressed (30+ days)
1274
- // NOTE: compressed_into = -1 is an established sentinel meaning "auto-compressed without merge target"
1275
- // (same pattern used in hook.mjs:456 for time-based compression)
1267
+ // Mark old importance=1 with access_count>0 as compressed (30+ days).
1268
+ // Note: importance=1, access_count=0 rows were already marked pending-purge above,
1269
+ // so this only catches importance=1 rows that HAVE been accessed.
1276
1270
  const compressed = db.prepare(`
1277
- UPDATE observations SET compressed_into = -1
1271
+ UPDATE observations SET compressed_into = ${COMPRESSED_AUTO}
1278
1272
  WHERE COALESCE(compressed_into, 0) = 0 AND importance = 1
1279
1273
  AND created_at_epoch < ?
1280
1274
  `).run(thirtyDaysAgo);
package/tool-schemas.mjs CHANGED
@@ -57,10 +57,12 @@ export const memCompressSchema = {
57
57
 
58
58
  export const memMaintainSchema = {
59
59
  action: z.enum(['scan', 'execute']).describe('scan=analyze candidates, execute=apply changes'),
60
- operations: z.array(z.enum(['dedup', 'decay', 'cleanup', 'boost'])).optional()
61
- .describe('Operations to execute (for action=execute)'),
60
+ operations: z.array(z.enum(['dedup', 'decay', 'cleanup', 'boost', 'purge_stale'])).optional()
61
+ .describe('Operations to execute (for action=execute). purge_stale deletes idle-marked observations after user confirmation.'),
62
62
  merge_ids: z.array(z.array(z.number().int()).min(2)).optional()
63
63
  .describe('For dedup: [[keepId, removeId1, removeId2], ...] — first ID in each group is kept'),
64
+ retain_days: z.number().int().min(7).max(365).optional()
65
+ .describe('For purge_stale: keep observations newer than N days (default 30)'),
64
66
  project: z.string().optional().describe('Filter by project'),
65
67
  };
66
68
 
package/utils.mjs CHANGED
@@ -3,6 +3,13 @@
3
3
 
4
4
  import { basename, dirname } from 'path';
5
5
 
6
+ // ─── Sentinel Values ────────────────────────────────────────────────────────
7
+
8
+ /** compressed_into sentinel: auto-compressed without merge target */
9
+ export const COMPRESSED_AUTO = -1;
10
+ /** compressed_into sentinel: pending user-confirmed purge (marked by idle cleanup) */
11
+ export const COMPRESSED_PENDING_PURGE = -2;
12
+
6
13
  // ─── String Utilities ────────────────────────────────────────────────────────
7
14
 
8
15
  /**
@@ -420,7 +427,8 @@ export function inferProject() {
420
427
  const parent = basename(dirname(p));
421
428
  const raw = parent && parent !== '.' && parent !== '/' ? `${parent}--${base}` : base;
422
429
  // Sanitize to prevent path traversal when used in filenames (ep-<project>.json)
423
- return raw.replace(/[^a-zA-Z0-9_.-]/g, '-');
430
+ // Truncate to 100 chars to avoid exceeding filesystem name limits (255 bytes)
431
+ return raw.replace(/[^a-zA-Z0-9_.-]/g, '-').slice(0, 100);
424
432
  }
425
433
 
426
434
  // ─── Bash Analysis ───────────────────────────────────────────────────────────
@@ -700,7 +708,7 @@ export function tokenizeHandoff(text) {
700
708
  if (!text) return [];
701
709
  return text
702
710
  .split(/[\s,;:.()[\]{}'"`<>→|/\\#@!?=+*&^%$~]+/)
703
- .map(w => w.toLowerCase().replace(/^[.\-]+|[.\-]+$/g, ''))
711
+ .map(w => w.toLowerCase().replace(/^[.-]+|[.-]+$/g, ''))
704
712
  .filter(w => w.length >= 3);
705
713
  }
706
714