npm - memory-lancedb-pro - Versions diffs - 1.0.10 → 1.0.12 - Mend

memory-lancedb-pro 1.0.10 → 1.0.12

This diff compares the contents of two publicly released versions of the package, as published to a supported registry. It is provided for informational purposes only and reflects the changes between those versions exactly as they appear in the public registry.

Files changed (8)

package/CHANGELOG.md +11 -0
package/README.md +30 -1
package/README_CN.md +30 -1
package/index.ts +57 -53
package/openclaw.plugin.json +15 -2
package/package.json +2 -2
package/src/adaptive-retrieval.ts +15 -5
package/src/retriever.ts +20 -8

package/CHANGELOG.md CHANGED Viewed

@@ -1,5 +1,16 @@
 # Changelog
+## 1.0.12
+- Fix: ghost memories stuck in autoRecall after deletion (#15). BM25-only results from stale FTS index are now validated via `store.hasId()` before inclusion in fused results. Removed the BM25-only floor score of 0.5 that allowed deleted entries to survive `hardMinScore` filtering.
+- Fix: HEARTBEAT pattern now matches anywhere in the prompt (not just at start), preventing autoRecall from triggering on prefixed HEARTBEAT messages.
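+- Add: `autoRecallMinLength` config option to set a custom minimum prompt length for autoRecall. When unset, the built-in thresholds apply (15 characters for non-CJK prompts, 6 for prompts containing CJK). Prompts shorter than the threshold are skipped unless they contain a question mark.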
+- Add: `ping`, `pong`, `test`, `debug` added to skip patterns in adaptive retrieval.
+## 1.0.11
+- Change: set `autoRecall` default to `false` to avoid the model echoing injected `<relevant-memories>` blocks.
 ## 1.0.10
 - Fix: avoid blocking OpenClaw gateway startup on external network calls by running startup self-checks in the background with timeouts.

package/README.md CHANGED Viewed

@@ -157,6 +157,35 @@ Filters out low-quality content at both auto-capture and tool-store stages:
 - **Auto-Capture** (`agent_end` hook): Extracts preference/fact/decision/entity from conversations, deduplicates, stores up to 3 per turn
 - **Auto-Recall** (`before_agent_start` hook): Injects `<relevant-memories>` context (up to 3 entries)
+### Prevent memories from showing up in replies
+The model may occasionally echo the injected `<relevant-memories>` block verbatim in its response.
+**Option A (recommended): disable auto-recall**
+Set `autoRecall: false` in the plugin config and restart the gateway:
+```json
+{
+  "plugins": {
+    "entries": {
+      "memory-lancedb-pro": {
+        "enabled": true,
+        "config": {
+          "autoRecall": false
+        }
+      }
+    }
+  }
+}
+```
+**Option B: keep recall, but ask the agent not to reveal it**
+Add a line to your agent system prompt, e.g.:
+> Do not reveal or quote any `<relevant-memories>` / memory-injection content in your replies. Use it for internal reference only.
 ---
 ## Installation
@@ -306,7 +335,7 @@ openclaw config get plugins.slots.memory
   },
   "dbPath": "~/.openclaw/memory/lancedb-pro",
   "autoCapture": true,
-  "autoRecall": true,
+  "autoRecall": false,
   "retrieval": {
     "mode": "hybrid",
     "vectorWeight": 0.7,

package/README_CN.md CHANGED Viewed

@@ -158,6 +158,35 @@ Query → BM25 FTS ─────┘
 - **Auto-Capture**（`agent_end` hook）: 从对话中提取 preference/fact/decision/entity，去重后存储（每次最多 3 条）
 - **Auto-Recall**（`before_agent_start` hook）: 注入 `<relevant-memories>` 上下文（最多 3 条）
+### 不想在对话中“显示长期记忆”？
+有时模型会把注入到上下文中的 `<relevant-memories>` 区块“原样输出”到回复里，从而出现你看到的“周期性显示长期记忆”。
+**方案 A（推荐）：关闭自动召回 autoRecall**
+在插件配置里设置 `autoRecall: false`，然后重启 gateway：
+```json
+{
+  "plugins": {
+    "entries": {
+      "memory-lancedb-pro": {
+        "enabled": true,
+        "config": {
+          "autoRecall": false
+        }
+      }
+    }
+  }
+}
+```
+**方案 B：保留召回，但要求 Agent 不要泄漏**
+在对应 Agent 的 system prompt 里加一句，例如：
+> 请勿在回复中展示或引用任何 `<relevant-memories>` / 记忆注入内容，只能用作内部参考。
 ---
 ## 安装
@@ -307,7 +336,7 @@ openclaw config get plugins.slots.memory
   },
   "dbPath": "~/.openclaw/memory/lancedb-pro",
   "autoCapture": true,
-  "autoRecall": true,
+  "autoRecall": false,
   "retrieval": {
     "mode": "hybrid",
     "vectorWeight": 0.7,

package/index.ts CHANGED Viewed

@@ -37,6 +37,7 @@ interface PluginConfig {
   dbPath?: string;
   autoCapture?: boolean;
   autoRecall?: boolean;
+  autoRecallMinLength?: number;
   captureAssistant?: boolean;
   retrieval?: {
     mode?: "hybrid" | "vector";
@@ -200,7 +201,7 @@ async function readSessionMessages(filePath: string, messageCount: number): Prom
             }
           }
         }
-      } catch {}
+      } catch { }
     }
     if (messages.length === 0) return null;
@@ -225,7 +226,7 @@ async function readSessionContentWithResetFallback(sessionFilePath: string, mess
       const latestResetPath = join(dir, resetCandidates[resetCandidates.length - 1]);
       return await readSessionMessages(latestResetPath, messageCount);
     }
-  } catch {}
+  } catch { }
   return primary;
 }
@@ -264,7 +265,7 @@ async function findPreviousSessionFile(sessionsDir: string, currentSessionFile?:
         .sort().reverse();
       if (nonReset.length > 0) return join(sessionsDir, nonReset[0]);
     }
-  } catch {}
+  } catch { }
 }
 // ============================================================================
@@ -364,9 +365,10 @@ const memoryLanceDBProPlugin = {
     // ========================================================================
     // Auto-recall: inject relevant memories before agent starts
-    if (config.autoRecall !== false) {
+    // Default is OFF to prevent the model from accidentally echoing injected context.
+    if (config.autoRecall === true) {
       api.on("before_agent_start", async (event, ctx) => {
-        if (!event.prompt || shouldSkipRetrieval(event.prompt)) {
+        if (!event.prompt || shouldSkipRetrieval(event.prompt, config.autoRecallMinLength)) {
           return;
         }
@@ -622,7 +624,7 @@ const memoryLanceDBProPlugin = {
         if (files.length > 7) {
           const { unlink } = await import("node:fs/promises");
           for (const old of files.slice(0, files.length - 7)) {
-            await unlink(join(backupDir, old)).catch(() => {});
+            await unlink(join(backupDir, old)).catch(() => { });
           }
         }
@@ -663,10 +665,10 @@ const memoryLanceDBProPlugin = {
             api.logger.info(
               `memory-lancedb-pro: initialized successfully ` +
-                `(embedding: ${embedTest.success ? "OK" : "FAIL"}, ` +
-                `retrieval: ${retrievalTest.success ? "OK" : "FAIL"}, ` +
-                `mode: ${retrievalTest.mode}, ` +
-                `FTS: ${retrievalTest.hasFtsSupport ? "enabled" : "disabled"})`
+              `(embedding: ${embedTest.success ? "OK" : "FAIL"}, ` +
+              `retrieval: ${retrievalTest.success ? "OK" : "FAIL"}, ` +
+              `mode: ${retrievalTest.mode}, ` +
+              `FTS: ${retrievalTest.hasFtsSupport ? "enabled" : "disabled"})`
             );
             if (!embedTest.success) {
@@ -700,53 +702,55 @@ const memoryLanceDBProPlugin = {
 };
 function parsePluginConfig(value: unknown): PluginConfig {
-    if (!value || typeof value !== "object" || Array.isArray(value)) {
-      throw new Error("memory-lancedb-pro config required");
-    }
-    const cfg = value as Record<string, unknown>;
+  if (!value || typeof value !== "object" || Array.isArray(value)) {
+    throw new Error("memory-lancedb-pro config required");
+  }
+  const cfg = value as Record<string, unknown>;
-    const embedding = cfg.embedding as Record<string, unknown> | undefined;
-    if (!embedding) {
-      throw new Error("embedding config is required");
-    }
+  const embedding = cfg.embedding as Record<string, unknown> | undefined;
+  if (!embedding) {
+    throw new Error("embedding config is required");
+  }
-    const apiKey = typeof embedding.apiKey === "string"
-      ? embedding.apiKey
-      : process.env.OPENAI_API_KEY || "";
+  const apiKey = typeof embedding.apiKey === "string"
+    ? embedding.apiKey
+    : process.env.OPENAI_API_KEY || "";
-    if (!apiKey) {
-      throw new Error("embedding.apiKey is required (set directly or via OPENAI_API_KEY env var)");
-    }
+  if (!apiKey) {
+    throw new Error("embedding.apiKey is required (set directly or via OPENAI_API_KEY env var)");
+  }
-    return {
-      embedding: {
-        provider: "openai-compatible",
-        apiKey,
-        model: typeof embedding.model === "string" ? embedding.model : "text-embedding-3-small",
-        baseURL: typeof embedding.baseURL === "string" ? resolveEnvVars(embedding.baseURL) : undefined,
-        // Accept number, numeric string, or env-var string (e.g. "${EMBED_DIM}").
-        // Also accept legacy top-level `dimensions` for convenience.
-        dimensions: parsePositiveInt(embedding.dimensions ?? cfg.dimensions),
-        taskQuery: typeof embedding.taskQuery === "string" ? embedding.taskQuery : undefined,
-        taskPassage: typeof embedding.taskPassage === "string" ? embedding.taskPassage : undefined,
-        normalized: typeof embedding.normalized === "boolean" ? embedding.normalized : undefined,
-      },
-      dbPath: typeof cfg.dbPath === "string" ? cfg.dbPath : undefined,
-      autoCapture: cfg.autoCapture !== false,
-      autoRecall: cfg.autoRecall !== false,
-      captureAssistant: cfg.captureAssistant === true,
-      retrieval: typeof cfg.retrieval === "object" && cfg.retrieval !== null ? cfg.retrieval as any : undefined,
-      scopes: typeof cfg.scopes === "object" && cfg.scopes !== null ? cfg.scopes as any : undefined,
-      enableManagementTools: cfg.enableManagementTools === true,
-      sessionMemory: typeof cfg.sessionMemory === "object" && cfg.sessionMemory !== null
-        ? {
-            enabled: (cfg.sessionMemory as Record<string, unknown>).enabled !== false,
-            messageCount: typeof (cfg.sessionMemory as Record<string, unknown>).messageCount === "number"
-              ? (cfg.sessionMemory as Record<string, unknown>).messageCount as number
-              : undefined,
-          }
-        : undefined,
-    };
+  return {
+    embedding: {
+      provider: "openai-compatible",
+      apiKey,
+      model: typeof embedding.model === "string" ? embedding.model : "text-embedding-3-small",
+      baseURL: typeof embedding.baseURL === "string" ? resolveEnvVars(embedding.baseURL) : undefined,
+      // Accept number, numeric string, or env-var string (e.g. "${EMBED_DIM}").
+      // Also accept legacy top-level `dimensions` for convenience.
+      dimensions: parsePositiveInt(embedding.dimensions ?? cfg.dimensions),
+      taskQuery: typeof embedding.taskQuery === "string" ? embedding.taskQuery : undefined,
+      taskPassage: typeof embedding.taskPassage === "string" ? embedding.taskPassage : undefined,
+      normalized: typeof embedding.normalized === "boolean" ? embedding.normalized : undefined,
+    },
+    dbPath: typeof cfg.dbPath === "string" ? cfg.dbPath : undefined,
+    autoCapture: cfg.autoCapture !== false,
+    // Default OFF: only enable when explicitly set to true.
+    autoRecall: cfg.autoRecall === true,
+    autoRecallMinLength: parsePositiveInt(cfg.autoRecallMinLength),
+    captureAssistant: cfg.captureAssistant === true,
+    retrieval: typeof cfg.retrieval === "object" && cfg.retrieval !== null ? cfg.retrieval as any : undefined,
+    scopes: typeof cfg.scopes === "object" && cfg.scopes !== null ? cfg.scopes as any : undefined,
+    enableManagementTools: cfg.enableManagementTools === true,
+    sessionMemory: typeof cfg.sessionMemory === "object" && cfg.sessionMemory !== null
+      ? {
+        enabled: (cfg.sessionMemory as Record<string, unknown>).enabled !== false,
+        messageCount: typeof (cfg.sessionMemory as Record<string, unknown>).messageCount === "number"
+          ? (cfg.sessionMemory as Record<string, unknown>).messageCount as number
+          : undefined,
+      }
+      : undefined,
+  };
 }
 export default memoryLanceDBProPlugin;

package/openclaw.plugin.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "id": "memory-lancedb-pro",
   "name": "Memory (LanceDB Pro)",
   "description": "Enhanced LanceDB-backed long-term memory with hybrid retrieval, multi-scope isolation, and management CLI",
-  "version": "1.0.10",
+  "version": "1.0.12",
   "kind": "memory",
   "configSchema": {
     "type": "object",
@@ -58,7 +58,15 @@
         "type": "boolean"
       },
       "autoRecall": {
-        "type": "boolean"
+        "type": "boolean",
+        "default": false
+      },
+      "autoRecallMinLength": {
+        "type": "integer",
+        "minimum": 1,
+        "maximum": 200,
+        "default": 15,
+        "description": "Minimum prompt length (in characters) to trigger auto-recall. Prompts shorter than this are skipped. Default: 15 for English, 6 for CJK."
       },
       "captureAssistant": {
         "type": "boolean"
@@ -265,6 +273,11 @@
       "label": "Auto-Recall",
       "help": "Automatically inject relevant memories into context"
     },
+    "autoRecallMinLength": {
+      "label": "Auto-Recall Min Length",
+      "help": "Minimum prompt length to trigger auto-recall (shorter prompts are skipped). Default: 15 chars for English, 6 for CJK.",
+      "advanced": true
+    },
     "captureAssistant": {
       "label": "Capture Assistant Messages",
       "help": "Also auto-capture assistant messages (default false to reduce memory pollution)",

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "memory-lancedb-pro",
-  "version": "1.0.10",
+  "version": "1.0.12",
   "description": "OpenClaw enhanced LanceDB memory plugin with hybrid retrieval (Vector + BM25), cross-encoder rerank, multi-scope isolation, and management CLI",
   "type": "module",
   "main": "index.ts",
@@ -40,4 +40,4 @@
     "jiti": "^2.6.0",
     "typescript": "^5.9.3"
   }
-}
+}

package/src/adaptive-retrieval.ts CHANGED Viewed

@@ -18,9 +18,11 @@ const SKIP_PATTERNS = [
   /^(go ahead|continue|proceed|do it|start|begin|next|实施|开始|继续|好的|可以|行)\s*[.!]?$/i,
   // Pure emoji
   /^[\p{Emoji}\s]+$/u,
-  // Heartbeat/system
-  /^HEARTBEAT/i,
+  // Heartbeat/system (match anywhere, not just at start, to handle prefixed formats)
+  /HEARTBEAT/i,
   /^\[System/i,
+  // Single-word utility pings
+  /^(ping|pong|test|debug)\s*[.!?]?$/i,
 ];
 // Queries that SHOULD trigger retrieval even if short
@@ -61,8 +63,10 @@ function normalizeQuery(query: string): string {
 /**
  * Determine if a query should skip memory retrieval.
  * Returns true if retrieval should be skipped.
+ * @param query The raw prompt text
+ * @param minLength Optional minimum length override (if set, overrides built-in thresholds)
  */
-export function shouldSkipRetrieval(query: string): boolean {
+export function shouldSkipRetrieval(query: string, minLength?: number): boolean {
   const trimmed = normalizeQuery(query);
   // Force retrieve if query has memory-related intent (checked FIRST,
@@ -75,11 +79,17 @@ export function shouldSkipRetrieval(query: string): boolean {
   // Skip if matches any skip pattern
   if (SKIP_PATTERNS.some(p => p.test(trimmed))) return true;
+  // If caller provides a custom minimum length, use it
+  if (minLength !== undefined && minLength > 0) {
+    if (trimmed.length < minLength && !trimmed.includes('?') && !trimmed.includes('？')) return true;
+    return false;
+  }
   // Skip very short non-question messages (likely commands or affirmations)
   // CJK characters carry more meaning per character, so use a lower threshold
   const hasCJK = /[\u4e00-\u9fff\u3040-\u309f\u30a0-\u30ff\uac00-\ud7af]/.test(trimmed);
-  const minLength = hasCJK ? 6 : 15;
-  if (trimmed.length < minLength && !trimmed.includes('?') && !trimmed.includes('？')) return true;
+  const defaultMinLength = hasCJK ? 6 : 15;
+  if (trimmed.length < defaultMinLength && !trimmed.includes('?') && !trimmed.includes('？')) return true;
   // Default: do retrieve
   return false;

package/src/retriever.ts CHANGED Viewed

@@ -282,8 +282,8 @@ export class MemoryRetriever {
       this.runBM25Search(query, candidatePoolSize, scopeFilter, category),
     ]);
-    // Fuse results using RRF
-    const fusedResults = this.fuseResults(vectorResults, bm25Results);
+    // Fuse results using RRF (async: validates BM25-only entries exist in store)
+    const fusedResults = await this.fuseResults(vectorResults, bm25Results);
     // Apply minimum score threshold
     const filtered = fusedResults.filter(r => r.score >= this.config.minScore);
@@ -357,10 +357,10 @@ export class MemoryRetriever {
     }));
   }
-  private fuseResults(
+  private async fuseResults(
     vectorResults: Array<MemorySearchResult & { rank: number }>,
     bm25Results: Array<MemorySearchResult & { rank: number }>
-  ): RetrievalResult[] {
+  ): Promise<RetrievalResult[]> {
     // Create maps for quick lookup
     const vectorMap = new Map<string, MemorySearchResult & { rank: number }>();
     const bm25Map = new Map<string, MemorySearchResult & { rank: number }>();
@@ -383,6 +383,18 @@ export class MemoryRetriever {
       const vectorResult = vectorMap.get(id);
       const bm25Result = bm25Map.get(id);
+      // FIX(#15): BM25-only results may be "ghost" entries whose vector data was
+      // deleted but whose FTS index entry lingers until the next index rebuild.
+      // Validate that the entry actually exists in the store before including it.
+      if (!vectorResult && bm25Result) {
+        try {
+          const exists = await this.store.hasId(id);
+          if (!exists) continue; // Skip ghost entry
+        } catch {
+          // If hasId fails, keep the result (fail-open)
+        }
+      }
       // Use the result with more complete data (prefer vector result if both exist)
       const baseResult = vectorResult || bm25Result!;
@@ -392,12 +404,12 @@ export class MemoryRetriever {
       const bm25Hit = bm25Result ? 1 : 0;
       // Base = vector score; BM25 hit boosts by up to 15%
-      // BM25-only results use their normalized score (floor 0.5) so exact keyword
-      // matches aren't buried — e.g. searching "JINA_API_KEY" should surface even
-      // when vector distance is large.
+      // BM25-only results use their raw BM25 score so exact keyword matches
+      // (e.g. searching "JINA_API_KEY") still surface. The previous floor of 0.5
+      // was too generous and allowed ghost entries to survive hardMinScore (0.35).
       const fusedScore = vectorResult
         ? clamp01(vectorScore + (bm25Hit * 0.15 * vectorScore), 0.1)
-        : clamp01(Math.max(bm25Result!.score, 0.5), 0.1);
+        : clamp01(bm25Result!.score, 0.1);
       fusedResults.push({
         entry: baseResult.entry,