openclaw-mem 1.0.4 → 1.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (47)
  1. package/HOOK.md +125 -0
  2. package/LICENSE +1 -1
  3. package/MCP.json +11 -0
  4. package/README.md +158 -167
  5. package/backfill-embeddings.js +79 -0
  6. package/context-builder.js +703 -0
  7. package/database.js +625 -0
  8. package/debug-logger.js +280 -0
  9. package/extractor.js +268 -0
  10. package/gateway-llm.js +250 -0
  11. package/handler.js +941 -0
  12. package/mcp-http-api.js +424 -0
  13. package/mcp-server.js +605 -0
  14. package/mem-get.sh +24 -0
  15. package/mem-search.sh +17 -0
  16. package/monitor.js +112 -0
  17. package/package.json +58 -30
  18. package/realtime-monitor.js +371 -0
  19. package/session-watcher.js +192 -0
  20. package/setup.js +114 -0
  21. package/sync-recent.js +63 -0
  22. package/README_CN.md +0 -201
  23. package/bin/openclaw-mem.js +0 -117
  24. package/docs/locales/README_AR.md +0 -35
  25. package/docs/locales/README_DE.md +0 -35
  26. package/docs/locales/README_ES.md +0 -35
  27. package/docs/locales/README_FR.md +0 -35
  28. package/docs/locales/README_HE.md +0 -35
  29. package/docs/locales/README_HI.md +0 -35
  30. package/docs/locales/README_ID.md +0 -35
  31. package/docs/locales/README_IT.md +0 -35
  32. package/docs/locales/README_JA.md +0 -57
  33. package/docs/locales/README_KO.md +0 -35
  34. package/docs/locales/README_NL.md +0 -35
  35. package/docs/locales/README_PL.md +0 -35
  36. package/docs/locales/README_PT.md +0 -35
  37. package/docs/locales/README_RU.md +0 -35
  38. package/docs/locales/README_TH.md +0 -35
  39. package/docs/locales/README_TR.md +0 -35
  40. package/docs/locales/README_UK.md +0 -35
  41. package/docs/locales/README_VI.md +0 -35
  42. package/docs/logo.svg +0 -32
  43. package/lib/context-builder.js +0 -415
  44. package/lib/database.js +0 -309
  45. package/lib/handler.js +0 -494
  46. package/scripts/commands.js +0 -141
  47. package/scripts/init.js +0 -248
package/gateway-llm.js ADDED
@@ -0,0 +1,250 @@
/**
 * DeepSeek LLM helper
 * Calls the DeepSeek OpenAI-compatible endpoint to summarize sessions.
 */

const SUMMARY_SESSION_PREFIX = 'mem-summary:';
const DEFAULT_DEEPSEEK_BASE_URL = 'https://api.deepseek.com/v1';
const DEFAULT_DEEPSEEK_MODEL = 'deepseek-chat';

function getDeepSeekBaseUrl() {
  return process.env.DEEPSEEK_BASE_URL || DEFAULT_DEEPSEEK_BASE_URL;
}

function getDeepSeekApiKey() {
  return process.env.DEEPSEEK_API_KEY || '';
}

function getDeepSeekModel() {
  return process.env.DEEPSEEK_MODEL || DEFAULT_DEEPSEEK_MODEL;
}

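// Example configuration (illustrative values, not shipped with the
// package; only DEEPSEEK_API_KEY is required, the base URL and model
// need overriding only for non-default deployments):
//   export DEEPSEEK_API_KEY=sk-...
//   export DEEPSEEK_BASE_URL=https://api.deepseek.com/v1
//   export DEEPSEEK_MODEL=deepseek-chat
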
function truncateText(text, maxChars) {
  if (!text) return '';
  if (text.length <= maxChars) return text;
  return text.slice(0, maxChars) + '…';
}

function formatTranscript(messages, maxChars = 12000) {
  const lines = [];
  for (const m of messages) {
    const role = (m.role || 'unknown').toUpperCase();
    const content = String(m.content || '').replace(/\s+/g, ' ').trim();
    if (!content) continue;
    lines.push(`${role}: ${content}`);
  }
  return truncateText(lines.join('\n'), maxChars);
}

function parseSummaryJson(text) {
  if (!text) return null;
  const match = text.match(/\{[\s\S]*\}/);
  if (!match) return null;
  try {
    const obj = JSON.parse(match[0]);
    return obj && typeof obj === 'object' ? obj : null;
  } catch {
    return null;
  }
}

function normalizeSummaryFields(obj) {
  if (!obj) return null;
  const pick = (key) => {
    const val = obj[key];
    if (typeof val === 'string') return val.trim();
    if (val == null) return '';
    return String(val).trim();
  };
  return {
    request: pick('request'),
    investigated: pick('investigated'),
    learned: pick('learned'),
    completed: pick('completed'),
    next_steps: pick('next_steps')
  };
}

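// Illustrative behavior (hypothetical input): parseSummaryJson tolerates
// prose around the model's output by grabbing the outermost {...} span:
//   parseSummaryJson('Here is the summary:\n{"request":"fix build"}\nDone.')
//   // => { request: 'fix build' }
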
async function callGatewayChat(messages, options = {}) {
  const {
    sessionKey = 'unknown', // reserved for logging; not currently used
    temperature = 0.2,
    max_tokens = 300,
    model
  } = options;
  const apiKey = getDeepSeekApiKey();
  if (!apiKey) {
    console.log('[openclaw-mem] No DEEPSEEK_API_KEY found');
    return null;
  }
  const baseUrl = getDeepSeekBaseUrl();
  const resolvedModel = model || getDeepSeekModel();
  const url = `${baseUrl}/chat/completions`;
  const payload = {
    model: resolvedModel,
    stream: false,
    temperature,
    max_tokens,
    messages
  };

  const headers = {
    'Content-Type': 'application/json',
    'Authorization': `Bearer ${apiKey}`
  };

  try {
    console.log('[openclaw-mem] Calling DeepSeek API...');
    const res = await fetch(url, {
      method: 'POST',
      headers,
      body: JSON.stringify(payload)
    });
    if (!res.ok) {
      const errText = await res.text();
      console.error('[openclaw-mem] DeepSeek API error:', res.status, errText);
      return null;
    }
    const json = await res.json();
    const content = json?.choices?.[0]?.message?.content || '';
    console.log('[openclaw-mem] DeepSeek response received');
    return content;
  } catch (err) {
    console.error('[openclaw-mem] DeepSeek fetch error:', err.message);
    return null;
  }
}

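// Hypothetical direct call (callGatewayChat is exported below); returns
// the assistant message content as a string, or null on any failure:
//   const reply = await callGatewayChat(
//     [{ role: 'user', content: 'One-line status update, please.' }],
//     { temperature: 0.2, max_tokens: 50 }
//   );
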
export async function summarizeSession(messages, options = {}) {
  const { sessionKey = 'unknown' } = options;
  const transcript = formatTranscript(messages, 12000);
  if (!transcript) return null;

  const buildPrompts = (strict = false) => {
    const systemPrompt = `You are a session summarizer for an AI agent memory system. Your summaries help the agent recall past work in future sessions.

INSTRUCTIONS:
- Focus on OUTCOMES and DELIVERABLES, not conversational flow
- Use action verbs: implemented, fixed, configured, discovered, decided, explored
- Be specific: include file names, tool names, error messages, key decisions
- Write in the language the user used (Chinese if they spoke Chinese, English if English)

OUTPUT FORMAT: Return ONLY a valid JSON object with these fields:
{
"request": "What the user wanted to accomplish (1 sentence, specific)",
"investigated": "What was explored or researched to fulfill the request",
"learned": "Key technical insights, discoveries, or new understanding gained",
"completed": "Concrete deliverables: what was built, fixed, configured, or decided",
"next_steps": "Unfinished work or logical follow-up actions (null if fully completed)"
}

QUALITY GUIDELINES:
- "request" should capture the real goal, not just "user asked a question"
- "investigated" should list specific files read, APIs explored, architectures examined
- "learned" should contain reusable knowledge (not "learned how to do X" but the actual insight)
- "completed" should be a concrete outcome someone can verify
- "next_steps" should be actionable, not vague

${strict ? 'CRITICAL: Output ONLY the JSON object. No markdown, no explanation, no code fences.' : ''}`;

    const userPrompt = 'Session transcript:\n' + transcript + '\n\nJSON:';
    return [
      { role: 'system', content: systemPrompt },
      { role: 'user', content: userPrompt }
    ];
  };

  // First attempt
  let content = await callGatewayChat(buildPrompts(false), { sessionKey, temperature: 0.2, max_tokens: 600 });
  let parsed = parseSummaryJson(content || '');
  if (parsed) return normalizeSummaryFields(parsed);

  // Retry once with stricter instruction
  content = await callGatewayChat(buildPrompts(true), { sessionKey, temperature: 0.1, max_tokens: 600 });
  parsed = parseSummaryJson(content || '');
  if (parsed) return normalizeSummaryFields(parsed);

  return null;
}

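// Hypothetical call site showing the expected result shape; returns null
// when the API key is missing or both parse attempts fail:
//   const summary = await summarizeSession(
//     [{ role: 'user', content: 'Fix the failing CI build' },
//      { role: 'assistant', content: 'Patched the workflow config.' }],
//     { sessionKey: 'session-123' }
//   );
//   // => { request, investigated, learned, completed, next_steps } or null
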
// ============ Local Embedding Model (multilingual-e5-small) ============

const EMBEDDING_MODEL = 'Xenova/multilingual-e5-small';
const EMBEDDING_DIMS = 384;
const EMBEDDING_PREFIX = 'query: '; // e5 models expect a task prefix

// Singleton: lazily initialized embedding pipeline
let _extractorPromise = null;

function getExtractor() {
  if (!_extractorPromise) {
    _extractorPromise = (async () => {
      try {
        const { pipeline } = await import('@huggingface/transformers');
        console.log('[openclaw-mem] Loading embedding model (first run downloads ~110MB)...');
        const extractor = await pipeline('feature-extraction', EMBEDDING_MODEL);
        console.log('[openclaw-mem] Embedding model loaded');
        return extractor;
      } catch (err) {
        console.error('[openclaw-mem] Failed to load embedding model:', err.message);
        _extractorPromise = null; // Allow retry
        return null;
      }
    })();
  }
  return _extractorPromise;
}

/**
 * Generate an embedding vector for text using the local multilingual-e5-small model.
 * Returns a Float32Array of EMBEDDING_DIMS (384) dimensions, or null on failure.
 */
export async function callGatewayEmbeddings(text) {
  try {
    const extractor = await getExtractor();
    if (!extractor) return null;

    const input = EMBEDDING_PREFIX + text;
    const output = await extractor(input, {
      pooling: 'mean',
      normalize: true,
    });

    return new Float32Array(output.data);
  } catch (err) {
    console.error('[openclaw-mem] Embedding generation error:', err.message);
    return null;
  }
}

/**
 * Generate embeddings for multiple texts sequentially.
 * Returns an array of Float32Array, with null entries on failure.
 */
export async function batchEmbeddings(texts) {
  const extractor = await getExtractor();
  if (!extractor) return texts.map(() => null);

  const results = [];
  for (const text of texts) {
    try {
      const input = EMBEDDING_PREFIX + text;
      const output = await extractor(input, {
        pooling: 'mean',
        normalize: true,
      });
      results.push(new Float32Array(output.data));
    } catch (err) {
      console.error('[openclaw-mem] Batch embedding error:', err.message);
      results.push(null);
    }
  }
  return results;
}

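// Illustrative similarity check (hypothetical, not part of this module).
// The vectors are L2-normalized above, so a plain dot product equals
// cosine similarity:
//   const [a, b] = await batchEmbeddings(['fix the build', 'repair the build']);
//   if (a && b) {
//     let dot = 0;
//     for (let i = 0; i < EMBEDDING_DIMS; i++) dot += a[i] * b[i];
//     console.log('cosine similarity:', dot.toFixed(3));
//   }
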
export { EMBEDDING_DIMS };

export const INTERNAL_SUMMARY_PREFIX = SUMMARY_SESSION_PREFIX;
export { callGatewayChat };