@alex900530/claude-persistent-memory 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/lib/utils.js ADDED
@@ -0,0 +1,92 @@
1
+ /**
2
+ * Minimal utility functions for the persistent memory system.
3
+ * Extracted from .claude/scripts/lib/utils.js - only memory-relevant utilities.
4
+ */
5
+
6
+ const fs = require('fs');
7
+ const path = require('path');
8
+
9
/**
 * Ensure a directory exists (create recursively if not).
 *
 * Uses a single `mkdirSync` call with `recursive: true`, which is a no-op
 * when the directory already exists. This avoids the check-then-create
 * (TOCTOU) race of the previous `existsSync` + `mkdirSync` pair, where
 * another process could create the directory between the two calls and
 * the create would then throw.
 *
 * @param {string} dirPath - Directory path to ensure
 * @returns {string} The directory path (returned for call chaining)
 */
function ensureDir(dirPath) {
  fs.mkdirSync(dirPath, { recursive: true });
  return dirPath;
}
20
+
21
/**
 * Calculate cosine similarity between two vectors.
 *
 * @param {number[]} vec1 - First vector
 * @param {number[]} vec2 - Second vector
 * @returns {number} Similarity in [-1, 1]; returns 0 when either input is
 *   missing, the lengths differ, or either vector has zero magnitude.
 *   (The previous doc claimed [0, 1], which only holds for vectors with
 *   non-negative components — embedding vectors can produce negatives.)
 */
function cosineSimilarity(vec1, vec2) {
  if (!vec1 || !vec2 || vec1.length !== vec2.length) return 0;

  let dotProduct = 0;
  let norm1 = 0;
  let norm2 = 0;

  for (let i = 0; i < vec1.length; i++) {
    dotProduct += vec1[i] * vec2[i];
    norm1 += vec1[i] * vec1[i];
    norm2 += vec2[i] * vec2[i];
  }

  // Zero-magnitude vectors (including empty arrays) have no defined angle;
  // report 0 instead of dividing by zero (which would yield NaN).
  const magnitude = Math.sqrt(norm1) * Math.sqrt(norm2);
  return magnitude === 0 ? 0 : dotProduct / magnitude;
}
43
+
44
/**
 * Emit a message on stderr.
 *
 * stderr is used because it is visible to the user in Claude Code while
 * keeping stdout clean for protocol/data output.
 *
 * @param {string} message - Message to log
 */
function log(message) {
  console.error(message);
}
51
+
52
/**
 * Read a UTF-8 text file, treating any failure (missing file, permission
 * error, path is a directory) as "no content".
 *
 * @param {string} filePath - Absolute path to the file
 * @returns {string|null} File contents, or null when the read fails
 */
function readFile(filePath) {
  let contents = null;
  try {
    contents = fs.readFileSync(filePath, 'utf8');
  } catch {
    // Deliberately swallowed: an absent/unreadable file is an expected case.
  }
  return contents;
}
64
+
65
/**
 * Write a UTF-8 text file, creating any missing parent directories first.
 *
 * @param {string} filePath - Absolute path to the file
 * @param {string} content - Content to write (replaces existing content)
 */
function writeFile(filePath, content) {
  const parent = path.dirname(filePath);
  if (!fs.existsSync(parent)) {
    fs.mkdirSync(parent, { recursive: true });
  }
  fs.writeFileSync(filePath, content, 'utf8');
}
74
+
75
/**
 * Append UTF-8 text to a file, creating any missing parent directories
 * first. The file itself is created on the first append.
 *
 * @param {string} filePath - Absolute path to the file
 * @param {string} content - Content to append
 */
function appendFile(filePath, content) {
  const parent = path.dirname(filePath);
  if (!fs.existsSync(parent)) {
    fs.mkdirSync(parent, { recursive: true });
  }
  fs.appendFileSync(filePath, content, 'utf8');
}
84
+
85
// Public API of this utility module. Consumers elsewhere in the package
// (e.g. the embedding/LLM servers) pull these in via
// `require('../lib/utils')`.
module.exports = {
  ensureDir,
  cosineSimilarity,
  log,
  readFile,
  writeFile,
  appendFile,
};
package/package.json ADDED
@@ -0,0 +1,44 @@
1
+ {
2
+ "name": "@alex900530/claude-persistent-memory",
3
+ "version": "1.0.0",
4
+ "description": "Persistent memory system for Claude Code — hybrid BM25 + vector search, LLM-driven structuring, automatic clustering",
5
+ "main": "lib/memory-db.js",
6
+ "bin": {
7
+ "claude-persistent-memory": "bin/setup.js"
8
+ },
9
+ "scripts": {
10
+ "postinstall": "node bin/setup.js --postinstall",
11
+ "setup": "node bin/setup.js",
12
+ "uninstall": "node bin/uninstall.js",
13
+ "embedding-server": "node services/embedding-server.js",
14
+ "llm-server": "node services/llm-server.js",
15
+ "mcp-server": "node services/memory-mcp-server.js",
16
+ "rebuild-vectors": "node tools/rebuild-vectors.js"
17
+ },
18
+ "files": [
19
+ "bin/",
20
+ "hooks/",
21
+ "lib/",
22
+ "services/",
23
+ "tools/",
24
+ "config.js",
25
+ "config.default.js"
26
+ ],
27
+ "publishConfig": {
28
+ "registry": "https://registry.npmjs.org"
29
+ },
30
+ "engines": {
31
+ "node": ">=18"
32
+ },
33
+ "dependencies": {
34
+ "@huggingface/transformers": "^3.8.1",
35
+ "@modelcontextprotocol/sdk": "^1.26.0",
36
+ "better-sqlite3": "^12.6.2",
37
+ "sqlite-vec": "^0.1.7-alpha.2",
38
+ "zod": "^3.24.0"
39
+ },
40
+ "optionalDependencies": {
41
+ "nodejieba": "^2.6.0"
42
+ },
43
+ "license": "MIT"
44
+ }
@@ -0,0 +1,108 @@
1
+ #!/usr/bin/env node
2
+ const net = require('net');
3
+ const fs = require('fs');
4
+ const path = require('path');
5
+ const config = require('../config');
6
+ const { ensureDir } = require('../lib/utils');
7
+
8
// Network location and on-disk PID file for this server instance.
const PORT = config.embeddingPort;
const PID_FILE = path.join(config.pidDir, 'claude-embedding.pid');

// Server lifecycle state (module-level, mutated by initialize()/startServer()).
let memoryDb = null;   // set by initialize(); holds the lib/memory-db module
let isReady = false;   // flips to true once the embedding model is warmed up
let server = null;     // net.Server handle, created in startServer()

// Request/response log file; the log directory is created up front so that
// the best-effort appends in log() have somewhere to land.
const LOG_FILE = path.join(config.logDir, 'embedding-server.log');
ensureDir(config.logDir);
17
+
18
// Render any value as a log-friendly string: null/undefined become '',
// strings pass through unchanged, everything else is JSON-encoded.
function str(v) {
  if (v == null) return '';
  return typeof v === 'string' ? v : JSON.stringify(v);
}
19
// Append one timestamped line to the server log. Logging is best-effort:
// any filesystem error (e.g. log dir removed at runtime) is swallowed so
// that logging can never crash the server.
function log(msg) {
  try {
    fs.appendFileSync(LOG_FILE, `[${new Date().toISOString()}] ${msg}\n`);
  } catch (e) {
    // intentionally ignored
  }
}
20
+
21
/**
 * Load the memory DB module and warm up the embedding model.
 * Sets the module-level `isReady` flag on success; exits the process with
 * code 1 on any failure, since the server is useless without its model.
 */
async function initialize() {
  console.error('[EmbeddingServer] Starting...');
  try {
    // Required lazily so the (potentially slow) model load happens here,
    // not at module load time.
    memoryDb = require('../lib/memory-db');
    if (memoryDb.warmupEmbedding) {
      console.error('[EmbeddingServer] Warming up embedding model...');
      await memoryDb.warmupEmbedding();
      console.error('[EmbeddingServer] Embedding model ready');
    }
    isReady = true;
  } catch (e) {
    console.error('[EmbeddingServer] Failed to initialize:', e.message);
    process.exit(1);
  }
}
36
+
37
/**
 * Handle one newline-delimited JSON request and return a response object.
 * Supported actions: search, quickSearch, ping, shutdown, stats.
 *
 * @param {string} data - One JSON line from the socket
 * @returns {Promise<object>} Always a `{ success, ... }` object; parse or
 *   handler errors are converted into `{ success: false, error }`.
 */
async function handleRequest(data) {
  if (!isReady) return { success: false, error: 'Server not ready' };
  try {
    const request = JSON.parse(data);
    const startTime = Date.now();
    switch (request.action) {
      case 'search': {
        // NOTE(review): `request.limit || 3` turns an explicit limit of 0
        // into 3 — presumably intended, confirm with callers.
        log(`[REQ] action=search query=${str(request.query)} limit=${request.limit || 3}`);
        const results = await memoryDb.search(request.query, request.limit || 3, request.options || {});
        const duration = Date.now() - startTime;
        log(`[RES] action=search duration=${duration}ms results=${results.length} matches=${results.map(r => '#' + r.id + '(' + (r.vectorSimilarity != null ? r.vectorSimilarity.toFixed(3) : '?') + ')').join(',')}`);
        return { success: true, results };
      }
      case 'quickSearch': {
        log(`[REQ] action=quickSearch query=${str(request.query)} limit=${request.limit || 3}`);
        const quickResults = memoryDb.quickSearch(request.query, request.limit || 3, request.options || {});
        const duration = Date.now() - startTime;
        log(`[RES] action=quickSearch duration=${duration}ms results=${quickResults.length} matches=${quickResults.map(r => '#' + r.id + '(' + (r.vectorSimilarity != null ? r.vectorSimilarity.toFixed(3) : '?') + ')').join(',')}`);
        return { success: true, results: quickResults };
      }
      case 'ping':
        return { success: true, message: 'pong', ready: isReady };
      case 'shutdown':
        console.error('[EmbeddingServer] Shutdown requested');
        // Small delay so the response below can be flushed to the socket
        // before the process exits.
        setTimeout(() => { cleanup(); process.exit(0); }, 100);
        return { success: true, message: 'Shutting down' };
      case 'stats': {
        // Braced block added: a bare `const` in an unbraced case clause is
        // scoped to the entire switch (no-case-declarations hazard) and
        // would throw at runtime if another case ever reused the name.
        const stats = memoryDb.getStats();
        return { success: true, stats };
      }
      default:
        return { success: false, error: `Unknown action: ${request.action}` };
    }
  } catch (e) {
    log(`[ERR] error=${e.message}`);
    return { success: false, error: e.message };
  }
}
72
+
73
// Best-effort teardown: remove the PID file and close the DB handle.
// Every error is ignored — cleanup runs on all exit paths, including ones
// where the PID file or DB may already be gone.
function cleanup() {
  try {
    if (fs.existsSync(PID_FILE)) {
      fs.unlinkSync(PID_FILE);
    }
    if (memoryDb && memoryDb.closeDb) {
      memoryDb.closeDb();
    }
  } catch (e) {
    // intentionally ignored
  }
}
76
+
77
/**
 * Initialize the model, then listen for newline-delimited JSON requests on
 * 127.0.0.1:PORT. One JSON response line is written per request line.
 * Writes a PID file once listening; exits 0 if another instance already
 * holds the port.
 */
async function startServer() {
  await initialize();
  server = net.createServer((socket) => {
    // Per-connection receive buffer; requests are framed by '\n'.
    let buffer = '';
    socket.on('data', async (chunk) => {
      buffer += chunk.toString();
      const lines = buffer.split('\n');
      buffer = lines.pop(); // keep trailing partial line for the next chunk
      for (const line of lines) {
        if (line.trim()) {
          // NOTE(review): the 'data' handler is async, so responses from
          // concurrently arriving chunks could interleave out of order —
          // presumably clients send one request per connection at a time;
          // confirm against the client code.
          const response = await handleRequest(line);
          socket.write(JSON.stringify(response) + '\n');
        }
      }
    });
    socket.on('error', () => {}); // drop broken clients silently
  });
  server.on('error', (err) => {
    // An already-running instance is treated as success (exit code 0).
    if (err.code === 'EADDRINUSE') { console.error(`[EmbeddingServer] Port ${PORT} already in use`); process.exit(0); }
    console.error('[EmbeddingServer] Server error:', err.message);
    cleanup();
    process.exit(1);
  });
  server.listen(PORT, '127.0.0.1', () => {
    console.error(`[EmbeddingServer] Listening on 127.0.0.1:${PORT}`);
    fs.writeFileSync(PID_FILE, process.pid.toString());
  });
  // Graceful shutdown on signals: remove PID file, close DB, then exit.
  process.on('SIGTERM', () => { console.error('[EmbeddingServer] SIGTERM received'); cleanup(); process.exit(0); });
  process.on('SIGINT', () => { console.error('[EmbeddingServer] SIGINT received'); cleanup(); process.exit(0); });
}
107
+
108
+ startServer().catch((err) => { console.error('[EmbeddingServer] Failed to start:', err.message); process.exit(1); });
@@ -0,0 +1,421 @@
1
+ #!/usr/bin/env node
2
+ /**
3
+ * LLM Server (Azure OpenAI) - LLM classification service using Azure OpenAI API
4
+ *
5
+ * Same functionality as llm-server.js, but uses Azure OpenAI instead of local llama-server
6
+ */
7
+
8
+ const net = require('net');
9
+ const https = require('https');
10
+ const fs = require('fs');
11
+ const path = require('path');
12
+ const os = require('os');
13
+ const config = require('../config');
14
+ const { ensureDir } = require('../lib/utils');
15
+
16
// Network location and on-disk PID file for this server instance.
const PORT = config.llmPort;
const PID_FILE = path.join(config.pidDir, 'claude-llm.pid');

// Azure OpenAI Configuration — all values come from config.js, which
// presumably reads AZURE_OPENAI_ENDPOINT / AZURE_OPENAI_KEY from the
// environment (see the error text below); confirm against config.js.
const AZURE_CONFIG = {
  endpoint: config.azure.endpoint,
  apiKey: config.azure.apiKey,
  deployment: config.azure.deployment,
  apiVersion: config.azure.apiVersion,
};

// Fail fast at module load: without credentials every request would fail.
if (!AZURE_CONFIG.endpoint || !AZURE_CONFIG.apiKey) {
  console.error('[LLMServer] Error: Azure OpenAI endpoint and apiKey must be configured.');
  console.error('[LLMServer] Set AZURE_OPENAI_ENDPOINT and AZURE_OPENAI_KEY environment variables,');
  console.error('[LLMServer] or configure them in config.js');
  process.exit(1);
}

// Server lifecycle state.
let isReady = false;  // true once the Azure connection check passes
let server = null;    // net.Server handle, created in startServer()

// Request/response log file; directory created up front for log().
const LOG_FILE = path.join(config.logDir, 'llm-server.log');
ensureDir(config.logDir);
39
+
40
// Stringify a value for log output: nullish values become the empty
// string, strings are returned unchanged, anything else is JSON-encoded.
function str(v) {
  if (v == null) {
    return '';
  }
  return typeof v === 'string' ? v : JSON.stringify(v);
}
41
+
42
// Write one timestamped line to the service log. Logging is best-effort:
// any filesystem error is swallowed so it can never take down the server.
function log(msg) {
  try {
    fs.appendFileSync(LOG_FILE, `[${new Date().toISOString()}] ${msg}\n`);
  } catch (e) {
    // intentionally ignored — logging must never throw
  }
}
46
+
47
+ // ============== Azure OpenAI API ==============
48
+
49
/**
 * Call the Azure OpenAI chat-completions REST API.
 *
 * @param {Array<{role: string, content: string}>} messages - Chat messages.
 * @param {number|null} [maxTokens=200] - Completion token cap. Any falsy
 *   value (null, 0) falls through to 32768 via the `||` below.
 * @returns {Promise<string>} The first choice's message content ('' when
 *   absent). Rejects on network error, the 60s socket timeout, a non-JSON
 *   body, or an `error` field in the response body.
 *   NOTE(review): the HTTP status code itself is never checked — an error
 *   is only detected via `json.error`; confirm Azure always sets it.
 */
async function callAzureOpenAI(messages, maxTokens = 200) {
  const startTime = Date.now();
  // Pull out the system/user messages purely for request logging.
  const userMsg = messages.find(m => m.role === 'user');
  const sysMsg = messages.find(m => m.role === 'system');
  log(`[AZURE-REQ] system=${str(sysMsg?.content)} user=${str(userMsg?.content)} max_tokens=${maxTokens}`);

  return new Promise((resolve, reject) => {
    // Azure's deployment-scoped chat-completions path, resolved against
    // the configured endpoint.
    const url = new URL(
      `/openai/deployments/${AZURE_CONFIG.deployment}/chat/completions?api-version=${AZURE_CONFIG.apiVersion}`,
      AZURE_CONFIG.endpoint
    );

    const postData = JSON.stringify({
      messages,
      max_tokens: maxTokens || 32768,
      temperature: 0.1
    });

    const options = {
      hostname: url.hostname,
      port: 443,
      path: url.pathname + url.search,
      method: 'POST',
      headers: {
        'Content-Type': 'application/json',
        'api-key': AZURE_CONFIG.apiKey
      },
      timeout: 60000 // socket inactivity timeout, handled below
    };

    const req = https.request(options, (res) => {
      // Accumulate the whole body before parsing (responses are small JSON).
      let data = '';
      res.on('data', chunk => data += chunk);
      res.on('end', () => {
        const duration = Date.now() - startTime;
        try {
          const json = JSON.parse(data);
          if (json.error) {
            log(`[AZURE-ERR] duration=${duration}ms error=${json.error.message || 'Azure API error'}`);
            reject(new Error(json.error.message || 'Azure API error'));
          } else {
            const content = json.choices?.[0]?.message?.content || '';
            const usage = json.usage || {};
            log(`[AZURE-RES] duration=${duration}ms tokens=${usage.prompt_tokens||'-'}/${usage.completion_tokens||'-'}/${usage.total_tokens||'-'} response=${str(content)}`);
            resolve(content);
          }
        } catch (e) {
          // Body was not JSON (e.g. an HTML error page from a proxy).
          log(`[AZURE-ERR] duration=${duration}ms parse_error=${e.message} raw=${str(data)}`);
          reject(new Error(`Invalid response: ${data.slice(0, 200)}`));
        }
      });
    });

    req.on('error', (e) => {
      const duration = Date.now() - startTime;
      log(`[AZURE-ERR] duration=${duration}ms network_error=${e.message}`);
      reject(e);
    });
    req.on('timeout', () => {
      // destroy() will also fire 'error'; the extra reject there is a no-op
      // because a promise can only settle once.
      const duration = Date.now() - startTime;
      log(`[AZURE-ERR] duration=${duration}ms timeout`);
      req.destroy();
      reject(new Error('Request timeout'));
    });

    req.write(postData);
    req.end();
  });
}
118
+
119
+ // ============== Request Handling ==============
120
+
121
/**
 * Dispatch one parsed request object to its LLM action.
 *
 * Actions:
 *  - ping:           readiness probe
 *  - structurize:    turn free text into one XML <memory> block (or reject)
 *  - merge:          merge several memories into one XML <memory> block
 *  - analyzeSession: extract up to 3 memories from a session transcript
 *
 * @param {{action: string, text?: string}} data - Parsed request object.
 * @returns {Promise<object>} A `{ success, ... }` response object; LLM
 *   failures are reported as `{ success: false, error }`.
 */
async function handleRequest(data) {
  const { action, text } = data;

  switch (action) {
    case 'ping':
      return { success: true, ready: isReady };

    case 'structurize': {
      const { type: memType } = data;
      // Which XML fields each memory type is expected to carry; embedded
      // into the prompt so the model omits the rest.
      const typeRules = {
        fact: 'only <what>',
        pattern: '<what> + <when> + <do> + <warn>',
        decision: '<what> + <warn>',
        preference: '<what> + <warn>',
        bug: '<what> + <do>',
        context: '<what> + <when>'
      };
      const rule = typeRules[memType] || typeRules.context;

      const messages = [
        {
          role: 'system',
          content: `You are a memory structuring assistant. Structure content into XML-formatted persistent memory.

First determine: is this worth saving long-term?
- One-off operation instructions ("change A to B") -> return REJECT
- Temporary conversation/debugging requests -> return REJECT
- Only meaningful in the current session -> return REJECT

If it has value, output XML (do not output anything else):
<memory type="${memType || 'context'}" domain="choose one: frontend/backend/database/devops/testing/memory/general">
<what>Core fact, 1-2 sentences, remove redundant words (required)</what>
<when>When to trigger/apply (use | to separate multiple scenarios)</when>
<do>Specific operation steps or commands (use ; to separate)</do>
<warn>Prohibited actions or common pitfalls</warn>
</memory>

Current type ${memType || 'context'} uses fields: ${rule}
Omit fields that are not needed.`
        },
        {
          role: 'user',
          content: text
        }
      ];

      try {
        const response = await callAzureOpenAI(messages, 300);
        const trimmed = response.trim();

        // A REJECT verdict without any <memory> tag means "not worth saving".
        if (/REJECT/i.test(trimmed) && !trimmed.includes('<memory')) {
          return { success: true, structured: { __rejected: true, reason: 'low value' } };
        }

        const xmlMatch = trimmed.match(/<memory[\s\S]*?<\/memory>/);
        if (xmlMatch) {
          return { success: true, structured: xmlMatch[0] };
        }
        return { success: false, error: 'No XML found in response' };
      } catch (e) {
        console.error('[LLMServer-Azure] Structurize error:', e.message);
        return { success: false, error: e.message };
      }
    }

    case 'merge': {
      const { memories, domain: mergeDomain } = data;
      if (!memories || !Array.isArray(memories) || memories.length === 0) {
        return { success: false, error: 'memories array required' };
      }

      const d = mergeDomain || 'general';
      // Number each memory so the model can reference them.
      const memoriesText = memories.map((m, i) => `[${i + 1}] ${m}`).join('\n');
      const messages = [
        {
          role: 'system',
          content: `You are a knowledge aggregation assistant. Deduplicate and merge multiple related memories into a single XML memory.

Merge rules:
- <what> Summarize the core theme of all memories in 1-2 sentences
- <when> Merge all applicable scenarios (use | to separate)
- <do> Merge all specific operations (use ; to separate), remove duplicates
- <warn> Merge all warnings, remove duplicates

Output only XML:
<memory type="pattern" domain="${d}">
<what>...</what>
<when>...</when>
<do>...</do>
<warn>...</warn>
</memory>`
        },
        {
          role: 'user',
          content: `Merge the following ${memories.length} memories:\n\n${memoriesText}`
        }
      ];

      try {
        const response = await callAzureOpenAI(messages, 500);
        const xmlMatch = response.match(/<memory[\s\S]*?<\/memory>/);
        if (xmlMatch) {
          return { success: true, merged: xmlMatch[0] };
        }

        // fallback: no XML came back, so synthesize a merged record locally.
        // NOTE(review): this returns an object while the success path above
        // returns an XML string — callers must handle both shapes; also
        // assumes memories[0] is a string (`.slice`). Confirm with callers.
        return {
          success: true,
          merged: {
            summary: memories[0].slice(0, 100),
            content: memories.join('\n---\n'),
            scenarios: [], rules: { must: [], must_not: [], prefer: [] }, triggers: []
          }
        };
      } catch (e) {
        console.error('[LLMServer-Azure] Merge error:', e.message);
        return { success: false, error: e.message };
      }
    }

    case 'analyzeSession': {
      const { transcript } = data;
      // Transcripts under 50 chars are too short to contain anything worth
      // extracting; skip the LLM call entirely.
      if (!transcript || transcript.length < 50) {
        return { success: true, memories: [] };
      }

      const messages = [
        {
          role: 'system',
          content: `You are a development session analysis assistant. Analyze session transcripts and extract content worth saving as long-term memory.

[Extraction criteria] Only extract:
1. bug: error encountered -> fix experience (including error message and fix method)
2. decision: user's explicitly stated technical decisions or preferences ("always use X from now on", "don't use Y")
3. pattern: reusable development patterns or operational workflows
4. preference: user's coding habits, tool preferences

[Do NOT extract]
- One-off operation instructions ("add a button", "modify the API", "optimize xxx")
- Code snapshots or specific implementation details (code changes, not worth memorizing)
- Routine file viewing/searching/installing dependencies/starting services
- Information queries and Q&A
- Specific steps of the current task

[Output format]
Return a <memory> block for each memory:
<memory type="choose one: bug/decision/pattern/preference" domain="choose one: frontend/backend/database/devops/testing/memory/general" confidence="0.7-0.9">
<summary>Plain text summary (one sentence)</summary>
<what>Core fact (1-2 sentences)</what>
<when>Trigger scenarios (optional, use | to separate)</when>
<do>Specific operations (optional, use ; to separate)</do>
<warn>Caveats (optional)</warn>
</memory>

If there is nothing worth saving, return only NONE.
Better to extract fewer items than to extract low-value content. Return at most 3 items.`
        },
        {
          role: 'user',
          content: `=== Session Transcript ===\n${transcript}`
        }
      ];

      try {
        // null maxTokens -> falls through to the 32768 cap in callAzureOpenAI.
        const response = await callAzureOpenAI(messages, null);
        const trimmed = response.trim();

        if (/^NONE$/i.test(trimmed)) {
          return { success: true, memories: [] };
        }

        // Extract all <memory> blocks. The regex requires at least one
        // attribute after "<memory" — attribute-less blocks are skipped.
        const memoryBlocks = [];
        const regex = /<memory\s+([^>]+)>([\s\S]*?)<\/memory>/g;
        let match;
        while ((match = regex.exec(trimmed)) !== null) {
          const attrs = match[1];
          const body = match[2];

          // Parse attributes, with defaults when the model omitted them.
          const type = (attrs.match(/type="([^"]+)"/) || [])[1] || 'pattern';
          const domain = (attrs.match(/domain="([^"]+)"/) || [])[1] || 'general';
          const confidence = parseFloat((attrs.match(/confidence="([^"]+)"/) || [])[1] || '0.8');

          // Extract summary (plain-text index entry for the memory).
          const summaryMatch = body.match(/<summary>([\s\S]*?)<\/summary>/);
          const summary = summaryMatch ? summaryMatch[1].trim() : '';

          // Build structured_content (remove summary tag, keep the rest),
          // re-wrapped with normalized type/domain attributes.
          const structuredBody = body.replace(/<summary>[\s\S]*?<\/summary>\s*/, '');
          const structuredContent = `<memory type="${type}" domain="${domain}">\n${structuredBody.trim()}\n</memory>`;

          // Blocks without a summary are dropped entirely.
          if (summary) {
            memoryBlocks.push({ type, domain, confidence, summary, structuredContent });
          }
        }

        return { success: true, memories: memoryBlocks };
      } catch (e) {
        console.error('[LLMServer-Azure] analyzeSession error:', e.message);
        return { success: false, error: e.message, memories: [] };
      }
    }

    default:
      return { success: false, error: `Unknown action: ${action}` };
  }
}
329
+
330
+ // ============== Server Startup ==============
331
+
332
/**
 * Probe Azure OpenAI with a tiny 'ping' completion to verify the endpoint,
 * key, and deployment are usable before accepting any traffic.
 * @returns {Promise<boolean>} true when the probe call succeeds
 */
async function checkAzureConnection() {
  try {
    await callAzureOpenAI([{ role: 'user', content: 'ping' }], 10);
    return true;
  } catch (e) {
    console.error('[LLMServer-Azure] Connection check failed:', e.message);
    return false;
  }
}
342
+
343
/**
 * Boot sequence: verify Azure connectivity, then accept newline-delimited
 * JSON requests on 127.0.0.1:PORT (one JSON response line per request
 * line). Writes a PID file once listening; exits 0 if another instance
 * already holds the port, exits 1 on unrecoverable errors.
 */
async function startServer() {
  console.error('[LLMServer-Azure] Starting...');
  console.error(`[LLMServer-Azure] Endpoint: ${AZURE_CONFIG.endpoint}`);
  console.error(`[LLMServer-Azure] Deployment: ${AZURE_CONFIG.deployment}`);

  // Check connection — refuse to serve when Azure is unreachable.
  const connected = await checkAzureConnection();
  if (!connected) {
    console.error('[LLMServer-Azure] Failed to connect to Azure OpenAI');
    process.exit(1);
  }
  console.error('[LLMServer-Azure] Azure OpenAI connected');
  isReady = true;

  // Create TCP server (line-oriented JSON protocol).
  server = net.createServer((socket) => {
    // Per-connection receive buffer; requests are framed by '\n'.
    let buffer = '';

    socket.on('data', async (chunk) => {
      buffer += chunk.toString();
      const lines = buffer.split('\n');
      buffer = lines.pop(); // keep trailing partial line for the next chunk

      for (const line of lines) {
        if (line.trim()) {
          try {
            const data = JSON.parse(line);
            const response = await handleRequest(data);
            socket.write(JSON.stringify(response) + '\n');
          } catch (e) {
            // Malformed JSON (or a handler throw) becomes an error response
            // instead of killing the connection.
            socket.write(JSON.stringify({ success: false, error: e.message }) + '\n');
          }
        }
      }
    });

    socket.on('error', () => {}); // ignore client disconnect errors
  });

  server.on('error', (err) => {
    if (err.code === 'EADDRINUSE') {
      // Another instance is already serving this port: not an error.
      console.error(`[LLMServer-Azure] Port ${PORT} already in use`);
      process.exit(0);
    }
    console.error('[LLMServer-Azure] Server error:', err.message);
    process.exit(1);
  });

  server.listen(PORT, '127.0.0.1', () => {
    console.error(`[LLMServer-Azure] Listening on port ${PORT}`);
    fs.writeFileSync(PID_FILE, process.pid.toString());
  });

  // Graceful shutdown
  process.on('SIGTERM', () => {
    console.error('[LLMServer-Azure] SIGTERM received');
    cleanup();
    process.exit(0);
  });

  process.on('SIGINT', () => {
    console.error('[LLMServer-Azure] SIGINT received');
    cleanup();
    process.exit(0);
  });
}
409
+
410
// Remove this server's PID file if present. Best-effort: any error (file
// already gone, directory removed) is ignored.
function cleanup() {
  try {
    if (fs.existsSync(PID_FILE)) fs.unlinkSync(PID_FILE);
  } catch (e) {
    // intentionally ignored
  }
}
417
+
418
// Entry point: any startup failure (connection check, listen error) is fatal.
startServer().catch((err) => {
  console.error('[LLMServer-Azure] Failed to start:', err.message);
  process.exit(1);
});