@psiclawops/hypermem 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (94) hide show
  1. package/ARCHITECTURE.md +296 -0
  2. package/LICENSE +190 -0
  3. package/README.md +243 -0
  4. package/dist/background-indexer.d.ts +117 -0
  5. package/dist/background-indexer.d.ts.map +1 -0
  6. package/dist/background-indexer.js +732 -0
  7. package/dist/compaction-fence.d.ts +89 -0
  8. package/dist/compaction-fence.d.ts.map +1 -0
  9. package/dist/compaction-fence.js +153 -0
  10. package/dist/compositor.d.ts +139 -0
  11. package/dist/compositor.d.ts.map +1 -0
  12. package/dist/compositor.js +1109 -0
  13. package/dist/cross-agent.d.ts +57 -0
  14. package/dist/cross-agent.d.ts.map +1 -0
  15. package/dist/cross-agent.js +254 -0
  16. package/dist/db.d.ts +131 -0
  17. package/dist/db.d.ts.map +1 -0
  18. package/dist/db.js +398 -0
  19. package/dist/desired-state-store.d.ts +100 -0
  20. package/dist/desired-state-store.d.ts.map +1 -0
  21. package/dist/desired-state-store.js +212 -0
  22. package/dist/doc-chunk-store.d.ts +115 -0
  23. package/dist/doc-chunk-store.d.ts.map +1 -0
  24. package/dist/doc-chunk-store.js +278 -0
  25. package/dist/doc-chunker.d.ts +99 -0
  26. package/dist/doc-chunker.d.ts.map +1 -0
  27. package/dist/doc-chunker.js +324 -0
  28. package/dist/episode-store.d.ts +48 -0
  29. package/dist/episode-store.d.ts.map +1 -0
  30. package/dist/episode-store.js +135 -0
  31. package/dist/fact-store.d.ts +57 -0
  32. package/dist/fact-store.d.ts.map +1 -0
  33. package/dist/fact-store.js +175 -0
  34. package/dist/fleet-store.d.ts +144 -0
  35. package/dist/fleet-store.d.ts.map +1 -0
  36. package/dist/fleet-store.js +276 -0
  37. package/dist/hybrid-retrieval.d.ts +60 -0
  38. package/dist/hybrid-retrieval.d.ts.map +1 -0
  39. package/dist/hybrid-retrieval.js +340 -0
  40. package/dist/index.d.ts +611 -0
  41. package/dist/index.d.ts.map +1 -0
  42. package/dist/index.js +1042 -0
  43. package/dist/knowledge-graph.d.ts +110 -0
  44. package/dist/knowledge-graph.d.ts.map +1 -0
  45. package/dist/knowledge-graph.js +305 -0
  46. package/dist/knowledge-store.d.ts +72 -0
  47. package/dist/knowledge-store.d.ts.map +1 -0
  48. package/dist/knowledge-store.js +241 -0
  49. package/dist/library-schema.d.ts +22 -0
  50. package/dist/library-schema.d.ts.map +1 -0
  51. package/dist/library-schema.js +717 -0
  52. package/dist/message-store.d.ts +76 -0
  53. package/dist/message-store.d.ts.map +1 -0
  54. package/dist/message-store.js +273 -0
  55. package/dist/preference-store.d.ts +54 -0
  56. package/dist/preference-store.d.ts.map +1 -0
  57. package/dist/preference-store.js +109 -0
  58. package/dist/preservation-gate.d.ts +82 -0
  59. package/dist/preservation-gate.d.ts.map +1 -0
  60. package/dist/preservation-gate.js +150 -0
  61. package/dist/provider-translator.d.ts +40 -0
  62. package/dist/provider-translator.d.ts.map +1 -0
  63. package/dist/provider-translator.js +349 -0
  64. package/dist/rate-limiter.d.ts +76 -0
  65. package/dist/rate-limiter.d.ts.map +1 -0
  66. package/dist/rate-limiter.js +179 -0
  67. package/dist/redis.d.ts +188 -0
  68. package/dist/redis.d.ts.map +1 -0
  69. package/dist/redis.js +534 -0
  70. package/dist/schema.d.ts +15 -0
  71. package/dist/schema.d.ts.map +1 -0
  72. package/dist/schema.js +203 -0
  73. package/dist/secret-scanner.d.ts +51 -0
  74. package/dist/secret-scanner.d.ts.map +1 -0
  75. package/dist/secret-scanner.js +248 -0
  76. package/dist/seed.d.ts +108 -0
  77. package/dist/seed.d.ts.map +1 -0
  78. package/dist/seed.js +177 -0
  79. package/dist/system-store.d.ts +73 -0
  80. package/dist/system-store.d.ts.map +1 -0
  81. package/dist/system-store.js +182 -0
  82. package/dist/topic-store.d.ts +45 -0
  83. package/dist/topic-store.d.ts.map +1 -0
  84. package/dist/topic-store.js +136 -0
  85. package/dist/types.d.ts +329 -0
  86. package/dist/types.d.ts.map +1 -0
  87. package/dist/types.js +9 -0
  88. package/dist/vector-store.d.ts +132 -0
  89. package/dist/vector-store.d.ts.map +1 -0
  90. package/dist/vector-store.js +498 -0
  91. package/dist/work-store.d.ts +112 -0
  92. package/dist/work-store.d.ts.map +1 -0
  93. package/dist/work-store.js +273 -0
  94. package/package.json +57 -0
@@ -0,0 +1,732 @@
1
+ /**
2
+ * HyperMem Background Indexer
3
+ *
4
+ * Processes message history to extract structured knowledge:
5
+ * - Facts: atomic pieces of learned information
6
+ * - Episodes: significant events worth remembering
7
+ * - Topics: conversation threads and their lifecycle
8
+ * - Knowledge: durable structured entries (domain + key)
9
+ *
10
+ * Runs as a periodic background task, processing unindexed messages
11
+ * in batches. Each batch is scored, classified, and stored in L4 (library.db).
12
+ *
13
+ * Design principles:
14
+ * - No LLM dependency: extraction uses pattern matching + heuristics
15
+ * - Idempotent: tracks watermarks per agent to avoid reprocessing
16
+ * - Bounded: processes N messages per tick to avoid blocking
17
+ * - Observable: logs extraction stats for monitoring
18
+ */
19
+ import { MessageStore } from './message-store.js';
20
+ import { FactStore } from './fact-store.js';
21
+ import { EpisodeStore } from './episode-store.js';
22
+ import { TopicStore } from './topic-store.js';
23
+ import { KnowledgeStore } from './knowledge-store.js';
24
+ import { isSafeForSharedVisibility } from './secret-scanner.js';
25
/**
 * Extract fact candidates from free-form message text using pattern matching.
 *
 * Each pattern group carries a confidence score reflecting how reliable that
 * phrasing is as a signal of a real fact (decisions 0.75, operational events
 * 0.70, learnings 0.65, config/preferences 0.60). Matches are filtered
 * through isQualityFact() and deduplicated on exact candidate text — the
 * first occurrence wins, so a candidate matched by several pattern groups
 * keeps the confidence of the earliest group that saw it.
 *
 * @param {string} content - Raw message text.
 * @returns {Array<{content: string, confidence: number}>} fact candidates.
 */
function extractFactCandidates(content) {
    const facts = [];
    if (!content || content.length < 20)
        return facts;
    // Decision patterns: "decided to", "agreed on", "choosing", "going with" — high confidence (0.75)
    const decisionPatterns = [
        /(?:we |I |they )?(?:decided|agreed|chose|selected|committed) (?:to |on |that )(.{20,200})/gi,
        /(?:going|went) with (.{10,150})/gi,
        /decision:\s*(.{10,200})/gi,
    ];
    // Learned/discovered patterns — medium-high confidence (0.65)
    const learnedPatterns = [
        /(?:learned|discovered|found out|realized|noticed) (?:that |)(.{20,200})/gi,
        /turns out (?:that |)(.{20,200})/gi,
        /(?:TIL|FYI|note to self)[:\s]+(.{10,200})/gi,
    ];
    // Config/setting patterns — medium confidence (0.60); matches more promiscuously
    const configPatterns = [
        /(?:set|changed|updated|configured) (\S+ to .{5,150})/gi,
        /(?:model|config|setting)[:\s]+(\S+\s*(?:→|->|=|is)\s*.{5,100})/gi,
    ];
    // Preference patterns — medium confidence (0.60)
    const preferencePatterns = [
        /(?:prefer|always use|never use|don't use|avoid) (.{10,150})/gi,
        /(?:ragesaq|operator) (?:wants|prefers|likes|hates|dislikes) (.{10,150})/gi,
    ];
    // Operational patterns: deployments, incidents, fixes — high confidence (0.70)
    const operationalPatterns = [
        /(?:deployed|shipped|released|rolled back|reverted) (.{10,200})/gi,
        /(?:outage|incident|failure|broke|broken|crashed)(?:: | — | - )(.{10,200})/gi,
        /(?:fixed|resolved|patched|hotfixed) (.{10,200})/gi,
    ];
    const patternGroups = [
        { patterns: decisionPatterns, confidence: 0.75 },
        { patterns: learnedPatterns, confidence: 0.65 },
        { patterns: configPatterns, confidence: 0.60 },
        { patterns: preferencePatterns, confidence: 0.60 },
        { patterns: operationalPatterns, confidence: 0.70 },
    ];
    // FIX: dedupe on candidate text — overlapping patterns (e.g. a decision that
    // also mentions a deployment) previously produced duplicate fact entries.
    const seen = new Set();
    for (const { patterns, confidence } of patternGroups) {
        for (const pattern of patterns) {
            let match;
            // Reset lastIndex: /g regexes advance statefully across exec() calls.
            pattern.lastIndex = 0;
            while ((match = pattern.exec(content)) !== null) {
                const candidate = match[1].trim();
                // Quality gate: reject noise that matched patterns but isn't a real fact
                if (!isQualityFact(candidate))
                    continue;
                if (seen.has(candidate))
                    continue; // already captured by an earlier (higher-priority) group
                seen.add(candidate);
                facts.push({ content: candidate, confidence });
            }
        }
    }
    return facts;
}
/**
 * TUNE-011: Quality gate for fact extraction.
 * Rejects pattern matches that are code, table fragments, questions,
 * or too short to be meaningful facts.
 *
 * @param {string} content - Candidate fact text (already trimmed).
 * @returns {boolean} true if the candidate looks like a natural-language fact.
 */
function isQualityFact(content) {
    // Too short — sentence fragments
    if (content.length < 40)
        return false;
    // Too long — likely captured a paragraph, not a fact
    if (content.length > 300)
        return false;
    // Fewer than 5 words — fragment
    const wordCount = content.split(/\s+/).filter(w => w.length > 0).length;
    if (wordCount < 5)
        return false;
    // Questions — not assertions of fact
    if (content.trimEnd().endsWith('?'))
        return false;
    // Code indicators: braces, arrows, imports, variable declarations
    if (/^[\s{}\[\]|`]/.test(content))
        return false; // starts with structural char
    if (/[{}].*[{}]/.test(content))
        return false; // contains paired braces (code blocks)
    if (/^\s*(import|export|const|let|var|function|class|interface|type|return|if|for|while|switch)\s/i.test(content))
        return false;
    if (/=>\s*[{(]/.test(content))
        return false; // arrow functions
    if (/SELECT\s|INSERT\s|UPDATE\s|DELETE\s|CREATE\s/i.test(content))
        return false; // SQL
    // Table cell fragments: contains pipe-delimited cells
    if (/\|.*\|.*\|/.test(content))
        return false;
    // Regex patterns leaked from source
    if (/\/[^/]+\/[gimsuvy]*[,;]/.test(content))
        return false;
    // Raw file paths without context (tool output, not facts)
    if (/^\/[\w/.-]+$/.test(content.trim()))
        return false;
    // Markdown formatting artifacts
    if (content.startsWith('```') || content.startsWith('---') || content.startsWith('==='))
        return false;
    // Git output
    if (/^[a-f0-9]{7,40}\s/.test(content) || /^\+\+\+|^---\s[ab]\//.test(content))
        return false;
    if (/^\d+ files? changed/.test(content))
        return false;
    // Stack traces
    if (/^\s*at\s+\S+\s+\(/.test(content) || /node:internal/.test(content))
        return false;
    // High non-alpha ratio indicates code/data, not natural language
    const alphaChars = (content.match(/[a-zA-Z]/g) || []).length;
    if (alphaChars / content.length < 0.5)
        return false;
    return true;
}
136
/**
 * Classify a message for episode significance.
 * Returns episode type and significance score, or null if not significant.
 *
 * @param {{textContent?: string, isHeartbeat?: boolean}} msg - Message record.
 * @returns {{type: string, significance: number, summary: string} | null}
 */
function classifyEpisode(msg) {
    const content = msg.textContent || '';
    if (!content || content.length < 50)
        return null; // Raised from 30
    // Skip heartbeats
    if (msg.isHeartbeat)
        return null;
    // Skip messages that are primarily code/data output (tool results, logs)
    const alphaRatio = (content.match(/[a-zA-Z]/g) || []).length / content.length;
    if (alphaRatio < 0.4)
        return null;
    // Skip messages that start with structural output indicators
    if (/^[\s]*[{[\d|#=+\-]/.test(content) && content.length < 200)
        return null;
    const lower = content.toLowerCase();
    // ── Negation-aware incident detection ──────────────────────
    // Only trigger on actual incidents, not "zero failures" or "no crashes"
    const incidentTerms = ['outage', 'incident', 'failure', 'crash', 'broke', 'broken', 'emergency'];
    const negationPrefixes = ['no ', 'zero ', 'without ', '0 ', 'never ', 'fixed ', 'resolved '];
    const hasIncidentTerm = incidentTerms.some(term => lower.includes(term));
    const isNegated = hasIncidentTerm && incidentTerms.some(term => {
        const idx = lower.indexOf(term);
        if (idx < 0)
            return false;
        // `lower` is already lowercased, so the window needs no re-lowering.
        const prefix = lower.substring(Math.max(0, idx - 15), idx);
        // FIX: match negation words WITH their trailing space. The old code
        // stripped it (trimEnd), so 'no' matched inside words like "know" or
        // "nothing" and falsely suppressed genuine incidents. The 15-char
        // window ends at the term, so "no outage" still yields "...no " here.
        return negationPrefixes.some(neg => prefix.includes(neg));
    });
    if (hasIncidentTerm && !isNegated && content.length > 100) {
        // Genuine incident — verify it's describing a problem, not analyzing code
        if (!/^\s*(\/\/|#|\*|\/\*|```|import|const|function)/.test(content)) {
            const summary = content.slice(0, 200);
            return { type: 'incident', significance: 0.9, summary };
        }
    }
    // Deployment events (high significance)
    if (/(?:deployed|shipped|released|went live|now live|go live)/i.test(content) &&
        content.length > 60) {
        const summary = content.slice(0, 200);
        return { type: 'deployment', significance: 0.8, summary };
    }
    // Architecture decisions (high significance)
    if (/(?:decided on|chose|committed to|architecture|design decision)/i.test(content) &&
        content.length > 80) {
        const summary = content.slice(0, 200);
        return { type: 'decision', significance: 0.7, summary };
    }
    // Discovery/insight (medium significance)
    if (/(?:discovered|found|realized|root cause|turns out)/i.test(content) && content.length > 80) {
        const summary = content.slice(0, 200);
        return { type: 'discovery', significance: 0.5, summary };
    }
    // Config changes (medium significance) — TUNE-004: raised to 0.5
    if (/(?:changed|updated|migrated|switched|model.*(?:→|->|to))/i.test(content) && content.length > 60) {
        // Skip if it's just a tool output confirmation
        if (/^Successfully replaced|^\[main [a-f0-9]|^ok \d+ -/.test(content))
            return null;
        const summary = content.slice(0, 200);
        return { type: 'config_change', significance: 0.5, summary };
    }
    // Milestone/completion (medium significance)
    if (/(?:completed|finished|done|milestone|all tests pass|all green)/i.test(content) &&
        content.length > 60) {
        // Skip tool output that happens to contain "done"
        if (/^Successfully|^\[main|^ok \d+/.test(content))
            return null;
        const summary = content.slice(0, 200);
        return { type: 'milestone', significance: 0.5, summary };
    }
    return null;
}
210
/**
 * Extract knowledge candidates — structured (domain, key, value) tuples.
 *
 * Produces entries in three domains:
 * - 'paths':    absolute filesystem paths mentioned in the message
 * - 'services': service/port bindings (e.g. "api runs on 8080", "localhost:3000")
 * - 'fleet':    agent identity/ownership statements
 *
 * Results are deduplicated on domain+key; the FIRST occurrence wins, so the
 * pattern order below is significant.
 *
 * @param {string} content - Raw message text.
 * @param {string} agentId - NOTE(review): currently unused; kept for interface
 *                           stability with callers that pass it.
 * @returns {Array<{domain: string, key: string, value: string}>}
 */
function extractKnowledgeCandidates(content, agentId) {
    const results = [];
    if (!content || content.length < 30)
        return results;
    // TUNE-012: Broadened path extraction.
    // Real messages use paths inline without explicit prefixes like "located at".
    // Match any absolute path that's at least 3 segments deep (filters /tmp, /etc noise).
    // Two alternatives: backtick-quoted absolute paths (group 1), or bare
    // /home|/opt|/var paths preceded by whitespace/:/= or line start (group 2).
    const pathMatches = content.matchAll(/(?:`([/][\w./-]{10,})`|(?:^|[\s:=])(\/home\/[\w./-]{10,}|\/opt\/[\w./-]{10,}|\/var\/[\w./-]{10,}))/gm);
    for (const match of pathMatches) {
        // Strip trailing punctuation that regularly clings to inline paths.
        const value = (match[1] || match[2]).replace(/[`'".,;:)]+$/, '').trim();
        if (value.length > 10 && value.split('/').length >= 4) {
            const segments = value.split('/').filter(s => s.length > 0);
            const lastSeg = segments[segments.length - 1] || '';
            // Reject truncated paths (last segment < 3 chars unless it's a known ext)
            if (lastSeg.length < 3 && !lastSeg.includes('.'))
                continue;
            // Key is the basename; fall back to the parent dir for trailing-slash paths.
            const key = lastSeg || segments[segments.length - 2] || 'unknown';
            results.push({ domain: 'paths', key, value });
        }
    }
    // Explicit location references (original patterns, kept for completeness)
    const locationPatterns = [
        /(?:path|located at|lives at|stored at|found at|repo at|running at)[:\s]+(`[^`]+`|\/\S+)/gi,
        /(?:workspace|directory|repo|project)[:\s]+(`[^`]+`|\/\S+)/gi,
    ];
    for (const pattern of locationPatterns) {
        // /g regexes keep state across exec() calls — reset before scanning.
        pattern.lastIndex = 0;
        let match;
        while ((match = pattern.exec(content)) !== null) {
            // NOTE: /g here strips quoting/punctuation chars EVERYWHERE in the
            // value, not just at the ends (unlike the anchored replace above).
            const value = match[1].replace(/[`'".,;:)]+/g, '').trim();
            // Skip values already captured by the inline-path scan.
            if (value.startsWith('/') && value.length > 10 && !results.some(r => r.value === value)) {
                const key = value.split('/').pop() || 'unknown';
                results.push({ domain: 'paths', key, value });
            }
        }
    }
    // Service/port patterns — broadened to catch "port NNNN" and "on :NNNN"
    const servicePatterns = [
        /(\S+)\s+(?:runs on|listening on|port|on port)\s+(\d{2,5})/gi,
        /(?:service|server|daemon)\s+(\S+)\s+(?:on |at |: )(\S+)/gi,
        /(?:localhost|127\.0\.0\.1):(\d{2,5})\b/gi,
    ];
    for (const pattern of servicePatterns) {
        pattern.lastIndex = 0;
        let match;
        while ((match = pattern.exec(content)) !== null) {
            // The localhost pattern has only one capture (the port), so it is
            // keyed differently from the two-capture name/value patterns.
            if (pattern.source.includes('localhost')) {
                // localhost:PORT pattern — key is the port, value is the URL
                results.push({ domain: 'services', key: `port:${match[1]}`, value: match[0] });
            }
            else {
                results.push({ domain: 'services', key: match[1], value: match[2] });
            }
        }
    }
    // Agent identity patterns — broadened
    const identityPatterns = [
        /(\w+)\s+(?:is|was)\s+(?:the\s+)?(\w+)\s+(?:seat|director|specialist|council)/gi,
        /(\w+)\s+(?:reports to|owned by|managed by)\s+(\w+)/gi,
        // NOTE(review): the repeated group below only retains the LAST name in
        // a comma/slash list — earlier names in "agents: a, b, c" are dropped.
        /(?:agents?|directors?|seats?)[:\s]+(\w+)(?:\s*[,/]\s*(\w+))+/gi,
    ];
    for (const pattern of identityPatterns) {
        pattern.lastIndex = 0;
        let match;
        while ((match = pattern.exec(content)) !== null) {
            if (match[2]) {
                results.push({ domain: 'fleet', key: match[1].toLowerCase(), value: `${match[1]} ${match[2]}` });
            }
        }
    }
    // Dedup by domain+key
    const seen = new Set();
    return results.filter(r => {
        const k = `${r.domain}:${r.key}`;
        if (seen.has(k))
            return false;
        seen.add(k);
        return true;
    });
}
293
/**
 * Detect a conversation topic from message content.
 *
 * Checks, in priority order: known product/project names (returned as
 * matched, preserving the original casing in the text), then a generic
 * 'infrastructure' bucket, then a generic 'security' bucket.
 *
 * @param {string} content - Raw message text.
 * @returns {string | null} topic name candidate, or null if none detected.
 */
function detectTopic(content) {
    // Guard: too little text to classify reliably.
    if (!content || content.length < 50)
        return null;
    const PRODUCT_RE = /\b(HyperMem|ClawText|ClawDash|ClawCanvas|ClawCouncil|ClawTomation|OpenClaw|ClawDispatch)\b/i;
    const INFRA_RE = /\b(?:redis|sqlite|database|migration|deployment|docker|nginx)\b/i;
    const SECURITY_RE = /\b(?:security|auth|permission|access|token|credential)\b/i;
    // Product names take precedence over the generic buckets.
    const product = content.match(PRODUCT_RE);
    if (product)
        return product[1];
    if (INFRA_RE.test(content))
        return 'infrastructure';
    if (SECURITY_RE.test(content))
        return 'security';
    return null;
}
314
// ─── Background Indexer ─────────────────────────────────────────
/**
 * Periodic background task that mines raw message history into structured
 * L4 memory: facts, episodes, topics, and knowledge (domain/key/value) tuples.
 *
 * Database handles are obtained lazily via the injected accessor functions;
 * progress is tracked with a per-agent watermark table so reprocessing is
 * avoided across restarts.
 *
 * NOTE(review): db handles are used through a synchronous
 * `prepare().run()/get()/all()` API (better-sqlite3 style) — confirm against
 * the db module.
 */
export class BackgroundIndexer {
    getMessageDb;           // (agentId) => per-agent message db handle
    getLibraryDb;           // () => shared library (L4) db handle
    listAgents;             // () => array of agent ids to index each tick
    getCursor;              // optional async (agentId, sessionKey) => cursor with lastSentId
    config;                 // resolved config; defaults applied in constructor
    intervalHandle = null;  // setInterval handle while started, else null
    running = false;        // re-entrancy guard so ticks never overlap
    vectorStore = null;     // optional embedding store (see setVectorStore)
    /**
     * @param config Partial indexer config; every missing field gets a default
     *               (enabled=true, 5-minute interval, 24h dormant / 7d closed
     *               topic thresholds, 0.01 decay rate, 0.5 episode threshold).
     * @param getMessageDb Accessor for an agent's message database.
     * @param getLibraryDb Accessor for the shared library database.
     * @param listAgents Returns the agent ids to process each tick.
     * @param getCursor Optional cursor fetcher used to prioritize unseen messages.
     */
    constructor(config, getMessageDb, getLibraryDb, listAgents, getCursor) {
        this.getMessageDb = getMessageDb;
        this.getLibraryDb = getLibraryDb;
        this.listAgents = listAgents;
        this.getCursor = getCursor;
        this.config = {
            enabled: config?.enabled ?? true,
            factExtractionMode: config?.factExtractionMode ?? 'tiered',
            topicDormantAfter: config?.topicDormantAfter ?? '24h',
            topicClosedAfter: config?.topicClosedAfter ?? '7d',
            factDecayRate: config?.factDecayRate ?? 0.01,
            episodeSignificanceThreshold: config?.episodeSignificanceThreshold ?? 0.5,
            periodicInterval: config?.periodicInterval ?? 300000, // 5 minutes
        };
    }
    /**
     * Set the vector store for embedding new facts/episodes at index time.
     * Optional — if not set, indexer runs without embedding (FTS5-only mode).
     */
    setVectorStore(vs) {
        this.vectorStore = vs;
    }
    /**
     * Start periodic indexing. No-op if disabled by config or already started.
     * Runs one tick immediately, then every `periodicInterval` ms; tick errors
     * are logged rather than thrown (nothing awaits the interval callback).
     */
    start() {
        if (!this.config.enabled)
            return;
        if (this.intervalHandle)
            return;
        // Run once immediately
        this.tick().catch(err => {
            console.error('[indexer] Initial tick failed:', err);
        });
        // Then periodically
        this.intervalHandle = setInterval(() => {
            this.tick().catch(err => {
                console.error('[indexer] Periodic tick failed:', err);
            });
        }, this.config.periodicInterval);
        console.log(`[indexer] Started with interval ${this.config.periodicInterval}ms`);
    }
    /**
     * Stop periodic indexing. Safe to call when not started; an in-flight
     * tick is not interrupted, only future scheduling is cancelled.
     */
    stop() {
        if (this.intervalHandle) {
            clearInterval(this.intervalHandle);
            this.intervalHandle = null;
        }
    }
    /**
     * Run one indexing pass across all agents.
     *
     * Overlap-guarded via `this.running`: if a previous tick is still active,
     * this call returns [] immediately. Per-agent failures are logged and do
     * not abort the pass. Decay runs at the end of every successful pass
     * (but not on the early-return paths).
     *
     * @returns {Promise<Array>} per-agent stats for agents with work done.
     */
    async tick() {
        if (this.running) {
            console.log('[indexer] Skipping tick — previous run still active');
            return [];
        }
        this.running = true;
        const results = [];
        try {
            if (!this.listAgents || !this.getMessageDb || !this.getLibraryDb) {
                console.warn('[indexer] Missing database accessors — skipping');
                return [];
            }
            const agents = this.listAgents();
            const libraryDb = this.getLibraryDb();
            for (const agentId of agents) {
                try {
                    const stats = await this.processAgent(agentId, libraryDb);
                    if (stats.messagesProcessed > 0) {
                        results.push(stats);
                    }
                }
                catch (err) {
                    // One agent failing must not stop the others.
                    const msg = err instanceof Error ? err.message : String(err);
                    console.error(`[indexer] Failed to process ${agentId}: ${msg}`);
                }
            }
            if (results.length > 0) {
                const totalMessages = results.reduce((s, r) => s + r.messagesProcessed, 0);
                const totalFacts = results.reduce((s, r) => s + r.factsExtracted, 0);
                const totalEpisodes = results.reduce((s, r) => s + r.episodesRecorded, 0);
                console.log(`[indexer] Tick complete: ${totalMessages} messages → ${totalFacts} facts, ${totalEpisodes} episodes`);
            }
            // Run decay on every tick
            this.applyDecay(libraryDb);
        }
        finally {
            // Always release the overlap guard, even after a throw.
            this.running = false;
        }
        return results;
    }
    /**
     * Process a single agent's unindexed messages.
     *
     * When a cursor fetcher is available, messages are split into two tiers:
     * - Post-cursor (id > cursor.lastSentId): "unseen" by the model, high-signal priority
     * - Pre-cursor (id <= cursor.lastSentId): already in the model's context window, lower priority
     * Post-cursor messages are processed first. This ensures the indexer prioritizes
     * content the model hasn't seen yet — decisions, incidents, and discoveries that
     * happened between context windows.
     *
     * The watermark advances to the max id of ALL fetched messages regardless
     * of tier, so prioritization affects only processing order, not coverage.
     *
     * @returns {Promise<object>} extraction stats for this agent.
     */
    async processAgent(agentId, libraryDb) {
        const start = Date.now();
        const messageDb = this.getMessageDb(agentId);
        // NOTE(review): messageStore is constructed but never used below —
        // messages are fetched via raw SQL in getUnindexedMessages().
        const messageStore = new MessageStore(messageDb);
        const factStore = new FactStore(libraryDb);
        const episodeStore = new EpisodeStore(libraryDb);
        const topicStore = new TopicStore(libraryDb);
        const knowledgeStore = new KnowledgeStore(libraryDb);
        // Get watermark — last processed message ID for this agent
        const watermark = this.getWatermark(libraryDb, agentId);
        const lastProcessedId = watermark?.lastMessageId ?? 0;
        // Fetch unindexed messages (batch size: 100)
        const messages = this.getUnindexedMessages(messageDb, agentId, lastProcessedId, 100);
        if (messages.length === 0) {
            return {
                agentId,
                messagesProcessed: 0,
                factsExtracted: 0,
                episodesRecorded: 0,
                topicsUpdated: 0,
                knowledgeUpserted: 0,
                postCursorMessages: 0,
                elapsedMs: Date.now() - start,
            };
        }
        // ── Cursor-aware prioritization ──────────────────────────────
        // Fetch the cursor boundary to split messages into post-cursor (unseen)
        // and pre-cursor (already in context). Post-cursor messages are processed
        // first — they're the highest signal for fact/episode extraction.
        let cursorBoundary = 0;
        if (this.getCursor) {
            try {
                // Get session key from the first message's conversation
                const sessionKey = this.getSessionKeyForMessage(messageDb, messages[0].conversationId);
                if (sessionKey) {
                    const cursor = await this.getCursor(agentId, sessionKey);
                    if (cursor) {
                        cursorBoundary = cursor.lastSentId;
                    }
                }
            }
            catch {
                // Cursor fetch is best-effort — fall through to default ordering
            }
        }
        // Sort: post-cursor messages first (highest signal), then pre-cursor.
        // Within each tier, maintain original (ascending) order.
        const postCursor = messages.filter(m => m.id > cursorBoundary);
        const preCursor = messages.filter(m => m.id <= cursorBoundary);
        const ordered = [...postCursor, ...preCursor];
        let factsExtracted = 0;
        let episodesRecorded = 0;
        let topicsUpdated = 0;
        let knowledgeUpserted = 0;
        let maxMessageId = lastProcessedId;
        for (const msg of ordered) {
            const content = msg.textContent || '';
            // Track the high-water mark over every fetched message, even ones
            // skipped below, so the watermark never re-serves this batch.
            if (msg.id > maxMessageId)
                maxMessageId = msg.id;
            // Skip heartbeats and very short messages
            if (msg.isHeartbeat || content.length < 30)
                continue;
            // 1. Extract facts (TUNE-003: confidence varies by extraction pattern type)
            const factCandidates = extractFactCandidates(content);
            for (const { content: factContent, confidence: factConfidence } of factCandidates) {
                try {
                    const fact = factStore.addFact(agentId, factContent, {
                        scope: 'agent',
                        confidence: factConfidence,
                        sourceType: 'indexer',
                        sourceSessionKey: this.getSessionKeyForMessage(messageDb, msg.conversationId),
                        sourceRef: `msg:${msg.id}`,
                    });
                    factsExtracted++;
                    // Embed new fact for semantic recall (best-effort, non-blocking)
                    if (this.vectorStore && fact.id) {
                        this.vectorStore.indexItem('facts', fact.id, factContent, fact.domain || undefined)
                            .catch(() => { });
                    }
                }
                catch {
                    // Duplicate or constraint violation — skip
                }
            }
            // 2. Classify episodes
            const episode = classifyEpisode(msg);
            if (episode && episode.significance >= this.config.episodeSignificanceThreshold) {
                // Secret gate: shared visibility requires clean content.
                // Downgrade to 'private' rather than drop, so we don't lose the episode.
                const episodeVisibility = isSafeForSharedVisibility(episode.summary) ? 'org' : 'private';
                try {
                    const recorded = episodeStore.record(agentId, episode.type, episode.summary, {
                        significance: episode.significance,
                        visibility: episodeVisibility,
                        sessionKey: this.getSessionKeyForMessage(messageDb, msg.conversationId),
                    });
                    episodesRecorded++;
                    // Embed high-significance episodes (decisions, incidents, deployments)
                    if (this.vectorStore && recorded?.id && episode.significance >= 0.7) {
                        this.vectorStore.indexItem('episodes', recorded.id, episode.summary, episode.type)
                            .catch(() => { });
                    }
                }
                catch {
                    // Skip duplicate episodes
                }
            }
            // 3. Detect and update topics (create only if no active topic with
            // the same case-insensitive name exists)
            const topicName = detectTopic(content);
            if (topicName) {
                try {
                    const existingTopics = topicStore.getActive(agentId, 100);
                    const existingTopic = existingTopics.find((t) => t.name.toLowerCase() === topicName.toLowerCase());
                    if (!existingTopic) {
                        topicStore.create(agentId, topicName, `Auto-detected from conversation`);
                        topicsUpdated++;
                    }
                }
                catch {
                    // Skip topic creation errors
                }
            }
            // 4. Extract knowledge candidates
            const knowledgeCandidates = extractKnowledgeCandidates(content, agentId);
            for (const { domain, key, value } of knowledgeCandidates) {
                try {
                    knowledgeStore.upsert(agentId, domain, key, value, {
                        sourceType: 'indexer',
                        sourceRef: `msg:${msg.id}`,
                    });
                    knowledgeUpserted++;
                }
                catch {
                    // Skip duplicates
                }
            }
        }
        // Update watermark
        this.setWatermark(libraryDb, agentId, maxMessageId);
        return {
            agentId,
            messagesProcessed: messages.length,
            factsExtracted,
            episodesRecorded,
            topicsUpdated,
            knowledgeUpserted,
            postCursorMessages: postCursor.length,
            elapsedMs: Date.now() - start,
        };
    }
    /**
     * Fetch unindexed messages for an agent (ascending id, bounded batch).
     *
     * NOTE(review): c.session_key is selected but not mapped onto the
     * returned objects — callers use getSessionKeyForMessage() instead.
     */
    getUnindexedMessages(db, agentId, afterId, limit) {
        const rows = db.prepare(`
      SELECT m.*, c.session_key
      FROM messages m
      JOIN conversations c ON m.conversation_id = c.id
      WHERE m.agent_id = ? AND m.id > ?
      ORDER BY m.id ASC
      LIMIT ?
    `).all(agentId, afterId, limit);
        // Map snake_case rows to the camelCase message shape used above.
        return rows.map(row => ({
            id: row.id,
            conversationId: row.conversation_id,
            agentId: row.agent_id,
            role: row.role,
            textContent: row.text_content || null,
            toolCalls: row.tool_calls ? JSON.parse(row.tool_calls) : null,
            toolResults: row.tool_results ? JSON.parse(row.tool_results) : null,
            metadata: row.metadata ? JSON.parse(row.metadata) : undefined,
            messageIndex: row.message_index,
            tokenCount: row.token_count || null,
            isHeartbeat: row.is_heartbeat === 1,
            createdAt: row.created_at,
        }));
    }
    /**
     * Get the session key for a conversation ID.
     * Returns undefined when the conversation row is missing.
     */
    getSessionKeyForMessage(db, conversationId) {
        const row = db.prepare('SELECT session_key FROM conversations WHERE id = ?').get(conversationId);
        return row?.session_key;
    }
    /**
     * Get the indexing watermark for an agent, or null if none recorded.
     * Lazily creates the watermark table on first use (runs on every call;
     * CREATE TABLE IF NOT EXISTS makes repeats cheap no-ops).
     */
    getWatermark(libraryDb, agentId) {
        // Ensure watermarks table exists
        libraryDb.prepare(`
      CREATE TABLE IF NOT EXISTS indexer_watermarks (
        agent_id TEXT PRIMARY KEY,
        last_message_id INTEGER NOT NULL DEFAULT 0,
        last_run_at TEXT NOT NULL
      )
    `).run();
        const row = libraryDb.prepare('SELECT agent_id, last_message_id, last_run_at FROM indexer_watermarks WHERE agent_id = ?').get(agentId);
        if (!row)
            return null;
        return {
            agentId: row.agent_id,
            lastMessageId: row.last_message_id,
            lastRunAt: row.last_run_at,
        };
    }
    /**
     * Set (insert-or-update) the indexing watermark for an agent.
     * Assumes the table already exists — getWatermark() runs first in
     * processAgent() and creates it.
     */
    setWatermark(libraryDb, agentId, lastMessageId) {
        const now = new Date().toISOString();
        libraryDb.prepare(`
      INSERT INTO indexer_watermarks (agent_id, last_message_id, last_run_at)
      VALUES (?, ?, ?)
      ON CONFLICT(agent_id) DO UPDATE SET
        last_message_id = excluded.last_message_id,
        last_run_at = excluded.last_run_at
    `).run(agentId, lastMessageId, now);
    }
    /**
     * Apply time-based decay to facts.
     * Increases decay_score for older facts, making them less relevant.
     * Episodes decay at half the fact rate; topics transition
     * active → dormant → closed based on configured durations.
     *
     * The interpolated thresholds below are integers produced by
     * parseDuration() (never user strings), so the template SQL is safe.
     */
    applyDecay(libraryDb) {
        const rate = this.config.factDecayRate;
        // Decay facts that haven't been referenced recently
        libraryDb.prepare(`
      UPDATE facts
      SET decay_score = MIN(1.0, decay_score + ?)
      WHERE superseded_by IS NULL
        AND decay_score < 1.0
        AND updated_at < datetime('now', '-1 day')
    `).run(rate);
        // Decay episodes older than 7 days
        libraryDb.prepare(`
      UPDATE episodes
      SET decay_score = MIN(1.0, decay_score + ?)
      WHERE decay_score < 1.0
        AND created_at < datetime('now', '-7 days')
    `).run(rate * 0.5);
        // Mark dormant topics
        const dormantThreshold = this.parseDuration(this.config.topicDormantAfter);
        if (dormantThreshold > 0) {
            libraryDb.prepare(`
        UPDATE topics
        SET status = 'dormant'
        WHERE status = 'active'
          AND updated_at < datetime('now', '-${dormantThreshold} seconds')
      `).run();
        }
        // Close old dormant topics
        const closedThreshold = this.parseDuration(this.config.topicClosedAfter);
        if (closedThreshold > 0) {
            libraryDb.prepare(`
        UPDATE topics
        SET status = 'closed'
        WHERE status = 'dormant'
          AND updated_at < datetime('now', '-${closedThreshold} seconds')
      `).run();
        }
    }
    /**
     * Parse a duration string like "24h", "7d" into seconds.
     * Returns 0 for anything that doesn't match `<int><s|m|h|d>`, which
     * callers treat as "threshold disabled".
     */
    parseDuration(dur) {
        const match = dur.match(/^(\d+)\s*(h|d|m|s)$/);
        if (!match)
            return 0;
        // Regex guarantees plain decimal digits, so the radix is unambiguous.
        const val = parseInt(match[1]);
        switch (match[2]) {
            case 's': return val;
            case 'm': return val * 60;
            case 'h': return val * 3600;
            case 'd': return val * 86400;
            default: return 0;
        }
    }
    /**
     * Get current watermarks for all agents.
     * Returns [] if the watermark table doesn't exist yet (query throws).
     */
    getWatermarks(libraryDb) {
        try {
            const rows = libraryDb.prepare('SELECT agent_id, last_message_id, last_run_at FROM indexer_watermarks ORDER BY agent_id').all();
            return rows.map(r => ({
                agentId: r.agent_id,
                lastMessageId: r.last_message_id,
                lastRunAt: r.last_run_at,
            }));
        }
        catch {
            return [];
        }
    }
}
721
// ─── Standalone runner ──────────────────────────────────────────
/**
 * Factory: build a BackgroundIndexer wired to HyperMem databases, optionally
 * attaching a vector store for embedding at index time.
 * Used by the hook or a standalone daemon.
 *
 * @returns {BackgroundIndexer} a configured (not yet started) indexer.
 */
export function createIndexer(getMessageDb, getLibraryDb, listAgents, config, getCursor, vectorStore) {
    const indexer = new BackgroundIndexer(config, getMessageDb, getLibraryDb, listAgents, getCursor);
    if (vectorStore) {
        indexer.setVectorStore(vectorStore);
    }
    return indexer;
}
732
+ //# sourceMappingURL=background-indexer.js.map