npm - superlocalmemory - Versions diffs - 3.4.18 → 3.4.21 - Mend

superlocalmemory 3.4.18 → 3.4.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (172) hide show

package/CHANGELOG.md +35 -0
package/README.md +42 -34
package/bin/slm +11 -0
package/bin/slm.bat +12 -0
package/package.json +4 -3
package/pyproject.toml +3 -2
package/scripts/build-slm-hook.ps1 +40 -0
package/scripts/build-slm-hook.sh +45 -0
package/scripts/build_entry.py +452 -0
package/scripts/ci/stage5b_gate.sh +50 -0
package/scripts/postinstall/validation.js +187 -0
package/scripts/postinstall-interactive.js +756 -0
package/scripts/postinstall_binary.js +287 -0
package/scripts/release_manifest.py +273 -0
package/scripts/slm-hook.spec +56 -0
package/skills/slm-build-graph/SKILL.md +423 -0
package/skills/slm-list-recent/SKILL.md +348 -0
package/skills/slm-recall/SKILL.md +343 -0
package/skills/slm-remember/SKILL.md +194 -0
package/skills/slm-show-patterns/SKILL.md +224 -0
package/skills/slm-status/SKILL.md +363 -0
package/skills/slm-switch-profile/SKILL.md +442 -0
package/src/superlocalmemory/cli/commands.py +219 -79
package/src/superlocalmemory/cli/context_commands.py +192 -0
package/src/superlocalmemory/cli/daemon.py +15 -1
package/src/superlocalmemory/cli/db_migrate.py +80 -0
package/src/superlocalmemory/cli/escape_hatch.py +220 -0
package/src/superlocalmemory/cli/main.py +72 -1
package/src/superlocalmemory/core/context_cache.py +397 -0
package/src/superlocalmemory/core/embeddings.py +8 -2
package/src/superlocalmemory/core/engine.py +38 -2
package/src/superlocalmemory/core/engine_wiring.py +1 -1
package/src/superlocalmemory/core/ram_lock.py +111 -0
package/src/superlocalmemory/core/recall_pipeline.py +433 -3
package/src/superlocalmemory/core/recall_worker.py +8 -3
package/src/superlocalmemory/core/security_primitives.py +635 -0
package/src/superlocalmemory/core/shadow_router.py +319 -0
package/src/superlocalmemory/core/slm_disabled.py +87 -0
package/src/superlocalmemory/core/slmignore.py +125 -0
package/src/superlocalmemory/core/topic_signature.py +143 -0
package/src/superlocalmemory/core/worker_pool.py +14 -3
package/src/superlocalmemory/encoding/cognitive_consolidator.py +2 -2
package/src/superlocalmemory/evolution/budget.py +321 -0
package/src/superlocalmemory/evolution/llm_dispatch.py +508 -0
package/src/superlocalmemory/evolution/skill_evolver.py +144 -94
package/src/superlocalmemory/hooks/_outcome_common.py +506 -0
package/src/superlocalmemory/hooks/adapter_base.py +317 -0
package/src/superlocalmemory/hooks/antigravity_adapter.py +192 -0
package/src/superlocalmemory/hooks/claude_code_hooks.py +33 -1
package/src/superlocalmemory/hooks/context_payload.py +312 -0
package/src/superlocalmemory/hooks/copilot_adapter.py +154 -0
package/src/superlocalmemory/hooks/cross_platform_connector.py +90 -0
package/src/superlocalmemory/hooks/cursor_adapter.py +195 -0
package/src/superlocalmemory/hooks/hook_handlers.py +109 -8
package/src/superlocalmemory/hooks/ide_connector.py +25 -2
package/src/superlocalmemory/hooks/post_tool_async_hook.py +165 -0
package/src/superlocalmemory/hooks/post_tool_outcome_hook.py +223 -0
package/src/superlocalmemory/hooks/prewarm_auth.py +170 -0
package/src/superlocalmemory/hooks/session_registry.py +186 -0
package/src/superlocalmemory/hooks/stop_outcome_hook.py +134 -0
package/src/superlocalmemory/hooks/sync_loop.py +114 -0
package/src/superlocalmemory/hooks/user_prompt_hook.py +128 -0
package/src/superlocalmemory/hooks/user_prompt_rehash_hook.py +202 -0
package/src/superlocalmemory/infra/backup.py +3 -3
package/src/superlocalmemory/infra/cloud_backup.py +2 -2
package/src/superlocalmemory/infra/event_bus.py +2 -2
package/src/superlocalmemory/infra/webhook_dispatcher.py +3 -3
package/src/superlocalmemory/learning/arm_catalog.py +99 -0
package/src/superlocalmemory/learning/bandit.py +526 -0
package/src/superlocalmemory/learning/bandit_cache.py +133 -0
package/src/superlocalmemory/learning/behavioral.py +53 -1
package/src/superlocalmemory/learning/consolidation_cycle.py +381 -0
package/src/superlocalmemory/learning/consolidation_worker.py +188 -520
package/src/superlocalmemory/learning/database.py +256 -0
package/src/superlocalmemory/learning/dedup_hnsw.py +413 -0
package/src/superlocalmemory/learning/ensemble.py +300 -0
package/src/superlocalmemory/learning/fact_outcome_joins.py +207 -0
package/src/superlocalmemory/learning/forgetting_scheduler.py +55 -0
package/src/superlocalmemory/learning/hnsw_dedup.py +69 -0
package/src/superlocalmemory/learning/labeler.py +87 -0
package/src/superlocalmemory/learning/legacy_migration.py +277 -0
package/src/superlocalmemory/learning/memory_merge.py +160 -0
package/src/superlocalmemory/learning/model_cache.py +269 -0
package/src/superlocalmemory/learning/model_rollback.py +278 -0
package/src/superlocalmemory/learning/outcome_queue.py +284 -0
package/src/superlocalmemory/learning/pattern_miner.py +415 -0
package/src/superlocalmemory/learning/pattern_miner_constants.py +47 -0
package/src/superlocalmemory/learning/ranker.py +225 -81
package/src/superlocalmemory/learning/ranker_common.py +163 -0
package/src/superlocalmemory/learning/ranker_retrain_legacy.py +202 -0
package/src/superlocalmemory/learning/ranker_retrain_online.py +411 -0
package/src/superlocalmemory/learning/reward.py +777 -0
package/src/superlocalmemory/learning/reward_archive.py +210 -0
package/src/superlocalmemory/learning/reward_boost.py +201 -0
package/src/superlocalmemory/learning/reward_proxy.py +326 -0
package/src/superlocalmemory/learning/shadow_test.py +524 -0
package/src/superlocalmemory/learning/signal_worker.py +270 -0
package/src/superlocalmemory/learning/signals.py +314 -0
package/src/superlocalmemory/learning/trigram_index.py +547 -0
package/src/superlocalmemory/mcp/server.py +5 -5
package/src/superlocalmemory/mcp/tools_context.py +183 -0
package/src/superlocalmemory/mcp/tools_core.py +92 -27
package/src/superlocalmemory/parameterization/soft_prompt_generator.py +13 -0
package/src/superlocalmemory/retrieval/engine.py +52 -0
package/src/superlocalmemory/retrieval/reranker.py +4 -2
package/src/superlocalmemory/server/api.py +2 -2
package/src/superlocalmemory/server/bandit_loops.py +140 -0
package/src/superlocalmemory/server/middleware/__init__.py +11 -0
package/src/superlocalmemory/server/middleware/security_headers.py +144 -0
package/src/superlocalmemory/server/routes/backup.py +36 -13
package/src/superlocalmemory/server/routes/behavioral.py +50 -19
package/src/superlocalmemory/server/routes/brain.py +1234 -0
package/src/superlocalmemory/server/routes/data_io.py +4 -4
package/src/superlocalmemory/server/routes/events.py +2 -2
package/src/superlocalmemory/server/routes/helpers.py +1 -1
package/src/superlocalmemory/server/routes/learning.py +192 -7
package/src/superlocalmemory/server/routes/memories.py +189 -1
package/src/superlocalmemory/server/routes/prewarm.py +171 -0
package/src/superlocalmemory/server/routes/profiles.py +3 -3
package/src/superlocalmemory/server/routes/token.py +88 -0
package/src/superlocalmemory/server/routes/ws.py +5 -5
package/src/superlocalmemory/server/security_middleware.py +13 -7
package/src/superlocalmemory/server/ui.py +2 -2
package/src/superlocalmemory/server/unified_daemon.py +335 -3
package/src/superlocalmemory/storage/migration_runner.py +545 -0
package/src/superlocalmemory/storage/migrations/M001_add_signal_features_columns.py +67 -0
package/src/superlocalmemory/storage/migrations/M002_model_state_history.py +132 -0
package/src/superlocalmemory/storage/migrations/M003_migration_log.py +38 -0
package/src/superlocalmemory/storage/migrations/M004_cross_platform_sync_log.py +46 -0
package/src/superlocalmemory/storage/migrations/M005_bandit_tables.py +75 -0
package/src/superlocalmemory/storage/migrations/M006_action_outcomes_reward.py +75 -0
package/src/superlocalmemory/storage/migrations/M007_pending_outcomes.py +63 -0
package/src/superlocalmemory/storage/migrations/M009_model_lineage.py +54 -0
package/src/superlocalmemory/storage/migrations/M010_evolution_config.py +75 -0
package/src/superlocalmemory/storage/migrations/M011_archive_and_merge.py +87 -0
package/src/superlocalmemory/storage/migrations/M012_shadow_observations.py +72 -0
package/src/superlocalmemory/storage/migrations/M013_bi_temporal_columns.py +55 -0
package/src/superlocalmemory/storage/migrations/__init__.py +81 -0
package/src/superlocalmemory/storage/models.py +4 -0
package/src/superlocalmemory/ui/css/brain.css +409 -0
package/src/superlocalmemory/ui/css/legacy-dashboard.css +645 -0
package/src/superlocalmemory/ui/index.html +459 -1345
package/src/superlocalmemory/ui/js/brain.js +1321 -0
package/src/superlocalmemory/ui/js/clusters.js +123 -4
package/src/superlocalmemory/ui/js/init.js +48 -39
package/src/superlocalmemory/ui/js/memories.js +88 -2
package/src/superlocalmemory/ui/js/modal.js +71 -1
package/src/superlocalmemory/ui/js/ng-shell.js +101 -88
package/src/superlocalmemory/ui/js/trust-dashboard.js +168 -25
package/src/superlocalmemory/ui/vendor/bootstrap-icons/bootstrap-icons.css +2018 -0
package/src/superlocalmemory/ui/vendor/bootstrap-icons/fonts/bootstrap-icons.woff +0 -0
package/src/superlocalmemory/ui/vendor/bootstrap-icons/fonts/bootstrap-icons.woff2 +0 -0
package/src/superlocalmemory/ui/vendor/bootstrap.bundle.min.js +7 -0
package/src/superlocalmemory/ui/vendor/bootstrap.min.css +6 -0
package/src/superlocalmemory/ui/vendor/d3.v7.min.js +2 -0
package/src/superlocalmemory/ui/vendor/graphology-library.min.js +2 -0
package/src/superlocalmemory/ui/vendor/graphology.umd.min.js +2 -0
package/src/superlocalmemory/ui/vendor/inter-ui/inter-variable.min.css +8 -0
package/src/superlocalmemory/ui/vendor/inter-ui/variable/InterVariable-Italic.woff2 +0 -0
package/src/superlocalmemory/ui/vendor/inter-ui/variable/InterVariable.woff2 +0 -0
package/src/superlocalmemory/ui/vendor/sigma.min.js +1 -0
package/src/superlocalmemory/ui/js/behavioral.js +0 -447
package/src/superlocalmemory/ui/js/graph-core.js +0 -447
package/src/superlocalmemory/ui/js/graph-interactions.js +0 -351
package/src/superlocalmemory/ui/js/learning.js +0 -435
package/src/superlocalmemory/ui/js/patterns.js +0 -93
package/src/superlocalmemory.egg-info/PKG-INFO +0 -647
package/src/superlocalmemory.egg-info/SOURCES.txt +0 -335
package/src/superlocalmemory.egg-info/dependency_links.txt +0 -1
package/src/superlocalmemory.egg-info/entry_points.txt +0 -2
package/src/superlocalmemory.egg-info/requires.txt +0 -58
package/src/superlocalmemory.egg-info/top_level.txt +0 -1

package/src/superlocalmemory/learning/database.py CHANGED Viewed

@@ -87,6 +87,32 @@ class LearningDatabase:
         self._lock = threading.Lock()
         self._init_schema()
+    @property
+    def path(self) -> str:
+        """Return the path of the learning SQLite database.
+
+        S8-ARC-02 (v3.4.21): public alternative to the underscore-private
+        ``_db_path``. Only a getter is defined, so the attribute cannot be
+        assigned through this name. Callers that need a raw connection for
+        specialised read patterns should prefer :meth:`ro_connection` over
+        building one themselves so WAL + busy_timeout pragmas are consistent.
+        """
+        return self._db_path
+    def ro_connection(self, *, timeout: float = 5.0) -> sqlite3.Connection:
+        """Return a read-only-shaped connection with WAL/timeout pragmas set.
+        Callers outside this class previously opened raw
+        ``sqlite3.connect(lrn_db._db_path, ...)`` connections without the
+        WAL/busy_timeout pragmas, making them vulnerable to ``database is
+        locked`` errors under concurrent writer activity. This helper
+        produces a configured connection they can use instead.
+        """
+        conn = sqlite3.connect(self._db_path, timeout=timeout)
+        conn.execute("PRAGMA journal_mode=WAL")
+        conn.execute("PRAGMA busy_timeout=5000")
+        conn.row_factory = sqlite3.Row
+        return conn
     def _connect(self) -> sqlite3.Connection:
         """Create a configured connection to the learning database."""
         conn = sqlite3.connect(self._db_path, timeout=10)
@@ -339,6 +365,236 @@ class LearningDatabase:
         finally:
             conn.close()
+    # ------------------------------------------------------------------
+    # LLD-02 §4.8 — v3.4.21 writer surface
+    # ------------------------------------------------------------------
+    def count_signals(self, profile_id: str) -> int:
+        """Count ``learning_signals`` rows for ``profile_id``.
+        Used by ``_compute_ranker_phase`` + consolidation_worker training
+        gate. Pure SELECT — thread-safe without lock.
+        """
+        conn = self._connect()
+        try:
+            row = conn.execute(
+                "SELECT COUNT(*) AS cnt FROM learning_signals "
+                "WHERE profile_id = ?",
+                (profile_id,),
+            ).fetchone()
+            return int(row["cnt"]) if row else 0
+        finally:
+            conn.close()
+    def persist_model(
+        self,
+        *,
+        profile_id: str,
+        state_bytes: bytes,
+        bytes_sha256: str,
+        feature_names: list[str],
+        trained_on_count: int,
+        metrics: dict,
+        model_version: str = "3.4.21",
+    ) -> int:
+        """Persist a newly trained model and flip the active flag.
+        LLD-02 §4.8 — single TX:
+            1. UPDATE existing active row → is_active = 0.
+            2. INSERT new row with is_active = 1.
+        Requires M002 (columns ``bytes_sha256``, ``feature_names``,
+        ``metrics_json``, ``trained_on_count``, ``is_active``). Raises if
+        M002 hasn't been applied.
+        Returns the new row id.
+        """
+        if not isinstance(state_bytes, (bytes, bytearray)):
+            raise TypeError("state_bytes must be bytes")
+        if not bytes_sha256 or len(bytes_sha256) != 64:
+            raise ValueError("bytes_sha256 must be 64 hex chars")
+        names_json = json.dumps(list(feature_names), separators=(",", ":"))
+        metrics_json = json.dumps(dict(metrics), separators=(",", ":"))
+        now = self._now()
+        with self._lock:
+            conn = self._connect()
+            try:
+                conn.execute("BEGIN IMMEDIATE")
+                conn.execute(
+                    "UPDATE learning_model_state "
+                    "SET is_active = 0 "
+                    "WHERE profile_id = ? AND is_active = 1",
+                    (profile_id,),
+                )
+                cur = conn.execute(
+                    "INSERT INTO learning_model_state "
+                    "(profile_id, model_version, state_bytes, bytes_sha256, "
+                    " trained_on_count, feature_names, metrics_json, "
+                    " is_active, trained_at, updated_at) "
+                    "VALUES (?, ?, ?, ?, ?, ?, ?, 1, ?, ?)",
+                    (
+                        profile_id,
+                        model_version,
+                        bytes(state_bytes),
+                        bytes_sha256.lower(),
+                        int(trained_on_count),
+                        names_json,
+                        metrics_json,
+                        now,
+                        now,
+                    ),
+                )
+                conn.commit()
+                return int(cur.lastrowid or 0)
+            except sqlite3.Error as exc:
+                conn.rollback()
+                logger.error("persist_model failed: %s", exc)
+                raise
+            finally:
+                conn.close()
+    def load_active_model(self, profile_id: str) -> Optional[dict]:
+        """Return the active model row as a dict, or ``None`` if none.
+        Post-M002 schema. Keys: ``state_bytes``, ``bytes_sha256``,
+        ``feature_names`` (JSON str), ``trained_at``, ``model_version``.
+        """
+        conn = self._connect()
+        try:
+            row = conn.execute(
+                "SELECT state_bytes, bytes_sha256, feature_names, trained_at, "
+                "       model_version "
+                "FROM learning_model_state "
+                "WHERE profile_id = ? AND is_active = 1 "
+                "LIMIT 1",
+                (profile_id,),
+            ).fetchone()
+            if row is None:
+                return None
+            return {
+                "state_bytes": bytes(row["state_bytes"]),
+                "bytes_sha256": row["bytes_sha256"],
+                "feature_names": row["feature_names"],
+                "trained_at": row["trained_at"],
+                "model_version": row["model_version"],
+            }
+        except sqlite3.Error as exc:
+            logger.error("load_active_model failed: %s", exc)
+            return None
+        finally:
+            conn.close()
+    # --- training-row fetch (version-gated on M006) --------------------
+    # Fallback query used when M006 is not recorded as applied. It joins
+    # signals to their feature rows and emits ``outcome_reward`` as a
+    # constant NULL. Placeholders, in order: profile_id, row limit.
+    _SQL_POSITION_ONLY = (
+        "SELECT s.id AS signal_id, s.query_id, s.fact_id, s.position, "
+        "       s.created_at, f.features_json, NULL AS outcome_reward "
+        "FROM learning_signals s "
+        "JOIN learning_features f "
+        "  ON f.signal_id = s.id AND f.profile_id = s.profile_id "
+        "WHERE s.profile_id = ? "
+        "  AND s.signal_type IN ('candidate', 'shown', 'legacy_feedback') "
+        "  AND f.is_synthetic = 0 "
+        "ORDER BY s.created_at DESC "
+        "LIMIT ?"
+    )
+    # Query used once M006 is applied. Same shape as above, plus a LEFT JOIN
+    # to settled ``action_outcomes`` rows matched on ``recall_query_id``;
+    # signals with no matching outcome are kept, and matched outcomes must
+    # have been settled at least the given number of seconds ago.
+    # Placeholders, in order: profile_id, minimum outcome age (seconds),
+    # row limit.
+    # NOTE: ``fetch_training_examples`` removes the exact substring
+    # " AND f.is_synthetic = 0 " from both constants via ``str.replace``;
+    # keep that clause's spelling and spacing stable.
+    _SQL_WITH_OUTCOMES = (
+        "SELECT s.id AS signal_id, s.query_id, s.fact_id, s.position, "
+        "       s.created_at, f.features_json, o.reward AS outcome_reward "
+        "FROM learning_signals s "
+        "JOIN learning_features f "
+        "  ON f.signal_id = s.id AND f.profile_id = s.profile_id "
+        "LEFT JOIN action_outcomes o "
+        "  ON o.recall_query_id = s.query_id AND o.settled = 1 "
+        "WHERE s.profile_id = ? "
+        "  AND s.signal_type IN ('candidate', 'shown', 'legacy_feedback') "
+        "  AND f.is_synthetic = 0 "
+        "  AND (o.settled IS NULL OR "
+        "       (julianday('now') - julianday(o.settled_at)) * 86400.0 >= ?) "
+        "ORDER BY s.created_at DESC "
+        "LIMIT ?"
+    )
+    def _migration_applied(self, name: str) -> bool:
+        """Return True if ``name`` is recorded complete in migration_log.
+        M006 (action_outcomes.reward) lands in v3.4.21. When absent, we
+        fall back to the position-only training query.
+        """
+        conn = self._connect()
+        try:
+            row = conn.execute(
+                "SELECT status FROM migration_log WHERE name = ?",
+                (name,),
+            ).fetchone()
+        except sqlite3.Error:
+            return False
+        finally:
+            conn.close()
+        if row is None:
+            return False
+        return row["status"] == "complete"
+    def fetch_training_examples(
+        self,
+        *,
+        profile_id: str,
+        limit: int = 2000,
+        min_outcome_age_sec: int = 60,
+        include_synthetic: bool = False,
+    ) -> list[dict]:
+        """Fetch training rows for LightGBM lambdarank training.
+        Version-gated on M006: without the ``reward`` column we return rows
+        with ``outcome_reward = None`` and the labeler falls through to the
+        position proxy (§4.7).
+        When ``include_synthetic`` is True, migrated legacy rows (with
+        ``learning_features.is_synthetic=1``) are included. The default
+        (False) preserves Stage 8 D9 — synthetic rows excluded unless the
+        caller opts in explicitly. The UI exposes this via the
+        "Migrate legacy data" flow so users consciously choose to let their
+        pre-v3.4.21 feedback bootstrap the model.
+        Returns rows sorted newest-first; the caller is expected to regroup
+        by ``query_id`` before training.
+        """
+        m006_applied = self._migration_applied("M006_action_outcomes_reward")
+        sql = self._SQL_WITH_OUTCOMES if m006_applied else self._SQL_POSITION_ONLY
+        if include_synthetic:
+            # Drop the synthetic-filter clause verbatim. Safe because the
+            # surrounding clauses already reference ``f.`` so removing this
+            # one keeps the SQL grammatically valid.
+            sql = sql.replace(" AND f.is_synthetic = 0 ", " ")
+        params: tuple
+        if m006_applied:
+            params = (profile_id, int(min_outcome_age_sec), int(limit))
+        else:
+            params = (profile_id, int(limit))
+        conn = self._connect()
+        try:
+            try:
+                rows = conn.execute(sql, params).fetchall()
+            except sqlite3.Error as exc:
+                logger.warning(
+                    "fetch_training_examples failed (m006=%s): %s",
+                    m006_applied, exc,
+                )
+                return []
+            out: list[dict] = []
+            for row in rows:
+                d = dict(row)
+                try:
+                    d["features"] = json.loads(d.pop("features_json") or "{}")
+                except (ValueError, TypeError):
+                    d["features"] = {}
+                out.append(d)
+            return out
+        finally:
+            conn.close()
     def reset(self, profile_id: Optional[str] = None) -> None:
         """Delete learning data. GDPR Article 17 handler.

package/src/superlocalmemory/learning/dedup_hnsw.py ADDED Viewed

@@ -0,0 +1,413 @@
+# Copyright (c) 2026 Varun Pratap Bhardwaj / Qualixar
+# Licensed under AGPL-3.0-or-later - see LICENSE file
+# Part of SuperLocalMemory v3.4.21 — F4.A Stage-8 H-03/H-17/H-18 fix
+"""HNSW-backed near-duplicate detection for atomic_facts.
+Extracted from ``hnsw_dedup.py`` as part of the F4.A split (Stage 8
+H-03/H-18). Reward-gated archive + strong-memory boost live in
+``reward_archive.py`` + ``reward_boost.py``; the shim
+``hnsw_dedup.py`` re-exports every public symbol.
+Contract refs:
+  - LLD-12 §2 — cosine > 0.95 AND entity_jaccard > 0.8 thresholds.
+  - LLD-12 §3 — hnswlib RAM budget + prefix-dedup fallback.
+  - LLD-00 §7 — ``ram_reservation`` protocol.
+  - Stage 8 H-17 — fallback emits logger.warning + counter.
+"""
+from __future__ import annotations
+import json
+import logging
+import math
+import sqlite3
+import threading
+import time
+from pathlib import Path
+from typing import Any, Iterable, Sequence
+from superlocalmemory.core.ram_lock import ram_reservation
+logger = logging.getLogger(__name__)
+# Stage 8 H-17 — fallback degradation counter.
+#: Incremented every time the HNSW path degrades to the prefix fallback
+#: for any reason (hnswlib missing, RAM refused, schema missing, fact
+#: count above cap). Observable via dashboards + tests.
+_HNSW_DEGRADED_COUNT = 0
+_HNSW_DEGRADED_LOCK = threading.Lock()
+def get_hnsw_degraded_count() -> int:
+    """Return the current cumulative fallback count.
+
+    Reads the module-level counter directly, without taking
+    ``_HNSW_DEGRADED_LOCK``.
+    """
+    return _HNSW_DEGRADED_COUNT
+def reset_hnsw_degraded_count() -> None:
+    """Reset the counter to zero — for tests only.
+
+    The write happens while holding ``_HNSW_DEGRADED_LOCK``.
+    """
+    global _HNSW_DEGRADED_COUNT
+    with _HNSW_DEGRADED_LOCK:
+        _HNSW_DEGRADED_COUNT = 0
+def _record_degradation(reason: str) -> None:
+    """Increment the degradation counter + emit a logger.warning.
+
+    ``reason`` is interpolated into the warning message; the counter is
+    bumped under ``_HNSW_DEGRADED_LOCK`` and the log call is made after
+    the lock is released.
+    """
+    global _HNSW_DEGRADED_COUNT
+    with _HNSW_DEGRADED_LOCK:
+        _HNSW_DEGRADED_COUNT += 1
+    logger.warning("hnsw_dedup: degraded to prefix fallback (%s)", reason)
+__all__ = (
+    "HnswDeduplicator",
+    "get_hnsw_degraded_count",
+    "reset_hnsw_degraded_count",
+    "_parse_embedding",
+    "_cosine",
+    "_jaccard",
+    "_pick_canonical",
+)
+def _parse_embedding(raw: str | None) -> list[float] | None:
+    if not raw:
+        return None
+    try:
+        vec = json.loads(raw)
+    except (TypeError, ValueError):
+        return None
+    if not isinstance(vec, list) or not vec:
+        return None
+    try:
+        return [float(x) for x in vec]
+    except (TypeError, ValueError):
+        return None
+# L-P-01: vectorise ``_cosine`` via NumPy when available. NumPy cold
+# import is ~30 ms, but hnswlib already forces numpy in; the import is
+# effectively free in the consolidation context where these helpers run.
+# Pure-Python fallback is retained for environments where numpy is
+# missing (contract: this module MUST NOT hard-depend on numpy).
+try:  # pragma: no cover — environment-dependent
+    import numpy as _np  # type: ignore
+except Exception:  # pragma: no cover — numpy always present in our deps
+    _np = None
+def _cosine(u: Sequence[float], v: Sequence[float]) -> float:
+    if _np is not None:
+        # S9-W3 M-PERF-04: ``_np.asarray`` is a no-op when the input is
+        # already an ndarray of the target dtype. When it is a list of
+        # Python floats (which is how embeddings arrive from the JSON
+        # fetch path) the cast costs 20-40 μs × N·k in dedup. We still
+        # accept lists for API compatibility but prefer callers to pass
+        # ndarray directly; the fast path kicks in automatically when
+        # they do.
+        ua = u if isinstance(u, _np.ndarray) else _np.asarray(u, dtype=_np.float32)
+        va = v if isinstance(v, _np.ndarray) else _np.asarray(v, dtype=_np.float32)
+        nu = float(_np.linalg.norm(ua))
+        nv = float(_np.linalg.norm(va))
+        if nu == 0.0 or nv == 0.0:
+            return 0.0
+        return float(_np.dot(ua, va)) / (nu * nv)
+    dot = 0.0
+    nu = 0.0
+    nv = 0.0
+    for a, b in zip(u, v):
+        dot += a * b
+        nu += a * a
+        nv += b * b
+    if nu == 0.0 or nv == 0.0:
+        return 0.0
+    return dot / (math.sqrt(nu) * math.sqrt(nv))
+def _jaccard(a: Iterable[str], b: Iterable[str]) -> float:
+    # L-P-01: _jaccard is already O(|a|+|b|) set ops — numpy adds
+    # hashing overhead for short string sets, so we keep the pure-Python
+    # path. The change from the audit is the explicit note here; no
+    # behaviour delta.
+    sa, sb = set(a), set(b)
+    if not sa and not sb:
+        return 0.0
+    union = sa | sb
+    if not union:
+        return 0.0
+    return len(sa & sb) / len(union)
+def _pick_canonical(
+    a: dict[str, Any], b: dict[str, Any],
+) -> tuple[dict[str, Any], dict[str, Any]]:
+    """Canonical = higher importance, tie-break: higher confidence, older."""
+    ai, bi = float(a.get("importance", 0.0)), float(b.get("importance", 0.0))
+    if ai != bi:
+        return (a, b) if ai > bi else (b, a)
+    ac, bc = float(a.get("confidence", 0.0)), float(b.get("confidence", 0.0))
+    if ac != bc:
+        return (a, b) if ac > bc else (b, a)
+    at, bt = a.get("created_at", ""), b.get("created_at", "")
+    return (a, b) if at <= bt else (b, a)
+class HnswDeduplicator:
+    """Find near-duplicate ``atomic_facts`` rows via HNSW ANN + entity overlap.
+    Contract (LLD-12 §2.1):
+      - cosine > COSINE_THRESHOLD AND jaccard > ENTITY_JACCARD_THRESHOLD
+      - Canonical = higher importance, tie-break older created_at
+      - Never delete; merges happen through memory_merge.apply_merges
+    """
+    COSINE_THRESHOLD: float = 0.95
+    ENTITY_JACCARD_THRESHOLD: float = 0.8
+    MAX_FACTS_FOR_HNSW: int = 200_000
+    # S-L01: HNSW init params — stored on the class so ``_estimate_ram_mb``
+    # and ``_ann_candidates`` share ONE source of truth. Previously the
+    # estimator hardcoded M=16 while the real build also used M=16 / ef=100
+    # — the numbers agreed by coincidence, not by construction. If either
+    # knob changes, the estimate tracks automatically and the ``ef_construction``
+    # build-time buffer is captured in the 1.4× multiplier below.
+    HNSW_M: int = 16
+    HNSW_EF_CONSTRUCTION: int = 100
+    # Build-time overhead multiplier vs steady-state footprint. Empirically
+    # hnswlib uses ~1.3× steady RAM during construction due to the
+    # ef_construction candidate pool — we round up to 1.4 for safety on
+    # tight-RAM (Light) profiles.
+    HNSW_BUILD_OVERHEAD: float = 1.4
+    # Per-vector HNSW footprint estimate (LLD-12 §3.1). Kept for
+    # back-compat — callers should prefer ``_estimate_ram_mb``.
+    _BYTES_PER_VEC_DEFAULT: int = 384 * 4 + 16 * 8 * 2
+    def __init__(self, *, memory_db_path: str | Path) -> None:
+        """Remember where the memory database lives.
+
+        ``memory_db_path`` is normalised to a ``Path`` and stored on
+        ``self._db``; no connection is opened here.
+        """
+        self._db = Path(memory_db_path)
+    # ------------------------------------------------------------------
+    # Public API
+    # ------------------------------------------------------------------
+    def find_merge_candidates(
+        self,
+        profile_id: str,
+        *,
+        wall_seconds: float = 300.0,
+        _force_unavailable: bool = False,
+    ) -> list[tuple[str, str, float, float]]:
+        """Return ``(canonical_id, duplicate_id, cosine, jaccard)`` tuples.
+        Never raises for expected failure modes — falls back to prefix
+        dedup instead. ``wall_seconds`` is the soft budget; we stop
+        emitting new candidates once exceeded.
+        """
+        deadline = time.monotonic() + max(0.0, wall_seconds)
+        rows = self._fetch_live_facts(profile_id)
+        if len(rows) < 2:
+            return []
+        if len(rows) > self.MAX_FACTS_FOR_HNSW:
+            _record_degradation(
+                f"{len(rows)} facts > MAX {self.MAX_FACTS_FOR_HNSW}",
+            )
+            return self._prefix_fallback(rows, deadline)
+        # Estimate RAM; let the reservation reject if the system is tight.
+        est_mb = self._estimate_ram_mb(len(rows), dim=self._detect_dim(rows))
+        required_mb = max(16, int(est_mb * 1.2))
+        hnswlib_mod = None
+        if not _force_unavailable:
+            try:
+                import hnswlib as hnswlib_mod  # type: ignore  # noqa: PLC0415
+            except ImportError:
+                hnswlib_mod = None
+        if hnswlib_mod is None:
+            _record_degradation("hnswlib unavailable")
+            return self._prefix_fallback(rows, deadline)
+        try:
+            with ram_reservation(
+                "hnswlib",
+                required_mb=required_mb,
+                timeout_s=min(30.0, max(1.0, wall_seconds)),
+            ):
+                return self._ann_candidates(rows, hnswlib_mod, deadline)
+        except RuntimeError as exc:
+            _record_degradation(f"ram_reservation refused: {exc}")
+            return self._prefix_fallback(rows, deadline)
+    # ------------------------------------------------------------------
+    # Internal helpers
+    # ------------------------------------------------------------------
+    def _fetch_live_facts(self, profile_id: str) -> list[dict[str, Any]]:
+        """Read the dedup-eligible facts of one profile into plain dicts.
+
+        Selects rows from ``atomic_facts`` for ``profile_id`` whose
+        ``archive_status`` is NULL or ``'live'`` and whose ``importance``
+        is NULL or below 1.0, ordered by ``created_at`` ascending.
+
+        NULL columns are normalised: content and created_at become ``""``,
+        the entity JSON becomes ``[]``, importance and confidence become
+        ``0.0``. The embedding column is handed to ``_parse_embedding``.
+
+        The connection is opened per call and always closed, even when
+        the query or the row conversion raises.
+        """
+        query = (
+            "SELECT fact_id, content, canonical_entities_json, "
+            "       embedding, importance, confidence, created_at "
+            "FROM atomic_facts "
+            "WHERE profile_id = ? "
+            "  AND (archive_status IS NULL OR archive_status = 'live') "
+            "  AND (importance IS NULL OR importance < 1.0) "
+            "ORDER BY created_at ASC"
+        )
+        connection = sqlite3.connect(str(self._db), timeout=10.0)
+        # sqlite3.Row gives access to columns by name below.
+        connection.row_factory = sqlite3.Row
+        try:
+            fetched = connection.execute(query, (profile_id,)).fetchall()
+            return [
+                {
+                    "fact_id": record["fact_id"],
+                    "content": record["content"] or "",
+                    "entities": json.loads(
+                        record["canonical_entities_json"] or "[]"
+                    ),
+                    "embedding": _parse_embedding(record["embedding"]),
+                    "importance": float(record["importance"] or 0.0),
+                    "confidence": float(record["confidence"] or 0.0),
+                    "created_at": record["created_at"] or "",
+                }
+                for record in fetched
+            ]
+        finally:
+            connection.close()
+    @staticmethod
+    def _detect_dim(rows: list[dict[str, Any]]) -> int:
+        """Return the length of the first non-empty embedding in ``rows``.
+
+        Rows without an ``"embedding"`` key, with ``None`` or with an
+        empty embedding are skipped. When no row carries a usable
+        embedding the method falls back to 384.
+
+        Embeddings are expected to be ``None`` or a sized sequence.
+        """
+        for row in rows:
+            emb = row.get("embedding")
+            # Explicit None/length test instead of ``if emb:``. Truthiness
+            # is ambiguous for array-like embeddings (a multi-element
+            # NumPy array raises ValueError), and ``_ann_candidates``
+            # already filters with ``is not None`` plus ``len()``.
+            if emb is not None and len(emb) > 0:
+                return len(emb)
+        return 384
+    def _estimate_ram_mb(self, n: int, *, dim: int) -> float:
+        """Estimate, in MiB, the RAM needed to build an index of ``n`` vectors.
+
+        Each vector is costed at ``dim * 4`` bytes of payload plus
+        ``HNSW_M * 8 * 2`` bytes derived from the graph-degree knob. The
+        total is scaled by ``HNSW_BUILD_OVERHEAD`` and divided by 1024².
+
+        S-L01: the per-vector size comes from the live ``HNSW_M`` value,
+        so retuning M updates the estimate automatically. Per the
+        original note, the overhead factor (1.4×, previously 1.10×)
+        covers the ef_construction build-time candidate pool.
+        """
+        payload_bytes = dim * 4
+        link_bytes = self.HNSW_M * 8 * 2
+        per_vector = payload_bytes + link_bytes
+        total_bytes = n * per_vector * self.HNSW_BUILD_OVERHEAD
+        return total_bytes / (1024 * 1024)
+    def _ann_candidates(
+        self,
+        rows: list[dict[str, Any]],
+        hnswlib_mod,
+        deadline: float,
+    ) -> list[tuple[str, str, float, float]]:
+        """Find near-duplicate fact pairs with an in-memory hnswlib index.
+
+        Args:
+            rows: Fact dicts; this method reads ``"embedding"``,
+                ``"entities"`` and ``"fact_id"`` from each of them.
+            hnswlib_mod: The imported hnswlib module (injected by the
+                caller); only ``Index`` is used.
+            deadline: ``time.monotonic()`` value after which the
+                candidate-selection loop stops and returns what it has.
+
+        Returns:
+            ``(canonical_fact_id, loser_fact_id, cosine, jaccard)``
+            tuples. A pair is kept only when the cosine similarity is
+            strictly above ``COSINE_THRESHOLD`` and the entity Jaccard is
+            strictly above ``ENTITY_JACCARD_THRESHOLD``. Each fact id
+            appears as a loser at most once.
+
+        Falls back to ``_prefix_fallback`` over all of ``rows`` when
+        fewer than two rows have an embedding of the same length as the
+        first embedded row.
+        """
+        embedded = [r for r in rows if r["embedding"] is not None]
+        if len(embedded) < 2:
+            return self._prefix_fallback(rows, deadline)
+        # The first embedded row fixes the index dimension.
+        dim = len(embedded[0]["embedding"])
+        # Align: drop rows with mismatched dim.
+        embedded = [r for r in embedded if len(r["embedding"]) == dim]
+        if len(embedded) < 2:
+            return self._prefix_fallback(rows, deadline)
+        index = hnswlib_mod.Index(space="cosine", dim=dim)
+        # S-L01: share knobs with ``_estimate_ram_mb`` so RAM reservation
+        # never under-counts.
+        index.init_index(
+            max_elements=len(embedded),
+            ef_construction=self.HNSW_EF_CONSTRUCTION,
+            M=self.HNSW_M,
+        )
+        # NOTE(review): this ef value is replaced by the ``set_ef`` call
+        # inside the ``try`` block before any query runs.
+        index.set_ef(min(50, len(embedded)))
+        try:
+            # H-12/C-P-04 + H-12/L-P-05: batch add_items + knn_query instead
+            # of one-at-a-time Python→C round-trips. Per the original
+            # note, hnswlib releases the GIL during the batch call and
+            # processes rows in the same order, so neighbour-label output
+            # is unchanged. The candidate-selection loop below still
+            # drives `seen_losers` inline, so its decisions are identical.
+            #
+            # S9-W3 H-PERF-02: feed the rows' embeddings to the index
+            # without keeping a separate ``all_embeddings`` variable.
+            # NOTE(review): each comprehension below still builds a
+            # temporary list of references to the existing embedding
+            # objects; confirm the ~150 MB saving quoted for N=100k ×
+            # 384-dim × 4 B against a real profile.
+            #
+            # S9-W3 H-SKEP-02: pin ``set_ef(max(50, k*3))`` before the
+            # batched knn so approximate-search quality matches the
+            # pre-refactor per-item default. Stage 9 Skeptic flagged
+            # that batched knn can miss near-duplicates at scale when
+            # ef is not explicitly set.
+            k = min(6, len(embedded))
+            index.set_ef(max(50, k * 3))
+            # Labels are positions in ``embedded``, so a label returned
+            # by knn_query indexes straight back into that list.
+            labels = list(range(len(embedded)))
+            # Pass the DB rows' embedding objects directly; hnswlib is
+            # expected to copy them into its own buffer (TODO confirm).
+            index.add_items([r["embedding"] for r in embedded], labels)
+            candidates: list[tuple[str, str, float, float]] = []
+            seen_losers: set[str] = set()
+            # H-12/C-P-04: one batched knn_query for all rows; row ``i``
+            # of each result belongs to ``embedded[i]``.
+            all_labels, all_distances = index.knn_query(
+                [r["embedding"] for r in embedded], k=k,
+            )
+            for i, r in enumerate(embedded):
+                # Deadline is checked once per row; on expiry the pairs
+                # collected so far are returned.
+                if time.monotonic() > deadline:
+                    break
+                lbls = all_labels[i]
+                dsts = all_distances[i]
+                for nb_idx, dist in zip(lbls, dsts):
+                    # Skip the row's own entry in its neighbour list.
+                    if int(nb_idx) == i:
+                        continue
+                    neighbour = embedded[int(nb_idx)]
+                    # A neighbour that already lost is not paired again.
+                    if neighbour["fact_id"] in seen_losers:
+                        continue
+                    # Once the current row has lost (possibly earlier in
+                    # this same inner loop), stop pairing it altogether.
+                    if r["fact_id"] in seen_losers:
+                        break
+                    # hnswlib cosine distance is (1 - cos); clamp the
+                    # similarity into [0, 1].
+                    cos = max(0.0, min(1.0, 1.0 - float(dist)))
+                    if cos <= self.COSINE_THRESHOLD:
+                        continue
+                    jac = _jaccard(r["entities"], neighbour["entities"])
+                    if jac <= self.ENTITY_JACCARD_THRESHOLD:
+                        continue
+                    canonical, loser = _pick_canonical(r, neighbour)
+                    # Guard so a fact id is never recorded as loser twice.
+                    if loser["fact_id"] in seen_losers:
+                        continue
+                    candidates.append(
+                        (canonical["fact_id"], loser["fact_id"], cos, jac),
+                    )
+                    seen_losers.add(loser["fact_id"])
+            return candidates
+        finally:
+            # Drop the local reference so the ANN index can be reclaimed
+            # as soon as possible (LLD-12 §3.3).
+            del index
+    def _prefix_fallback(
+        self,
+        rows: list[dict[str, Any]],
+        deadline: float,
+    ) -> list[tuple[str, str, float, float]]:
+        """Content-prefix dedup — retained behaviour when hnswlib cannot run.
+
+        Two rows are duplicates when the first 100 characters of their
+        content, stripped and lower-cased, are equal. Rows whose prefix
+        is empty are ignored.
+
+        Args:
+            rows: Fact dicts; ``"content"``, ``"entities"`` and
+                ``"fact_id"`` are read.
+            deadline: ``time.monotonic()`` value after which scanning
+                stops and the pairs found so far are returned.
+
+        Returns:
+            ``(canonical_fact_id, loser_fact_id, 1.0, jaccard)`` tuples;
+            the cosine slot is fixed at 1.0 because no embedding is
+            compared on this path.
+        """
+        # Maps each prefix to the row currently regarded as canonical.
+        canonical_by_prefix: dict[str, dict[str, Any]] = {}
+        candidates: list[tuple[str, str, float, float]] = []
+        for r in rows:
+            if time.monotonic() > deadline:
+                break
+            prefix = (r["content"] or "")[:100].strip().lower()
+            if not prefix:
+                continue
+            prior = canonical_by_prefix.get(prefix)
+            if prior is None:
+                canonical_by_prefix[prefix] = r
+                continue
+            canonical, loser = _pick_canonical(prior, r)
+            jac = _jaccard(prior["entities"], r["entities"])
+            candidates.append(
+                (canonical["fact_id"], loser["fact_id"], 1.0, jac),
+            )
+            # Keep comparing later rows against the current winner.
+            # Leaving the first-seen row in place after it lost would let
+            # the same fact be emitted as loser again, or let a later row
+            # be merged into a fact that has already been superseded.
+            canonical_by_prefix[prefix] = canonical
+        return candidates