npm - superlocalmemory - Versions diffs - 3.4.18 → 3.4.21 - Mend

superlocalmemory 3.4.18 → 3.4.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (172)

package/CHANGELOG.md +35 -0
package/README.md +42 -34
package/bin/slm +11 -0
package/bin/slm.bat +12 -0
package/package.json +4 -3
package/pyproject.toml +3 -2
package/scripts/build-slm-hook.ps1 +40 -0
package/scripts/build-slm-hook.sh +45 -0
package/scripts/build_entry.py +452 -0
package/scripts/ci/stage5b_gate.sh +50 -0
package/scripts/postinstall/validation.js +187 -0
package/scripts/postinstall-interactive.js +756 -0
package/scripts/postinstall_binary.js +287 -0
package/scripts/release_manifest.py +273 -0
package/scripts/slm-hook.spec +56 -0
package/skills/slm-build-graph/SKILL.md +423 -0
package/skills/slm-list-recent/SKILL.md +348 -0
package/skills/slm-recall/SKILL.md +343 -0
package/skills/slm-remember/SKILL.md +194 -0
package/skills/slm-show-patterns/SKILL.md +224 -0
package/skills/slm-status/SKILL.md +363 -0
package/skills/slm-switch-profile/SKILL.md +442 -0
package/src/superlocalmemory/cli/commands.py +219 -79
package/src/superlocalmemory/cli/context_commands.py +192 -0
package/src/superlocalmemory/cli/daemon.py +15 -1
package/src/superlocalmemory/cli/db_migrate.py +80 -0
package/src/superlocalmemory/cli/escape_hatch.py +220 -0
package/src/superlocalmemory/cli/main.py +72 -1
package/src/superlocalmemory/core/context_cache.py +397 -0
package/src/superlocalmemory/core/embeddings.py +8 -2
package/src/superlocalmemory/core/engine.py +38 -2
package/src/superlocalmemory/core/engine_wiring.py +1 -1
package/src/superlocalmemory/core/ram_lock.py +111 -0
package/src/superlocalmemory/core/recall_pipeline.py +433 -3
package/src/superlocalmemory/core/recall_worker.py +8 -3
package/src/superlocalmemory/core/security_primitives.py +635 -0
package/src/superlocalmemory/core/shadow_router.py +319 -0
package/src/superlocalmemory/core/slm_disabled.py +87 -0
package/src/superlocalmemory/core/slmignore.py +125 -0
package/src/superlocalmemory/core/topic_signature.py +143 -0
package/src/superlocalmemory/core/worker_pool.py +14 -3
package/src/superlocalmemory/encoding/cognitive_consolidator.py +2 -2
package/src/superlocalmemory/evolution/budget.py +321 -0
package/src/superlocalmemory/evolution/llm_dispatch.py +508 -0
package/src/superlocalmemory/evolution/skill_evolver.py +144 -94
package/src/superlocalmemory/hooks/_outcome_common.py +506 -0
package/src/superlocalmemory/hooks/adapter_base.py +317 -0
package/src/superlocalmemory/hooks/antigravity_adapter.py +192 -0
package/src/superlocalmemory/hooks/claude_code_hooks.py +33 -1
package/src/superlocalmemory/hooks/context_payload.py +312 -0
package/src/superlocalmemory/hooks/copilot_adapter.py +154 -0
package/src/superlocalmemory/hooks/cross_platform_connector.py +90 -0
package/src/superlocalmemory/hooks/cursor_adapter.py +195 -0
package/src/superlocalmemory/hooks/hook_handlers.py +109 -8
package/src/superlocalmemory/hooks/ide_connector.py +25 -2
package/src/superlocalmemory/hooks/post_tool_async_hook.py +165 -0
package/src/superlocalmemory/hooks/post_tool_outcome_hook.py +223 -0
package/src/superlocalmemory/hooks/prewarm_auth.py +170 -0
package/src/superlocalmemory/hooks/session_registry.py +186 -0
package/src/superlocalmemory/hooks/stop_outcome_hook.py +134 -0
package/src/superlocalmemory/hooks/sync_loop.py +114 -0
package/src/superlocalmemory/hooks/user_prompt_hook.py +128 -0
package/src/superlocalmemory/hooks/user_prompt_rehash_hook.py +202 -0
package/src/superlocalmemory/infra/backup.py +3 -3
package/src/superlocalmemory/infra/cloud_backup.py +2 -2
package/src/superlocalmemory/infra/event_bus.py +2 -2
package/src/superlocalmemory/infra/webhook_dispatcher.py +3 -3
package/src/superlocalmemory/learning/arm_catalog.py +99 -0
package/src/superlocalmemory/learning/bandit.py +526 -0
package/src/superlocalmemory/learning/bandit_cache.py +133 -0
package/src/superlocalmemory/learning/behavioral.py +53 -1
package/src/superlocalmemory/learning/consolidation_cycle.py +381 -0
package/src/superlocalmemory/learning/consolidation_worker.py +188 -520
package/src/superlocalmemory/learning/database.py +256 -0
package/src/superlocalmemory/learning/dedup_hnsw.py +413 -0
package/src/superlocalmemory/learning/ensemble.py +300 -0
package/src/superlocalmemory/learning/fact_outcome_joins.py +207 -0
package/src/superlocalmemory/learning/forgetting_scheduler.py +55 -0
package/src/superlocalmemory/learning/hnsw_dedup.py +69 -0
package/src/superlocalmemory/learning/labeler.py +87 -0
package/src/superlocalmemory/learning/legacy_migration.py +277 -0
package/src/superlocalmemory/learning/memory_merge.py +160 -0
package/src/superlocalmemory/learning/model_cache.py +269 -0
package/src/superlocalmemory/learning/model_rollback.py +278 -0
package/src/superlocalmemory/learning/outcome_queue.py +284 -0
package/src/superlocalmemory/learning/pattern_miner.py +415 -0
package/src/superlocalmemory/learning/pattern_miner_constants.py +47 -0
package/src/superlocalmemory/learning/ranker.py +225 -81
package/src/superlocalmemory/learning/ranker_common.py +163 -0
package/src/superlocalmemory/learning/ranker_retrain_legacy.py +202 -0
package/src/superlocalmemory/learning/ranker_retrain_online.py +411 -0
package/src/superlocalmemory/learning/reward.py +777 -0
package/src/superlocalmemory/learning/reward_archive.py +210 -0
package/src/superlocalmemory/learning/reward_boost.py +201 -0
package/src/superlocalmemory/learning/reward_proxy.py +326 -0
package/src/superlocalmemory/learning/shadow_test.py +524 -0
package/src/superlocalmemory/learning/signal_worker.py +270 -0
package/src/superlocalmemory/learning/signals.py +314 -0
package/src/superlocalmemory/learning/trigram_index.py +547 -0
package/src/superlocalmemory/mcp/server.py +5 -5
package/src/superlocalmemory/mcp/tools_context.py +183 -0
package/src/superlocalmemory/mcp/tools_core.py +92 -27
package/src/superlocalmemory/parameterization/soft_prompt_generator.py +13 -0
package/src/superlocalmemory/retrieval/engine.py +52 -0
package/src/superlocalmemory/retrieval/reranker.py +4 -2
package/src/superlocalmemory/server/api.py +2 -2
package/src/superlocalmemory/server/bandit_loops.py +140 -0
package/src/superlocalmemory/server/middleware/__init__.py +11 -0
package/src/superlocalmemory/server/middleware/security_headers.py +144 -0
package/src/superlocalmemory/server/routes/backup.py +36 -13
package/src/superlocalmemory/server/routes/behavioral.py +50 -19
package/src/superlocalmemory/server/routes/brain.py +1234 -0
package/src/superlocalmemory/server/routes/data_io.py +4 -4
package/src/superlocalmemory/server/routes/events.py +2 -2
package/src/superlocalmemory/server/routes/helpers.py +1 -1
package/src/superlocalmemory/server/routes/learning.py +192 -7
package/src/superlocalmemory/server/routes/memories.py +189 -1
package/src/superlocalmemory/server/routes/prewarm.py +171 -0
package/src/superlocalmemory/server/routes/profiles.py +3 -3
package/src/superlocalmemory/server/routes/token.py +88 -0
package/src/superlocalmemory/server/routes/ws.py +5 -5
package/src/superlocalmemory/server/security_middleware.py +13 -7
package/src/superlocalmemory/server/ui.py +2 -2
package/src/superlocalmemory/server/unified_daemon.py +335 -3
package/src/superlocalmemory/storage/migration_runner.py +545 -0
package/src/superlocalmemory/storage/migrations/M001_add_signal_features_columns.py +67 -0
package/src/superlocalmemory/storage/migrations/M002_model_state_history.py +132 -0
package/src/superlocalmemory/storage/migrations/M003_migration_log.py +38 -0
package/src/superlocalmemory/storage/migrations/M004_cross_platform_sync_log.py +46 -0
package/src/superlocalmemory/storage/migrations/M005_bandit_tables.py +75 -0
package/src/superlocalmemory/storage/migrations/M006_action_outcomes_reward.py +75 -0
package/src/superlocalmemory/storage/migrations/M007_pending_outcomes.py +63 -0
package/src/superlocalmemory/storage/migrations/M009_model_lineage.py +54 -0
package/src/superlocalmemory/storage/migrations/M010_evolution_config.py +75 -0
package/src/superlocalmemory/storage/migrations/M011_archive_and_merge.py +87 -0
package/src/superlocalmemory/storage/migrations/M012_shadow_observations.py +72 -0
package/src/superlocalmemory/storage/migrations/M013_bi_temporal_columns.py +55 -0
package/src/superlocalmemory/storage/migrations/__init__.py +81 -0
package/src/superlocalmemory/storage/models.py +4 -0
package/src/superlocalmemory/ui/css/brain.css +409 -0
package/src/superlocalmemory/ui/css/legacy-dashboard.css +645 -0
package/src/superlocalmemory/ui/index.html +459 -1345
package/src/superlocalmemory/ui/js/brain.js +1321 -0
package/src/superlocalmemory/ui/js/clusters.js +123 -4
package/src/superlocalmemory/ui/js/init.js +48 -39
package/src/superlocalmemory/ui/js/memories.js +88 -2
package/src/superlocalmemory/ui/js/modal.js +71 -1
package/src/superlocalmemory/ui/js/ng-shell.js +101 -88
package/src/superlocalmemory/ui/js/trust-dashboard.js +168 -25
package/src/superlocalmemory/ui/vendor/bootstrap-icons/bootstrap-icons.css +2018 -0
package/src/superlocalmemory/ui/vendor/bootstrap-icons/fonts/bootstrap-icons.woff +0 -0
package/src/superlocalmemory/ui/vendor/bootstrap-icons/fonts/bootstrap-icons.woff2 +0 -0
package/src/superlocalmemory/ui/vendor/bootstrap.bundle.min.js +7 -0
package/src/superlocalmemory/ui/vendor/bootstrap.min.css +6 -0
package/src/superlocalmemory/ui/vendor/d3.v7.min.js +2 -0
package/src/superlocalmemory/ui/vendor/graphology-library.min.js +2 -0
package/src/superlocalmemory/ui/vendor/graphology.umd.min.js +2 -0
package/src/superlocalmemory/ui/vendor/inter-ui/inter-variable.min.css +8 -0
package/src/superlocalmemory/ui/vendor/inter-ui/variable/InterVariable-Italic.woff2 +0 -0
package/src/superlocalmemory/ui/vendor/inter-ui/variable/InterVariable.woff2 +0 -0
package/src/superlocalmemory/ui/vendor/sigma.min.js +1 -0
package/src/superlocalmemory/ui/js/behavioral.js +0 -447
package/src/superlocalmemory/ui/js/graph-core.js +0 -447
package/src/superlocalmemory/ui/js/graph-interactions.js +0 -351
package/src/superlocalmemory/ui/js/learning.js +0 -435
package/src/superlocalmemory/ui/js/patterns.js +0 -93
package/src/superlocalmemory.egg-info/PKG-INFO +0 -647
package/src/superlocalmemory.egg-info/SOURCES.txt +0 -335
package/src/superlocalmemory.egg-info/dependency_links.txt +0 -1
package/src/superlocalmemory.egg-info/entry_points.txt +0 -2
package/src/superlocalmemory.egg-info/requires.txt +0 -58
package/src/superlocalmemory.egg-info/top_level.txt +0 -1

package/src/superlocalmemory/core/recall_pipeline.py CHANGED Viewed

@@ -11,6 +11,8 @@ Part of Qualixar | Author: Varun Pratap Bhardwaj
 from __future__ import annotations
+import hashlib
+import hmac
 import logging
 from typing import TYPE_CHECKING, Any
@@ -19,11 +21,130 @@ if TYPE_CHECKING:
     from superlocalmemory.core.hooks import HookRegistry
     from superlocalmemory.storage.database import DatabaseManager
+from superlocalmemory.core.security_primitives import ensure_install_token
 from superlocalmemory.storage.models import Mode, RecallResponse
 logger = logging.getLogger(__name__)
+# ---------------------------------------------------------------------------
+# LLD-00 §3 — HMAC fact-id markers (P0.4, SEC-C-01 fix)
+# ---------------------------------------------------------------------------
+#
+# Every fact surfaced in a recall response is tagged with
+#   slm:fact:<fact_id>:<hmac8>
+# where hmac8 is the first 8 hex chars of HMAC-SHA256(install_token, fact_id).
+#
+# post_tool_outcome_hook (LLD-09) scans only for this prefix and validates
+# the HMAC. Unverified markers are ignored — this closes the tool-output
+# injection attack where attacker-controlled output could forge engagement
+# signals by spelling a known fact_id.
+# Literal prefix of every fact marker; _validate_marker rejects any string
+# that does not start with it.
+_HMAC_MARKER_PREFIX = "slm:fact:"
+# Number of leading hex characters of the HMAC-SHA256 digest kept in a marker.
+_HMAC_LEN = 8
+def _emit_marker(fact_id: str) -> str:
+    """Build the ``slm:fact:<fact_id>:<hmac8>`` marker for ``fact_id``.
+    The trailing tag is HMAC-SHA256 keyed with the install token and
+    truncated to ``_HMAC_LEN`` hex characters, so a given
+    (install_token, fact_id) pair always maps to the same marker. The key
+    is the install token, so markers are tied to the token that issued them.
+    """
+    key = ensure_install_token().encode("utf-8")
+    mac = hmac.new(key, fact_id.encode("utf-8"), hashlib.sha256)
+    tag = mac.hexdigest()[:_HMAC_LEN]
+    return _HMAC_MARKER_PREFIX + fact_id + ":" + tag
+def _validate_marker(marker: str) -> str | None:
+    """Return ``fact_id`` if ``marker`` is a valid HMAC marker, else None.
+    A marker has the form ``slm:fact:<fact_id>:<hmac8>``. The text after the
+    prefix is split on its LAST colon, so ``fact_id`` may itself contain
+    colons. Uses constant-time compare. Never raises: malformed input,
+    un-encodable text and install-token failures all yield None.
+    """
+    if not isinstance(marker, str) or not marker.startswith(_HMAC_MARKER_PREFIX):
+        return None
+    rest = marker[len(_HMAC_MARKER_PREFIX):]
+    fact_id, sep, presented = rest.rpartition(":")
+    if not sep or not fact_id or len(presented) != _HMAC_LEN:
+        return None
+    try:
+        token = ensure_install_token()
+        expected = hmac.new(
+            token.encode("utf-8"), fact_id.encode("utf-8"), hashlib.sha256
+        ).hexdigest()[:_HMAC_LEN]
+        # Compare as bytes: ``hmac.compare_digest`` raises TypeError when a
+        # ``str`` argument contains non-ASCII characters, and ``presented``
+        # comes straight from the marker text being validated.
+        presented_raw = presented.encode("utf-8")
+        expected_raw = expected.encode("ascii")
+    except Exception:  # install-token I/O failure or un-encodable text
+        return None
+    if hmac.compare_digest(presented_raw, expected_raw):
+        return fact_id
+    return None
+def _apply_markers_to_response(response: RecallResponse) -> None:
+    """Stamp an HMAC marker onto each result of ``response``, in place.
+    Every entry of ``response.results`` gets its ``marker`` attribute set
+    to the marker built from its ``fact.fact_id``. With no results the loop
+    body never runs and the response is left as it was. Returns None.
+    """
+    # L-P-06: the results are mutated by plain attribute assignment on
+    # purpose; ``dataclasses.replace`` would allocate a fresh instance per
+    # result instead of updating the existing one.
+    for result in response.results:
+        fact_id = result.fact.fact_id
+        result.marker = _emit_marker(fact_id)
+# ---------------------------------------------------------------------------
+# Stage 8 SB-1 — feed shadow_router from recall-settled signals.
+#
+# LLD-10 Track A.3 needs live-recall A/B observations to feed ShadowTest
+# (pre-promotion) and ModelRollback (post-promotion). The ndcg_at_10
+# signal materialises when ``EngagementRewardModel.finalize_outcome``
+# settles a row — that is the natural call site for this helper.
+#
+# This is a THIN wrapper over ``core.shadow_router.get_shadow_router``
+# so the finalize-outcome path does not need to import shadow_router
+# directly. Fail-soft on every error — recall pipeline integrity comes
+# first.
+# ---------------------------------------------------------------------------
+def feed_recall_settled(
+    *,
+    memory_db: str,
+    learning_db: str,
+    profile_id: str,
+    query_id: str,
+    ndcg_at_10: float,
+) -> None:
+    """Forward a settled recall's NDCG@10 score to the shadow router.
+    The router is obtained from ``core.shadow_router.get_shadow_router``
+    for the given databases and profile. The arm is looked up again from
+    ``query_id`` via ``route_query`` rather than being passed in, and the
+    score is coerced to ``float`` before it is reported through
+    ``on_recall_settled``.
+    Fail-soft: any exception (including a failed import) is logged at
+    debug level and swallowed, so this helper never raises.
+    """
+    try:
+        # Imported lazily so callers do not need shadow_router at import time.
+        from superlocalmemory.core import shadow_router
+        shadow = shadow_router.get_shadow_router(
+            memory_db=memory_db,
+            learning_db=learning_db,
+            profile_id=profile_id,
+        )
+        assigned_arm = shadow.route_query(query_id)
+        shadow.on_recall_settled(
+            query_id=query_id,
+            arm=assigned_arm,
+            ndcg_at_10=float(ndcg_at_10),
+        )
+    except Exception as exc:  # pragma: no cover — defence in depth
+        logger.debug("feed_recall_settled error: %s", exc)
 # ---------------------------------------------------------------------------
 # V3.3.16: Module-level singletons for recall hot-path objects.
 # Prevents creating new BehavioralTracker / ForgettingScheduler per recall
@@ -54,6 +175,80 @@ def _get_forgetting_scheduler(db: Any, config: Any) -> Any:
     return _forgetting_scheduler_cache[key]
+# ---------------------------------------------------------------------------
+# S8-ARC-04 (v3.4.21): unified ranking entry point.
+# ---------------------------------------------------------------------------
+# Canonical values accepted for the ``SLM_RANKING`` environment variable.
+_RANKING_MODES: frozenset[str] = frozenset({"off", "v1", "v2", "v2-ensemble"})
+def _resolve_ranking_mode(env: "dict[str, str] | os._Environ[str]") -> str:
+    """Pick the ranking mode described by the environment mapping ``env``.
+    Resolution order:
+      1. ``SLM_RANKING`` — trimmed and lower-cased; used when it names one
+         of ``_RANKING_MODES``. Any other value is ignored.
+      2. ``SLM_V2_PIPELINE_DISABLED=1`` — legacy switch, yields ``"v1"``.
+      3. ``SLM_BANDIT_DISABLED=1`` — legacy switch, yields ``"v2"``.
+      4. Otherwise ``"v2-ensemble"``.
+    """
+    requested = (env.get("SLM_RANKING", "") or "").strip().lower()
+    if requested in _RANKING_MODES:
+        return requested
+    def _legacy_flag_set(name: str) -> bool:
+        # A legacy switch counts as set only when its trimmed value is "1".
+        return (env.get(name, "0") or "0").strip() == "1"
+    if _legacy_flag_set("SLM_V2_PIPELINE_DISABLED"):
+        # v2 disabled → fall back to v1 adaptive only.
+        return "v1"
+    if _legacy_flag_set("SLM_BANDIT_DISABLED"):
+        # Bandit disabled → v2 without ensemble.
+        return "v2"
+    return "v2-ensemble"
+def apply_ranking(
+    response: "RecallResponse",
+    query: str,
+    profile_id: str,
+    query_id: str,
+    *,
+    config: Any = None,
+    pipeline_version: str = "v2-ensemble",
+) -> "RecallResponse":
+    """Run the ranking passes up to and including ``pipeline_version``.
+    The passes are cumulative and always run in the same order:
+      - ``off``: nothing runs; ``response`` is returned as-is.
+      - ``v1``: ``apply_adaptive_ranking`` only.
+      - ``v2``: v1, then ``apply_v2_adaptive_ranking``.
+      - ``v2-ensemble`` (default): v2, then ``apply_v2_bandit_ensemble``.
+    Any other value runs all three passes. A pass that raises is logged at
+    debug level and skipped; later passes still run on the response
+    produced so far, so the caller always gets a response back.
+    """
+    if pipeline_version == "off":
+        return response
+    # (mode that stops after this pass, debug message on failure, pass)
+    stages = (
+        (
+            "v1",
+            "apply_ranking v1 step skipped: %s",
+            lambda current: apply_adaptive_ranking(
+                current, query, profile_id, config=config,
+            ),
+        ),
+        (
+            "v2",
+            "apply_ranking v2 step skipped: %s",
+            lambda current: apply_v2_adaptive_ranking(
+                current, query, profile_id, query_id,
+            ),
+        ),
+        (
+            "v2-ensemble",
+            "apply_ranking ensemble step skipped: %s",
+            lambda current: apply_v2_bandit_ensemble(
+                current, query, profile_id, query_id,
+            ),
+        ),
+    )
+    for stop_mode, skipped_message, run_pass in stages:
+        try:
+            response = run_pass(response)
+        except Exception as exc:  # pragma: no cover — defensive
+            logger.debug(skipped_message, exc)
+        if pipeline_version == stop_mode:
+            break
+    return response
 # ---------------------------------------------------------------------------
 # apply_adaptive_ranking  (was MemoryEngine._apply_adaptive_ranking)
 # ---------------------------------------------------------------------------
@@ -118,6 +313,227 @@ def apply_adaptive_ranking(
     )
+# ---------------------------------------------------------------------------
+# apply_v2_adaptive_ranking (LLD-02 §4.3)
+# ---------------------------------------------------------------------------
+#
+# Opt-in v3.4.21 path: load active model from learning.db with SHA-256
+# verification, re-rank via native Booster, enqueue signals async. The
+# existing ``apply_adaptive_ranking`` above stays for 3.4.20 callers.
+# ---------------------------------------------------------------------------
+def apply_v2_adaptive_ranking(
+    response: RecallResponse,
+    query: str,
+    profile_id: str,
+    query_id: str,
+    *,
+    learning_db_path: Any = None,
+) -> RecallResponse:
+    """LLD-02 §4.3 — load the active model and re-rank ``response``.
+    Args:
+        response: Recall response whose ``results`` are re-ordered.
+        query: Query text; not used by this step.
+        profile_id: Profile whose signal count and active model are loaded.
+        query_id: Recall identifier; not used by this step.
+        learning_db_path: Optional path to learning.db; defaults to
+            ``~/.superlocalmemory/learning.db``.
+    Returns:
+        A new ``RecallResponse`` carrying the re-ranked results, or the
+        original ``response`` when learning.db is missing or any step fails.
+    Never raises. On any error, returns ``response`` unchanged.
+    """
+    try:
+        from pathlib import Path as _P
+        from superlocalmemory.learning.database import LearningDatabase
+        from superlocalmemory.learning.model_cache import load_active
+        from superlocalmemory.learning.ranker import AdaptiveRanker
+        # The signal-queue names are deliberately NOT imported here: this
+        # function no longer enqueues signals (see S8-SK-04 below), so an
+        # import problem in that module must not disable re-ranking.
+        db_path = (_P(learning_db_path) if learning_db_path
+                   else _P.home() / ".superlocalmemory" / "learning.db")
+        if not db_path.exists():
+            return response
+        db = LearningDatabase(db_path)
+        signal_count = db.count_signals(profile_id)
+        active = load_active(db, profile_id)
+        ranker = AdaptiveRanker(
+            signal_count=signal_count,
+            active_model=active,
+        )
+        # Build result-dict shape expected by the ranker's rerank() path.
+        # ``_original`` carries the source result object so the re-ranked
+        # order can be mapped back afterwards.
+        # NOTE(review): ``age_days`` is always 0 here — confirm the ranker
+        # does not depend on a real age.
+        result_dicts: list[dict] = [
+            {
+                "fact_id": r.fact.fact_id,
+                "score": r.score,
+                "cross_encoder_score": r.score,
+                "trust_score": r.trust_score,
+                "channel_scores": r.channel_scores or {},
+                "fact": {
+                    "age_days": 0,
+                    "access_count": r.fact.access_count,
+                },
+                "_original": r,
+            }
+            for r in response.results
+        ]
+        query_context = {
+            "query_type": response.query_type,
+            "profile_id": profile_id,
+        }
+        reranked_dicts = ranker.rerank(result_dicts, query_context)
+        # Entries that come back without ``_original`` are dropped.
+        new_results = [d["_original"] for d in reranked_dicts
+                       if "_original" in d]
+        # S8-SK-04 fix: signal enqueue is OWNED by ``apply_v2_bandit_ensemble``,
+        # not this function. Previously both emitted a batch
+        # under the same query_id which doubled ``learning_signals`` and
+        # tripped the phase-transition threshold at half the intended
+        # signal count. This function now just re-ranks; the ensemble path
+        # is the single source of signal events.
+        return RecallResponse(
+            query=response.query,
+            mode=response.mode,
+            results=new_results,
+            query_type=response.query_type,
+            channel_weights=response.channel_weights,
+            total_candidates=response.total_candidates,
+            retrieval_time_ms=response.retrieval_time_ms,
+        )
+    except Exception as exc:  # pragma: no cover — defensive
+        logger.debug("apply_v2_adaptive_ranking skipped: %s", exc)
+        return response
+# ---------------------------------------------------------------------------
+# apply_v2_bandit_ensemble (LLD-03 §5.5)
+# ---------------------------------------------------------------------------
+#
+# Contextual Thompson bandit chooses channel weights. If an LGBM model is
+# active, a D8-blended ensemble re-ranks the reweighted candidates. Never
+# raises; honours ``SLM_BANDIT_DISABLED=1`` as a kill switch.
+# ---------------------------------------------------------------------------
+def apply_v2_bandit_ensemble(
+    response: RecallResponse,
+    query: str,
+    profile_id: str,
+    query_id: str,
+    *,
+    learning_db_path: Any = None,
+) -> RecallResponse:
+    """Apply contextual bandit + optional LGBM ensemble rerank. Safe on error.
+    Args:
+        response: Recall response whose ``results`` are re-weighted and
+            re-ranked.
+        query: Query text, recorded on the enqueued signal batch.
+        profile_id: Profile used for the bandit, the model and the signals.
+        query_id: Recall identifier passed to the bandit and the signals.
+        learning_db_path: Optional path to learning.db; defaults to
+            ``~/.superlocalmemory/learning.db``.
+    Returns:
+        A new ``RecallResponse`` carrying the re-ranked results. The input
+        ``response`` is returned unchanged when ``SLM_BANDIT_DISABLED`` is
+        ``1``, when there are no results, when learning.db does not exist,
+        or when an unexpected error occurs. Never raises.
+    """
+    import os as _os
+    # Kill switch. The value is trimmed the same way _resolve_ranking_mode
+    # reads this variable, so both agree on what counts as "set".
+    if (_os.environ.get("SLM_BANDIT_DISABLED", "0") or "0").strip() == "1":
+        return response
+    if not response.results:
+        return response
+    try:
+        from pathlib import Path as _P
+        from superlocalmemory.learning.bandit import ContextualBandit
+        from superlocalmemory.learning.ensemble import (
+            choose_ensemble,
+            ensemble_rerank,
+        )
+        from superlocalmemory.learning.signals import (
+            SignalBatch,
+            SignalCandidate,
+            enqueue,
+        )
+        from superlocalmemory.retrieval.engine import apply_channel_weights
+        db_path = (_P(learning_db_path) if learning_db_path
+                   else _P.home() / ".superlocalmemory" / "learning.db")
+        if not db_path.exists():
+            return response
+        # --- 1. bandit.choose ---------------------------------------------
+        # No entity information is available at this call site, so the
+        # bandit context always reports zero entities.
+        entity_count = 0
+        bandit = ContextualBandit(db_path, profile_id)
+        choice = bandit.choose(
+            {
+                "query_type": response.query_type,
+                "entity_count": entity_count,
+            },
+            query_id,
+        )
+        # --- 2. apply channel weights -------------------------------------
+        # A copy of the result list is handed over, not the list itself.
+        weighted = apply_channel_weights(list(response.results), choice.weights)
+        # --- 3. choose ensemble + load model (optional) -------------------
+        # Best effort: when the model or signal count cannot be loaded the
+        # ensemble is chosen with no model and a signal count of zero.
+        active_model = None
+        signal_count = 0
+        try:
+            from superlocalmemory.learning.database import LearningDatabase
+            from superlocalmemory.learning.model_cache import load_active
+            db = LearningDatabase(db_path)
+            signal_count = db.count_signals(profile_id)
+            active_model = load_active(db, profile_id)
+        except Exception as exc:
+            logger.debug("v2 bandit: model/signal load skipped: %s", exc)
+        weights = choose_ensemble(signal_count, active_model)
+        # --- 4. ensemble rerank -------------------------------------------
+        query_context = {
+            "query_type": response.query_type,
+            "profile_id": profile_id,
+            "query_id": query_id,
+            "bandit_play_id": choice.play_id,
+        }
+        try:
+            final_results = ensemble_rerank(
+                weighted, choice, active_model, weights, query_context,
+            )
+        except Exception as exc:
+            # Fall back to the bandit-weighted order when the rerank fails.
+            logger.debug("v2 bandit ensemble_rerank skipped: %s", exc)
+            final_results = weighted
+        # --- 5. enqueue signals (non-blocking) ----------------------------
+        # Only the first 20 results are reported; a failure here is logged
+        # and does not affect the returned ranking.
+        try:
+            top20 = final_results[:20]
+            candidates = tuple(
+                SignalCandidate(
+                    fact_id=r.fact.fact_id,
+                    channel_scores=dict(r.channel_scores or {}),
+                    cross_encoder_score=None,
+                    result_dict={"fact_id": r.fact.fact_id,
+                                 "score": r.score},
+                )
+                for r in top20
+            )
+            enqueue(SignalBatch(
+                profile_id=profile_id,
+                query_id=query_id,
+                query_text=query,
+                candidates=candidates,
+                query_context=query_context,
+            ))
+        except Exception as exc:
+            logger.debug("v2 bandit signal enqueue skipped: %s", exc)
+        # ``channel_weights`` is carried over from the incoming response.
+        return RecallResponse(
+            query=response.query,
+            mode=response.mode,
+            results=final_results,
+            query_type=response.query_type,
+            channel_weights=response.channel_weights,
+            total_candidates=response.total_candidates,
+            retrieval_time_ms=response.retrieval_time_ms,
+        )
+    except Exception as exc:  # pragma: no cover — defensive top-level
+        logger.debug("apply_v2_bandit_ensemble skipped: %s", exc)
+        return response
 # ---------------------------------------------------------------------------
 # run_recall  (was MemoryEngine.recall)
 # ---------------------------------------------------------------------------
@@ -278,11 +694,21 @@ def run_recall(
         except Exception as exc:
             logger.debug("Hebbian strengthening: %s", exc)
-    # Adaptive re-ranking (V3.1 Active Memory)
+    # S8-ARC-04 (v3.4.21): unified ranking entry point. Single env-var
+    # (SLM_RANKING=off|v1|v2|v2-ensemble) controls the pipeline. Legacy
+    # SLM_V2_PIPELINE_DISABLED + SLM_BANDIT_DISABLED still honoured for
+    # one-release back-compat. Identity when no active model.
     try:
-        response = apply_adaptive_ranking(response, query, profile_id, config=config)
+        import os as _os
+        import uuid as _uuid
+        query_id = _uuid.uuid4().hex
+        mode = _resolve_ranking_mode(_os.environ)
+        response = apply_ranking(
+            response, query, profile_id, query_id,
+            config=config, pipeline_version=mode,
+        )
     except Exception as exc:
-        logger.debug("Adaptive ranking skipped: %s", exc)
+        logger.debug("Ranking pipeline skipped: %s", exc)
     # Reconsolidation: access updates trust + count (neuroscience principle)
     if trust_scorer:
@@ -321,4 +747,8 @@ def run_recall(
     hook_ctx["query_type"] = response.query_type
     hooks.run_post("recall", hook_ctx)
+    # LLD-00 §3 — stamp HMAC markers on every result so post_tool_outcome_hook
+    # can validate fact_ids observed in downstream tool output.
+    _apply_markers_to_response(response)
     return response

package/src/superlocalmemory/core/recall_worker.py CHANGED Viewed

@@ -72,9 +72,11 @@ def _get_engine():
     return _engine
-def _handle_recall(query: str, limit: int) -> dict:
+def _handle_recall(query: str, limit: int, session_id: str = "") -> dict:
     engine = _get_engine()
-    response = engine.recall(query, limit=limit)
+    response = engine.recall(
+        query, limit=limit, session_id=session_id or None,
+    )
     # Batch-fetch original memory text for all results
     memory_ids = list({r.fact.memory_id for r in response.results[:limit] if r.fact.memory_id})
@@ -288,7 +290,10 @@ def _worker_main() -> None:
         try:
             if cmd == "recall":
-                result = _handle_recall(req.get("query", ""), req.get("limit", 10))
+                result = _handle_recall(
+                    req.get("query", ""), req.get("limit", 10),
+                    req.get("session_id", ""),
+                )
                 _respond(result)
             elif cmd == "store":
                 result = _handle_store(req.get("content", ""), req.get("metadata", {}))