npm - superlocalmemory - Versions diffs - 3.4.18 → 3.4.19 - Mend

superlocalmemory 3.4.18 → 3.4.19

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6)

package/CHANGELOG.md +11 -0
package/package.json +1 -1
package/pyproject.toml +1 -1
package/src/superlocalmemory/core/embeddings.py +8 -2
package/src/superlocalmemory/retrieval/reranker.py +4 -2
package/src/superlocalmemory.egg-info/PKG-INFO +1 -1

package/CHANGELOG.md CHANGED

@@ -10,6 +10,17 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 ---
+## [3.4.19] - 2026-04-17
+### Fixed
+- Recall cold-start eliminated. Embedding + reranker workers stay warm for 30 minutes by default instead of 2 minutes, so bursts of recalls no longer pay a 30-60 second model-load tax on every other query.
+### New environment variables
+- `SLM_EMBED_IDLE_TIMEOUT` — seconds to keep the embedding worker warm (default 1800). Set to 120 to restore pre-v3.4.19 behavior.
+- `SLM_RERANKER_IDLE_TIMEOUT` — same, for the cross-encoder reranker (default 1800).
+---
 ## [3.4.18] - 2026-04-17
 ### Fixed

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "superlocalmemory",
-  "version": "3.4.18",
+  "version": "3.4.19",
   "description": "Information-geometric agent memory with mathematical guarantees. 4-channel retrieval, Fisher-Rao similarity, zero-LLM mode, EU AI Act compliant. Works with Claude, Cursor, Windsurf, and 17+ AI tools.",
   "keywords": [
     "ai-memory",

package/pyproject.toml CHANGED

@@ -1,6 +1,6 @@
 [project]
 name = "superlocalmemory"
-version = "3.4.18"
+version = "3.4.19"
 description = "Information-geometric agent memory with mathematical guarantees"
 readme = "README.md"
 license = {text = "AGPL-3.0-or-later"}

package/src/superlocalmemory/core/embeddings.py CHANGED

@@ -140,8 +140,14 @@ def release_embedding_lock() -> None:
         _embedding_lock_fd = None
-_IDLE_TIMEOUT_SECONDS = 120  # 2 minutes — kill worker after idle
-# V3.3.12: Configurable via SLM_EMBED_IDLE_TIMEOUT env var (seconds)
+_IDLE_TIMEOUT_SECONDS = 1800  # 30 minutes — keep model warm across bursty use.
+# V3.3.12: Configurable via SLM_EMBED_IDLE_TIMEOUT env var (seconds).
+# V3.4.19: Bumped from 120 → 1800 to eliminate the 30-60s cold-start pain
+# when the embedding worker was killed too aggressively. Safety: the
+# per-embed RSS self-check (SLM_EMBED_WORKER_RSS_LIMIT_MB, 4GB default) and
+# the daemon memory watchdog (unified_daemon.py, 4GB/60s) still cap any
+# runaway. To restore the old aggressive policy without redeploying, set
+# ``SLM_EMBED_IDLE_TIMEOUT=120`` and ``slm restart``.
 _IDLE_TIMEOUT_SECONDS = int(os.environ.get("SLM_EMBED_IDLE_TIMEOUT", _IDLE_TIMEOUT_SECONDS))
 # V3.3.21: Configurable response timeout — 180s default, but batch ingestion
 # (2-turn chunks across 10 conversations) needs 600s+ to survive cold-start

package/src/superlocalmemory/retrieval/reranker.py CHANGED

@@ -51,8 +51,10 @@ _live_rerankers: set[weakref.ref] = set()
 logger = logging.getLogger(__name__)
-_IDLE_TIMEOUT_SECONDS = 120  # 2 min → kill worker
-# V3.3.12: Configurable via SLM_RERANKER_IDLE_TIMEOUT env var
+_IDLE_TIMEOUT_SECONDS = 1800  # 30 min — keep cross-encoder warm for active sessions.
+# V3.3.12: Configurable via SLM_RERANKER_IDLE_TIMEOUT env var.
+# V3.4.19: Bumped from 120 → 1800 in lock-step with the embedding worker.
+# Set ``SLM_RERANKER_IDLE_TIMEOUT=120`` + ``slm restart`` to revert.
 _IDLE_TIMEOUT_SECONDS = int(os.environ.get("SLM_RERANKER_IDLE_TIMEOUT", _IDLE_TIMEOUT_SECONDS))
 _SUBPROCESS_RESPONSE_TIMEOUT = 180  # V3.3.12: 180s (was 120s) for stressed system respawns
 _WORKER_RECYCLE_AFTER = 500  # Recycle after N requests

package/src/superlocalmemory.egg-info/PKG-INFO CHANGED

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: superlocalmemory
-Version: 3.4.18
+Version: 3.4.19
 Summary: Information-geometric agent memory with mathematical guarantees
 Author-email: Varun Pratap Bhardwaj <admin@superlocalmemory.com>
 License: AGPL-3.0-or-later